From affe00f6fbd7b0705be1fecbf70ce6bf302cf6c2 Mon Sep 17 00:00:00 2001 From: Harrison Deng Date: Tue, 16 Nov 2021 00:31:48 -0500 Subject: [PATCH] Line termination change and old code. --- .Rprofile | 258 +- .gitignore | 88 +- .tmp.R | 76 +- .utilities.R | 1308 +- 2021-10-12_In-Class_exploration.R | 514 +- ABC-Install_all_packages.R | 322 +- ABC-addSACCE_APSESproteins.R | 200 +- ABC-units.R | 138 +- ABC-units.Rproj | 32 +- BIN-ALI-BLAST.R | 222 +- BIN-ALI-Dotplot.R | 390 +- BIN-ALI-MSA.R | 1256 +- BIN-ALI-Optimal_sequence_alignment.R | 730 +- BIN-ALI-Similarity.R | 626 +- BIN-Data_integration.R | 432 +- BIN-FUNC-Domain_annotation.R | 870 +- BIN-FUNC-Semantic_similarity.R | 338 +- BIN-MYSPE.R | 702 +- BIN-PHYLO-Data_preparation.R | 468 +- BIN-PHYLO-Tree_analysis.R | 812 +- BIN-PHYLO-Tree_building.R | 336 +- BIN-PPI-Analysis.R | 646 +- BIN-SEQA-Composition.R | 504 +- BIN-Sequence.R | 788 +- BIN-Storing_data.R | 1368 +- FND-Genetic_code.R | 698 +- FND-MAT-Graphs_and_networks.R | 1382 +- FND-STA-Information_theory.R | 448 +- FND-STA-Probability_distribution.R | 2646 +- FND-STA-Significance.R | 702 +- README.md | 4 +- RPR-Biostrings.R | 490 +- RPR-ChimeraX_remote.R | 330 +- RPR-FASTA.R | 644 +- RPR-GEO2R.R | 1348 +- RPR-Genetic_code_optimality.R | 770 +- RPR-Introduction.R | 100 +- RPR-PROSITE_POST.R | 336 +- RPR-Pipe.R | 270 +- RPR-RegEx.R | 360 +- RPR-SX-PDB.R | 1658 +- RPR-UniProt_GET.R | 270 +- RPR-Unit_testing.R | 468 +- RPR-eUtils_XML.R | 332 +- data/0TST.pdb | 20 +- data/1BM8.pdb | 3104 +- data/2F1C.fa | 8 +- data/3FG7.fa | 12 +- data/MBP1_SACCE.json | 40 +- data/PTPN5_HSa_coding.fa | 60 +- data/RAB39B_HSa_coding.fa | 24 +- data/RandomPhobiaPage.txt | 262 +- data/S288C_YDL056W_MBP1_coding.fsa | 84 +- data/SGD_features.README.txt | 94 +- data/SGD_features.tab | 32908 ++++++++++---------- data/Species.csv | 2030 +- data/intogen-KRAS-distribution-data.tsv | 358 +- data/intogen-OR1A1-distribution-data.tsv | 98 +- data/intogen-PTPN11-distribution-data.tsv | 226 +- data/refAPSES.mfa | 78 +- data/refAPSES_PSI-BLAST.json | 980 +- data/refAnnotations.json | 232 +- data/refFeatures.json | 94 +- data/refMBP1Proteins.json | 310 +- data/refTaxonomy.json | 44 +- data/referenceDomainAnnotations.txt | 230 +- functionTemplate.R | 74 +- myScripts/.myProfile.R | 42 +- myScripts/ABC-INT-Mutation_impact-code.R | 105 +- myScripts/BIN-Storing_data.R | 80 +- myScripts/CUTOLTaxonomy.json | 8 +- myScripts/MBP1_CUTOL.json | 38 +- myScripts/README-myScripts.txt | 16 +- myScripts/makeProteinDB.R | 8 +- myScripts/myScript.R | 76 +- plottingReference.R | 2868 +- scriptTemplate.R | 150 +- scripts/ABC-createRefDB.R | 60 +- scripts/ABC-dbUtilities.R | 1348 +- scripts/ABC-makeMYSPElist.R | 886 +- scripts/ABC-makeSTRINGedges.R | 336 +- scripts/ABC-makeScCCnet.R | 334 +- scripts/ABC-writeALN.R | 270 +- scripts/ABC-writeMFA.R | 242 +- scripts/BLAST.R | 768 +- tests/test_biCode.R | 64 +- 86 files changed, 37873 insertions(+), 37876 deletions(-) diff --git a/.Rprofile b/.Rprofile index e958186..0d2dd54 100644 --- a/.Rprofile +++ b/.Rprofile @@ -1,129 +1,129 @@ -# .Rprofile -# -# This script is automatically executed on startup -# ============================================================================== - -init <- function() { - - # Create a local copy of myScript.R if not done yet. - if (! file.exists("myScript.R") && file.exists(".tmp.R")) { - file.copy(".tmp.R", "myScript.R") - cat("A new file \"myScript.R\" was created. You can use it for\n") - cat("notes and code experiments.\n\n") - } - - cat("\n\n") - cat("Please open the file \".myProfile.R\" (click on the file-name in the\n") - cat("\"files\" pane), edit it and save it.\n") - cat("Then click the checkbox, and use the More -> Move... dialogue\n") - cat("to move it into the \"myScripts\" folder.\n\n") - - file.edit("ABC-units.R") - return(invisible(NULL)) -} - -if (! file.exists("./myScripts/.myProfile.R")) { - cat("\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n") - cat(" =================") - cat("\n\n") - cat(" WELCOME !\n") - cat("\n") - cat(" Type 'init()' to begin\n\n") - cat("\n") - cat(" =================") - cat("\n\n") - -} else { # local profile exists ... validate state: - cat("\n\nLoading local functions ...") - - source(".utilities.R") # local profile appears sane, source utilities - source("./myScripts/.myProfile.R") - - if (! exists("myEMail")) { # ... has eMail been defined? - cat("ERROR !\n") - cat("=======\n") - cat("The file \"./myScripts/.myProfile.R\" exists, but\n") - cat("the variable \"myEMail\" was not loaded.\n") - cat("Please contact your instructor to continue.\n\n") - } - if (! exists("myStudentNumber")) { # ... has the Student Number been defined? - cat("ERROR !\n") - cat("=======\n") - cat("The file \"./myScripts/.myProfile.R\" exists, but\n") - cat("the variable \"myStudentNumber\" was not loaded.\n") - cat("Please contact your instructor to continue.\n\n") - } - if (! grepl("^(100.{7})|(99.{7})$", as.character(myStudentNumber))) { - cat("ERROR !\n") # is the Student Number valid? - cat("=======\n") - cat("The file \"./myScripts/.myProfile.R\" exists, but\n") - cat("your Student Number could not be validated.\n") - cat("Please examine the file \"./myScripts/.myProfile.R\"\n") - cat(" and fix the problem or contact your instructor to continue.\n\n") - } - - - if (! exists("MYSPE")) { # if MYSPE has not yet been defined, define it now - # ... and write it into the profile. - prf <- readLines("./myScripts/.myProfile.R") - iEmail <- grep("^\\s*myStudentNumber\\s*<-", prf) - out <- prf[1:iEmail] - out <- c(out, sprintf("MYSPE <- \"%s\" ", - getMYSPE(myStudentNumber))) - out <- c(out, prf[(iEmail+1):length(prf)]) - writeLines(out, "./myScripts/.myProfile.R") - - cat("\n") - cat(sprintf("MYSPE (%s) was added to \"./myScripts/.myProfile.R\"\n\n", - getMYSPE(myStudentNumber))) - MYSPE <- getMYSPE(myStudentNumber) # ... define it for immediate use - rm(prf, iEmail, out) # cleanup - } - cat("... done.\n\n") -} - -if (default.stringsAsFactors()) { - cat("WARNING.\n") - cat("========\n") - cat("Your default \"stringsAsFactors\" parameter is set to \"TRUE\".\n") - cat("This will break some of the code.\n") - cat("Please contact your instructor to troubleshoot and fix this issue.\n") - cat("\n") -} - -errText <- list() -errText[["noProfileFile"]] <- ' -Your PROFILE FILE does not exist. This problem must be fixed to continue. - - The code expects the file "./myScripts/.myProfile.R" to exist and to - contain your correct eMail address and student number. Detailed - instructions were given when you first ran the init() command. - - Try running init() again and follow the instructions. Reload youR RStudio - session and start over with this file. - - If this does not fix the problem, ask for help. -' - -errText[["noStudentNumber"]] <- ' -Your STUDENT NUMBER has not been defined. This problem must be fixed to continue. - - The code expects the file "./myScripts/.myProfile.R" to exist and to - contain your correct eMail address and student number. This file gets - sourced when you start a new R-session, but since you see this error - message there was a problem. - - Perhaps you need to restart your R-session. Try closing the RStudio - project and reopening it from the File > Recent Projects menu. - - Perhaps there was a syntax error in your file. Then not all the - instructions in the file are executed. Check the file: is your - email perhpas not defined? Or did you type it without qwuoataion - marks? - - Try fixing problems, and then restart R as described above. - - If none of this fixes the problem, ask for help. -' - -# [END] +# .Rprofile +# +# This script is automatically executed on startup +# ============================================================================== + +init <- function() { + + # Create a local copy of myScript.R if not done yet. + if (! file.exists("myScript.R") && file.exists(".tmp.R")) { + file.copy(".tmp.R", "myScript.R") + cat("A new file \"myScript.R\" was created. You can use it for\n") + cat("notes and code experiments.\n\n") + } + + cat("\n\n") + cat("Please open the file \".myProfile.R\" (click on the file-name in the\n") + cat("\"files\" pane), edit it and save it.\n") + cat("Then click the checkbox, and use the More -> Move... dialogue\n") + cat("to move it into the \"myScripts\" folder.\n\n") + + file.edit("ABC-units.R") + return(invisible(NULL)) +} + +if (! file.exists("./myScripts/.myProfile.R")) { + cat("\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n") + cat(" =================") + cat("\n\n") + cat(" WELCOME !\n") + cat("\n") + cat(" Type 'init()' to begin\n\n") + cat("\n") + cat(" =================") + cat("\n\n") + +} else { # local profile exists ... validate state: + cat("\n\nLoading local functions ...") + + source(".utilities.R") # local profile appears sane, source utilities + source("./myScripts/.myProfile.R") + + if (! exists("myEMail")) { # ... has eMail been defined? + cat("ERROR !\n") + cat("=======\n") + cat("The file \"./myScripts/.myProfile.R\" exists, but\n") + cat("the variable \"myEMail\" was not loaded.\n") + cat("Please contact your instructor to continue.\n\n") + } + if (! exists("myStudentNumber")) { # ... has the Student Number been defined? + cat("ERROR !\n") + cat("=======\n") + cat("The file \"./myScripts/.myProfile.R\" exists, but\n") + cat("the variable \"myStudentNumber\" was not loaded.\n") + cat("Please contact your instructor to continue.\n\n") + } + if (! grepl("^(100.{7})|(99.{7})$", as.character(myStudentNumber))) { + cat("ERROR !\n") # is the Student Number valid? + cat("=======\n") + cat("The file \"./myScripts/.myProfile.R\" exists, but\n") + cat("your Student Number could not be validated.\n") + cat("Please examine the file \"./myScripts/.myProfile.R\"\n") + cat(" and fix the problem or contact your instructor to continue.\n\n") + } + + + if (! exists("MYSPE")) { # if MYSPE has not yet been defined, define it now + # ... and write it into the profile. + prf <- readLines("./myScripts/.myProfile.R") + iEmail <- grep("^\\s*myStudentNumber\\s*<-", prf) + out <- prf[1:iEmail] + out <- c(out, sprintf("MYSPE <- \"%s\" ", + getMYSPE(myStudentNumber))) + out <- c(out, prf[(iEmail+1):length(prf)]) + writeLines(out, "./myScripts/.myProfile.R") + + cat("\n") + cat(sprintf("MYSPE (%s) was added to \"./myScripts/.myProfile.R\"\n\n", + getMYSPE(myStudentNumber))) + MYSPE <- getMYSPE(myStudentNumber) # ... define it for immediate use + rm(prf, iEmail, out) # cleanup + } + cat("... done.\n\n") +} + +if (default.stringsAsFactors()) { + cat("WARNING.\n") + cat("========\n") + cat("Your default \"stringsAsFactors\" parameter is set to \"TRUE\".\n") + cat("This will break some of the code.\n") + cat("Please contact your instructor to troubleshoot and fix this issue.\n") + cat("\n") +} + +errText <- list() +errText[["noProfileFile"]] <- ' +Your PROFILE FILE does not exist. This problem must be fixed to continue. + + The code expects the file "./myScripts/.myProfile.R" to exist and to + contain your correct eMail address and student number. Detailed + instructions were given when you first ran the init() command. + + Try running init() again and follow the instructions. Reload youR RStudio + session and start over with this file. + + If this does not fix the problem, ask for help. +' + +errText[["noStudentNumber"]] <- ' +Your STUDENT NUMBER has not been defined. This problem must be fixed to continue. + + The code expects the file "./myScripts/.myProfile.R" to exist and to + contain your correct eMail address and student number. This file gets + sourced when you start a new R-session, but since you see this error + message there was a problem. + + Perhaps you need to restart your R-session. Try closing the RStudio + project and reopening it from the File > Recent Projects menu. + + Perhaps there was a syntax error in your file. Then not all the + instructions in the file are executed. Check the file: is your + email perhpas not defined? Or did you type it without qwuoataion + marks? + + Try fixing problems, and then restart R as described above. + + If none of this fixes the problem, ask for help. +' + +# [END] diff --git a/.gitignore b/.gitignore index 272f5f0..843ac93 100644 --- a/.gitignore +++ b/.gitignore @@ -1,44 +1,44 @@ -# Miscellaneous -.Ds_store -instructor/ -dev/ -# myScripts/ # We don't want to ignore this so we can save our work to our own fork. - -# History files -.Rhistory -.Rapp.history - -# Session Data files -# .RData - -# Files produced in assingments -data/APSESphyloSet.mfa -data/APSEStreeRproml.rds - -# Example code in package build process -*-Ex.R - -# Output files from R CMD build -/*.tar.gz - -# Output files from R CMD check -/*.Rcheck/ - -# RStudio files -.Rproj.user/ - -# produced vignettes -vignettes/*.html -vignettes/*.pdf - -# OAuth2 token, see https://github.com/hadley/httr/releases/tag/v0.3 -.httr-oauth - -# knitr and R markdown default cache directories -/*_cache/ -/cache/ - -# Temporary files created by R markdown -*.utf8.md -*.knit.md -.Rproj.user +# Miscellaneous +.Ds_store +instructor/ +dev/ +# myScripts/ # We don't want to ignore this so we can save our work to our own fork. + +# History files +.Rhistory +.Rapp.history + +# Session Data files +# .RData + +# Files produced in assingments +data/APSESphyloSet.mfa +data/APSEStreeRproml.rds + +# Example code in package build process +*-Ex.R + +# Output files from R CMD build +/*.tar.gz + +# Output files from R CMD check +/*.Rcheck/ + +# RStudio files +.Rproj.user/ + +# produced vignettes +vignettes/*.html +vignettes/*.pdf + +# OAuth2 token, see https://github.com/hadley/httr/releases/tag/v0.3 +.httr-oauth + +# knitr and R markdown default cache directories +/*_cache/ +/cache/ + +# Temporary files created by R markdown +*.utf8.md +*.knit.md +.Rproj.user diff --git a/.tmp.R b/.tmp.R index f42a47e..178b255 100644 --- a/.tmp.R +++ b/.tmp.R @@ -1,38 +1,38 @@ -# myScript.R -# -# --- As you work with this file, you can delete the instructions below -------- -# Write your notes and code experiments into this document. Save it -# from time to time - however I recommend that you do not _commit_ -# your saved version. -# -# As long as you do not _commit_ this script to version control, -# you can _pull_ updated versions of the entire project from GitHub -# by using the RStudio version control interface. However, once -# you _commit_ any file in your local version, RStudio will require -# you to resolve conflicts before you can _pull_ updates. -# --- As you work with this file, you can delete the instructions above -------- -# -## Purpose: <...> -# -# Version: <...> -# -# Date: <...> -# Author: () -# -# Versions: -# -# -# -# TODO: -# <...> -# -# ==================================================================== - - - - - - - -# [END] - +# myScript.R +# +# --- As you work with this file, you can delete the instructions below -------- +# Write your notes and code experiments into this document. Save it +# from time to time - however I recommend that you do not _commit_ +# your saved version. +# +# As long as you do not _commit_ this script to version control, +# you can _pull_ updated versions of the entire project from GitHub +# by using the RStudio version control interface. However, once +# you _commit_ any file in your local version, RStudio will require +# you to resolve conflicts before you can _pull_ updates. +# --- As you work with this file, you can delete the instructions above -------- +# +## Purpose: <...> +# +# Version: <...> +# +# Date: <...> +# Author: () +# +# Versions: +# +# +# +# TODO: +# <...> +# +# ==================================================================== + + + + + + + +# [END] + diff --git a/.utilities.R b/.utilities.R index c7d4fc3..24a4804 100644 --- a/.utilities.R +++ b/.utilities.R @@ -1,654 +1,654 @@ -# tocID <- "./.utilities.R" -# -# Miscellaneous R code to support the project -# -# Version: 1.5 -# Date: 2017-09 - 2021-09 -# Author: Boris Steipe -# -# V 1.5 rewrite getMYSPE() -# V 1.4 Maintenance, and new validation utilities -# V 1.3.1 prefix Biostrings:: to subseq() -# V 1.3 load msa support functions -# V 1.2 update database utilities to support 2017 version of JSON sources -# V 1.1 2017 updates for ABC-units -# V 1.0 First code -# -# ToDo: -# Notes: -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ----------------------------------------------------------- -#TOC> 1 SCRIPTS TO SOURCE 53 -#TOC> 2 PACKAGES 59 -#TOC> 3 DATA & CONSTANTS 70 -#TOC> 4 SUPPORT FUNCTIONS 117 -#TOC> 4.01 objectInfo() 120 -#TOC> 4.02 biCode() 148 -#TOC> 4.03 sameSpecies() 182 -#TOC> 4.04 validateFA() 202 -#TOC> 4.05 readFASTA() 310 -#TOC> 4.06 writeFASTA() 345 -#TOC> 4.07 pBar() 378 -#TOC> 4.08 waitTimer() 400 -#TOC> 4.09 fetchMSAmotif() 428 -#TOC> 4.10 H() (Shannon entropy) 472 -#TOC> 4.11 CX() (ChimeraX remote command) 485 -#TOC> 5 FUNCTIONS TO CUSTOMIZE ASSIGNMENTS 542 -#TOC> 5.01 seal() 544 -#TOC> 5.02 getMYSPE() 548 -#TOC> 5.03 selectPDBrep() 564 -#TOC> 5.04 sealKey() 599 -#TOC> 5.05 selectChi2() 629 -#TOC> 5.06 selectENSP() 642 -#TOC> -#TOC> ========================================================================== - - -# = 1 SCRIPTS TO SOURCE =================================================== - -source("./scripts/ABC-dbUtilities.R") -source("./scripts/ABC-writeALN.R") -source("./scripts/ABC-writeMFA.R") - -# = 2 PACKAGES ============================================================ - -if (! requireNamespace("digest", quietly = TRUE)) { - install.packages("digest") -} - -if (! requireNamespace("jsonlite", quietly = TRUE)) { - install.packages("jsonlite") -} - - -# = 3 DATA & CONSTANTS ==================================================== - -# cf. https://www.bioinformatics.org/sms/iupac.html -AAVALID <- "acdefghiklmnpqrstvwyACDEFGHIKLMNPQRSTVWY*-" -NUCVALID <- "acgtuACGTU-" -NUCAMBIG <- "acgtACGTryswkmbdhvnRYSWKMBDHVN-" - -# A colour palette for amino acid properties -AACOLS <- character() -AACOLS["R"] <- "#5770ff" # Positive -AACOLS["K"] <- "#4785EE" # -AACOLS["H"] <- "#37a1de" # -AACOLS["E"] <- "#ff6f59" # Negative -AACOLS["D"] <- "#ff7391" # -AACOLS["N"] <- "#C9D4FF" # Hydrophilic -AACOLS["Q"] <- "#CADFFC" # -AACOLS["S"] <- "#CBEAF9" # -AACOLS["T"] <- "#CDF5F7" # -AACOLS["Y"] <- "#FBFFC9" # Hydrophobic -AACOLS["W"] <- "#EDFDC8" # -AACOLS["F"] <- "#DFFCC8" # -AACOLS["I"] <- "#D2FBC8" # -AACOLS["L"] <- "#C4FAC7" # -AACOLS["M"] <- "#B7F9C7" # -AACOLS["V"] <- "#A9F8C7" # -AACOLS["A"] <- "#9CF7C7" # -AACOLS["G"] <- "#d2d2d2" # Glycine -AACOLS["C"] <- "#fff963" # Cysteine -AACOLS["P"] <- "#edc06d" # Proline -AACOLS <- gsub("$", "80", AACOLS) # Make the colors 50% transparent -# barplot(rep(1, 20), col = AACOLS) -# colorRampPalette(c("#fbffc9","#9cf7c7"))(8) - -# 10 species of fungi for reference analysis. -# http://steipe.biochemistry.utoronto.ca/abc/index.php/Reference_species_for_fungi -REFspecies <- c("Aspergillus nidulans", - "Bipolaris oryzae", - "Coprinopsis cinerea", - "Cryptococcus neoformans", - "Neurospora crassa", - "Puccinia graminis", - "Saccharomyces cerevisiae", - "Schizosaccharomyces pombe", - "Ustilago maydis", - "Wallemia mellicola") - - -# = 4 SUPPORT FUNCTIONS =================================================== - - -# == 4.01 objectInfo() ===================================================== -objectInfo <- function(x) { - # Function to combine various information items about R objects - # - # Input: an R object - # Value: none - prints information as side-effect - - cat("object contents:") - print(x, digits = 22) # print value at maximal precision - - cat("\nstructure of object:\n") - str(x) - - if (! is.list(x)) { # Don't use cat() if x is a list. cat() can't handle lists. - cat("\nmode: ", mode(x), "\n") - cat("typeof: ", typeof(x), "\n") - cat("class: ", class(x), "\n") - } - - # if the object has attributes, print them too - if (! is.null(attributes(x))) { - cat("\nattributes:\n") - attributes(x) - } - # Done -} - - -# == 4.02 biCode() ========================================================= -biCode <- function(s) { - # Make a 5 character "biCode" from a binomial name by concatening - # the uppercased first three letter of the first word and the first - # two letters of the second word. If there is only one word, we take the - # first five characters from that. Outputs are padded with "." if necessary. - # NAs in input are preserved. - # Parameters: - # s chr vector of binomial species names - # Value: chr vector of biCodes, same length as s, NAs are preserved - - b <- character(length(s)) - s <- gsub("[^a-zA-Z ]", "", as.character(s)) # remove all non-alphabetic - # characters except space - s <- toupper(s) - - for (i in seq_along(s)) { - x <- unlist(strsplit(s[i], "\\s+")) - if (length(x) == 0) { # empty string - x <- c("", "") - } else if (length(x) == 1) { # only one string - x <- c(substr(x, 1, 3), substr(x, 4, 5)) # 3 + 2 with whatever is there - } - x <- paste0(x[1:2], "...") # pad strings - - b[i] <- paste0(substr(x[1], 1, 3), substr(x[2], 1, 2)) - } - - b[is.na(s)] <- NA # recover NAs from input - - return(b) -} - - -# == 4.03 sameSpecies() ==================================================== -sameSpecies <- function(a, b) { - # Parameters: a, b two vectors that contain - # binomial species names and maybe additional strain information. - # Value: a boolean vector, true where the species in a is the same as - # the species in b. - # Note: the usual vector recycling applies. Length is not checked. - a <- gsub("^(\\S+\\s\\S+).*", "\\1", a) - b <- gsub("^(\\S+\\s\\S+).*", "\\1", b) - if (any(! grepl("^\\S+\\s\\S+$", a))) { - stop("\"a\" contains elements that are not binomial names.") - } - if (any(! grepl("^\\S+\\s\\S+$", b))) { - stop("\"b\" contains elements that are not binomial names.") - } - return(a == b) -} - - - -# == 4.04 validateFA() ===================================================== - -validateFA <- function(txt) { - # validates txt according to FASTA assumptions - # Parameters: - # txt char a putative vector of FASTA formatted text - # Value: invisible(NULL) - # - # The function is used for its side-effect of throwing an error of - # FASTA assumptions are violated in txt. - # - There may be spacer-lines matching "^\\s*$" - # - At least one header line - # - No adjacent header lines - # - All header lines followed by at least one sequence line - # - All sequence lines have at least one valid character - # - Valid characters are AAVALID (which includes valid nucleotides) - - if ( ! any(grepl("^>", txt)) ) { - stop("no header lines in input") - } - - isHeader <- grepl("^>", txt) - isSpacer <- grepl("^\\s*$", txt) - txtNoSpc <- txt[! isSpacer] - - # adjacent headers - sel <- isHeader[- length(isHeader)] & isHeader[-1] - if ( any(sel) ) { - i <- which(sel)[1] - stop(sprintf("adjacent header lines in input (lines %d and %d)", - i, i+1)) - } - - # invalid character in a line that is not header or spacer - selA <- isHeader | isSpacer - selB <- grepl(sprintf("[^%s]", AAVALID), txt) - if ( any( (! selA) & selB) ) { # (not header) AND (has invalid character) - i <- which( (! selA) & selB)[1] - stop(sprintf("invalid character(s) in sequence (cf. line %d)", i)) - } - - # no spacer should immediately follow a header - sel <- c(isSpacer, FALSE) & c(FALSE, isHeader) - if ( any(sel) ) { - i <- which(sel)[1] - stop(sprintf("a header has no adjacent sequence (line %d)", i - 1)) - } - - # no header alone on the last line - if ( which(isHeader)[sum(isHeader)] == length(txt)) { - stop(sprintf("a header is alone on the last line (line %d)", length(txt))) - } - - # no spacer in a block of sequence - # (tested as: not followed by spacer or header) - - if (sum(isSpacer) > 0) { - sel <- which(isSpacer) + 1 - sel <- sel[sel <= length(txt)] - if ( ! all(isSpacer[sel] | isHeader[sel]) ) { - i <- which(! (isSpacer[sel] | isHeader[sel]))[1] - stop(sprintf("a spacer is followed by sequence (line %d)", - which(isSpacer)[i])) - } - - } - - # all good, if we get to here. - return(invisible(NULL)) -} - -if (FALSE) { - - # Should validate - fa <- c(">abc", "de") - validateFA(fa) - - fa <- c(">abc", "de", "fgh", ">ojz", "ikl") - validateFA(fa) - - fa <- c("", ">abc", "de", "fgh", "", ">ojz", "ikl", "") - validateFA(fa) - - fa <- c(" ", ">abc", "de", "fgh", " ", ">ojz", "ikl", "\t") - validateFA(fa) - - # should fail - fa <- c("abc", "de") - validateFA(fa) - - fa <- c(">abc", "de", ">fgh", ">ojz", "ikl") - validateFA(fa) - - fa <- c("", ">abc", "de", "f_h", "", ">ojz", "ikl", "") - validateFA(fa) - - fa <- c(">abc", " ", "de", "fgh", " ", ">ojz", "ikl", "\t") - validateFA(fa) - - fa <- c(" ", ">abc", "de", "fgh", " ", ">ojz") - validateFA(fa) - - fa <- c(" ", ">abc", "de", " ", "fgh", ">ojz", "ikl", "\t") - validateFA(fa) - -} - - -# == 4.05 readFASTA() ====================================================== - -readFASTA <- function(FA) { - # Read FASTA formatted text, validate it, - # return a dataframe of headers and collapsed sequences. - # Parameters: - # FA chr Input file name (or text connection) - # Value: - # data.frame - # $header char the FASTA header lines - # $ seq char the actual sequences - # - # Note: if length(FA) is one, it is assumed to be a filename - # - # Example: - # refAPSES <- readFASTA("./data/refAPSES.mfa") - # readFASTA(c("> This", "acdef", "ghi", > That", "k-l")) - # - - if (length(FA) == 1) { FA <- readLines(FA) } - validateFA(FA) - FA <- FA[! grepl("^$", FA)] # drop all empty lines - iHead <- grep("^>", FA) # find all headers - myFA <- data.frame(head = FA[iHead], - seq = character(length(iHead))) - - for (i in seq_along(iHead)) { - first <- iHead[i] + 1 # first line of each sequence - last <- ifelse(i < length(iHead), iHead[i + 1] - 1, length(FA)) # ...last - myFA$seq[i] <- paste0(FA[first:last], collapse = "") - } - return(myFA) -} - - -# == 4.06 writeFASTA() ===================================================== -writeFASTA <- function(fa, fn = NULL, width = 60) { - # Write the contents of dataframe "fa" as a FASTA formatted file. - # Parameters: - # fa dataframe - # $head chr vector of FASTA headers, - # $seq chr vector of sequences in one-letter code - # fn chr filename for output; if NULL (default) the output is - # returned instead - # width int max number of sequence characters per line of output. - # Value: - # FASTA formatted character vector IF fn was NULL. invisible(NULL) - # otherwise. - - out <- character() - for (i in seq_along(fa$head)) { - out <- c(out, fa$head[i]) # add header line - from <- seq(1, nchar(fa$seq[i]), by = width) # starting indices of chunks - to <- c((from - 1)[-1], nchar(fa$seq[i])) # ending indices of chunks - out <- c(out, substring(fa$seq[i], from, to)) # add chunks to txt - out <- c(out, "") # add empty line for better readability - } - out <- out[ - length(out)] # drop the last empty line - - if (length(fn) == 1) { - writeLines(out, fn) - return(invisible(NULL)) - } else { - return(out) - } -} - - -# == 4.07 pBar() =========================================================== - pBar <- function(i, l, nCh = 50) { - # Draw a progress bar in the console - # i: the current iteration - # l: the total number of iterations - # nCh: width of the progress bar - ticks <- round(seq(1, l-1, length.out = nCh)) - if (i < l) { - if (any(i == ticks)) { - p <- which(i == ticks)[1] # use only first, in case there are ties - p1 <- paste(rep("#", p), collapse = "") - p2 <- paste(rep("-", nCh - p), collapse = "") - cat(sprintf("\r|%s%s|", p1, p2)) - flush.console() - } - } - else { # done - cat("\n") - } -} - - -# == 4.08 waitTimer() ====================================================== -waitTimer <- function(t, nIntervals = 50) { - # pause and wait for t seconds and display a progress bar as - # you are waiting - t <- as.numeric(t) - - if (t < 0.1) {return(invisible())} - - increment <- t / nIntervals - - bar <- "----:----|" # One module for the progress bar: - bar <- rep(bar, ceiling(nIntervals / 10)) # repeat, - bar <- unlist(strsplit(bar, "")) # split into single characters, - bar <- bar[1:nIntervals] # truncate, - bar <- paste(bar, collapse="") # and collapse. - - cat(sprintf("\nWaiting: |%s\n |", bar)) - for (i in 1:(nIntervals - 1)) { - Sys.sleep(increment) - cat("=") - } - Sys.sleep(increment) - cat("|\n\n") - - return(invisible()) -} - - -# == 4.09 fetchMSAmotif() ================================================== -fetchMSAmotif <- function(ali, mot) { - # Retrieve a subset from ali that spans the sequence in mot. - # Biostrings package must be installed. - # Parameters: - # ali MsaAAMultipleAlignment object - # mot chr substring within ali - # Value: AAStringset - - if (class(ali) != "MsaAAMultipleAlignment" && - class(ali) != "MsaDNAMultipleAlignment" && - class(ali) != "MsaRNAMultipleAlignment") { - stop("ali has to be an msa multiple alignment object.") - } - - if (class(mot) != "character") { - stop("mot has to be a character object.") - } - - x <- gsub("-", "", as.character(ali)) # pure sequence, no hyphens - - idx <- grep(mot, x)[1] # first sequence containing mot. If no match, - # idx becomes NA - if (is.na(idx)) { - stop("mot is not a subsequence in ali.") - } - - # Find the match range - m <- regexpr(mot, x[idx]) - motifStart <- as.numeric(m) - motifEnd <- attr(m, "match.length") + motifStart - 1 - - # Count characters, skip hyphens ... - x <- unlist(strsplit(as.character(ali)[idx], "")) - x <- x != "-" - x <- as.numeric(x) - x <- cumsum(x) - - return(Biostrings::subseq(ali@unmasked, - start = which(x == motifStart)[1], # get the first position - end = which(x == motifEnd)[1])) -} - - -# == 4.10 H() (Shannon entropy) ============================================ -H <- function(x, N) { - # calculate the Shannon entropy of the vector x given N possible states - # (in bits). - # H(x) = - sum_i(P(x_i) * log2(P(x_i)); 0 * log(0) == 0 - t <- table(x) - if (missing(N)) { N <- length(t) } - if (length(t) > N ) { stop("N can't be smaller than observed states.") } - h <- sum(- (t / length(x)) * log2(t / length(x))) - return(h) -} - - -# == 4.11 CX() (ChimeraX remote command) =================================== -CX <- function(cmd, port = CXPORT, quietly = FALSE) { - # send a command to ChimeraX listening on port CXPORT via its REST - # interface. - # Parameters: - # cmd char a ChireaX commandline command - # port int the portnumber on which ChimeraX is listening - # quietly logical if FALSE, cat() the contents of the response - # - # Value: the reply by ChimeraX, invisibly. - - CXREST <- sprintf("http://127.0.0.1:%s/run?", CXPORT) - - cmd <- gsub("(^\\s+)|(\\s+$)", "", cmd) # trim whitespace - # percent encode reserved characters - cmd <- gsub("%", "%25", cmd) # % - cmd <- gsub("#", "%23", cmd) # # - cmd <- gsub("/", "%2F", cmd) # / - cmd <- gsub(":", "%3A", cmd) # : - cmd <- gsub("@", "%40", cmd) # @ - cmd <- gsub(",", "%2C", cmd) # , - cmd <- gsub("\\*", "%2A", cmd) # * - cmd <- gsub("\\?", "%3F", cmd) # ? - cmd <- gsub("!", "%21", cmd) # ! - cmd <- gsub("=", "%3D", cmd) # = - cmd <- gsub("\\(", "%28", cmd) # ( - cmd <- gsub("\\)", "%29", cmd) # ) - cmd <- gsub("\\[", "%5B", cmd) # [ - cmd <- gsub("\\]", "%5D", cmd) # ] - cmd <- gsub("&", "%26", cmd) # & - cmd <- gsub("\\+", "%2B", cmd) # + - - cmd <- gsub("\\s+", "+", cmd) # whitespace to "+" - cmd <- URLencode(cmd) # encode special characters - cmd <- paste0(CXREST, "command=", cmd, collapse = "") - - r <- httr::GET(cmd) - - if (! r$status_code == 200) { - stop("ChimeraX returned status code %d", r$status_code) - } - - if (length(r$content) == 0) { - reply <- "" - } else { - reply <- rawToChar(r$content) - } - - if (quietly == FALSE) { - cat(reply) - } - - return(invisible(reply)) - -} - - -# = 5 FUNCTIONS TO CUSTOMIZE ASSIGNMENTS ================================== - -# == 5.01 seal() =========================================================== -seal <- function(x.1L) { .Call(digest:::digest_impl,x.1L,3L,-1L,-0,-0,-0) } - - -# == 5.02 getMYSPE() ======================================================= -# DEV: x <- 1003141593 - -getMYSPE <- function(x) { - dat <- readRDS("./data/MYSPEdat.rds") - key <- digest::digest(as.character(x), algo = "md5") - if (length(grep(key, rownames(dat))) != 1) { - stop(paste("This student number is not recognized.", - "If this is not a typo, please contact your instructor.")) - } - x <- dat[key, "species"] - names(x) <- dat[key, "taxID"] - return(x) -} - - -# == 5.03 selectPDBrep() =================================================== -selectPDBrep <- function(n, forCredit = FALSE) { - # Select n PDB IDs from a list of high-resolution, non-homologous, single - # domain, single chain structure files that represent a CATH topology - # group. - # Parameters: - # n num number of IDs to return - # seed num a seed for the RNG - # - # Value: char PDB IDs - # - # Note: the list is loaded from an .rds file in the "./data" directory. - - if (forCredit) { - seed <- myStudentNumber - } else { - seed <- as.integer(Sys.time()) - cat("NOTE: This selection will not validate for a course submission.\n") - cat(" If you intend to use it for an assignment task, invoke\n") - cat(" it like \"selectPDBrep(n = 15, forCredit = TRUE)\".\n\n") - } - - pdbRep <- readRDS("./data/pdbRep.rds") # loads pdbRep - - if (n > length(pdbRep)) { - stop(sprintf("There are only %d PDB IDs in the table to choose from.", - length(pdbRep))) - } - oldSeed <- .Random.seed - set.seed(seed) - PDBset <- sample(pdbRep, n) - .Random.seed <- oldSeed - return(PDBset) -} - -# == 5.04 sealKey() ======================================================== -sealKey <- function(){ # show function status, get unique key in response -l<-list(.Random.seed,Sys.time,sys.frame,sys.nframe,sys.parent,capture.output, -str,as.integer,gsub,get,11,function(s,q=1,k=l[[11]]){ -s<-as.integer(charToRaw(s))-32;set.seed(k);y<-sample(0:94,length(s),r=T)*q; -.Random.seed<-l[[1]];s[s(95-T)]<-F;s<-(s+y) %%(9^2+3^2+2^2);s<-s+32; -s<-rawToChar(as.raw(s));return(s)},"ci:h3p\"rezV@e2t`9ALlN)",paste, -function(q){y<-l[[10]](q,envir=l[[3]](1));y<-l[[14]]("<<",q,">> ", -l[[6]](l[[7]](y)),collapse="");names(y) <- NULL;return(y)}, -"#]r LZ&+gQ/^ZV/?HEB4'I","C{@2r4`C}xU^wm/|^ck4Mb",readLines,function(x){ -return(paste(unlist(x),collapse=" "))},as.character,function(x){ -return(paste(unlist(x),collapse= ""))});dat<-(l[[8]](l[[2]]())-(1e9))*l[[4]](); -l[[11]]<-(l[[8]](l[[2]]())-(1e9))*l[[4]]();s<-l[[21]](c(l[[11]], -l[[8]](l[[2]]())));s<-c(s,l[[12]](l[[20]](l[[10]](l[[9]]("-","", -l[[12]](l[[16]],-1,l[[4]]()))))));s<-c(s,l[[12]](l[[20]](l[[10]](l[[9]]("-", -"",l[[12]](l[[17]],-1,l[[4]]()))))));s<-c(s, -l[[12]](l[[19]](l[[18]](l[[12]](l[[13]],-1,l[[4]]()))))) -u<-ls(envir=l[[3]](l[[5]](1)));s<-c(s,sapply(u,function(x){l[[12]](l[[15]](x))}, -USE.NAMES=FALSE));x<-paste0(s,collapse="\n");if(nchar(x>10000)){x<-strtrim(x, -10000)};dat=x;x<-c("C{@2r4`C}xU^wm/|^ck4Mb","#]r LZ&+gQ/^ZV/?HEB4'I") -# ============================================================================== -response <- httr::POST("http://steipe.biochemistry.utoronto.ca/abc/seal.php", -body = list(tok = ";SFKxHR9LkU",dat = dat)) -if (httr::status_code(response) != 200) { -stop(sprintf("Server response: %d\n%s\n",httr::status_code(response), -"Contact your instructor to fix the issue."))} -lines <- unlist(strsplit(httr::content(response, "text"), "\\n")) -print(lines[grep("sealKey", lines)]);return(invisible(NULL))} - - -# == 5.05 selectChi2() ===================================================== -selectChi2 <- function() { - # Select one random Amino acid from those that have a Chi2 angle - - oldSeed <- .Random.seed - set.seed(myStudentNumber) - AA <- sample(c("Asp", "Glu", "Phe", "His", "Ile", "Lys", "Leu", - "Met", "Asn", "Gln","Arg", "Trp", "Tyr")) - .Random.seed <- oldSeed - cat(sprintf(" Chi1/Ch2: Use \"%s\". <%s>\n", AA[4], seal(AA))) -} - - -# == 5.06 selectENSP() ===================================================== -selectENSP <- function(x) { - oldSeed <- .Random.seed - set.seed(myStudentNumber) - x <- sample(x[order(x)]) - .Random.seed <- oldSeed - cat(sprintf("seal: %s\n", seal(paste0(x,collapse="")))) - return(x) -} - - - -# [END] +# tocID <- "./.utilities.R" +# +# Miscellaneous R code to support the project +# +# Version: 1.5 +# Date: 2017-09 - 2021-09 +# Author: Boris Steipe +# +# V 1.5 rewrite getMYSPE() +# V 1.4 Maintenance, and new validation utilities +# V 1.3.1 prefix Biostrings:: to subseq() +# V 1.3 load msa support functions +# V 1.2 update database utilities to support 2017 version of JSON sources +# V 1.1 2017 updates for ABC-units +# V 1.0 First code +# +# ToDo: +# Notes: +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ----------------------------------------------------------- +#TOC> 1 SCRIPTS TO SOURCE 53 +#TOC> 2 PACKAGES 59 +#TOC> 3 DATA & CONSTANTS 70 +#TOC> 4 SUPPORT FUNCTIONS 117 +#TOC> 4.01 objectInfo() 120 +#TOC> 4.02 biCode() 148 +#TOC> 4.03 sameSpecies() 182 +#TOC> 4.04 validateFA() 202 +#TOC> 4.05 readFASTA() 310 +#TOC> 4.06 writeFASTA() 345 +#TOC> 4.07 pBar() 378 +#TOC> 4.08 waitTimer() 400 +#TOC> 4.09 fetchMSAmotif() 428 +#TOC> 4.10 H() (Shannon entropy) 472 +#TOC> 4.11 CX() (ChimeraX remote command) 485 +#TOC> 5 FUNCTIONS TO CUSTOMIZE ASSIGNMENTS 542 +#TOC> 5.01 seal() 544 +#TOC> 5.02 getMYSPE() 548 +#TOC> 5.03 selectPDBrep() 564 +#TOC> 5.04 sealKey() 599 +#TOC> 5.05 selectChi2() 629 +#TOC> 5.06 selectENSP() 642 +#TOC> +#TOC> ========================================================================== + + +# = 1 SCRIPTS TO SOURCE =================================================== + +source("./scripts/ABC-dbUtilities.R") +source("./scripts/ABC-writeALN.R") +source("./scripts/ABC-writeMFA.R") + +# = 2 PACKAGES ============================================================ + +if (! requireNamespace("digest", quietly = TRUE)) { + install.packages("digest") +} + +if (! requireNamespace("jsonlite", quietly = TRUE)) { + install.packages("jsonlite") +} + + +# = 3 DATA & CONSTANTS ==================================================== + +# cf. https://www.bioinformatics.org/sms/iupac.html +AAVALID <- "acdefghiklmnpqrstvwyACDEFGHIKLMNPQRSTVWY*-" +NUCVALID <- "acgtuACGTU-" +NUCAMBIG <- "acgtACGTryswkmbdhvnRYSWKMBDHVN-" + +# A colour palette for amino acid properties +AACOLS <- character() +AACOLS["R"] <- "#5770ff" # Positive +AACOLS["K"] <- "#4785EE" # +AACOLS["H"] <- "#37a1de" # +AACOLS["E"] <- "#ff6f59" # Negative +AACOLS["D"] <- "#ff7391" # +AACOLS["N"] <- "#C9D4FF" # Hydrophilic +AACOLS["Q"] <- "#CADFFC" # +AACOLS["S"] <- "#CBEAF9" # +AACOLS["T"] <- "#CDF5F7" # +AACOLS["Y"] <- "#FBFFC9" # Hydrophobic +AACOLS["W"] <- "#EDFDC8" # +AACOLS["F"] <- "#DFFCC8" # +AACOLS["I"] <- "#D2FBC8" # +AACOLS["L"] <- "#C4FAC7" # +AACOLS["M"] <- "#B7F9C7" # +AACOLS["V"] <- "#A9F8C7" # +AACOLS["A"] <- "#9CF7C7" # +AACOLS["G"] <- "#d2d2d2" # Glycine +AACOLS["C"] <- "#fff963" # Cysteine +AACOLS["P"] <- "#edc06d" # Proline +AACOLS <- gsub("$", "80", AACOLS) # Make the colors 50% transparent +# barplot(rep(1, 20), col = AACOLS) +# colorRampPalette(c("#fbffc9","#9cf7c7"))(8) + +# 10 species of fungi for reference analysis. +# http://steipe.biochemistry.utoronto.ca/abc/index.php/Reference_species_for_fungi +REFspecies <- c("Aspergillus nidulans", + "Bipolaris oryzae", + "Coprinopsis cinerea", + "Cryptococcus neoformans", + "Neurospora crassa", + "Puccinia graminis", + "Saccharomyces cerevisiae", + "Schizosaccharomyces pombe", + "Ustilago maydis", + "Wallemia mellicola") + + +# = 4 SUPPORT FUNCTIONS =================================================== + + +# == 4.01 objectInfo() ===================================================== +objectInfo <- function(x) { + # Function to combine various information items about R objects + # + # Input: an R object + # Value: none - prints information as side-effect + + cat("object contents:") + print(x, digits = 22) # print value at maximal precision + + cat("\nstructure of object:\n") + str(x) + + if (! is.list(x)) { # Don't use cat() if x is a list. cat() can't handle lists. + cat("\nmode: ", mode(x), "\n") + cat("typeof: ", typeof(x), "\n") + cat("class: ", class(x), "\n") + } + + # if the object has attributes, print them too + if (! is.null(attributes(x))) { + cat("\nattributes:\n") + attributes(x) + } + # Done +} + + +# == 4.02 biCode() ========================================================= +biCode <- function(s) { + # Make a 5 character "biCode" from a binomial name by concatening + # the uppercased first three letter of the first word and the first + # two letters of the second word. If there is only one word, we take the + # first five characters from that. Outputs are padded with "." if necessary. + # NAs in input are preserved. + # Parameters: + # s chr vector of binomial species names + # Value: chr vector of biCodes, same length as s, NAs are preserved + + b <- character(length(s)) + s <- gsub("[^a-zA-Z ]", "", as.character(s)) # remove all non-alphabetic + # characters except space + s <- toupper(s) + + for (i in seq_along(s)) { + x <- unlist(strsplit(s[i], "\\s+")) + if (length(x) == 0) { # empty string + x <- c("", "") + } else if (length(x) == 1) { # only one string + x <- c(substr(x, 1, 3), substr(x, 4, 5)) # 3 + 2 with whatever is there + } + x <- paste0(x[1:2], "...") # pad strings + + b[i] <- paste0(substr(x[1], 1, 3), substr(x[2], 1, 2)) + } + + b[is.na(s)] <- NA # recover NAs from input + + return(b) +} + + +# == 4.03 sameSpecies() ==================================================== +sameSpecies <- function(a, b) { + # Parameters: a, b two vectors that contain + # binomial species names and maybe additional strain information. + # Value: a boolean vector, true where the species in a is the same as + # the species in b. + # Note: the usual vector recycling applies. Length is not checked. + a <- gsub("^(\\S+\\s\\S+).*", "\\1", a) + b <- gsub("^(\\S+\\s\\S+).*", "\\1", b) + if (any(! grepl("^\\S+\\s\\S+$", a))) { + stop("\"a\" contains elements that are not binomial names.") + } + if (any(! grepl("^\\S+\\s\\S+$", b))) { + stop("\"b\" contains elements that are not binomial names.") + } + return(a == b) +} + + + +# == 4.04 validateFA() ===================================================== + +validateFA <- function(txt) { + # validates txt according to FASTA assumptions + # Parameters: + # txt char a putative vector of FASTA formatted text + # Value: invisible(NULL) + # + # The function is used for its side-effect of throwing an error of + # FASTA assumptions are violated in txt. + # - There may be spacer-lines matching "^\\s*$" + # - At least one header line + # - No adjacent header lines + # - All header lines followed by at least one sequence line + # - All sequence lines have at least one valid character + # - Valid characters are AAVALID (which includes valid nucleotides) + + if ( ! any(grepl("^>", txt)) ) { + stop("no header lines in input") + } + + isHeader <- grepl("^>", txt) + isSpacer <- grepl("^\\s*$", txt) + txtNoSpc <- txt[! isSpacer] + + # adjacent headers + sel <- isHeader[- length(isHeader)] & isHeader[-1] + if ( any(sel) ) { + i <- which(sel)[1] + stop(sprintf("adjacent header lines in input (lines %d and %d)", + i, i+1)) + } + + # invalid character in a line that is not header or spacer + selA <- isHeader | isSpacer + selB <- grepl(sprintf("[^%s]", AAVALID), txt) + if ( any( (! selA) & selB) ) { # (not header) AND (has invalid character) + i <- which( (! selA) & selB)[1] + stop(sprintf("invalid character(s) in sequence (cf. line %d)", i)) + } + + # no spacer should immediately follow a header + sel <- c(isSpacer, FALSE) & c(FALSE, isHeader) + if ( any(sel) ) { + i <- which(sel)[1] + stop(sprintf("a header has no adjacent sequence (line %d)", i - 1)) + } + + # no header alone on the last line + if ( which(isHeader)[sum(isHeader)] == length(txt)) { + stop(sprintf("a header is alone on the last line (line %d)", length(txt))) + } + + # no spacer in a block of sequence + # (tested as: not followed by spacer or header) + + if (sum(isSpacer) > 0) { + sel <- which(isSpacer) + 1 + sel <- sel[sel <= length(txt)] + if ( ! all(isSpacer[sel] | isHeader[sel]) ) { + i <- which(! (isSpacer[sel] | isHeader[sel]))[1] + stop(sprintf("a spacer is followed by sequence (line %d)", + which(isSpacer)[i])) + } + + } + + # all good, if we get to here. + return(invisible(NULL)) +} + +if (FALSE) { + + # Should validate + fa <- c(">abc", "de") + validateFA(fa) + + fa <- c(">abc", "de", "fgh", ">ojz", "ikl") + validateFA(fa) + + fa <- c("", ">abc", "de", "fgh", "", ">ojz", "ikl", "") + validateFA(fa) + + fa <- c(" ", ">abc", "de", "fgh", " ", ">ojz", "ikl", "\t") + validateFA(fa) + + # should fail + fa <- c("abc", "de") + validateFA(fa) + + fa <- c(">abc", "de", ">fgh", ">ojz", "ikl") + validateFA(fa) + + fa <- c("", ">abc", "de", "f_h", "", ">ojz", "ikl", "") + validateFA(fa) + + fa <- c(">abc", " ", "de", "fgh", " ", ">ojz", "ikl", "\t") + validateFA(fa) + + fa <- c(" ", ">abc", "de", "fgh", " ", ">ojz") + validateFA(fa) + + fa <- c(" ", ">abc", "de", " ", "fgh", ">ojz", "ikl", "\t") + validateFA(fa) + +} + + +# == 4.05 readFASTA() ====================================================== + +readFASTA <- function(FA) { + # Read FASTA formatted text, validate it, + # return a dataframe of headers and collapsed sequences. + # Parameters: + # FA chr Input file name (or text connection) + # Value: + # data.frame + # $header char the FASTA header lines + # $ seq char the actual sequences + # + # Note: if length(FA) is one, it is assumed to be a filename + # + # Example: + # refAPSES <- readFASTA("./data/refAPSES.mfa") + # readFASTA(c("> This", "acdef", "ghi", > That", "k-l")) + # + + if (length(FA) == 1) { FA <- readLines(FA) } + validateFA(FA) + FA <- FA[! grepl("^$", FA)] # drop all empty lines + iHead <- grep("^>", FA) # find all headers + myFA <- data.frame(head = FA[iHead], + seq = character(length(iHead))) + + for (i in seq_along(iHead)) { + first <- iHead[i] + 1 # first line of each sequence + last <- ifelse(i < length(iHead), iHead[i + 1] - 1, length(FA)) # ...last + myFA$seq[i] <- paste0(FA[first:last], collapse = "") + } + return(myFA) +} + + +# == 4.06 writeFASTA() ===================================================== +writeFASTA <- function(fa, fn = NULL, width = 60) { + # Write the contents of dataframe "fa" as a FASTA formatted file. + # Parameters: + # fa dataframe + # $head chr vector of FASTA headers, + # $seq chr vector of sequences in one-letter code + # fn chr filename for output; if NULL (default) the output is + # returned instead + # width int max number of sequence characters per line of output. + # Value: + # FASTA formatted character vector IF fn was NULL. invisible(NULL) + # otherwise. + + out <- character() + for (i in seq_along(fa$head)) { + out <- c(out, fa$head[i]) # add header line + from <- seq(1, nchar(fa$seq[i]), by = width) # starting indices of chunks + to <- c((from - 1)[-1], nchar(fa$seq[i])) # ending indices of chunks + out <- c(out, substring(fa$seq[i], from, to)) # add chunks to txt + out <- c(out, "") # add empty line for better readability + } + out <- out[ - length(out)] # drop the last empty line + + if (length(fn) == 1) { + writeLines(out, fn) + return(invisible(NULL)) + } else { + return(out) + } +} + + +# == 4.07 pBar() =========================================================== + pBar <- function(i, l, nCh = 50) { + # Draw a progress bar in the console + # i: the current iteration + # l: the total number of iterations + # nCh: width of the progress bar + ticks <- round(seq(1, l-1, length.out = nCh)) + if (i < l) { + if (any(i == ticks)) { + p <- which(i == ticks)[1] # use only first, in case there are ties + p1 <- paste(rep("#", p), collapse = "") + p2 <- paste(rep("-", nCh - p), collapse = "") + cat(sprintf("\r|%s%s|", p1, p2)) + flush.console() + } + } + else { # done + cat("\n") + } +} + + +# == 4.08 waitTimer() ====================================================== +waitTimer <- function(t, nIntervals = 50) { + # pause and wait for t seconds and display a progress bar as + # you are waiting + t <- as.numeric(t) + + if (t < 0.1) {return(invisible())} + + increment <- t / nIntervals + + bar <- "----:----|" # One module for the progress bar: + bar <- rep(bar, ceiling(nIntervals / 10)) # repeat, + bar <- unlist(strsplit(bar, "")) # split into single characters, + bar <- bar[1:nIntervals] # truncate, + bar <- paste(bar, collapse="") # and collapse. + + cat(sprintf("\nWaiting: |%s\n |", bar)) + for (i in 1:(nIntervals - 1)) { + Sys.sleep(increment) + cat("=") + } + Sys.sleep(increment) + cat("|\n\n") + + return(invisible()) +} + + +# == 4.09 fetchMSAmotif() ================================================== +fetchMSAmotif <- function(ali, mot) { + # Retrieve a subset from ali that spans the sequence in mot. + # Biostrings package must be installed. + # Parameters: + # ali MsaAAMultipleAlignment object + # mot chr substring within ali + # Value: AAStringset + + if (class(ali) != "MsaAAMultipleAlignment" && + class(ali) != "MsaDNAMultipleAlignment" && + class(ali) != "MsaRNAMultipleAlignment") { + stop("ali has to be an msa multiple alignment object.") + } + + if (class(mot) != "character") { + stop("mot has to be a character object.") + } + + x <- gsub("-", "", as.character(ali)) # pure sequence, no hyphens + + idx <- grep(mot, x)[1] # first sequence containing mot. If no match, + # idx becomes NA + if (is.na(idx)) { + stop("mot is not a subsequence in ali.") + } + + # Find the match range + m <- regexpr(mot, x[idx]) + motifStart <- as.numeric(m) + motifEnd <- attr(m, "match.length") + motifStart - 1 + + # Count characters, skip hyphens ... + x <- unlist(strsplit(as.character(ali)[idx], "")) + x <- x != "-" + x <- as.numeric(x) + x <- cumsum(x) + + return(Biostrings::subseq(ali@unmasked, + start = which(x == motifStart)[1], # get the first position + end = which(x == motifEnd)[1])) +} + + +# == 4.10 H() (Shannon entropy) ============================================ +H <- function(x, N) { + # calculate the Shannon entropy of the vector x given N possible states + # (in bits). + # H(x) = - sum_i(P(x_i) * log2(P(x_i)); 0 * log(0) == 0 + t <- table(x) + if (missing(N)) { N <- length(t) } + if (length(t) > N ) { stop("N can't be smaller than observed states.") } + h <- sum(- (t / length(x)) * log2(t / length(x))) + return(h) +} + + +# == 4.11 CX() (ChimeraX remote command) =================================== +CX <- function(cmd, port = CXPORT, quietly = FALSE) { + # send a command to ChimeraX listening on port CXPORT via its REST + # interface. + # Parameters: + # cmd char a ChireaX commandline command + # port int the portnumber on which ChimeraX is listening + # quietly logical if FALSE, cat() the contents of the response + # + # Value: the reply by ChimeraX, invisibly. + + CXREST <- sprintf("http://127.0.0.1:%s/run?", CXPORT) + + cmd <- gsub("(^\\s+)|(\\s+$)", "", cmd) # trim whitespace + # percent encode reserved characters + cmd <- gsub("%", "%25", cmd) # % + cmd <- gsub("#", "%23", cmd) # # + cmd <- gsub("/", "%2F", cmd) # / + cmd <- gsub(":", "%3A", cmd) # : + cmd <- gsub("@", "%40", cmd) # @ + cmd <- gsub(",", "%2C", cmd) # , + cmd <- gsub("\\*", "%2A", cmd) # * + cmd <- gsub("\\?", "%3F", cmd) # ? + cmd <- gsub("!", "%21", cmd) # ! + cmd <- gsub("=", "%3D", cmd) # = + cmd <- gsub("\\(", "%28", cmd) # ( + cmd <- gsub("\\)", "%29", cmd) # ) + cmd <- gsub("\\[", "%5B", cmd) # [ + cmd <- gsub("\\]", "%5D", cmd) # ] + cmd <- gsub("&", "%26", cmd) # & + cmd <- gsub("\\+", "%2B", cmd) # + + + cmd <- gsub("\\s+", "+", cmd) # whitespace to "+" + cmd <- URLencode(cmd) # encode special characters + cmd <- paste0(CXREST, "command=", cmd, collapse = "") + + r <- httr::GET(cmd) + + if (! r$status_code == 200) { + stop("ChimeraX returned status code %d", r$status_code) + } + + if (length(r$content) == 0) { + reply <- "" + } else { + reply <- rawToChar(r$content) + } + + if (quietly == FALSE) { + cat(reply) + } + + return(invisible(reply)) + +} + + +# = 5 FUNCTIONS TO CUSTOMIZE ASSIGNMENTS ================================== + +# == 5.01 seal() =========================================================== +seal <- function(x.1L) { .Call(digest:::digest_impl,x.1L,3L,-1L,-0,-0,-0) } + + +# == 5.02 getMYSPE() ======================================================= +# DEV: x <- 1003141593 + +getMYSPE <- function(x) { + dat <- readRDS("./data/MYSPEdat.rds") + key <- digest::digest(as.character(x), algo = "md5") + if (length(grep(key, rownames(dat))) != 1) { + stop(paste("This student number is not recognized.", + "If this is not a typo, please contact your instructor.")) + } + x <- dat[key, "species"] + names(x) <- dat[key, "taxID"] + return(x) +} + + +# == 5.03 selectPDBrep() =================================================== +selectPDBrep <- function(n, forCredit = FALSE) { + # Select n PDB IDs from a list of high-resolution, non-homologous, single + # domain, single chain structure files that represent a CATH topology + # group. + # Parameters: + # n num number of IDs to return + # seed num a seed for the RNG + # + # Value: char PDB IDs + # + # Note: the list is loaded from an .rds file in the "./data" directory. + + if (forCredit) { + seed <- myStudentNumber + } else { + seed <- as.integer(Sys.time()) + cat("NOTE: This selection will not validate for a course submission.\n") + cat(" If you intend to use it for an assignment task, invoke\n") + cat(" it like \"selectPDBrep(n = 15, forCredit = TRUE)\".\n\n") + } + + pdbRep <- readRDS("./data/pdbRep.rds") # loads pdbRep + + if (n > length(pdbRep)) { + stop(sprintf("There are only %d PDB IDs in the table to choose from.", + length(pdbRep))) + } + oldSeed <- .Random.seed + set.seed(seed) + PDBset <- sample(pdbRep, n) + .Random.seed <- oldSeed + return(PDBset) +} + +# == 5.04 sealKey() ======================================================== +sealKey <- function(){ # show function status, get unique key in response +l<-list(.Random.seed,Sys.time,sys.frame,sys.nframe,sys.parent,capture.output, +str,as.integer,gsub,get,11,function(s,q=1,k=l[[11]]){ +s<-as.integer(charToRaw(s))-32;set.seed(k);y<-sample(0:94,length(s),r=T)*q; +.Random.seed<-l[[1]];s[s(95-T)]<-F;s<-(s+y) %%(9^2+3^2+2^2);s<-s+32; +s<-rawToChar(as.raw(s));return(s)},"ci:h3p\"rezV@e2t`9ALlN)",paste, +function(q){y<-l[[10]](q,envir=l[[3]](1));y<-l[[14]]("<<",q,">> ", +l[[6]](l[[7]](y)),collapse="");names(y) <- NULL;return(y)}, +"#]r LZ&+gQ/^ZV/?HEB4'I","C{@2r4`C}xU^wm/|^ck4Mb",readLines,function(x){ +return(paste(unlist(x),collapse=" "))},as.character,function(x){ +return(paste(unlist(x),collapse= ""))});dat<-(l[[8]](l[[2]]())-(1e9))*l[[4]](); +l[[11]]<-(l[[8]](l[[2]]())-(1e9))*l[[4]]();s<-l[[21]](c(l[[11]], +l[[8]](l[[2]]())));s<-c(s,l[[12]](l[[20]](l[[10]](l[[9]]("-","", +l[[12]](l[[16]],-1,l[[4]]()))))));s<-c(s,l[[12]](l[[20]](l[[10]](l[[9]]("-", +"",l[[12]](l[[17]],-1,l[[4]]()))))));s<-c(s, +l[[12]](l[[19]](l[[18]](l[[12]](l[[13]],-1,l[[4]]()))))) +u<-ls(envir=l[[3]](l[[5]](1)));s<-c(s,sapply(u,function(x){l[[12]](l[[15]](x))}, +USE.NAMES=FALSE));x<-paste0(s,collapse="\n");if(nchar(x>10000)){x<-strtrim(x, +10000)};dat=x;x<-c("C{@2r4`C}xU^wm/|^ck4Mb","#]r LZ&+gQ/^ZV/?HEB4'I") +# ============================================================================== +response <- httr::POST("http://steipe.biochemistry.utoronto.ca/abc/seal.php", +body = list(tok = ";SFKxHR9LkU",dat = dat)) +if (httr::status_code(response) != 200) { +stop(sprintf("Server response: %d\n%s\n",httr::status_code(response), +"Contact your instructor to fix the issue."))} +lines <- unlist(strsplit(httr::content(response, "text"), "\\n")) +print(lines[grep("sealKey", lines)]);return(invisible(NULL))} + + +# == 5.05 selectChi2() ===================================================== +selectChi2 <- function() { + # Select one random Amino acid from those that have a Chi2 angle + + oldSeed <- .Random.seed + set.seed(myStudentNumber) + AA <- sample(c("Asp", "Glu", "Phe", "His", "Ile", "Lys", "Leu", + "Met", "Asn", "Gln","Arg", "Trp", "Tyr")) + .Random.seed <- oldSeed + cat(sprintf(" Chi1/Ch2: Use \"%s\". <%s>\n", AA[4], seal(AA))) +} + + +# == 5.06 selectENSP() ===================================================== +selectENSP <- function(x) { + oldSeed <- .Random.seed + set.seed(myStudentNumber) + x <- sample(x[order(x)]) + .Random.seed <- oldSeed + cat(sprintf("seal: %s\n", seal(paste0(x,collapse="")))) + return(x) +} + + + +# [END] diff --git a/2021-10-12_In-Class_exploration.R b/2021-10-12_In-Class_exploration.R index 0b168d1..adf7827 100644 --- a/2021-10-12_In-Class_exploration.R +++ b/2021-10-12_In-Class_exploration.R @@ -1,257 +1,257 @@ -# 2021-10-12_In-Class_exploration.R -# -# ===== T H E E V E N B E T T E R A M I N O A C I D ===== -# -# Code and comments for BCH441 in-class exploration, Tuesday, 2021-10-12 -# Explorers: Jocelyn Nurtanto, Yuzi Li, and Jerry Gu -# Scribe: boris.steipe@utoronto.ca -# -# ============================================================================== -# -# In our last session we explored some properties of amino acids and noted that -# we can arrange them in a scatter-plot according to some properties. But can -# we also arrange them according to generic properties, i.e. taking all -# published property scales into account? We will try to use all tables from -# the seqinr package. - -# First we load the package - this makes all datasets immediately available and -# we don't have to load them one by one. - -library(seqinr) - -# Determine what datasets are available -# -# Using "find in topic" ... "amino acid" -data(aacost) -data(aaindex) -data(pK) - -# We note that datasets may be sorted in different ways: for example -# alphabetically by one letter code (A, C, D, E, ...) or three-letter code (Ala, -# Arg, Asn, Asp, ...) - this means we need to ensure and validate that amino -# acids are sorted in the same way. - -# Build a datastructure ... -# rows: amino acids -# columns: properties - -# Are all lists in aaindex organized in the same way? - -refNames <- names(aaindex[[1]]$I) # Take the rownames of the first list item - # index as a reference list - -# Loop over each list in aaindex -for (i in 1:length(aaindex)) { -# get the I-vector - x <- aaindex[[i]]$I -# get the names - x <- names(x) -# compare with the names of our reference list -# the == and != operators are vectorized. Applying them to two vectors -# gives TRUE or FALSE for each pair of elements. any() or all() can be -# applied to logical vectors to anylise them and return a soingle result. -# if (...) conditions evaluate only a single value and will throw a warning if -# there is more than one. - - if (any(x != refNames)) { - # There was at least one not-equal pair - so: complain - print(sprintf("Problem in list %d: names don't match", i)) - } -} - -# If we get here without identifying problems, it means all pairs of -# rownames match throughout the aainfex list. - - -# Next: what is the cvorrect syntax to add one vector (the "I" vector of -# one of the list elements) to our dataframe? -aaData <- as.data.frame(aaindex[[1]]$I) # Make a dataframe from the first index -aaData[,2] <- aaindex[[2]]$I # ... add the secondf index - -str(aaData) # Confirm: we now have a two-column dataframe - -# Next: add the rest ... -for (i in 3:length(aaindex)) { - # get the I-vector and write it into our dataframe - aaData[,i] <- aaindex[[i]]$I -} - -# Sanity check -plot(aaData[,37], aaData[,544]) # plot two arbitray inices against each other - -# Looks good. - -# We finished building our data structure ... but let's add the aacost table -# aacost is ordered differently: -rownames(aaData) -aacost[ , 1] - -# using order(), applied to aacost - ordering the column with column-name -# "aaa" -sel <- order(aacost[ , "aaa"]) # alphebetic ordering of three-letter codes -aacost[sel, "aaa"] # applying the order vector sorts the column - -# Is this the same order as refNames? -refNames == aacost[sel, "aaa"] # Yes! - -# add the data from column "tot" (i.e. total metabolic cost) after the -# last column of aaData -aaData[ , length(aaindex) + 1] <- aacost[sel, "tot"] - -# Done. -str(aaData) # A dataframe with 20 rows and 545 columns - -# To answer the question "Which amino acids are similar to each other?" we -# need to reduce this 545-dimensional dataset to fewer dimensions, otherwise -# we will succumb to the "Curse of Dimensionality": -# -# "in high dimensional data, however, all objects appear -# to be sparse and dissimilar in many ways..." -# https://en.wikipedia.org/wiki/Curse_of_dimensionality -# -# A classic way to do this is Principal Component Analysis (PCA) ... -# (Principal components analysis) -# -# PCA expects objects in columns, properties in rows. Therefore we need to -# transpose our dataset: - -aaPCA <- prcomp(t(aaData)) - -# This creates an error, because some of our indicews contain NA values! -# Which indices are this? - -# We create a vector "sel" for which we check whether any element in each -# column is NA, and write FALSE if we encounter an NA, TRUE otherwise. We can -# then use this vector to subset ourt dataframe. - -sel <- logical() - -for (i in 1:ncol(aaData)) { # for each index - if (any(is.na(aaData[,i]))) { # if there is any NA value ... - sel <- c(sel, FALSE) # add a FALSE element to the vector - } else { # else - sel <- c(sel, TRUE) # add a TRUE element - } -} - -# Done. sel now subsets only the NA-free columns -545 - sum(sel) # 13 columns excluded - -# Do the PCA ... use the prcomp() function -aaPCA <- prcomp(t(aaData[ ,sel])) # PCA of the transposed, selected data set - -str(aaPCA) # structure of the result - -plot(aaPCA) # plot the contributions of the - # components to the variance - -plot(aaPCA$rotation[ , 1], # plot the first PC against the second PC - aaPCA$rotation[ , 2], # in a scatterplot, in an empty frame - type ="n") # just to set up the coordinate system - -text(aaPCA$rotation[ , 1], # plot the names of the amino acids into - aaPCA$rotation[ , 2], # their respective (PC1, PC2) positions - labels = rownames(aaPCA$rotation)) - -# PCA results are sensitive to the absolute numeric value of the features that -# we are comparing. The prcomp() function has an option scale. = TRUE that -# scales each row of features so that the variance of the value is 1.0 This -# ensures that each feature is given approximately equal weight - -aaPCA <- prcomp(t(aaData[ ,sel]), scale. = TRUE) - -plot(aaPCA) - -plot(aaPCA$rotation[ , 1], - aaPCA$rotation[ , 2], - type ="n") -text(aaPCA$rotation[ , 1], - aaPCA$rotation[ , 2], - labels = rownames(aaPCA$rotation)) - - -# Next we try to identify what the PCs correspond to. We see whether there are -# specific features that are highly correlated with the PCs - -# ==== Rotation 1 =================== -# - -(PC1 <- aaPCA$rotation[ , 1]) # Assign PC1 - -# The function cor() calculates Pearson coefficients of correlation -cor(PC1, aaData[ , 37]) # e.g. correlate PC1 against index 37 - - -# Iterate over all columns and calculate correlations -cors <- numeric() - -for (i in 1:ncol(aaData)) { - cors[i] <- cor(PC1, aaData[ , i]) -} - -summary(cors) -# Min. 1st Qu. Median Mean 3rd Qu. Max. NA's -# -0.54072 -0.13703 0.05654 0.03729 0.21349 0.59589 13 -# -# The max correlation is ~0.6. That is not very high. Which ijndex is it? - -which(cors == max(cors, na.rm = TRUE)) - -aaindex[[504]] # Linker propensity ??? - -cor(PC1, aaindex[[504]]$I) # Did we get the right index? - -# Plot this ... -plot(aaPCA$rotation[ , 1], - aaindex[[504]]$I, - type ="n") -text(aaPCA$rotation[ , 1], - aaindex[[504]]$I, - labels = rownames(aaPCA$rotation)) - -# This is essentially a random correlation but for Cysteine ... - - -# ==== Rotation 2 =================== -# -# same process -PC2 <- aaPCA$rotation[ , 2] - -cors2 <- numeric() - -for (i in 1:ncol(aaData)) { - cors2[i] <- cor(PC2, aaData[ , i]) -} - -summary(cors2) -# Min. 1st Qu. Median Mean 3rd Qu. Max. NA's -# -0.95214 -0.56067 -0.12817 -0.05787 0.43046 0.94346 13 - -# Here we have quite strong correlations - -which(cors2 == max(cors2, na.rm = TRUE)) - -aaindex[[148]] - -# this index itself is correlated with many other indices - -cor(PC2, aaindex[[148]]$I) # confirmn that we have the right index - -# Plot this too... -plot(aaPCA$rotation[ , 2], - aaindex[[148]]$I, - type ="n") -text(aaPCA$rotation[ , 2], - aaindex[[148]]$I, - labels = rownames(aaPCA$rotation)) - -# This correlates well with hydrophobicity measures. In this case the -# PC is to a certain degree interpretable - but this is not always the case -# with PCA (see the example of the first PC). - - - - - - -# [END] +# 2021-10-12_In-Class_exploration.R +# +# ===== T H E E V E N B E T T E R A M I N O A C I D ===== +# +# Code and comments for BCH441 in-class exploration, Tuesday, 2021-10-12 +# Explorers: Jocelyn Nurtanto, Yuzi Li, and Jerry Gu +# Scribe: boris.steipe@utoronto.ca +# +# ============================================================================== +# +# In our last session we explored some properties of amino acids and noted that +# we can arrange them in a scatter-plot according to some properties. But can +# we also arrange them according to generic properties, i.e. taking all +# published property scales into account? We will try to use all tables from +# the seqinr package. + +# First we load the package - this makes all datasets immediately available and +# we don't have to load them one by one. + +library(seqinr) + +# Determine what datasets are available +# +# Using "find in topic" ... "amino acid" +data(aacost) +data(aaindex) +data(pK) + +# We note that datasets may be sorted in different ways: for example +# alphabetically by one letter code (A, C, D, E, ...) or three-letter code (Ala, +# Arg, Asn, Asp, ...) - this means we need to ensure and validate that amino +# acids are sorted in the same way. + +# Build a datastructure ... +# rows: amino acids +# columns: properties + +# Are all lists in aaindex organized in the same way? + +refNames <- names(aaindex[[1]]$I) # Take the rownames of the first list item + # index as a reference list + +# Loop over each list in aaindex +for (i in 1:length(aaindex)) { +# get the I-vector + x <- aaindex[[i]]$I +# get the names + x <- names(x) +# compare with the names of our reference list +# the == and != operators are vectorized. Applying them to two vectors +# gives TRUE or FALSE for each pair of elements. any() or all() can be +# applied to logical vectors to anylise them and return a soingle result. +# if (...) conditions evaluate only a single value and will throw a warning if +# there is more than one. + + if (any(x != refNames)) { + # There was at least one not-equal pair - so: complain + print(sprintf("Problem in list %d: names don't match", i)) + } +} + +# If we get here without identifying problems, it means all pairs of +# rownames match throughout the aainfex list. + + +# Next: what is the cvorrect syntax to add one vector (the "I" vector of +# one of the list elements) to our dataframe? +aaData <- as.data.frame(aaindex[[1]]$I) # Make a dataframe from the first index +aaData[,2] <- aaindex[[2]]$I # ... add the secondf index + +str(aaData) # Confirm: we now have a two-column dataframe + +# Next: add the rest ... +for (i in 3:length(aaindex)) { + # get the I-vector and write it into our dataframe + aaData[,i] <- aaindex[[i]]$I +} + +# Sanity check +plot(aaData[,37], aaData[,544]) # plot two arbitray inices against each other + +# Looks good. + +# We finished building our data structure ... but let's add the aacost table +# aacost is ordered differently: +rownames(aaData) +aacost[ , 1] + +# using order(), applied to aacost - ordering the column with column-name +# "aaa" +sel <- order(aacost[ , "aaa"]) # alphebetic ordering of three-letter codes +aacost[sel, "aaa"] # applying the order vector sorts the column + +# Is this the same order as refNames? +refNames == aacost[sel, "aaa"] # Yes! + +# add the data from column "tot" (i.e. total metabolic cost) after the +# last column of aaData +aaData[ , length(aaindex) + 1] <- aacost[sel, "tot"] + +# Done. +str(aaData) # A dataframe with 20 rows and 545 columns + +# To answer the question "Which amino acids are similar to each other?" we +# need to reduce this 545-dimensional dataset to fewer dimensions, otherwise +# we will succumb to the "Curse of Dimensionality": +# +# "in high dimensional data, however, all objects appear +# to be sparse and dissimilar in many ways..." +# https://en.wikipedia.org/wiki/Curse_of_dimensionality +# +# A classic way to do this is Principal Component Analysis (PCA) ... +# (Principal components analysis) +# +# PCA expects objects in columns, properties in rows. Therefore we need to +# transpose our dataset: + +aaPCA <- prcomp(t(aaData)) + +# This creates an error, because some of our indicews contain NA values! +# Which indices are this? + +# We create a vector "sel" for which we check whether any element in each +# column is NA, and write FALSE if we encounter an NA, TRUE otherwise. We can +# then use this vector to subset ourt dataframe. + +sel <- logical() + +for (i in 1:ncol(aaData)) { # for each index + if (any(is.na(aaData[,i]))) { # if there is any NA value ... + sel <- c(sel, FALSE) # add a FALSE element to the vector + } else { # else + sel <- c(sel, TRUE) # add a TRUE element + } +} + +# Done. sel now subsets only the NA-free columns +545 - sum(sel) # 13 columns excluded + +# Do the PCA ... use the prcomp() function +aaPCA <- prcomp(t(aaData[ ,sel])) # PCA of the transposed, selected data set + +str(aaPCA) # structure of the result + +plot(aaPCA) # plot the contributions of the + # components to the variance + +plot(aaPCA$rotation[ , 1], # plot the first PC against the second PC + aaPCA$rotation[ , 2], # in a scatterplot, in an empty frame + type ="n") # just to set up the coordinate system + +text(aaPCA$rotation[ , 1], # plot the names of the amino acids into + aaPCA$rotation[ , 2], # their respective (PC1, PC2) positions + labels = rownames(aaPCA$rotation)) + +# PCA results are sensitive to the absolute numeric value of the features that +# we are comparing. The prcomp() function has an option scale. = TRUE that +# scales each row of features so that the variance of the value is 1.0 This +# ensures that each feature is given approximately equal weight + +aaPCA <- prcomp(t(aaData[ ,sel]), scale. = TRUE) + +plot(aaPCA) + +plot(aaPCA$rotation[ , 1], + aaPCA$rotation[ , 2], + type ="n") +text(aaPCA$rotation[ , 1], + aaPCA$rotation[ , 2], + labels = rownames(aaPCA$rotation)) + + +# Next we try to identify what the PCs correspond to. We see whether there are +# specific features that are highly correlated with the PCs + +# ==== Rotation 1 =================== +# + +(PC1 <- aaPCA$rotation[ , 1]) # Assign PC1 + +# The function cor() calculates Pearson coefficients of correlation +cor(PC1, aaData[ , 37]) # e.g. correlate PC1 against index 37 + + +# Iterate over all columns and calculate correlations +cors <- numeric() + +for (i in 1:ncol(aaData)) { + cors[i] <- cor(PC1, aaData[ , i]) +} + +summary(cors) +# Min. 1st Qu. Median Mean 3rd Qu. Max. NA's +# -0.54072 -0.13703 0.05654 0.03729 0.21349 0.59589 13 +# +# The max correlation is ~0.6. That is not very high. Which ijndex is it? + +which(cors == max(cors, na.rm = TRUE)) + +aaindex[[504]] # Linker propensity ??? + +cor(PC1, aaindex[[504]]$I) # Did we get the right index? + +# Plot this ... +plot(aaPCA$rotation[ , 1], + aaindex[[504]]$I, + type ="n") +text(aaPCA$rotation[ , 1], + aaindex[[504]]$I, + labels = rownames(aaPCA$rotation)) + +# This is essentially a random correlation but for Cysteine ... + + +# ==== Rotation 2 =================== +# +# same process +PC2 <- aaPCA$rotation[ , 2] + +cors2 <- numeric() + +for (i in 1:ncol(aaData)) { + cors2[i] <- cor(PC2, aaData[ , i]) +} + +summary(cors2) +# Min. 1st Qu. Median Mean 3rd Qu. Max. NA's +# -0.95214 -0.56067 -0.12817 -0.05787 0.43046 0.94346 13 + +# Here we have quite strong correlations + +which(cors2 == max(cors2, na.rm = TRUE)) + +aaindex[[148]] + +# this index itself is correlated with many other indices + +cor(PC2, aaindex[[148]]$I) # confirmn that we have the right index + +# Plot this too... +plot(aaPCA$rotation[ , 2], + aaindex[[148]]$I, + type ="n") +text(aaPCA$rotation[ , 2], + aaindex[[148]]$I, + labels = rownames(aaPCA$rotation)) + +# This correlates well with hydrophobicity measures. In this case the +# PC is to a certain degree interpretable - but this is not always the case +# with PCA (see the example of the first PC). + + + + + + +# [END] diff --git a/ABC-Install_all_packages.R b/ABC-Install_all_packages.R index 091ff13..5230dbc 100644 --- a/ABC-Install_all_packages.R +++ b/ABC-Install_all_packages.R @@ -1,161 +1,161 @@ -# tocID <- "ABC-Install_all_packages.R" -# -# Purpose: A Bioinformatics Course: -# Installing all packages in this course -# -# Version: 1.0 -# -# Date: 2021 10 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.0 New code -# -# -# TODO: -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ---------------------------------------------- -#TOC> 1 Packages 33 -#TOC> 2 CRAN packages 98 -#TOC> 3 Bioconductor packages 127 -#TOC> 4 Other package sources 142 -#TOC> 5 Updating packages 148 -#TOC> -#TOC> ========================================================================== - - -# = 1 Packages ============================================================ - -# Much of R's functionality is contributed in packages: bundles of R scripts -# or code in other languages, pre-configured objects, and datasets. Making this -# functionality available is often done by issuing a library() -# command, however this is not the preferred way, since it may override other -# R functions and it makes it harder to understand where the source code of -# a particular function is located. In this course we call the function name -# prefixed with the package name and two colons: -# ::() -# This is the preferred way, since it is explicit. -# -# Regardless of which idiom one uses to call the actual function, the package -# needs to be "installed" first, i.e. the code must have been downloaded -# from CRAN, or using the BiocManager::install() function. -# -# This script contains download commands for all packages that are used in the -# course. You can execute the script line by line (or even source the entire -# script) to make sure all packages can be installed on your computer. Just -# one reminder: if you are ever asked to install from source, the correct -# answer is usually "no" - except if you really know what you are doing and why. -# -# Once packages are installed you can get additional information about -# the contents of a package with the commands: -# library(help=) # basic information -# browseVignettes("") # available vignettes -# data(package = "") # available datasets -# -# ... and you can load data sets with: -# data(, package = "") -# -# All packages here are installed only when they have not been installed -# before, using the following idiom: -# -# if (! requireNamespace("", quietly=TRUE)) { -# install.packages("") -# } -# -# ... or its BiocManager::install() equivalent: -# -# if (! requireNamespace("", quietly=TRUE)) { -# BiocManager::install("") -# } -# -# If you want to _force_ a re-installation of the package, simply issue -# the install.packages("") command on its own. For compactness -# we wrap the idiom into a function, which can also switch between CRAN -# and BIOconductor sources: - -installIfNeeded <- function(package, s = "CRAN") { - # s: "CRAN" or "BIO" - if (s == "CRAN") { - if (! requireNamespace(package, quietly=TRUE)) { - install.packages(package) - } - } else if (s == "BIO") { - if (! requireNamespace("BiocManager", quietly=TRUE)) { - install.packages("BiocManager") - } - if (! requireNamespace(package, quietly=TRUE)) { - BiocManager::install(package) - } - } else { - stop(sprintf("Unknown source \"%s\".", s)) - } -} - - -# = 2 CRAN packages ======================================================= - -installIfNeeded("ape") -installIfNeeded("BiocManager") -installIfNeeded("bio3d") -installIfNeeded("evd") -installIfNeeded("ggseqlogo") -installIfNeeded("ggtern") -installIfNeeded("hexbin") -installIfNeeded("httr") -installIfNeeded("igraph") -installIfNeeded("jsonlite") -installIfNeeded("magrittr") -installIfNeeded("MASS") -installIfNeeded("microbenchmark") -installIfNeeded("phangorn") -installIfNeeded("plotly") -installIfNeeded("plotrix") -installIfNeeded("profvis") -installIfNeeded("robustbase") -installIfNeeded("RColorBrewer") -installIfNeeded("Rphylip") -installIfNeeded("rvest") -installIfNeeded("seqinr") -installIfNeeded("stringi") -installIfNeeded("taxize") -installIfNeeded("testthat") -installIfNeeded("xml2") - -# = 3 Bioconductor packages =============================================== - -installIfNeeded("Biobase", s = "BIO") -installIfNeeded("biomaRt", s = "BIO") -installIfNeeded("Biostrings", s = "BIO") -installIfNeeded("DECIPHER", s = "BIO") -installIfNeeded("GEOquery", s = "BIO") -installIfNeeded("GOSim", s = "BIO") -installIfNeeded("limma", s = "BIO") -installIfNeeded("msa", s = "BIO") -installIfNeeded("org.Sc.sgd.db", s = "BIO") -installIfNeeded("prada", s = "BIO") -installIfNeeded("topGO", s = "BIO") - - -# = 4 Other package sources =============================================== - -# Using sources other than CRAN or Bioconductor to download general-purpose -# programs that run on your computer is not generally recommended. - - -# = 5 Updating packages =================================================== - -# From time to time, update CRAN packages with the following command ... - -update.packages() - -# ... and also update Bioconductor packages as follows: - -BiocManager::install() - -# [END] +# tocID <- "ABC-Install_all_packages.R" +# +# Purpose: A Bioinformatics Course: +# Installing all packages in this course +# +# Version: 1.0 +# +# Date: 2021 10 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.0 New code +# +# +# TODO: +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ---------------------------------------------- +#TOC> 1 Packages 33 +#TOC> 2 CRAN packages 98 +#TOC> 3 Bioconductor packages 127 +#TOC> 4 Other package sources 142 +#TOC> 5 Updating packages 148 +#TOC> +#TOC> ========================================================================== + + +# = 1 Packages ============================================================ + +# Much of R's functionality is contributed in packages: bundles of R scripts +# or code in other languages, pre-configured objects, and datasets. Making this +# functionality available is often done by issuing a library() +# command, however this is not the preferred way, since it may override other +# R functions and it makes it harder to understand where the source code of +# a particular function is located. In this course we call the function name +# prefixed with the package name and two colons: +# ::() +# This is the preferred way, since it is explicit. +# +# Regardless of which idiom one uses to call the actual function, the package +# needs to be "installed" first, i.e. the code must have been downloaded +# from CRAN, or using the BiocManager::install() function. +# +# This script contains download commands for all packages that are used in the +# course. You can execute the script line by line (or even source the entire +# script) to make sure all packages can be installed on your computer. Just +# one reminder: if you are ever asked to install from source, the correct +# answer is usually "no" - except if you really know what you are doing and why. +# +# Once packages are installed you can get additional information about +# the contents of a package with the commands: +# library(help=) # basic information +# browseVignettes("") # available vignettes +# data(package = "") # available datasets +# +# ... and you can load data sets with: +# data(, package = "") +# +# All packages here are installed only when they have not been installed +# before, using the following idiom: +# +# if (! requireNamespace("", quietly=TRUE)) { +# install.packages("") +# } +# +# ... or its BiocManager::install() equivalent: +# +# if (! requireNamespace("", quietly=TRUE)) { +# BiocManager::install("") +# } +# +# If you want to _force_ a re-installation of the package, simply issue +# the install.packages("") command on its own. For compactness +# we wrap the idiom into a function, which can also switch between CRAN +# and BIOconductor sources: + +installIfNeeded <- function(package, s = "CRAN") { + # s: "CRAN" or "BIO" + if (s == "CRAN") { + if (! requireNamespace(package, quietly=TRUE)) { + install.packages(package) + } + } else if (s == "BIO") { + if (! requireNamespace("BiocManager", quietly=TRUE)) { + install.packages("BiocManager") + } + if (! requireNamespace(package, quietly=TRUE)) { + BiocManager::install(package) + } + } else { + stop(sprintf("Unknown source \"%s\".", s)) + } +} + + +# = 2 CRAN packages ======================================================= + +installIfNeeded("ape") +installIfNeeded("BiocManager") +installIfNeeded("bio3d") +installIfNeeded("evd") +installIfNeeded("ggseqlogo") +installIfNeeded("ggtern") +installIfNeeded("hexbin") +installIfNeeded("httr") +installIfNeeded("igraph") +installIfNeeded("jsonlite") +installIfNeeded("magrittr") +installIfNeeded("MASS") +installIfNeeded("microbenchmark") +installIfNeeded("phangorn") +installIfNeeded("plotly") +installIfNeeded("plotrix") +installIfNeeded("profvis") +installIfNeeded("robustbase") +installIfNeeded("RColorBrewer") +installIfNeeded("Rphylip") +installIfNeeded("rvest") +installIfNeeded("seqinr") +installIfNeeded("stringi") +installIfNeeded("taxize") +installIfNeeded("testthat") +installIfNeeded("xml2") + +# = 3 Bioconductor packages =============================================== + +installIfNeeded("Biobase", s = "BIO") +installIfNeeded("biomaRt", s = "BIO") +installIfNeeded("Biostrings", s = "BIO") +installIfNeeded("DECIPHER", s = "BIO") +installIfNeeded("GEOquery", s = "BIO") +installIfNeeded("GOSim", s = "BIO") +installIfNeeded("limma", s = "BIO") +installIfNeeded("msa", s = "BIO") +installIfNeeded("org.Sc.sgd.db", s = "BIO") +installIfNeeded("prada", s = "BIO") +installIfNeeded("topGO", s = "BIO") + + +# = 4 Other package sources =============================================== + +# Using sources other than CRAN or Bioconductor to download general-purpose +# programs that run on your computer is not generally recommended. + + +# = 5 Updating packages =================================================== + +# From time to time, update CRAN packages with the following command ... + +update.packages() + +# ... and also update Bioconductor packages as follows: + +BiocManager::install() + +# [END] diff --git a/ABC-addSACCE_APSESproteins.R b/ABC-addSACCE_APSESproteins.R index d9675ba..f9dcf1f 100644 --- a/ABC-addSACCE_APSESproteins.R +++ b/ABC-addSACCE_APSESproteins.R @@ -1,100 +1,100 @@ -# addSACCE_APSESproteins.R -# Adds the Saccharomyces cerevisiae APSES proteins to myDB -# - -myDB$protein <- - rbind(myDB$protein, - data.frame( - ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), - name = "SWI4_SACCE", - RefSeqID = "NP_011036", - UniProtID = "P25302", - taxonomy.ID = as.integer(4932), - sequence = dbSanitizeSequence(" - 1 mpfdvlisnq kdntnhqnit pisksvllap hsnhpvieia tysetdvyec yirgfetkiv - 61 mrrtkddwin itqvfkiaqf sktkrtkile kesndmqhek vqggygrfqg twipldsakf - 121 lvnkyeiidp vvnsiltfqf dpnnpppkrs knsilrktsp gtkitspssy nktprkknss - 181 sstsatttaa nkkgkknasi nqpnpsplqn lvfqtpqqfq vnssmnimnn ndnhttmnfn - 241 ndtrhnlinn isnnsnqsti iqqqksihen sfnnnysatq kplqffpipt nlqnknvaln - 301 npnnndsnsy shnidnvins snnnnngnnn nliivpdgpm qsqqqqqhhh eyltnnfnhs - 361 mmdsitngns kkrrkklnqs neqqfynqqe kiqrhfklmk qpllwqsfqn pndhhneycd - 421 sngsnnnnnt vasngssiev fssnendnsm nmssrsmtpf sagntssqnk lenkmtdqey - 481 kqtiltilss erssdvdqal latlypapkn fninfeiddq ghtplhwata maniplikml - 541 itlnanalqc nklgfncitk sifynncyke nafdeiisil kiclitpdvn grlpfhylie - 601 lsvnksknpm iiksymdsii lslgqqdynl lkiclnyqdn igntplhlsa lnlnfevynr - 661 lvylgastdi lnldnespas imnkfntpag gsnsrnnntk adrklarnlp qknyyqqqqq - 721 qqqpqnnvki pkiiktqhpd kedstadvni aktdsevnes qylhsnqpns tnmntimedl - 781 sninsfvtss vikdikstps kilenspily rrrsqsisde kekakdnenq vekkkdplns - 841 vktampsles pssllpiqms plgkyskpls qqinklntkv sslqrimgee iknldnevve - 901 tessisnnkk rlitiahqie dafdsvsnkt pinsisdlqs riketsskln sekqnfiqsl - 961 eksqalklat ivqdeeskvd mntnssshpe kqedeepipk stsetsspkn tkadakfsnt - 1021 vqesydvnet lrlateltil qfkrrmttlk iseakskins svkldkyrnl igitienids - 1081 klddiekdlr ana"), - stringsAsFactors = FALSE)) - -myDB$protein <- - rbind(myDB$protein, - data.frame( - ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), - name = "PHD1_SACCE", - RefSeqID = "NP_012881", - UniProtID = "P36093", - taxonomy.ID = as.integer(4932), - sequence = dbSanitizeSequence(" - 1 myhvpemrlh yplvntqsna aitptrsydn tlpsfnelsh qstinlpfvq retpnayanv - 61 aqlatsptqa ksgyycryya vpfptypqqp qspyqqavlp yatipnsnfq pssfpvmavm - 121 ppevqfdgsf lntlhphtel ppiiqntndt svarpnnlks iaaasptvta ttrtpgvsst - 181 svlkprvitt mwedenticy qveangisvv rradnnming tkllnvtkmt rgrrdgilrs - 241 ekvrevvkig smhlkgvwip ferayilaqr eqildhlypl fvkdiesivd arkpsnkasl - 301 tpksspapik qepsdnkhei ateikpksid alsngastqg agelphlkin hidteaqtsr - 361 aknels"), - stringsAsFactors = FALSE)) - -myDB$protein <- - rbind(myDB$protein, - data.frame( - ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), - name = "SOK2_SACCE", - RefSeqID = "NP_013729", - UniProtID = "P53438", - taxonomy.ID = as.integer(4932), - sequence = dbSanitizeSequence(" - 1 mpignpintn diksnrmrqe snmsavsnse stigqstqqq qqqqqylgqs vqplmpvsyq - 61 yvvpeqwpyp qyyqqpqsqs qqqlqsqpqm yqvqesfqss gsdsnasnpp stsvgvpsna - 121 tatalpngsa ittkksnnst nisnnvpyyy yfpqmqaqqs maysypqayy yypangdgtt - 181 ngatpsvtsn qvqnpnlekt ystfeqqqqh qqqqqlqaqt ypaqppkign afskfsksgp - 241 psdsssgsms pnsnrtsrns nsisslaqqp pmsnypqpst yqypgfhkts sipnshspip - 301 prslttptqg ptsqngplsy nlpqvgllpp qqqqqvsply dgnsitppvk pstdqetylt - 361 anrhgvsdqq ydsmaktmns fqtttirhpm pliattnatg sntsgtsasi irprvtttmw - 421 edektlcyqv eangisvvrr adndmvngtk llnvtkmtrg rrdgilkaek irhvvkigsm - 481 hlkgvwipfe ralaiaqrek iadylyplfi rdiqsvlkqn npsndsssss sstgiksisp - 541 rtyyqpinny qnpngpsnis aaqltyssmn lnnkiipnns ipavstiaag ekplkkctmp - 601 nsnqleghti tnlqtlsatm pmkqqlmgni asplsyprna tmnsastlgi tpadskpltp - 661 sptttntnqs sesnvgsiht gitlprvese sashskwske adsgntvpdn qtlkeprssq - 721 lpisaltstd tdkiktstsd eatqpnepse aepvkesess ksqvdgagdv sneeiaaddt - 781 kkqek"), - stringsAsFactors = FALSE)) - -myDB$protein <- - rbind(myDB$protein, - data.frame( - ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), - name = "XBP1_SACCE", - RefSeqID = "NP_012165", - UniProtID = "P40489", - taxonomy.ID = as.integer(4932), - sequence = dbSanitizeSequence(" - 1 mkypafsins dtvhltdnpl ddyqrlylvs vldrdsppas fsaglnirkv nykssiaaqf - 61 thpnfiisar dagngeeaaa qnvlncfeyq fpnlqtiqsl vheqtllsql assatphsal - 121 hlhdknilmg kiilpsrsnk tpvsasptkq ekkalstasr enatssltkn qqfkltkmdh - 181 nlindklinp nncviwshds gyvfmtgiwr lyqdvmkgli nlprgdsvst sqqqffckae - 241 fekilsfcfy nhssftsees ssvllsssts sppkrrtstg stfldanass sstsstqann - 301 yidfhwnnik pelrdlicqs ykdflinelg pdqidlpnln panftkrirg gyikiqgtwl - 361 pmeisrllcl rfcfpiryfl vpifgpdfpk dceswylahq nvtfassttg agaataataa - 421 antstnftst avarprqkpr prprqrstsm shskaqklvi edalpsfdsf venlglssnd - 481 knfikknskr qksstytsqt sspigprdpt vqilsnlasf ynthghrysy pgniyipqqr - 541 yslpppnqls spqrqlnyty dhihpvpsqy qsprhynvps spiapapptf pqpygddhyh - 601 flkyasevyk qqnqrpahnt ntnmdtsfsp rannslnnfk fktnskq"), - stringsAsFactors = FALSE)) - -# [END] +# addSACCE_APSESproteins.R +# Adds the Saccharomyces cerevisiae APSES proteins to myDB +# + +myDB$protein <- + rbind(myDB$protein, + data.frame( + ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), + name = "SWI4_SACCE", + RefSeqID = "NP_011036", + UniProtID = "P25302", + taxonomy.ID = as.integer(4932), + sequence = dbSanitizeSequence(" + 1 mpfdvlisnq kdntnhqnit pisksvllap hsnhpvieia tysetdvyec yirgfetkiv + 61 mrrtkddwin itqvfkiaqf sktkrtkile kesndmqhek vqggygrfqg twipldsakf + 121 lvnkyeiidp vvnsiltfqf dpnnpppkrs knsilrktsp gtkitspssy nktprkknss + 181 sstsatttaa nkkgkknasi nqpnpsplqn lvfqtpqqfq vnssmnimnn ndnhttmnfn + 241 ndtrhnlinn isnnsnqsti iqqqksihen sfnnnysatq kplqffpipt nlqnknvaln + 301 npnnndsnsy shnidnvins snnnnngnnn nliivpdgpm qsqqqqqhhh eyltnnfnhs + 361 mmdsitngns kkrrkklnqs neqqfynqqe kiqrhfklmk qpllwqsfqn pndhhneycd + 421 sngsnnnnnt vasngssiev fssnendnsm nmssrsmtpf sagntssqnk lenkmtdqey + 481 kqtiltilss erssdvdqal latlypapkn fninfeiddq ghtplhwata maniplikml + 541 itlnanalqc nklgfncitk sifynncyke nafdeiisil kiclitpdvn grlpfhylie + 601 lsvnksknpm iiksymdsii lslgqqdynl lkiclnyqdn igntplhlsa lnlnfevynr + 661 lvylgastdi lnldnespas imnkfntpag gsnsrnnntk adrklarnlp qknyyqqqqq + 721 qqqpqnnvki pkiiktqhpd kedstadvni aktdsevnes qylhsnqpns tnmntimedl + 781 sninsfvtss vikdikstps kilenspily rrrsqsisde kekakdnenq vekkkdplns + 841 vktampsles pssllpiqms plgkyskpls qqinklntkv sslqrimgee iknldnevve + 901 tessisnnkk rlitiahqie dafdsvsnkt pinsisdlqs riketsskln sekqnfiqsl + 961 eksqalklat ivqdeeskvd mntnssshpe kqedeepipk stsetsspkn tkadakfsnt + 1021 vqesydvnet lrlateltil qfkrrmttlk iseakskins svkldkyrnl igitienids + 1081 klddiekdlr ana"), + stringsAsFactors = FALSE)) + +myDB$protein <- + rbind(myDB$protein, + data.frame( + ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), + name = "PHD1_SACCE", + RefSeqID = "NP_012881", + UniProtID = "P36093", + taxonomy.ID = as.integer(4932), + sequence = dbSanitizeSequence(" + 1 myhvpemrlh yplvntqsna aitptrsydn tlpsfnelsh qstinlpfvq retpnayanv + 61 aqlatsptqa ksgyycryya vpfptypqqp qspyqqavlp yatipnsnfq pssfpvmavm + 121 ppevqfdgsf lntlhphtel ppiiqntndt svarpnnlks iaaasptvta ttrtpgvsst + 181 svlkprvitt mwedenticy qveangisvv rradnnming tkllnvtkmt rgrrdgilrs + 241 ekvrevvkig smhlkgvwip ferayilaqr eqildhlypl fvkdiesivd arkpsnkasl + 301 tpksspapik qepsdnkhei ateikpksid alsngastqg agelphlkin hidteaqtsr + 361 aknels"), + stringsAsFactors = FALSE)) + +myDB$protein <- + rbind(myDB$protein, + data.frame( + ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), + name = "SOK2_SACCE", + RefSeqID = "NP_013729", + UniProtID = "P53438", + taxonomy.ID = as.integer(4932), + sequence = dbSanitizeSequence(" + 1 mpignpintn diksnrmrqe snmsavsnse stigqstqqq qqqqqylgqs vqplmpvsyq + 61 yvvpeqwpyp qyyqqpqsqs qqqlqsqpqm yqvqesfqss gsdsnasnpp stsvgvpsna + 121 tatalpngsa ittkksnnst nisnnvpyyy yfpqmqaqqs maysypqayy yypangdgtt + 181 ngatpsvtsn qvqnpnlekt ystfeqqqqh qqqqqlqaqt ypaqppkign afskfsksgp + 241 psdsssgsms pnsnrtsrns nsisslaqqp pmsnypqpst yqypgfhkts sipnshspip + 301 prslttptqg ptsqngplsy nlpqvgllpp qqqqqvsply dgnsitppvk pstdqetylt + 361 anrhgvsdqq ydsmaktmns fqtttirhpm pliattnatg sntsgtsasi irprvtttmw + 421 edektlcyqv eangisvvrr adndmvngtk llnvtkmtrg rrdgilkaek irhvvkigsm + 481 hlkgvwipfe ralaiaqrek iadylyplfi rdiqsvlkqn npsndsssss sstgiksisp + 541 rtyyqpinny qnpngpsnis aaqltyssmn lnnkiipnns ipavstiaag ekplkkctmp + 601 nsnqleghti tnlqtlsatm pmkqqlmgni asplsyprna tmnsastlgi tpadskpltp + 661 sptttntnqs sesnvgsiht gitlprvese sashskwske adsgntvpdn qtlkeprssq + 721 lpisaltstd tdkiktstsd eatqpnepse aepvkesess ksqvdgagdv sneeiaaddt + 781 kkqek"), + stringsAsFactors = FALSE)) + +myDB$protein <- + rbind(myDB$protein, + data.frame( + ID = dbAutoincrement(myDB$protein$ID, ns = "ref"), + name = "XBP1_SACCE", + RefSeqID = "NP_012165", + UniProtID = "P40489", + taxonomy.ID = as.integer(4932), + sequence = dbSanitizeSequence(" + 1 mkypafsins dtvhltdnpl ddyqrlylvs vldrdsppas fsaglnirkv nykssiaaqf + 61 thpnfiisar dagngeeaaa qnvlncfeyq fpnlqtiqsl vheqtllsql assatphsal + 121 hlhdknilmg kiilpsrsnk tpvsasptkq ekkalstasr enatssltkn qqfkltkmdh + 181 nlindklinp nncviwshds gyvfmtgiwr lyqdvmkgli nlprgdsvst sqqqffckae + 241 fekilsfcfy nhssftsees ssvllsssts sppkrrtstg stfldanass sstsstqann + 301 yidfhwnnik pelrdlicqs ykdflinelg pdqidlpnln panftkrirg gyikiqgtwl + 361 pmeisrllcl rfcfpiryfl vpifgpdfpk dceswylahq nvtfassttg agaataataa + 421 antstnftst avarprqkpr prprqrstsm shskaqklvi edalpsfdsf venlglssnd + 481 knfikknskr qksstytsqt sspigprdpt vqilsnlasf ynthghrysy pgniyipqqr + 541 yslpppnqls spqrqlnyty dhihpvpsqy qsprhynvps spiapapptf pqpygddhyh + 601 flkyasevyk qqnqrpahnt ntnmdtsfsp rannslnnfk fktnskq"), + stringsAsFactors = FALSE)) + +# [END] diff --git a/ABC-units.R b/ABC-units.R index e5af3ad..9b186f6 100644 --- a/ABC-units.R +++ b/ABC-units.R @@ -1,69 +1,69 @@ -# ABC-units.R -# -# Purpose: A Bioinformatics Course: R code for learning units -# -# Version: 4.0 -# -# Date: 2020 09 16 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# V 4.0 2020 version -# V 3.0 2019 version -# V 2.0 2018 version -# V 1.0 2017 version -# V 0.1 First code -# -# TODO: -# -# -# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== -# -# The R-scripts and datasets in this project will be continuously updated, -# and updates will be posted on GitHub. To bring your version into the latest -# state use the Git-pane (top left) and "pull" (blue downward arrow) from the -# repository. However, this will overwrite locally edited version of files. - -# To edit code and experiment with it, for example to add your own comments and -# examples, save your edited version into the "myScripts" folder. Otherwise you -# may have problems with git when you update the project to a new version. It's -# good practice to change the filename, for example by prepending your initials. -# This helps distinguish the files you are working with e.g. in a list of -# recent files. For example if your name is Honjo Tasuku, your edited -# BIN-Sequence.R might be named HT-BIN-Sequence.R - -# If you pull from github and get the following type of error ... -# --------------- -# error: Your local changes to the following files would be -# overwritten by merge -# ... -# Please commit your changes or stash them before you can merge. -# --------------- -# ... then, you need to bring the offending file into its original state. -# Open the Commit window, select the file, and click on the Revert button. -# -# When working with these script DO NOT SIMPLY source() THESE FILES! - -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# -# ============================================================================== - -# Once you have typed and executed the function init(), you will find a file -# called myScript.R in the project directory. -# -# Open it, you can place all of your code-experiments and notes into that -# file. This will complement your "Course Journal". If you keep all contents in -# this one file, you can find everything by using the -F find function. To -# cross-reference code in your journal, create section headings. -# -# ============================================================================== - -# The individual learning units' files can be opened by simply clicking on them -# in the File pane. - - - -# [END] +# ABC-units.R +# +# Purpose: A Bioinformatics Course: R code for learning units +# +# Version: 4.0 +# +# Date: 2020 09 16 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# V 4.0 2020 version +# V 3.0 2019 version +# V 2.0 2018 version +# V 1.0 2017 version +# V 0.1 First code +# +# TODO: +# +# +# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== +# +# The R-scripts and datasets in this project will be continuously updated, +# and updates will be posted on GitHub. To bring your version into the latest +# state use the Git-pane (top left) and "pull" (blue downward arrow) from the +# repository. However, this will overwrite locally edited version of files. + +# To edit code and experiment with it, for example to add your own comments and +# examples, save your edited version into the "myScripts" folder. Otherwise you +# may have problems with git when you update the project to a new version. It's +# good practice to change the filename, for example by prepending your initials. +# This helps distinguish the files you are working with e.g. in a list of +# recent files. For example if your name is Honjo Tasuku, your edited +# BIN-Sequence.R might be named HT-BIN-Sequence.R + +# If you pull from github and get the following type of error ... +# --------------- +# error: Your local changes to the following files would be +# overwritten by merge +# ... +# Please commit your changes or stash them before you can merge. +# --------------- +# ... then, you need to bring the offending file into its original state. +# Open the Commit window, select the file, and click on the Revert button. +# +# When working with these script DO NOT SIMPLY source() THESE FILES! + +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# +# ============================================================================== + +# Once you have typed and executed the function init(), you will find a file +# called myScript.R in the project directory. +# +# Open it, you can place all of your code-experiments and notes into that +# file. This will complement your "Course Journal". If you keep all contents in +# this one file, you can find everything by using the -F find function. To +# cross-reference code in your journal, create section headings. +# +# ============================================================================== + +# The individual learning units' files can be opened by simply clicking on them +# in the File pane. + + + +# [END] diff --git a/ABC-units.Rproj b/ABC-units.Rproj index 0fbb9ec..9f01719 100644 --- a/ABC-units.Rproj +++ b/ABC-units.Rproj @@ -1,16 +1,16 @@ -Version: 1.0 - -RestoreWorkspace: No -SaveWorkspace: No -AlwaysSaveHistory: No - -EnableCodeIndexing: Yes -UseSpacesForTab: Yes -NumSpacesForTab: 2 -Encoding: UTF-8 - -RnwWeave: knitr -LaTeX: XeLaTeX - -AutoAppendNewline: Yes -StripTrailingWhitespace: Yes +Version: 1.0 + +RestoreWorkspace: No +SaveWorkspace: No +AlwaysSaveHistory: No + +EnableCodeIndexing: Yes +UseSpacesForTab: Yes +NumSpacesForTab: 2 +Encoding: UTF-8 + +RnwWeave: knitr +LaTeX: XeLaTeX + +AutoAppendNewline: Yes +StripTrailingWhitespace: Yes diff --git a/BIN-ALI-BLAST.R b/BIN-ALI-BLAST.R index d7014ac..451f511 100644 --- a/BIN-ALI-BLAST.R +++ b/BIN-ALI-BLAST.R @@ -1,111 +1,111 @@ -# tocID <- "BIN-ALI-BLAST.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-ALI-BLAST unit. -# -# ============================================================================== -# -# Version: 1.3 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.3 2020 Maintenance -# 1.2 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.1 Fixed parsing logic. -# 1.0 First live version 2017. -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> --------------------------------------------------- -#TOC> 1 Defining the APSES domain 45 -#TOC> 2 Executing the BLAST search 75 -#TOC> 3 Analysing results 97 -#TOC> -#TOC> ========================================================================== - - -# = 1 Defining the APSES domain =========================================== - -# Load your protein database -source("makeProteinDB.R") - -# Get the APSES domain sequence via your MBP1_MYSPE feature annotation. (You -# have entered this data into your database in the -# BIN-ALI-Optimal_sequence_alignment unit.) - -( myOrth <- sprintf("MBP1_%s", biCode(MYSPE)) ) # If this is not the correct - # name of the Mbp1 orthologue - # of Mbp1 in your protein - # database, DON'T continue. We - # need to fix this problem. - # Get in touch. - -(proID <- myDB$protein$ID[myDB$protein$name == myOrth]) -(ftrID <- myDB$feature$ID[myDB$feature$name == "APSES fold"]) -(fanID <- myDB$annotation$ID[myDB$annotation$proteinID == proID & - myDB$annotation$featureID == ftrID]) -(start <- myDB$annotation$start[myDB$annotation$ID == fanID]) -(end <- myDB$annotation$end[myDB$annotation$ID == fanID]) -(apses <- substr(myDB$protein$sequence[myDB$protein$ID == proID], - start, - end)) - -# The MYSPE "apses" sequence is the sequence that we will use for our reverse -# BLAST search. - - -# = 2 Executing the BLAST search ========================================== - -# The ./scripts/BLAST.R code defines two functions to access the BLAST interface -# through its Web API, and to parse results. Have a look at the script, then -# source it: - -source("./scripts/BLAST.R") - -# Use BLAST() to find the best match to the MYSPE APSES domain in Saccharomyces -# cerevisiae: - -BLASTresults <- BLAST(apses, # MYSPE APSES domain sequence - db = "refseq_protein", # database to search in - nHits = 10, # - E = 0.01, # - limits = "txid559292[ORGN]") # S. cerevisiae S288c - - -length(BLASTresults$hits) # There should be at least one hit there. Ask for - # advice in case this step fails. - - -# = 3 Analysing results =================================================== - -(topHit <- BLASTresults$hits[[1]]) # Get the top hit - -# What is the refseq ID of the top hit -topHit$accession - -# If this is "NP_010227.1" you have confirmed the RBM of the MYSPE apses -# domain. If it is not, ask me for advice. - - - - - -# [END] +# tocID <- "BIN-ALI-BLAST.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-ALI-BLAST unit. +# +# ============================================================================== +# +# Version: 1.3 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.3 2020 Maintenance +# 1.2 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.1 Fixed parsing logic. +# 1.0 First live version 2017. +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> --------------------------------------------------- +#TOC> 1 Defining the APSES domain 45 +#TOC> 2 Executing the BLAST search 75 +#TOC> 3 Analysing results 97 +#TOC> +#TOC> ========================================================================== + + +# = 1 Defining the APSES domain =========================================== + +# Load your protein database +source("makeProteinDB.R") + +# Get the APSES domain sequence via your MBP1_MYSPE feature annotation. (You +# have entered this data into your database in the +# BIN-ALI-Optimal_sequence_alignment unit.) + +( myOrth <- sprintf("MBP1_%s", biCode(MYSPE)) ) # If this is not the correct + # name of the Mbp1 orthologue + # of Mbp1 in your protein + # database, DON'T continue. We + # need to fix this problem. + # Get in touch. + +(proID <- myDB$protein$ID[myDB$protein$name == myOrth]) +(ftrID <- myDB$feature$ID[myDB$feature$name == "APSES fold"]) +(fanID <- myDB$annotation$ID[myDB$annotation$proteinID == proID & + myDB$annotation$featureID == ftrID]) +(start <- myDB$annotation$start[myDB$annotation$ID == fanID]) +(end <- myDB$annotation$end[myDB$annotation$ID == fanID]) +(apses <- substr(myDB$protein$sequence[myDB$protein$ID == proID], + start, + end)) + +# The MYSPE "apses" sequence is the sequence that we will use for our reverse +# BLAST search. + + +# = 2 Executing the BLAST search ========================================== + +# The ./scripts/BLAST.R code defines two functions to access the BLAST interface +# through its Web API, and to parse results. Have a look at the script, then +# source it: + +source("./scripts/BLAST.R") + +# Use BLAST() to find the best match to the MYSPE APSES domain in Saccharomyces +# cerevisiae: + +BLASTresults <- BLAST(apses, # MYSPE APSES domain sequence + db = "refseq_protein", # database to search in + nHits = 10, # + E = 0.01, # + limits = "txid559292[ORGN]") # S. cerevisiae S288c + + +length(BLASTresults$hits) # There should be at least one hit there. Ask for + # advice in case this step fails. + + +# = 3 Analysing results =================================================== + +(topHit <- BLASTresults$hits[[1]]) # Get the top hit + +# What is the refseq ID of the top hit +topHit$accession + +# If this is "NP_010227.1" you have confirmed the RBM of the MYSPE apses +# domain. If it is not, ask me for advice. + + + + + +# [END] diff --git a/BIN-ALI-Dotplot.R b/BIN-ALI-Dotplot.R index e7834ac..e57aac6 100644 --- a/BIN-ALI-Dotplot.R +++ b/BIN-ALI-Dotplot.R @@ -1,195 +1,195 @@ -# tocID <- "BIN-ALI-Dotplot.R" -# -# -# ============================================================================== -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-ALI-Dotplot unit. -# -# Version: 0.2 -# -# Date: 2019 01 07 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 0.2 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------- -#TOC> 1 ___Section___ 42 -#TOC> 2 Tasks 190 -#TOC> -#TOC> ========================================================================== - - -# = 1 ___Section___ ======================================================= - -if (!requireNamespace("BiocManager", quietly=TRUE)) { - install.packages("BiocManager") -} -if (!requireNamespace("Biostrings", quietly=TRUE)) { - BiocManager::install("Biostrings") -} -# Package information: -# library(help = Biostrings) # basic information -# browseVignettes("Biostrings") # available vignettes -# data(package = "Biostrings") # available datasets - -if (!requireNamespace("seqinr", quietly=TRUE)) { - install.packages("seqinr") -} - - -# Let's load BLOSUM62 -data(BLOSUM62, package = "Biostrings") - -# Now let's craft code for a dotplot. That's surprisingly simple. We build a -# matrix that has as many rows as one sequence, as many columns as another. Then -# we go through every cell of the matrix and enter the pairscore we encounter -# for the amino acid pair whose position corresponds to the row and column -# index. Finally we visualize the matrix in a plot. -# - -# First we fetch our sequences and split them into single characters. -sel <- myDB$protein$name == "MBP1_SACCE" -MBP1_SACCE <- seqinr::s2c(myDB$protein$sequence[sel]) - -sel <- myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "") -MBP1_MYSPE <- seqinr::s2c(myDB$protein$sequence[sel]) - -# Check that we have two character vectors of the expected length. -str(MBP1_SACCE) -str(MBP1_MYSPE) - -# How do we get the pairscore values? Consider: a single pair of amino acids can -# be obtained from sequence SACCE and MYSPE eg. from position 13 and 21 ... -MBP1_SACCE[13] -MBP1_MYSPE[21] - -# ... using these as subsetting expressions, we can pull the pairscore -# from the MDM -BLOSUM62[MBP1_SACCE[13], MBP1_MYSPE[21]] - -# First we build an empty matrix that will hold all pairscores ... -dotMat <- matrix(numeric(length(MBP1_SACCE) * length(MBP1_MYSPE)), - nrow = length(MBP1_SACCE), ncol = length(MBP1_MYSPE)) - -# ... then we loop over the sequences and store the scores in the matrix. -# -for (i in 1:length(MBP1_SACCE)) { - for (j in 1:length(MBP1_MYSPE)) { - dotMat[i, j] <- BLOSUM62[MBP1_SACCE[i], MBP1_MYSPE[j]] - } -} - -# Even though this is a large matrix, this does not take much time ... -# Let's have a look at a small block of the values: - -dotMat[1:10, 1:10] - -# Rows in this matrix correspond to an amino acid from MBP1_SACCE, columns in -# the matrix correspond to an amino acid from MBP1_MYSPE. - -# To plot this, we use the image() function. Here, with default parameters. - -image(dotMat) - -# Be patient, this takes a few moments to render: more than 500,000 values. -# Nice. -# What do you expect? -# What would similar sequences look like? -# What do you see? - -#You migh notice a thin line of yellow along the diagonal, moving approximately -# from bottom left to top right, fading in and out of existence. This is the -# signature of extended sequence similarity. - -# Let's magnify this a bit by looking at only the first 200 amino acids ... -image(dotMat[1:200, 1:200]) - -# ... and, according to our normal writing convention, we would like the -# diagonal to run from top-left to bottom-right since we write from left to -# right and from top to bottom... -image(dotMat[1:200, 1:200], ylim = 1.0:0.0) - -# ... and we would like the range of the x- and y- axis to correspond to the -# sequence position ... -image(x = 1:200, y = 1:200, dotMat[1:200, 1:200], ylim=c(200,1)) - -# ... and labels! Axis labels would be nice ... -image(x = 1:200, y = 1:200, dotMat[1:200, 1:200], ylim=c(200,1), - xlab = "MBP1_MYSPE", ylab = "MBP1_SACCE" ) - -# ... and why don't we have axis-numbers on all four sides? Go, make that right -# too ... -len <- 200 -image(x = 1:len, y = 1:len, dotMat[1:len, 1:len], ylim=c(len,1), - xlab = "MBP1_MYSPE", ylab = "MBP1_SACCE", axes = FALSE) -box() -axis(1, at = c(1, seq(10, len, by=10))) -axis(2, at = c(1, seq(10, len, by=10))) -axis(3, at = c(1, seq(10, len, by=10))) -axis(4, at = c(1, seq(10, len, by=10))) - -# ... you get the idea, we can infinitely customize our plot. However a good way -# to do this is to develop a particular view for, say, a report or publication -# in a script and then put it into a function. I have put a function into the -# utilities file and called it dotPlot2(). Why not dotPlot() ... that's because -# there already is a dotplot function in the seqinr package: - -seqinr::dotPlot(MBP1_SACCE, MBP1_MYSPE) # seqinr -dotPlot2(MBP1_SACCE, MBP1_MYSPE, xlab = "SACCE", ylab = "MYSPE") # Our's - -# Which one do you prefer? You can probably see the block patterns that arise -# from segments of repetitive, low complexity sequence. But you probably have to -# look very closely to discern the faint diagonals that correspond to similar -# sequence. - - -# Let's see if we can enhance the contrast between distributed noise and the -# actual alignment of conserved residues. We can filter the dot matrix with a -# pattern that enhances diagonally repeated values. Every value in the matrix -# will be replaced by a weighted average of its neighborhood. Here is a -# diagonal-filter: - -myFilter <- matrix(numeric(25), nrow = 5) -myFilter[1, ] <- c( 1, 0, 0, 0, 0) -myFilter[2, ] <- c( 0, 1, 0, 0, 0) -myFilter[3, ] <- c( 0, 0, 1, 0, 0) -myFilter[4, ] <- c( 0, 0, 0, 1, 0) -myFilter[5, ] <- c( 0, 0, 0, 0, 1) - -# I have added the option to read such filters (or others that you could define on your own) as a parameter of the function. - -dotPlot2(MBP1_SACCE, MBP1_MYSPE, xlab = "SACCE", ylab = "MYSPE", f = myFilter) - -# I think the result shows quite nicely how the two sequences are globally -# related and where the regions of sequence similarity are. Play with this a bit -# ... Can you come up with a better filter? If so, eMail us. - - - - -# = 2 Tasks =============================================================== - - - - -# [END] +# tocID <- "BIN-ALI-Dotplot.R" +# +# +# ============================================================================== +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-ALI-Dotplot unit. +# +# Version: 0.2 +# +# Date: 2019 01 07 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 0.2 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------- +#TOC> 1 ___Section___ 42 +#TOC> 2 Tasks 190 +#TOC> +#TOC> ========================================================================== + + +# = 1 ___Section___ ======================================================= + +if (!requireNamespace("BiocManager", quietly=TRUE)) { + install.packages("BiocManager") +} +if (!requireNamespace("Biostrings", quietly=TRUE)) { + BiocManager::install("Biostrings") +} +# Package information: +# library(help = Biostrings) # basic information +# browseVignettes("Biostrings") # available vignettes +# data(package = "Biostrings") # available datasets + +if (!requireNamespace("seqinr", quietly=TRUE)) { + install.packages("seqinr") +} + + +# Let's load BLOSUM62 +data(BLOSUM62, package = "Biostrings") + +# Now let's craft code for a dotplot. That's surprisingly simple. We build a +# matrix that has as many rows as one sequence, as many columns as another. Then +# we go through every cell of the matrix and enter the pairscore we encounter +# for the amino acid pair whose position corresponds to the row and column +# index. Finally we visualize the matrix in a plot. +# + +# First we fetch our sequences and split them into single characters. +sel <- myDB$protein$name == "MBP1_SACCE" +MBP1_SACCE <- seqinr::s2c(myDB$protein$sequence[sel]) + +sel <- myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "") +MBP1_MYSPE <- seqinr::s2c(myDB$protein$sequence[sel]) + +# Check that we have two character vectors of the expected length. +str(MBP1_SACCE) +str(MBP1_MYSPE) + +# How do we get the pairscore values? Consider: a single pair of amino acids can +# be obtained from sequence SACCE and MYSPE eg. from position 13 and 21 ... +MBP1_SACCE[13] +MBP1_MYSPE[21] + +# ... using these as subsetting expressions, we can pull the pairscore +# from the MDM +BLOSUM62[MBP1_SACCE[13], MBP1_MYSPE[21]] + +# First we build an empty matrix that will hold all pairscores ... +dotMat <- matrix(numeric(length(MBP1_SACCE) * length(MBP1_MYSPE)), + nrow = length(MBP1_SACCE), ncol = length(MBP1_MYSPE)) + +# ... then we loop over the sequences and store the scores in the matrix. +# +for (i in 1:length(MBP1_SACCE)) { + for (j in 1:length(MBP1_MYSPE)) { + dotMat[i, j] <- BLOSUM62[MBP1_SACCE[i], MBP1_MYSPE[j]] + } +} + +# Even though this is a large matrix, this does not take much time ... +# Let's have a look at a small block of the values: + +dotMat[1:10, 1:10] + +# Rows in this matrix correspond to an amino acid from MBP1_SACCE, columns in +# the matrix correspond to an amino acid from MBP1_MYSPE. + +# To plot this, we use the image() function. Here, with default parameters. + +image(dotMat) + +# Be patient, this takes a few moments to render: more than 500,000 values. +# Nice. +# What do you expect? +# What would similar sequences look like? +# What do you see? + +#You migh notice a thin line of yellow along the diagonal, moving approximately +# from bottom left to top right, fading in and out of existence. This is the +# signature of extended sequence similarity. + +# Let's magnify this a bit by looking at only the first 200 amino acids ... +image(dotMat[1:200, 1:200]) + +# ... and, according to our normal writing convention, we would like the +# diagonal to run from top-left to bottom-right since we write from left to +# right and from top to bottom... +image(dotMat[1:200, 1:200], ylim = 1.0:0.0) + +# ... and we would like the range of the x- and y- axis to correspond to the +# sequence position ... +image(x = 1:200, y = 1:200, dotMat[1:200, 1:200], ylim=c(200,1)) + +# ... and labels! Axis labels would be nice ... +image(x = 1:200, y = 1:200, dotMat[1:200, 1:200], ylim=c(200,1), + xlab = "MBP1_MYSPE", ylab = "MBP1_SACCE" ) + +# ... and why don't we have axis-numbers on all four sides? Go, make that right +# too ... +len <- 200 +image(x = 1:len, y = 1:len, dotMat[1:len, 1:len], ylim=c(len,1), + xlab = "MBP1_MYSPE", ylab = "MBP1_SACCE", axes = FALSE) +box() +axis(1, at = c(1, seq(10, len, by=10))) +axis(2, at = c(1, seq(10, len, by=10))) +axis(3, at = c(1, seq(10, len, by=10))) +axis(4, at = c(1, seq(10, len, by=10))) + +# ... you get the idea, we can infinitely customize our plot. However a good way +# to do this is to develop a particular view for, say, a report or publication +# in a script and then put it into a function. I have put a function into the +# utilities file and called it dotPlot2(). Why not dotPlot() ... that's because +# there already is a dotplot function in the seqinr package: + +seqinr::dotPlot(MBP1_SACCE, MBP1_MYSPE) # seqinr +dotPlot2(MBP1_SACCE, MBP1_MYSPE, xlab = "SACCE", ylab = "MYSPE") # Our's + +# Which one do you prefer? You can probably see the block patterns that arise +# from segments of repetitive, low complexity sequence. But you probably have to +# look very closely to discern the faint diagonals that correspond to similar +# sequence. + + +# Let's see if we can enhance the contrast between distributed noise and the +# actual alignment of conserved residues. We can filter the dot matrix with a +# pattern that enhances diagonally repeated values. Every value in the matrix +# will be replaced by a weighted average of its neighborhood. Here is a +# diagonal-filter: + +myFilter <- matrix(numeric(25), nrow = 5) +myFilter[1, ] <- c( 1, 0, 0, 0, 0) +myFilter[2, ] <- c( 0, 1, 0, 0, 0) +myFilter[3, ] <- c( 0, 0, 1, 0, 0) +myFilter[4, ] <- c( 0, 0, 0, 1, 0) +myFilter[5, ] <- c( 0, 0, 0, 0, 1) + +# I have added the option to read such filters (or others that you could define on your own) as a parameter of the function. + +dotPlot2(MBP1_SACCE, MBP1_MYSPE, xlab = "SACCE", ylab = "MYSPE", f = myFilter) + +# I think the result shows quite nicely how the two sequences are globally +# related and where the regions of sequence similarity are. Play with this a bit +# ... Can you come up with a better filter? If so, eMail us. + + + + +# = 2 Tasks =============================================================== + + + + +# [END] diff --git a/BIN-ALI-MSA.R b/BIN-ALI-MSA.R index 0265d21..d293682 100644 --- a/BIN-ALI-MSA.R +++ b/BIN-ALI-MSA.R @@ -1,628 +1,628 @@ -# tocID <- "BIN-ALI-MSA.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-ALI-MSA unit. -# -# Version: 1.3 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.3 2020 updates -# 1.2 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.1 Added fetchMSAmotif() -# 1.0 Fully refactored and rewritten for 2017 -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------------------------ -#TOC> 1 Preparations 55 -#TOC> 2 Aligning full length MBP1 proteins 97 -#TOC> 2.1 Preparing Sequences 108 -#TOC> 2.2 Compute the MSA 133 -#TOC> 3 Analyzing an MSA 154 -#TOC> 4 Comparing MSAs 226 -#TOC> 4.1 Importing an alignment to msa 235 -#TOC> 4.1.1 importing an .aln file 244 -#TOC> 4.1.2 Creating an MsaAAMultipleAlignment object 275 -#TOC> 4.2 More alignments 326 -#TOC> 4.3 Computing comparison metrics 338 -#TOC> 5 Profile-Profile alignments 476 -#TOC> 6 Sequence Logos 549 -#TOC> 6.1 Subsetting an alignment by motif 558 -#TOC> 6.2 Plot a Sequence Logo 607 -#TOC> -#TOC> ========================================================================== - - -# = 1 Preparations ======================================================== - -# You need to reload you protein database, including changes that might -# have been made to the reference files. If you have worked with the -# prerequisite units, you should have a script named "./myScripts/makeProteinDB.R" -# that will create the myDB object with a protein and feature database. -# Ask for advice if not. -source("./myScripts/makeProteinDB.R") - - -if (! requireNamespace("BiocManager", quietly=TRUE)) { - install.packages("BiocManager") -} -if (! requireNamespace("Biostrings", quietly=TRUE)) { - BiocManager::install("Biostrings") -} -# Package information: -# library(help = Biostrings) # basic information -# browseVignettes("Biostrings") # available vignettes -# data(package = "Biostrings") # available datasets - -# Multiple sequence alignment algorithms are provided in -# the Bioconductor msa package. - -if (! requireNamespace("msa", quietly=TRUE)) { - BiocManager::install("msa") -} -# Package information: -# library(help=msa) # basic information -# browseVignettes("msa") # available vignettes -# data(package = "msa") # available datasets - - -# If an installation asks you if you want to update older packages, I recommend -# to always answer "a" for "all" unless you have an important reason not to. But -# if the installer asks you whether you want to compile from source, answer "n" -# for "no" unless you need new functionality in a particular bleeding-edge -# version of a package. - -help(package = "msa") - - -# = 2 Aligning full length MBP1 proteins ================================== - -# In the Wiki part of this unit you have -# - aligned full length MBP1 protein sequences at the EBI using T-Coffee -# - saved the resulting alignment in CLUSTAL format -# to the file "MBP1orthologuesTC.aln" - -# In this section we will calculate an MSA of the same sequences using -# algorithms in the msa packages, and we will compare the two alignments. - - -# == 2.1 Preparing Sequences =============================================== - -# We have used the biostrings' AAString() function before; for multiple -# alignments we need an AAStringSet(). AAStringSets are produced from vectors -# of sequence. - -sel <- grep("MBP1", myDB$protein$name) -MBP1set <- Biostrings::AAStringSet(myDB$protein$sequence[sel]) - -# To help us make sense of the alignment we need to add the names for -# the sequences. Names for a seqSet object are held in the ranges slot... - -MBP1set@ranges@NAMES <- myDB$protein$name[sel] - -MBP1set - -# You should have eleven sequences in this set, ask for advice if you don't. - -# The little step of adding names is actually really very important. That's -# because the aligned sequences are meaningless strings of characters unless we -# can easily identify their biological relationships. Creating MSAs that are -# only identified by e.g. their RefSeq ids is a type of cargo-cult -# bioinformatics that we encounter a lot. The point of the alignment is not to -# create it, but to interpret it! - -# == 2.2 Compute the MSA =================================================== - -# The alignment itself is very simple. msa has msaMuscle() and msaClustalOmega() -# to produce alignments. (It also has msaClustalW() which is kind of -# embarrassing since that hasn't been the algorithm of first choice for -# decades. Don't use that one for real work.) - - -# Let's run an alignment with "Muscle" -(msaM <- msa::msaMuscle( MBP1set, order = "aligned")) - -# ... or to see the whole thing (cf. ?MsaAAMultipleAlignment ... print method): -msa::print(msaM, show=c("alignment", "complete"), showConsensus=FALSE) - - -# You see that the alignment object has sequence strings with hyphens as -# indel-characters. The names are printed to the console. And you also see that -# the order has not been preserved, but the most similar sequences are now -# adjacent to each other. - - -# = 3 Analyzing an MSA ==================================================== - -# You probabaly realize that computing an MSA is not that hard. It's not -# entirely trivial to collect meaningful sequences via e.g. PSI-BLAST ... but -# then computing the alignment gives you a result quickly. But what does it -# mean? What information does the MSA contain? - -# Let's have a first look at conserved vs. diverged regions of the MSA. msa -# provides the function msaConservationScore() which outputs a vector of scores. -# The scores are the sum of pairscores for the column: for example a perfectly -# conserved column of histidines would have the following score in our MSA -# of eleven sequences: -# - one (H, H) pair score is 8 in BLOSUM62; -# - there are (n^2 - n) / 2 pairs that can be formed between amino acids -# in a column from n sequences; -# - therefore the column score is 8 * (11^2 - 11) / 2 == 440 - -# attach the BLOSUM62 package from the Biostrings package -data(BLOSUM62, package = "Biostrings") - -msaMScores <- msa::msaConservationScore(msaM, substitutionMatrix = BLOSUM62) -plot(msaMScores, type = "l", col = "#205C5E", xlab = "Alignment Position") - -# That plot shows the well-aligned regions (domains ?) of the sequence, but it -# could use some smoothing. Options for smoothing such plots include calculating -# averages in sliding windows ("moving average"), and lowess() smoothing. Here -# is a quick demo of a moving average smoothing, to illustrate the principle. - -wRadius <- 15 # we take the mean of all values around a point +- wRadius -len <- length(msaMScores) -v <- msaMScores -for (i in (1 + wRadius):(len - wRadius)) { - v[i] <- mean(msaMScores[(i - wRadius):(i + wRadius)]) # mean of values in - # window around i -} -points(v, col = "#FFFFFF", type = "l", lwd = 4.5) -points(v, col = "#3DAEB2", type = "l", lwd = 3) - - -# You can set a threshold and use rle() to define ranges of values that fall -# above and below the threshold, and thus approximate domain boundaries: -thrsh <- 30 -(highScoringRanges <- rle(v > thrsh)) -(idx <- c(1, cumsum(highScoringRanges$lengths))) -for (i in seq_along(highScoringRanges$lengths)) { - if (highScoringRanges$values[i] == TRUE) { # If this range is above threshold, - rect(idx[i], thrsh, idx[i+1], max(v), # ... draw a rectangle - col = "#205C5E33") # ... with a transparent color. - cat(sprintf("Possible domain from %d to %d\n", idx[i], idx[i+1])) - } -} - -# Getting this right requires a bit of fiddling with the window radius and -# threshold (experiment with that a bit), but once we are satisfied, we can use -# the boundaries to print the MSA alignments separately for domains. -# Unfortunately the msa package provides no native way to extract blocks of the -# alignment for further processing, but your .utilities.R script contains a -# function to write alignment objects and sequence sets to .aln formatted -# output. Have a look: - -writeALN - -# Print out the aligned blocks -for (i in seq_along(highScoringRanges$lengths)) { - if (highScoringRanges$values[i] == TRUE) { # If this range is above threshold, - cat(sprintf("\n\nPossible domain from %d to %d\n", idx[i], idx[i+1])) - writeALN(msaM, range = c(idx[i], idx[i+1])) - } -} - - - -# = 4 Comparing MSAs ====================================================== - -# Let's compare the results of different alignment algorithms. We computed a -# vector of scores above, and we can compare that for different alignment -# algorithms. This is not trivial, so we'll need to look at that data in -# different ways and explore it. But first, let's get more alignments to compare -# with. - - -# == 4.1 Importing an alignment to msa ===================================== - -# We computed a T-Coffee alignment at the EBI. msa has no native import function -# so we need to improvise, and it's a bit of a pain to do - but a good -# illustration of strategies to convert data into any kind of object: -# - read an .aln file -# - adjust the sequence names -# - convert to msaAAMultipleAlignment object - -# === 4.1.1 importing an .aln file - -# The seqinr package has a function to read CLUSTAL W formatted .aln files ... -if (! requireNamespace("seqinr", quietly=TRUE)) { - install.packages("seqinr") -} -# Package information: -# library(help=seqinr) # basic information -# browseVignettes("seqinr") # available vignettes -# data(package = "seqinr") # available datasets - -# read the T-coffee aligned file that you donwloaded from the EBI MSA tools -# (cf. http://steipe.biochemistry.utoronto.ca/abc/index.php/BIN-ALI-MSA) -tmp <- seqinr::read.alignment("msaT.aln", format = "clustal") - -# read.alignment() returns a list. $seq is a list of strings, one for each -# complete alignment. However, they are converted to lower case. -x <- toupper(unlist(tmp$seq)) # get the sequences, uppercase - -# $nam contains the names. -(names(x) <- tmp$nam) - -# Note that the names in the file are refseq IDs, we need to replace the -# RefSeqIDs with the database names: -for (i in seq_along(x)) { - # find the index of the RefSeqID - id <- gsub("\\..*$", "", names(x)[i]) # fetch the name, drop the version - sel <- which(myDB$protein$RefSeqID == id) # get the index - names(x)[i] <- myDB$protein$name[sel] # get the name -} - -# === 4.1.2 Creating an MsaAAMultipleAlignment object - -# MsaAAMultipleAlignment objects are S4 objects that contain AAStringSet objects -# in their @unmasked slot, and a few additional items. Rather then build the -# object from scratch, we copy an existing object, and overwrite the data in its -# slots with what we need. Our goal is pragmatic, we want an object that msa's -# functions will accept as input. - -# First: convert our named char vector into an AAstringSet -x <- Biostrings::AAStringSet(x) - -# Then: create a new MsaAAMultipleAlignment S4 object. The msa package has -# defined what such an object should look like, with the SetClass() function. To -# create a new object, simply use the new() function, define the class that the -# object would have, and fill the slots with something that has the right type. -# How do we know the right type and the slot names? Easy! We just use -# str() to get the information. - -str(msaM) - -# There is a catch however in the way R makes such operations specific to -# the packages they need them: the function that creates the class is -# defined as a "generic", and when it is called, R looks in the package -# namespace for a more specific function with precise instructions what -# to do. However, we have not loaded the package namespace - we access all -# of the functions directly with the msa:: prefix. This method breaks down -# when generic functions are involved. I.e. - we could make it work, but -# the amount of code we need then is unreasonable. The straightforward -# way is to load the package. We can still use the prefix notation for -# its functions, just to emphasize where the function comes from. But since -# the namespace then exists, we ensure that generics are properly dispatched. - -library(msa) # load the msa package namespace - -msaT <- new("MsaAAMultipleAlignment", # create new MsaAAMultipleAlignment object - unmasked = x, # "unmasked" slot takes an AAStringSet - version = "T-Coffee", # "version" slot takes a string - params = list(), # "params" takes a list(), we leave the - # list empty, but we could add the - # alignment parameters that we used at - # the EBI here. - call = "imported from T-coffee alignment") # also a string - -str(msaT) - - -msaT # Now we have fabricated an msaAAMultipleAlignment object, and we can - # use the msa package functions on it - -msaTScores <- msa::msaConservationScore(msaT, substitutionMatrix = BLOSUM62) - -# == 4.2 More alignments =================================================== - -# Next, we calculate alignments with msa's two other alignment options: -# CLUSTAL Omega -(msaO <- msa::msaClustalOmega( MBP1set, order = "aligned")) -msaOScores <- msa::msaConservationScore(msaO, substitutionMatrix = BLOSUM62) - -# CLUSTAL W -(msaW <- msa::msaClustalW( MBP1set, order = "aligned")) -msaWScores <- msa::msaConservationScore(msaW, substitutionMatrix = BLOSUM62) - - -# == 4.3 Computing comparison metrics ====================================== - -# Ready to compare. - -# ... sum of alignment scores of alignment divided by sum of alignment scores -# of reference alignment (arbitrarily using CLUSTAL W as reference) - -sRef <- sum(msaWScores) -sum(msaWScores) / sRef # CLUSTAl W -sum(msaOScores) / sRef # CLUSTAL O -sum(msaTScores) / sRef # T-COFFEE -sum(msaMScores) / sRef # MUSCLE - -# ... mean alignment scores (higher is better) - -mean(msaWScores) # CLUSTAl W -mean(msaOScores) # CLUSTAL O -mean(msaTScores) # T-COFFEE -mean(msaMScores) # MUSCLE - -# total number of gaps (lower is better) -countGaps <- function(ali) { - x <- paste0(as.character(ali), collapse = "") - aa <- nchar(gsub("-", "", x)) - return(nchar(x) - aa) -} - -countGaps(msaW) # CLUSTAl W -countGaps(msaO) # CLUSTAL O -countGaps(msaT) # T-COFFEE -countGaps(msaM) # MUSCLE - -# number of indels in alignment (lower is less fragmented) -countIndels <- function(ali) { - x <- paste0(as.character(ali), collapse = "") # collapse into single string - x <- unlist(strsplit(x, "")) # split into characters - x <- x == "-" # convert into boolean - x <- rle(x) # calculate rle - # every run of TRUE is one indel event - return(sum(x$values)) -} - -countIndels(msaW) # CLUSTAl W -countIndels(msaO) # CLUSTAL O -countIndels(msaT) # T-COFFEE -countIndels(msaM) # MUSCLE - -# Let's look at the distribution of alignment scores: -boxplot(list(CLUSTAL.W = msaWScores, - CLUSTAL.O = msaOScores, - T.COFFEE = msaTScores, - MUSCLE = msaMScores), - cex.axis = 0.8, - col = c("#7D556488", "#74628F88", "#5E78A188", "#3DAEB288")) - -# CLUSTAL W and CLUSTAL O don't look all that different. T-Coffee tends to have -# a tighter distribution with less negative scores. Muscle has a slightly higher -# mean and generally higher scores. - -# Boxplots are convenient, but don't give us much detail about the shape of the -# distribution. For that, we need histograms, or density plots. - -plot(density(msaWScores), - type = "l", - col = "#7D5564", - lwd = 1.5, - ylim = c(0, (max(density(msaWScores)$y) * 1.3)), - main = "Comparing MSA algorithms", - xlab = "Alignment Score", - ylab = "Density") -points(density(msaOScores), - type = "l", - lwd = 1.5, - col = "#74628F") -points(density(msaTScores), - type = "l", - lwd = 1.5, - col = "#5E78A1") -points(density(msaMScores), - type = "l", - lwd = 1.5, - col = "#3DAEB2") -legend("topright", - legend = c("MUSCLE", "T-COFFEE", "CLUSTAL O", "CLUSTAL W"), - col = c("#3DAEB2", "#5E78A1", "#74628F", "#7D5564"), - lwd = 2, - cex = 0.7, - bty = "n") - -# The density plots confirm in more detail that CLUSTAL W misses some of the -# higher-scoring possibilities, that wherever CLUSTAL O is bad, it is quite bad, -# that T-COFFEE has fewer poorly scoring columns but misses some of the better -# scoring possibilities, and that MUSCLE appears to do best overall. - -# Can we attribute these differences to sections of the alignment in which the -# algorithms did better or worse? Let's plot the scores cumulatively. The -# alignments have different lengths, so we plot the scores on the respective -# fraction of the alignement length. - -plot(seq(0, 1, length.out = length(msaWScores)), # x- axis: fraction of length - cumsum(msaWScores), - type = "l", - col = "#7D5564", - lwd = 1.5, - ylim = c(0, max(cumsum(msaMScores))), - main = "Comparing MSA algorithms", - xlab = "Alignment Position", - ylab = "Cumulative Alignment Score") -points(seq(0, 1, length.out = length(msaOScores)), # x- axis: fraction of length - cumsum(msaOScores), - type = "l", - lwd = 1.5, - col = "#74628F") -points(seq(0, 1, length.out = length(msaTScores)), # x- axis: fraction of length - cumsum(msaTScores), - type = "l", - lwd = 1.5, - col = "#5E78A1") -points(seq(0, 1, length.out = length(msaMScores)), # x- axis: fraction of length - cumsum(msaMScores), - type = "l", - lwd = 1.5, - col = "#3DAEB2") -legend("bottomright", - legend = c("MUSCLE", "T-COFFEE", "CLUSTAL O", "CLUSTAL W"), - col = c("#3DAEB2", "#5E78A1", "#74628F", "#7D5564"), - lwd = 2, - cex = 0.7, - bty = "n") - -# Your alignment is going to be different from mine, due to the inclusion of -# MYSPE - but what I see is that MUSCLE gives the highest score overall, and -# achieves this with fewer indels than most, and the lowest number of gaps of -# all algorithms. - -# To actually compare regions of alignments, we need to align alignments. - - -# = 5 Profile-Profile alignments ========================================== - - -# Profile-profile alignments are the most powerful way to pick up distant -# relationships between sequence families. The can be used, for example to build -# a profile from structural superpositions of crystal structures, and then map a -# MSA alignment onto those features. Here we will use profile-profile comparison -# to compare two MSAs with each other, by aligning them. The algorithm is -# provided by the DECIPHER package. - -if (! requireNamespace("DECIPHER", quietly=TRUE)) { - BiocManager::install("DECIPHER") -} -# Package information: -# library(help = DECIPHER) # basic information -# browseVignettes("DECIPHER") # available vignettes -# data(package = "DECIPHER") # available datasets - -# AlignProfiles() takes two AAStringSets as input. Let's compare the MUSCLE and -# CLUSTAL W alignments: we could do this directly ... -DECIPHER::AlignProfiles(msaW@unmasked, msaM@unmasked) - -# But for ease of comparison, we'll reorder the sequences of the CLUSTAL W -# alignment into the same order as the MUSCLE alignment: -m <- as.character(msaM) -w <- as.character(msaW)[names(m)] - -(ppa <- DECIPHER::AlignProfiles(AAStringSet(w), AAStringSet(m))) - -# Conveniently, AlignProfiles() returns an AAStringSet, so we can use our -# writeALN function to show it. Here is an arbitrary block, from somewhere in -# the middle of the alignment: - -writeALN(ppa, range = c(751, 810)) - -# If you look at this for a while, you can begin to figue out where the -# algorithms made different decisions about where to insert gaps, and how to -# move segments of sequence around. But matters become more clear if we -# post-process this profile-profile alignment. Let's replace all hyphens that -# the pp-alignment has inserted with blanks, and let's add a separator line down -# the middle between the two alignments. - -x <- unlist(strsplit(as.character(ppa), "")) # unlist all -dim(x) <- c(width(ppa)[1], length(ppa)) # form into matrix by columns -x <- t(x) # transpose the matrix -(a1 <- 1:(nrow(x)/2)) # rows of alignment 1 -(a2 <- ((nrow(x)/2) + 1):nrow(x)) # rows of alignment 2 -for (i in 1:ncol(x)) { - if (all(x[a1, i] == "-")) { x[a1, i] <- " " } # blank hyphens that shift - if (all(x[a2, i] == "-")) { x[a2, i] <- " " } # original alignment blocks -} - -# collapse the matrix into strings -ppa2 <- character() -for (i in 1:nrow(x)) { - ppa2[i] <- paste0(x[i, ], collapse = "") - names(ppa2)[i] <- names(ppa)[i] -} - -# add a separator line -x <- paste0(rep("-", width(ppa)[1]), collapse = "") -ppa2 <- c(ppa2[a1], x, ppa2[a2]) - -# inspect -writeALN(ppa2, range = c(800, 960)) - -# Again, go explore, and get a sense of what's going on. You may find that -# CLUSTAL W has a tendency to insert short gaps all over the alignment, whereas -# MUSCLE keeps indels in blocks. CLUSTAL's behaviour is exactly what I would -# expect from an algorithm that builds alignments incrementally from pairwise -# local alignments, without global refinement. - - -# = 6 Sequence Logos ====================================================== - -# To visualize the information that we can get about structure and function with -# an MSA, we'll calculate a sequence logo of the Mbp1 recognition helix - the -# part of the structure that inserts into the major groove of the DNA and -# provides sequence specificity to the DNA binding of this transcription factor. -# Helix-B in Mbp1 with four residues upstream and downstream spans the sequence -# 43-ANFAKAKRTRILEKEVLKE-61 - -# == 6.1 Subsetting an alignment by motif ================================== - -# Finding the location of such an substring in an alignment is not entirely -# trivial, because the alignment might have produced indels in that sequence. -# Our strategy can be: -# - fetch the sequence from the alignment -# - remove all hyphens -# - find the range where the target sequence matches -# - count how many characters in all there are in the aligned sequence, up -# to the start and end of the match -# - these numbers define the range of the match in the alignment. - -x <- as.character(msaM)["MBP1_SACCE"] -xAA <- gsub("-", "", x) - -motif <- "ANFAKAKRTRILEKEVLKE" -(m <- regexpr(motif, xAA)) # matched in position 43, with a length of 19 -(motifStart <- as.numeric(m)) -(motifEnd <- attr(m, "match.length") + motifStart - 1) - -# To count characters, we split the string into single characters ... -x <- unlist(strsplit(x, "")) - -# ... convert this into a boolean, which is true if the character is not -# a hyphen ... -x <- x != "-" - -# ... cast this into a numeric, which turns TRUE into 1 and FALSE into 0 ... -x <- as.numeric(x) - -# ... and sum up the cumulative sum. -x <- cumsum(x) - -# Now we can find where the 43'd and 61'st characters are located in the -# alignment string ... -(aliStart <- which(x == motifStart)[1]) # get the first hit if there are more -(aliEnd <- which(x == motifEnd)[1]) - -# ... and subset the alignment - -(motifAli <- subseq(msaM@unmasked, start = aliStart, end = aliEnd)) - -# Packaging this into a function is convenient to have, therefore I have added -# such a function to the .utilities.R script: fetchMSAmotif(). Try it: - -wing <- "HEKVQGGFGKYQGTWV" # the MBP1_SACCE APSES "wing" sequence -writeALN(fetchMSAmotif(msaM, wing)) - - -# == 6.2 Plot a Sequence Logo ============================================== - -# The Bioconductor seqLogo:: packager handles only DNA sequences, but there are -# now several good options to plot sequence logos in R, these include dagLogo, -# DiffLogo, Logolas, and motifStack. For our example we will use ggseqlogo -# written by by Omar Waghi, a former UofT BCB student who is now at the EBI. - -if (! requireNamespace("ggseqlogo", quietly=TRUE)) { - install.packages(("ggseqlogo")) -} -# Package information: -# library(help=ggseqlogo) # basic information -# browseVignettes("ggseqlogo") # available vignettes -# data(package = "ggseqlogo") # available datasets - -ggseqlogo::ggseqlogo(as.character(motifAli)) - - - - - -# [END] +# tocID <- "BIN-ALI-MSA.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-ALI-MSA unit. +# +# Version: 1.3 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.3 2020 updates +# 1.2 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.1 Added fetchMSAmotif() +# 1.0 Fully refactored and rewritten for 2017 +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------------------------ +#TOC> 1 Preparations 55 +#TOC> 2 Aligning full length MBP1 proteins 97 +#TOC> 2.1 Preparing Sequences 108 +#TOC> 2.2 Compute the MSA 133 +#TOC> 3 Analyzing an MSA 154 +#TOC> 4 Comparing MSAs 226 +#TOC> 4.1 Importing an alignment to msa 235 +#TOC> 4.1.1 importing an .aln file 244 +#TOC> 4.1.2 Creating an MsaAAMultipleAlignment object 275 +#TOC> 4.2 More alignments 326 +#TOC> 4.3 Computing comparison metrics 338 +#TOC> 5 Profile-Profile alignments 476 +#TOC> 6 Sequence Logos 549 +#TOC> 6.1 Subsetting an alignment by motif 558 +#TOC> 6.2 Plot a Sequence Logo 607 +#TOC> +#TOC> ========================================================================== + + +# = 1 Preparations ======================================================== + +# You need to reload you protein database, including changes that might +# have been made to the reference files. If you have worked with the +# prerequisite units, you should have a script named "./myScripts/makeProteinDB.R" +# that will create the myDB object with a protein and feature database. +# Ask for advice if not. +source("./myScripts/makeProteinDB.R") + + +if (! requireNamespace("BiocManager", quietly=TRUE)) { + install.packages("BiocManager") +} +if (! requireNamespace("Biostrings", quietly=TRUE)) { + BiocManager::install("Biostrings") +} +# Package information: +# library(help = Biostrings) # basic information +# browseVignettes("Biostrings") # available vignettes +# data(package = "Biostrings") # available datasets + +# Multiple sequence alignment algorithms are provided in +# the Bioconductor msa package. + +if (! requireNamespace("msa", quietly=TRUE)) { + BiocManager::install("msa") +} +# Package information: +# library(help=msa) # basic information +# browseVignettes("msa") # available vignettes +# data(package = "msa") # available datasets + + +# If an installation asks you if you want to update older packages, I recommend +# to always answer "a" for "all" unless you have an important reason not to. But +# if the installer asks you whether you want to compile from source, answer "n" +# for "no" unless you need new functionality in a particular bleeding-edge +# version of a package. + +help(package = "msa") + + +# = 2 Aligning full length MBP1 proteins ================================== + +# In the Wiki part of this unit you have +# - aligned full length MBP1 protein sequences at the EBI using T-Coffee +# - saved the resulting alignment in CLUSTAL format +# to the file "MBP1orthologuesTC.aln" + +# In this section we will calculate an MSA of the same sequences using +# algorithms in the msa packages, and we will compare the two alignments. + + +# == 2.1 Preparing Sequences =============================================== + +# We have used the biostrings' AAString() function before; for multiple +# alignments we need an AAStringSet(). AAStringSets are produced from vectors +# of sequence. + +sel <- grep("MBP1", myDB$protein$name) +MBP1set <- Biostrings::AAStringSet(myDB$protein$sequence[sel]) + +# To help us make sense of the alignment we need to add the names for +# the sequences. Names for a seqSet object are held in the ranges slot... + +MBP1set@ranges@NAMES <- myDB$protein$name[sel] + +MBP1set + +# You should have eleven sequences in this set, ask for advice if you don't. + +# The little step of adding names is actually really very important. That's +# because the aligned sequences are meaningless strings of characters unless we +# can easily identify their biological relationships. Creating MSAs that are +# only identified by e.g. their RefSeq ids is a type of cargo-cult +# bioinformatics that we encounter a lot. The point of the alignment is not to +# create it, but to interpret it! + +# == 2.2 Compute the MSA =================================================== + +# The alignment itself is very simple. msa has msaMuscle() and msaClustalOmega() +# to produce alignments. (It also has msaClustalW() which is kind of +# embarrassing since that hasn't been the algorithm of first choice for +# decades. Don't use that one for real work.) + + +# Let's run an alignment with "Muscle" +(msaM <- msa::msaMuscle( MBP1set, order = "aligned")) + +# ... or to see the whole thing (cf. ?MsaAAMultipleAlignment ... print method): +msa::print(msaM, show=c("alignment", "complete"), showConsensus=FALSE) + + +# You see that the alignment object has sequence strings with hyphens as +# indel-characters. The names are printed to the console. And you also see that +# the order has not been preserved, but the most similar sequences are now +# adjacent to each other. + + +# = 3 Analyzing an MSA ==================================================== + +# You probabaly realize that computing an MSA is not that hard. It's not +# entirely trivial to collect meaningful sequences via e.g. PSI-BLAST ... but +# then computing the alignment gives you a result quickly. But what does it +# mean? What information does the MSA contain? + +# Let's have a first look at conserved vs. diverged regions of the MSA. msa +# provides the function msaConservationScore() which outputs a vector of scores. +# The scores are the sum of pairscores for the column: for example a perfectly +# conserved column of histidines would have the following score in our MSA +# of eleven sequences: +# - one (H, H) pair score is 8 in BLOSUM62; +# - there are (n^2 - n) / 2 pairs that can be formed between amino acids +# in a column from n sequences; +# - therefore the column score is 8 * (11^2 - 11) / 2 == 440 + +# attach the BLOSUM62 package from the Biostrings package +data(BLOSUM62, package = "Biostrings") + +msaMScores <- msa::msaConservationScore(msaM, substitutionMatrix = BLOSUM62) +plot(msaMScores, type = "l", col = "#205C5E", xlab = "Alignment Position") + +# That plot shows the well-aligned regions (domains ?) of the sequence, but it +# could use some smoothing. Options for smoothing such plots include calculating +# averages in sliding windows ("moving average"), and lowess() smoothing. Here +# is a quick demo of a moving average smoothing, to illustrate the principle. + +wRadius <- 15 # we take the mean of all values around a point +- wRadius +len <- length(msaMScores) +v <- msaMScores +for (i in (1 + wRadius):(len - wRadius)) { + v[i] <- mean(msaMScores[(i - wRadius):(i + wRadius)]) # mean of values in + # window around i +} +points(v, col = "#FFFFFF", type = "l", lwd = 4.5) +points(v, col = "#3DAEB2", type = "l", lwd = 3) + + +# You can set a threshold and use rle() to define ranges of values that fall +# above and below the threshold, and thus approximate domain boundaries: +thrsh <- 30 +(highScoringRanges <- rle(v > thrsh)) +(idx <- c(1, cumsum(highScoringRanges$lengths))) +for (i in seq_along(highScoringRanges$lengths)) { + if (highScoringRanges$values[i] == TRUE) { # If this range is above threshold, + rect(idx[i], thrsh, idx[i+1], max(v), # ... draw a rectangle + col = "#205C5E33") # ... with a transparent color. + cat(sprintf("Possible domain from %d to %d\n", idx[i], idx[i+1])) + } +} + +# Getting this right requires a bit of fiddling with the window radius and +# threshold (experiment with that a bit), but once we are satisfied, we can use +# the boundaries to print the MSA alignments separately for domains. +# Unfortunately the msa package provides no native way to extract blocks of the +# alignment for further processing, but your .utilities.R script contains a +# function to write alignment objects and sequence sets to .aln formatted +# output. Have a look: + +writeALN + +# Print out the aligned blocks +for (i in seq_along(highScoringRanges$lengths)) { + if (highScoringRanges$values[i] == TRUE) { # If this range is above threshold, + cat(sprintf("\n\nPossible domain from %d to %d\n", idx[i], idx[i+1])) + writeALN(msaM, range = c(idx[i], idx[i+1])) + } +} + + + +# = 4 Comparing MSAs ====================================================== + +# Let's compare the results of different alignment algorithms. We computed a +# vector of scores above, and we can compare that for different alignment +# algorithms. This is not trivial, so we'll need to look at that data in +# different ways and explore it. But first, let's get more alignments to compare +# with. + + +# == 4.1 Importing an alignment to msa ===================================== + +# We computed a T-Coffee alignment at the EBI. msa has no native import function +# so we need to improvise, and it's a bit of a pain to do - but a good +# illustration of strategies to convert data into any kind of object: +# - read an .aln file +# - adjust the sequence names +# - convert to msaAAMultipleAlignment object + +# === 4.1.1 importing an .aln file + +# The seqinr package has a function to read CLUSTAL W formatted .aln files ... +if (! requireNamespace("seqinr", quietly=TRUE)) { + install.packages("seqinr") +} +# Package information: +# library(help=seqinr) # basic information +# browseVignettes("seqinr") # available vignettes +# data(package = "seqinr") # available datasets + +# read the T-coffee aligned file that you donwloaded from the EBI MSA tools +# (cf. http://steipe.biochemistry.utoronto.ca/abc/index.php/BIN-ALI-MSA) +tmp <- seqinr::read.alignment("msaT.aln", format = "clustal") + +# read.alignment() returns a list. $seq is a list of strings, one for each +# complete alignment. However, they are converted to lower case. +x <- toupper(unlist(tmp$seq)) # get the sequences, uppercase + +# $nam contains the names. +(names(x) <- tmp$nam) + +# Note that the names in the file are refseq IDs, we need to replace the +# RefSeqIDs with the database names: +for (i in seq_along(x)) { + # find the index of the RefSeqID + id <- gsub("\\..*$", "", names(x)[i]) # fetch the name, drop the version + sel <- which(myDB$protein$RefSeqID == id) # get the index + names(x)[i] <- myDB$protein$name[sel] # get the name +} + +# === 4.1.2 Creating an MsaAAMultipleAlignment object + +# MsaAAMultipleAlignment objects are S4 objects that contain AAStringSet objects +# in their @unmasked slot, and a few additional items. Rather then build the +# object from scratch, we copy an existing object, and overwrite the data in its +# slots with what we need. Our goal is pragmatic, we want an object that msa's +# functions will accept as input. + +# First: convert our named char vector into an AAstringSet +x <- Biostrings::AAStringSet(x) + +# Then: create a new MsaAAMultipleAlignment S4 object. The msa package has +# defined what such an object should look like, with the SetClass() function. To +# create a new object, simply use the new() function, define the class that the +# object would have, and fill the slots with something that has the right type. +# How do we know the right type and the slot names? Easy! We just use +# str() to get the information. + +str(msaM) + +# There is a catch however in the way R makes such operations specific to +# the packages they need them: the function that creates the class is +# defined as a "generic", and when it is called, R looks in the package +# namespace for a more specific function with precise instructions what +# to do. However, we have not loaded the package namespace - we access all +# of the functions directly with the msa:: prefix. This method breaks down +# when generic functions are involved. I.e. - we could make it work, but +# the amount of code we need then is unreasonable. The straightforward +# way is to load the package. We can still use the prefix notation for +# its functions, just to emphasize where the function comes from. But since +# the namespace then exists, we ensure that generics are properly dispatched. + +library(msa) # load the msa package namespace + +msaT <- new("MsaAAMultipleAlignment", # create new MsaAAMultipleAlignment object + unmasked = x, # "unmasked" slot takes an AAStringSet + version = "T-Coffee", # "version" slot takes a string + params = list(), # "params" takes a list(), we leave the + # list empty, but we could add the + # alignment parameters that we used at + # the EBI here. + call = "imported from T-coffee alignment") # also a string + +str(msaT) + + +msaT # Now we have fabricated an msaAAMultipleAlignment object, and we can + # use the msa package functions on it + +msaTScores <- msa::msaConservationScore(msaT, substitutionMatrix = BLOSUM62) + +# == 4.2 More alignments =================================================== + +# Next, we calculate alignments with msa's two other alignment options: +# CLUSTAL Omega +(msaO <- msa::msaClustalOmega( MBP1set, order = "aligned")) +msaOScores <- msa::msaConservationScore(msaO, substitutionMatrix = BLOSUM62) + +# CLUSTAL W +(msaW <- msa::msaClustalW( MBP1set, order = "aligned")) +msaWScores <- msa::msaConservationScore(msaW, substitutionMatrix = BLOSUM62) + + +# == 4.3 Computing comparison metrics ====================================== + +# Ready to compare. + +# ... sum of alignment scores of alignment divided by sum of alignment scores +# of reference alignment (arbitrarily using CLUSTAL W as reference) + +sRef <- sum(msaWScores) +sum(msaWScores) / sRef # CLUSTAl W +sum(msaOScores) / sRef # CLUSTAL O +sum(msaTScores) / sRef # T-COFFEE +sum(msaMScores) / sRef # MUSCLE + +# ... mean alignment scores (higher is better) + +mean(msaWScores) # CLUSTAl W +mean(msaOScores) # CLUSTAL O +mean(msaTScores) # T-COFFEE +mean(msaMScores) # MUSCLE + +# total number of gaps (lower is better) +countGaps <- function(ali) { + x <- paste0(as.character(ali), collapse = "") + aa <- nchar(gsub("-", "", x)) + return(nchar(x) - aa) +} + +countGaps(msaW) # CLUSTAl W +countGaps(msaO) # CLUSTAL O +countGaps(msaT) # T-COFFEE +countGaps(msaM) # MUSCLE + +# number of indels in alignment (lower is less fragmented) +countIndels <- function(ali) { + x <- paste0(as.character(ali), collapse = "") # collapse into single string + x <- unlist(strsplit(x, "")) # split into characters + x <- x == "-" # convert into boolean + x <- rle(x) # calculate rle + # every run of TRUE is one indel event + return(sum(x$values)) +} + +countIndels(msaW) # CLUSTAl W +countIndels(msaO) # CLUSTAL O +countIndels(msaT) # T-COFFEE +countIndels(msaM) # MUSCLE + +# Let's look at the distribution of alignment scores: +boxplot(list(CLUSTAL.W = msaWScores, + CLUSTAL.O = msaOScores, + T.COFFEE = msaTScores, + MUSCLE = msaMScores), + cex.axis = 0.8, + col = c("#7D556488", "#74628F88", "#5E78A188", "#3DAEB288")) + +# CLUSTAL W and CLUSTAL O don't look all that different. T-Coffee tends to have +# a tighter distribution with less negative scores. Muscle has a slightly higher +# mean and generally higher scores. + +# Boxplots are convenient, but don't give us much detail about the shape of the +# distribution. For that, we need histograms, or density plots. + +plot(density(msaWScores), + type = "l", + col = "#7D5564", + lwd = 1.5, + ylim = c(0, (max(density(msaWScores)$y) * 1.3)), + main = "Comparing MSA algorithms", + xlab = "Alignment Score", + ylab = "Density") +points(density(msaOScores), + type = "l", + lwd = 1.5, + col = "#74628F") +points(density(msaTScores), + type = "l", + lwd = 1.5, + col = "#5E78A1") +points(density(msaMScores), + type = "l", + lwd = 1.5, + col = "#3DAEB2") +legend("topright", + legend = c("MUSCLE", "T-COFFEE", "CLUSTAL O", "CLUSTAL W"), + col = c("#3DAEB2", "#5E78A1", "#74628F", "#7D5564"), + lwd = 2, + cex = 0.7, + bty = "n") + +# The density plots confirm in more detail that CLUSTAL W misses some of the +# higher-scoring possibilities, that wherever CLUSTAL O is bad, it is quite bad, +# that T-COFFEE has fewer poorly scoring columns but misses some of the better +# scoring possibilities, and that MUSCLE appears to do best overall. + +# Can we attribute these differences to sections of the alignment in which the +# algorithms did better or worse? Let's plot the scores cumulatively. The +# alignments have different lengths, so we plot the scores on the respective +# fraction of the alignement length. + +plot(seq(0, 1, length.out = length(msaWScores)), # x- axis: fraction of length + cumsum(msaWScores), + type = "l", + col = "#7D5564", + lwd = 1.5, + ylim = c(0, max(cumsum(msaMScores))), + main = "Comparing MSA algorithms", + xlab = "Alignment Position", + ylab = "Cumulative Alignment Score") +points(seq(0, 1, length.out = length(msaOScores)), # x- axis: fraction of length + cumsum(msaOScores), + type = "l", + lwd = 1.5, + col = "#74628F") +points(seq(0, 1, length.out = length(msaTScores)), # x- axis: fraction of length + cumsum(msaTScores), + type = "l", + lwd = 1.5, + col = "#5E78A1") +points(seq(0, 1, length.out = length(msaMScores)), # x- axis: fraction of length + cumsum(msaMScores), + type = "l", + lwd = 1.5, + col = "#3DAEB2") +legend("bottomright", + legend = c("MUSCLE", "T-COFFEE", "CLUSTAL O", "CLUSTAL W"), + col = c("#3DAEB2", "#5E78A1", "#74628F", "#7D5564"), + lwd = 2, + cex = 0.7, + bty = "n") + +# Your alignment is going to be different from mine, due to the inclusion of +# MYSPE - but what I see is that MUSCLE gives the highest score overall, and +# achieves this with fewer indels than most, and the lowest number of gaps of +# all algorithms. + +# To actually compare regions of alignments, we need to align alignments. + + +# = 5 Profile-Profile alignments ========================================== + + +# Profile-profile alignments are the most powerful way to pick up distant +# relationships between sequence families. The can be used, for example to build +# a profile from structural superpositions of crystal structures, and then map a +# MSA alignment onto those features. Here we will use profile-profile comparison +# to compare two MSAs with each other, by aligning them. The algorithm is +# provided by the DECIPHER package. + +if (! requireNamespace("DECIPHER", quietly=TRUE)) { + BiocManager::install("DECIPHER") +} +# Package information: +# library(help = DECIPHER) # basic information +# browseVignettes("DECIPHER") # available vignettes +# data(package = "DECIPHER") # available datasets + +# AlignProfiles() takes two AAStringSets as input. Let's compare the MUSCLE and +# CLUSTAL W alignments: we could do this directly ... +DECIPHER::AlignProfiles(msaW@unmasked, msaM@unmasked) + +# But for ease of comparison, we'll reorder the sequences of the CLUSTAL W +# alignment into the same order as the MUSCLE alignment: +m <- as.character(msaM) +w <- as.character(msaW)[names(m)] + +(ppa <- DECIPHER::AlignProfiles(AAStringSet(w), AAStringSet(m))) + +# Conveniently, AlignProfiles() returns an AAStringSet, so we can use our +# writeALN function to show it. Here is an arbitrary block, from somewhere in +# the middle of the alignment: + +writeALN(ppa, range = c(751, 810)) + +# If you look at this for a while, you can begin to figue out where the +# algorithms made different decisions about where to insert gaps, and how to +# move segments of sequence around. But matters become more clear if we +# post-process this profile-profile alignment. Let's replace all hyphens that +# the pp-alignment has inserted with blanks, and let's add a separator line down +# the middle between the two alignments. + +x <- unlist(strsplit(as.character(ppa), "")) # unlist all +dim(x) <- c(width(ppa)[1], length(ppa)) # form into matrix by columns +x <- t(x) # transpose the matrix +(a1 <- 1:(nrow(x)/2)) # rows of alignment 1 +(a2 <- ((nrow(x)/2) + 1):nrow(x)) # rows of alignment 2 +for (i in 1:ncol(x)) { + if (all(x[a1, i] == "-")) { x[a1, i] <- " " } # blank hyphens that shift + if (all(x[a2, i] == "-")) { x[a2, i] <- " " } # original alignment blocks +} + +# collapse the matrix into strings +ppa2 <- character() +for (i in 1:nrow(x)) { + ppa2[i] <- paste0(x[i, ], collapse = "") + names(ppa2)[i] <- names(ppa)[i] +} + +# add a separator line +x <- paste0(rep("-", width(ppa)[1]), collapse = "") +ppa2 <- c(ppa2[a1], x, ppa2[a2]) + +# inspect +writeALN(ppa2, range = c(800, 960)) + +# Again, go explore, and get a sense of what's going on. You may find that +# CLUSTAL W has a tendency to insert short gaps all over the alignment, whereas +# MUSCLE keeps indels in blocks. CLUSTAL's behaviour is exactly what I would +# expect from an algorithm that builds alignments incrementally from pairwise +# local alignments, without global refinement. + + +# = 6 Sequence Logos ====================================================== + +# To visualize the information that we can get about structure and function with +# an MSA, we'll calculate a sequence logo of the Mbp1 recognition helix - the +# part of the structure that inserts into the major groove of the DNA and +# provides sequence specificity to the DNA binding of this transcription factor. +# Helix-B in Mbp1 with four residues upstream and downstream spans the sequence +# 43-ANFAKAKRTRILEKEVLKE-61 + +# == 6.1 Subsetting an alignment by motif ================================== + +# Finding the location of such an substring in an alignment is not entirely +# trivial, because the alignment might have produced indels in that sequence. +# Our strategy can be: +# - fetch the sequence from the alignment +# - remove all hyphens +# - find the range where the target sequence matches +# - count how many characters in all there are in the aligned sequence, up +# to the start and end of the match +# - these numbers define the range of the match in the alignment. + +x <- as.character(msaM)["MBP1_SACCE"] +xAA <- gsub("-", "", x) + +motif <- "ANFAKAKRTRILEKEVLKE" +(m <- regexpr(motif, xAA)) # matched in position 43, with a length of 19 +(motifStart <- as.numeric(m)) +(motifEnd <- attr(m, "match.length") + motifStart - 1) + +# To count characters, we split the string into single characters ... +x <- unlist(strsplit(x, "")) + +# ... convert this into a boolean, which is true if the character is not +# a hyphen ... +x <- x != "-" + +# ... cast this into a numeric, which turns TRUE into 1 and FALSE into 0 ... +x <- as.numeric(x) + +# ... and sum up the cumulative sum. +x <- cumsum(x) + +# Now we can find where the 43'd and 61'st characters are located in the +# alignment string ... +(aliStart <- which(x == motifStart)[1]) # get the first hit if there are more +(aliEnd <- which(x == motifEnd)[1]) + +# ... and subset the alignment + +(motifAli <- subseq(msaM@unmasked, start = aliStart, end = aliEnd)) + +# Packaging this into a function is convenient to have, therefore I have added +# such a function to the .utilities.R script: fetchMSAmotif(). Try it: + +wing <- "HEKVQGGFGKYQGTWV" # the MBP1_SACCE APSES "wing" sequence +writeALN(fetchMSAmotif(msaM, wing)) + + +# == 6.2 Plot a Sequence Logo ============================================== + +# The Bioconductor seqLogo:: packager handles only DNA sequences, but there are +# now several good options to plot sequence logos in R, these include dagLogo, +# DiffLogo, Logolas, and motifStack. For our example we will use ggseqlogo +# written by by Omar Waghi, a former UofT BCB student who is now at the EBI. + +if (! requireNamespace("ggseqlogo", quietly=TRUE)) { + install.packages(("ggseqlogo")) +} +# Package information: +# library(help=ggseqlogo) # basic information +# browseVignettes("ggseqlogo") # available vignettes +# data(package = "ggseqlogo") # available datasets + +ggseqlogo::ggseqlogo(as.character(motifAli)) + + + + + +# [END] diff --git a/BIN-ALI-Optimal_sequence_alignment.R b/BIN-ALI-Optimal_sequence_alignment.R index 54919f2..1960cd2 100644 --- a/BIN-ALI-Optimal_sequence_alignment.R +++ b/BIN-ALI-Optimal_sequence_alignment.R @@ -1,365 +1,365 @@ -# tocID <- "BIN-ALI-Optimal_sequence_alignment.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-ALI-Optimal_sequence_alignment unit. -# -# ============================================================================== -# Version: 1.7.1 -# -# Date: 2017-09 - 2020-10 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.7.1 add jsonlite:: to fromjJSON() in code sample and ./myScripts/ -# 1.7 2020 updates -# 1.6 Maintenance -# 1.5 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.4 Pull s2c() from seqinr package, rather then loading the -# entire library. -# 1.3 Updated confirmation task with correct logic -# 1.2 Added missing load of seqinr package -# 1.1 Update annotation file logic - it could already have been -# prepared in the BIN-FUNC-Annotation unit. -# 1.0.1 bugfix -# 1.0 First 2017 live version. -# 0.1 First code copied from 2016 material. -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------------------------------------------- -#TOC> 1 Prepare 58 -#TOC> 2 Biostrings Pairwise Alignment 75 -#TOC> 2.1 Optimal global alignment 93 -#TOC> 2.2 Optimal local alignment 156 -#TOC> 3 APSES Domain annotation by alignment 180 -#TOC> 4 Update your database script 261 -#TOC> 4.1 Preparing an annotation file ... 267 -#TOC> 4.1.1 If you HAVE NOT done the BIN-FUNC-Annotation unit 269 -#TOC> 4.1.2 If you HAVE done the BIN-FUNC-Annotation unit 314 -#TOC> 4.2 Execute and Validate 338 -#TOC> -#TOC> ========================================================================== - - -# = 1 Prepare ============================================================= - -if (! requireNamespace("seqinr", quietly=TRUE)) { - install.packages("seqinr") -} -# You can get package information with the following commands: -# library(help = seqinr) # basic information -# browseVignettes("seqinr") # available vignettes -# data(package = "seqinr") # available datasets - - -# You need to recreate the protein database that you have constructed in the -# BIN-Storing_data unit. - -source("./myScripts/makeProteinDB.R") - - -# = 2 Biostrings Pairwise Alignment ======================================= - - -if (!requireNamespace("BiocManager", quietly=TRUE)) { - install.packages("BiocManager") -} -if (!requireNamespace("Biostrings", quietly=TRUE)) { - BiocManager::install("Biostrings") -} -# Package information: -# library(help = Biostrings) # basic information -# browseVignettes("Biostrings") # available vignettes -# data(package = "Biostrings") # available datasets - - -# Biostrings stores sequences in "XString" objects. Once we have converted our -# target sequences to AAString objects, the alignment itself is straightforward. - -# == 2.1 Optimal global alignment ========================================== - -# The pairwiseAlignment() function was written to behave -# exactly like the functions you encountered on the EMBOSS server. - -# First: make AAString objects ... -sel <- myDB$protein$name == "MBP1_SACCE" -aaMBP1_SACCE <- Biostrings::AAString(myDB$protein$sequence[sel]) - -sel <- myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "") -aaMBP1_MYSPE <- Biostrings::AAString(myDB$protein$sequence[sel]) - -?pairwiseAlignment -# ... and align. -# Global optimal alignment with end-gap penalties is default. -ali1 <- Biostrings::pairwiseAlignment( - aaMBP1_SACCE, - aaMBP1_MYSPE, - substitutionMatrix = "BLOSUM62", - gapOpening = 10, - gapExtension = 0.5) - -str(ali1) # ... it's complicated - -# This is a Biostrings alignment object. But we can use Biostrings functions to -# tame it: -ali1 -Biostrings::writePairwiseAlignments(ali1) # That should look familiar - -# And we can make the internal structure work for us (@ is for classes as -# $ is for lists ...) -str(ali1@pattern) -ali1@pattern -ali1@pattern@range -ali1@pattern@indel -ali1@pattern@mismatch - -# or work with "normal" R functions -# the alignment length -nchar(as.character(ali1@pattern)) - -# the number of identities -sum(seqinr::s2c(as.character(ali1@pattern)) == - seqinr::s2c(as.character(ali1@subject))) - -# ... e.g. to calculate the percentage of identities -100 * - sum(seqinr::s2c(as.character(ali1@pattern)) == - seqinr::s2c(as.character(ali1@subject))) / - nchar(as.character(ali1@pattern)) -# ... which should be the same as reported in the writePairwiseAlignments() -# output. Awkward to type? Then it calls for a function: -# -percentID <- function(al) { - # returns the percent-identity of a Biostrings alignment object - return(100 * - sum(seqinr::s2c(as.character(al@pattern)) == - seqinr::s2c(as.character(al@subject))) / - nchar(as.character(al@pattern))) -} - -percentID(ali1) - -# == 2.2 Optimal local alignment =========================================== - -# Compare with local optimal alignment (like EMBOSS Water) -ali2 <- Biostrings::pairwiseAlignment( - aaMBP1_SACCE, - aaMBP1_MYSPE, - type = "local", - substitutionMatrix = "BLOSUM62", - gapOpening = 50, - gapExtension = 10) - -Biostrings::writePairwiseAlignments(ali2) -# This has probably only aligned the N-terminal DNA binding domain - but that -# one has quite high sequence identity: -percentID(ali2) - -# == TASK: == - -# Compare the two alignments. I have weighted the local alignment heavily -# towards an ungapped alignment by setting very high gap penalties. Try changing -# the gap penalties and see what happens: how does the number of indels change, -# how does the length of indels change... - - -# = 3 APSES Domain annotation by alignment ================================ - -# In this section we define the MYSPE APSES sequence by performing a global, -# optimal sequence alignment of the yeast APSES domain with the full length -# protein sequence of the protein that was the most similar to the yeast APSES -# domain. -# - -# I have annotated the yeast APSES domain as a feature in the -# database. To view the annotation, we can retrieve it via the proteinID and -# featureID. Here is the yeast protein ID: -(proID <- myDB$protein$ID[myDB$protein$name == "MBP1_SACCE"]) - - -# ... and if you look at the feature table, you can identify the feature ID -(ftrID <- myDB$feature$ID[myDB$feature$name == "APSES fold"]) - -# ... and with the two annotations we can get the corresponding ID from the -# annotation table -(fanID <- myDB$annotation$ID[myDB$annotation$proteinID == proID & - myDB$annotation$featureID == ftrID]) - -myDB$annotation[myDB$annotation$ID == proID & - myDB$annotation$ID == ftrID, ] - -# The annotation record contains the start and end coordinates which we can use -# to define the APSES domain sequence with a substr() expression. - -(start <- myDB$annotation$start[myDB$annotation$ID == fanID]) -(end <- myDB$annotation$end[myDB$annotation$ID == fanID]) -(apses <- substr(myDB$protein$sequence[myDB$protein$ID == proID], - start, - end)) - -# Lots of code. But don't get lost. Let's recapitulate what we have done: we -# have selected from the sequence column of the protein table the sequence whose -# name is "MBP1_SACCE", and selected from the annotation table the start -# and end coordinates of the annotation that joins an "APSES fold" feature with -# the sequence, and used the start and end coordinates to extract a substring. - -# Let's convert this to an AAstring and assign it: -aaMB1_SACCE_APSES <- Biostrings::AAString(apses) - -# Now let's align these two sequences of very different length without end-gap -# penalties using the "overlap" type. "overlap" turns the -# end-gap penalties off and that is crucially important since -# the sequences have very different length. - -aliApses <- Biostrings::pairwiseAlignment( - aaMB1_SACCE_APSES, - aaMBP1_MYSPE, - type = "overlap", - substitutionMatrix = "BLOSUM62", - gapOpening = 10, - gapExtension = 0.5) - -# Inspect the result. The aligned sequences should be clearly -# homologous, and have (almost) no indels. The entire "pattern" -# sequence from QIYSAR ... to ... KPLFDF should be matched -# with the "query". Is this correct? -Biostrings::writePairwiseAlignments(aliApses) - -# If this is correct, you can extract the matched sequence from -# the alignment object. The syntax is a bit different from what -# you have seen before: this is an "S4 object", not a list. No -# worries: as.character() returns a normal string. -as.character(aliApses@subject) - -# Now, what are the aligned start and end coordinates? You can read them from -# the output of writePairwiseAlignments(), or you can get them from the range of -# the match. - -str(aliApses@subject@range) - -# start is: -aliApses@subject@range@start - -# ... and end is: -aliApses@subject@range@start + aliApses@subject@range@width - 1 - - -# = 4 Update your database script ========================================= - - -# Since we have this feature defined now, we can create a feature annotation -# right away and store it in myDB. - -# == 4.1 Preparing an annotation file ... ================================== -# -# === 4.1.1 If you HAVE NOT done the BIN-FUNC-Annotation unit -# -# -# You DON'T already have a file called "-Annotations.json" in the -# ./myScripts/ directory: -# -# - Make a copy of the file "./data/refAnnotations.json" and put it in your -# myScripts/ directory. -# -# - Give it a name that is structured like "-Annotations.json" - e.g. -# if MYSPE is called "Crptycoccus neoformans", your file should be called -# "CRYNE-Annotations.json" (and the "name" of your Mbp1 orthologue is -# "MBP1_CRYNE"). -# -# - Open the file in the RStudio editor and delete all blocks for -# the Mbp1 protein annotations except the first one. -# -# - From that block, delete all lines except for the line that says: -# -# {"pName" : "MBP1_SACCE", "fName" : "APSES fold", "start" : "4", "end" : "102"}, -# -# - Then delete the comma at the end of the line (your file will just have -# this one annotation). -# -# - Edit that annotation: change MBP1_SACCE to MBP1_ and change the -# "start" and "end" features to the coordinates you just discovered for the -# APSES domain in your sequence. -# -# - Save the file in your myScripts/ directory -# -## - Validate your file online at https://jsonlint.com/ -# -# - Update your "./myScripts/makeProteinDB.R" script to load your new -# annotation when you recreate the database. Open the script in the -# RStudio editor, and add the following command at the end: -# -# myDB <- dbAddAnnotation(myDB, -# jsonlite::fromJSON("./myScripts/-Annotations.json")) -# ^^^^^^^ -# edit this! -# - save and close the file. -# -# Then SKIP the next section. -# -# -# === 4.1.2 If you HAVE done the BIN-FUNC-Annotation unit -# -# -# You DO already have a file called "-Annotations.json" in the -# ./myScripts/ directory: -# -# - Open the file in the RStudio editor. -# -# - Below the last feature lines (but before the closing "]") add the -# following feature line (without the "#") -# -# {"pName" : "MBP1_SACCE", "fName" : "APSES fold", "start" : "4", "end" : "102"} -# -# - Edit that annotation: change MBP1_SACCE to MBP1_ and change the -# "start" and "end" features to the coordinates you just discovered for the -# APSES domain in your sequence. -# -# - Add a comma after the preceding feature line. -# -# - Save your file. -# -# - Validate your file online at https://jsonlint.com/ -# -# -# == 4.2 Execute and Validate ============================================== -# -# - source() your database creation script: -# -# source("./myScripts/makeProteinDB.R") -# -# This should run without errors or warnings. If it doesn't work and you -# can't figure out quickly what's happening, ask on the mailing list for -# help. -# -# - Confirm -# The following commands should retrieve the correct start and end -# coordinates and sequence of the MBP1_MYSPE APSES domain: - -sel <- which(myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "")) - -(proID <- myDB$protein$ID[sel]) -(ftrID <- myDB$feature$ID[myDB$feature$name == "APSES fold"]) -(fanID <- myDB$annotation$ID[myDB$annotation$proteinID == proID & - myDB$annotation$featureID == ftrID]) -(start <- myDB$annotation$start[myDB$annotation$ID == fanID]) -(end <- myDB$annotation$end[myDB$annotation$ID == fanID]) -(apses <- substr(myDB$protein$sequence[myDB$protein$ID == proID], - start, - end)) - - -# [END] +# tocID <- "BIN-ALI-Optimal_sequence_alignment.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-ALI-Optimal_sequence_alignment unit. +# +# ============================================================================== +# Version: 1.7.1 +# +# Date: 2017-09 - 2020-10 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.7.1 add jsonlite:: to fromjJSON() in code sample and ./myScripts/ +# 1.7 2020 updates +# 1.6 Maintenance +# 1.5 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.4 Pull s2c() from seqinr package, rather then loading the +# entire library. +# 1.3 Updated confirmation task with correct logic +# 1.2 Added missing load of seqinr package +# 1.1 Update annotation file logic - it could already have been +# prepared in the BIN-FUNC-Annotation unit. +# 1.0.1 bugfix +# 1.0 First 2017 live version. +# 0.1 First code copied from 2016 material. +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------------------------------------------- +#TOC> 1 Prepare 58 +#TOC> 2 Biostrings Pairwise Alignment 75 +#TOC> 2.1 Optimal global alignment 93 +#TOC> 2.2 Optimal local alignment 156 +#TOC> 3 APSES Domain annotation by alignment 180 +#TOC> 4 Update your database script 261 +#TOC> 4.1 Preparing an annotation file ... 267 +#TOC> 4.1.1 If you HAVE NOT done the BIN-FUNC-Annotation unit 269 +#TOC> 4.1.2 If you HAVE done the BIN-FUNC-Annotation unit 314 +#TOC> 4.2 Execute and Validate 338 +#TOC> +#TOC> ========================================================================== + + +# = 1 Prepare ============================================================= + +if (! requireNamespace("seqinr", quietly=TRUE)) { + install.packages("seqinr") +} +# You can get package information with the following commands: +# library(help = seqinr) # basic information +# browseVignettes("seqinr") # available vignettes +# data(package = "seqinr") # available datasets + + +# You need to recreate the protein database that you have constructed in the +# BIN-Storing_data unit. + +source("./myScripts/makeProteinDB.R") + + +# = 2 Biostrings Pairwise Alignment ======================================= + + +if (!requireNamespace("BiocManager", quietly=TRUE)) { + install.packages("BiocManager") +} +if (!requireNamespace("Biostrings", quietly=TRUE)) { + BiocManager::install("Biostrings") +} +# Package information: +# library(help = Biostrings) # basic information +# browseVignettes("Biostrings") # available vignettes +# data(package = "Biostrings") # available datasets + + +# Biostrings stores sequences in "XString" objects. Once we have converted our +# target sequences to AAString objects, the alignment itself is straightforward. + +# == 2.1 Optimal global alignment ========================================== + +# The pairwiseAlignment() function was written to behave +# exactly like the functions you encountered on the EMBOSS server. + +# First: make AAString objects ... +sel <- myDB$protein$name == "MBP1_SACCE" +aaMBP1_SACCE <- Biostrings::AAString(myDB$protein$sequence[sel]) + +sel <- myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "") +aaMBP1_MYSPE <- Biostrings::AAString(myDB$protein$sequence[sel]) + +?pairwiseAlignment +# ... and align. +# Global optimal alignment with end-gap penalties is default. +ali1 <- Biostrings::pairwiseAlignment( + aaMBP1_SACCE, + aaMBP1_MYSPE, + substitutionMatrix = "BLOSUM62", + gapOpening = 10, + gapExtension = 0.5) + +str(ali1) # ... it's complicated + +# This is a Biostrings alignment object. But we can use Biostrings functions to +# tame it: +ali1 +Biostrings::writePairwiseAlignments(ali1) # That should look familiar + +# And we can make the internal structure work for us (@ is for classes as +# $ is for lists ...) +str(ali1@pattern) +ali1@pattern +ali1@pattern@range +ali1@pattern@indel +ali1@pattern@mismatch + +# or work with "normal" R functions +# the alignment length +nchar(as.character(ali1@pattern)) + +# the number of identities +sum(seqinr::s2c(as.character(ali1@pattern)) == + seqinr::s2c(as.character(ali1@subject))) + +# ... e.g. to calculate the percentage of identities +100 * + sum(seqinr::s2c(as.character(ali1@pattern)) == + seqinr::s2c(as.character(ali1@subject))) / + nchar(as.character(ali1@pattern)) +# ... which should be the same as reported in the writePairwiseAlignments() +# output. Awkward to type? Then it calls for a function: +# +percentID <- function(al) { + # returns the percent-identity of a Biostrings alignment object + return(100 * + sum(seqinr::s2c(as.character(al@pattern)) == + seqinr::s2c(as.character(al@subject))) / + nchar(as.character(al@pattern))) +} + +percentID(ali1) + +# == 2.2 Optimal local alignment =========================================== + +# Compare with local optimal alignment (like EMBOSS Water) +ali2 <- Biostrings::pairwiseAlignment( + aaMBP1_SACCE, + aaMBP1_MYSPE, + type = "local", + substitutionMatrix = "BLOSUM62", + gapOpening = 50, + gapExtension = 10) + +Biostrings::writePairwiseAlignments(ali2) +# This has probably only aligned the N-terminal DNA binding domain - but that +# one has quite high sequence identity: +percentID(ali2) + +# == TASK: == + +# Compare the two alignments. I have weighted the local alignment heavily +# towards an ungapped alignment by setting very high gap penalties. Try changing +# the gap penalties and see what happens: how does the number of indels change, +# how does the length of indels change... + + +# = 3 APSES Domain annotation by alignment ================================ + +# In this section we define the MYSPE APSES sequence by performing a global, +# optimal sequence alignment of the yeast APSES domain with the full length +# protein sequence of the protein that was the most similar to the yeast APSES +# domain. +# + +# I have annotated the yeast APSES domain as a feature in the +# database. To view the annotation, we can retrieve it via the proteinID and +# featureID. Here is the yeast protein ID: +(proID <- myDB$protein$ID[myDB$protein$name == "MBP1_SACCE"]) + + +# ... and if you look at the feature table, you can identify the feature ID +(ftrID <- myDB$feature$ID[myDB$feature$name == "APSES fold"]) + +# ... and with the two annotations we can get the corresponding ID from the +# annotation table +(fanID <- myDB$annotation$ID[myDB$annotation$proteinID == proID & + myDB$annotation$featureID == ftrID]) + +myDB$annotation[myDB$annotation$ID == proID & + myDB$annotation$ID == ftrID, ] + +# The annotation record contains the start and end coordinates which we can use +# to define the APSES domain sequence with a substr() expression. + +(start <- myDB$annotation$start[myDB$annotation$ID == fanID]) +(end <- myDB$annotation$end[myDB$annotation$ID == fanID]) +(apses <- substr(myDB$protein$sequence[myDB$protein$ID == proID], + start, + end)) + +# Lots of code. But don't get lost. Let's recapitulate what we have done: we +# have selected from the sequence column of the protein table the sequence whose +# name is "MBP1_SACCE", and selected from the annotation table the start +# and end coordinates of the annotation that joins an "APSES fold" feature with +# the sequence, and used the start and end coordinates to extract a substring. + +# Let's convert this to an AAstring and assign it: +aaMB1_SACCE_APSES <- Biostrings::AAString(apses) + +# Now let's align these two sequences of very different length without end-gap +# penalties using the "overlap" type. "overlap" turns the +# end-gap penalties off and that is crucially important since +# the sequences have very different length. + +aliApses <- Biostrings::pairwiseAlignment( + aaMB1_SACCE_APSES, + aaMBP1_MYSPE, + type = "overlap", + substitutionMatrix = "BLOSUM62", + gapOpening = 10, + gapExtension = 0.5) + +# Inspect the result. The aligned sequences should be clearly +# homologous, and have (almost) no indels. The entire "pattern" +# sequence from QIYSAR ... to ... KPLFDF should be matched +# with the "query". Is this correct? +Biostrings::writePairwiseAlignments(aliApses) + +# If this is correct, you can extract the matched sequence from +# the alignment object. The syntax is a bit different from what +# you have seen before: this is an "S4 object", not a list. No +# worries: as.character() returns a normal string. +as.character(aliApses@subject) + +# Now, what are the aligned start and end coordinates? You can read them from +# the output of writePairwiseAlignments(), or you can get them from the range of +# the match. + +str(aliApses@subject@range) + +# start is: +aliApses@subject@range@start + +# ... and end is: +aliApses@subject@range@start + aliApses@subject@range@width - 1 + + +# = 4 Update your database script ========================================= + + +# Since we have this feature defined now, we can create a feature annotation +# right away and store it in myDB. + +# == 4.1 Preparing an annotation file ... ================================== +# +# === 4.1.1 If you HAVE NOT done the BIN-FUNC-Annotation unit +# +# +# You DON'T already have a file called "-Annotations.json" in the +# ./myScripts/ directory: +# +# - Make a copy of the file "./data/refAnnotations.json" and put it in your +# myScripts/ directory. +# +# - Give it a name that is structured like "-Annotations.json" - e.g. +# if MYSPE is called "Crptycoccus neoformans", your file should be called +# "CRYNE-Annotations.json" (and the "name" of your Mbp1 orthologue is +# "MBP1_CRYNE"). +# +# - Open the file in the RStudio editor and delete all blocks for +# the Mbp1 protein annotations except the first one. +# +# - From that block, delete all lines except for the line that says: +# +# {"pName" : "MBP1_SACCE", "fName" : "APSES fold", "start" : "4", "end" : "102"}, +# +# - Then delete the comma at the end of the line (your file will just have +# this one annotation). +# +# - Edit that annotation: change MBP1_SACCE to MBP1_ and change the +# "start" and "end" features to the coordinates you just discovered for the +# APSES domain in your sequence. +# +# - Save the file in your myScripts/ directory +# +## - Validate your file online at https://jsonlint.com/ +# +# - Update your "./myScripts/makeProteinDB.R" script to load your new +# annotation when you recreate the database. Open the script in the +# RStudio editor, and add the following command at the end: +# +# myDB <- dbAddAnnotation(myDB, +# jsonlite::fromJSON("./myScripts/-Annotations.json")) +# ^^^^^^^ +# edit this! +# - save and close the file. +# +# Then SKIP the next section. +# +# +# === 4.1.2 If you HAVE done the BIN-FUNC-Annotation unit +# +# +# You DO already have a file called "-Annotations.json" in the +# ./myScripts/ directory: +# +# - Open the file in the RStudio editor. +# +# - Below the last feature lines (but before the closing "]") add the +# following feature line (without the "#") +# +# {"pName" : "MBP1_SACCE", "fName" : "APSES fold", "start" : "4", "end" : "102"} +# +# - Edit that annotation: change MBP1_SACCE to MBP1_ and change the +# "start" and "end" features to the coordinates you just discovered for the +# APSES domain in your sequence. +# +# - Add a comma after the preceding feature line. +# +# - Save your file. +# +# - Validate your file online at https://jsonlint.com/ +# +# +# == 4.2 Execute and Validate ============================================== +# +# - source() your database creation script: +# +# source("./myScripts/makeProteinDB.R") +# +# This should run without errors or warnings. If it doesn't work and you +# can't figure out quickly what's happening, ask on the mailing list for +# help. +# +# - Confirm +# The following commands should retrieve the correct start and end +# coordinates and sequence of the MBP1_MYSPE APSES domain: + +sel <- which(myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "")) + +(proID <- myDB$protein$ID[sel]) +(ftrID <- myDB$feature$ID[myDB$feature$name == "APSES fold"]) +(fanID <- myDB$annotation$ID[myDB$annotation$proteinID == proID & + myDB$annotation$featureID == ftrID]) +(start <- myDB$annotation$start[myDB$annotation$ID == fanID]) +(end <- myDB$annotation$end[myDB$annotation$ID == fanID]) +(apses <- substr(myDB$protein$sequence[myDB$protein$ID == proID], + start, + end)) + + +# [END] diff --git a/BIN-ALI-Similarity.R b/BIN-ALI-Similarity.R index 2af180e..6fcf204 100644 --- a/BIN-ALI-Similarity.R +++ b/BIN-ALI-Similarity.R @@ -1,313 +1,313 @@ -# tocID <- "BIN-ALI-Similarity.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-ALI-Similarity unit. -# -# Version: 1.2 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Updates -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.0 Refactored for 2017; add aaindex, ternary plot. -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# Update ggtern:: ternary plot to use aacol dots under text -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ---------------------------------------------- -#TOC> 1 Amino Acid Properties 43 -#TOC> 2 Mutation Data matrix 189 -#TOC> 3 Background score 230 -#TOC> -#TOC> ========================================================================== - - -# = 1 Amino Acid Properties =============================================== - -# A large collection of amino acid property tables is available via the seqinr -# package: - -if (! requireNamespace("seqinr", quietly=TRUE)) { - install.packages("seqinr") -} -# Package information: -# library(help = seqinr) # basic information -# browseVignettes("seqinr") # available vignettes -# data(package = "seqinr") # available datasets - -# A true Labor of Love has gone into the compilation of the seqinr "aaindex" -# data: - -?aaindex -data(aaindex, package = "seqinr") # load the aaindex list from the package - -length(aaindex) - -# Here are all the index descriptions -for (i in 1:length(aaindex)) { - cat(paste(i, ": ", aaindex[[i]]$D, "\n", sep="")) -} - -# It's a bit cumbersome to search through the descriptions ... here is a -# function to make this easier: - -searchAAindex <- function(patt) { - # Searches the aaindex descriptions for regular expression "patt" - # and prints index number and description. - hits <- which(sapply(aaindex, function(x) length(grep(patt, x$D)) > 0)) - for (i in seq_along(hits)) { - cat(sprintf("%3d\t%s\n", hits[i], aaindex[[ hits[i] ]]$D)) - } -} - - -searchAAindex("free energy") # Search for "free energy" -searchAAindex("(size)|(volume)") # Search for "size" or "volume": - - - - -# Let's examine ... -# ... a hydrophobicity index -(Y <- aaindex[[528]][c("D", "I")]) - -# ... a volume index -(V <- aaindex[[150]][c("D", "I")]) - -# ... and one of our own: side-chain pK values as reported by -# Pace et al. (2009) JBC 284:13285-13289, with non-ionizable pKs set -# to 7.4 (physiological pH) -K <- list(I = c( 7.4, # Ala - 12.3, # Arg - 7.4, # Asn - 3.9, # Asp - 8.6, # Cys - 7.4, # Gln - 4.3, # Glu - 7.4, # Gly - 6.5, # His - 7.4, # Ile - 7.4, # Leu - 10.4, # Lys - 7.4, # Met - 7.4, # Phe - 7.4, # Pro - 7.4, # Ser - 7.4, # Thr - 7.4, # Trp - 9.8, # Tyr - 7.4)) # Val -names(K$I) <- c("Ala","Arg","Asn","Asp","Cys","Gln","Glu","Gly","His","Ile", - "Leu","Lys","Met","Phe","Pro","Ser","Thr","Trp","Tyr","Val") - - -# Given these biophysical indices, how similar are the amino acids? We have three-dimensions of measures here. Scatterplots can only display two dimensions ... - -# pull the names from Y$I, convert them to single letter code, and reorder the -# AACOLS palette accordingly ... -aac <- AACOLS[toupper(seqinr::a(names(Y$I)))] - -plot(Y$I, V$I, - xlab = "hydrophobicity", ylab = "volume", - pch = 21, - cex = 6, - col = aac, - bg = aac) -text(Y$I, V$I, names(Y$I), cex = 0.8) - -plot(Y$I, K$I, - xlab = "hydrophobicity", ylab = "pK", - pch = 21, - cex = 6, - col = aac, - bg = aac) -text(Y$I, K$I, names(Y$I), cex = 0.8) - -# ... but how do we plot 3D data? Plotting into a 3D cube is possible, but such -# plots are in general unintuitive and hard to interpret. One alternative is a -# so-called "ternary plot": - -if (! requireNamespace("ggtern", quietly=TRUE)) { - install.packages("ggtern") -} -# Package information: -# library(help = ggtern) # basic information -# browseVignettes("ggtern") # available vignettes -# data(package = "ggtern") # available datasets - - - -# collect into data frame, normalize to (0.05, 0.95) -myDat <- data.frame("phi" = 0.9*(((Y$I-min(Y$I))/(max(Y$I)-min(Y$I))))+0.05, - "vol" = 0.9*(((V$I-min(V$I))/(max(V$I)-min(V$I))))+0.05, - "pK" = 0.9*(((K$I-min(K$I))/(max(K$I)-min(K$I))))+0.05, - stringsAsFactors = FALSE) -rownames(myDat) <- names(Y$I) - -ggtern::ggtern(data = myDat, - ggplot2::aes(x = vol, - y = phi, - z = pK, - label = rownames(myDat))) + ggplot2::geom_text() - -# This results in a mapping of amino acids relative to each other that is -# similar to the Venn diagram you have seen in the notes. - -# ... or we could use principal components analysis, to pull out the -# best projection of the three feature dimensions into two. (Done here without delving -# into the theory ...) -prc <- prcomp(myDat) -plot(prc$x[,1], prc$x[,2], xlab="", ylab="", xaxt="n", yaxt="n", - pch=19, cex=6, col=aad, cex.main=0.7, - main="Principal Component Analysis of Amino Acid Features") -text(prc$x[,1], prc$x[,2], names(Y$I), cex = 0.8, col="#00000088") - -# This matches the intuition rather well in that "similar" amino acids are close -# on the plot. But we can't interpret the distances in terms of just one of the -# parameters. Whatever - nature has a different way to define similarity: -# mutations to similar amino acids are less likely to break the protein. - - -# = 2 Mutation Data matrix ================================================ - -# A mutation data matrix encodes all amino acid pairscores in a matrix. - -# The Biostrings package contains the most common mutation data matrices. - -if (! requireNamespace("BiocManager", quietly=TRUE)) { - install.packages("BiocManager") -} -if (! requireNamespace("Biostrings", quietly=TRUE)) { - BiocManager::install("Biostrings") -} -# Package information: -# library(help=Biostrings) # basic information -# browseVignettes("Biostrings") # available vignettes -# data(package = "Biostrings") # available datasets - -# Let's attach the BLOSUM62 mutation data matrix from the package -data(BLOSUM62, package = "Biostrings") - -# ... and see what it contains. (You've seen this matrix before.) -BLOSUM62 - -# We can simply access values via the row/column names. -# Identical amino acids have high scores ... -BLOSUM62["H", "H"] # Score for a pair of two histidines -BLOSUM62["S", "S"] # Score for a pair of two serines - -# Similar amino acids have low positive scores ... -BLOSUM62["L", "I"] # Score for a leucine / lysine pair -BLOSUM62["F", "Y"] # etc. - -# Dissimilar amino acids have negative scores ... -BLOSUM62["L", "K"] # Score for a leucine / lysine pair -BLOSUM62["Q", "P"] # etc. - - -BLOSUM62["R", "W"] # the matrix is symmetric! -BLOSUM62["W", "R"] - - -# = 3 Background score ==================================================== - -# The mutation data matrix is designed to give high scores to homologous -# sequences, low scores to non-homologous sequences. What score on average -# should we expect for a random sequence? - -# If we sample amino acid pairs at random, we will get a score that is the -# average of the individual pairscores in the matrix. Omitting the ambiguity -# codes and the gap character: - -sum(BLOSUM62[1:20, 1:20])/400 - -# But that score could be higher for real sequences, for which the amino acid -# distribution is not random. For example membrane proteins have a large number -# of hydrophobic residues - an alignment of unrelated proteins might produce -# positive scores. And there are other proteins with biased amino acid -# compositions, in particular poteins that interact with multiple other -# proteins. Let's test how this impacts the background score by comparing a -# sequence with shuffled sequences. These have the same composition, but are -# obvioulsy not homologous. The data directory contains the FASTA file for the -# PDB ID 3FG7 - a villin headpiece structure with a large amount of -# low-complexity amino acid sequence ... - -aa3FG7 <- Biostrings::readAAStringSet("./data/3FG7.fa")[[1]] - -# ... and the FASTA file for the E. coli OmpG outer membrane porin (PDB: 2F1C) -# with an exceptionally high percentage of hydrophobic residues. - -aa2F1C <- Biostrings::readAAStringSet("./data/2F1C.fa")[[1]] - -# Here is a function that takes two sequences and -# returns their average pairscore. - -averagePairScore <- function(a, b, MDM = BLOSUM62) { - # Returns average pairscore of two sequences. - # Parameters: - # a, b chr amino acid sequence string - # MDM mutation data matrix. Default is BLOSUM62 - # Value: num average pairscore. - a <- unlist(strsplit(a, "")) - b <- unlist(strsplit(b, "")) - v <- 0 - for (i in seq_along(a)) { - v <- v + MDM[ a[i], b[i] ] - } - return(v / length(a)) -} - -orig3FG7 <- toString(aa3FG7) -orig2F1C <- toString(aa2F1C) -N <- 1000 -scores3FG7 <- numeric(N) -scores2F1C <- numeric(N) -for (i in 1:N) { - scores3FG7[i] <- averagePairScore(orig3FG7, toString(sample(aa3FG7))) - scores2F1C[i] <- averagePairScore(orig2F1C, toString(sample(aa2F1C))) -} - -# Plot the distributions -hist(scores3FG7, - col="#5599EE33", - breaks = seq(-1.5, 0, by=0.1), - main = "Pairscores for randomly shuffled sequences", - xlab = "Average pairscore from BLOSUM 62") -hist(scores2F1C, - col="#55EE9933", - breaks = seq(-1.5, 0, by=0.1), - add = TRUE) -abline(v = sum(BLOSUM62[1:20, 1:20])/400, col = "firebrick", lwd = 2) -legend('topright', - c("3FG7 (villin)", "2F1C (OmpG)"), - fill = c("#5599EE33", "#55EE9933"), bty = 'n', - inset = 0.1) - -# This is an important result: even though we have shuffled significantly biased -# sequences, and the average scores trend above the average of the mutation data -# matrix, the average scores still remain comfortably below zero. This means -# that we can't (in general) improve a high-scoring alignment by simply -# extending it with randomly matched residues. We will only improve the score if -# the similarity of newly added residues is larger than what we expect to get by -# random chance! - - -# [END] +# tocID <- "BIN-ALI-Similarity.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-ALI-Similarity unit. +# +# Version: 1.2 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Updates +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.0 Refactored for 2017; add aaindex, ternary plot. +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# Update ggtern:: ternary plot to use aacol dots under text +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ---------------------------------------------- +#TOC> 1 Amino Acid Properties 43 +#TOC> 2 Mutation Data matrix 189 +#TOC> 3 Background score 230 +#TOC> +#TOC> ========================================================================== + + +# = 1 Amino Acid Properties =============================================== + +# A large collection of amino acid property tables is available via the seqinr +# package: + +if (! requireNamespace("seqinr", quietly=TRUE)) { + install.packages("seqinr") +} +# Package information: +# library(help = seqinr) # basic information +# browseVignettes("seqinr") # available vignettes +# data(package = "seqinr") # available datasets + +# A true Labor of Love has gone into the compilation of the seqinr "aaindex" +# data: + +?aaindex +data(aaindex, package = "seqinr") # load the aaindex list from the package + +length(aaindex) + +# Here are all the index descriptions +for (i in 1:length(aaindex)) { + cat(paste(i, ": ", aaindex[[i]]$D, "\n", sep="")) +} + +# It's a bit cumbersome to search through the descriptions ... here is a +# function to make this easier: + +searchAAindex <- function(patt) { + # Searches the aaindex descriptions for regular expression "patt" + # and prints index number and description. + hits <- which(sapply(aaindex, function(x) length(grep(patt, x$D)) > 0)) + for (i in seq_along(hits)) { + cat(sprintf("%3d\t%s\n", hits[i], aaindex[[ hits[i] ]]$D)) + } +} + + +searchAAindex("free energy") # Search for "free energy" +searchAAindex("(size)|(volume)") # Search for "size" or "volume": + + + + +# Let's examine ... +# ... a hydrophobicity index +(Y <- aaindex[[528]][c("D", "I")]) + +# ... a volume index +(V <- aaindex[[150]][c("D", "I")]) + +# ... and one of our own: side-chain pK values as reported by +# Pace et al. (2009) JBC 284:13285-13289, with non-ionizable pKs set +# to 7.4 (physiological pH) +K <- list(I = c( 7.4, # Ala + 12.3, # Arg + 7.4, # Asn + 3.9, # Asp + 8.6, # Cys + 7.4, # Gln + 4.3, # Glu + 7.4, # Gly + 6.5, # His + 7.4, # Ile + 7.4, # Leu + 10.4, # Lys + 7.4, # Met + 7.4, # Phe + 7.4, # Pro + 7.4, # Ser + 7.4, # Thr + 7.4, # Trp + 9.8, # Tyr + 7.4)) # Val +names(K$I) <- c("Ala","Arg","Asn","Asp","Cys","Gln","Glu","Gly","His","Ile", + "Leu","Lys","Met","Phe","Pro","Ser","Thr","Trp","Tyr","Val") + + +# Given these biophysical indices, how similar are the amino acids? We have three-dimensions of measures here. Scatterplots can only display two dimensions ... + +# pull the names from Y$I, convert them to single letter code, and reorder the +# AACOLS palette accordingly ... +aac <- AACOLS[toupper(seqinr::a(names(Y$I)))] + +plot(Y$I, V$I, + xlab = "hydrophobicity", ylab = "volume", + pch = 21, + cex = 6, + col = aac, + bg = aac) +text(Y$I, V$I, names(Y$I), cex = 0.8) + +plot(Y$I, K$I, + xlab = "hydrophobicity", ylab = "pK", + pch = 21, + cex = 6, + col = aac, + bg = aac) +text(Y$I, K$I, names(Y$I), cex = 0.8) + +# ... but how do we plot 3D data? Plotting into a 3D cube is possible, but such +# plots are in general unintuitive and hard to interpret. One alternative is a +# so-called "ternary plot": + +if (! requireNamespace("ggtern", quietly=TRUE)) { + install.packages("ggtern") +} +# Package information: +# library(help = ggtern) # basic information +# browseVignettes("ggtern") # available vignettes +# data(package = "ggtern") # available datasets + + + +# collect into data frame, normalize to (0.05, 0.95) +myDat <- data.frame("phi" = 0.9*(((Y$I-min(Y$I))/(max(Y$I)-min(Y$I))))+0.05, + "vol" = 0.9*(((V$I-min(V$I))/(max(V$I)-min(V$I))))+0.05, + "pK" = 0.9*(((K$I-min(K$I))/(max(K$I)-min(K$I))))+0.05, + stringsAsFactors = FALSE) +rownames(myDat) <- names(Y$I) + +ggtern::ggtern(data = myDat, + ggplot2::aes(x = vol, + y = phi, + z = pK, + label = rownames(myDat))) + ggplot2::geom_text() + +# This results in a mapping of amino acids relative to each other that is +# similar to the Venn diagram you have seen in the notes. + +# ... or we could use principal components analysis, to pull out the +# best projection of the three feature dimensions into two. (Done here without delving +# into the theory ...) +prc <- prcomp(myDat) +plot(prc$x[,1], prc$x[,2], xlab="", ylab="", xaxt="n", yaxt="n", + pch=19, cex=6, col=aad, cex.main=0.7, + main="Principal Component Analysis of Amino Acid Features") +text(prc$x[,1], prc$x[,2], names(Y$I), cex = 0.8, col="#00000088") + +# This matches the intuition rather well in that "similar" amino acids are close +# on the plot. But we can't interpret the distances in terms of just one of the +# parameters. Whatever - nature has a different way to define similarity: +# mutations to similar amino acids are less likely to break the protein. + + +# = 2 Mutation Data matrix ================================================ + +# A mutation data matrix encodes all amino acid pairscores in a matrix. + +# The Biostrings package contains the most common mutation data matrices. + +if (! requireNamespace("BiocManager", quietly=TRUE)) { + install.packages("BiocManager") +} +if (! requireNamespace("Biostrings", quietly=TRUE)) { + BiocManager::install("Biostrings") +} +# Package information: +# library(help=Biostrings) # basic information +# browseVignettes("Biostrings") # available vignettes +# data(package = "Biostrings") # available datasets + +# Let's attach the BLOSUM62 mutation data matrix from the package +data(BLOSUM62, package = "Biostrings") + +# ... and see what it contains. (You've seen this matrix before.) +BLOSUM62 + +# We can simply access values via the row/column names. +# Identical amino acids have high scores ... +BLOSUM62["H", "H"] # Score for a pair of two histidines +BLOSUM62["S", "S"] # Score for a pair of two serines + +# Similar amino acids have low positive scores ... +BLOSUM62["L", "I"] # Score for a leucine / lysine pair +BLOSUM62["F", "Y"] # etc. + +# Dissimilar amino acids have negative scores ... +BLOSUM62["L", "K"] # Score for a leucine / lysine pair +BLOSUM62["Q", "P"] # etc. + + +BLOSUM62["R", "W"] # the matrix is symmetric! +BLOSUM62["W", "R"] + + +# = 3 Background score ==================================================== + +# The mutation data matrix is designed to give high scores to homologous +# sequences, low scores to non-homologous sequences. What score on average +# should we expect for a random sequence? + +# If we sample amino acid pairs at random, we will get a score that is the +# average of the individual pairscores in the matrix. Omitting the ambiguity +# codes and the gap character: + +sum(BLOSUM62[1:20, 1:20])/400 + +# But that score could be higher for real sequences, for which the amino acid +# distribution is not random. For example membrane proteins have a large number +# of hydrophobic residues - an alignment of unrelated proteins might produce +# positive scores. And there are other proteins with biased amino acid +# compositions, in particular poteins that interact with multiple other +# proteins. Let's test how this impacts the background score by comparing a +# sequence with shuffled sequences. These have the same composition, but are +# obvioulsy not homologous. The data directory contains the FASTA file for the +# PDB ID 3FG7 - a villin headpiece structure with a large amount of +# low-complexity amino acid sequence ... + +aa3FG7 <- Biostrings::readAAStringSet("./data/3FG7.fa")[[1]] + +# ... and the FASTA file for the E. coli OmpG outer membrane porin (PDB: 2F1C) +# with an exceptionally high percentage of hydrophobic residues. + +aa2F1C <- Biostrings::readAAStringSet("./data/2F1C.fa")[[1]] + +# Here is a function that takes two sequences and +# returns their average pairscore. + +averagePairScore <- function(a, b, MDM = BLOSUM62) { + # Returns average pairscore of two sequences. + # Parameters: + # a, b chr amino acid sequence string + # MDM mutation data matrix. Default is BLOSUM62 + # Value: num average pairscore. + a <- unlist(strsplit(a, "")) + b <- unlist(strsplit(b, "")) + v <- 0 + for (i in seq_along(a)) { + v <- v + MDM[ a[i], b[i] ] + } + return(v / length(a)) +} + +orig3FG7 <- toString(aa3FG7) +orig2F1C <- toString(aa2F1C) +N <- 1000 +scores3FG7 <- numeric(N) +scores2F1C <- numeric(N) +for (i in 1:N) { + scores3FG7[i] <- averagePairScore(orig3FG7, toString(sample(aa3FG7))) + scores2F1C[i] <- averagePairScore(orig2F1C, toString(sample(aa2F1C))) +} + +# Plot the distributions +hist(scores3FG7, + col="#5599EE33", + breaks = seq(-1.5, 0, by=0.1), + main = "Pairscores for randomly shuffled sequences", + xlab = "Average pairscore from BLOSUM 62") +hist(scores2F1C, + col="#55EE9933", + breaks = seq(-1.5, 0, by=0.1), + add = TRUE) +abline(v = sum(BLOSUM62[1:20, 1:20])/400, col = "firebrick", lwd = 2) +legend('topright', + c("3FG7 (villin)", "2F1C (OmpG)"), + fill = c("#5599EE33", "#55EE9933"), bty = 'n', + inset = 0.1) + +# This is an important result: even though we have shuffled significantly biased +# sequences, and the average scores trend above the average of the mutation data +# matrix, the average scores still remain comfortably below zero. This means +# that we can't (in general) improve a high-scoring alignment by simply +# extending it with randomly matched residues. We will only improve the score if +# the similarity of newly added residues is larger than what we expect to get by +# random chance! + + +# [END] diff --git a/BIN-Data_integration.R b/BIN-Data_integration.R index c5e9dc5..0097472 100644 --- a/BIN-Data_integration.R +++ b/BIN-Data_integration.R @@ -1,216 +1,216 @@ -# tocID <- "BIN-Data_integration.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-Data_integration unit. -# -# Version: 1.2 -# -# Date: 2018-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Maintenance and updates -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.0.1 Bugfix: UniProt ID Mapping service API change -# 1.0 First live version -# -# -# TODO: -# Develop a fungi-specific BioMart example. -# (cf. -# https://cran.r-project.org/web/packages/biomartr/vignettes/Functional_Annotation.html ) -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------- -#TOC> 1 Identifier mapping 42 -#TOC> 2 Cross-referencing tables 165 -#TOC> -#TOC> ========================================================================== - - -# = 1 Identifier mapping ================================================== - -# UniProt provides a well-designed ID mapping tool that can be accessed -# online at http://www.uniprot.org/mapping/ -# -# Here we will use the UniProt Web API for this tool to map identifiers. The -# UniProt ID mapping service supports a "RESTful API": responses can be obtained -# simply via a Web- browsers request. Such requests are commonly sent via the -# GET or POST verbs that a Webserver responds to, when a client asks for data. -# GET requests are visible in the URL of the request; POST requests are not -# directly visible, they are commonly used to send the contents of forms, or -# when transmitting larger, complex data items. The UniProt ID mapping sevice -# can accept long lists of IDs, thus using the POST mechanism makes sense. GET() -# and POST() functions are part of the httr package. - -# To begin, we load httr, which supports sending and receiving data via the -# http protocol, just like a Web browser. -if (! requireNamespace("httr", quietly=TRUE)) { - install.packages("httr") -} -# Package information: -# library(help = httr) # basic information -# browseVignettes("httr") # available vignettes -# data(package = "httr") # available datasets - - -# We will walk through the process with the refSeqID -# of yeast Mbp1 and Swi4, and we will also enter a dummy ID to check what -# happens if the ID can't be mapped: -myQueryIDs <- "NP_010227 NP_00000 NP_011036" - - -# The UniProt ID mapping service API is very straightforward to use: just define -# the URL of the server and send a list of items labelled as "query" in the body -# of the request. GET() and POST() are functions from httr. - -# Note. A recent bug in the interaction between the server expectations and the -# curl client libraries requires the following initialization -httr::set_config(httr::config(http_version = 0)) -# cf. https://stackoverflow.com/questions/44610845/stream-error-in-the-http-2-framing-layer-bigrquery-commands-error-in-r-studio-b - - -URL <- "https://www.uniprot.org/mapping/" -response <- httr::POST(URL, - body = list(from = "P_REFSEQ_AC", # Refseq Protein - to = "ACC", # UniProt ID - format = "tab", - query = myQueryIDs)) - -cat(httr::content(response)) - -# We need to check the status code - if it is not 200, an error ocurred and we -# can't process the result: -httr::status_code(response) - -# If the query is successful, tabbed text is returned. We can assign that to a -# data frame. Note that we use textConnection() to read data directly from a char object, which can go in the spot where read.delim() expects a file-name argument. - -myMappedIDs <- read.delim(file = textConnection(httr::content(response)), - sep = "\t", - stringsAsFactors = FALSE) -myMappedIDs - -# If this works as expected, you should see: -# From To -# 1 NP_010227 P39678 -# 2 NP_011036 P25302 -# -# ... and note that there are only two entries, because nothing was returned -# for the dummy "RefSeq ID" NP_00000 - -# If the query can't be fulfilled because of a problem with the server, a -# WebPage is returned. But the server status is also returned and we can check -# the status code. I have lately gotten many "503" status codes: Server Not -# Available... - -# We wrap this into a function: - -myIDmap <- function (s, mapFrom = "P_REFSEQ_AC", mapTo = "ACC") { - # Use UniProt ID mapping service to map one or more IDs - # Parameters: - # s char A string of separated IDs - # mapFrom char the database in which the IDs in s are valid. Default - # is RefSeq protein - # mapTo char the database in which the target IDs are valid. Default - # is UniProtKB - # Value - # a data frame of mapped IDs, with column names From and To, or an - # empty data frame if the mapping was unsuccessful. No rows are returned - # for IDs that are not mapped. - - # Initialize curl - httr::set_config(httr::config(http_version = 0)) - - URL <- "https://www.uniprot.org/uploadlists/" - response <- httr::POST(URL, - body = list(from = mapFrom, - to = mapTo, - format = "tab", - query = s)) - - if (httr::status_code(response) == 200) { # 200: oK - myMap <- read.delim(file = textConnection(httr::content(response)), - sep = "\t", - stringsAsFactors = FALSE) - colnames(myMap) <- c("From", "To") - } else { - myMap <- data.frame() - warning(paste("No uniProt ID mapping returned:", - "server sent status", - httr::status_code(response))) - } - - return(myMap) -} - -# Try it out ... -myIDmap("NP_010227 NP_011036 NP_012881 NP_013729 NP_012165") - -# A function UniProtIDmap() is in the ABC-dbUtilities.R script and it is loaded -# into your workspace on startup. - - -# = 2 Cross-referencing tables ============================================ - -# Sometimes we get the IDs we need to map in a large table, e.g. from a list of -# genes in a model organism database such as SGD, or from the Human Genen -# Nomenclature commission. How do we map one set of identifiers to another one? - -# The function to use is match(). -# Here is a tiny set of identifiers taken from a much larger table to -# illustrate the principle: -# - -myIDs <- data.frame(uID = c("P38903", "P31383", "P47177", "P47096", "Q07747", - "Q08641", "P47129", "P52910", "P00330", "P81450"), - name = c("2A5D", "2AAA", "2NDP", "3HAO", "AAD4", - "AB140", "ACF4", "ACS2", "ADH1", "ATP18"), - refID = c("NP_014657", "NP_009386", - "NP_012683", "NP_012559", - "NP_010038", "NP_014882", - "NP_012616", "NP_013254", - "NP_014555", "NP_013629")) - -myIDs - -# Say we want to map "NP_010038", "NP_012559", and "NP_013629", in that order to -# their gene names. -myQuery <- c("NP_010038", "NP_999999", "NP_013629") - -# %in% will only tell us if these IDs are present in the table: -myQuery %in% myIDs$refID - -# ... but not where they are located. But match() does what we need here: -match(myQuery, myIDs$refID) - -# ... and we can use the result to subset the column that we want to map to: -myIDs$name[match(myQuery, myIDs$refID)] - -# Note that the output preserves the NA - i.e. the length of the mapped -# values is exactly the same as the length of the query. - -# task: map the three genes to their UniProt Identifier. - - -# -# Note: if you want to do very many queries in very large tables, use the -# fmatch() function in the "fastmatch" package for a considerable -# speedup. - - - - -# [END] +# tocID <- "BIN-Data_integration.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-Data_integration unit. +# +# Version: 1.2 +# +# Date: 2018-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Maintenance and updates +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.0.1 Bugfix: UniProt ID Mapping service API change +# 1.0 First live version +# +# +# TODO: +# Develop a fungi-specific BioMart example. +# (cf. +# https://cran.r-project.org/web/packages/biomartr/vignettes/Functional_Annotation.html ) +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------- +#TOC> 1 Identifier mapping 42 +#TOC> 2 Cross-referencing tables 165 +#TOC> +#TOC> ========================================================================== + + +# = 1 Identifier mapping ================================================== + +# UniProt provides a well-designed ID mapping tool that can be accessed +# online at http://www.uniprot.org/mapping/ +# +# Here we will use the UniProt Web API for this tool to map identifiers. The +# UniProt ID mapping service supports a "RESTful API": responses can be obtained +# simply via a Web- browsers request. Such requests are commonly sent via the +# GET or POST verbs that a Webserver responds to, when a client asks for data. +# GET requests are visible in the URL of the request; POST requests are not +# directly visible, they are commonly used to send the contents of forms, or +# when transmitting larger, complex data items. The UniProt ID mapping sevice +# can accept long lists of IDs, thus using the POST mechanism makes sense. GET() +# and POST() functions are part of the httr package. + +# To begin, we load httr, which supports sending and receiving data via the +# http protocol, just like a Web browser. +if (! requireNamespace("httr", quietly=TRUE)) { + install.packages("httr") +} +# Package information: +# library(help = httr) # basic information +# browseVignettes("httr") # available vignettes +# data(package = "httr") # available datasets + + +# We will walk through the process with the refSeqID +# of yeast Mbp1 and Swi4, and we will also enter a dummy ID to check what +# happens if the ID can't be mapped: +myQueryIDs <- "NP_010227 NP_00000 NP_011036" + + +# The UniProt ID mapping service API is very straightforward to use: just define +# the URL of the server and send a list of items labelled as "query" in the body +# of the request. GET() and POST() are functions from httr. + +# Note. A recent bug in the interaction between the server expectations and the +# curl client libraries requires the following initialization +httr::set_config(httr::config(http_version = 0)) +# cf. https://stackoverflow.com/questions/44610845/stream-error-in-the-http-2-framing-layer-bigrquery-commands-error-in-r-studio-b + + +URL <- "https://www.uniprot.org/mapping/" +response <- httr::POST(URL, + body = list(from = "P_REFSEQ_AC", # Refseq Protein + to = "ACC", # UniProt ID + format = "tab", + query = myQueryIDs)) + +cat(httr::content(response)) + +# We need to check the status code - if it is not 200, an error ocurred and we +# can't process the result: +httr::status_code(response) + +# If the query is successful, tabbed text is returned. We can assign that to a +# data frame. Note that we use textConnection() to read data directly from a char object, which can go in the spot where read.delim() expects a file-name argument. + +myMappedIDs <- read.delim(file = textConnection(httr::content(response)), + sep = "\t", + stringsAsFactors = FALSE) +myMappedIDs + +# If this works as expected, you should see: +# From To +# 1 NP_010227 P39678 +# 2 NP_011036 P25302 +# +# ... and note that there are only two entries, because nothing was returned +# for the dummy "RefSeq ID" NP_00000 + +# If the query can't be fulfilled because of a problem with the server, a +# WebPage is returned. But the server status is also returned and we can check +# the status code. I have lately gotten many "503" status codes: Server Not +# Available... + +# We wrap this into a function: + +myIDmap <- function (s, mapFrom = "P_REFSEQ_AC", mapTo = "ACC") { + # Use UniProt ID mapping service to map one or more IDs + # Parameters: + # s char A string of separated IDs + # mapFrom char the database in which the IDs in s are valid. Default + # is RefSeq protein + # mapTo char the database in which the target IDs are valid. Default + # is UniProtKB + # Value + # a data frame of mapped IDs, with column names From and To, or an + # empty data frame if the mapping was unsuccessful. No rows are returned + # for IDs that are not mapped. + + # Initialize curl + httr::set_config(httr::config(http_version = 0)) + + URL <- "https://www.uniprot.org/uploadlists/" + response <- httr::POST(URL, + body = list(from = mapFrom, + to = mapTo, + format = "tab", + query = s)) + + if (httr::status_code(response) == 200) { # 200: oK + myMap <- read.delim(file = textConnection(httr::content(response)), + sep = "\t", + stringsAsFactors = FALSE) + colnames(myMap) <- c("From", "To") + } else { + myMap <- data.frame() + warning(paste("No uniProt ID mapping returned:", + "server sent status", + httr::status_code(response))) + } + + return(myMap) +} + +# Try it out ... +myIDmap("NP_010227 NP_011036 NP_012881 NP_013729 NP_012165") + +# A function UniProtIDmap() is in the ABC-dbUtilities.R script and it is loaded +# into your workspace on startup. + + +# = 2 Cross-referencing tables ============================================ + +# Sometimes we get the IDs we need to map in a large table, e.g. from a list of +# genes in a model organism database such as SGD, or from the Human Genen +# Nomenclature commission. How do we map one set of identifiers to another one? + +# The function to use is match(). +# Here is a tiny set of identifiers taken from a much larger table to +# illustrate the principle: +# + +myIDs <- data.frame(uID = c("P38903", "P31383", "P47177", "P47096", "Q07747", + "Q08641", "P47129", "P52910", "P00330", "P81450"), + name = c("2A5D", "2AAA", "2NDP", "3HAO", "AAD4", + "AB140", "ACF4", "ACS2", "ADH1", "ATP18"), + refID = c("NP_014657", "NP_009386", + "NP_012683", "NP_012559", + "NP_010038", "NP_014882", + "NP_012616", "NP_013254", + "NP_014555", "NP_013629")) + +myIDs + +# Say we want to map "NP_010038", "NP_012559", and "NP_013629", in that order to +# their gene names. +myQuery <- c("NP_010038", "NP_999999", "NP_013629") + +# %in% will only tell us if these IDs are present in the table: +myQuery %in% myIDs$refID + +# ... but not where they are located. But match() does what we need here: +match(myQuery, myIDs$refID) + +# ... and we can use the result to subset the column that we want to map to: +myIDs$name[match(myQuery, myIDs$refID)] + +# Note that the output preserves the NA - i.e. the length of the mapped +# values is exactly the same as the length of the query. + +# task: map the three genes to their UniProt Identifier. + + +# +# Note: if you want to do very many queries in very large tables, use the +# fmatch() function in the "fastmatch" package for a considerable +# speedup. + + + + +# [END] diff --git a/BIN-FUNC-Domain_annotation.R b/BIN-FUNC-Domain_annotation.R index 018b056..11b5103 100644 --- a/BIN-FUNC-Domain_annotation.R +++ b/BIN-FUNC-Domain_annotation.R @@ -1,435 +1,435 @@ -# tocID <- "BIN-FUNC-Domain_annotation.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the BIN-FUNC-Domain_annotation unit. -# -# ============================================================================== -# Version: 1.4 -# -# Date: 2017-11 - 2020-10 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.4 Add code for shared data import from the Wiki -# 1.3 Add code for database export to JSON and instructions -# for uploading annotations to the Public Student Wiki page -# 1.2 Consistently: data in ./myScripts/ ; -# begin SHARING DATA section -# 1.1 2020 Updates -# 1.0 Live version 2017 -# 0.1 First code copied from 2016 material. -# -# TODO: -# Put the domain plot into a function -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> --------------------------------------------------------------------- -#TOC> 1 Update your database script 51 -#TOC> 1.1 Preparing an annotation file ... 58 -#TOC> 1.1.1 BEFORE "BIN-ALI-Optimal_sequence_alignment" 61 -#TOC> 1.1.2 AFTER "BIN-ALI-Optimal_sequence_alignment" 109 -#TOC> 1.2 Execute and Validate 136 -#TOC> 2 Plot Annotations 161 -#TOC> 3 SHARING DATA 287 -#TOC> 3.1 Post MBP1_MYSPE as JSON data 303 -#TOC> 3.2 Import shared MBP1_MYSPE from the Wiki 326 -#TOC> -#TOC> ========================================================================== - - -# = 1 Update your database script ========================================= - - -# Since you have recorded domain features at the SMART database, we can store -# the feature annotations in myDB ... - - -# == 1.1 Preparing an annotation file ... ================================== - - -# === 1.1.1 BEFORE "BIN-ALI-Optimal_sequence_alignment" -# -# IF YOU HAVE NOT YET COMPLETED THE BIN-ALI-OPTIMAL_SEQUENCE_ALIGNMENT UNIT: -# -# You DON'T already have a file called "-Annotations.json" in the -# ./myScripts/ directory: -# -# - Make a copy of the file "./data/refAnnotations.json" and put it in your -# myScripts/ directory. -# -# - Give it a name that is structured like "-Annotations.json" - e.g. -# if MYSPE is called "Crptycoccus neoformans", your file should be called -# "CRYNE-Annotations.json" (and the "name" of your Mbp1 orthologue is -# "MBP1_CRYNE"). -# -# - Open the file in the RStudio editor and delete all blocks for -# the Mbp1 protein annotations except the first one. -# -# - From that block, delete all lines that have annotations you did not -# find in SMART for MBP1_MYSPE. -# -# - Make enough copies of the "Ankyrin fold" and "low complexity" region -# lines to have a line for each feature you found. -# -# - Then delete the comma at the end of the last line. -# -# - Edit the annotations: change MBP1_SACCE to MBP1_ everywhere -# and change the "start" and "end" features to the coordinates you -# recorded in the SMART database. -# -# - Save your file in the ./myScripts/ folder. -# -# - Validate your file online at https://jsonlint.com/ -# -# - Update your "./myScripts/makeProteinDB.R" script to load your new -# annotation when you recreate the database. Open the script in the -# RStudio editor, and add the following command at the end: -# -# myDB <- dbAddAnnotation(myDB, -# jsonlite::fromJSON("./myScripts/-Annotations.json")) -# ^^^^^^^ -# edit this! -# -# - save and close the file. -# -# Then SKIP the next section. -# -# -# === 1.1.2 AFTER "BIN-ALI-Optimal_sequence_alignment" -# -# IF YOU HAVE ALREADY COMPLETED THE BIN-ALI-OPTIMAL_SEQUENCE_ALIGNMENT UNIT: -# -# You SHOULD have a file called "-Annotations.json" in the -# ./myScripts/ directory: -# -# - Open the file in the RStudio editor. -# -# - Make as many copies of the "APSES fold" line as you have found -# features in SMART. -# -# - Add a comma after every line except for the last one -# -# - Edit the annotations but include only features that are in the -# myDB$feature table. Check which features are in the database by executing -# -# myDB$feature$name -# -# - Update the "start" and "end" coordinates for each feature to the -# values you found. -# -# - Save your file. -# -# - Validate your file online at https://jsonlint.com/ -# -# -# == 1.2 Execute and Validate ============================================== -# -# - source() your database creation script: -# -# source("./myScripts/makeProteinDB.R") -# -# This should run without errors or warnings. If it doesn't work and you -# can't figure out quickly what's happening, ask for help on the -# Discussion Board. -# -# - Confirm -# The following commands should retrieve all of the features that have been -# annotated for MBP1_MYSPE - -sel <- myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "") - -(proID <- myDB$protein$ID[sel]) -(fanIDs <- myDB$annotation$ID[myDB$annotation$proteinID == proID]) -(ftrIDs <- unique(myDB$annotation$featureID[fanIDs])) -myDB$feature$name[ftrIDs] # This should list ALL of your annotated features - # (once). If not, consider what could have gone wrong - # and ask on the list if you have difficulties fixing - # it. - - -# = 2 Plot Annotations ==================================================== - -# In this section we will plot domain annotations as colored rectangles on a -# sequence, as an example of using the R plotting system for generic, data -# driven images. - -# We need a small utility function that draws the annotation boxes on a -# representation of sequence. It should accept the start and end coordinates, -# the y value where it should be plotted and the color of the box, and plot a -# rectangle using R's rect() function. - -drawBox <- function(xStart, xEnd, y, myCol, DELTA = 0.2) { - # Draw a box from xStart to xEnd at y, filled with colour myCol - # The height of the box is y +- DELTA - rect(xStart, (y - DELTA), xEnd, (y + DELTA), - border = "black", col = myCol) -} - -# test this: -plot(c(-1.5, 1.5), c(0, 0), type = "l") -drawBox(-1, 1, 0.0, "peachpuff") - -# Next, we define a function to plot annotations for one protein: the name of -# the protein, a horizontal grey line for its length, and all of its features. - -plotProtein <- function(DB, name, y) { - # DB: protein database - # name: the name of the protein in the database. - # y: height where to draw the plot - # - # Define colors: we create a vector of color values, one for - # each feature, and we give it names of the feature ID. Then we - # can easily get the color value from the feature name. - # A: make a vector of color values. The syntax may appear unusual - - # colorRampPalette() returns a function, and we simply append - # the parameter (number-of-features) without assigning the function - # to its own variable name. - ftrCol <- colorRampPalette(c("#f2003c", "#F0A200", "#f0ea00", - "#62C923", "#0A9A9B", "#1958C3", - "#8000D3", "#D0007F"), - space="Lab", - interpolate="linear")(nrow(DB$feature)) - # B: Features may overlap, so we make the colors transparent by setting - # their "alpha channel" to 1/3 (hex: 55) - ftrCol <- paste0(ftrCol, "55") - # C: we asssign names - names(ftrCol) <- DB$feature$ID - # E.g. color for the third feature: ftrCol[ DB$feature$ID[3] ] - - # find the row-index of the protein ID in the protein table of DB - iProtein <- which(DB$protein$name == name) - - # write the name of the protein - text(-30, y, adj=1, labels=name, cex=0.75 ) - - #draw a line from 0 to nchar(sequence-of-the-protein) - lines(c(0, nchar(DB$protein$sequence[iProtein])), c(y, y), - lwd=3, col="#999999") - - # get the rows of feature annotations for the protein - iFtr <- which(DB$annotation$proteinID == DB$protein$ID[iProtein]) - - # draw a colored box for each feature - for (i in iFtr) { - drawBox(DB$annotation$start[i], - DB$annotation$end[i], - y, - ftrCol[ DB$annotation$featureID[i] ]) - } -} - -# Plot each annotated protein: -# Get the rows of all unique annotated Mbp1 proteins in myDB - -iRows <- grep("^MBP1_", myDB$protein$name) - -# define the size of the plot-frame to accomodate all proteins -yMax <- length(iRows) * 1.1 -xMax <- max(nchar(myDB$protein$sequence[iRows])) * 1.1 # longest sequence - -# plot an empty frame -oPar <- par(mar = c(4.2, 0.1, 3, 0.1)) # save the current plot parameters and - # decrease margins -plot(1, 1, - xlim = c(-200, xMax + 100), - ylim = c(0, yMax), - type = "n", - axes = FALSE, - bty = "n", - main = "Mbp1 orthologue domain annotations", - xlab = "sequence position", - cex.axis = 0.8, - ylab="") -axis(1, at = seq(0, xMax, by = 100)) -myCol <- colorRampPalette(c("#f2003c", "#F0A200", - "#f0ea00", "#62C923", - "#0A9A9B", "#1958C3", - "#8000D3", "#D0007F"), - space="Lab", - interpolate="linear")(nrow(myDB$feature)) -myCol <- paste0(myCol, "55") -legend(xMax - 150, 7, - legend = myDB$feature$name, - cex = 0.7, - fill = myCol, - bty = "n") - -# Finally, iterate over all proteins and call plotProtein() -for (i in seq_along(iRows)) { - plotProtein(myDB, myDB$protein$name[iRows[i]], i) -} -par(oPar) # reset the plot parameters - - -# The plot shows what is variable and what is constant about the annotations in -# a group of related proteins. Your MBP1_MYSPE annotations should appear at the -# top. - -# Task: -# Put a copy of the plot into your journal and interpret it with respect -# to MBP1_MYSPE, i.e. and note what you learn about MBP1_MYSPE from the plot. - -# Task: -# It would be better to align the motif borders, at least approximately (not -# all proteins have all motifs). How would you go about doing that? - -# = 3 SHARING DATA ======================================================== - -# It's particularly interesting to compare such annotations across many -# homologous proteins. I have created a page on the Student Wiki () that you can -# edit, and then download the data from the entire class directly to your -# RStudio project. -# - -# I have provided a function that extracts all information that refers to a -# single protein from the database, and prints it out as well-formatted JSON, -# suitable to be pasted into our shareable Wiki-page. There is a fair amount of -# bookkeeping involved, but the code is not otherwise very enlightening so I -# will spare you the details - it's in "./scripts/ABC-dbUtilities.R" if you -# would want to have a look. - - -# == 3.1 Post MBP1_MYSPE as JSON data ====================================== - -# Task: -# ===== -# 1: Run the following code: - -cat("{{Vspace}}", - "", - "
",
-    dbProt2JSON(sprintf("MBP1_%s", biCode(MYSPE))),
-    "
", - "", - "", sep = "\n" -) - -# 2: Copy the entire output from the console. -# 3: Navigate to -# http://steipe.biochemistry.utoronto.ca/abc/students/index.php/Public -# ... edit the page, and paste your output at the top. -# 4: Save your edits. - - - -# == 3.2 Import shared MBP1_MYSPE from the Wiki ============================ - -# Once we have collected a number of protein annotations, we can access the -# Wiki-page and import the data into our database. The Wiki page is an html -# document with lots of MediaWiki specific stuff - but the contents we are -# interested in is enclosed in
 ... 
tags. These -# work like normal HTML
 tags, but we have defined a special class for them
-# to make it easy to parse out the contents we want. The rvest:: package in
-# combination with xml2:: provides us with all the tools we need for such
-# "Webscraping" of data....
-
-if (! requireNamespace("rvest", quietly=TRUE)) {
-  install.packages("rvest")
-}
-
-if (! requireNamespace("xml2", quietly=TRUE)) {
-  install.packages("xml2")
-}
-
-# Here's the process:
-# The URL is an "open" page on the student Wiki. Users that are not logged in
-# can view the contents, but you can only edit if you are logged in.
-myURL <- "http://steipe.biochemistry.utoronto.ca/abc/students/index.php/Public"
-
-# First thing is to retrieve the HTML from the url...
-x <- xml2::read_html(myURL)
-
-# This retrieves the page source, but that still needs to be parsed into its
-# logical elements. HTML is a subset of XML and such documents are structured as
-# trees, that have "nodes" which are demarcated with "tags". rvest::html_nodes()
-# parses out the document structure and then uses a so-called "xpath" expression
-# to select nodes we are interested in. Now, xpath is one of those specialized
-# languages of which there are a few more to learn than one would care for. You
-# MUST know how to format sprintf() expressions, and you SHOULD be competent
-# with regular expressions. But if you want to be really competent in your work,
-# basic HTML and CSS is required ... and enough knowledge about xpath to be able
-# to search on Stackoverflow for what you need for parsing data out of Web
-# documents...
-
-# The expression we use below is:
-#   - get any node anywhere in the tree ("//*") ...
-#   - that has a particular attribute("[@ ... ]").
-#   - The attribute we want is that the class of the node is "protein-data";
-#      that is the class we have defined for our 
 tags.
-# As a result of this selection, we get a list of pointers to the document tree.
-y <- rvest::html_nodes(x, xpath ='//*[@class="protein-data"]')
-
-# Next we fetch the actual payload - the text - from the tree:
-# rvest::html_text() gets the text from the list of pointers. The result is a
-# normal list of character strings.
-z <- rvest::html_text(y)
-
-# Finally we can iterate over the list, and add all proteins we don't already
-# have to our database. There may well be items that are rejected because they
-# are already present in the database - for example, unless somebody has
-# annotated new features, all of the features are already there. Don't worry -
-# that is intended; we don't want duplicate entries.
-
-for (thisJSON in z) {
-  thisData <- jsonlite::fromJSON(thisJSON)
-  if (! thisData$protein$name %in% myDB$protein$name) {
-    myDB <- dbAddProtein(myDB, thisData$protein)
-    myDB <- dbAddTaxonomy(myDB, thisData$taxonomy)
-    myDB <- dbAddFeature(myDB, thisData$feature)
-    myDB <- dbAddAnnotation(myDB, thisData$annotation)
-  }
-}
-
-# Finally, we can repeat our domain plot with the results - which now includes the shared proteins:
-
-iRows <- grep("^MBP1_", myDB$protein$name)
-yMax <- length(iRows) * 1.1
-xMax <- max(nchar(myDB$protein$sequence[iRows])) * 1.1  # longest sequence
-
-# plot an empty frame
-oPar <- par(mar = c(4.2, 0.1, 3, 0.1))
-plot(1, 1,
-     xlim = c(-200, xMax + 100),
-     ylim = c(0, yMax),
-     type = "n",
-     axes = FALSE,
-     bty = "n",
-     main = "Mbp1 orthologue domain annotations",
-     xlab = "sequence position",
-     cex.axis = 0.8,
-     ylab="")
-axis(1, at = seq(0, xMax, by = 100))
-myCol <- colorRampPalette(c("#f2003c", "#F0A200",
-                            "#f0ea00", "#62C923",
-                            "#0A9A9B", "#1958C3",
-                            "#8000D3", "#D0007F"),
-                          space="Lab",
-                          interpolate="linear")(nrow(myDB$feature))
-myCol <- paste0(myCol, "55")
-legend(xMax - 150, 7,
-       legend = myDB$feature$name,
-       cex = 0.7,
-       fill = myCol,
-       bty = "n")
-
-for (i in seq_along(iRows)) {
-  plotProtein(myDB, myDB$protein$name[iRows[i]], i)
-}
-par(oPar)  # reset the plot parameters
-
-# ... the more proteins we can compare, the more we learn about the
-# architectural principles of this family's domains.
-
-
-# [END]
+# tocID <- "BIN-FUNC-Domain_annotation.R"
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-FUNC-Domain_annotation unit.
+#
+# ==============================================================================
+# Version:  1.4
+#
+# Date:     2017-11  -  2020-10
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.4    Add code for shared data import from the Wiki
+#           1.3    Add code for database export to JSON and instructions
+#                  for uploading annotations to the Public Student Wiki page
+#           1.2    Consistently: data in ./myScripts/ ;
+#                    begin SHARING DATA section
+#           1.1    2020 Updates
+#           1.0    Live version 2017
+#           0.1    First code copied from 2016 material.
+#
+# TODO:
+#           Put the domain plot into a function
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                                                 Line
+#TOC> ---------------------------------------------------------------------
+#TOC>   1        Update your database script                             51
+#TOC>   1.1        Preparing an annotation file ...                      58
+#TOC>   1.1.1          BEFORE  "BIN-ALI-Optimal_sequence_alignment"      61
+#TOC>   1.1.2          AFTER "BIN-ALI-Optimal_sequence_alignment"       109
+#TOC>   1.2        Execute and Validate                                 136
+#TOC>   2        Plot Annotations                                       161
+#TOC>   3        SHARING DATA                                           287
+#TOC>   3.1        Post MBP1_MYSPE as JSON data                         303
+#TOC>   3.2        Import shared MBP1_MYSPE from the Wiki               326
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  Update your database script  =========================================
+
+
+# Since you have recorded domain features at the SMART database, we can store
+# the feature annotations in myDB ...
+
+
+# ==   1.1  Preparing an annotation file ...  ==================================
+
+
+# ===   1.1.1  BEFORE  "BIN-ALI-Optimal_sequence_alignment"
+#
+#   IF YOU HAVE NOT YET COMPLETED THE BIN-ALI-OPTIMAL_SEQUENCE_ALIGNMENT UNIT:
+#
+#   You DON'T already have a file called "-Annotations.json" in the
+#   ./myScripts/ directory:
+#
+#   - Make a copy of the file "./data/refAnnotations.json" and put it in your
+#     myScripts/ directory.
+#
+#   - Give it a name that is structured like "-Annotations.json" - e.g.
+#     if MYSPE is called "Crptycoccus neoformans", your file should be called
+#     "CRYNE-Annotations.json" (and the "name" of your Mbp1 orthologue is
+#     "MBP1_CRYNE").
+#
+#   - Open the file in the RStudio editor and delete all blocks for
+#     the Mbp1 protein annotations except the first one.
+#
+#   - From that block, delete all lines that have annotations you did not
+#     find in SMART for MBP1_MYSPE.
+#
+#   - Make enough copies of the "Ankyrin fold" and "low complexity" region
+#     lines to have a line for each feature you found.
+#
+#   - Then delete the comma at the end of the last line.
+#
+#   - Edit the annotations: change MBP1_SACCE  to MBP1_ everywhere
+#     and change the "start" and "end" features to the coordinates you
+#     recorded in the SMART database.
+#
+#   - Save your file in the ./myScripts/ folder.
+#
+#   - Validate your file online at https://jsonlint.com/
+#
+#   - Update your "./myScripts/makeProteinDB.R" script to load your new
+#     annotation when you recreate the database. Open the script in the
+#     RStudio editor, and add the following command at the end:
+#
+#     myDB <- dbAddAnnotation(myDB,
+#         jsonlite::fromJSON("./myScripts/-Annotations.json"))
+#                                         ^^^^^^^
+#                                        edit this!
+#
+#   - save and close the file.
+#
+# Then SKIP the next section.
+#
+#
+# ===   1.1.2  AFTER "BIN-ALI-Optimal_sequence_alignment"  
+#
+#   IF YOU HAVE ALREADY COMPLETED THE BIN-ALI-OPTIMAL_SEQUENCE_ALIGNMENT UNIT:
+#
+#   You SHOULD have a file called "-Annotations.json" in the
+#  ./myScripts/ directory:
+#
+#   - Open the file in the RStudio editor.
+#
+#   - Make as many copies of the "APSES fold" line as you have found
+#     features in SMART.
+#
+#   - Add a comma after every line except for the last one
+#
+#   - Edit the annotations but include only features that are in the
+#     myDB$feature table. Check which features are in the database by executing
+#
+#        myDB$feature$name
+#
+#   - Update the "start" and "end" coordinates for each feature to the
+#     values you found.
+#
+#   - Save your file.
+#
+#   - Validate your file online at https://jsonlint.com/
+#
+#
+# ==   1.2  Execute and Validate  ==============================================
+#
+#   - source() your database creation script:
+#
+#     source("./myScripts/makeProteinDB.R")
+#
+#     This should run without errors or warnings. If it doesn't work and you
+#     can't figure out quickly what's happening, ask for help on the
+#     Discussion Board.
+#
+#   - Confirm
+#     The following commands should retrieve all of the features that have been
+#     annotated for MBP1_MYSPE
+
+sel <- myDB$protein$name == paste("MBP1_", biCode(MYSPE), sep = "")
+
+(proID  <- myDB$protein$ID[sel])
+(fanIDs <- myDB$annotation$ID[myDB$annotation$proteinID == proID])
+(ftrIDs <- unique(myDB$annotation$featureID[fanIDs]))
+myDB$feature$name[ftrIDs] # This should list ALL of your annotated features
+                          # (once). If not, consider what could have gone wrong
+                          # and ask on the list if you have difficulties fixing
+                          # it.
+
+
+# =    2  Plot Annotations  ====================================================
+
+# In this section we will plot domain annotations as colored rectangles on a
+# sequence, as an example of using the R plotting system for generic, data
+# driven images.
+
+# We need a small utility function that draws the annotation boxes on a
+# representation of sequence. It should accept the start and end coordinates,
+# the y value where it should be plotted and the color of the box, and plot a
+# rectangle using R's rect() function.
+
+drawBox <- function(xStart, xEnd, y, myCol, DELTA = 0.2) {
+  # Draw a box from xStart to xEnd at y, filled with colour myCol
+  # The height of the box is y +- DELTA
+  rect(xStart, (y - DELTA), xEnd, (y + DELTA),
+       border = "black", col = myCol)
+}
+
+# test this:
+plot(c(-1.5, 1.5), c(0, 0), type = "l")
+drawBox(-1, 1, 0.0, "peachpuff")
+
+# Next, we define a function to plot annotations for one protein: the name of
+# the protein, a horizontal grey line for its length, and all of its features.
+
+plotProtein <- function(DB, name, y) {
+  # DB: protein database
+  # name: the name of the protein in the database.
+  # y: height where to draw the plot
+  #
+  # Define colors: we create a vector of color values, one for
+  # each feature, and we give it names of the feature ID. Then we
+  # can easily get the color value from the feature name.
+  # A: make a vector of color values. The syntax may appear unusual -
+  #    colorRampPalette() returns a function, and we simply append
+  #    the parameter (number-of-features) without assigning the function
+  #    to its own variable name.
+  ftrCol <- colorRampPalette(c("#f2003c", "#F0A200", "#f0ea00",
+                               "#62C923", "#0A9A9B", "#1958C3",
+                               "#8000D3", "#D0007F"),
+                             space="Lab",
+                             interpolate="linear")(nrow(DB$feature))
+  # B: Features may overlap, so we make the colors transparent by setting
+  #    their "alpha channel" to 1/3  (hex: 55)
+  ftrCol <- paste0(ftrCol, "55")
+  # C: we asssign names
+  names(ftrCol) <- DB$feature$ID
+  # E.g. color for the third feature: ftrCol[ DB$feature$ID[3] ]
+
+  # find the row-index of the protein ID in the protein table of DB
+  iProtein <- which(DB$protein$name == name)
+
+  # write the name of the protein
+  text(-30, y, adj=1, labels=name, cex=0.75 )
+
+  #draw a line from 0 to nchar(sequence-of-the-protein)
+  lines(c(0, nchar(DB$protein$sequence[iProtein])), c(y, y),
+        lwd=3, col="#999999")
+
+  # get the rows of feature annotations for the protein
+  iFtr <- which(DB$annotation$proteinID == DB$protein$ID[iProtein])
+
+  # draw a colored box for each feature
+  for (i in iFtr) {
+    drawBox(DB$annotation$start[i],
+            DB$annotation$end[i],
+            y,
+            ftrCol[ DB$annotation$featureID[i] ])
+  }
+}
+
+# Plot each annotated protein:
+# Get the rows of all unique annotated Mbp1 proteins in myDB
+
+iRows <- grep("^MBP1_", myDB$protein$name)
+
+# define the size of the plot-frame to accomodate all proteins
+yMax <- length(iRows) * 1.1
+xMax <- max(nchar(myDB$protein$sequence[iRows])) * 1.1  # longest sequence
+
+# plot an empty frame
+oPar <- par(mar = c(4.2, 0.1, 3, 0.1))  # save the current plot parameters and
+                                        # decrease margins
+plot(1, 1,
+     xlim = c(-200, xMax + 100),
+     ylim = c(0, yMax),
+     type = "n",
+     axes = FALSE,
+     bty = "n",
+     main = "Mbp1 orthologue domain annotations",
+     xlab = "sequence position",
+     cex.axis = 0.8,
+     ylab="")
+axis(1, at = seq(0, xMax, by = 100))
+myCol <- colorRampPalette(c("#f2003c", "#F0A200",
+                            "#f0ea00", "#62C923",
+                            "#0A9A9B", "#1958C3",
+                            "#8000D3", "#D0007F"),
+                          space="Lab",
+                          interpolate="linear")(nrow(myDB$feature))
+myCol <- paste0(myCol, "55")
+legend(xMax - 150, 7,
+       legend = myDB$feature$name,
+       cex = 0.7,
+       fill = myCol,
+       bty = "n")
+
+# Finally, iterate over all proteins and call plotProtein()
+for (i in seq_along(iRows)) {
+  plotProtein(myDB, myDB$protein$name[iRows[i]], i)
+}
+par(oPar)  # reset the plot parameters
+
+
+# The plot shows what is variable and what is constant about the annotations in
+# a group of related proteins. Your MBP1_MYSPE annotations should appear at the
+# top.
+
+# Task:
+#    Put a copy of the plot into your journal and interpret it with respect
+#    to MBP1_MYSPE, i.e. and note what you learn about MBP1_MYSPE from the plot.
+
+# Task:
+#    It would be better to align the motif borders, at least approximately (not
+#    all proteins have all motifs). How would you go about doing that?
+
+# =    3  SHARING DATA  ========================================================
+
+# It's particularly interesting to compare such annotations across many
+# homologous proteins. I have created a page on the Student Wiki () that you can
+# edit, and then download the data from the entire class directly to your
+# RStudio project.
+#
+
+# I have provided a function that extracts all information that refers to a
+# single protein from the database, and prints it out as well-formatted JSON,
+# suitable to be pasted into our shareable Wiki-page. There is a fair amount of
+# bookkeeping involved, but the code is not otherwise very enlightening so I
+# will spare you the details - it's in "./scripts/ABC-dbUtilities.R" if you
+# would want to have a look.
+
+
+# ==   3.1  Post MBP1_MYSPE as JSON data  ======================================
+
+# Task:
+# =====
+# 1: Run the following code:
+
+cat("{{Vspace}}",
+    "",
+    "
",
+    dbProt2JSON(sprintf("MBP1_%s", biCode(MYSPE))),
+    "
", + "", + "", sep = "\n" +) + +# 2: Copy the entire output from the console. +# 3: Navigate to +# http://steipe.biochemistry.utoronto.ca/abc/students/index.php/Public +# ... edit the page, and paste your output at the top. +# 4: Save your edits. + + + +# == 3.2 Import shared MBP1_MYSPE from the Wiki ============================ + +# Once we have collected a number of protein annotations, we can access the +# Wiki-page and import the data into our database. The Wiki page is an html +# document with lots of MediaWiki specific stuff - but the contents we are +# interested in is enclosed in
 ... 
tags. These +# work like normal HTML
 tags, but we have defined a special class for them
+# to make it easy to parse out the contents we want. The rvest:: package in
+# combination with xml2:: provides us with all the tools we need for such
+# "Webscraping" of data....
+
+if (! requireNamespace("rvest", quietly=TRUE)) {
+  install.packages("rvest")
+}
+
+if (! requireNamespace("xml2", quietly=TRUE)) {
+  install.packages("xml2")
+}
+
+# Here's the process:
+# The URL is an "open" page on the student Wiki. Users that are not logged in
+# can view the contents, but you can only edit if you are logged in.
+myURL <- "http://steipe.biochemistry.utoronto.ca/abc/students/index.php/Public"
+
+# First thing is to retrieve the HTML from the url...
+x <- xml2::read_html(myURL)
+
+# This retrieves the page source, but that still needs to be parsed into its
+# logical elements. HTML is a subset of XML and such documents are structured as
+# trees, that have "nodes" which are demarcated with "tags". rvest::html_nodes()
+# parses out the document structure and then uses a so-called "xpath" expression
+# to select nodes we are interested in. Now, xpath is one of those specialized
+# languages of which there are a few more to learn than one would care for. You
+# MUST know how to format sprintf() expressions, and you SHOULD be competent
+# with regular expressions. But if you want to be really competent in your work,
+# basic HTML and CSS is required ... and enough knowledge about xpath to be able
+# to search on Stackoverflow for what you need for parsing data out of Web
+# documents...
+
+# The expression we use below is:
+#   - get any node anywhere in the tree ("//*") ...
+#   - that has a particular attribute("[@ ... ]").
+#   - The attribute we want is that the class of the node is "protein-data";
+#      that is the class we have defined for our 
 tags.
+# As a result of this selection, we get a list of pointers to the document tree.
+y <- rvest::html_nodes(x, xpath ='//*[@class="protein-data"]')
+
+# Next we fetch the actual payload - the text - from the tree:
+# rvest::html_text() gets the text from the list of pointers. The result is a
+# normal list of character strings.
+z <- rvest::html_text(y)
+
+# Finally we can iterate over the list, and add all proteins we don't already
+# have to our database. There may well be items that are rejected because they
+# are already present in the database - for example, unless somebody has
+# annotated new features, all of the features are already there. Don't worry -
+# that is intended; we don't want duplicate entries.
+
+for (thisJSON in z) {
+  thisData <- jsonlite::fromJSON(thisJSON)
+  if (! thisData$protein$name %in% myDB$protein$name) {
+    myDB <- dbAddProtein(myDB, thisData$protein)
+    myDB <- dbAddTaxonomy(myDB, thisData$taxonomy)
+    myDB <- dbAddFeature(myDB, thisData$feature)
+    myDB <- dbAddAnnotation(myDB, thisData$annotation)
+  }
+}
+
+# Finally, we can repeat our domain plot with the results - which now includes the shared proteins:
+
+iRows <- grep("^MBP1_", myDB$protein$name)
+yMax <- length(iRows) * 1.1
+xMax <- max(nchar(myDB$protein$sequence[iRows])) * 1.1  # longest sequence
+
+# plot an empty frame
+oPar <- par(mar = c(4.2, 0.1, 3, 0.1))
+plot(1, 1,
+     xlim = c(-200, xMax + 100),
+     ylim = c(0, yMax),
+     type = "n",
+     axes = FALSE,
+     bty = "n",
+     main = "Mbp1 orthologue domain annotations",
+     xlab = "sequence position",
+     cex.axis = 0.8,
+     ylab="")
+axis(1, at = seq(0, xMax, by = 100))
+myCol <- colorRampPalette(c("#f2003c", "#F0A200",
+                            "#f0ea00", "#62C923",
+                            "#0A9A9B", "#1958C3",
+                            "#8000D3", "#D0007F"),
+                          space="Lab",
+                          interpolate="linear")(nrow(myDB$feature))
+myCol <- paste0(myCol, "55")
+legend(xMax - 150, 7,
+       legend = myDB$feature$name,
+       cex = 0.7,
+       fill = myCol,
+       bty = "n")
+
+for (i in seq_along(iRows)) {
+  plotProtein(myDB, myDB$protein$name[iRows[i]], i)
+}
+par(oPar)  # reset the plot parameters
+
+# ... the more proteins we can compare, the more we learn about the
+# architectural principles of this family's domains.
+
+
+# [END]
diff --git a/BIN-FUNC-Semantic_similarity.R b/BIN-FUNC-Semantic_similarity.R
index 632468c..592cc89 100644
--- a/BIN-FUNC-Semantic_similarity.R
+++ b/BIN-FUNC-Semantic_similarity.R
@@ -1,169 +1,169 @@
-# tocID <- "BIN-FUNC-Semantic_similarity.R"
-#
-# Purpose:  A Bioinformatics Course:
-#              R code accompanying the BIN-FUNC_Semantic_similarity unit.
-#
-# Version:  1.2
-#
-# Date:     2017-11  -  2020-09
-# Author:   Boris Steipe (boris.steipe@utoronto.ca)
-#
-# Versions:
-#           1.2    2020 Maintenance
-#           1.1    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#                      use Biocmanager:: not biocLite()
-#           1.0    New code.
-#
-#
-# TODO:
-#
-#
-# == DO NOT SIMPLY  source()  THIS FILE! =======================================
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-# going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC> 
-#TOC>   Section  Title                                                Line
-#TOC> --------------------------------------------------------------------
-#TOC>   1        Preparations: Packages, AnnotationDB, Setup            43
-#TOC>   2        Fetch GO Annotations                                  100
-#TOC>   3        Semantic Similarities                                 109
-#TOC>   4        GO Term Enrichment in Gene Sets                       127
-#TOC> 
-#TOC> ==========================================================================
-
-
-# =    1  Preparations: Packages, AnnotationDB, Setup  =========================
-
-if (! requireNamespace("BiocManager", quietly = TRUE)) {
-  install.packages("BiocManager")
-}
-
-# GOSim is an R-package in the Bioconductor project.
-if (! requireNamespace("GOSim", quietly = TRUE)) {
-  BiocManager::install("GOSim")
-}
-# Package information:
-#  library(help = GOSim)       # basic information
-#  browseVignettes("GOSim")    # available vignettes
-#  data(package = "GOSim")     # available datasets
-
-# GOSim makes extensive assumptions about loaded packages, and many base
-# methods are masked. We will thus use library(GOSim) to load it
-# in its entirety and with all packages it depends on. We will still use
-# the ::() syntax in the code below, but this now serves
-# more of a didactic purpose, rather than actual syntax requirements.
-
-library(GOSim)
-
-# GOSim loads human annotations in  org.Hs.eg.db  by default. We load yeast
-# annotations instead...
-if (! requireNamespace("org.Sc.sgd.db", quietly = TRUE)) {
-  BiocManager::install("org.Sc.sgd.db")
-}
-
-# Bioconductor annotation packages won't work stably unless we actually load
-# them:
-library(org.Sc.sgd.db)
-
-# org.Sc.sgd.db is a Bioconductor annotation database curated by SGD. Such
-# databases exist for all model organisms. It's a kind of a fancy data frame
-# from which we can get annotations by rows (genes) with the keys() funtion ...
-AnnotationDbi::keys(org.Sc.sgd.db)[1500:1510]
-
-# ... and the types of available annotations with the columns() function
-AnnotationDbi::columns(org.Sc.sgd.db)
-
-# Note that one of the columns is "GO" ... and we load that into the
-# datastructures used by GOSim:
-
-# Choose GOterms to use
-GOSim::setEvidenceLevel(evidences = "all",
-                        organism = org.Sc.sgdORGANISM,
-                        gomap = org.Sc.sgdGO)
-
-# Use Biological Process ontology
-GOSim::setOntology("BP", loadIC = FALSE)
-
-# confirm that we loaded the correct ontology
-head(get("gomap", envir = GOSimEnv))
-
-
-
-# =    2  Fetch GO Annotations  ================================================
-
-
-# All keys being used here are yeast systematic names.
-
-# Get one set of annotations
-GOSim::getGOInfo(c("YDL056W"))  # Mbp1
-
-
-# =    3  Semantic Similarities  ===============================================
-
-
-# Get semantic similarities between genes
-?getGeneSim
-
-# There are _many_ different metrics of term similarity implemented
-# in this package.
-
-                                                         # Mbp1 and...
-GOSim::getGeneSim("YDL056W","YLR182W",similarity = "OA") # Swi6 - MCB complex
-GOSim::getGeneSim("YDL056W","YER111C",similarity = "OA") # Swi4 - collaborators
-GOSim::getGeneSim("YDL056W","YBR160W",similarity = "OA") # Cdc28 - mediator
-GOSim::getGeneSim("YDL056W","YGR108W",similarity = "OA") # Clb1 - antagonist
-GOSim::getGeneSim("YDL056W","YLR079W",similarity = "OA") # Sic1 - antagonist
-GOSim::getGeneSim("YDL056W","YJL130C",similarity = "OA") # Pgk1 - Gluconeogenesis
-
-
-# =    4  GO Term Enrichment in Gene Sets  =====================================
-
-
-# Calculating GO term enrichment in gene sets is done with the Bioconductor
-# topGO package.
-if (! requireNamespace("topGO", quietly = TRUE)) {
-  BiocManager::install("topGO")
-}
-# Package information:
-#  library(help = topGO)       # basic information
-#  browseVignettes("topGO")    # available vignettes
-#  data(package = "topGO")     # available datasets
-
-# Once again - assumptions are made by GOsim that require us to load the
-# topGO package wholesale:
-library(topGO)
-
-# Let's define a gene set: GOterm enrichment for G1/S switch activators:
-mySet <- c("YFR028C", # Cdc14
-           "YDL056W", # Mbp1
-           "YLR182W", # Swi6
-           "YER111C", # Swi4
-           "YOR083W", # Whi5
-           "YBR160W", # Cdc28
-           "YMR199W", # Cln1
-           "YPL256C", # Cln2
-           "YAL040C") # Cln3
-
-allGenes <- AnnotationDbi::keys(org.Sc.sgd.db)
-allGenes <- allGenes[grep("^Y", allGenes)]  # This is the context against which
-                                            # we define enrichment
-
-myEnr <- GOenrichment(mySet, allGenes)
-
-sort(myEnr$p.values)  # Any significantly enriched terms? All of these are ...
-
-#Most significantly enriched is GO:0071931. What is this?
-annotate::getGOTerm("GO:0071931")  # ... makes sense.
-
-
-
-
-# [END]
+# tocID <- "BIN-FUNC-Semantic_similarity.R"
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-FUNC_Semantic_similarity unit.
+#
+# Version:  1.2
+#
+# Date:     2017-11  -  2020-09
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.2    2020 Maintenance
+#           1.1    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#                      use Biocmanager:: not biocLite()
+#           1.0    New code.
+#
+#
+# TODO:
+#
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                                                Line
+#TOC> --------------------------------------------------------------------
+#TOC>   1        Preparations: Packages, AnnotationDB, Setup            43
+#TOC>   2        Fetch GO Annotations                                  100
+#TOC>   3        Semantic Similarities                                 109
+#TOC>   4        GO Term Enrichment in Gene Sets                       127
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  Preparations: Packages, AnnotationDB, Setup  =========================
+
+if (! requireNamespace("BiocManager", quietly = TRUE)) {
+  install.packages("BiocManager")
+}
+
+# GOSim is an R-package in the Bioconductor project.
+if (! requireNamespace("GOSim", quietly = TRUE)) {
+  BiocManager::install("GOSim")
+}
+# Package information:
+#  library(help = GOSim)       # basic information
+#  browseVignettes("GOSim")    # available vignettes
+#  data(package = "GOSim")     # available datasets
+
+# GOSim makes extensive assumptions about loaded packages, and many base
+# methods are masked. We will thus use library(GOSim) to load it
+# in its entirety and with all packages it depends on. We will still use
+# the ::() syntax in the code below, but this now serves
+# more of a didactic purpose, rather than actual syntax requirements.
+
+library(GOSim)
+
+# GOSim loads human annotations in  org.Hs.eg.db  by default. We load yeast
+# annotations instead...
+if (! requireNamespace("org.Sc.sgd.db", quietly = TRUE)) {
+  BiocManager::install("org.Sc.sgd.db")
+}
+
+# Bioconductor annotation packages won't work stably unless we actually load
+# them:
+library(org.Sc.sgd.db)
+
+# org.Sc.sgd.db is a Bioconductor annotation database curated by SGD. Such
+# databases exist for all model organisms. It's a kind of a fancy data frame
+# from which we can get annotations by rows (genes) with the keys() funtion ...
+AnnotationDbi::keys(org.Sc.sgd.db)[1500:1510]
+
+# ... and the types of available annotations with the columns() function
+AnnotationDbi::columns(org.Sc.sgd.db)
+
+# Note that one of the columns is "GO" ... and we load that into the
+# datastructures used by GOSim:
+
+# Choose GOterms to use
+GOSim::setEvidenceLevel(evidences = "all",
+                        organism = org.Sc.sgdORGANISM,
+                        gomap = org.Sc.sgdGO)
+
+# Use Biological Process ontology
+GOSim::setOntology("BP", loadIC = FALSE)
+
+# confirm that we loaded the correct ontology
+head(get("gomap", envir = GOSimEnv))
+
+
+
+# =    2  Fetch GO Annotations  ================================================
+
+
+# All keys being used here are yeast systematic names.
+
+# Get one set of annotations
+GOSim::getGOInfo(c("YDL056W"))  # Mbp1
+
+
+# =    3  Semantic Similarities  ===============================================
+
+
+# Get semantic similarities between genes
+?getGeneSim
+
+# There are _many_ different metrics of term similarity implemented
+# in this package.
+
+                                                         # Mbp1 and...
+GOSim::getGeneSim("YDL056W","YLR182W",similarity = "OA") # Swi6 - MCB complex
+GOSim::getGeneSim("YDL056W","YER111C",similarity = "OA") # Swi4 - collaborators
+GOSim::getGeneSim("YDL056W","YBR160W",similarity = "OA") # Cdc28 - mediator
+GOSim::getGeneSim("YDL056W","YGR108W",similarity = "OA") # Clb1 - antagonist
+GOSim::getGeneSim("YDL056W","YLR079W",similarity = "OA") # Sic1 - antagonist
+GOSim::getGeneSim("YDL056W","YJL130C",similarity = "OA") # Pgk1 - Gluconeogenesis
+
+
+# =    4  GO Term Enrichment in Gene Sets  =====================================
+
+
+# Calculating GO term enrichment in gene sets is done with the Bioconductor
+# topGO package.
+if (! requireNamespace("topGO", quietly = TRUE)) {
+  BiocManager::install("topGO")
+}
+# Package information:
+#  library(help = topGO)       # basic information
+#  browseVignettes("topGO")    # available vignettes
+#  data(package = "topGO")     # available datasets
+
+# Once again - assumptions are made by GOsim that require us to load the
+# topGO package wholesale:
+library(topGO)
+
+# Let's define a gene set: GOterm enrichment for G1/S switch activators:
+mySet <- c("YFR028C", # Cdc14
+           "YDL056W", # Mbp1
+           "YLR182W", # Swi6
+           "YER111C", # Swi4
+           "YOR083W", # Whi5
+           "YBR160W", # Cdc28
+           "YMR199W", # Cln1
+           "YPL256C", # Cln2
+           "YAL040C") # Cln3
+
+allGenes <- AnnotationDbi::keys(org.Sc.sgd.db)
+allGenes <- allGenes[grep("^Y", allGenes)]  # This is the context against which
+                                            # we define enrichment
+
+myEnr <- GOenrichment(mySet, allGenes)
+
+sort(myEnr$p.values)  # Any significantly enriched terms? All of these are ...
+
+#Most significantly enriched is GO:0071931. What is this?
+annotate::getGOTerm("GO:0071931")  # ... makes sense.
+
+
+
+
+# [END]
diff --git a/BIN-MYSPE.R b/BIN-MYSPE.R
index 7abe397..57267e4 100644
--- a/BIN-MYSPE.R
+++ b/BIN-MYSPE.R
@@ -1,351 +1,351 @@
-# tocID <- "BIN-MYSPE.R"
-#
-# Purpose: A Bioinformatics Course:
-#              R code accompanying the BIN-MYSPE unit
-#
-#
-# Version: 1.4
-#
-# Date:    2017-09 - 2021-10
-# Author:  Boris Steipe (boris.steipe@utoronto.ca)
-#
-# V 1.4    Add troubleshooting hints via errText[[...]]
-# V 1.3    2021 update of MYSPE mechanics; fix a bug no one had complained about
-# V 1.2    Reorganized proportional plot section into a "further reading"
-#          section, added nested-box, and sankey plot visualization of
-#          proportions. Introduced plotly.
-# V 1.1    2020 Workflow changes
-# V 1.0.1  Move ABC-makeMYSPElist.R to ./scripts directory
-# V 1.0    Final code, after rewriting BLAST parser and updating MYSPElist
-# V 0.1    First code copied from BCH441_A03_makeMYSPElist.R
-#
-# TODO:    Sample solution for sankey plot function.
-#
-#
-# == HOW TO WORK WITH LEARNING UNIT FILES ======================================
-#
-# DO NOT SIMPLY  source()  THESE FILES!
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-#  going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC> 
-#TOC>   Section  Title                                             Line
-#TOC> -----------------------------------------------------------------
-#TOC>   1        PREPARATIONS                                        52
-#TOC>   2        SUITABLE MYSPE SPECIES                              65
-#TOC>   3        ADOPT "MYSPE"                                       89
-#TOC>   4        FURTHER READING: PLOTTING PROPORTIONS              128
-#TOC>   4.1        Percentages                                      146
-#TOC>   4.2        Visualizing proportions: Pie chart               165
-#TOC>   4.3        Visualizing proportions: Nested squares          243
-#TOC>   4.4        Visualizing proportions: Sankey diagrams         280
-#TOC> 
-#TOC> ==========================================================================
-
-
-# =    1  PREPARATIONS  ========================================================
-#
-
-# Execute the two conditionals below:
-if (! file.exists("./myScripts/.myProfile.R")) {
-  stop(errText[["noProfileFile"]])     # message defined in .Rprofile
-}
-
-if (! exists("myStudentNumber")) {
-  stop(errText[["noStudentNumber"]])   # message defined in .Rprofile
-}
-
-
-# =    2  SUITABLE MYSPE SPECIES  ==============================================
-
-
-# In this unit we will select one species from a list of genome sequenced fungi
-# and write it into your personalized profile file. This species will be called
-# "MYSPE" (My Species) for other learning units and exercises.
-
-# A detailed description of the process of compiling the list of genome
-# sequenced fungi with protein annotations and Mbp1 homologues is in the file
-# ./scripts/ABC-makeMYSPElist.R  In brief, data for genome-sequenced fungi
-# was retrieved from https://fungi.ensembl.org; a search for homologues to
-# yeast Mbp1 was performed with BLAST at the NCBI, and the data was merged.
-# A representative organism at each genus-level was chosen from those hits
-# that actual;ly have a homologue. Finally, a mapping table was constructed to
-# asymmetrically retrieve unique species: a student number will retrieve
-# a species, but (public) knowledge of the species cannot reconstruct the
-# student number.
-
-# Task: Study ./scripts/ABC-makeMYSPElist.R, it implements a typical workflow
-#       of selecting and combining data from various data resources. Studying
-#       it will give you a better sense of how such workflows can be
-#       implemented in practice.
-
-
-# =    3  ADOPT "MYSPE"  =======================================================
-
-# Execute:
-( MYSPE <- getMYSPE(myStudentNumber) )
-
-# If this produced an error, this session has not been properly set up. You
-# may not yet have run  init()  and edited  .myProfile.R , or that file is not
-# in your  myScripts/  folder. Fix this, and execute:
-#
-#    source(".Rprofile") .
-
-# If this produced NA, your Student Number may not be correct, or you are not in
-# my class-list. Contact me. Otherwise, this should have printed a species name,
-# and the taxonomy ID of its genome-sequenced strain. This is your unique
-# speciesfor this course. Note it in your journal ...
-
-biCode(MYSPE) # and also note it's "BiCode" ...
-( myTaxID <- names(MYSPE) )  # and its taxID
-
-
-# Task:
-# =====
-#   Note down the species name and its five letter BiCode on your Student
-#   Wiki user page. Use this species whenever this or future assignments refer
-#   to MYSPE. Whenever you start a session, it will automatically be loaded
-#   from  myScripts/.myProfile.R  and is available as  MYSPE .
-
-# Here is some more information about MYSPE, taken from the table of genome-
-# sequenced fungi that is in your ./data folder.
-fungiDat <- read.csv("data/Species.csv")
-iMs <- which(fungiDat$Taxon.ID == myTaxID)
-
-( myOr <- fungiDat$Classification[iMs] )  # Taxonomic order
-( myGn <- gsub("\\s.*", "", MYSPE))       # Taxonomic genus
-( mySt <- fungiDat$Name[iMs] )            # Taxonomic strain
-
-# That's all.
-
-
-# =    4  FURTHER READING: PLOTTING PROPORTIONS  ===============================
-
-# The material below is an exploration of data-preparation and plotting
-# techniques; you can treat this as additional practice and further reading and
-# I expect that some of the code and plotting examples may be useful in a
-# different context.
-
-# A frequent task is to visualize the proportion of elements with given
-# categories in a sample. For example, we might ask what the proportion of the
-# different orders of fungi is the order of MYSPE? Let's first collect the
-# numbers.
-
-( nFungi <- nrow(fungiDat) )                            # sequenced fungi
-( nOrder <- sum(grepl(myOr, fungiDat$Classification)) ) # same order as MYSPE
-( nGenus <- sum(grepl(myGn, fungiDat$Name)) )           # same genus as MYSPE
-( nSpecies <- sum(grepl(MYSPE, fungiDat$Name)) )        # same species as MYSPE
-
-
-# ==   4.1  Percentages  =======================================================
-
-# The zeroth-order approach to visualization is simply to print percentages:
-
-cat(sprintf("\n%s comprise %5.2f%% of fungi.",
-        myOr,
-        (nOrder * 100) / nFungi))
-
-# ... or, adding the actual numbers:
-
-cat(sprintf("\n%s comprise %5.2f%% of fungi (%d of %d).",
-            myOr,
-            (nOrder * 100) / nFungi,
-            nOrder,
-            nFungi))
-
-# But that's hard to visualize for most of us, and anyway, we don't know how
-# that relates to other orders.
-
-# ==   4.2  Visualizing proportions: Pie chart  ================================
-
-# Often, we will use a pie chart instead. Pie charts are rather informal types
-# of plots, not well suited for analysis. But easy to do:
-
-# Define four colors to identify the four categories
-pCol <- c("#ed394e", "#ff9582", "#ffd5c4", "#f2f2f0")
-
-oPar <- par(mar = c(0.1, 0.1, 2.5, 0.1))   # set margins to ~ 0
-                                           # and remember the
-                                           # previous setting
-
-pie(c(nSpecies,                            # subtract numbers since these
-      nGenus - nSpecies,                   # categories are mutually contained
-      nOrder - nGenus - nSpecies,          # in each other
-      nFungi - nOrder - nGenus - nSpecies),
-      labels = "",
-      radius = 0.9,
-      main = "MYSPE in genome-sequenced fungi",
-      lty = 0,                             # turn borders for wedges off
-      col = pCol,
-      clockwise = TRUE,
-      init.angle = 90)
-
-title(main=MYSPE, line=0, cex.main=0.7)    # add a title to the plot
-
-legend(x = 0.95, y = 0.8,    # place at legend here
-       legend = c("Species", "Genus", "Order", "Fungi"),
-       y.intersp = 2,                      # line spacing for labels
-       cex = 0.8,                          # character size for labels
-       bty = "n",                          # "no" box around the legend
-       pt.cex = 2,                         # size of colour boxes
-       pch = 15,                           # a filled square
-       col = pCol)
-
-par(oPar)                                  # reset graphics state
-
-# Unless MYSPE is one of the frequently sequenced species, there will only be a
-# very thin wedge visible. Pie charts are not well suited to visualize small
-# proportions.
-
-# It is a little more useful if we have non-nested proportions - like the
-# number of species in the same order overall:
-
-myTbl <- sort(table(fungiDat$Classification), decreasing = TRUE)
-head(myTbl)
-
-# pie() does a reasonable job out of the box to interpret table() data:
-pie(myTbl)
-
-# ... we can improve this quickly with a bit of tweaking:
-
-N <- length(myTbl)
-sel <- myOr == names(myTbl) # TRUE for the MYSPE order, FALSE elsewhere
-
-myCol <- rep(pCol[4], N)       # N elements of pCol[1]
-myCol[sel] <- pCol[1]          # replace this one color
-
-myLbl <- rep("", N)            # N labels of ""
-myLbl[sel] <- myOr             # replace this one label with the MYSPE order
-
-
-oPar <- par(mar = c(0.1, 0.1, 2.5, 0.1))   # set margins to ~ 0
-
-pie(myTbl,
-    labels = myLbl,
-    radius = 0.9,
-    main = "MYSPE order",
-    border = "#DDDDDD",
-    col = myCol,
-    clockwise = TRUE,
-    init.angle = 90)
-
-par(oPar)                                  # reset graphics state
-
-# But the overall problem remains.
-
-
-# ==   4.3  Visualizing proportions: Nested squares  ===========================
-
-# A simple alternative is to draw such proportions as nested squares:
-
-x <- sqrt(nFungi)
-
-# set margins to ~ 0 and type to square
-oPar <- par(mar = c(0.1, 0.1, 0.1, 0.1), pty = "s")
-
-# empty, square plot
-plot(c(0, x), c(0, x), xlim = c(0, x), ylim = c(0, x),
-     type="n", axes=FALSE, xlab="", ylab="")
-
-# basic square for all genomes
-rect(0, 0, x,              x,              col = pCol[4])
-
-# grid
-u <- 0:floor(x)
-N <- length(u)
-segments(rep(0, N), u, rep(x, N), u, col = "#0000FF18")
-segments(u, rep(0, N), u, rep(x, N), col = "#0000FF18")
-# each square on this grid is one genome
-
-# colored squares
-rect(0, 0, sqrt(nOrder),   sqrt(nOrder),   col = pCol[3])
-rect(0, 0, sqrt(nGenus),   sqrt(nGenus),   col = pCol[2])
-rect(0, 0, sqrt(nSpecies), sqrt(nSpecies), col = pCol[1])
-
-# labels
-text(x/2, x/2,      "Fungi")
-text(x * 0.08, x * 0.11, myOr,   pos = 4, cex = 0.9)
-text(x * 0.08, x * 0.06, myGn,   pos = 4, cex = 0.8)
-text(x * 0.08, x * 0.02, MYSPE, pos = 4, cex = 0.7)
-
-par(oPar)                                  # reset graphics state
-
-
-# ==   4.4  Visualizing proportions: Sankey diagrams  ==========================
-
-# Sankey diagrams are an excellent way to visualize complicated nested
-# proportions and their changes (see here for example:
-# https://www.r-graph-gallery.com/sankey-diagram.html). Here is a very simple
-# example with the MYSPE proportions, as an illustration of the plotting
-# principle.
-
-if (! requireNamespace("plotly")) {
-  install.packages("plotly")
-}
-# Package information:
-#  library(help   = plotly)     # basic information
-#  browseVignettes("plotly")    # available vignettes
-#  data(package  = "plotly")    # available datasets
-
-# Here, we use the plotly package that wraps a very well developed javascript
-# library with many options for interactive plots. I am producing this plot
-# hard-coded for the sample organism "Sporothrix schenkii"; you would need
-# to change the code to adapt it to your own MYSPE - or even build a function
-# for this. Do try this if you have a bit of coding experience, sankey diagrams
-# are a good way to show hierarchical data relations - and if you get this
-# working for your own organism you can be proud that you have understood
-# how preparing the data works.
-
-
-myNodes <- list(label = c("Fungi (1014)",              # 0 <- node ID
-                          "Ophiostomatales (6)",       # 1
-                          "Other...",                  # 2
-                          "Sporothrix (4)",            # 3
-                          "Other...",                  # 4
-                          "Sporothrix schenckii (2)",  # 5
-                          "Other..."                   # 6
-                          ),
-                x = c(0.1, 0.4, 0.4, 0.7, 0.7, 1.0, 1.0),
-                y = c(0.3, 0.1, 0.7, 0.2, 0.7, 0.3, 0.7),
-                color = c("#f2f2f0", #
-                          "#ffd5c4",
-                          "#CCCCCC",
-                          "#ff9582",
-                          "#CCCCCC",
-                          "#ed394e",
-                          "#CCCCCC"
-                          ),
-                pad = 15,
-                thickness = 20,
-                line = list(color = "black",
-                            width = 0.5))
-
-myLinks <- list(source = c(0, 0, 1, 1, 3, 3),   # i.e. there is a link of
-                target = c(1, 2, 3, 4, 5, 6),   # weight 6 between node 0
-                value =  c(6, 18, 4, 2, 2, 2))  # and node 1
-
-# Setting up the actual plot ...
-fig  <-  plotly::plot_ly(type = "sankey",
-                         arrangement = "snap",
-                         orientation = "h",
-                         node = myNodes,
-                         link = myLinks)
-
-# Adding and adjusting a few layout parameters
-fig <- plotly::layout(fig,
-              title = "Fungi Genomes - Classification",
-              font = list(size = 10))
-
-fig     # plot the diagram
-
-# Note that the plot appears in the Viewer window, not the Plot window, and that
-# it is interactive: you can hover over nodes and links, and drag the nodes
-# around.
-
-# [END]
+# tocID <- "BIN-MYSPE.R"
+#
+# Purpose: A Bioinformatics Course:
+#              R code accompanying the BIN-MYSPE unit
+#
+#
+# Version: 1.4
+#
+# Date:    2017-09 - 2021-10
+# Author:  Boris Steipe (boris.steipe@utoronto.ca)
+#
+# V 1.4    Add troubleshooting hints via errText[[...]]
+# V 1.3    2021 update of MYSPE mechanics; fix a bug no one had complained about
+# V 1.2    Reorganized proportional plot section into a "further reading"
+#          section, added nested-box, and sankey plot visualization of
+#          proportions. Introduced plotly.
+# V 1.1    2020 Workflow changes
+# V 1.0.1  Move ABC-makeMYSPElist.R to ./scripts directory
+# V 1.0    Final code, after rewriting BLAST parser and updating MYSPElist
+# V 0.1    First code copied from BCH441_A03_makeMYSPElist.R
+#
+# TODO:    Sample solution for sankey plot function.
+#
+#
+# == HOW TO WORK WITH LEARNING UNIT FILES ======================================
+#
+# DO NOT SIMPLY  source()  THESE FILES!
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+#  going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                                             Line
+#TOC> -----------------------------------------------------------------
+#TOC>   1        PREPARATIONS                                        52
+#TOC>   2        SUITABLE MYSPE SPECIES                              65
+#TOC>   3        ADOPT "MYSPE"                                       89
+#TOC>   4        FURTHER READING: PLOTTING PROPORTIONS              128
+#TOC>   4.1        Percentages                                      146
+#TOC>   4.2        Visualizing proportions: Pie chart               165
+#TOC>   4.3        Visualizing proportions: Nested squares          243
+#TOC>   4.4        Visualizing proportions: Sankey diagrams         280
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  PREPARATIONS  ========================================================
+#
+
+# Execute the two conditionals below:
+if (! file.exists("./myScripts/.myProfile.R")) {
+  stop(errText[["noProfileFile"]])     # message defined in .Rprofile
+}
+
+if (! exists("myStudentNumber")) {
+  stop(errText[["noStudentNumber"]])   # message defined in .Rprofile
+}
+
+
+# =    2  SUITABLE MYSPE SPECIES  ==============================================
+
+
+# In this unit we will select one species from a list of genome sequenced fungi
+# and write it into your personalized profile file. This species will be called
+# "MYSPE" (My Species) for other learning units and exercises.
+
+# A detailed description of the process of compiling the list of genome
+# sequenced fungi with protein annotations and Mbp1 homologues is in the file
+# ./scripts/ABC-makeMYSPElist.R  In brief, data for genome-sequenced fungi
+# was retrieved from https://fungi.ensembl.org; a search for homologues to
+# yeast Mbp1 was performed with BLAST at the NCBI, and the data was merged.
+# A representative organism at each genus-level was chosen from those hits
+# that actual;ly have a homologue. Finally, a mapping table was constructed to
+# asymmetrically retrieve unique species: a student number will retrieve
+# a species, but (public) knowledge of the species cannot reconstruct the
+# student number.
+
+# Task: Study ./scripts/ABC-makeMYSPElist.R, it implements a typical workflow
+#       of selecting and combining data from various data resources. Studying
+#       it will give you a better sense of how such workflows can be
+#       implemented in practice.
+
+
+# =    3  ADOPT "MYSPE"  =======================================================
+
+# Execute:
+( MYSPE <- getMYSPE(myStudentNumber) )
+
+# If this produced an error, this session has not been properly set up. You
+# may not yet have run  init()  and edited  .myProfile.R , or that file is not
+# in your  myScripts/  folder. Fix this, and execute:
+#
+#    source(".Rprofile") .
+
+# If this produced NA, your Student Number may not be correct, or you are not in
+# my class-list. Contact me. Otherwise, this should have printed a species name,
+# and the taxonomy ID of its genome-sequenced strain. This is your unique
+# speciesfor this course. Note it in your journal ...
+
+biCode(MYSPE) # and also note it's "BiCode" ...
+( myTaxID <- names(MYSPE) )  # and its taxID
+
+
+# Task:
+# =====
+#   Note down the species name and its five letter BiCode on your Student
+#   Wiki user page. Use this species whenever this or future assignments refer
+#   to MYSPE. Whenever you start a session, it will automatically be loaded
+#   from  myScripts/.myProfile.R  and is available as  MYSPE .
+
+# Here is some more information about MYSPE, taken from the table of genome-
+# sequenced fungi that is in your ./data folder.
+fungiDat <- read.csv("data/Species.csv")
+iMs <- which(fungiDat$Taxon.ID == myTaxID)
+
+( myOr <- fungiDat$Classification[iMs] )  # Taxonomic order
+( myGn <- gsub("\\s.*", "", MYSPE))       # Taxonomic genus
+( mySt <- fungiDat$Name[iMs] )            # Taxonomic strain
+
+# That's all.
+
+
+# =    4  FURTHER READING: PLOTTING PROPORTIONS  ===============================
+
+# The material below is an exploration of data-preparation and plotting
+# techniques; you can treat this as additional practice and further reading and
+# I expect that some of the code and plotting examples may be useful in a
+# different context.
+
+# A frequent task is to visualize the proportion of elements with given
+# categories in a sample. For example, we might ask what the proportion of the
+# different orders of fungi is the order of MYSPE? Let's first collect the
+# numbers.
+
+( nFungi <- nrow(fungiDat) )                            # sequenced fungi
+( nOrder <- sum(grepl(myOr, fungiDat$Classification)) ) # same order as MYSPE
+( nGenus <- sum(grepl(myGn, fungiDat$Name)) )           # same genus as MYSPE
+( nSpecies <- sum(grepl(MYSPE, fungiDat$Name)) )        # same species as MYSPE
+
+
+# ==   4.1  Percentages  =======================================================
+
+# The zeroth-order approach to visualization is simply to print percentages:
+
+cat(sprintf("\n%s comprise %5.2f%% of fungi.",
+        myOr,
+        (nOrder * 100) / nFungi))
+
+# ... or, adding the actual numbers:
+
+cat(sprintf("\n%s comprise %5.2f%% of fungi (%d of %d).",
+            myOr,
+            (nOrder * 100) / nFungi,
+            nOrder,
+            nFungi))
+
+# But that's hard to visualize for most of us, and anyway, we don't know how
+# that relates to other orders.
+
+# ==   4.2  Visualizing proportions: Pie chart  ================================
+
+# Often, we will use a pie chart instead. Pie charts are rather informal types
+# of plots, not well suited for analysis. But easy to do:
+
+# Define four colors to identify the four categories
+pCol <- c("#ed394e", "#ff9582", "#ffd5c4", "#f2f2f0")
+
+oPar <- par(mar = c(0.1, 0.1, 2.5, 0.1))   # set margins to ~ 0
+                                           # and remember the
+                                           # previous setting
+
+pie(c(nSpecies,                            # subtract numbers since these
+      nGenus - nSpecies,                   # categories are mutually contained
+      nOrder - nGenus - nSpecies,          # in each other
+      nFungi - nOrder - nGenus - nSpecies),
+      labels = "",
+      radius = 0.9,
+      main = "MYSPE in genome-sequenced fungi",
+      lty = 0,                             # turn borders for wedges off
+      col = pCol,
+      clockwise = TRUE,
+      init.angle = 90)
+
+title(main=MYSPE, line=0, cex.main=0.7)    # add a title to the plot
+
+legend(x = 0.95, y = 0.8,    # place at legend here
+       legend = c("Species", "Genus", "Order", "Fungi"),
+       y.intersp = 2,                      # line spacing for labels
+       cex = 0.8,                          # character size for labels
+       bty = "n",                          # "no" box around the legend
+       pt.cex = 2,                         # size of colour boxes
+       pch = 15,                           # a filled square
+       col = pCol)
+
+par(oPar)                                  # reset graphics state
+
+# Unless MYSPE is one of the frequently sequenced species, there will only be a
+# very thin wedge visible. Pie charts are not well suited to visualize small
+# proportions.
+
+# It is a little more useful if we have non-nested proportions - like the
+# number of species in the same order overall:
+
+myTbl <- sort(table(fungiDat$Classification), decreasing = TRUE)
+head(myTbl)
+
+# pie() does a reasonable job out of the box to interpret table() data:
+pie(myTbl)
+
+# ... we can improve this quickly with a bit of tweaking:
+
+N <- length(myTbl)
+sel <- myOr == names(myTbl) # TRUE for the MYSPE order, FALSE elsewhere
+
+myCol <- rep(pCol[4], N)       # N elements of pCol[1]
+myCol[sel] <- pCol[1]          # replace this one color
+
+myLbl <- rep("", N)            # N labels of ""
+myLbl[sel] <- myOr             # replace this one label with the MYSPE order
+
+
+oPar <- par(mar = c(0.1, 0.1, 2.5, 0.1))   # set margins to ~ 0
+
+pie(myTbl,
+    labels = myLbl,
+    radius = 0.9,
+    main = "MYSPE order",
+    border = "#DDDDDD",
+    col = myCol,
+    clockwise = TRUE,
+    init.angle = 90)
+
+par(oPar)                                  # reset graphics state
+
+# But the overall problem remains.
+
+
+# ==   4.3  Visualizing proportions: Nested squares  ===========================
+
+# A simple alternative is to draw such proportions as nested squares:
+
+x <- sqrt(nFungi)
+
+# set margins to ~ 0 and type to square
+oPar <- par(mar = c(0.1, 0.1, 0.1, 0.1), pty = "s")
+
+# empty, square plot
+plot(c(0, x), c(0, x), xlim = c(0, x), ylim = c(0, x),
+     type="n", axes=FALSE, xlab="", ylab="")
+
+# basic square for all genomes
+rect(0, 0, x,              x,              col = pCol[4])
+
+# grid
+u <- 0:floor(x)
+N <- length(u)
+segments(rep(0, N), u, rep(x, N), u, col = "#0000FF18")
+segments(u, rep(0, N), u, rep(x, N), col = "#0000FF18")
+# each square on this grid is one genome
+
+# colored squares
+rect(0, 0, sqrt(nOrder),   sqrt(nOrder),   col = pCol[3])
+rect(0, 0, sqrt(nGenus),   sqrt(nGenus),   col = pCol[2])
+rect(0, 0, sqrt(nSpecies), sqrt(nSpecies), col = pCol[1])
+
+# labels
+text(x/2, x/2,      "Fungi")
+text(x * 0.08, x * 0.11, myOr,   pos = 4, cex = 0.9)
+text(x * 0.08, x * 0.06, myGn,   pos = 4, cex = 0.8)
+text(x * 0.08, x * 0.02, MYSPE, pos = 4, cex = 0.7)
+
+par(oPar)                                  # reset graphics state
+
+
+# ==   4.4  Visualizing proportions: Sankey diagrams  ==========================
+
+# Sankey diagrams are an excellent way to visualize complicated nested
+# proportions and their changes (see here for example:
+# https://www.r-graph-gallery.com/sankey-diagram.html). Here is a very simple
+# example with the MYSPE proportions, as an illustration of the plotting
+# principle.
+
+if (! requireNamespace("plotly")) {
+  install.packages("plotly")
+}
+# Package information:
+#  library(help   = plotly)     # basic information
+#  browseVignettes("plotly")    # available vignettes
+#  data(package  = "plotly")    # available datasets
+
+# Here, we use the plotly package that wraps a very well developed javascript
+# library with many options for interactive plots. I am producing this plot
+# hard-coded for the sample organism "Sporothrix schenkii"; you would need
+# to change the code to adapt it to your own MYSPE - or even build a function
+# for this. Do try this if you have a bit of coding experience, sankey diagrams
+# are a good way to show hierarchical data relations - and if you get this
+# working for your own organism you can be proud that you have understood
+# how preparing the data works.
+
+
+myNodes <- list(label = c("Fungi (1014)",              # 0 <- node ID
+                          "Ophiostomatales (6)",       # 1
+                          "Other...",                  # 2
+                          "Sporothrix (4)",            # 3
+                          "Other...",                  # 4
+                          "Sporothrix schenckii (2)",  # 5
+                          "Other..."                   # 6
+                          ),
+                x = c(0.1, 0.4, 0.4, 0.7, 0.7, 1.0, 1.0),
+                y = c(0.3, 0.1, 0.7, 0.2, 0.7, 0.3, 0.7),
+                color = c("#f2f2f0", #
+                          "#ffd5c4",
+                          "#CCCCCC",
+                          "#ff9582",
+                          "#CCCCCC",
+                          "#ed394e",
+                          "#CCCCCC"
+                          ),
+                pad = 15,
+                thickness = 20,
+                line = list(color = "black",
+                            width = 0.5))
+
+myLinks <- list(source = c(0, 0, 1, 1, 3, 3),   # i.e. there is a link of
+                target = c(1, 2, 3, 4, 5, 6),   # weight 6 between node 0
+                value =  c(6, 18, 4, 2, 2, 2))  # and node 1
+
+# Setting up the actual plot ...
+fig  <-  plotly::plot_ly(type = "sankey",
+                         arrangement = "snap",
+                         orientation = "h",
+                         node = myNodes,
+                         link = myLinks)
+
+# Adding and adjusting a few layout parameters
+fig <- plotly::layout(fig,
+              title = "Fungi Genomes - Classification",
+              font = list(size = 10))
+
+fig     # plot the diagram
+
+# Note that the plot appears in the Viewer window, not the Plot window, and that
+# it is interactive: you can hover over nodes and links, and drag the nodes
+# around.
+
+# [END]
diff --git a/BIN-PHYLO-Data_preparation.R b/BIN-PHYLO-Data_preparation.R
index 407faff..41a8369 100644
--- a/BIN-PHYLO-Data_preparation.R
+++ b/BIN-PHYLO-Data_preparation.R
@@ -1,234 +1,234 @@
-# tocID <- "BIN-PHYLO-Data_preparation.R"
-#
-# Purpose:  A Bioinformatics Course:
-#              R code accompanying the BIN-PHYLO-Data_preparation unit.
-#
-# Version:  1.2
-#
-# Date:     2017-10  -  2020-09
-# Author:   Boris Steipe (boris.steipe@utoronto.ca)
-#
-# Versions:
-#           1.2    2020 Maintenance
-#           1.1    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#                      use Biocmanager:: not biocLite()
-#           1.0    First 2017 version
-#           0.1    First code copied from 2016 material.
-#
-#
-# TODO:
-#
-#
-# == DO NOT SIMPLY  source()  THIS FILE! =======================================
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-# going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC> 
-#TOC>   Section  Title                                     Line
-#TOC> ---------------------------------------------------------
-#TOC>   1        Preparations                                45
-#TOC>   2        Fetching sequences                          77
-#TOC>   3        Multiple Sequence Alignment                118
-#TOC>   4        Reviewing and Editing Alignments           137
-#TOC>   4.1        Masking workflow                         153
-#TOC> 
-#TOC> ==========================================================================
-
-
-# =    1  Preparations  ========================================================
-
-
-# You need to reload your protein database, including changes that might have
-# been made to the reference files. If you have worked with the prerequiste
-# units, you should have a script named "makeProteinDB.R" that will create the
-# myDB object with a protein and feature database. Ask for advice if not.
-source("myScripts/makeProteinDB.R")
-
-# Load packages we need
-
-if (! requireNamespace("BiocManager", quietly = TRUE)) {
-  install.packages("BiocManager")
-}
-if (! requireNamespace("Biostrings", quietly = TRUE)) {
-  BiocManager::install("Biostrings")
-}
-# Package information:
-#  library(help = Biostrings)       # basic information
-#  browseVignettes("Biostrings")    # available vignettes
-#  data(package = "Biostrings")     # available datasets
-
-
-if (! requireNamespace("msa", quietly = TRUE)) {
-  BiocManager::install("msa")
-}
-# Package information:
-#  library(help = msa)       # basic information
-#  browseVignettes("msa")  # available vignettes
-#  data(package = "msa")   # available datasets
-
-
-# =    2  Fetching sequences  ==================================================
-
-
-# myDB contains the ten Mbp1 orthologues from the reference species and the Mbp1
-# RBM for MYSPE. We will construct a phylogenetic tree from the proteins' APSES
-# domains. You have annotated their ranges as a feature. The following code
-# retrieves the sequences from myDB. You have seen similar code in other units.
-
-sel <- grep("^MBP1_", myDB$protein$name)
-(proNames <- myDB$protein$name[sel])
-(proIDs <- myDB$protein$ID[sel])
-
-(sel <- myDB$feature$ID[myDB$feature$name == "APSES fold"])
-(fanIDs <- myDB$annotation$ID[myDB$annotation$proteinID %in% proIDs & # %in% !
-                              myDB$annotation$featureID == sel])      #  ==  !
-                                                                      # Why?
-APSI <- character(length(fanIDs))
-
-for (i in seq_along(fanIDs)) {
-  sel   <- myDB$annotation$ID == fanIDs[i]  # get the feature row index
-  proID <- myDB$annotation$proteinID[sel]   # get its protein ID
-  start <- myDB$annotation$start[sel]       # get start ...
-  end   <- myDB$annotation$end[sel]         # ... and end
-
-  sel <- myDB$protein$ID == proID           # get the protein row index ...
-                                            # ... and the sequence
-  APSI[i] <- substring(myDB$protein$sequence[sel], start, end)
-  names(APSI)[i] <- (myDB$protein$name[sel])
-}
-
-head(APSI)
-
-# Let's add the E.coli Kila-N domain sequence as an outgroup, for rooting our
-# phylogenetic tree (see the unit's Wiki page for details on the sequence).
-
-APSI <- c(APSI,
-"IDGEIIHLRAKDGYINATSMCRTAGKLLSDYTRLKTTQEFFDELSRDMGIPISELIQSFKGGRPENQGTWVHPDIAINLAQ")
-names(APSI)[length(APSI)] <- "KILA_ESCCO"
-tail(APSI)
-
-
-# =    3  Multiple Sequence Alignment  =========================================
-
-# This vector of sequences with named elements fulfills the requirements to be
-# imported as a Biostrings object - an AAStringSet - which we need as input for
-# the MSA algorithms in Biostrings.
-#
-
-APSESSet <- Biostrings::AAStringSet(APSI)
-APSESMsa <- msa::msaMuscle(APSESSet, order = "aligned")
-
-# Nb. msaMuscle() sometimes fails - reproducibly, but I am not sure why. If
-# that happens in your case, just use msaClustalOmega() instead.
-
-# inspect the alignment.
-writeALN(APSESMsa)
-
-# What do you think? Is this a good alignment for phylogenetic inference?
-
-
-# =    4  Reviewing and Editing Alignments  ====================================
-
-
-# Head back to the Wiki page for this unit and read up on the background
-# first.
-
-# Let's mask out all columns that have observations for
-# less than 1/3 of the sequences in the dataset. This
-# means they have more than round(nrow(msaSet) * (2/3))
-# hyphens in a column.
-#
-# We take all sequences, split them into single
-# characters, and put them into a matrix. Then we
-# go through the matrix, column by column and decide
-# whether we want to include that column.
-
-# ==   4.1  Masking workflow  ==================================================
-
-# get the length of the alignment
-(lenAli <- APSESMsa@unmasked@ranges@width[1])
-
-# initialize a matrix that can hold all characters
-# individually
-msaMatrix <- matrix(character(nrow(APSESMsa) * lenAli),
-                    ncol = lenAli)
-
-# assign the correct rownames
-rownames(msaMatrix) <- APSESMsa@unmasked@ranges@NAMES
-for (i in 1:nrow(APSESMsa)) {
-  msaMatrix[i, ] <- unlist(strsplit(as.character(APSESMsa@unmasked[i]), ""))
-}
-
-# inspect the result
-msaMatrix[1:7, 30:40]
-
-# Now let's make a logical vector with an element for each column that selects
-# which columns should be masked out.
-
-# The number of hyphens in a column is easy to count. Consider:
-
-    msaMatrix[ , 20]             # column 20
-    msaMatrix[ , 20] == "-"      # TRUE for all gap characters
-sum(msaMatrix[ , 20] == "-")     # adds 1 for each TRUE
-
-# Thus filling our logical vector is simple:
-
-# initialize a mask
-colMask <- logical(ncol(msaMatrix))
-
-# define the threshold for rejecting a column
-limit <- round(nrow(APSESMsa) * (2/3))
-
-# iterate over all columns, and write TRUE if there are less-or-equal to "limit"
-# hyphens, FALSE if there are more - i.e. TRUE columns will be used for analysis
-# and FALSE columns will be rejected.
-for (i in 1:ncol(msaMatrix)) {
-  count <- sum(msaMatrix[ , i] == "-")
-  colMask[i] <- count <= limit # TRUE if less-or-equal to limit, FALSE if not
-}
-
-# Inspect the mask
-colMask
-
-# How many positions are being kept?
-sum(colMask)
-
-cat(sprintf("We are masking %4.2f %% of alignment columns.\n",
-            100 * (1 - (sum(colMask) / length(colMask)))))
-
-
-# Next, we use colMask to remove the masked columns from the matrix
-# in one step:
-maskedMatrix <- msaMatrix[ , colMask]
-
-# check:
-ncol(maskedMatrix)
-
-# ... then collapse each row of single characters back into a string ...
-APSESphyloSet <- character()
-for (i in 1:nrow(maskedMatrix)) {
-  APSESphyloSet[i] <- paste(maskedMatrix[i, ], collapse="")
-}
-names(APSESphyloSet) <- rownames(maskedMatrix)
-
-# inspect ...
-writeALN(APSESphyloSet)
-
-# As you see, we have removed a three residue insertion from MBP1_NEUCR, and
-# several indels from the KILA_ESCCO outgroup sequence.
-
-
-# We save the aligned, masked domains to a file in the data/ directory,
-# in multi-FASTA format.
-writeMFA(APSESphyloSet, myCon = "data/APSESphyloSet.mfa")
-
-
-
-# [END]
+# tocID <- "BIN-PHYLO-Data_preparation.R"
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-PHYLO-Data_preparation unit.
+#
+# Version:  1.2
+#
+# Date:     2017-10  -  2020-09
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.2    2020 Maintenance
+#           1.1    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#                      use Biocmanager:: not biocLite()
+#           1.0    First 2017 version
+#           0.1    First code copied from 2016 material.
+#
+#
+# TODO:
+#
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                                     Line
+#TOC> ---------------------------------------------------------
+#TOC>   1        Preparations                                45
+#TOC>   2        Fetching sequences                          77
+#TOC>   3        Multiple Sequence Alignment                118
+#TOC>   4        Reviewing and Editing Alignments           137
+#TOC>   4.1        Masking workflow                         153
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  Preparations  ========================================================
+
+
+# You need to reload your protein database, including changes that might have
+# been made to the reference files. If you have worked with the prerequiste
+# units, you should have a script named "makeProteinDB.R" that will create the
+# myDB object with a protein and feature database. Ask for advice if not.
+source("myScripts/makeProteinDB.R")
+
+# Load packages we need
+
+if (! requireNamespace("BiocManager", quietly = TRUE)) {
+  install.packages("BiocManager")
+}
+if (! requireNamespace("Biostrings", quietly = TRUE)) {
+  BiocManager::install("Biostrings")
+}
+# Package information:
+#  library(help = Biostrings)       # basic information
+#  browseVignettes("Biostrings")    # available vignettes
+#  data(package = "Biostrings")     # available datasets
+
+
+if (! requireNamespace("msa", quietly = TRUE)) {
+  BiocManager::install("msa")
+}
+# Package information:
+#  library(help = msa)       # basic information
+#  browseVignettes("msa")  # available vignettes
+#  data(package = "msa")   # available datasets
+
+
+# =    2  Fetching sequences  ==================================================
+
+
+# myDB contains the ten Mbp1 orthologues from the reference species and the Mbp1
+# RBM for MYSPE. We will construct a phylogenetic tree from the proteins' APSES
+# domains. You have annotated their ranges as a feature. The following code
+# retrieves the sequences from myDB. You have seen similar code in other units.
+
+sel <- grep("^MBP1_", myDB$protein$name)
+(proNames <- myDB$protein$name[sel])
+(proIDs <- myDB$protein$ID[sel])
+
+(sel <- myDB$feature$ID[myDB$feature$name == "APSES fold"])
+(fanIDs <- myDB$annotation$ID[myDB$annotation$proteinID %in% proIDs & # %in% !
+                              myDB$annotation$featureID == sel])      #  ==  !
+                                                                      # Why?
+APSI <- character(length(fanIDs))
+
+for (i in seq_along(fanIDs)) {
+  sel   <- myDB$annotation$ID == fanIDs[i]  # get the feature row index
+  proID <- myDB$annotation$proteinID[sel]   # get its protein ID
+  start <- myDB$annotation$start[sel]       # get start ...
+  end   <- myDB$annotation$end[sel]         # ... and end
+
+  sel <- myDB$protein$ID == proID           # get the protein row index ...
+                                            # ... and the sequence
+  APSI[i] <- substring(myDB$protein$sequence[sel], start, end)
+  names(APSI)[i] <- (myDB$protein$name[sel])
+}
+
+head(APSI)
+
+# Let's add the E.coli Kila-N domain sequence as an outgroup, for rooting our
+# phylogenetic tree (see the unit's Wiki page for details on the sequence).
+
+APSI <- c(APSI,
+"IDGEIIHLRAKDGYINATSMCRTAGKLLSDYTRLKTTQEFFDELSRDMGIPISELIQSFKGGRPENQGTWVHPDIAINLAQ")
+names(APSI)[length(APSI)] <- "KILA_ESCCO"
+tail(APSI)
+
+
+# =    3  Multiple Sequence Alignment  =========================================
+
+# This vector of sequences with named elements fulfills the requirements to be
+# imported as a Biostrings object - an AAStringSet - which we need as input for
+# the MSA algorithms in Biostrings.
+#
+
+APSESSet <- Biostrings::AAStringSet(APSI)
+APSESMsa <- msa::msaMuscle(APSESSet, order = "aligned")
+
+# Nb. msaMuscle() sometimes fails - reproducibly, but I am not sure why. If
+# that happens in your case, just use msaClustalOmega() instead.
+
+# inspect the alignment.
+writeALN(APSESMsa)
+
+# What do you think? Is this a good alignment for phylogenetic inference?
+
+
+# =    4  Reviewing and Editing Alignments  ====================================
+
+
+# Head back to the Wiki page for this unit and read up on the background
+# first.
+
+# Let's mask out all columns that have observations for
+# less than 1/3 of the sequences in the dataset. This
+# means they have more than round(nrow(msaSet) * (2/3))
+# hyphens in a column.
+#
+# We take all sequences, split them into single
+# characters, and put them into a matrix. Then we
+# go through the matrix, column by column and decide
+# whether we want to include that column.
+
+# ==   4.1  Masking workflow  ==================================================
+
+# get the length of the alignment
+(lenAli <- APSESMsa@unmasked@ranges@width[1])
+
+# initialize a matrix that can hold all characters
+# individually
+msaMatrix <- matrix(character(nrow(APSESMsa) * lenAli),
+                    ncol = lenAli)
+
+# assign the correct rownames
+rownames(msaMatrix) <- APSESMsa@unmasked@ranges@NAMES
+for (i in 1:nrow(APSESMsa)) {
+  msaMatrix[i, ] <- unlist(strsplit(as.character(APSESMsa@unmasked[i]), ""))
+}
+
+# inspect the result
+msaMatrix[1:7, 30:40]
+
+# Now let's make a logical vector with an element for each column that selects
+# which columns should be masked out.
+
+# The number of hyphens in a column is easy to count. Consider:
+
+    msaMatrix[ , 20]             # column 20
+    msaMatrix[ , 20] == "-"      # TRUE for all gap characters
+sum(msaMatrix[ , 20] == "-")     # adds 1 for each TRUE
+
+# Thus filling our logical vector is simple:
+
+# initialize a mask
+colMask <- logical(ncol(msaMatrix))
+
+# define the threshold for rejecting a column
+limit <- round(nrow(APSESMsa) * (2/3))
+
+# iterate over all columns, and write TRUE if there are less-or-equal to "limit"
+# hyphens, FALSE if there are more - i.e. TRUE columns will be used for analysis
+# and FALSE columns will be rejected.
+for (i in 1:ncol(msaMatrix)) {
+  count <- sum(msaMatrix[ , i] == "-")
+  colMask[i] <- count <= limit # TRUE if less-or-equal to limit, FALSE if not
+}
+
+# Inspect the mask
+colMask
+
+# How many positions are being kept?
+sum(colMask)
+
+cat(sprintf("We are masking %4.2f %% of alignment columns.\n",
+            100 * (1 - (sum(colMask) / length(colMask)))))
+
+
+# Next, we use colMask to remove the masked columns from the matrix
+# in one step:
+maskedMatrix <- msaMatrix[ , colMask]
+
+# check:
+ncol(maskedMatrix)
+
+# ... then collapse each row of single characters back into a string ...
+APSESphyloSet <- character()
+for (i in 1:nrow(maskedMatrix)) {
+  APSESphyloSet[i] <- paste(maskedMatrix[i, ], collapse="")
+}
+names(APSESphyloSet) <- rownames(maskedMatrix)
+
+# inspect ...
+writeALN(APSESphyloSet)
+
+# As you see, we have removed a three residue insertion from MBP1_NEUCR, and
+# several indels from the KILA_ESCCO outgroup sequence.
+
+
+# We save the aligned, masked domains to a file in the data/ directory,
+# in multi-FASTA format.
+writeMFA(APSESphyloSet, myCon = "data/APSESphyloSet.mfa")
+
+
+
+# [END]
diff --git a/BIN-PHYLO-Tree_analysis.R b/BIN-PHYLO-Tree_analysis.R
index 3dabf5b..3e9da20 100644
--- a/BIN-PHYLO-Tree_analysis.R
+++ b/BIN-PHYLO-Tree_analysis.R
@@ -1,406 +1,406 @@
-# tocID <- "BIN-PHYLO-Tree_analysis.R"
-#
-# Purpose:  A Bioinformatics Course:
-#              R code accompanying the BIN-PHYLO-Tree_analysis unit.
-#
-# Version:  1.2
-#
-# Date:     2017-10  -  2020-09
-# Author:   Boris Steipe (boris.steipe@utoronto.ca)
-#
-# Versions:
-#           1.2    2020 updates. Deprecate iTol and use taxize:: instead.
-#                  Rewrite of tip re-ordering. Better handling of
-#                  messages. pBar() for randomization.
-#           1.1    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#                      use Biocmanager:: not biocLite()
-#           1.0.2  Typo in variable name, style changes
-#           1.0.1  Wrong section heading
-#           1.0    First 2017 version
-#           0.1    First code copied from 2016 material.
-#
-#
-# TODO:
-#
-#
-# == DO NOT SIMPLY  source()  THIS FILE! =======================================
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-# going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC> 
-#TOC>   Section  Title                              Line
-#TOC> --------------------------------------------------
-#TOC>   1        Preparation and Tree Plot            50
-#TOC>   2        SPECIES REFERENCE TREE               66
-#TOC>   3        Tree Analysis                       117
-#TOC>   3.1        Rooting Trees                     177
-#TOC>   3.2        Rotating Clades                   222
-#TOC>   3.3        Computing tree distances          309
-#TOC> 
-#TOC> ==========================================================================
-
-
-# =    1  Preparation and Tree Plot  ===========================================
-
-
-if (! requireNamespace("ape", quietly = TRUE)) {
-  install.packages("ape")
-}
-# Package information:
-#  library(help = ape)       # basic information
-#  browseVignettes("ape")    # available vignettes
-#  data(package = "ape")     # available datasets
-
-# We change the graphics parameters from time to time, let's define the
-# default so we can recreate a sane state:
-dev.off()
-PAR <- par()
-
-# =    2  SPECIES REFERENCE TREE  ==============================================
-
-# Before we do any kind of phylogenetic analysis of genes from several species,
-# we MUST have a reference tree of the taxonomic relationships in hand. This
-# context is absolutely required for the interpretation of our tree.
-
-# We have the tax-ids in our database, and the NCBI has the species tree - we just need some way to extract the subtree that corresponds to our taxons of interest. Here's how to use the taxize:: package.
-
-if (! requireNamespace("taxize", quietly = TRUE)) {
-  install.packages("taxize")
-}
-# Package information:
-#  library(help   = taxize)       # basic information
-#  browseVignettes("taxize")    # available vignettes
-#  data(package  = "taxize")     # available datasets
-
-( mySOI <- c(myDB$taxonomy$ID, "83333") )
-myClass <- taxize::classification(mySOI, db = "ncbi")
-str(myClass)
-
-myClass[[1]]
-
-fungiTree <- taxize::class2tree(myClass, check = TRUE)
-plot(fungiTree)
-
-# The tree produced by taxize:: contains full length species names,
-# but it would be more convenient if it had bicodes instead. Also, the actual
-# tree is only part of the list(), which will cause problems later:
-str(fungiTree)
-
-# we therefor simplify
-fungiTree <- fungiTree$phylo
-str(fungiTree)
-
-# The species names are in a vector $phylo$tip.label of this list.
-# We can use biCode() to shorten them.
-fungiTree$tip.label <- biCode(fungiTree$tip.label)
-
-# Plot the tree
-nSP <- length(fungiTree$tip.label)
-plot(fungiTree, cex = 0.8, root.edge = TRUE, no.margin = TRUE)
-text(-1, nSP - 0.5, "Species Tree:\nFungi", pos = 4)
-ape::nodelabels(text = fungiTree$node.label,
-                cex = 0.6,
-                adj = 0.2,
-                bg = "#D4F2DA")
-# Note that you can use the arrow buttons in the menu above the plot pane to
-# scroll back to plots you have created earlier - so you can reference back to
-# this species tree in your later analysis.
-
-
-# =    3  Tree Analysis  =======================================================
-
-
-# 1.1  Visualizing your tree
-# The trees that are produced by Rphylip are stored as an object of class
-# "phylo". This is a class for phylogenetic trees that is widely used in the
-# community, practically all R phylogenetics packages will options to read and
-# manipulate such trees. Outside of R, a popular interchange format is the
-# Newick_format that you have seen above. It's easy to output your calculated
-# trees in Newick format and visualize them elsewhere.
-
-# The "phylo" class object is one of R's "S3" objects and methods to plot and
-# print it have been defined with the Rphylip package, and in ape. You can
-# simply call plot() and R knows what to do with  and how
-# to plot it. The underlying function is plot.phylo(), and documentation for its
-# many options can by found by typing:
-
-?plot.phylo
-
-# We load the APSES sequence tree that you produced in the
-# BIN-PHYLO-Tree_building unit:
-apsTree <- readRDS(file = "data/APSEStreeRproml.rds")
-
-plot(apsTree) # default type is "phylogram"
-plot(apsTree, type = "unrooted")
-plot(apsTree, type = "fan", no.margin = TRUE)
-
-# rescale to show all of the labels:
-# record the current plot parameters by assigning them to a variable ...
-(tmp <- plot(apsTree, type="fan", no.margin = TRUE, plot=FALSE))
-# ... and adjust the plot limits for a new plot:
-plot(apsTree,
-     type = "fan",
-     x.lim = tmp$x.lim * 1.8,
-     y.lim = tmp$y.lim * 1.8,
-     cex = 0.8,
-     no.margin = TRUE)
-
-# Inspect the tree object
-str(apsTree)
-apsTree$tip.label
-apsTree$edge
-apsTree$edge.length
-
-# show the node / edge and tip labels on a plot
-plot(apsTree)
-ape::nodelabels()
-ape::edgelabels()
-ape::tiplabels()
-
-# show the number of nodes, edges and tips
-ape::Nnode(apsTree)
-ape::Nedge(apsTree)
-ape::Ntip(apsTree)
-
-par(PAR)   # reset graphics state
-
-# Finally, write the tree to console in Newick format
-ape::write.tree(apsTree)
-
-# ==   3.1  Rooting Trees  =====================================================
-
-# In order to analyse the tree, it is helpful to root it first and reorder its
-# clades. Contrary to documentation, Rproml() returns an unrooted tree.
-
-ape::is.rooted(apsTree)
-
-# You can root the tree with the command root() from the "ape" package.
-
-plot(apsTree)
-
-# add labels for internal nodes and tips
-ape::nodelabels(cex = 0.5, frame = "circle")
-ape::tiplabels(cex = 0.5, frame = "rect")
-
-# The outgroup of the tree (KILA ESCCO) is tip "11" in my sample tree, it may be a different
-# number in yours. Substitute the correct node number below for "outgroup".
-apsTree <- ape::root(apsTree, outgroup = 11, resolve.root = TRUE)
-plot(apsTree)
-ape::is.rooted(apsTree)
-
-# This tree _looks_ unchanged, beacuse when the root trifurcation was resolved,
-# an edge of length zero was added to connect the MRCA (Most Recent Common
-# Ancestor) of the ingroup.
-
-# The edge lengths are stored in the phylo object:
-apsTree$edge.length
-
-# ... and you can assign a small arbitrary value to the edge
-# to show how it connects to the tree without having an
-# overlap.
-apsTree$edge.length[1] <- 0.1
-plot(apsTree, cex = 0.7)
-ape::nodelabels(text = "MRCA", node = 12, cex = 0.5, adj = 0.1, bg = "#ff8866")
-
-
-# This procedure does however not assign an actual length to a root edge, and
-# therefore no root edge is visible on the plot. Why? , you might ask. I ask
-# myself that too. We'll just add a length by hand.
-
-apsTree$root.edge <- mean(apsTree$edge.length) * 1.5
-plot(apsTree, cex = 0.7, root.edge = TRUE)
-ape::nodelabels(text = "MRCA", node = 12, cex = 0.5, adj = 0.8, bg = "#ff8866")
-
-
-# ==   3.2  Rotating Clades  ===================================================
-
-# To interpret the tree, it is useful to rotate the clades so that they appear
-# in the order expected from the cladogram of species.
-
-# We can either rotate around individual internal nodes ...
-layout(matrix(1:2, 1, 2))
-plot(apsTree, no.margin = TRUE, root.edge = TRUE)
-ape::nodelabels(node = 13, cex = 0.7, bg = "#ff8866")
-plot(ape::rotate(apsTree, node = 13), no.margin = TRUE, root.edge = TRUE)
-ape::nodelabels(node = 13, cex = 0.7, bg = "#88ff66")
-# Note that the species at the bottom of the clade descending from node
-# 17 is now plotted at the top.
-
-par(PAR)   # reset graphics state
-
-# ... or we can rearrange the tree so it corresponds as well as possible to a
-# predefined tip ordering. Here we use the ordering that taxize:: has inferred
-# from the NCBI taxonomic classification.
-
-nOrg <- length(apsTree$tip.label)
-
-plot(fungiTree,
-     no.margin = FALSE, root.edge = TRUE)
-ape::nodelabels(text = fungiTree$node.label,
-                cex = 0.5,
-                adj = 0.2,
-                bg = "#D4F2DA")
-
-# These are the fungi tree tips ...
-fungiTree$tip.label
-# ... and their order is determined by the edge-list that is stored in
-fungiTree$edge
-# which edges join the tips?
-ape::tiplabels(cex = 0.5, frame = "rect")
-# as you can see, the tips (range [1:nOrg] ) are in column 2 and they are
-# ordered from bottom to top.
-# And each tip number is the index of the species in the tip.label vector. So we can take column 2, subset it, and use it to get a list of species in the order of the tree ...
-
-sel <- fungiTree$edge[ , 2 ] <= nOrg
-( oSp <- fungiTree$tip.label[fungiTree$edge[sel , 2 ]] )
-
-# Now, here are the genes of the apsTree tips ...
-apsTree$tip.label
-
-# ... and the "constraint"  we need for reordering, according to the help page
-# of ape::rotateConstr(), is "a vector specifying the order of the tips as they
-# should appear (from bottom to top)". Thus we need to add the "MBP1_" prefix to our vector
-oSp <- gsub("^", "MBP1_", oSp)
-( oSp <- gsub("MBP1_ESSCO", "KILA_ESCCO", oSp) )
-
-# Then we can plot the two trees to compare: the fungi- tree
-par(PAR)   # reset graphics state
-layout(matrix(1:2, 1, 2))
-plot(fungiTree,
-    no.margin = TRUE,
-     root.edge = TRUE)
-ape::nodelabels(text = fungiTree$node.label,
-                cex = 0.5,
-                adj = 0.2,
-                bg = "#D4F2DA")
-
-# and the re-organized apsesTree ...
-plot(ape::rotateConstr(apsTree, constraint = oSp[]),
-     no.margin = TRUE,
-     root.edge = TRUE)
-
-par(PAR)   # reset graphics state
-
-# As you can see, the reordering is not perfect, since the topologies are
-# different, mostly due to the unresolved nodes in the reference tree. One
-# could play with that ...
-
-
-# Task: Study the two trees and consider their similarities and differences.
-#         What do you expect? What do you find? Note that this is not a "mixed"
-#         gene tree yet, since it contains only a single gene for the species
-#         we considered. All of the branch points in this tree are speciation
-#         events. Thus the gene tree should have the same topology as the
-#         species tree. Does it? Are the differences important? How many
-#         branches would you need to remove and reinsert elsewhere to get the
-#         same topology as the species tree?
-
-# In order to quantify how different these two trees are, we need to compute
-# tree distances.
-
-
-# ==   3.3  Computing tree distances  ==========================================
-
-
-# Many superb phylogeny tools are contributed by the phangorn package.
-
-if (! requireNamespace("phangorn", quietly = TRUE)) {
-  install.packages("phangorn")
-}
-# Package information:
-#  library(help = phangorn)       # basic information
-#  browseVignettes("phangorn")    # available vignettes
-#  data(package = "phangorn")     # available datasets
-
-# To compare two trees, they must have the same tip labels. We delete "MBP1_" or
-# "KILA_" from the existing tip labels in a copy of our APSES domain tree.
-apsTree2 <- apsTree
-apsTree2$tip.label <- gsub("(MBP1_)|(KILA_)", "", apsTree2$tip.label)
-
-
-# phangorn provides several functions to compute tree-differences (and there
-# is a _whole_ lot of theory on how to compare trees). treedist() returns the
-# "symmetric difference"
-phangorn::treedist(fungiTree, apsTree2, check.labels = TRUE)
-
-# Numbers. What do they mean? How much more similar is our apsTree to the
-# (presumably) ground truth of fungiTree than a random tree would be?
-# The ape package provides the function rtree()
-# to compute random trees.
-
-ape::rtree(n = length(apsTree2$tip.label), # number of tips
-          rooted = TRUE,                   # we rooted the tree above,
-                                           #  and fungiTree is rooted anyway
-          tip.label = apsTree2$tip.label,  # use the apsTree2 labels
-          br = NULL)                       # don't generate branch lengths since
-                                           #   fungiTree has none, so we can't
-                                           #   compare them anyway.
-
-# (Note the warning message about non-binary trees; we'll suppress that later
-#  by wrapping the function call in supressMessages(); we don't want to
-#  print it 10,000 times :-)
-
-
-# Let's compute some random trees this way, calculate the distances to
-# fungiTree, and then compare the values we get for apsTree2. The random
-# trees are provided by ape::rtree().
-
-N <- 10000  # takes about 15 seconds, and we'll use the pBar function,
-            # defined in .utilities.R  to keep track of where we are at:
-myTreeDistances <- matrix(numeric(N * 2), ncol = 2)
-colnames(myTreeDistances) <- c("symm", "path")
-
-set.seed(112358)
-for (i in 1:N) {
-  pBar(i, N)
-  xTree <- ape::rtree(n = length(apsTree2$tip.label),
-                      rooted = TRUE,
-                      tip.label = apsTree2$tip.label,
-                      br = NULL)
-  myTreeDistances[i, ] <- suppressMessages(phangorn::treedist(fungiTree, xTree))
-}
-set.seed(NULL)                      # reset the random number generator
-
-table(myTreeDistances[, "symm"])
-
-( symmObs <- phangorn::treedist(fungiTree, apsTree2)[1] )
-
-# Random events less-or-equal to observation, divided by total number of
-# events gives us the empirical p-value.
-cat(sprintf("\nEmpirical p-value for symmetric diff. of observed tree is %1.4f\n",
-            (sum(myTreeDistances[ , "symm"] <= symmObs) + 1) / (N + 1)))
-
-par(PAR)   # reset graphics state
-hist(myTreeDistances[, "path"],
-     col = "aliceblue",
-     main = "Distances of random Trees to fungiTree")
-(pathObs <- phangorn::treedist(fungiTree, apsTree2)[2])
-abline(v = pathObs, col = "chartreuse")
-
-# Random events less-or-equal to observation, divided by total number of
-# events gives us the empirical p-value.
-cat(sprintf("\nEmpirical p-value for path diff. of observed tree is %1.4f\n",
-            (sum(myTreeDistances[ , "path"] <= symmObs) + 1) / (N + 1)))
-
-# Indeed, our apsTree is _very_ much more similar to the species tree than
-# we would expect by random chance.
-
-# What do we gain from that analysis? Analyzing the tree we get from a single
-# gene of orthologous sequences is a positive control in our computational
-# experiment. If these genes are indeed orthologues, a correct tree-building
-# program ought to give us a tree that exactly matches the species tree.
-# Evaluating how far off we are from the known correct result gives us a way to
-# validate our workflow and our algorithm. If we can't get that right, we can't
-# expect to get "real" data right either. Employing such positive controls in
-# every computational experiment is essential for research. Not doing so is
-# Cargo Cult Bioinformatics.
-
-
-# [END]
+# tocID <- "BIN-PHYLO-Tree_analysis.R"
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-PHYLO-Tree_analysis unit.
+#
+# Version:  1.2
+#
+# Date:     2017-10  -  2020-09
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.2    2020 updates. Deprecate iTol and use taxize:: instead.
+#                  Rewrite of tip re-ordering. Better handling of
+#                  messages. pBar() for randomization.
+#           1.1    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#                      use Biocmanager:: not biocLite()
+#           1.0.2  Typo in variable name, style changes
+#           1.0.1  Wrong section heading
+#           1.0    First 2017 version
+#           0.1    First code copied from 2016 material.
+#
+#
+# TODO:
+#
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                              Line
+#TOC> --------------------------------------------------
+#TOC>   1        Preparation and Tree Plot            50
+#TOC>   2        SPECIES REFERENCE TREE               66
+#TOC>   3        Tree Analysis                       117
+#TOC>   3.1        Rooting Trees                     177
+#TOC>   3.2        Rotating Clades                   222
+#TOC>   3.3        Computing tree distances          309
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  Preparation and Tree Plot  ===========================================
+
+
+if (! requireNamespace("ape", quietly = TRUE)) {
+  install.packages("ape")
+}
+# Package information:
+#  library(help = ape)       # basic information
+#  browseVignettes("ape")    # available vignettes
+#  data(package = "ape")     # available datasets
+
+# We change the graphics parameters from time to time, let's define the
+# default so we can recreate a sane state:
+dev.off()
+PAR <- par()
+
+# =    2  SPECIES REFERENCE TREE  ==============================================
+
+# Before we do any kind of phylogenetic analysis of genes from several species,
+# we MUST have a reference tree of the taxonomic relationships in hand. This
+# context is absolutely required for the interpretation of our tree.
+
+# We have the tax-ids in our database, and the NCBI has the species tree - we just need some way to extract the subtree that corresponds to our taxons of interest. Here's how to use the taxize:: package.
+
+if (! requireNamespace("taxize", quietly = TRUE)) {
+  install.packages("taxize")
+}
+# Package information:
+#  library(help   = taxize)       # basic information
+#  browseVignettes("taxize")    # available vignettes
+#  data(package  = "taxize")     # available datasets
+
+( mySOI <- c(myDB$taxonomy$ID, "83333") )
+myClass <- taxize::classification(mySOI, db = "ncbi")
+str(myClass)
+
+myClass[[1]]
+
+fungiTree <- taxize::class2tree(myClass, check = TRUE)
+plot(fungiTree)
+
+# The tree produced by taxize:: contains full length species names,
+# but it would be more convenient if it had bicodes instead. Also, the actual
+# tree is only part of the list(), which will cause problems later:
+str(fungiTree)
+
+# we therefor simplify
+fungiTree <- fungiTree$phylo
+str(fungiTree)
+
+# The species names are in a vector $phylo$tip.label of this list.
+# We can use biCode() to shorten them.
+fungiTree$tip.label <- biCode(fungiTree$tip.label)
+
+# Plot the tree
+nSP <- length(fungiTree$tip.label)
+plot(fungiTree, cex = 0.8, root.edge = TRUE, no.margin = TRUE)
+text(-1, nSP - 0.5, "Species Tree:\nFungi", pos = 4)
+ape::nodelabels(text = fungiTree$node.label,
+                cex = 0.6,
+                adj = 0.2,
+                bg = "#D4F2DA")
+# Note that you can use the arrow buttons in the menu above the plot pane to
+# scroll back to plots you have created earlier - so you can reference back to
+# this species tree in your later analysis.
+
+
+# =    3  Tree Analysis  =======================================================
+
+
+# 1.1  Visualizing your tree
+# The trees that are produced by Rphylip are stored as an object of class
+# "phylo". This is a class for phylogenetic trees that is widely used in the
+# community, practically all R phylogenetics packages will options to read and
+# manipulate such trees. Outside of R, a popular interchange format is the
+# Newick_format that you have seen above. It's easy to output your calculated
+# trees in Newick format and visualize them elsewhere.
+
+# The "phylo" class object is one of R's "S3" objects and methods to plot and
+# print it have been defined with the Rphylip package, and in ape. You can
+# simply call plot() and R knows what to do with  and how
+# to plot it. The underlying function is plot.phylo(), and documentation for its
+# many options can by found by typing:
+
+?plot.phylo
+
+# We load the APSES sequence tree that you produced in the
+# BIN-PHYLO-Tree_building unit:
+apsTree <- readRDS(file = "data/APSEStreeRproml.rds")
+
+plot(apsTree) # default type is "phylogram"
+plot(apsTree, type = "unrooted")
+plot(apsTree, type = "fan", no.margin = TRUE)
+
+# rescale to show all of the labels:
+# record the current plot parameters by assigning them to a variable ...
+(tmp <- plot(apsTree, type="fan", no.margin = TRUE, plot=FALSE))
+# ... and adjust the plot limits for a new plot:
+plot(apsTree,
+     type = "fan",
+     x.lim = tmp$x.lim * 1.8,
+     y.lim = tmp$y.lim * 1.8,
+     cex = 0.8,
+     no.margin = TRUE)
+
+# Inspect the tree object
+str(apsTree)
+apsTree$tip.label
+apsTree$edge
+apsTree$edge.length
+
+# show the node / edge and tip labels on a plot
+plot(apsTree)
+ape::nodelabels()
+ape::edgelabels()
+ape::tiplabels()
+
+# show the number of nodes, edges and tips
+ape::Nnode(apsTree)
+ape::Nedge(apsTree)
+ape::Ntip(apsTree)
+
+par(PAR)   # reset graphics state
+
+# Finally, write the tree to console in Newick format
+ape::write.tree(apsTree)
+
+# ==   3.1  Rooting Trees  =====================================================
+
+# In order to analyse the tree, it is helpful to root it first and reorder its
+# clades. Contrary to documentation, Rproml() returns an unrooted tree.
+
+ape::is.rooted(apsTree)
+
+# You can root the tree with the command root() from the "ape" package.
+
+plot(apsTree)
+
+# add labels for internal nodes and tips
+ape::nodelabels(cex = 0.5, frame = "circle")
+ape::tiplabels(cex = 0.5, frame = "rect")
+
+# The outgroup of the tree (KILA ESCCO) is tip "11" in my sample tree, it may be a different
+# number in yours. Substitute the correct node number below for "outgroup".
+apsTree <- ape::root(apsTree, outgroup = 11, resolve.root = TRUE)
+plot(apsTree)
+ape::is.rooted(apsTree)
+
+# This tree _looks_ unchanged, beacuse when the root trifurcation was resolved,
+# an edge of length zero was added to connect the MRCA (Most Recent Common
+# Ancestor) of the ingroup.
+
+# The edge lengths are stored in the phylo object:
+apsTree$edge.length
+
+# ... and you can assign a small arbitrary value to the edge
+# to show how it connects to the tree without having an
+# overlap.
+apsTree$edge.length[1] <- 0.1
+plot(apsTree, cex = 0.7)
+ape::nodelabels(text = "MRCA", node = 12, cex = 0.5, adj = 0.1, bg = "#ff8866")
+
+
+# This procedure does however not assign an actual length to a root edge, and
+# therefore no root edge is visible on the plot. Why? , you might ask. I ask
+# myself that too. We'll just add a length by hand.
+
+apsTree$root.edge <- mean(apsTree$edge.length) * 1.5
+plot(apsTree, cex = 0.7, root.edge = TRUE)
+ape::nodelabels(text = "MRCA", node = 12, cex = 0.5, adj = 0.8, bg = "#ff8866")
+
+
+# ==   3.2  Rotating Clades  ===================================================
+
+# To interpret the tree, it is useful to rotate the clades so that they appear
+# in the order expected from the cladogram of species.
+
+# We can either rotate around individual internal nodes ...
+layout(matrix(1:2, 1, 2))
+plot(apsTree, no.margin = TRUE, root.edge = TRUE)
+ape::nodelabels(node = 13, cex = 0.7, bg = "#ff8866")
+plot(ape::rotate(apsTree, node = 13), no.margin = TRUE, root.edge = TRUE)
+ape::nodelabels(node = 13, cex = 0.7, bg = "#88ff66")
+# Note that the species at the bottom of the clade descending from node
+# 17 is now plotted at the top.
+
+par(PAR)   # reset graphics state
+
+# ... or we can rearrange the tree so it corresponds as well as possible to a
+# predefined tip ordering. Here we use the ordering that taxize:: has inferred
+# from the NCBI taxonomic classification.
+
+nOrg <- length(apsTree$tip.label)
+
+plot(fungiTree,
+     no.margin = FALSE, root.edge = TRUE)
+ape::nodelabels(text = fungiTree$node.label,
+                cex = 0.5,
+                adj = 0.2,
+                bg = "#D4F2DA")
+
+# These are the fungi tree tips ...
+fungiTree$tip.label
+# ... and their order is determined by the edge-list that is stored in
+fungiTree$edge
+# which edges join the tips?
+ape::tiplabels(cex = 0.5, frame = "rect")
+# as you can see, the tips (range [1:nOrg] ) are in column 2 and they are
+# ordered from bottom to top.
+# And each tip number is the index of the species in the tip.label vector. So we can take column 2, subset it, and use it to get a list of species in the order of the tree ...
+
+sel <- fungiTree$edge[ , 2 ] <= nOrg
+( oSp <- fungiTree$tip.label[fungiTree$edge[sel , 2 ]] )
+
+# Now, here are the genes of the apsTree tips ...
+apsTree$tip.label
+
+# ... and the "constraint"  we need for reordering, according to the help page
+# of ape::rotateConstr(), is "a vector specifying the order of the tips as they
+# should appear (from bottom to top)". Thus we need to add the "MBP1_" prefix to our vector
+oSp <- gsub("^", "MBP1_", oSp)
+( oSp <- gsub("MBP1_ESSCO", "KILA_ESCCO", oSp) )
+
+# Then we can plot the two trees to compare: the fungi- tree
+par(PAR)   # reset graphics state
+layout(matrix(1:2, 1, 2))
+plot(fungiTree,
+    no.margin = TRUE,
+     root.edge = TRUE)
+ape::nodelabels(text = fungiTree$node.label,
+                cex = 0.5,
+                adj = 0.2,
+                bg = "#D4F2DA")
+
+# and the re-organized apsesTree ...
+plot(ape::rotateConstr(apsTree, constraint = oSp[]),
+     no.margin = TRUE,
+     root.edge = TRUE)
+
+par(PAR)   # reset graphics state
+
+# As you can see, the reordering is not perfect, since the topologies are
+# different, mostly due to the unresolved nodes in the reference tree. One
+# could play with that ...
+
+
+# Task: Study the two trees and consider their similarities and differences.
+#         What do you expect? What do you find? Note that this is not a "mixed"
+#         gene tree yet, since it contains only a single gene for the species
+#         we considered. All of the branch points in this tree are speciation
+#         events. Thus the gene tree should have the same topology as the
+#         species tree. Does it? Are the differences important? How many
+#         branches would you need to remove and reinsert elsewhere to get the
+#         same topology as the species tree?
+
+# In order to quantify how different these two trees are, we need to compute
+# tree distances.
+
+
+# ==   3.3  Computing tree distances  ==========================================
+
+
+# Many superb phylogeny tools are contributed by the phangorn package.
+
+if (! requireNamespace("phangorn", quietly = TRUE)) {
+  install.packages("phangorn")
+}
+# Package information:
+#  library(help = phangorn)       # basic information
+#  browseVignettes("phangorn")    # available vignettes
+#  data(package = "phangorn")     # available datasets
+
+# To compare two trees, they must have the same tip labels. We delete "MBP1_" or
+# "KILA_" from the existing tip labels in a copy of our APSES domain tree.
+apsTree2 <- apsTree
+apsTree2$tip.label <- gsub("(MBP1_)|(KILA_)", "", apsTree2$tip.label)
+
+
+# phangorn provides several functions to compute tree-differences (and there
+# is a _whole_ lot of theory on how to compare trees). treedist() returns the
+# "symmetric difference"
+phangorn::treedist(fungiTree, apsTree2, check.labels = TRUE)
+
+# Numbers. What do they mean? How much more similar is our apsTree to the
+# (presumably) ground truth of fungiTree than a random tree would be?
+# The ape package provides the function rtree()
+# to compute random trees.
+
+ape::rtree(n = length(apsTree2$tip.label), # number of tips
+          rooted = TRUE,                   # we rooted the tree above,
+                                           #  and fungiTree is rooted anyway
+          tip.label = apsTree2$tip.label,  # use the apsTree2 labels
+          br = NULL)                       # don't generate branch lengths since
+                                           #   fungiTree has none, so we can't
+                                           #   compare them anyway.
+
+# (Note the warning message about non-binary trees; we'll suppress that later
+#  by wrapping the function call in supressMessages(); we don't want to
+#  print it 10,000 times :-)
+
+
+# Let's compute some random trees this way, calculate the distances to
+# fungiTree, and then compare the values we get for apsTree2. The random
+# trees are provided by ape::rtree().
+
+N <- 10000  # takes about 15 seconds, and we'll use the pBar function,
+            # defined in .utilities.R  to keep track of where we are at:
+myTreeDistances <- matrix(numeric(N * 2), ncol = 2)
+colnames(myTreeDistances) <- c("symm", "path")
+
+set.seed(112358)
+for (i in 1:N) {
+  pBar(i, N)
+  xTree <- ape::rtree(n = length(apsTree2$tip.label),
+                      rooted = TRUE,
+                      tip.label = apsTree2$tip.label,
+                      br = NULL)
+  myTreeDistances[i, ] <- suppressMessages(phangorn::treedist(fungiTree, xTree))
+}
+set.seed(NULL)                      # reset the random number generator
+
+table(myTreeDistances[, "symm"])
+
+( symmObs <- phangorn::treedist(fungiTree, apsTree2)[1] )
+
+# Random events less-or-equal to observation, divided by total number of
+# events gives us the empirical p-value.
+cat(sprintf("\nEmpirical p-value for symmetric diff. of observed tree is %1.4f\n",
+            (sum(myTreeDistances[ , "symm"] <= symmObs) + 1) / (N + 1)))
+
+par(PAR)   # reset graphics state
+hist(myTreeDistances[, "path"],
+     col = "aliceblue",
+     main = "Distances of random Trees to fungiTree")
+(pathObs <- phangorn::treedist(fungiTree, apsTree2)[2])
+abline(v = pathObs, col = "chartreuse")
+
+# Random events less-or-equal to observation, divided by total number of
+# events gives us the empirical p-value.
+cat(sprintf("\nEmpirical p-value for path diff. of observed tree is %1.4f\n",
+            (sum(myTreeDistances[ , "path"] <= symmObs) + 1) / (N + 1)))
+
+# Indeed, our apsTree is _very_ much more similar to the species tree than
+# we would expect by random chance.
+
+# What do we gain from that analysis? Analyzing the tree we get from a single
+# gene of orthologous sequences is a positive control in our computational
+# experiment. If these genes are indeed orthologues, a correct tree-building
+# program ought to give us a tree that exactly matches the species tree.
+# Evaluating how far off we are from the known correct result gives us a way to
+# validate our workflow and our algorithm. If we can't get that right, we can't
+# expect to get "real" data right either. Employing such positive controls in
+# every computational experiment is essential for research. Not doing so is
+# Cargo Cult Bioinformatics.
+
+
+# [END]
diff --git a/BIN-PHYLO-Tree_building.R b/BIN-PHYLO-Tree_building.R
index 106fac4..3ed7277 100644
--- a/BIN-PHYLO-Tree_building.R
+++ b/BIN-PHYLO-Tree_building.R
@@ -1,168 +1,168 @@
-# tocID <- "BIN-PHYLO-Tree_building.R"
-#
-# Purpose:  A Bioinformatics Course:
-#              R code accompanying the BIN-PHYLO-Tree_building unit.
-#
-# Version:  1.2
-#
-# Date:     2017-10   2020-09
-# Author:   Boris Steipe (boris.steipe@utoronto.ca)
-#
-# Versions:
-#           1.2    deprecate save()/load() for saveRDS()/readRDS(); Mac:
-#                  instructions to authorize proml.app
-#           1.1    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#           1.0    First 2017 version
-#           0.1    First code copied from 2016 material.
-#
-#
-# TODO:
-#           Add MrBayes
-# https://cran.r-project.org/web/packages/phangorn/vignettes/IntertwiningTreesAndNetworks.html
-#
-# == DO NOT SIMPLY  source()  THIS FILE! =======================================
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-# going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC> 
-#TOC>   Section  Title                                       Line
-#TOC> -----------------------------------------------------------
-#TOC>   1        Calculating Trees                             48
-#TOC>   1.1        PROMLPATH ...                               68
-#TOC>   1.1.1          ... on the Mac                          73
-#TOC>   1.1.2          ... on Windows                         101
-#TOC>   1.1.3          ... on Linux                           115
-#TOC>   1.1.4          Confirming PROMLPATH                   120
-#TOC>   1.2        Building a maximum likelihood tree         134
-#TOC> 
-#TOC> ==========================================================================
-
-
-# =    1  Calculating Trees  ===================================================
-
-
-# Follow the instructions found at phylip's home on the Web to install. If you
-# are on a Windows computer, take note of the installation directory.
-
-# After you have installed Phylip on your computer, install the R package that
-# provides an interface to the Phylip functions.
-
-if (! requireNamespace("Rphylip", quietly = TRUE)) {
-  install.packages("Rphylip")
-}
-# Package information:
-#  library(help = Rphylip)       # basic information
-#  browseVignettes("Rphylip")    # available vignettes
-#  data(package = "Rphylip")     # available datasets
-
-# This will install RPhylip, as well as its dependency, the package "ape".
-
-
-# ==   1.1  PROMLPATH ...  =====================================================
-# The next part may be tricky. You will need to figure out where
-# on your computer Phylip has been installed and define the path
-# to the proml program that calculates a maximum-likelihood tree.
-
-# ===   1.1.1  ... on the Mac                    
-# On the Mac, the standard installation places a phylip folder
-# in the /Applications directory. That folder contains all the
-# individual phylip programs as .app files. These are not
-# the actual executables, but "app" files are actually directories
-# that contain the required resources for a program to run.
-
-# The executable is in a subdirectory and you can point Rphylip
-# directly to that subdirectory to find the program it needs:
-# PROMLPATH <- "/Applications/phylip-3.695/exe/proml.app/Contents/MacOS"
-
-# However, RPHYLIP will not be able to run PHYLIP applications immediately,
-# because they have not been "signed" by the PHYLIP developers. The process
-# will terminate by your system, with a warning.
-
-#   -  Navigate to the phylip folder in your ~/Applications directory
-#   -  Descend into the "exe" folder and find  proml.app
-#   -  Ctrl-click  proml.app  and choose "Open". A dialogue will show that
-#      says: "macOS cannot verify the developer of “proml.app”.
-#             Are you sure you want to open it?"
-#   -  Click open to continue. You may need to allow access to the terminal
-#      as well. When the proml terminal session open, you can type
-#      Ctrl-c to abort the program and close the window.
-#
-#   This adds proml.app to the list of known-good programs and you will not
-#   need to repeat this process.
-#
-
-# ===   1.1.2  ... on Windows                    
-# On Windows you need to know where the programs have been installed, and you
-# need to specify a path that is correct for the Windows OS. Find the folder
-# that is named "exe", and right-click to inspect its properties. The path
-# should be listed among them.
-
-# If the path looks like "C:\Users\Meng\Programs\phylip-3.695\exe", then your
-# assignment has to be
-# PROMLPATH <- "C:/Users/Meng/Programs/phylip-3.695/exe"
-# (Note: "/", not "\")
-
-# I have heard that your path must not contain spaces, and it is prudent to
-# avoid other special characters as well.
-
-# ===   1.1.3  ... on Linux                      
-# If you are running Linux I trust you know what to do. It's probably
-# something like
-# PROMLPATH <- "/usr/local/phylip-3.695/bin"
-
-# ===   1.1.4  Confirming PROMLPATH              
-# Confirm that the settings are right.
-PROMLPATH                # returns the path
-list.dirs(PROMLPATH)     # returns the directories in that path
-list.files(PROMLPATH)    # lists the files [1] "proml"   "proml.command"
-
-# If "proml" is NOT among the files that the last command returns, you
-# can't continue. Ask on the mailing list for advice.
-
-# If everything is good, you can add the line that defines PROMLPATH to
-# myScripts/.myProfile.R - the path will then be automatically set when
-# you quit RStudio and return.
-
-
-# ==   1.2  Building a maximum likelihood tree  ================================
-# Now read the mfa file you have saved in the BIB-PHYLO-Data_preparation unit,
-# as a "proseq" object with the read.protein() function of the RPhylip package:
-
-apsIn <- Rphylip::read.protein("data/APSESphyloSet.mfa")
-str(apsIn)
-
-# ... and you are ready to build a tree.
-
-# There are many fast options in PHYLIP - we will use the most _accurate_ one
-# that it has: proml, a maximum-likelihood tree building program for protein
-# data.
-
-# Building maximum-likelihood trees can eat as much computer time
-# as you can throw at it. Calculating a tree of 48 APSES domains
-# with default parameters of Rproml() runs for more than half a day
-# on my computer. But we have only twelve sequences here, so the
-# process will take us about 5 to 15 minutes. Run this, and anjoy a good cup
-# of coffee while you are waiting.
-
-apsTree <- Rphylip::Rproml(apsIn, path=PROMLPATH)
-
-# A quick first look:
-
-plot(apsTree)
-
-# save your tree:
-saveRDS(apsTree, file = "data/APSEStreeRproml.rds")
-
-# If this did not work, ask for advice.
-
-
-
-
-# [END]
+# tocID <- "BIN-PHYLO-Tree_building.R"
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-PHYLO-Tree_building unit.
+#
+# Version:  1.2
+#
+# Date:     2017-10   2020-09
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.2    deprecate save()/load() for saveRDS()/readRDS(); Mac:
+#                  instructions to authorize proml.app
+#           1.1    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#           1.0    First 2017 version
+#           0.1    First code copied from 2016 material.
+#
+#
+# TODO:
+#           Add MrBayes
+# https://cran.r-project.org/web/packages/phangorn/vignettes/IntertwiningTreesAndNetworks.html
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                                       Line
+#TOC> -----------------------------------------------------------
+#TOC>   1        Calculating Trees                             48
+#TOC>   1.1        PROMLPATH ...                               68
+#TOC>   1.1.1          ... on the Mac                          73
+#TOC>   1.1.2          ... on Windows                         101
+#TOC>   1.1.3          ... on Linux                           115
+#TOC>   1.1.4          Confirming PROMLPATH                   120
+#TOC>   1.2        Building a maximum likelihood tree         134
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  Calculating Trees  ===================================================
+
+
+# Follow the instructions found at phylip's home on the Web to install. If you
+# are on a Windows computer, take note of the installation directory.
+
+# After you have installed Phylip on your computer, install the R package that
+# provides an interface to the Phylip functions.
+
+if (! requireNamespace("Rphylip", quietly = TRUE)) {
+  install.packages("Rphylip")
+}
+# Package information:
+#  library(help = Rphylip)       # basic information
+#  browseVignettes("Rphylip")    # available vignettes
+#  data(package = "Rphylip")     # available datasets
+
+# This will install RPhylip, as well as its dependency, the package "ape".
+
+
+# ==   1.1  PROMLPATH ...  =====================================================
+# The next part may be tricky. You will need to figure out where
+# on your computer Phylip has been installed and define the path
+# to the proml program that calculates a maximum-likelihood tree.
+
+# ===   1.1.1  ... on the Mac                    
+# On the Mac, the standard installation places a phylip folder
+# in the /Applications directory. That folder contains all the
+# individual phylip programs as .app files. These are not
+# the actual executables, but "app" files are actually directories
+# that contain the required resources for a program to run.
+
+# The executable is in a subdirectory and you can point Rphylip
+# directly to that subdirectory to find the program it needs:
+# PROMLPATH <- "/Applications/phylip-3.695/exe/proml.app/Contents/MacOS"
+
+# However, RPHYLIP will not be able to run PHYLIP applications immediately,
+# because they have not been "signed" by the PHYLIP developers. The process
+# will terminate by your system, with a warning.
+
+#   -  Navigate to the phylip folder in your ~/Applications directory
+#   -  Descend into the "exe" folder and find  proml.app
+#   -  Ctrl-click  proml.app  and choose "Open". A dialogue will show that
+#      says: "macOS cannot verify the developer of “proml.app”.
+#             Are you sure you want to open it?"
+#   -  Click open to continue. You may need to allow access to the terminal
+#      as well. When the proml terminal session open, you can type
+#      Ctrl-c to abort the program and close the window.
+#
+#   This adds proml.app to the list of known-good programs and you will not
+#   need to repeat this process.
+#
+
+# ===   1.1.2  ... on Windows                    
+# On Windows you need to know where the programs have been installed, and you
+# need to specify a path that is correct for the Windows OS. Find the folder
+# that is named "exe", and right-click to inspect its properties. The path
+# should be listed among them.
+
+# If the path looks like "C:\Users\Meng\Programs\phylip-3.695\exe", then your
+# assignment has to be
+# PROMLPATH <- "C:/Users/Meng/Programs/phylip-3.695/exe"
+# (Note: "/", not "\")
+
+# I have heard that your path must not contain spaces, and it is prudent to
+# avoid other special characters as well.
+
+# ===   1.1.3  ... on Linux                      
+# If you are running Linux I trust you know what to do. It's probably
+# something like
+# PROMLPATH <- "/usr/local/phylip-3.695/bin"
+
+# ===   1.1.4  Confirming PROMLPATH              
+# Confirm that the settings are right.
+PROMLPATH                # returns the path
+list.dirs(PROMLPATH)     # returns the directories in that path
+list.files(PROMLPATH)    # lists the files [1] "proml"   "proml.command"
+
+# If "proml" is NOT among the files that the last command returns, you
+# can't continue. Ask on the mailing list for advice.
+
+# If everything is good, you can add the line that defines PROMLPATH to
+# myScripts/.myProfile.R - the path will then be automatically set when
+# you quit RStudio and return.
+
+
+# ==   1.2  Building a maximum likelihood tree  ================================
+# Now read the mfa file you have saved in the BIB-PHYLO-Data_preparation unit,
+# as a "proseq" object with the read.protein() function of the RPhylip package:
+
+apsIn <- Rphylip::read.protein("data/APSESphyloSet.mfa")
+str(apsIn)
+
+# ... and you are ready to build a tree.
+
+# There are many fast options in PHYLIP - we will use the most _accurate_ one
+# that it has: proml, a maximum-likelihood tree building program for protein
+# data.
+
+# Building maximum-likelihood trees can eat as much computer time
+# as you can throw at it. Calculating a tree of 48 APSES domains
+# with default parameters of Rproml() runs for more than half a day
+# on my computer. But we have only twelve sequences here, so the
+# process will take us about 5 to 15 minutes. Run this, and anjoy a good cup
+# of coffee while you are waiting.
+
+apsTree <- Rphylip::Rproml(apsIn, path=PROMLPATH)
+
+# A quick first look:
+
+plot(apsTree)
+
+# save your tree:
+saveRDS(apsTree, file = "data/APSEStreeRproml.rds")
+
+# If this did not work, ask for advice.
+
+
+
+
+# [END]
diff --git a/BIN-PPI-Analysis.R b/BIN-PPI-Analysis.R
index 4884ba8..9eb350e 100644
--- a/BIN-PPI-Analysis.R
+++ b/BIN-PPI-Analysis.R
@@ -1,323 +1,323 @@
-# tocID <- "BIN-PPI-Analysis.R"
-#
-#
-# Purpose:  A Bioinformatics Course:
-#              R code accompanying the BIN-PPI-Analysis unit.
-#
-# Version:   1.4
-#
-# Date:     2017-08  -  2020-10
-# Author:   Boris Steipe (boris.steipe@utoronto.ca)
-#
-# Versions:
-#           1.4    Update vector ID's for betweenness centrality.
-#           1.3    Bugfix: called the wrong function on ENSPsel in l. 220
-#           1.2    2020 Updates; Rewrite for new STRINg V11;
-#                  Deprecate save()/load() for saveRDS()/readRDS()
-#           1.1    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#                      use Biocmanager:: not biocLite()
-#           1.0    First live version
-#           0.1    First code copied from 2016 material.
-#
-# TODO:
-#
-#
-# == DO NOT SIMPLY  source()  THIS FILE! =======================================
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-# going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC>
-#TOC>   Section  Title                                           Line
-#TOC> ---------------------------------------------------------------
-#TOC>   1        Setup and data                                    50
-#TOC>   2        Functional Edges in the Human Proteome            86
-#TOC>   2.1        Cliques                                        129
-#TOC>   2.2        Communities                                    170
-#TOC>   2.3        Betweenness Centrality                         184
-#TOC>   3        biomaRt                                          231
-#TOC>   4        Task for submission                              302
-#TOC>
-#TOC> ==========================================================================
-
-
-# =    1  Setup and data  ======================================================
-
-
-# Not surprisingly, the analysis of PPI networks needs iGraph:
-
-if (! requireNamespace("igraph", quietly = TRUE)) {
-  install.packages("igraph")
-}
-# Package information:
-#  library(help = igraph)       # basic information
-#  browseVignettes("igraph")    # available vignettes
-#  data(package = "igraph")     # available datasets
-
-# In order for you to explore some real, biological networks, I give you a
-# dataframe of functional relationships of human proteins that I have downloaded
-# from the STRING database. The full table has 8.5 million records, here is a
-# subset of records with combined confidence scores > 980
-
-# The selected set of edges with a confidence of > 964 is a dataframe with about
-# 50,000 edges and 8,400 unique proteins. Incidentaly, that's about the size of
-# a fungal proteome. You can load the saved dataframe here (To read more about
-# what the scores mean, see http://www.ncbi.nlm.nih.gov/pubmed/15608232 ).
-
-STRINGedges <- readRDS("./data/STRINGedges.rds")
-
-head(STRINGedges)
-
-# Note that STRING has appended the tax-ID for Homo sapiens - 9606 - to the
-# Ensemble transcript identifiers that start with ENSP. We'll remove them:
-
-STRINGedges$a <- gsub("^9606\\.", "", STRINGedges$a)
-STRINGedges$b <- gsub("^9606\\.", "", STRINGedges$b)
-
-head(STRINGedges)
-
-
-# =    2  Functional Edges in the Human Proteome  ==============================
-
-
-# There are many possibilities to explore interesting aspects of biological
-# networks, we will keep with some very simple procedures here but you have
-# to be aware that this is barely scratching the surface of possibilities.
-# However, once the network exists in your computer, it is comparatively
-# easy to find information online about the many, many options to analyze.
-
-
-# Make a graph from this dataframe
-?igraph::graph_from_data_frame
-
-gSTR <- igraph::graph_from_data_frame(STRINGedges, directed = FALSE)
-
-# CAUTION you DON'T want to plot a graph with 8,000 nodes and 50,000 edges -
-# layout of such large graphs is possible, but requires specialized code. Google
-# for  if you are curious. Also, consider what one can
-# really learn from plotting such a graph ...
-
-# Of course simple computations on this graph are reasonably fast:
-
-compSTR <- igraph::components(gSTR)
-summary(compSTR) # our graph is fully connected!
-
-hist(log(igraph::degree(gSTR)), col="#FEE0AF")
-# this actually does look rather scale-free
-
-(freqRank <- table(igraph::degree(gSTR)))
-plot(log10(as.numeric(names(freqRank)) + 1),
-     log10(as.numeric(freqRank)), type = "b",
-     pch = 21, bg = "#FEE0AF",
-     xlab = "log(Rank)", ylab = "log(frequency)",
-     main = "8,400 nodes from the human functional interaction network")
-
-# This looks very scale-free indeed.
-
-(regressionLine <- lm(log10(as.numeric(freqRank)) ~
-                      log10(as.numeric(names(freqRank)) + 1)))
-abline(regressionLine, col = "firebrick")
-
-# Now explore some more:
-
-# ==   2.1  Cliques  ===========================================================
-
-# Let's find the largest cliques. Remember: a clique is a fully connected
-# subgraph, i.e. a subgraph in which every node is connected to every other.
-# Biological complexes often appear as cliques in interaction graphs.
-
-igraph::clique_num(gSTR)
-# The largest clique has 81 members.
-
-(C <- igraph::largest_cliques(gSTR)[[1]])
-
-# Pick one of the proteins and find out what this fully connected cluster of 81
-# proteins is (you can simply Google for any of the IDs). Is this expected?
-
-# Plot this ...
-R <- igraph::induced_subgraph(gSTR, C) # a graph from a selected set of vertices
-
-# color the vertices along a color spectrum
-vCol <- rainbow(igraph::gorder(R)) # "order" of a graph == number of nodes
-
-# color the edges to have the same color as the originating node
-eCol <- character()
-for (i in seq_along(vCol)) {
-  eCol <- c(eCol, rep(vCol[i], igraph::gorder(R)))
-}
-
-oPar <- par(mar= rep(0,4)) # Turn margins off
-plot(R,
-     layout = igraph::layout_in_circle(R),
-     vertex.size = 3,
-     vertex.color = vCol,
-     edge.color = eCol,
-     edge.width = 0.1,
-     vertex.label = NA)
-par(oPar)
-
-# ... well: remember: a clique means every node is connected to every other
-# node. We have 81 * 81 = 6,561 edges. This is what a matrix model of PPI
-# networks looks like for large complexes.
-
-
-# ==   2.2  Communities  =======================================================
-
-set.seed(112358)                       # set RNG seed for repeatable randomness
-gSTRclusters <- igraph::cluster_infomap(gSTR)
-set.seed(NULL)                         # reset the RNG
-
-igraph::modularity(gSTRclusters) # ... measures how separated the different
-                                 # membership types are from each other
-tMem <- table(igraph::membership(gSTRclusters))
-length(tMem)  # About 700 communities identified
-hist(tMem, breaks = 50, col = "skyblue")  # most clusters are small ...
-range(tMem) # ... but one has > 200 members
-
-
-# ==   2.3  Betweenness Centrality  ============================================
-
-# Let's find the nodes with the 10 - highest betweenness centralities.
-#
-BC <- igraph::centr_betw(gSTR)
-
-# remember: BC$res contains the results
-head(BC$res)
-
-BC$res[1]   # betweenness centrality of node 1 in the graph ...
-# ... which one is node 1?
-igraph::V(gSTR)[1]
-
-# to get the ten-highest nodes, we simply label the elements of BC with their
-# index ...
-names(BC$res) <- as.character(1:length(BC$res))
-
-# ... and then we sort:
-sBC <- sort(BC$res, decreasing = TRUE)
-head(sBC)
-
-# This ordered vector means: node 3 has the highest betweenness centrality,
-# node 721 has the second highest, etc.
-
-(BCsel <- as.numeric(names(sBC)[1:10]))
-
-# We can use the first ten labels to subset the nodes in gSTR and fetch the
-# IDs...
-(ENSPsel <- names(igraph::V(gSTR)[BCsel]))
-
-# Task:
-# =====
-# IMPORTANT, IF YOU INTEND TO SUBMIT YOUR ANALYSIS FOR CREDIT
-# We are going to use these IDs to produce some output for a submitted task:
-# therefore I need you to execute the following line, note the "seal" that this
-# returns, and not change myENSPsel later:
-
-myENSPsel <- selectENSP(ENSPsel)
-
-#  Next, to find what these proteins are...
-
-# We could now Google for all of these IDs to learn more about them. But really,
-# googling for IDs one after the other, that would be lame. Let's instead use
-# the very, very useful biomaRt package to translate these Ensemble IDs into
-# gene symbols.
-
-
-# =    3  biomaRt  =============================================================
-
-
-# IDs are just labels, but for _bio_informatics we need to learn more about the
-# biological function of the genes or proteins that we retrieve via graph data
-# mining. biomaRt is the tool of choice. It's a package distributed by the
-# bioconductor project. This here is not a biomaRt tutorial (that's for another
-# day), simply a few lines of sample code to get you started on the specific use
-# case of retrieving descriptions for ensembl protein IDs.
-
-if (! requireNamespace("BiocManager", quietly = TRUE)) {
-  install.packages("BiocManager")
-}
-if (! requireNamespace("biomaRt", quietly = TRUE)) {
-  BiocManager::install("biomaRt")
-}
-# Package information:
-#  library(help = biomaRt)       # basic information
-#  browseVignettes("biomaRt")    # available vignettes
-#  data(package = "biomaRt")     # available datasets
-
-# define which dataset to use ... this takes a while for download
-myMart <- biomaRt::useMart("ensembl", dataset="hsapiens_gene_ensembl")
-
-# what filters are defined?
-( filters <- biomaRt::listFilters(myMart) )
-
-
-# and what attributes can we filter for?
-( attributes <- biomaRt::listAttributes(myMart) )
-
-
-# Soooo many options - let's look for the correct name of filters that are
-# useful for ENSP IDs ...
-filters[grep("ENSP", filters$description), ]
-
-# ... and the correct attribute names for gene symbols and descriptions ...
-attributes[grep("symbol", attributes$description, ignore.case = TRUE), ]
-attributes[grep("description", attributes$description, ignore.case = TRUE), ]
-
-
-# ... so we can put this together: here is a syntax example:
-biomaRt::getBM(filters = "ensembl_peptide_id",
-               attributes = c("hgnc_symbol",
-                              "wikigene_description",
-                              "interpro_description",
-                              "phenotype_description"),
-               values = "ENSP00000000442",
-               mart = myMart)
-
-# A simple loop will now get us the information for our 10 most central genes
-# from the human subset of STRING.
-
-CPdefs <- list()  # Since we don't know how many matches one of our queries
-# will return, we'll put the result dataframes into a list.
-
-for (ID in myENSPsel) {
-  CPdefs[[ID]] <- biomaRt::getBM(filters = "ensembl_peptide_id",
-                                 attributes = c("hgnc_symbol",
-                                                "wikigene_description",
-                                                "interpro_description",
-                                                "phenotype_description"),
-                                 values = ID,
-                                 mart = myMart)
-}
-
-
-# So what are the proteins with the ten highest betweenness centralities?
-#  ... are you surprised? (I am! Really.)
-
-
-# =    4  Task for submission  =================================================
-
-# Write a loop that will go through your personalized list of Ensemble IDs and
-#    for each ID:
-#    --  print the ID,
-#    --  print the first row's HGNC symbol,
-#    --  print the first row's wikigene description.
-#    --  print the first row's phenotype.
-#
-# Write your thoughts about this group of genes.
-#
-# (Hint, you can structure your loop in the same way as the loop that
-# created CPdefs. )
-
-# Submit the "seal" for your ENSP vector, the ENSP vector itself, the R code
-# for this loop and its output into your report if you are submitting
-# anything for credit for this unit. Please read the requirements carefully.
-
-
-
-
-# [END]
+# tocID <- "BIN-PPI-Analysis.R"
+#
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-PPI-Analysis unit.
+#
+# Version:   1.4
+#
+# Date:     2017-08  -  2020-10
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.4    Update vector ID's for betweenness centrality.
+#           1.3    Bugfix: called the wrong function on ENSPsel in l. 220
+#           1.2    2020 Updates; Rewrite for new STRINg V11;
+#                  Deprecate save()/load() for saveRDS()/readRDS()
+#           1.1    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#                      use Biocmanager:: not biocLite()
+#           1.0    First live version
+#           0.1    First code copied from 2016 material.
+#
+# TODO:
+#
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC>
+#TOC>   Section  Title                                           Line
+#TOC> ---------------------------------------------------------------
+#TOC>   1        Setup and data                                    50
+#TOC>   2        Functional Edges in the Human Proteome            86
+#TOC>   2.1        Cliques                                        129
+#TOC>   2.2        Communities                                    170
+#TOC>   2.3        Betweenness Centrality                         184
+#TOC>   3        biomaRt                                          231
+#TOC>   4        Task for submission                              302
+#TOC>
+#TOC> ==========================================================================
+
+
+# =    1  Setup and data  ======================================================
+
+
+# Not surprisingly, the analysis of PPI networks needs iGraph:
+
+if (! requireNamespace("igraph", quietly = TRUE)) {
+  install.packages("igraph")
+}
+# Package information:
+#  library(help = igraph)       # basic information
+#  browseVignettes("igraph")    # available vignettes
+#  data(package = "igraph")     # available datasets
+
+# In order for you to explore some real, biological networks, I give you a
+# dataframe of functional relationships of human proteins that I have downloaded
+# from the STRING database. The full table has 8.5 million records, here is a
+# subset of records with combined confidence scores > 980
+
+# The selected set of edges with a confidence of > 964 is a dataframe with about
+# 50,000 edges and 8,400 unique proteins. Incidentaly, that's about the size of
+# a fungal proteome. You can load the saved dataframe here (To read more about
+# what the scores mean, see http://www.ncbi.nlm.nih.gov/pubmed/15608232 ).
+
+STRINGedges <- readRDS("./data/STRINGedges.rds")
+
+head(STRINGedges)
+
+# Note that STRING has appended the tax-ID for Homo sapiens - 9606 - to the
+# Ensemble transcript identifiers that start with ENSP. We'll remove them:
+
+STRINGedges$a <- gsub("^9606\\.", "", STRINGedges$a)
+STRINGedges$b <- gsub("^9606\\.", "", STRINGedges$b)
+
+head(STRINGedges)
+
+
+# =    2  Functional Edges in the Human Proteome  ==============================
+
+
+# There are many possibilities to explore interesting aspects of biological
+# networks, we will keep with some very simple procedures here but you have
+# to be aware that this is barely scratching the surface of possibilities.
+# However, once the network exists in your computer, it is comparatively
+# easy to find information online about the many, many options to analyze.
+
+
+# Make a graph from this dataframe
+?igraph::graph_from_data_frame
+
+gSTR <- igraph::graph_from_data_frame(STRINGedges, directed = FALSE)
+
+# CAUTION you DON'T want to plot a graph with 8,000 nodes and 50,000 edges -
+# layout of such large graphs is possible, but requires specialized code. Google
+# for  if you are curious. Also, consider what one can
+# really learn from plotting such a graph ...
+
+# Of course simple computations on this graph are reasonably fast:
+
+compSTR <- igraph::components(gSTR)
+summary(compSTR) # our graph is fully connected!
+
+hist(log(igraph::degree(gSTR)), col="#FEE0AF")
+# this actually does look rather scale-free
+
+(freqRank <- table(igraph::degree(gSTR)))
+plot(log10(as.numeric(names(freqRank)) + 1),
+     log10(as.numeric(freqRank)), type = "b",
+     pch = 21, bg = "#FEE0AF",
+     xlab = "log(Rank)", ylab = "log(frequency)",
+     main = "8,400 nodes from the human functional interaction network")
+
+# This looks very scale-free indeed.
+
+(regressionLine <- lm(log10(as.numeric(freqRank)) ~
+                      log10(as.numeric(names(freqRank)) + 1)))
+abline(regressionLine, col = "firebrick")
+
+# Now explore some more:
+
+# ==   2.1  Cliques  ===========================================================
+
+# Let's find the largest cliques. Remember: a clique is a fully connected
+# subgraph, i.e. a subgraph in which every node is connected to every other.
+# Biological complexes often appear as cliques in interaction graphs.
+
+igraph::clique_num(gSTR)
+# The largest clique has 81 members.
+
+(C <- igraph::largest_cliques(gSTR)[[1]])
+
+# Pick one of the proteins and find out what this fully connected cluster of 81
+# proteins is (you can simply Google for any of the IDs). Is this expected?
+
+# Plot this ...
+R <- igraph::induced_subgraph(gSTR, C) # a graph from a selected set of vertices
+
+# color the vertices along a color spectrum
+vCol <- rainbow(igraph::gorder(R)) # "order" of a graph == number of nodes
+
+# color the edges to have the same color as the originating node
+eCol <- character()
+for (i in seq_along(vCol)) {
+  eCol <- c(eCol, rep(vCol[i], igraph::gorder(R)))
+}
+
+oPar <- par(mar= rep(0,4)) # Turn margins off
+plot(R,
+     layout = igraph::layout_in_circle(R),
+     vertex.size = 3,
+     vertex.color = vCol,
+     edge.color = eCol,
+     edge.width = 0.1,
+     vertex.label = NA)
+par(oPar)
+
+# ... well: remember: a clique means every node is connected to every other
+# node. We have 81 * 81 = 6,561 edges. This is what a matrix model of PPI
+# networks looks like for large complexes.
+
+
+# ==   2.2  Communities  =======================================================
+
+set.seed(112358)                       # set RNG seed for repeatable randomness
+gSTRclusters <- igraph::cluster_infomap(gSTR)
+set.seed(NULL)                         # reset the RNG
+
+igraph::modularity(gSTRclusters) # ... measures how separated the different
+                                 # membership types are from each other
+tMem <- table(igraph::membership(gSTRclusters))
+length(tMem)  # About 700 communities identified
+hist(tMem, breaks = 50, col = "skyblue")  # most clusters are small ...
+range(tMem) # ... but one has > 200 members
+
+
+# ==   2.3  Betweenness Centrality  ============================================
+
+# Let's find the nodes with the 10 - highest betweenness centralities.
+#
+BC <- igraph::centr_betw(gSTR)
+
+# remember: BC$res contains the results
+head(BC$res)
+
+BC$res[1]   # betweenness centrality of node 1 in the graph ...
+# ... which one is node 1?
+igraph::V(gSTR)[1]
+
+# to get the ten-highest nodes, we simply label the elements of BC with their
+# index ...
+names(BC$res) <- as.character(1:length(BC$res))
+
+# ... and then we sort:
+sBC <- sort(BC$res, decreasing = TRUE)
+head(sBC)
+
+# This ordered vector means: node 3 has the highest betweenness centrality,
+# node 721 has the second highest, etc.
+
+(BCsel <- as.numeric(names(sBC)[1:10]))
+
+# We can use the first ten labels to subset the nodes in gSTR and fetch the
+# IDs...
+(ENSPsel <- names(igraph::V(gSTR)[BCsel]))
+
+# Task:
+# =====
+# IMPORTANT, IF YOU INTEND TO SUBMIT YOUR ANALYSIS FOR CREDIT
+# We are going to use these IDs to produce some output for a submitted task:
+# therefore I need you to execute the following line, note the "seal" that this
+# returns, and not change myENSPsel later:
+
+myENSPsel <- selectENSP(ENSPsel)
+
+#  Next, to find what these proteins are...
+
+# We could now Google for all of these IDs to learn more about them. But really,
+# googling for IDs one after the other, that would be lame. Let's instead use
+# the very, very useful biomaRt package to translate these Ensemble IDs into
+# gene symbols.
+
+
+# =    3  biomaRt  =============================================================
+
+
+# IDs are just labels, but for _bio_informatics we need to learn more about the
+# biological function of the genes or proteins that we retrieve via graph data
+# mining. biomaRt is the tool of choice. It's a package distributed by the
+# bioconductor project. This here is not a biomaRt tutorial (that's for another
+# day), simply a few lines of sample code to get you started on the specific use
+# case of retrieving descriptions for ensembl protein IDs.
+
+if (! requireNamespace("BiocManager", quietly = TRUE)) {
+  install.packages("BiocManager")
+}
+if (! requireNamespace("biomaRt", quietly = TRUE)) {
+  BiocManager::install("biomaRt")
+}
+# Package information:
+#  library(help = biomaRt)       # basic information
+#  browseVignettes("biomaRt")    # available vignettes
+#  data(package = "biomaRt")     # available datasets
+
+# define which dataset to use ... this takes a while for download
+myMart <- biomaRt::useMart("ensembl", dataset="hsapiens_gene_ensembl")
+
+# what filters are defined?
+( filters <- biomaRt::listFilters(myMart) )
+
+
+# and what attributes can we filter for?
+( attributes <- biomaRt::listAttributes(myMart) )
+
+
+# Soooo many options - let's look for the correct name of filters that are
+# useful for ENSP IDs ...
+filters[grep("ENSP", filters$description), ]
+
+# ... and the correct attribute names for gene symbols and descriptions ...
+attributes[grep("symbol", attributes$description, ignore.case = TRUE), ]
+attributes[grep("description", attributes$description, ignore.case = TRUE), ]
+
+
+# ... so we can put this together: here is a syntax example:
+biomaRt::getBM(filters = "ensembl_peptide_id",
+               attributes = c("hgnc_symbol",
+                              "wikigene_description",
+                              "interpro_description",
+                              "phenotype_description"),
+               values = "ENSP00000000442",
+               mart = myMart)
+
+# A simple loop will now get us the information for our 10 most central genes
+# from the human subset of STRING.
+
+CPdefs <- list()  # Since we don't know how many matches one of our queries
+# will return, we'll put the result dataframes into a list.
+
+for (ID in myENSPsel) {
+  CPdefs[[ID]] <- biomaRt::getBM(filters = "ensembl_peptide_id",
+                                 attributes = c("hgnc_symbol",
+                                                "wikigene_description",
+                                                "interpro_description",
+                                                "phenotype_description"),
+                                 values = ID,
+                                 mart = myMart)
+}
+
+
+# So what are the proteins with the ten highest betweenness centralities?
+#  ... are you surprised? (I am! Really.)
+
+
+# =    4  Task for submission  =================================================
+
+# Write a loop that will go through your personalized list of Ensemble IDs and
+#    for each ID:
+#    --  print the ID,
+#    --  print the first row's HGNC symbol,
+#    --  print the first row's wikigene description.
+#    --  print the first row's phenotype.
+#
+# Write your thoughts about this group of genes.
+#
+# (Hint, you can structure your loop in the same way as the loop that
+# created CPdefs. )
+
+# Submit the "seal" for your ENSP vector, the ENSP vector itself, the R code
+# for this loop and its output into your report if you are submitting
+# anything for credit for this unit. Please read the requirements carefully.
+
+
+
+
+# [END]
diff --git a/BIN-SEQA-Composition.R b/BIN-SEQA-Composition.R
index cb0d111..f33b965 100644
--- a/BIN-SEQA-Composition.R
+++ b/BIN-SEQA-Composition.R
@@ -1,252 +1,252 @@
-# tocID <- "BIN-SEQA-Composition.R"
-#
-# Purpose: A Bioinformatics Course:
-#              R code accompanying the BIN-SEQA-Comparison unit
-#
-# Version: 1.2
-#
-# Date:    2017-11  -  2020-09
-# Author:  Boris Steipe (boris.steipe@utoronto.ca)
-#
-#           1.2    2020 Maintenance
-#           1.1    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#                      use Biocmanager:: not biocLite()
-# Versions:
-#           1.0    First live version 2017
-#           0.1    First code copied from BCH441_A03_makeYFOlist.R
-#
-# TODO:
-#
-#
-# == HOW TO WORK WITH LEARNING UNIT FILES ======================================
-#
-# DO NOT SIMPLY  source()  THESE FILES!
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-#  going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC> 
-#TOC>   Section  Title                                      Line
-#TOC> ----------------------------------------------------------
-#TOC>   1        Preparation                                  48
-#TOC>   2        Aggregate properties                         69
-#TOC>   3        Sequence Composition Enrichment             113
-#TOC>   3.1        Barplot, and side-by-side barplot         136
-#TOC>   3.2        Plotting ratios                           171
-#TOC>   3.3        Plotting log ratios                       188
-#TOC>   3.4        Sort by frequency                         204
-#TOC>   3.5        Color by amino acid type                  221
-#TOC> 
-#TOC> ==========================================================================
-
-
-# =    1  Preparation  =========================================================
-
-if (! requireNamespace("seqinr", quietly = TRUE)) {
-  install.packages("seqinr")
-}
-# Package information:
-#  library(help = seqinr)       # basic information
-#  browseVignettes("seqinr")    # available vignettes
-#  data(package = "seqinr")     # available datasets
-
-# Load a reference sequence to work with:
-
-# If you have done the BIN-Storing_data unit:
-   source("makeProteinDB.R")
-   sel <- which(myDB$protein$name == sprintf("MBP1_%s", biCode(MYSPE)))
-   mySeq <- myDB$protein$sequence[sel]
-
-# If not, use the yeast Mbp1 sequence:
-   mySeq <- dbSanitizeSequence(fromJSON("./data/MBP1_SACCE.json")$sequence)
-
-
-# =    2  Aggregate properties  ================================================
-
-
-# Let's try a simple function from seqinr: computing the pI of the sequence
-?seqinr::computePI
-
-# This takes as input a vector of upper-case AA codes
-
-# We can use the function strsplit() to split the string
-# into single characters
-
-(s <- strsplit(mySeq, "")) # splitting on the empty spring
-                           # splits into single characters
-s <- unlist(s)             # strsplit() returns a list! Why?
-                           # (But we don't need a list now...)
-
-# Alternatively, seqinr provides
-# the function s2c() to convert strings into
-# character vectors (and c2s to convert them back).
-
-seqinr::s2c(mySeq)
-
-
-seqinr::computePI(seqinr::s2c(mySeq))  # isoelectric point
-seqinr::pmw(seqinr::s2c(mySeq))        # molecular weight
-seqinr::AAstat(seqinr::s2c(mySeq))     # This also plots the distribution of
-                                       # values along the sequence
-
-# A true Labor of Love has gone into the
-# compilation of the "aaindex" data:
-
-?seqinr::aaindex
-data(aaindex, package = "seqinr")  # "attach" the dataset - i.e. make it
-                                   # accessible as an R object
-
-length(aaindex)  # no seqinr:: needed for the dataset since we just
-                 # "attached" it with data()
-
-# Here are all the index descriptions
-for (i in 1:length(aaindex)) {
-  cat(paste(i, ": ", aaindex[[i]]$D, "\n", sep=""))
-}
-
-
-# =    3  Sequence Composition Enrichment  =====================================
-
-
-# Lets use one of the indices to calculate and plot amino-acid
-# composition enrichment:
-aaindex[[459]]$D
-
-#
-# Let's construct an enrichment plot to compare average frequencies
-# with the amino acid counts in our sequence.
-
-(refData <- aaindex[[459]]$I)                # reference frequencies in %
-names(refData) <- seqinr::a(names(refData))  # change names to single-letter
-                                             # code using seqinr's "a()" function
-sum(refData)
-refData        # ... in %
-
-
-# tabulate the amino acid counts in mySeq
-(obsData <- table(seqinr::s2c(mySeq)))        # counts
-(obsData <- 100 * (obsData / sum(obsData)))   # frequencies
-
-
-# ==   3.1  Barplot, and side-by-side barplot  =================================
-
-barplot(obsData, col = "#CCCCCC", cex.names = 0.7)
-abline(h = 100/20, col="#BB0000")
-
-barplot(refData, col = "#BB0000", cex.names = 0.7)
-abline(h = 100/20, col="#555555")
-
-# Ok: first problem - the values in obsData are in alphabetical order. But the
-# values in refData are in alphabetical order of amino acid name: alanine,
-# arginine, asparagine, aspartic acid ... A, R, N, D, E ... you will see this
-# order a lot - one of the old biochemistry tropes in the field. So we need to
-# re-order one of the vectors to match the other. That's easy though:
-refData
-(refData <- refData[names(obsData)])
-
-barplot(refData, col = "#BB0000", cex.names = 0.7)
-abline(h = 100/20, col="#555555")
-
-# To compare the values, we want to see them in a barplot, side-by-side ...
-barplot(rbind(obsData, refData),
-        ylim = c(0, 12),
-        beside = TRUE,
-        col = c("#CCCCCC", "#BB0000"),
-        cex.names = 0.7)
-abline(h = 100/20, col="#00000044")
-
-# ... and add a legend
-legend (x = 1, y = 12,
-        legend = c("mySeq", "Average composition"),
-        fill = c("#CCCCCC", "#BB0000"),
-        cex = 0.7,
-        bty = "n")
-
-
-# ==   3.2  Plotting ratios  ===================================================
-
-# To better compare the values, we'll calculate ratios between
-# obsData and refData
-
-barplot(obsData / refData,
-        col = "#CCCCCC",
-        ylab = "Sequence / Average",
-        ylim = c(0, 2.5),
-        cex.names = 0.7)
-abline(h = 1, col="#BB0000")
-abline(h = c(1/2, 2), lty = 2, col="#BB000055")
-
-# ... but  ratios are not very good here, since the difference in height on the
-# plot now depends on the order we compare in: ratios of 1/2 and 2 (dotted
-# lines) are exactly the same fold-difference !
-
-# ==   3.3  Plotting log ratios  ===============================================
-
-# A better way to display this
-# is to plot log(ratios).
-
-barplot(log(obsData / refData),
-        col = "#CCCCCC",
-        ylab = "log(Sequence / Average)",
-        ylim = log(c(1/3, 3)),
-        cex.names = 0.7)
-abline(h = log(1), col="#BB0000")
-abline(h = log(c(1/2, 2)), lty = 2, col="#BB000055")
-
-# Note how the two-fold difference lines are now the same distance from the
-# line of equal ratio.
-
-# ==   3.4  Sort by frequency  =================================================
-
-barplot(sort(log(obsData / refData), decreasing = TRUE),
-        ylim = log(c(1/3, 3)),
-        col = "#CCCCCC",
-        ylab = "log(Sequence / Average)",
-        cex.names = 0.7)
-abline(h = log(1), col="#BB0000")
-abline(h = log(c(1/2, 2)), lty = 2, col="#BB000055")
-
-yTxt <- log(0.9)
-arrows(4, yTxt, 0, yTxt, length = 0.07)
-text(5.5, yTxt, "Enriched", cex = 0.7)
-yTxt <- log(1.1)
-arrows(20, yTxt, 24, yTxt, length = 0.07)
-text(19.5, yTxt, "Depleted", pos = 2, cex = 0.7)
-
-# ==   3.5  Color by amino acid type  ==========================================
-
-# Color the bars by amino acid type. Use AACOLS , defined in the .utilities.R
-# script, or define your own.
-
-barplot(rep(1, 20), names.arg = names(AACOLS), col = AACOLS, cex.names = 0.5)
-
-lR <- sort(log(obsData / refData), decreasing = TRUE)
-barplot(lR,
-        ylim = log(c(1/3, 3)),
-        col = AACOLS[names(lR)],
-        ylab = "log(Sequence / Average)",
-        cex.names = 0.7)
-abline(h = log(1), col="#00000055")
-abline(h = log(c(1/2, 2)), lty = 2, col="#00000033")
-
-yTxt <- log(0.9)
-arrows(4, yTxt, 0, yTxt, length = 0.07)
-text(5.5, yTxt, "Enriched", cex = 0.7)
-yTxt <- log(1.1)
-arrows(20, yTxt, 24, yTxt, length = 0.07)
-text(19.5, yTxt, "Depleted", pos = 2, cex = 0.7)
-
-
-# Task:
-#   Interpret this plot. (Can you?) Which types of amino acids are enriched?
-#   Depleted?
-
-
-
-
-# [END]
+# tocID <- "BIN-SEQA-Composition.R"
+#
+# Purpose: A Bioinformatics Course:
+#              R code accompanying the BIN-SEQA-Comparison unit
+#
+# Version: 1.2
+#
+# Date:    2017-11  -  2020-09
+# Author:  Boris Steipe (boris.steipe@utoronto.ca)
+#
+#           1.2    2020 Maintenance
+#           1.1    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#                      use Biocmanager:: not biocLite()
+# Versions:
+#           1.0    First live version 2017
+#           0.1    First code copied from BCH441_A03_makeYFOlist.R
+#
+# TODO:
+#
+#
+# == HOW TO WORK WITH LEARNING UNIT FILES ======================================
+#
+# DO NOT SIMPLY  source()  THESE FILES!
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+#  going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC> 
+#TOC>   Section  Title                                      Line
+#TOC> ----------------------------------------------------------
+#TOC>   1        Preparation                                  48
+#TOC>   2        Aggregate properties                         69
+#TOC>   3        Sequence Composition Enrichment             113
+#TOC>   3.1        Barplot, and side-by-side barplot         136
+#TOC>   3.2        Plotting ratios                           171
+#TOC>   3.3        Plotting log ratios                       188
+#TOC>   3.4        Sort by frequency                         204
+#TOC>   3.5        Color by amino acid type                  221
+#TOC> 
+#TOC> ==========================================================================
+
+
+# =    1  Preparation  =========================================================
+
+if (! requireNamespace("seqinr", quietly = TRUE)) {
+  install.packages("seqinr")
+}
+# Package information:
+#  library(help = seqinr)       # basic information
+#  browseVignettes("seqinr")    # available vignettes
+#  data(package = "seqinr")     # available datasets
+
+# Load a reference sequence to work with:
+
+# If you have done the BIN-Storing_data unit:
+   source("makeProteinDB.R")
+   sel <- which(myDB$protein$name == sprintf("MBP1_%s", biCode(MYSPE)))
+   mySeq <- myDB$protein$sequence[sel]
+
+# If not, use the yeast Mbp1 sequence:
+   mySeq <- dbSanitizeSequence(fromJSON("./data/MBP1_SACCE.json")$sequence)
+
+
+# =    2  Aggregate properties  ================================================
+
+
+# Let's try a simple function from seqinr: computing the pI of the sequence
+?seqinr::computePI
+
+# This takes as input a vector of upper-case AA codes
+
+# We can use the function strsplit() to split the string
+# into single characters
+
+(s <- strsplit(mySeq, "")) # splitting on the empty spring
+                           # splits into single characters
+s <- unlist(s)             # strsplit() returns a list! Why?
+                           # (But we don't need a list now...)
+
+# Alternatively, seqinr provides
+# the function s2c() to convert strings into
+# character vectors (and c2s to convert them back).
+
+seqinr::s2c(mySeq)
+
+
+seqinr::computePI(seqinr::s2c(mySeq))  # isoelectric point
+seqinr::pmw(seqinr::s2c(mySeq))        # molecular weight
+seqinr::AAstat(seqinr::s2c(mySeq))     # This also plots the distribution of
+                                       # values along the sequence
+
+# A true Labor of Love has gone into the
+# compilation of the "aaindex" data:
+
+?seqinr::aaindex
+data(aaindex, package = "seqinr")  # "attach" the dataset - i.e. make it
+                                   # accessible as an R object
+
+length(aaindex)  # no seqinr:: needed for the dataset since we just
+                 # "attached" it with data()
+
+# Here are all the index descriptions
+for (i in 1:length(aaindex)) {
+  cat(paste(i, ": ", aaindex[[i]]$D, "\n", sep=""))
+}
+
+
+# =    3  Sequence Composition Enrichment  =====================================
+
+
+# Lets use one of the indices to calculate and plot amino-acid
+# composition enrichment:
+aaindex[[459]]$D
+
+#
+# Let's construct an enrichment plot to compare average frequencies
+# with the amino acid counts in our sequence.
+
+(refData <- aaindex[[459]]$I)                # reference frequencies in %
+names(refData) <- seqinr::a(names(refData))  # change names to single-letter
+                                             # code using seqinr's "a()" function
+sum(refData)
+refData        # ... in %
+
+
+# tabulate the amino acid counts in mySeq
+(obsData <- table(seqinr::s2c(mySeq)))        # counts
+(obsData <- 100 * (obsData / sum(obsData)))   # frequencies
+
+
+# ==   3.1  Barplot, and side-by-side barplot  =================================
+
+barplot(obsData, col = "#CCCCCC", cex.names = 0.7)
+abline(h = 100/20, col="#BB0000")
+
+barplot(refData, col = "#BB0000", cex.names = 0.7)
+abline(h = 100/20, col="#555555")
+
+# Ok: first problem - the values in obsData are in alphabetical order. But the
+# values in refData are in alphabetical order of amino acid name: alanine,
+# arginine, asparagine, aspartic acid ... A, R, N, D, E ... you will see this
+# order a lot - one of the old biochemistry tropes in the field. So we need to
+# re-order one of the vectors to match the other. That's easy though:
+refData
+(refData <- refData[names(obsData)])
+
+barplot(refData, col = "#BB0000", cex.names = 0.7)
+abline(h = 100/20, col="#555555")
+
+# To compare the values, we want to see them in a barplot, side-by-side ...
+barplot(rbind(obsData, refData),
+        ylim = c(0, 12),
+        beside = TRUE,
+        col = c("#CCCCCC", "#BB0000"),
+        cex.names = 0.7)
+abline(h = 100/20, col="#00000044")
+
+# ... and add a legend
+legend (x = 1, y = 12,
+        legend = c("mySeq", "Average composition"),
+        fill = c("#CCCCCC", "#BB0000"),
+        cex = 0.7,
+        bty = "n")
+
+
+# ==   3.2  Plotting ratios  ===================================================
+
+# To better compare the values, we'll calculate ratios between
+# obsData and refData
+
+barplot(obsData / refData,
+        col = "#CCCCCC",
+        ylab = "Sequence / Average",
+        ylim = c(0, 2.5),
+        cex.names = 0.7)
+abline(h = 1, col="#BB0000")
+abline(h = c(1/2, 2), lty = 2, col="#BB000055")
+
+# ... but  ratios are not very good here, since the difference in height on the
+# plot now depends on the order we compare in: ratios of 1/2 and 2 (dotted
+# lines) are exactly the same fold-difference !
+
+# ==   3.3  Plotting log ratios  ===============================================
+
+# A better way to display this
+# is to plot log(ratios).
+
+barplot(log(obsData / refData),
+        col = "#CCCCCC",
+        ylab = "log(Sequence / Average)",
+        ylim = log(c(1/3, 3)),
+        cex.names = 0.7)
+abline(h = log(1), col="#BB0000")
+abline(h = log(c(1/2, 2)), lty = 2, col="#BB000055")
+
+# Note how the two-fold difference lines are now the same distance from the
+# line of equal ratio.
+
+# ==   3.4  Sort by frequency  =================================================
+
+barplot(sort(log(obsData / refData), decreasing = TRUE),
+        ylim = log(c(1/3, 3)),
+        col = "#CCCCCC",
+        ylab = "log(Sequence / Average)",
+        cex.names = 0.7)
+abline(h = log(1), col="#BB0000")
+abline(h = log(c(1/2, 2)), lty = 2, col="#BB000055")
+
+yTxt <- log(0.9)
+arrows(4, yTxt, 0, yTxt, length = 0.07)
+text(5.5, yTxt, "Enriched", cex = 0.7)
+yTxt <- log(1.1)
+arrows(20, yTxt, 24, yTxt, length = 0.07)
+text(19.5, yTxt, "Depleted", pos = 2, cex = 0.7)
+
+# ==   3.5  Color by amino acid type  ==========================================
+
+# Color the bars by amino acid type. Use AACOLS , defined in the .utilities.R
+# script, or define your own.
+
+barplot(rep(1, 20), names.arg = names(AACOLS), col = AACOLS, cex.names = 0.5)
+
+lR <- sort(log(obsData / refData), decreasing = TRUE)
+barplot(lR,
+        ylim = log(c(1/3, 3)),
+        col = AACOLS[names(lR)],
+        ylab = "log(Sequence / Average)",
+        cex.names = 0.7)
+abline(h = log(1), col="#00000055")
+abline(h = log(c(1/2, 2)), lty = 2, col="#00000033")
+
+yTxt <- log(0.9)
+arrows(4, yTxt, 0, yTxt, length = 0.07)
+text(5.5, yTxt, "Enriched", cex = 0.7)
+yTxt <- log(1.1)
+arrows(20, yTxt, 24, yTxt, length = 0.07)
+text(19.5, yTxt, "Depleted", pos = 2, cex = 0.7)
+
+
+# Task:
+#   Interpret this plot. (Can you?) Which types of amino acids are enriched?
+#   Depleted?
+
+
+
+
+# [END]
diff --git a/BIN-Sequence.R b/BIN-Sequence.R
index 4ce3e51..ba5f627 100644
--- a/BIN-Sequence.R
+++ b/BIN-Sequence.R
@@ -1,394 +1,394 @@
-# tocID <- "BIN-Sequence.R"
-#
-# Purpose:  A Bioinformatics Course:
-#              R code accompanying the BIN-Sequence unit.
-#
-# Version:  1.5
-#
-# Date:     2017-09  - 2020-09
-# Author:   Boris Steipe (boris.steipe@utoronto.ca)
-#
-# Versions:
-#           1.5    2020 Updates
-#           1.4    Change from require() to requireNamespace(),
-#                      use ::() idiom throughout,
-#                      use Biocmanager:: not biocLite()
-#           1.3    Update set.seed() usage
-#           1.2    Removed irrelevant task. How did that even get in there? smh
-#           1.1    Add chartr()
-#           1.0    First live version 2017.
-#
-# TODO:
-#
-#
-# == DO NOT SIMPLY  source()  THIS FILE! =======================================
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-# going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC>
-#TOC>   Section  Title                                Line
-#TOC> ----------------------------------------------------
-#TOC>   1        Prepare                                63
-#TOC>   2        Storing Sequence                       80
-#TOC>   3        String properties                     109
-#TOC>   4        Substrings                            116
-#TOC>   5        Creating strings: sprintf()           137
-#TOC>   6        Changing strings                      172
-#TOC>   6.1.1          Changing case                   174
-#TOC>   6.1.2          Reverse                         179
-#TOC>   6.1.3          Change characters               183
-#TOC>   6.1.4          Substitute characters           211
-#TOC>   6.2        stringi and stringr                 231
-#TOC>   6.3        dbSanitizeSequence()                241
-#TOC>   7        Permuting and sampling                253
-#TOC>   7.1        Permutations                        260
-#TOC>   7.2        Sampling                            306
-#TOC>   7.2.1          Equiprobable characters         308
-#TOC>   7.2.2          Defined probability vector      350
-#TOC>
-#TOC> ==========================================================================
-
-
-# =    1  Prepare  =============================================================
-
-# Much basic sequence handling is supported by the Bioconductor package
-# Biostrings.
-
-if (! requireNamespace("BiocManager", quietly = TRUE)) {
-  install.packages("BiocManager")
-}
-if (! requireNamespace("Biostrings", quietly = TRUE)) {
-  BiocManager::install("Biostrings")
-}
-# Package information:
-#  library(help = Biostrings)       # basic information
-#  browseVignettes("Biostrings")    # available vignettes
-#  data(package = "Biostrings")     # available datasets
-
-
-# =    2  Storing Sequence  ====================================================
-
-
-# Sequences can be represented and stored as vectors of single characters ...
-(v <- c("D", "I", "V", "M", "T", "Q"))
-
-# ... as strings ...
-(s <- "DIVMTQ")
-
-# ... or as more complex objects with rich metadata e.g. as a Biostrings
-# DNAstring, RNAstring, AAString, etc.
-(a <- Biostrings::AAString("DIVMTQ"))
-
-# ... and all of these representations can be interconverted:
-
-# string to vector ...
-unlist(strsplit(s, ""))
-
-# vector to string ...
-paste(v, sep = "", collapse = "")
-
-# ... and AAstring to plain string.
-as.character(a)
-
-# Since operations with character vectors trivially follow all other vector
-# conventions and syntax, and we will look at Biostrings methods in more
-# detail in a later unit, we will focus on basic strings in the following.
-
-
-# =    3  String properties  ===================================================
-
-
-length(s) # why ???
-nchar(s)  # Aha!
-
-
-# =    4  Substrings  ==========================================================
-
-# Use the substr() function
-substr(s, 2, 4)
-
-# or the similar substring()
-substring(s, 2, 4)
-
-# Note: both functions are vectorized (i.e. they operate on vectors
-# of arguments, you don't need to loop over input)...
-myBiCodes <- c("HOMSA", "MUSMU", "FUGRU", "XENLA")
-substr(   myBiCodes, 1, 3)
-substring(myBiCodes, 1, 3)
-
-# ... however only substring() will also use vectors for start and stop
-s <- "gatattgtgatgacccagtaa"       # a DNA sequence
-(vI <- seq(1, nchar(s), by = 3))   # an index vector
-substr(   s, vI, vI+2)             # ... returns only the first nucleotide triplet
-substring(s, vI, vI+2)             # ... returns all triplets
-
-
-# =    5  Creating strings: sprintf()  =========================================
-
-
-# Sprintf is a very smart, very powerful function and has cognates in all
-# other programming languages. It has a bit of a  learning curve, but this is
-# totally worth it:
-# the function takes a format string, and a list of other arguments. It returns
-# a formatted string. Here are some examples - watch carefully for sprintf()
-# calls elsewhere in the code.
-
-sprintf("Just a string.")
-sprintf("A string and the number %d.", 5)
-sprintf("More numbers: %d ate %d.", 7, 9) # Sorry
-sprintf("Pi is ~ %1.2f ...", pi)
-sprintf("or more accurately ~ %1.11f.", pi)
-x <- "bottles of beer"
-N <- 99
-sprintf("%d %s on the wall, %d %s - \ntake %s: %d %s on the wall.",
-        N, x, N, x, "one down, and pass it around", N - 1, x)
-
-# Note that in the last example, the value of the string was displayed with
-# R's usual print-formatting function and therefore the line-break "\n" did
-# not actually break the line. To have line breaks, tabs etc, you need to use
-# cat() to display the string:
-
-for (i in N:(N-4)) {
-  cat(sprintf("%d %s on the wall, %d %s - \ntake %s: %d %s on the wall.\n\n",
-              i, x, i, x, "one down, and pass it around", i - 1, x))
-}
-
-# sprintf() is vectorized: if one of its parameters is a vector, it
-# will generate one output string for each of the vector's elements:
-cat(sprintf("\n%s fish", c("one", "two", "red", "blue")))
-
-
-# =    6  Changing strings  ====================================================
-
-# ===   6.1.1  Changing case
-tolower(s)
-toupper(tolower(s))
-
-
-# ===   6.1.2  Reverse
-# (This used to work in Biostrings, apparently it doesn't work anymore. Why?)
-# Biostrings::str_rev(s)
-# The following works, of course, but awkward:
-s
-paste0(rev(unlist(strsplit(s, ""))), collapse = "")
-
-# reverse complement
-COMP <- c("t", "g", "c", "a")
-names(COMP) <- c("a", "c", "g", "t")     # mapping the complement via names
-s
-paste0(COMP[rev(unlist(strsplit(s, "")))], collapse = "")
-
-
-# ===   6.1.3  Change characters
-# chartr(old, new, x) maps all characters in x that appear in "old" to the
-# correpsonding character in "new." Kind of like the COMP vector above ...
-
-chartr("aeio", "uuuu", "We hold these truths to be self-evident ...")
-
-# One could implement toupper() and tolower() with this - remember that R has
-# character vectors of uppercase and lowercase letters as language constants.
-chartr(paste0(letters, collapse = ""),
-       paste0(LETTERS, collapse = ""),
-       "Twinkle, twinkle little star, how I wonder what you are.")
-
-# One amusing way to use the function  is for a reversible substitution
-# cypher.
-alBet <- "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz .,;:?0123456789"
-set.seed(112358)                       # set RNG seed for repeatable randomness
-( myCypher <- paste0(sample(unlist(strsplit(alBet, ""))), collapse = "") )
-set.seed(NULL)                         # reset the RNG
-
-# encode ...
-(x <- chartr(alBet, myCypher, "... seven for a secret, never to be told."))
-
-# decode ...
-chartr(myCypher, alBet, x)
-# (Nb. substitution cyphers are easy to crack!)
-
-
-# ===   6.1.4  Substitute characters
-# gsub can change lengths.
-#   Example: implementing the binary Fibonacci sequence:
-#   0 -> 1; 1 -> 10 , in three nested gsub() statements
-( s <- 1 )
-( s <- gsub("2", "10", gsub("0", "1", gsub("1", "2", s))) )
-
-# Iterate this line a few times ...
-#
-# cf. http://www.maths.surrey.ac.uk/hosted-sites/R.Knott/Fibonacci/fibrab.html
-# for the features of the sequence.
-
-# I use gsub() often to delete unwanted characters ...
-# ... select something, and substitute the empty string for it.
-(s <- gsub("-", "", s))
-
-# For example: clean up a sequence
-# copy/paste from UniProt
-(s <- "        10         20         30         40         50
-MSNQIYSARY SGVDVYEFIH STGSIMKRKK DDWVNATHIL KAANFAKAKR ")
-
-
-# remove numbers
-(s <- gsub("[0-9]", "", s))
-
-# remove "whitespace" (spaces, tabs, line breaks)...
-(s <- gsub("\\s", "", s))
-
-# ==   6.2  stringi and stringr  ===============================================
-
-# But there are also specialized functions eg. to remove leading/trailing
-# whitespace which may be important to sanitize user input etc. Have a look at
-# the function descriptions for the stringr and the stringi package. stringr is
-# part of the tidyverse, and for the most part a wrapper for stringi functions.
-# https://github.com/tidyverse/stringr
-
-
-
-# ==   6.3  dbSanitizeSequence()  ==============================================
-
-# In our learning units, we use a function dbSanitizeSequence() to clean up
-# sequences that may be copy/pasted from Web-sources
-
-cat( s <- ">FASTA header will be removed
-10         20         30         40         50
-MSNQIYSARY SGVDVYEFIH STGSIMKRKK DDWVNATHIL KAANFAKAKR " )
-
-dbSanitizeSequence(s)
-
-
-# =    7  Permuting and sampling  ==============================================
-
-
-# An important aspect of working with strings is generating random strings
-# with given statistical properties: reference items to evaluate significance.
-
-
-# ==   7.1  Permutations  ======================================================
-
-
-# One way to produce such reference items is to permute a string. A permuted
-# string has the same composition as the original, but all positional
-# information is lost. The sample() function can be used to permute:
-
-# This is the sequence of the ompA secretion signal
-(s <- unlist(strsplit("MKKTAIAVALAGFATVAQA", "")))
-
-(x <- sample(s, length(s)))  # permuted
-
-# Here's a small example how such permuted strings may be useful. As you look
-# at the ompA sequence, you suspect that the two lysines near the +-charged
-# N-terminus may not be accidental, but selected for a positively charged
-# N-terminus. What is the chance that such a sequence has two lysines close to
-# the N-terminus simply by chance? Or put differently: what is the average
-# distance of two lysines in such a sequence to the N-terminus. First, we
-# need an expression that measures the distance. A simple use of the which()
-# function will do just fine.
-
-which(s == "K")        # shows they are in position 2 and 3, so ...
-mean(which(s == "K"))  # ... gives us the average, and ...
-mean(which(x == "K"))  # ... gives us the average of the permuted sequence.
-
-# So what does the distribution look like? Lets do 10,000 trials.
-
-(s <- unlist(strsplit("MKKTAIAVALAGFATVAQA", "")))
-N <- 10000
-d <- numeric(N)
-
-set.seed(112358)                       # set RNG seed for repeatable randomness
-for (i in 1:N) {
-  d[i] <- mean(which(sample(s, length(s)) == "K"))
-}
-set.seed(NULL)                         # reset the RNG
-
-hist(d, breaks = 20)
-abline(v = 2.5, lwd = 2, col = "firebrick")
-sum(d <= 2.5) # 276. 276 of our 10000 samples are just as bunched near the
-              # N-terminus or more. That's just below the signifcance
-              # threshold of 5 %. It's a trend, but to be sure we are looking
-              # at a biological effect we would need to see more
-              # sequences.
-
-
-# ==   7.2  Sampling  ==========================================================
-
-# ===   7.2.1  Equiprobable characters
-
-# Assume you need a large random-nucleotide string for some statistical model.
-# How to create such a string? sample() can easily create it:
-
-nuc <- c("A", "C", "G", "T")
-N <- 100
-
-set.seed(16818)                        # set RNG seed for repeatable randomness
-v <- sample(nuc, N, replace = TRUE)
-set.seed(NULL)                         # reset the RNG
-
-(mySeq <- paste(v, collapse = ""))
-
-# What's the GC content?
-table(v)
-sum(table(v)[c("G", "C")]) # 51 is close to expected
-
-# What's the number of CpG motifs? Easy to check with the stringi
-# stri_match_all() function
-
-if (! requireNamespace("stringi", quietly = TRUE)) {
-  install.packages("stringi")
-}
-# Package information:
-#  library(help = stringi)       # basic information
-#  browseVignettes("stringi")    # available vignettes
-#  data(package = "stringi")     # available datasets
-
-
-(x <- stringi::stri_match_all(mySeq, regex = "CG"))
-length(unlist(x))
-
-# Now you could compare that number with yeast DNA sequences, and determine
-# whether there are more or less CpG motifs than expected by chance.
-# (cf. https://en.wikipedia.org/wiki/CpG_site)
-# But hold on: is that a fair comparison? sample() gives us all four nucleotides
-# with the same probability. But the yeast genomic DNA GC content is only
-# 38%. So you would expect fewer CpG motifs based on the statistical properties
-# of the smaller number of Cs and Gs - before biology even comes into play. How
-# do we account for that?
-
-# ===   7.2.2  Defined probability vector
-
-# This is where we need to know how to create samples with specific probability
-# distributions. A crude hack would be to create a sampling source vector with
-# 19 C, 19 G, 31 A and 31 T
-c(rep("C", 19), rep("G", 19), rep(c("A"), 31), rep(c("T"), 31))
-# ... but that doesn't scale if the numeric accuracy needs to be higher.
-#
-# However sample() has an argument that takes care of that: you can explicitly
-# specify the probabilities with which each element of the the sampling vector
-# should be chosen:
-
-nuc <- c("A", "C", "G", "T")
-N <- 100
-myProb <- c(0.31, 0.19, 0.19, 0.31)    # sampling probabilities
-
-set.seed(16818)                       # set RNG seed for repeatable randomness
-v <- sample(nuc, N, prob = myProb, replace = TRUE)
-set.seed(NULL)                         # reset the RNG
-
-(mySeq <- paste(v, collapse = ""))
-
-# What's the GC content?
-table(v)
-sum(table(v)[c("G", "C")]) # Close to expected
-
-# What's the number of CpG motifs?
-(x <- stringi::stri_match_all(mySeq, regex = "CG"))
-# ... not a single one in this case.
-
-
-
-# [END]
+# tocID <- "BIN-Sequence.R"
+#
+# Purpose:  A Bioinformatics Course:
+#              R code accompanying the BIN-Sequence unit.
+#
+# Version:  1.5
+#
+# Date:     2017-09  - 2020-09
+# Author:   Boris Steipe (boris.steipe@utoronto.ca)
+#
+# Versions:
+#           1.5    2020 Updates
+#           1.4    Change from require() to requireNamespace(),
+#                      use ::() idiom throughout,
+#                      use Biocmanager:: not biocLite()
+#           1.3    Update set.seed() usage
+#           1.2    Removed irrelevant task. How did that even get in there? smh
+#           1.1    Add chartr()
+#           1.0    First live version 2017.
+#
+# TODO:
+#
+#
+# == DO NOT SIMPLY  source()  THIS FILE! =======================================
+#
+# If there are portions you don't understand, use R's help system, Google for an
+# answer, or ask your instructor. Don't continue if you don't understand what's
+# going on. That's not how it works ...
+#
+# ==============================================================================
+
+
+#TOC> ==========================================================================
+#TOC>
+#TOC>   Section  Title                                Line
+#TOC> ----------------------------------------------------
+#TOC>   1        Prepare                                63
+#TOC>   2        Storing Sequence                       80
+#TOC>   3        String properties                     109
+#TOC>   4        Substrings                            116
+#TOC>   5        Creating strings: sprintf()           137
+#TOC>   6        Changing strings                      172
+#TOC>   6.1.1          Changing case                   174
+#TOC>   6.1.2          Reverse                         179
+#TOC>   6.1.3          Change characters               183
+#TOC>   6.1.4          Substitute characters           211
+#TOC>   6.2        stringi and stringr                 231
+#TOC>   6.3        dbSanitizeSequence()                241
+#TOC>   7        Permuting and sampling                253
+#TOC>   7.1        Permutations                        260
+#TOC>   7.2        Sampling                            306
+#TOC>   7.2.1          Equiprobable characters         308
+#TOC>   7.2.2          Defined probability vector      350
+#TOC>
+#TOC> ==========================================================================
+
+
+# =    1  Prepare  =============================================================
+
+# Much basic sequence handling is supported by the Bioconductor package
+# Biostrings.
+
+if (! requireNamespace("BiocManager", quietly = TRUE)) {
+  install.packages("BiocManager")
+}
+if (! requireNamespace("Biostrings", quietly = TRUE)) {
+  BiocManager::install("Biostrings")
+}
+# Package information:
+#  library(help = Biostrings)       # basic information
+#  browseVignettes("Biostrings")    # available vignettes
+#  data(package = "Biostrings")     # available datasets
+
+
+# =    2  Storing Sequence  ====================================================
+
+
+# Sequences can be represented and stored as vectors of single characters ...
+(v <- c("D", "I", "V", "M", "T", "Q"))
+
+# ... as strings ...
+(s <- "DIVMTQ")
+
+# ... or as more complex objects with rich metadata e.g. as a Biostrings
+# DNAstring, RNAstring, AAString, etc.
+(a <- Biostrings::AAString("DIVMTQ"))
+
+# ... and all of these representations can be interconverted:
+
+# string to vector ...
+unlist(strsplit(s, ""))
+
+# vector to string ...
+paste(v, sep = "", collapse = "")
+
+# ... and AAstring to plain string.
+as.character(a)
+
+# Since operations with character vectors trivially follow all other vector
+# conventions and syntax, and we will look at Biostrings methods in more
+# detail in a later unit, we will focus on basic strings in the following.
+
+
+# =    3  String properties  ===================================================
+
+
+length(s) # why ???
+nchar(s)  # Aha!
+
+
+# =    4  Substrings  ==========================================================
+
+# Use the substr() function
+substr(s, 2, 4)
+
+# or the similar substring()
+substring(s, 2, 4)
+
+# Note: both functions are vectorized (i.e. they operate on vectors
+# of arguments, you don't need to loop over input)...
+myBiCodes <- c("HOMSA", "MUSMU", "FUGRU", "XENLA")
+substr(   myBiCodes, 1, 3)
+substring(myBiCodes, 1, 3)
+
+# ... however only substring() will also use vectors for start and stop
+s <- "gatattgtgatgacccagtaa"       # a DNA sequence
+(vI <- seq(1, nchar(s), by = 3))   # an index vector
+substr(   s, vI, vI+2)             # ... returns only the first nucleotide triplet
+substring(s, vI, vI+2)             # ... returns all triplets
+
+
+# =    5  Creating strings: sprintf()  =========================================
+
+
+# Sprintf is a very smart, very powerful function and has cognates in all
+# other programming languages. It has a bit of a  learning curve, but this is
+# totally worth it:
+# the function takes a format string, and a list of other arguments. It returns
+# a formatted string. Here are some examples - watch carefully for sprintf()
+# calls elsewhere in the code.
+
+sprintf("Just a string.")
+sprintf("A string and the number %d.", 5)
+sprintf("More numbers: %d ate %d.", 7, 9) # Sorry
+sprintf("Pi is ~ %1.2f ...", pi)
+sprintf("or more accurately ~ %1.11f.", pi)
+x <- "bottles of beer"
+N <- 99
+sprintf("%d %s on the wall, %d %s - \ntake %s: %d %s on the wall.",
+        N, x, N, x, "one down, and pass it around", N - 1, x)
+
+# Note that in the last example, the value of the string was displayed with
+# R's usual print-formatting function and therefore the line-break "\n" did
+# not actually break the line. To have line breaks, tabs etc, you need to use
+# cat() to display the string:
+
+for (i in N:(N-4)) {
+  cat(sprintf("%d %s on the wall, %d %s - \ntake %s: %d %s on the wall.\n\n",
+              i, x, i, x, "one down, and pass it around", i - 1, x))
+}
+
+# sprintf() is vectorized: if one of its parameters is a vector, it
+# will generate one output string for each of the vector's elements:
+cat(sprintf("\n%s fish", c("one", "two", "red", "blue")))
+
+
+# =    6  Changing strings  ====================================================
+
+# ===   6.1.1  Changing case
+tolower(s)
+toupper(tolower(s))
+
+
+# ===   6.1.2  Reverse
+# (This used to work in Biostrings, apparently it doesn't work anymore. Why?)
+# Biostrings::str_rev(s)
+# The following works, of course, but awkward:
+s
+paste0(rev(unlist(strsplit(s, ""))), collapse = "")
+
+# reverse complement
+COMP <- c("t", "g", "c", "a")
+names(COMP) <- c("a", "c", "g", "t")     # mapping the complement via names
+s
+paste0(COMP[rev(unlist(strsplit(s, "")))], collapse = "")
+
+
+# ===   6.1.3  Change characters
+# chartr(old, new, x) maps all characters in x that appear in "old" to the
+# correpsonding character in "new." Kind of like the COMP vector above ...
+
+chartr("aeio", "uuuu", "We hold these truths to be self-evident ...")
+
+# One could implement toupper() and tolower() with this - remember that R has
+# character vectors of uppercase and lowercase letters as language constants.
+chartr(paste0(letters, collapse = ""),
+       paste0(LETTERS, collapse = ""),
+       "Twinkle, twinkle little star, how I wonder what you are.")
+
+# One amusing way to use the function  is for a reversible substitution
+# cypher.
+alBet <- "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz .,;:?0123456789"
+set.seed(112358)                       # set RNG seed for repeatable randomness
+( myCypher <- paste0(sample(unlist(strsplit(alBet, ""))), collapse = "") )
+set.seed(NULL)                         # reset the RNG
+
+# encode ...
+(x <- chartr(alBet, myCypher, "... seven for a secret, never to be told."))
+
+# decode ...
+chartr(myCypher, alBet, x)
+# (Nb. substitution cyphers are easy to crack!)
+
+
+# ===   6.1.4  Substitute characters
+# gsub can change lengths.
+#   Example: implementing the binary Fibonacci sequence:
+#   0 -> 1; 1 -> 10 , in three nested gsub() statements
+( s <- 1 )
+( s <- gsub("2", "10", gsub("0", "1", gsub("1", "2", s))) )
+
+# Iterate this line a few times ...
+#
+# cf. http://www.maths.surrey.ac.uk/hosted-sites/R.Knott/Fibonacci/fibrab.html
+# for the features of the sequence.
+
+# I use gsub() often to delete unwanted characters ...
+# ... select something, and substitute the empty string for it.
+(s <- gsub("-", "", s))
+
+# For example: clean up a sequence
+# copy/paste from UniProt
+(s <- "        10         20         30         40         50
+MSNQIYSARY SGVDVYEFIH STGSIMKRKK DDWVNATHIL KAANFAKAKR ")
+
+
+# remove numbers
+(s <- gsub("[0-9]", "", s))
+
+# remove "whitespace" (spaces, tabs, line breaks)...
+(s <- gsub("\\s", "", s))
+
+# ==   6.2  stringi and stringr  ===============================================
+
+# But there are also specialized functions eg. to remove leading/trailing
+# whitespace which may be important to sanitize user input etc. Have a look at
+# the function descriptions for the stringr and the stringi package. stringr is
+# part of the tidyverse, and for the most part a wrapper for stringi functions.
+# https://github.com/tidyverse/stringr
+
+
+
+# ==   6.3  dbSanitizeSequence()  ==============================================
+
+# In our learning units, we use a function dbSanitizeSequence() to clean up
+# sequences that may be copy/pasted from Web-sources
+
+cat( s <- ">FASTA header will be removed
+10         20         30         40         50
+MSNQIYSARY SGVDVYEFIH STGSIMKRKK DDWVNATHIL KAANFAKAKR " )
+
+dbSanitizeSequence(s)
+
+
+# =    7  Permuting and sampling  ==============================================
+
+
+# An important aspect of working with strings is generating random strings
+# with given statistical properties: reference items to evaluate significance.
+
+
+# ==   7.1  Permutations  ======================================================
+
+
+# One way to produce such reference items is to permute a string. A permuted
+# string has the same composition as the original, but all positional
+# information is lost. The sample() function can be used to permute:
+
+# This is the sequence of the ompA secretion signal
+(s <- unlist(strsplit("MKKTAIAVALAGFATVAQA", "")))
+
+(x <- sample(s, length(s)))  # permuted
+
+# Here's a small example how such permuted strings may be useful. As you look
+# at the ompA sequence, you suspect that the two lysines near the +-charged
+# N-terminus may not be accidental, but selected for a positively charged
+# N-terminus. What is the chance that such a sequence has two lysines close to
+# the N-terminus simply by chance? Or put differently: what is the average
+# distance of two lysines in such a sequence to the N-terminus. First, we
+# need an expression that measures the distance. A simple use of the which()
+# function will do just fine.
+
+which(s == "K")        # shows they are in position 2 and 3, so ...
+mean(which(s == "K"))  # ... gives us the average, and ...
+mean(which(x == "K"))  # ... gives us the average of the permuted sequence.
+
+# So what does the distribution look like? Lets do 10,000 trials.
+
+(s <- unlist(strsplit("MKKTAIAVALAGFATVAQA", "")))
+N <- 10000
+d <- numeric(N)
+
+set.seed(112358)                       # set RNG seed for repeatable randomness
+for (i in 1:N) {
+  d[i] <- mean(which(sample(s, length(s)) == "K"))
+}
+set.seed(NULL)                         # reset the RNG
+
+hist(d, breaks = 20)
+abline(v = 2.5, lwd = 2, col = "firebrick")
+sum(d <= 2.5) # 276. 276 of our 10000 samples are just as bunched near the
+              # N-terminus or more. That's just below the signifcance
+              # threshold of 5 %. It's a trend, but to be sure we are looking
+              # at a biological effect we would need to see more
+              # sequences.
+
+
+# ==   7.2  Sampling  ==========================================================
+
+# ===   7.2.1  Equiprobable characters
+
+# Assume you need a large random-nucleotide string for some statistical model.
+# How to create such a string? sample() can easily create it:
+
+nuc <- c("A", "C", "G", "T")
+N <- 100
+
+set.seed(16818)                        # set RNG seed for repeatable randomness
+v <- sample(nuc, N, replace = TRUE)
+set.seed(NULL)                         # reset the RNG
+
+(mySeq <- paste(v, collapse = ""))
+
+# What's the GC content?
+table(v)
+sum(table(v)[c("G", "C")]) # 51 is close to expected
+
+# What's the number of CpG motifs? Easy to check with the stringi
+# stri_match_all() function
+
+if (! requireNamespace("stringi", quietly = TRUE)) {
+  install.packages("stringi")
+}
+# Package information:
+#  library(help = stringi)       # basic information
+#  browseVignettes("stringi")    # available vignettes
+#  data(package = "stringi")     # available datasets
+
+
+(x <- stringi::stri_match_all(mySeq, regex = "CG"))
+length(unlist(x))
+
+# Now you could compare that number with yeast DNA sequences, and determine
+# whether there are more or less CpG motifs than expected by chance.
+# (cf. https://en.wikipedia.org/wiki/CpG_site)
+# But hold on: is that a fair comparison? sample() gives us all four nucleotides
+# with the same probability. But the yeast genomic DNA GC content is only
+# 38%. So you would expect fewer CpG motifs based on the statistical properties
+# of the smaller number of Cs and Gs - before biology even comes into play. How
+# do we account for that?
+
+# ===   7.2.2  Defined probability vector
+
+# This is where we need to know how to create samples with specific probability
+# distributions. A crude hack would be to create a sampling source vector with
+# 19 C, 19 G, 31 A and 31 T
+c(rep("C", 19), rep("G", 19), rep(c("A"), 31), rep(c("T"), 31))
+# ... but that doesn't scale if the numeric accuracy needs to be higher.
+#
+# However sample() has an argument that takes care of that: you can explicitly
+# specify the probabilities with which each element of the the sampling vector
+# should be chosen:
+
+nuc <- c("A", "C", "G", "T")
+N <- 100
+myProb <- c(0.31, 0.19, 0.19, 0.31)    # sampling probabilities
+
+set.seed(16818)                       # set RNG seed for repeatable randomness
+v <- sample(nuc, N, prob = myProb, replace = TRUE)
+set.seed(NULL)                         # reset the RNG
+
+(mySeq <- paste(v, collapse = ""))
+
+# What's the GC content?
+table(v)
+sum(table(v)[c("G", "C")]) # Close to expected
+
+# What's the number of CpG motifs?
+(x <- stringi::stri_match_all(mySeq, regex = "CG"))
+# ... not a single one in this case.
+
+
+
+# [END]
diff --git a/BIN-Storing_data.R b/BIN-Storing_data.R
index 7a76d12..f8bb4d7 100644
--- a/BIN-Storing_data.R
+++ b/BIN-Storing_data.R
@@ -1,684 +1,684 @@
-# tocID <- "BIN-Storing_data.R"
-#
-# Purpose: A Bioinformatics Course:
-#              R code accompanying the BIN-Storing_data unit
-#
-# Version: 1.3.2
-#
-# Date:    2017-10  -  2021-09
-# Author:  Boris Steipe (boris.steipe@utoronto.ca)
-#
-# V 1.3.2  2021 minimal maintenance
-# V 1.3.1  add overlooked  jsonlite:: prefix to fromJson()
-# V 1.3    Made file locations more consistent. All student-edited files
-#          go into the myScripts directory
-# V 1.2    2020 updates. Finally removed stringAsFactors  :-)
-# V 1.1    Add instructions to retrieve UniProt ID from ID mapping service.
-# V 1.0    First live version, complete rebuilt. Now using JSON data sources.
-# V 0.1    First code copied from BCH441_A03_makeYFOlist.R
-#
-# TODO:
-#  The sameSpecies() approach is a bit of a hack - can we solve the
-#  species vs. strain issue in a more principled way?
-#
-# == HOW TO WORK WITH LEARNING UNIT FILES ======================================
-#
-# DO NOT SIMPLY  source()  THESE FILES!
-#
-# If there are portions you don't understand, use R's help system, Google for an
-# answer, or ask your instructor. Don't continue if you don't understand what's
-#  going on. That's not how it works ...
-#
-# ==============================================================================
-
-
-#TOC> ==========================================================================
-#TOC>
-#TOC>   Section  Title                                                   Line
-#TOC> -----------------------------------------------------------------------
-#TOC>   1        A Relational Datamodel in R: review                       63
-#TOC>   1.1        Building a sample database structure                   103
-#TOC>   1.1.1          completing the database                            209
-#TOC>   1.2        Querying the database                                  242
-#TOC>   1.3        Task: submit for credit (part 1/2)                     273
-#TOC>   2        Implementing the protein datamodel                       297
-#TOC>   2.1        JSON formatted source data                             323
-#TOC>   2.2        "Sanitizing" sequence data                             364
-#TOC>   2.3        Create a protein table for our data model              386
-#TOC>   2.3.1          Initialize the database                            388
-#TOC>   2.3.2          Add data                                           400
-#TOC>   2.4        Complete the database                                  420
-#TOC>   2.4.1          Examples of navigating the database                447
-#TOC>   2.5        Updating the database                                  479
-#TOC>   3        Add your own data                                        491
-#TOC>   3.1        Find a protein                                         499
-#TOC>   3.2        Put the information into JSON files                    530
-#TOC>   3.3        Create an R script to create your own database         572
-#TOC>   3.3.1          Check and validate                                 600
-#TOC>   3.4        Task: submit for credit (part 2/2)                     645
-#TOC>
-#TOC> ==========================================================================
-
-
-# =    1  A Relational Datamodel in R: review  =================================
-
-# A disclaimer at first: we are not building an industry-strength database at
-# all here - but we are employing principles of such a database to keep common
-# types of lab-data well organized. Don't think of this as emulating or even
-# replacing a "real" database, but think of this as improving the ad hoc
-# approaches we normally employ to store data in the lab. That does not mean
-# such ad hoc approaches are necessarily bad - the best solution always depends
-# on your objectives, the details of your tasks, and the context in which you
-# are working.
-
-# The principle we follow in implementing a relational data model is to build a
-# list of dataframes . This list is our "database":
-#  - Each _entity_ of the datamodel is a dataframe. In an SQL database, these
-#    would also be called "tables". In a spreadsheet this would be a "sheet".
-#  - Each instance of an entity, i.e. one stored _item_, is a row of the data
-#    frame. In an SQL database this would be a record. In a spreadsheet this is
-#    a row.
-#  - Each _attribute_ of an entity is is a column of the dataframe. In an SQL
-#    database this is a column, in a spreadsheet too.
-#  - This doesn't necessarily solve the question of how we will store and curate
-#    our source data - we will defer that to later. At first we talk only about
-#    data representation internal to our R session, where we need it for
-#    processing and analysis.
-
-# Lets review syntax for creating and accessing such a structure, a list of data
-# frames. You'll have to be absolutely confident with this, or you'll get lost
-# in all the later learning units. We'll start from a compact example, a tiny
-# database of philosophers to keep things brief. That database will have three
-# tables: person, works and book. Person stores biographical data, book stores
-# books, and works is a join table associating persons with their work. You
-# should already be familiar with "join tables" and why we need them. This is
-# the structure:
-#
-# person: id, name, born, died, school
-# book:   id, title, published
-# works:  id, person$id, book$id
-
-# Perhaps draw out this schema to make things more clear.
-
-# ==   1.1  Building a sample database structure  ==============================
-
-# Let's build this structure.
-
-philDB <- list()  # This is an empty list
-
-# This is a data frame that we initialize with two philosophers
-x <- data.frame(id = c(1,2),
-                name = c("Laozi", "Martin Heidegger"),
-                born = c(NA, "1889"),
-                died = c("531 BCE", "1976"),
-                school = c("Daoism", "Phenomenology"))
-str(x)
-
-# Lets add the dataframe to the philDB list and call it "person" there.
-philDB[["person"]] <- x
-str(philDB)
-
-# and let's remove x so we don't mix up things later.
-rm(x)
-
-# We can address elements with the usual subsetting operators. I will use
-# the $ operator for tables and columns, the [] operator for elements in
-# columns. For example ...
-
-philDB$person$name[1]   # Laozi
-
-# task: Write an expression that returns all "school" entries from the
-#       person table.
-
-# Let's now add another person. There are several ways to do this, the
-# conceptually cleanest is to create a one-row dataframe with the data, and
-# rbind() it to the existing dataframe. Doing this, we must take care that
-# the data frame column names are identical. What happens if they are not?
-# Let's find out:
-(x <- data.frame(a=1:4, b=11:14))
-(y <- data.frame(a=6, c=17))
-rbind(x, y)
-
-(y <- data.frame(a=6, b=17))
-rbind(x, y)
-
-# All clear? That's good - this behaviour provides us with a sanity check on the
-# operation. Incidentally: rbind(x, y) did NOT change the table ...
-x
-# rather rbind() had the chnaged table as its return value and that's why it
-# was printed. To actually change the table, you need to ASSIGN the return
-# value  of rbind() ... like so:
-x <- rbind(x, y)
-
-# To continue ...
-(x <- data.frame(id = 2,
-                 name = "Zhuangzi",
-                 born = "369 BCE",
-                 died = "286 BCE",
-                 school = "Daoism"))
-
-# Add this to the "person" table in our database with rbind() ...
-philDB$person <- rbind(philDB$person, x)
-
-# ... and examine the result:
-str(philDB)
-
-# We made a serious error in our data! Did you spot it?
-#
-# If not, look at ...
-philDB$person$id
-# ... does that look oK?
-#
-# Absolutely not! "id" is the Primary Key in the table, and it has to be
-# unique. How can we guarantee it to be unique? Certainly not when we
-# enter it by hand. We need a function that generates a unique key. Here's
-# a simple version, without any error-checking. It assumes that a column
-# named "id" exists in the table, and that it holds the Primary Keys:
-autoincrement <- function(table) {
-  return(max(table$id) + 1)
-}
-
-#Try it:
-autoincrement(philDB$person)
-
-# Once that is clear, let's remove the Zhuangzi entry and recreate it correctly.
-# Many ways to remove, here we use a logical expression to select matching
-# record(s), apply the results to subset the data frame, and overwrite the
-# existing table with the new one.
-
-sel <- !(philDB$person$name == "Zhuangzi")   # select ...
-philDB$person <- philDB$person[sel, ]        # ... and replace
-
-str(philDB)
-
-# Now let's add Zhuangzi with correct data. Note how we use the autoincrement
-# function for the id
-
-x <- data.frame(id = autoincrement(philDB$person),
-                name = "Zhuangzi",
-                born = "369 BCE",
-                died = "286 BCE",
-                school = "Daoism")
-philDB$person <- rbind(philDB$person, x)
-str(philDB)
-
-# So far so good. Be honest with yourself. If you didn't follow any of this,
-# go back, re-read, play with it, and ask for help. These are the foundations.
-
-
-# ===   1.1.1  completing the database
-
-
-# Next I'll add one more person, and create the other two tables:
-
-x <- data.frame(id = autoincrement(philDB$person),
-                name = "Kongzi",
-                born = "551 BCE",
-                died = "479 BCE",
-                school = "Confucianism")
-philDB$person <- rbind(philDB$person, x)
-
-# a table of major works ...
-philDB[["books"]] <- data.frame(id = 1:5,
-                                title = c("Zhuangzi",
-                                          "Analects",
-                                          "Being and Time",
-                                          "Daodejing",
-                                          "On the Way to Language"),
-                                published = c("300 BCE",
-                                              "220 BCE",
-                                              "1927",
-                                              "530 BCE",
-                                              "1959"))
-
-# a "join" table that links works and their author ...
-philDB[["works"]] <- data.frame(id = 1:5,
-                                personID = c(3, 4, 2, 1, 2),
-                                bookID = c(1, 2, 3, 4, 5))
-
-str(philDB)
-
-
-# ==   1.2  Querying the database  =============================================
-
-
-# To retrieve data, we need to subset tables, possibly based on conditions we
-# find in other tables. Sometimes we can simply get the information, e.g.
-# all names ...
-philDB$person$name
-# ... or all book titles ...
-philDB$books$title
-
-# ... but sometimes we need to cross-reference information via join tables. Here
-# is an example where we list authors and their works, sorted alphabetically by
-# author:
-(sel <- order(philDB$person$name))   # check out ?order and describe to
-                                     # someone you know what it does, so that
-                                     # you are sure you understand it. Its
-                                     # indirection can be a bit tricky to
-                                     # understand.
-( pID <- philDB$person$id[sel] )
-sel <- numeric()   # initialize the vector
-for (ID in pID) {
-  sel <- which(philDB$works$personID == ID)          # get all rows for which
-                                                     # the condition is TRUE
-  cat(sprintf("%s: ", philDB$person$name[ID]))       # output the person
-  cat(sprintf("\"%s\"  ", philDB$books$title[sel]))  # output the book
-  cat("\n")
-}
-
-# Examine the intermediate results and trace the logic until this is clear.
-
-
-# ==   1.3  Task: submit for credit (part 1/2)  ================================
-
-
-#    Write code that adds another philosopher to the datamodel:
-#       Immanuel Kant, (1724 - 1804), Enlightenment Philosophy.
-#       Works: Critique of Pure Reason (1781), Critique of Judgement (1790)
-#    Paste your code into your submission page. Enclose it in 
 ... 
-# tags. -# -# Write and submit code that lists the philosophical schools in -# alphabetical order, and the books associated with them, also -# alphabetically. Format your output like: -# Confucianism -# Analects - (220 BCE) -# Daoism -# Daodejing - (530 BCE) -# ... etc. -# -# Show the output of your code. Make sure the code itself is enclosed -# in
 ... 
tags. DO NOT POST A SCREENSHOT OF YOUR OUTPUT, -# BUT COPY THE EXACT, COMPLETE OUTPUT, PASTE IT INTO YOUR SUBMISSION, -# AND FORMAT IT CORRECTLY. - -# == Submission: Code to list the philosophical schools in alphabetical order as well as their respective books in alphabetical order. - -schools <- unique(philDB$person$school) -schools <- sort(schools) - -for (s in schools) { - cat(sprintf("%s\n", s)) - authors = which(philDB$person$school == s) - for (author in authors) { - works = which(philDB$works$personID == author) - for (work in works) { - bookId = which(philDB$books$id == philDB$works$bookID[work]) - cat(sprintf("\t%s - (%s)\n", philDB$books$title[bookId], philDB$books$published[bookId])) - } - } -} - - -# = 2 Implementing the protein datamodel ================================== - - -# Working with the code above has probably illustrated a few concerns about -# curating data and storing it for analysis. In particular the join tables -# seem problematic - figuring out the correct IDs, it's easy to make -# mistakes. -# - Data needs to be captured in a human-readable form so it can be verified -# and validated; -# - Some aspects of the database should _never_ be done by hand because -# errors are easy to make and hard to see. That essentially includes -# every operation that has to do with abstract, primary keys; -# - Elementary operations we need to support are: adding data, selecting -# data, modifying data and deleting data. - -# We will therefore construct our protein database in the following way: -# - For each table, we will keep the primary information in JSON files. There -# it is easy to read, edit if needed, and modify it. -# - We will use simple scripts to read the JSON data and assemble it in -# our database for further analysis. -# - I have constructed initial files for yeast Mbp1 and nine other reference -# species. -# - I have written a small number of utility functions to read those files -# and assemble them into a database. - - -# == 2.1 JSON formatted source data ======================================== - - -# Have a look at the structure of the yeast Mbp1 protein data: -file.show("./data/MBP1_SACCE.json") - -# - The whole thing is an array: [ ... ]. This is not necessary for a single -# object, but we will have more objects in other files. And it's perfectly -# legal to have an array with a single element. -# - The data is formatted as "key" : "value" pairs inside an object { ... }. -# This keeps the association between data items and their semantics -# explicit. -# - All keys are strings and they are unique in the object. -# - Values are mostly single strings and integers ... -# - ... except for "sequence". That one is an array of strings. Why? This is to -# make it easier to format and maintain the data. JSON does not allow line -# breaks within strings, but the strings we copy/paste from Genbank or other -# sources might have line breaks, sequence numbers etc. So we need to -# sanitize the sequence at some point. But since we need to do that -# anyway, it is easier to see the whole sequence if we store it in chunks. - -# The .utilities.R script that get's loaded whenever you open this project -# has already made sure the "jsonlite" package exists on your computer. This -# package supports our work with .json formatted data. - -if (! requireNamespace("jsonlite", quietly = TRUE)) { - install.packages("jsonlite") -} -# Package information: -# library(help = jsonlite) # basic information -# browseVignettes("jsonlite") # available vignettes -# data(package = "jsonlite") # available datasets - - -x <- jsonlite::fromJSON("./data/MBP1_SACCE.json") -str(x) - -x$name -unlist(x$sequence) - - -# == 2.2 "Sanitizing" sequence data ======================================== - - -# Examine the dbSanitizeSequence() function: - -dbSanitizeSequence - -# Try: - -dbSanitizeSequence(c("GAA", "ttc")) -dbSanitizeSequence("MsnQ00%0 I@#>YSary S - G1 V2DV3Y>") -x <- " - 1 msnqiysary sgvdvyefih stgsimkrkk ddwvnathil kaanfakakr trilekevlk - 61 ethekvqggf gkyqgtwvpl niakqlaekf svydqlkplf dftqtdgsas pppapkhhha - 121 skvdrkkair sastsaimet krnnkkaeen qfqsskilgn ptaaprkrgr pvgstrgsrr - ... - " # copy/paste from Genbank - -dbSanitizeSequence(x) - - -# == 2.3 Create a protein table for our data model ========================= - -# === 2.3.1 Initialize the database - - -# The function dbInit contains all the code to return a list of empty -# data frames for our data model. - -dbInit - -myDB <- dbInit() -str(myDB) - - -# === 2.3.2 Add data - - -# fromJSON() returns a dataframe that we can readily process to add data -# to our table. Have a look at the function to add protein entries: - -dbAddProtein - -myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/MBP1_SACCE.json")) -str(myDB) - -# Lets check that the 833 amino acids of the yeast MBP1 sequence have -# safely arrived. Note the genral idiom we use here to retrieve the data: -# we define a boolean vector that satisfies a condition, then we subset -# a column with that vector. - -sel <- myDB$protein$name == "MBP1_SACCE" -nchar(myDB$protein$sequence[sel]) - - -# == 2.4 Complete the database ============================================= - - -# Completing the database with Mbp1 data and data for 9 other "reference" -# species is more of the same. I have assembled the code in a script -# "./scripts/ABC-createRefDB.R" - open it, check it out, and then source it. -# It's really very simple, just reading some prepared files of data I have -# formatted with JSON, and assembling the data in our data model. -# -# The code is also very simple and in particular there is no checking for errors -# or inconsistencies. Have a look: - -# Totally straightforward ... -dbAddTaxonomy -dbAddFeature - -# Just slightly more complex, since we need to match the protein or feature -# name in the JSON file with its internal ID, and, when doing that confirm -# that it CAN be matched and that the match is UNIQUE -dbAddAnnotation - -# Now: create the database -source("./scripts/ABC-createRefDB.R") - -str(myDB) - - -# === 2.4.1 Examples of navigating the database - - -# You can look at the contents of the tables in the usual way we access -# elements from lists and dataframes. Here are some examples: -myDB$protein -myDB$protein$RefSeqID -myDB$protein[,"name"] -myDB$taxonomy -myDB$taxonomy$species -biCode(myDB$taxonomy$species) - -# Comparing two tables: -# Are all of the taxonomyIDs in the protein table present in the -# taxonomy table? We ought to check, because the way we imported the -# data from JSON objects, we could have omitted or forgotten some. But we can -# check this with one simple expression. Unravel it and study its components. - -all(myDB$protein$taxonomyID %in% myDB$taxonomy$ID) - -# If this is not TRUE, you MUST fix the problem before continuing. - -# Cross-referencing information: -# What is the species name of the protein whose name is "MBP1_COPCI"? - -sel <- myDB$protein$name == "MBP1_COPCI" -x <- myDB$protein$taxonomyID[sel] - -sel <- myDB$taxonomy$ID == x -myDB$taxonomy$species[sel] - - -# == 2.5 Updating the database ============================================= - - -# Basic tasks for databases include retrieving data, selecting data, updating -# and deleting data. Here we will take a simple, pedestrian approach: -# -# In case we need to modify any of the data, we modify it in the JSON file -# save that, and recreate the database. The myDB database will only be -# used for analysis. -# - - -# = 3 Add your own data =================================================== - - -# You have defined a genome sequence fungus as "MYSPE", and your final task -# will be to find the protein in MYSPE that is most similar to yeast Mbp1, and -# to enter its information into the database. - - -# == 3.1 Find a protein ==================================================== - - -# The BLAST algorithm will be properly introduced in a later learning unit - -# for now just use it in the following way: -# -# - Navigate to https://blast.ncbi.nlm.nih.gov/Blast.cgi and click on -# Protein BLAST. -# - Enter NP_010227 into the "Query Sequence" field. -# - Choose "Reference proteins (refseq_protein)" as the "Database" in the -# "Choose Search Set" section. -# - Paste the MYSPE species name into the "Organism" field. -# -# - Click the "BLAST" button. - -# You will probably get more than one result. If you get dozens of results or -# more, or if you get no results, something went wrong. Reconsider whether the -# problem was with your input, try something different, or ask for help. - -# Otherwise, look for the top-hit in the "Descriptions" tab In some cases -# there will be more than one hit with nearly similar E-values. If this is the -# case for MYSPE, choose the one with the higher degree of similarity (more -# identities) with the N-terminus of the query - i.e. the Query sequence of -# the first ~ 100 amino acids. - -# - If you are submitting this unit for credit, you will need to paste the -# relevant section of the BLAST results into your submission page (see task). # - Follow the link to the protein data page, linked from "Accession". -# - From there, in a separate tab, open the link to the taxonomy database page -# for MYSPE which is linked from the "ORGANISM" record. - - -# == 3.2 Put the information into JSON files =============================== - - -# - Next make a copy of the file "./data/MBP1_SACCE.json" in the "data" -# directory and give it a new name that corresponds to MYSPE - e.g. if -# MYSPE is called "Crptycoccus neoformans", your file should be called -# "MBP1_CRYNE.json"; in that case "MBP1_CRYNE" would also be the -# "name" of your protein. Open the file in the RStudio editor and replace -# all of the MBP1_SACCE data with the corresponding data of your protein. -# -# Note: The UniProt ID may not be listed on the NCBI page. To retrieve -# it, navigate to http://www.uniprot.org/mapping/ , paste your RefSeq ID -# into the query field, make sure "RefSeqProtein" is selected for "From" -# and "UniProtKB" is selected for "To", and click "Go". In case this does -# not retrieve a single UniProt ID, contact me. -# -# Save your .json file into your myScripts directory. -# -# Confirm this step: -if (file.exists(sprintf("./myScripts/MBP1_%s.json", biCode(MYSPE)))) { - cat("Excellent - all good to continue.\n") -} else { - stop(sprintf(" The file \"./myScripts/MBP1_%s.json\" does not exist", - biCode(MYSPE))) -} -# -# -# - Do a similar thing for the MYSPE taxonomy entry. Copy -# "./data/refTaxonomy.json" and make a new file named "MYSPEtaxonomy.json". -# Create a valid JSON file with only one single entry - that of MYSPE. -# -# Confirm this step: -if (file.exists(sprintf("./myScripts/%staxonomy.json", biCode(MYSPE)))) { - cat("Excellent - all good to continue.\n") -} else { - stop(sprintf(" The file \"./myScripts/%staxonomy.json\" does not exist", - biCode(MYSPE))) -} - -# - Validate your two files online at https://jsonlint.com/ - - -# == 3.3 Create an R script to create your own database ==================== - - -# Next: to create your own database. -# - Make a new R script, call it "makeProteinDB.R" -# - enter the following expression as the first command: -# source("./scripts/ABC-createRefDB.R") -# - than add the two commands that add your protein and taxonomy data, -# they should look like: -# -# myDB <- dbAddProtein(myDB, -# jsonlite::fromJSON("./myScripts/MBP1_.json")) -# myDB <- dbAddTaxonomy(myDB, -# jsonlite::fromJSON("./myScripts/taxonomy.json")) -# -# -# - save the .json file in the ./myScripts/ folder and source() it: -# -# source("./myScripts/makeProteinDB.R") # <<<- This command ... -# -# ... needs to be executed whenever you recreate the database. In particular, -# whenever you have added or modified data in any of the JSON files. Later you -# will add more information. - -# Remember this principle. Don't rely on objects in memory - you might -# "break" them with a code experiment. But always have a script with -# which you can create what you need. - -# === 3.3.1 Check and validate - - -# Is your protein named according to the pattern "MBP1_MYSPE"? It should be. -# And does the taxonomy table contain the systematic name? It should be the same -# that you get when you type MYSPE into the console. - -# Let's compute sequence lengths on the fly (with the function nchar() ), and -# open this with the table viewer function View() - -View(cbind(myDB$protein[ , c("ID", "name", "RefSeqID")], - length = nchar(myDB$protein$sequence))) - -# Does your protein appear in the last row of this table? Where does your -# protein's length fall relative to the reference proteins? About the same? Much -# shorter? Much longer? If it is less then 500 amino acids long, I would suspect -# an error. Contact me for advice. - -# Is that the right sequence? Is it the same as the one on the NCBI protein -# database page? -myDB$protein$sequence[nrow(myDB$protein)] - -# If not, don't continue! Fix the problem first. -# Let me repeat: If this does not give you the right sequence of the MYSPE -# Mbp1 homologue, DO NOT CONTINUE. Fix the problem. - -# Is that the right taxonomy ID and binomial name for MYSPE? -# This question may be a bit non-trivial ... MYSPE is a species, but the -# recorded taxonomy ID may be a strain. We have a utility function, -# sameSpecies() that normalizes organism name to the binomial species. -# -sel <- sameSpecies(myDB$taxonomy$species, MYSPE) -myDB$taxonomy[sel, ] - -# If not, or if the result was "<0 rows> ... " then DO NOT CONTINUE. -# Fix the problem first. - -# Does this give you the right refseq ID for MBP1_MYSPE? -sel <- myDB$protein$name == paste0("MBP1_", biCode(MYSPE)) -myDB$protein$RefSeqID[sel] - -# If not, or if the result was "<0 rows> ... " then DO NOT CONTINUE. -# Fix the problem first. - - -# == 3.4 Task: submit for credit (part 2/2) ================================ - - -# - On your submission page, copy/paste the BLAST result headers from the -# "Alignments" tab, to demonstrate that the data justifies your choice of -# protein; you don't need to paste the whole alignment, just the header(s). -# Note the relevant values separately: eValue, coverage, %ID etc. and link -# to your protein's NCBI protein database page. (Note: in case there are -# more than one high-scoring segments included for the SAME protein, you -# need to show the results for all of its high-scoring segments.) -# - Copy and paste the contents of your two JSON files on your submission -# page on the Student Wiki. Make sure they are enclosed in
 ... 
-# tags. -# - Execute the three commands below and show the result on your submission page - -biCode(myDB$taxonomy$species) %in% biCode(MYSPE) -sel <- sameSpecies(myDB$taxonomy$species, MYSPE) -myDB$protein$taxonomyID %in% myDB$taxonomy$ID[sel] - -# That is all. - - -# [END] +# tocID <- "BIN-Storing_data.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the BIN-Storing_data unit +# +# Version: 1.3.2 +# +# Date: 2017-10 - 2021-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# V 1.3.2 2021 minimal maintenance +# V 1.3.1 add overlooked jsonlite:: prefix to fromJson() +# V 1.3 Made file locations more consistent. All student-edited files +# go into the myScripts directory +# V 1.2 2020 updates. Finally removed stringAsFactors :-) +# V 1.1 Add instructions to retrieve UniProt ID from ID mapping service. +# V 1.0 First live version, complete rebuilt. Now using JSON data sources. +# V 0.1 First code copied from BCH441_A03_makeYFOlist.R +# +# TODO: +# The sameSpecies() approach is a bit of a hack - can we solve the +# species vs. strain issue in a more principled way? +# +# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== +# +# DO NOT SIMPLY source() THESE FILES! +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ----------------------------------------------------------------------- +#TOC> 1 A Relational Datamodel in R: review 63 +#TOC> 1.1 Building a sample database structure 103 +#TOC> 1.1.1 completing the database 209 +#TOC> 1.2 Querying the database 242 +#TOC> 1.3 Task: submit for credit (part 1/2) 273 +#TOC> 2 Implementing the protein datamodel 297 +#TOC> 2.1 JSON formatted source data 323 +#TOC> 2.2 "Sanitizing" sequence data 364 +#TOC> 2.3 Create a protein table for our data model 386 +#TOC> 2.3.1 Initialize the database 388 +#TOC> 2.3.2 Add data 400 +#TOC> 2.4 Complete the database 420 +#TOC> 2.4.1 Examples of navigating the database 447 +#TOC> 2.5 Updating the database 479 +#TOC> 3 Add your own data 491 +#TOC> 3.1 Find a protein 499 +#TOC> 3.2 Put the information into JSON files 530 +#TOC> 3.3 Create an R script to create your own database 572 +#TOC> 3.3.1 Check and validate 600 +#TOC> 3.4 Task: submit for credit (part 2/2) 645 +#TOC> +#TOC> ========================================================================== + + +# = 1 A Relational Datamodel in R: review ================================= + +# A disclaimer at first: we are not building an industry-strength database at +# all here - but we are employing principles of such a database to keep common +# types of lab-data well organized. Don't think of this as emulating or even +# replacing a "real" database, but think of this as improving the ad hoc +# approaches we normally employ to store data in the lab. That does not mean +# such ad hoc approaches are necessarily bad - the best solution always depends +# on your objectives, the details of your tasks, and the context in which you +# are working. + +# The principle we follow in implementing a relational data model is to build a +# list of dataframes . This list is our "database": +# - Each _entity_ of the datamodel is a dataframe. In an SQL database, these +# would also be called "tables". In a spreadsheet this would be a "sheet". +# - Each instance of an entity, i.e. one stored _item_, is a row of the data +# frame. In an SQL database this would be a record. In a spreadsheet this is +# a row. +# - Each _attribute_ of an entity is is a column of the dataframe. In an SQL +# database this is a column, in a spreadsheet too. +# - This doesn't necessarily solve the question of how we will store and curate +# our source data - we will defer that to later. At first we talk only about +# data representation internal to our R session, where we need it for +# processing and analysis. + +# Lets review syntax for creating and accessing such a structure, a list of data +# frames. You'll have to be absolutely confident with this, or you'll get lost +# in all the later learning units. We'll start from a compact example, a tiny +# database of philosophers to keep things brief. That database will have three +# tables: person, works and book. Person stores biographical data, book stores +# books, and works is a join table associating persons with their work. You +# should already be familiar with "join tables" and why we need them. This is +# the structure: +# +# person: id, name, born, died, school +# book: id, title, published +# works: id, person$id, book$id + +# Perhaps draw out this schema to make things more clear. + +# == 1.1 Building a sample database structure ============================== + +# Let's build this structure. + +philDB <- list() # This is an empty list + +# This is a data frame that we initialize with two philosophers +x <- data.frame(id = c(1,2), + name = c("Laozi", "Martin Heidegger"), + born = c(NA, "1889"), + died = c("531 BCE", "1976"), + school = c("Daoism", "Phenomenology")) +str(x) + +# Lets add the dataframe to the philDB list and call it "person" there. +philDB[["person"]] <- x +str(philDB) + +# and let's remove x so we don't mix up things later. +rm(x) + +# We can address elements with the usual subsetting operators. I will use +# the $ operator for tables and columns, the [] operator for elements in +# columns. For example ... + +philDB$person$name[1] # Laozi + +# task: Write an expression that returns all "school" entries from the +# person table. + +# Let's now add another person. There are several ways to do this, the +# conceptually cleanest is to create a one-row dataframe with the data, and +# rbind() it to the existing dataframe. Doing this, we must take care that +# the data frame column names are identical. What happens if they are not? +# Let's find out: +(x <- data.frame(a=1:4, b=11:14)) +(y <- data.frame(a=6, c=17)) +rbind(x, y) + +(y <- data.frame(a=6, b=17)) +rbind(x, y) + +# All clear? That's good - this behaviour provides us with a sanity check on the +# operation. Incidentally: rbind(x, y) did NOT change the table ... +x +# rather rbind() had the chnaged table as its return value and that's why it +# was printed. To actually change the table, you need to ASSIGN the return +# value of rbind() ... like so: +x <- rbind(x, y) + +# To continue ... +(x <- data.frame(id = 2, + name = "Zhuangzi", + born = "369 BCE", + died = "286 BCE", + school = "Daoism")) + +# Add this to the "person" table in our database with rbind() ... +philDB$person <- rbind(philDB$person, x) + +# ... and examine the result: +str(philDB) + +# We made a serious error in our data! Did you spot it? +# +# If not, look at ... +philDB$person$id +# ... does that look oK? +# +# Absolutely not! "id" is the Primary Key in the table, and it has to be +# unique. How can we guarantee it to be unique? Certainly not when we +# enter it by hand. We need a function that generates a unique key. Here's +# a simple version, without any error-checking. It assumes that a column +# named "id" exists in the table, and that it holds the Primary Keys: +autoincrement <- function(table) { + return(max(table$id) + 1) +} + +#Try it: +autoincrement(philDB$person) + +# Once that is clear, let's remove the Zhuangzi entry and recreate it correctly. +# Many ways to remove, here we use a logical expression to select matching +# record(s), apply the results to subset the data frame, and overwrite the +# existing table with the new one. + +sel <- !(philDB$person$name == "Zhuangzi") # select ... +philDB$person <- philDB$person[sel, ] # ... and replace + +str(philDB) + +# Now let's add Zhuangzi with correct data. Note how we use the autoincrement +# function for the id + +x <- data.frame(id = autoincrement(philDB$person), + name = "Zhuangzi", + born = "369 BCE", + died = "286 BCE", + school = "Daoism") +philDB$person <- rbind(philDB$person, x) +str(philDB) + +# So far so good. Be honest with yourself. If you didn't follow any of this, +# go back, re-read, play with it, and ask for help. These are the foundations. + + +# === 1.1.1 completing the database + + +# Next I'll add one more person, and create the other two tables: + +x <- data.frame(id = autoincrement(philDB$person), + name = "Kongzi", + born = "551 BCE", + died = "479 BCE", + school = "Confucianism") +philDB$person <- rbind(philDB$person, x) + +# a table of major works ... +philDB[["books"]] <- data.frame(id = 1:5, + title = c("Zhuangzi", + "Analects", + "Being and Time", + "Daodejing", + "On the Way to Language"), + published = c("300 BCE", + "220 BCE", + "1927", + "530 BCE", + "1959")) + +# a "join" table that links works and their author ... +philDB[["works"]] <- data.frame(id = 1:5, + personID = c(3, 4, 2, 1, 2), + bookID = c(1, 2, 3, 4, 5)) + +str(philDB) + + +# == 1.2 Querying the database ============================================= + + +# To retrieve data, we need to subset tables, possibly based on conditions we +# find in other tables. Sometimes we can simply get the information, e.g. +# all names ... +philDB$person$name +# ... or all book titles ... +philDB$books$title + +# ... but sometimes we need to cross-reference information via join tables. Here +# is an example where we list authors and their works, sorted alphabetically by +# author: +(sel <- order(philDB$person$name)) # check out ?order and describe to + # someone you know what it does, so that + # you are sure you understand it. Its + # indirection can be a bit tricky to + # understand. +( pID <- philDB$person$id[sel] ) +sel <- numeric() # initialize the vector +for (ID in pID) { + sel <- which(philDB$works$personID == ID) # get all rows for which + # the condition is TRUE + cat(sprintf("%s: ", philDB$person$name[ID])) # output the person + cat(sprintf("\"%s\" ", philDB$books$title[sel])) # output the book + cat("\n") +} + +# Examine the intermediate results and trace the logic until this is clear. + + +# == 1.3 Task: submit for credit (part 1/2) ================================ + + +# Write code that adds another philosopher to the datamodel: +# Immanuel Kant, (1724 - 1804), Enlightenment Philosophy. +# Works: Critique of Pure Reason (1781), Critique of Judgement (1790) +# Paste your code into your submission page. Enclose it in
 ... 
+# tags. +# +# Write and submit code that lists the philosophical schools in +# alphabetical order, and the books associated with them, also +# alphabetically. Format your output like: +# Confucianism +# Analects - (220 BCE) +# Daoism +# Daodejing - (530 BCE) +# ... etc. +# +# Show the output of your code. Make sure the code itself is enclosed +# in
 ... 
tags. DO NOT POST A SCREENSHOT OF YOUR OUTPUT, +# BUT COPY THE EXACT, COMPLETE OUTPUT, PASTE IT INTO YOUR SUBMISSION, +# AND FORMAT IT CORRECTLY. + +# == Submission: Code to list the philosophical schools in alphabetical order as well as their respective books in alphabetical order. + +schools <- unique(philDB$person$school) +schools <- sort(schools) + +for (s in schools) { + cat(sprintf("%s\n", s)) + authors = which(philDB$person$school == s) + for (author in authors) { + works = which(philDB$works$personID == author) + for (work in works) { + bookId = which(philDB$books$id == philDB$works$bookID[work]) + cat(sprintf("\t%s - (%s)\n", philDB$books$title[bookId], philDB$books$published[bookId])) + } + } +} + + +# = 2 Implementing the protein datamodel ================================== + + +# Working with the code above has probably illustrated a few concerns about +# curating data and storing it for analysis. In particular the join tables +# seem problematic - figuring out the correct IDs, it's easy to make +# mistakes. +# - Data needs to be captured in a human-readable form so it can be verified +# and validated; +# - Some aspects of the database should _never_ be done by hand because +# errors are easy to make and hard to see. That essentially includes +# every operation that has to do with abstract, primary keys; +# - Elementary operations we need to support are: adding data, selecting +# data, modifying data and deleting data. + +# We will therefore construct our protein database in the following way: +# - For each table, we will keep the primary information in JSON files. There +# it is easy to read, edit if needed, and modify it. +# - We will use simple scripts to read the JSON data and assemble it in +# our database for further analysis. +# - I have constructed initial files for yeast Mbp1 and nine other reference +# species. +# - I have written a small number of utility functions to read those files +# and assemble them into a database. + + +# == 2.1 JSON formatted source data ======================================== + + +# Have a look at the structure of the yeast Mbp1 protein data: +file.show("./data/MBP1_SACCE.json") + +# - The whole thing is an array: [ ... ]. This is not necessary for a single +# object, but we will have more objects in other files. And it's perfectly +# legal to have an array with a single element. +# - The data is formatted as "key" : "value" pairs inside an object { ... }. +# This keeps the association between data items and their semantics +# explicit. +# - All keys are strings and they are unique in the object. +# - Values are mostly single strings and integers ... +# - ... except for "sequence". That one is an array of strings. Why? This is to +# make it easier to format and maintain the data. JSON does not allow line +# breaks within strings, but the strings we copy/paste from Genbank or other +# sources might have line breaks, sequence numbers etc. So we need to +# sanitize the sequence at some point. But since we need to do that +# anyway, it is easier to see the whole sequence if we store it in chunks. + +# The .utilities.R script that get's loaded whenever you open this project +# has already made sure the "jsonlite" package exists on your computer. This +# package supports our work with .json formatted data. + +if (! requireNamespace("jsonlite", quietly = TRUE)) { + install.packages("jsonlite") +} +# Package information: +# library(help = jsonlite) # basic information +# browseVignettes("jsonlite") # available vignettes +# data(package = "jsonlite") # available datasets + + +x <- jsonlite::fromJSON("./data/MBP1_SACCE.json") +str(x) + +x$name +unlist(x$sequence) + + +# == 2.2 "Sanitizing" sequence data ======================================== + + +# Examine the dbSanitizeSequence() function: + +dbSanitizeSequence + +# Try: + +dbSanitizeSequence(c("GAA", "ttc")) +dbSanitizeSequence("MsnQ00%0 I@#>YSary S + G1 V2DV3Y>") +x <- " + 1 msnqiysary sgvdvyefih stgsimkrkk ddwvnathil kaanfakakr trilekevlk + 61 ethekvqggf gkyqgtwvpl niakqlaekf svydqlkplf dftqtdgsas pppapkhhha + 121 skvdrkkair sastsaimet krnnkkaeen qfqsskilgn ptaaprkrgr pvgstrgsrr + ... + " # copy/paste from Genbank + +dbSanitizeSequence(x) + + +# == 2.3 Create a protein table for our data model ========================= + +# === 2.3.1 Initialize the database + + +# The function dbInit contains all the code to return a list of empty +# data frames for our data model. + +dbInit + +myDB <- dbInit() +str(myDB) + + +# === 2.3.2 Add data + + +# fromJSON() returns a dataframe that we can readily process to add data +# to our table. Have a look at the function to add protein entries: + +dbAddProtein + +myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/MBP1_SACCE.json")) +str(myDB) + +# Lets check that the 833 amino acids of the yeast MBP1 sequence have +# safely arrived. Note the genral idiom we use here to retrieve the data: +# we define a boolean vector that satisfies a condition, then we subset +# a column with that vector. + +sel <- myDB$protein$name == "MBP1_SACCE" +nchar(myDB$protein$sequence[sel]) + + +# == 2.4 Complete the database ============================================= + + +# Completing the database with Mbp1 data and data for 9 other "reference" +# species is more of the same. I have assembled the code in a script +# "./scripts/ABC-createRefDB.R" - open it, check it out, and then source it. +# It's really very simple, just reading some prepared files of data I have +# formatted with JSON, and assembling the data in our data model. +# +# The code is also very simple and in particular there is no checking for errors +# or inconsistencies. Have a look: + +# Totally straightforward ... +dbAddTaxonomy +dbAddFeature + +# Just slightly more complex, since we need to match the protein or feature +# name in the JSON file with its internal ID, and, when doing that confirm +# that it CAN be matched and that the match is UNIQUE +dbAddAnnotation + +# Now: create the database +source("./scripts/ABC-createRefDB.R") + +str(myDB) + + +# === 2.4.1 Examples of navigating the database + + +# You can look at the contents of the tables in the usual way we access +# elements from lists and dataframes. Here are some examples: +myDB$protein +myDB$protein$RefSeqID +myDB$protein[,"name"] +myDB$taxonomy +myDB$taxonomy$species +biCode(myDB$taxonomy$species) + +# Comparing two tables: +# Are all of the taxonomyIDs in the protein table present in the +# taxonomy table? We ought to check, because the way we imported the +# data from JSON objects, we could have omitted or forgotten some. But we can +# check this with one simple expression. Unravel it and study its components. + +all(myDB$protein$taxonomyID %in% myDB$taxonomy$ID) + +# If this is not TRUE, you MUST fix the problem before continuing. + +# Cross-referencing information: +# What is the species name of the protein whose name is "MBP1_COPCI"? + +sel <- myDB$protein$name == "MBP1_COPCI" +x <- myDB$protein$taxonomyID[sel] + +sel <- myDB$taxonomy$ID == x +myDB$taxonomy$species[sel] + + +# == 2.5 Updating the database ============================================= + + +# Basic tasks for databases include retrieving data, selecting data, updating +# and deleting data. Here we will take a simple, pedestrian approach: +# +# In case we need to modify any of the data, we modify it in the JSON file +# save that, and recreate the database. The myDB database will only be +# used for analysis. +# + + +# = 3 Add your own data =================================================== + + +# You have defined a genome sequence fungus as "MYSPE", and your final task +# will be to find the protein in MYSPE that is most similar to yeast Mbp1, and +# to enter its information into the database. + + +# == 3.1 Find a protein ==================================================== + + +# The BLAST algorithm will be properly introduced in a later learning unit - +# for now just use it in the following way: +# +# - Navigate to https://blast.ncbi.nlm.nih.gov/Blast.cgi and click on +# Protein BLAST. +# - Enter NP_010227 into the "Query Sequence" field. +# - Choose "Reference proteins (refseq_protein)" as the "Database" in the +# "Choose Search Set" section. +# - Paste the MYSPE species name into the "Organism" field. +# +# - Click the "BLAST" button. + +# You will probably get more than one result. If you get dozens of results or +# more, or if you get no results, something went wrong. Reconsider whether the +# problem was with your input, try something different, or ask for help. + +# Otherwise, look for the top-hit in the "Descriptions" tab In some cases +# there will be more than one hit with nearly similar E-values. If this is the +# case for MYSPE, choose the one with the higher degree of similarity (more +# identities) with the N-terminus of the query - i.e. the Query sequence of +# the first ~ 100 amino acids. + +# - If you are submitting this unit for credit, you will need to paste the +# relevant section of the BLAST results into your submission page (see task). # - Follow the link to the protein data page, linked from "Accession". +# - From there, in a separate tab, open the link to the taxonomy database page +# for MYSPE which is linked from the "ORGANISM" record. + + +# == 3.2 Put the information into JSON files =============================== + + +# - Next make a copy of the file "./data/MBP1_SACCE.json" in the "data" +# directory and give it a new name that corresponds to MYSPE - e.g. if +# MYSPE is called "Crptycoccus neoformans", your file should be called +# "MBP1_CRYNE.json"; in that case "MBP1_CRYNE" would also be the +# "name" of your protein. Open the file in the RStudio editor and replace +# all of the MBP1_SACCE data with the corresponding data of your protein. +# +# Note: The UniProt ID may not be listed on the NCBI page. To retrieve +# it, navigate to http://www.uniprot.org/mapping/ , paste your RefSeq ID +# into the query field, make sure "RefSeqProtein" is selected for "From" +# and "UniProtKB" is selected for "To", and click "Go". In case this does +# not retrieve a single UniProt ID, contact me. +# +# Save your .json file into your myScripts directory. +# +# Confirm this step: +if (file.exists(sprintf("./myScripts/MBP1_%s.json", biCode(MYSPE)))) { + cat("Excellent - all good to continue.\n") +} else { + stop(sprintf(" The file \"./myScripts/MBP1_%s.json\" does not exist", + biCode(MYSPE))) +} +# +# +# - Do a similar thing for the MYSPE taxonomy entry. Copy +# "./data/refTaxonomy.json" and make a new file named "MYSPEtaxonomy.json". +# Create a valid JSON file with only one single entry - that of MYSPE. +# +# Confirm this step: +if (file.exists(sprintf("./myScripts/%staxonomy.json", biCode(MYSPE)))) { + cat("Excellent - all good to continue.\n") +} else { + stop(sprintf(" The file \"./myScripts/%staxonomy.json\" does not exist", + biCode(MYSPE))) +} + +# - Validate your two files online at https://jsonlint.com/ + + +# == 3.3 Create an R script to create your own database ==================== + + +# Next: to create your own database. +# - Make a new R script, call it "makeProteinDB.R" +# - enter the following expression as the first command: +# source("./scripts/ABC-createRefDB.R") +# - than add the two commands that add your protein and taxonomy data, +# they should look like: +# +# myDB <- dbAddProtein(myDB, +# jsonlite::fromJSON("./myScripts/MBP1_.json")) +# myDB <- dbAddTaxonomy(myDB, +# jsonlite::fromJSON("./myScripts/taxonomy.json")) +# +# +# - save the .json file in the ./myScripts/ folder and source() it: +# +# source("./myScripts/makeProteinDB.R") # <<<- This command ... +# +# ... needs to be executed whenever you recreate the database. In particular, +# whenever you have added or modified data in any of the JSON files. Later you +# will add more information. + +# Remember this principle. Don't rely on objects in memory - you might +# "break" them with a code experiment. But always have a script with +# which you can create what you need. + +# === 3.3.1 Check and validate + + +# Is your protein named according to the pattern "MBP1_MYSPE"? It should be. +# And does the taxonomy table contain the systematic name? It should be the same +# that you get when you type MYSPE into the console. + +# Let's compute sequence lengths on the fly (with the function nchar() ), and +# open this with the table viewer function View() + +View(cbind(myDB$protein[ , c("ID", "name", "RefSeqID")], + length = nchar(myDB$protein$sequence))) + +# Does your protein appear in the last row of this table? Where does your +# protein's length fall relative to the reference proteins? About the same? Much +# shorter? Much longer? If it is less then 500 amino acids long, I would suspect +# an error. Contact me for advice. + +# Is that the right sequence? Is it the same as the one on the NCBI protein +# database page? +myDB$protein$sequence[nrow(myDB$protein)] + +# If not, don't continue! Fix the problem first. +# Let me repeat: If this does not give you the right sequence of the MYSPE +# Mbp1 homologue, DO NOT CONTINUE. Fix the problem. + +# Is that the right taxonomy ID and binomial name for MYSPE? +# This question may be a bit non-trivial ... MYSPE is a species, but the +# recorded taxonomy ID may be a strain. We have a utility function, +# sameSpecies() that normalizes organism name to the binomial species. +# +sel <- sameSpecies(myDB$taxonomy$species, MYSPE) +myDB$taxonomy[sel, ] + +# If not, or if the result was "<0 rows> ... " then DO NOT CONTINUE. +# Fix the problem first. + +# Does this give you the right refseq ID for MBP1_MYSPE? +sel <- myDB$protein$name == paste0("MBP1_", biCode(MYSPE)) +myDB$protein$RefSeqID[sel] + +# If not, or if the result was "<0 rows> ... " then DO NOT CONTINUE. +# Fix the problem first. + + +# == 3.4 Task: submit for credit (part 2/2) ================================ + + +# - On your submission page, copy/paste the BLAST result headers from the +# "Alignments" tab, to demonstrate that the data justifies your choice of +# protein; you don't need to paste the whole alignment, just the header(s). +# Note the relevant values separately: eValue, coverage, %ID etc. and link +# to your protein's NCBI protein database page. (Note: in case there are +# more than one high-scoring segments included for the SAME protein, you +# need to show the results for all of its high-scoring segments.) +# - Copy and paste the contents of your two JSON files on your submission +# page on the Student Wiki. Make sure they are enclosed in
 ... 
+# tags. +# - Execute the three commands below and show the result on your submission page + +biCode(myDB$taxonomy$species) %in% biCode(MYSPE) +sel <- sameSpecies(myDB$taxonomy$species, MYSPE) +myDB$protein$taxonomyID %in% myDB$taxonomy$ID[sel] + +# That is all. + + +# [END] diff --git a/FND-Genetic_code.R b/FND-Genetic_code.R index 132d8ce..585f7b0 100644 --- a/FND-Genetic_code.R +++ b/FND-Genetic_code.R @@ -1,349 +1,349 @@ -# tocID <- "FND-Genetic_code.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the FND-Genetic_code unit. -# -# Version: 1.2 -# -# Date: 2017 10 - 2019 01 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Maintenance -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout, -# use Biocmanager:: not biocLite() -# 1.0.1 Comment on "incomplete final line" warning in FASTA -# 1.0 First live version -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ---------------------------------------------------------------- -#TOC> 1 Storing the genetic code 45 -#TOC> 1.1 Genetic code in Biostrings 63 -#TOC> 2 Working with the genetic code 94 -#TOC> 2.1 Translate a sequence. 129 -#TOC> 3 An alternative representation: 3D array 212 -#TOC> 3.1 Print a Genetic code table 246 -#TOC> 4 Tasks 272 -#TOC> -#TOC> ========================================================================== - - -# = 1 Storing the genetic code ============================================ - -# The genetic code maps trinucleotide codons to amino acids. To store it, we -# need some mechanism to associate the two representations. The most -# convenient way to do that is a "named vector" which holds the amino acid -# code and assigns the codons as names to its elements. - -x <- c("M", "H", "H", "*", "*", "*") -names(x) <- c("ATG", "CAC", "CAT", "TAA", "TAG", "TGA") -x - -# Then we can access the vector by the codon as name, and retrieve the -# amino acid ... - -x["ATG"] -x["CAC"] -x["TAA"] - -# ... or the names of elements, to retrieve the codon(s) -names(x)[x == "M"] -names(x)[x == "H"] -names(x)[x == "*"] - - -# == 1.1 Genetic code in Biostrings ======================================== - -# Coveniently, the standard genetic code as well as its alternatives are -# available in the Bioconductor "Biostrings" package: - - -if (! requireNamespace("BiocManager", quietly = TRUE)) { - install.packages("BiocManager") -} -if (! requireNamespace("Biostrings", quietly = TRUE)) { - BiocManager::install("Biostrings") -} -# Package information: -# library(help = Biostrings) # basic information -# browseVignettes("Biostrings") # available vignettes -# data(package = "Biostrings") # available datasets - - -# The standard genetic code vector -Biostrings::GENETIC_CODE - -# The table of genetic codes. This information corresponds to this page -# at the NCBI: -# https://www.ncbi.nlm.nih.gov/Taxonomy/taxonomyhome.html/index.cgi?chapter=tgencodes -Biostrings::GENETIC_CODE_TABLE - -# Most of the alternative codes are mitochondrial codes. The id of the -# Alternative Yeast Nuclear code is "12" -Biostrings::getGeneticCode("12") # Alternative Yeast Nuclear - - -# = 2 Working with the genetic code ======================================= - -# We'll use Biostrings::GENETIC_CODE a lot in this script, so we'll assign it -# to a "local" variable, rather than retrieving it from the package all the -# time. - -GC <- Biostrings::GENETIC_CODE - -# This is a named vector of characters ... - -str(GC) - -# ... which also stores the alternative initiation codons TTG and CTG in -# an attribute of the vector. (Alternative initiation codons sometimes are -# used instead of ATG to intiate translation, if translation is not initiated -# at ATG thses are still translated with fMet.) - -attr(GC, "alt_init_codons") - -# But the key to use this vector is in the "names" which we use for subsetting -# the list of amino acids in whatever way we need. -names(GC) - -# The translation of "TGG" ... -GC["TGG"] - -# All stop codons -names(GC)[GC == "*"] - -# All start codons -names(GC)[GC == "M"] # ... or -c(names(GC)[GC == "M"], - attr(GC, "alt_init_codons")) - - -# == 2.1 Translate a sequence. ============================================= - - -# I have provided a gene sequence in the data directory: -# S288C_YDL056W_MBP1_coding.fsa is the yeast Mbp1 FASTA sequence. - -# read it -mbp1 <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa") - -# You will notice that this generates a Warning message: -# Warning message: -# In readLines("./data/S288C_YDL056W_MBP1_coding.fsa") : -# incomplete final line found on './data/S288C_YDL056W_MBP1_coding.fsa' - -# The reason for this is that the last character of the file is the letter "A" -# and not a "\n" line break. This file is exactly how it was sent from the -# NCBI server; I think good, defensive programming practice would have been to -# include some kind of an end-marker in the file, like a final "\n". This helps -# us recognize an incomplete transmission. Let's parse the actual sequence from -# the file, and then check for completeness. - - -head(mbp1) - -# drop the first line (header) -mbp1 <- mbp1[-1] -head(mbp1) - -# concatenate it all to a single string -mbp1 <- paste(mbp1, sep = "", collapse = "") - -# how long is it? -nchar(mbp1) - -# how many codons? -nchar(mbp1)/3 - -# That looks correct for the 833 aa sequence plus 1 stop codon. This gives us a -# first verification that the file we read is complete, the nucleotides of a -# complete ORF should be divisible by 3. - -# Extract the codons. There are many ways to split a long string into chunks -# of three characters. Here we use the Biostrings codons() function. codons() -# requires an object of type DNAstring - a special kind of string with -# attributes that are useful for Biostrings. Thus we convert the sequence first -# with DNAstring(), then split it up, then convert it into a plain -# character vector. -mbp1Codons <- as.character(Biostrings::codons(Biostrings::DNAString(mbp1))) - -head(mbp1Codons) - -# now translate each codon - -mbp1AA <- character(834) -for (i in seq_along(mbp1Codons)) { - mbp1AA[i] <- GC[mbp1Codons[i]] -} - -head(mbp1Codons) -head(mbp1AA) - -tail(mbp1Codons) -tail(mbp1AA) # Note the stop! - -# The TAA "ochre" stop codon is our second verification that the nucleotide -# sequence is complete: a stop codon can't appear internally in an ORF. - -# We can work with the mbp1AA vector, for example to tabulate the -# amino acid frequencies: -table(mbp1AA) -sort(table(mbp1AA), decreasing = TRUE) - -# Or we can paste all elements together into a single string. But let's remove -# the stop, it's not actually a part of the sequence. To remove the last element -# of a vector, re-assign it with a vector minus the index of the last element: -mbp1AA <- mbp1AA[-(length(mbp1AA))] -tail(mbp1AA) # Note the stop is gone! - -# paste it together, collapsing the elements using an empty string as the -# separation-character (i.e.: nothing) -(Mbp1 <- paste(mbp1AA, sep = "", collapse = "")) - - -# = 3 An alternative representation: 3D array ============================= - - -# We don't use 3D arrays often - usually just 2D tables and data frames, so -# here is a good opportunity to review the syntax of 3D arrays with a -# genetic code cube: - -# Initialize, using A G C T as the names of the elements in each dimension -cCube <- array(data = character(64), - dim = c(4, 4, 4), - dimnames = list(c("A", "G", "C", "T"), - c("A", "G", "C", "T"), - c("A", "G", "C", "T"))) - -# fill it with amino acid codes using three nested loops -for (i in 1:4) { - for (j in 1:4) { - for (k in 1:4) { - myCodon <- paste(dimnames(cCube)[[1]][i], - dimnames(cCube)[[2]][j], - dimnames(cCube)[[3]][k], - sep = "", - collapse = "") - cCube[i, j, k] <- GC[myCodon] - } - } -} - -# confirm -cCube["A", "T", "G"] # methionine -cCube["T", "T", "T"] # phenylalanine -cCube["T", "A", "G"] # stop (amber) - - - -# == 3.1 Print a Genetic code table ======================================== - - -# The data structure of our cCube is well suited to print a table. In the -# "standard" way to print the genetic code, we write codons with the same -# second nucleotide in columns, and arrange rows in blocks of same -# first nucleotide, varying the third nucleotide fastest. This maximizes the -# similarity of adjacent amino acids in the table if we print the -# nucleotides in the order T C A G. It's immidiately obvious that the code -# is not random: the universal genetic code is exceptionally error tolerant in -# the sense that mutations (or single-nucleotide translation errors) are likely -# to result in an amino acid with similar biophysical properties as the -# original. - -nuc <- c("T", "C", "A", "G") - -# (calling variables f, s, t to indicate first, second, and third position ...) -for (f in nuc) { # first varies in blocks - for (t in nuc) { # third varies in columns - for (s in nuc) { # second varies in rows - cat(sprintf("%s%s%s: %s ", f, s, t, cCube[f, s, t])) - } - cat("\n") - } - cat("\n") -} - - -# = 4 Tasks =============================================================== - - -# Task: What do you need to change to print the table with U instead -# of T? Try it. - - -# Task: Point mutations are more often transitions (purine -> purine; -# pyrimidine -> pyrimidine) than transversions (purine -> pyrimidine; -# pyrimidine -> purine), even though twice as many transversions -# are possible in the code. This is most likely due a deamination / -# tautomerization process that favours C -> T changes. If the code -# indeed minimizes the effect of mutations, you would expect that -# codons that differ by a transition code for more similar amino acids -# than codons that differ by a transversion. Is that true? List the set -# of all amino acid pairs that are encoded by codons with a C -> T -# transition. Then list the set of amino acid pairs with a C -> A -# transversion. Which set of pairs is more similar? - - -# Task: How many stop codons do the two mbp1-gene derived amino acid sequences -# have if you translate them in the 2. or the 3. frame? - - -# Task: How does the amino acid composition change if you translate the mbp1 -# gene with the Alternative Yeast Nuclear code that is used by the -# "GTC clade" of fungi? -# (cf. https://en.wikipedia.org/wiki/Alternative_yeast_nuclear_code ) - -# Solution: - - # Fetch the code - Biostrings::GENETIC_CODE_TABLE - Biostrings::GENETIC_CODE_TABLE$name[Biostrings::GENETIC_CODE_TABLE$id=="12"] - altYcode <- Biostrings::getGeneticCode("12") - - # what's the difference? - (delta <- which(Biostrings::GENETIC_CODE != altYcode)) - - Biostrings::GENETIC_CODE[delta] - altYcode[delta] - - # translate - altYAA <- character(834) - for (i in seq_along(mbp1Codons)) { - altYAA[i] <- altYcode[mbp1Codons[i]] - } - - table(mbp1AA) - table(altYAA) - -# Task: The genetic code has significant redundacy, i.e. there are up to six -# codons that code for the same amino acid. Write code that lists how -# many amino acids are present how often i.e. it should tell you that -# two amino acids are encoded only with a single codon, three amino -# acids have six codons, etc. Solution below, but don't peek. There -# are many possible ways to do this. -# -# -# Solution: -( x <- table(table(Biostrings::GENETIC_CODE)) ) - -# confirm -sum(x * as.numeric(names(x))) - - - -# [END] +# tocID <- "FND-Genetic_code.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the FND-Genetic_code unit. +# +# Version: 1.2 +# +# Date: 2017 10 - 2019 01 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Maintenance +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout, +# use Biocmanager:: not biocLite() +# 1.0.1 Comment on "incomplete final line" warning in FASTA +# 1.0 First live version +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ---------------------------------------------------------------- +#TOC> 1 Storing the genetic code 45 +#TOC> 1.1 Genetic code in Biostrings 63 +#TOC> 2 Working with the genetic code 94 +#TOC> 2.1 Translate a sequence. 129 +#TOC> 3 An alternative representation: 3D array 212 +#TOC> 3.1 Print a Genetic code table 246 +#TOC> 4 Tasks 272 +#TOC> +#TOC> ========================================================================== + + +# = 1 Storing the genetic code ============================================ + +# The genetic code maps trinucleotide codons to amino acids. To store it, we +# need some mechanism to associate the two representations. The most +# convenient way to do that is a "named vector" which holds the amino acid +# code and assigns the codons as names to its elements. + +x <- c("M", "H", "H", "*", "*", "*") +names(x) <- c("ATG", "CAC", "CAT", "TAA", "TAG", "TGA") +x + +# Then we can access the vector by the codon as name, and retrieve the +# amino acid ... + +x["ATG"] +x["CAC"] +x["TAA"] + +# ... or the names of elements, to retrieve the codon(s) +names(x)[x == "M"] +names(x)[x == "H"] +names(x)[x == "*"] + + +# == 1.1 Genetic code in Biostrings ======================================== + +# Coveniently, the standard genetic code as well as its alternatives are +# available in the Bioconductor "Biostrings" package: + + +if (! requireNamespace("BiocManager", quietly = TRUE)) { + install.packages("BiocManager") +} +if (! requireNamespace("Biostrings", quietly = TRUE)) { + BiocManager::install("Biostrings") +} +# Package information: +# library(help = Biostrings) # basic information +# browseVignettes("Biostrings") # available vignettes +# data(package = "Biostrings") # available datasets + + +# The standard genetic code vector +Biostrings::GENETIC_CODE + +# The table of genetic codes. This information corresponds to this page +# at the NCBI: +# https://www.ncbi.nlm.nih.gov/Taxonomy/taxonomyhome.html/index.cgi?chapter=tgencodes +Biostrings::GENETIC_CODE_TABLE + +# Most of the alternative codes are mitochondrial codes. The id of the +# Alternative Yeast Nuclear code is "12" +Biostrings::getGeneticCode("12") # Alternative Yeast Nuclear + + +# = 2 Working with the genetic code ======================================= + +# We'll use Biostrings::GENETIC_CODE a lot in this script, so we'll assign it +# to a "local" variable, rather than retrieving it from the package all the +# time. + +GC <- Biostrings::GENETIC_CODE + +# This is a named vector of characters ... + +str(GC) + +# ... which also stores the alternative initiation codons TTG and CTG in +# an attribute of the vector. (Alternative initiation codons sometimes are +# used instead of ATG to intiate translation, if translation is not initiated +# at ATG thses are still translated with fMet.) + +attr(GC, "alt_init_codons") + +# But the key to use this vector is in the "names" which we use for subsetting +# the list of amino acids in whatever way we need. +names(GC) + +# The translation of "TGG" ... +GC["TGG"] + +# All stop codons +names(GC)[GC == "*"] + +# All start codons +names(GC)[GC == "M"] # ... or +c(names(GC)[GC == "M"], + attr(GC, "alt_init_codons")) + + +# == 2.1 Translate a sequence. ============================================= + + +# I have provided a gene sequence in the data directory: +# S288C_YDL056W_MBP1_coding.fsa is the yeast Mbp1 FASTA sequence. + +# read it +mbp1 <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa") + +# You will notice that this generates a Warning message: +# Warning message: +# In readLines("./data/S288C_YDL056W_MBP1_coding.fsa") : +# incomplete final line found on './data/S288C_YDL056W_MBP1_coding.fsa' + +# The reason for this is that the last character of the file is the letter "A" +# and not a "\n" line break. This file is exactly how it was sent from the +# NCBI server; I think good, defensive programming practice would have been to +# include some kind of an end-marker in the file, like a final "\n". This helps +# us recognize an incomplete transmission. Let's parse the actual sequence from +# the file, and then check for completeness. + + +head(mbp1) + +# drop the first line (header) +mbp1 <- mbp1[-1] +head(mbp1) + +# concatenate it all to a single string +mbp1 <- paste(mbp1, sep = "", collapse = "") + +# how long is it? +nchar(mbp1) + +# how many codons? +nchar(mbp1)/3 + +# That looks correct for the 833 aa sequence plus 1 stop codon. This gives us a +# first verification that the file we read is complete, the nucleotides of a +# complete ORF should be divisible by 3. + +# Extract the codons. There are many ways to split a long string into chunks +# of three characters. Here we use the Biostrings codons() function. codons() +# requires an object of type DNAstring - a special kind of string with +# attributes that are useful for Biostrings. Thus we convert the sequence first +# with DNAstring(), then split it up, then convert it into a plain +# character vector. +mbp1Codons <- as.character(Biostrings::codons(Biostrings::DNAString(mbp1))) + +head(mbp1Codons) + +# now translate each codon + +mbp1AA <- character(834) +for (i in seq_along(mbp1Codons)) { + mbp1AA[i] <- GC[mbp1Codons[i]] +} + +head(mbp1Codons) +head(mbp1AA) + +tail(mbp1Codons) +tail(mbp1AA) # Note the stop! + +# The TAA "ochre" stop codon is our second verification that the nucleotide +# sequence is complete: a stop codon can't appear internally in an ORF. + +# We can work with the mbp1AA vector, for example to tabulate the +# amino acid frequencies: +table(mbp1AA) +sort(table(mbp1AA), decreasing = TRUE) + +# Or we can paste all elements together into a single string. But let's remove +# the stop, it's not actually a part of the sequence. To remove the last element +# of a vector, re-assign it with a vector minus the index of the last element: +mbp1AA <- mbp1AA[-(length(mbp1AA))] +tail(mbp1AA) # Note the stop is gone! + +# paste it together, collapsing the elements using an empty string as the +# separation-character (i.e.: nothing) +(Mbp1 <- paste(mbp1AA, sep = "", collapse = "")) + + +# = 3 An alternative representation: 3D array ============================= + + +# We don't use 3D arrays often - usually just 2D tables and data frames, so +# here is a good opportunity to review the syntax of 3D arrays with a +# genetic code cube: + +# Initialize, using A G C T as the names of the elements in each dimension +cCube <- array(data = character(64), + dim = c(4, 4, 4), + dimnames = list(c("A", "G", "C", "T"), + c("A", "G", "C", "T"), + c("A", "G", "C", "T"))) + +# fill it with amino acid codes using three nested loops +for (i in 1:4) { + for (j in 1:4) { + for (k in 1:4) { + myCodon <- paste(dimnames(cCube)[[1]][i], + dimnames(cCube)[[2]][j], + dimnames(cCube)[[3]][k], + sep = "", + collapse = "") + cCube[i, j, k] <- GC[myCodon] + } + } +} + +# confirm +cCube["A", "T", "G"] # methionine +cCube["T", "T", "T"] # phenylalanine +cCube["T", "A", "G"] # stop (amber) + + + +# == 3.1 Print a Genetic code table ======================================== + + +# The data structure of our cCube is well suited to print a table. In the +# "standard" way to print the genetic code, we write codons with the same +# second nucleotide in columns, and arrange rows in blocks of same +# first nucleotide, varying the third nucleotide fastest. This maximizes the +# similarity of adjacent amino acids in the table if we print the +# nucleotides in the order T C A G. It's immidiately obvious that the code +# is not random: the universal genetic code is exceptionally error tolerant in +# the sense that mutations (or single-nucleotide translation errors) are likely +# to result in an amino acid with similar biophysical properties as the +# original. + +nuc <- c("T", "C", "A", "G") + +# (calling variables f, s, t to indicate first, second, and third position ...) +for (f in nuc) { # first varies in blocks + for (t in nuc) { # third varies in columns + for (s in nuc) { # second varies in rows + cat(sprintf("%s%s%s: %s ", f, s, t, cCube[f, s, t])) + } + cat("\n") + } + cat("\n") +} + + +# = 4 Tasks =============================================================== + + +# Task: What do you need to change to print the table with U instead +# of T? Try it. + + +# Task: Point mutations are more often transitions (purine -> purine; +# pyrimidine -> pyrimidine) than transversions (purine -> pyrimidine; +# pyrimidine -> purine), even though twice as many transversions +# are possible in the code. This is most likely due a deamination / +# tautomerization process that favours C -> T changes. If the code +# indeed minimizes the effect of mutations, you would expect that +# codons that differ by a transition code for more similar amino acids +# than codons that differ by a transversion. Is that true? List the set +# of all amino acid pairs that are encoded by codons with a C -> T +# transition. Then list the set of amino acid pairs with a C -> A +# transversion. Which set of pairs is more similar? + + +# Task: How many stop codons do the two mbp1-gene derived amino acid sequences +# have if you translate them in the 2. or the 3. frame? + + +# Task: How does the amino acid composition change if you translate the mbp1 +# gene with the Alternative Yeast Nuclear code that is used by the +# "GTC clade" of fungi? +# (cf. https://en.wikipedia.org/wiki/Alternative_yeast_nuclear_code ) + +# Solution: + + # Fetch the code + Biostrings::GENETIC_CODE_TABLE + Biostrings::GENETIC_CODE_TABLE$name[Biostrings::GENETIC_CODE_TABLE$id=="12"] + altYcode <- Biostrings::getGeneticCode("12") + + # what's the difference? + (delta <- which(Biostrings::GENETIC_CODE != altYcode)) + + Biostrings::GENETIC_CODE[delta] + altYcode[delta] + + # translate + altYAA <- character(834) + for (i in seq_along(mbp1Codons)) { + altYAA[i] <- altYcode[mbp1Codons[i]] + } + + table(mbp1AA) + table(altYAA) + +# Task: The genetic code has significant redundacy, i.e. there are up to six +# codons that code for the same amino acid. Write code that lists how +# many amino acids are present how often i.e. it should tell you that +# two amino acids are encoded only with a single codon, three amino +# acids have six codons, etc. Solution below, but don't peek. There +# are many possible ways to do this. +# +# +# Solution: +( x <- table(table(Biostrings::GENETIC_CODE)) ) + +# confirm +sum(x * as.numeric(names(x))) + + + +# [END] diff --git a/FND-MAT-Graphs_and_networks.R b/FND-MAT-Graphs_and_networks.R index 760636c..654f909 100644 --- a/FND-MAT-Graphs_and_networks.R +++ b/FND-MAT-Graphs_and_networks.R @@ -1,691 +1,691 @@ -# tocID <- "FND-MAT-Graphs_and_networks.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the FND-MAT-Graphs_and_networks unit. -# -# Version: 1.2 -# -# Date: 2017 10 - 2019 01 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.1 Update set.seed() usage -# 1.0 First final version for learning units. -# 0.1 First code copied from 2016 material. -# -# -# TODO: Add some explicit tasks and sample solutions. -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------------------------------- -#TOC> 1 REVIEW 50 -#TOC> 2 DEGREE DISTRIBUTIONS 206 -#TOC> 2.1 Random graph 212 -#TOC> 2.2 scale-free graph (Barabasi-Albert) 260 -#TOC> 2.3 Random geometric graph 326 -#TOC> 3 A CLOSER LOOK AT THE igraph:: PACKAGE 448 -#TOC> 3.1 Basics 451 -#TOC> 3.2 Components 523 -#TOC> 4 RANDOM GRAPHS AND GRAPH METRICS 542 -#TOC> 4.1 Diameter 579 -#TOC> 5 GRAPH CLUSTERING 648 -#TOC> -#TOC> ========================================================================== - - -# = 1 REVIEW ============================================================== - -# This tutorial covers basic concepts of graph theory and analysis in R. Make -# sure you have pulled the latest version of the project from the GitHub -# repository. - -# Let's explore some of the basic ideas of graph theory by starting with a small -# random graph. - - -# To begin let's write a little function that will create random "gene" names; -# there's no particular purpose to this other than to make our graphs look a -# little more "biological" ... -makeRandomGenenames <- function(N) { - nam <- character() - while (length(nam) < N) { - a <- paste0(c(sample(LETTERS, 1), sample(letters, 2)), - collapse="") # one uppercase, two lowercase letters - n <- sample(1:9, 1) # one number - nam[length(nam) + 1] <- paste(a, n, sep="") # store in vector - nam <- unique(nam) # delete if this was a duplicate - } - return(nam) -} - -N <- 20 - -set.seed(112358) # set RNG seed for repeatable randomness -( Nnames <- makeRandomGenenames(N) ) -set.seed(NULL) # reset the RNG - -# One way to represent graphs in a computer is as an "adjacency matrix". In this -# matrix, each row and each column represents a node, and the cell at the -# intersection of a row and column contains a value/TRUE if there is an edge, -# 0/FALSE otherwise. - -# Let's create an adjacency matrix for our random graph: let's say a pair -# of nodes has probability p <- 0.09 to have an edge, and our graph is -# symmetric , i.e. it is an undirected graph, and it has neither self-edges, -# i.e. loops, nor multiple edges between the same nodes, i.e. it -# is a "simple" graph. We use the Nnames vector as node labels. - -makeRandomAM <- function(nam, p = 0.1) { - # Make a random adjacency matrix for a set of nodes with edge probability p - # Parameters: - # nam: a character vector of unique node names. - # p: probability that a random pair of nodes will have an edge. - # - # Value: an adjacency matrix for a simple, undirected graph - # - - N <- length(nam) - AM <- matrix(numeric(N * N), ncol = N) # Adjacency matrix, pre-filled with 0 - rownames(AM) <- nam - colnames(AM) <- nam - for (iRow in 1:(N-1)) { # Note how we make sure iRow != iCol - this prevents - # loops (self-edges) - for (iCol in (iRow+1):N) { - if (runif(1) < p) { # runif() creates uniform random numbers - # between 0 and 1. The expression is TRUE with - # probability p. if it is TRUE ... - AM[iRow, iCol] <- 1 # ... record an edge for the pair (iRow, iCol) - } - } - } - return(AM) -} - -set.seed(112358) # set RNG seed for repeatable randomness -( myRandAM <- makeRandomAM(Nnames, p = 0.09) ) -set.seed(NULL) # reset the RNG - - -# Listing the matrix is not very informative - we should plot this graph. The -# standard package for work with graphs in r is "igraph::". We'll go into more -# details of the igraph:: package a bit later, for now we just use it to plot: - -if (! requireNamespace("igraph", quietly = TRUE)) { - install.packages("igraph") -} -# Package information: -# library(help = igraph) # basic information -# browseVignettes("igraph") # available vignettes -# data(package = "igraph") # available datasets - - -myG <- igraph::graph_from_adjacency_matrix(myRandAM, mode = "undirected") - -set.seed(112358) # set RNG seed for repeatable randomness - # calculate layout coordinates -myGxy <- igraph::layout_with_graphopt(myG, - charge=0.0012) -set.seed(NULL) # reset the RNG - - -# The igraph:: package adds its own function to the collection of plot() -# functions; R makes the selection which plot function to use based on the class -# of the object that we request to plot. This plot function has parameters -# layout - the x,y coordinates of the nodes; -# vertex.color - which I define to color by node-degree -# vertex size - which I define to increase with node-degree -# vertex.label - which I set to combine the names of the vertices of the -# graph - names(V(iG)) - with the node degree - degree(iG). -# See ?igraph.plotting for the complete list of parameters - - -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myG, - layout = myGxy, - rescale = FALSE, - xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), - ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), - vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], - vertex.size = 1000 + (900 * igraph::degree(myG)), - vertex.label = sprintf("%s(%i)", names(igraph::V(myG)), igraph::degree(myG)), - vertex.label.family = "sans", - vertex.label.cex = 0.7) -par(oPar) # reset plot window - - -# The simplest descriptor of a graph are the number of nodes, edges, and the -# degree-distribution. In our example, the number of nodes was given: N; the -# number of edges can easily be calculated from the adjacency matrix. In our -# matrix, we have entered 1 for every edge. Thus we simply sum over the matrix: -sum(myRandAM) - -# Is that what you expect? - -# What about the degree distribution? We can get that simply by summing over the -# rows and summing over the columns and adding the two vectors. - -rowSums(myRandAM) + colSums(myRandAM) # check this against the plot! - -# The function degree() gives the same values -igraph::degree(myG) - -# Let's plot the degree distribution in a histogram: -degG <- igraph::degree(myG) -brk <- seq(min(degG)-0.5, max(degG)+0.5, by=1) # define histogram breaks -hist(degG, breaks=brk, col="#A5CCF5", - xlim = c(-1,8), xaxt = "n", - main = "Node degrees", xlab = "Degree", ylab = "Number") # plot histogram -axis(side = 1, at = 0:7) - -# Note: I don't _have_ to define breaks, the hist() function usually does so -# quite well, automatically. But for this purpose I want the columns of the -# histogram to represent exactly one node-degree difference. - -# A degree distribution is actually a very informative descriptor of graphs, -# since it is very sensitive to the generating mechanism. For biological -# networks, that is one of the key questions we are interested in: how was the -# network formed? Asking about the mechanism, the way the interactions -# support function and shape the fitness landscape in which the cell evolves, -# connects our mathematical abstraction with biological insight. - - -# = 2 DEGREE DISTRIBUTIONS ================================================ - -# Let's simulate a few graphs that are a bit bigger to get a better sense of -# their degree distributions: -# - -# == 2.1 Random graph ====================================================== - -N <- 200 - -set.seed(31415927) # set RNG seed for repeatable randomness -my200AM <- makeRandomAM(as.character(1:N), p = 0.015) -set.seed(NULL) # reset the RNG - -myG200 <- igraph::graph_from_adjacency_matrix(my200AM, mode = "undirected") -myGxy <- igraph::layout_with_graphopt(myG200, charge=0.0001) # calculate layout - # coordinates - -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off, save graphics state -plot(myG200, - layout = myGxy, - rescale = FALSE, - xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), - ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), - vertex.color=heat.colors(max(igraph::degree(myG200)+1))[igraph::degree(myG200)+1], - vertex.size = 150 + (70 * igraph::degree(myG200)), - vertex.label = NA) -par(oPar) # restore graphics state - -# This graph has thirteen singletons and one large, connected component. Many -# biological graphs look approximately like this. - -# Calculate degree distributions -dg <- igraph::degree(myG200) -brk <- seq(min(dg)-0.5, max(dg)+0.5, by=1) -hist(dg, breaks=brk, col="#A5F5CC", - xlim = c(-1,11), xaxt = "n", - main = "Node degrees", xlab = "Degree", ylab = "Number") # plot histogram -axis(side = 1, at = 0:10) - - -# Note the pronounced peak of this distribution: this is not "scale-free". -# Here is the log-log plot of frequency vs. degree-rank ... - -( freqRank <- table(dg) ) -plot(log10(as.numeric(names(freqRank)) + 1), - log10(as.numeric(freqRank)), type = "b", - pch = 21, bg = "#A5F5CC", - xlab = "log(Rank)", ylab = "log(frequency)", - main = "200 nodes in a random network") - -# ... which shows us that this does NOT correspond to the single-slope linear -# relationship that we expect for a "scale-free" graph. - -# == 2.2 scale-free graph (Barabasi-Albert) ================================ - -# What does one of those intriguing "scale-free" distributions look like? The -# iGraph:: package has a function to make random graphs according to the -# Barabasi-Albert model of scale-free graphs. It is: sample_pa(), where pa -# stands for "preferential attachment". Preferential attachment is _one_ type of -# process that will yield scale-free distributions. - -N <- 200 - -set.seed(31415927) # set RNG seed for repeatable randomness -GBA <- igraph::sample_pa(N, power = 0.8, directed = FALSE) -set.seed(NULL) # reset the RNG - -GBAxy <- igraph::layout_with_graphopt(GBA, charge=0.0001) - -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off, save graphics state -plot(GBA, - layout = GBAxy, - rescale = FALSE, - xlim = c(min(GBAxy[,1]) * 0.99, max(GBAxy[,1]) * 1.01), - ylim = c(min(GBAxy[,2]) * 0.99, max(GBAxy[,2]) * 1.01), - vertex.color=heat.colors(max(igraph::degree(GBA)+1))[igraph::degree(GBA)+1], - vertex.size = 200 + (30 * igraph::degree(GBA)), - vertex.label = NA) -par(oPar) # restore graphics state - -# This is a very obviously different graph! Some biological networks have -# features that look like that - but in my experience the hub nodes are usually -# not that distinct. But then again, that really depends on the parameter -# "power". Play with the "power" parameter and get a sense for what difference -# this makes. Also: note that the graph has only a single component - no -# singletons. - -# What's the degree distribution of this graph? -( dg <- igraph::degree(GBA) ) -brk <- seq(min(dg)-0.5, max(dg)+0.5, by=1) -hist(dg, breaks=brk, col="#DCF5B5", - xlim = c(0,max(dg)+1), xaxt = "n", - main = "Node degrees 200 nodes PA graph", - xlab = "Degree", ylab = "Number") -axis(side = 1, at = seq(0, max(dg)+1, by=5)) - -# Most nodes have a degree of 1, but one node has a degree of 19. - -(freqRank <- table(dg)) -plot(log10(as.numeric(names(freqRank)) + 1), - log10(as.numeric(freqRank)), type = "b", - pch = 21, bg = "#DCF5B5", - xlab = "log(Rank)", ylab = "log(frequency)", - main = "200 nodes in a preferential-attachment network") - -# Sort-of linear, but many of the higher ranked nodes have a frequency of only -# one. That behaviour smooths out in larger graphs - let's try 100000 nodes: -# -N <- 10000 -X <- igraph::sample_pa(N, power = 0.8, directed = FALSE) # 100,000 nodes -freqRank <- table(igraph::degree(X)) -plot(log10(as.numeric(names(freqRank)) + 1), - log10(as.numeric(freqRank)), type = "b", - xlab = "log(Rank)", ylab = "log(frequency)", - pch = 21, bg = "#A5F5CC", - main = "100,000 nodes in a random, scale-free network") -rm(X) - - -# == 2.3 Random geometric graph ============================================ - -# Finally, let's simulate a random geometric graph and look at the degree -# distribution. Remember: these graphs have a high probability to have edges -# between nodes that are "close" together - an entirely biological notion. - -# We'll randomly place our nodes in a box. Then we'll define the -# probability for two nodes to have an edge to be a function of their Euclidian -# distance in the box. - -# Here is a function that makes an adjacency matrix for such graphs. iGraph:: -# has a similar function, sample_grg(), which connects nodes that are closer -# than a cutoff, the function I give you below is a bit more interesting since -# it creates edges according to a probability that is determined by a -# generalized logistic function of the distance. This sigmoidal function gives -# a smooth cutoff and creates more "natural" graphs. Otherwise, the function is -# very similar to the random graph function, except that we output the -# "coordinates" of the nodes together with the adjacency matrix which we then -# use for the layout. list() FTW. - - -makeRandomGeometricAM <- function(nam, B = 25, Q = 0.001, t = 0.6) { - # Make an adjacency matrix for an undirected random geometric graph from - # edges connected with probabilities according to a generalized logistic - # function. - # Parameters: - # nam: a character vector of unique names - # B, Q, t: probability that a random pair (i, j) of nodes gets an - # edge determined by a generalized logistic function - # p <- 1 - 1/((1 + (Q * (exp(-B * (x-t)))))^(1 / 0.9))) - # - # Value: a list with the following components: - # AM$mat : an adjacency matrix - # AM$nam : labels for the nodes - # AM$x : x-coordinates for the nodes - # AM$y : y-coordinates for the nodes - # - nu <- 1 # probably not useful to change - AM <- list() - AM$nam <- nam - N <- length(AM$nam) - AM$mat <- matrix(numeric(N * N), ncol = N) # The adjacency matrix - rownames(AM$mat) <- AM$nam - colnames(AM$mat) <- AM$nam - AM$x <- runif(N) # Randomly place nodes into the unit square - AM$y <- runif(N) - for (iRow in 1:(N-1)) { # Same principles as in makeRandomGraph() - for (iCol in (iRow+1):N) { - # geometric distance ... - d <- sqrt((AM$x[iRow] - AM$x[iCol])^2 + - (AM$y[iRow] - AM$y[iCol])^2) # Pythagoras - # distance dependent probability - p <- 1 - 1/((1 + (Q * (exp(-B * (d-t)))))^(1 / nu)) - if (runif(1) < p) { - AM$mat[iRow, iCol] <- 1 - } - } - } - return(AM) -} - -# Getting the parameters of a generalized logistic right takes a bit of -# experimenting. If you are interested, you can try a few variations. Or you can -# look up the function at -# https://en.wikipedia.org/wiki/Generalised_logistic_function - -# This function computes generalized logistics ... -# genLog <- function(x, B = 25, Q = 0.001, t = 0.5) { -# # generalized logistic (sigmoid) -# nu <- 1 -# return(1 - 1/((1 + (Q * (exp(-B * (x-t)))))^(1 / nu))) -# } -# -# ... and this code plots p-values over the distances we could encouter between -# our nodes: from 0 to sqrt(2) i.e. the diagonal of the unit square in which we -# will place our nodes. -# x <- seq(0, sqrt(2), length.out = 50) -# plot(x, genLog(x), type="l", col="#AA0000", ylim = c(0, 1), -# xlab = "d", ylab = "p(edge)") - -# 200 node random geomteric graph -N <- 200 -set.seed(112358) # set RNG seed for repeatable randomness -rGAM <- makeRandomGeometricAM(as.character(1:N), t = 0.4) -set.seed(NULL) # reset the RNG - - -myGRG <- igraph::graph_from_adjacency_matrix(rGAM$mat, mode = "undirected") - -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myGRG, - layout = cbind(rGAM$x, rGAM$y), # use our node coordinates for layout, - rescale = FALSE, - xlim = c(min(rGAM$x) * 0.9, max(rGAM$x) * 1.1), - ylim = c(min(rGAM$y) * 0.9, max(rGAM$y) * 1.1), - vertex.color=heat.colors(max(igraph::degree(myGRG)+1))[igraph::degree(myGRG)+1], - vertex.size = 0.1 + (0.2 * igraph::degree(myGRG)), - vertex.label = NA) -par(oPar) - -# degree distribution: -(dg <- igraph::degree(myGRG)) -brk <- seq(min(dg) - 0.5, max(dg) + 0.5, by = 1) -hist(dg, breaks = brk, col = "#FCC6D2", - xlim = c(0, 25), xaxt = "n", - main = "Node degrees: 200 nodes RG graph", - xlab = "Degree", ylab = "Number") -axis(side = 1, at = c(0, min(dg):max(dg))) - -# You'll find that this is kind of in-between the random, and the scale-free -# graph. We do have hubs, but they are not as extreme as in the scale-free case; -# and we have have no singletons, in contrast to the random graph. - -(freqRank <- table(dg)) -plot(log10(as.numeric(names(freqRank)) + 1), - log10(as.numeric(freqRank)), type = "b", - pch = 21, bg = "#FCC6D2", - xlab = "log(Rank)", ylab = "log(frequency)", - main = "200 nodes in a random geometric network") - - - -# = 3 A CLOSER LOOK AT THE igraph:: PACKAGE =============================== - - -# == 3.1 Basics ============================================================ - -# The basic object of the igraph:: package is a graph object. Let's explore the -# first graph some more, the one we built with our random gene names: -summary(myG) - -# This output means: this is an IGRAPH graph, with U = UN-directed edges -# and N = named nodes, that has 20 nodes and 20 edges. For details, see -?igraph::print.igraph - -mode(myG) -class(myG) - -# This means an igraph:: graph object is a special list object; it is opaque in -# the sense that a user is never expected to modify its components directly, but -# through a variety of helper functions which the package provides. There are -# many ways to construct graphs - from adjacency matrices, as we have just done, -# from edge lists, or by producing random graphs according to a variety of -# recipes, called _games_ in this package. - -# Two basic functions retrieve nodes "Vertices", and "Edges": -igraph::V(myG) -igraph::E(myG) - -# additional properties can be retrieved from the Vertices ... -igraph::V(myG)$name - - -# As with many R objects, loading the package provides special functions that -# can be accessed via the same name as the basic R functions, for example: - -print(myG) -plot(myG) # this is the result of default plot parameters - -# ... where plot() allows the usual flexibility of fine-tuning the plot. We -# first layout the node coordinates with the Fruchtermann-Reingold algorithm - a -# force-directed layout that applies an ettractive potential along edges (which -# pulls nodes together) and a repulsive potential to nodes (so they don't -# overlap). Note the use of the degree() function to color and scale nodes and -# labels by degree and the use of the V() function to retrieve the vertex names. -# See ?plot.igraph for details." - -# Plot with some customizing parameters -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myG, - layout = igraph::layout_with_fr(myG), - vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], - vertex.size = 12 + (5 * igraph::degree(myG)), - vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), - edge.width = 2, - vertex.label = igraph::V(myG)$name, - vertex.label.family = "sans", - vertex.label.cex = 0.9) -par(oPar) - -# ... or with a different layout: -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myG, - layout = igraph::layout_in_circle(myG), - vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], - vertex.size = 12 + (5 * igraph::degree(myG)), - vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), - edge.width = 2, - vertex.label = igraph::V(myG)$name, - vertex.label.family = "sans", - vertex.label.cex = 0.9) -par(oPar) - -# igraph:: has a large number of graph-layout functions: see -# ?layout_ and try them all. - - -# == 3.2 Components ======================================================== - -# The function igrap::components() tells us whether there are components of the -# graph in which there is no path to other components. -igraph::components(myG) - -# In the _membership_ vector, nodes are annotated with the index of the -# component they are part of. Sui7 is the only node of component 2, Cyj1 is in -# the third component etc. This is perhaps more clear if we sort by component -# index -sort(igraph::components(myG)$membership, decreasing = TRUE) - -# Retrieving e.g. the members of the first component from the list can be done by subsetting: - -(sel <- igraph::components(myG)$membership == 1) # boolean vector .. -(c1 <- igraph::components(myG)$membership[sel]) -names(c1) - - -# = 4 RANDOM GRAPHS AND GRAPH METRICS ===================================== - - -# Let's explore some of the more interesting, topological graph measures. We -# start by building a somewhat bigger graph. We aren't quite sure whether -# biological graphs are small-world, or random-geometric, or -# preferential-attachment ... but igraph:: has ways to simulate the basic ones -# (and we could easily simulate our own). Look at the following help pages: - -?igraph::sample_gnm # see also sample_gnp for the Erdös-Rényi models -?igraph::sample_smallworld # for the Watts & Strogatz model -?igraph::sample_pa # for the Barabasi-Albert model - -# But note that there are many more sample_ functions. Check out the docs! - -# Let's look at betweenness measures for our first graph. Here: the nodes again -# colored by degree. Degree centrality states: nodes of higher degree are -# considered to be more central. And that's also the way the force-directed -# layout drawas them, obviously. - -set.seed(112358) # set RNG seed for repeatable randomness -myGxy <- igraph::layout_with_fr(myG) # calculate layout coordinates -set.seed(NULL) # reset the RNG - -oPar <- par(mar = rep(0, 4)) # turn margins off, save graphics state -plot(myG, - layout = myGxy, - rescale = FALSE, - xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), - ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), - vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], - vertex.size = 40 + (15 * igraph::degree(myG)), - vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), - vertex.label = igraph::V(myG)$name, - vertex.label.family = "sans") -par(oPar) # restore graphics state - -# == 4.1 Diameter ========================================================== - -igraph::diameter(myG) # The diameter of a graph is its maximum length - # shortest path. - -# let's plot this path: here are the nodes ... -igraph::get_diameter(myG) - -# ... and we can get the x, y coordinates from iGxy by subsetting with the node -# names. The we draw the diameter-path with a transparent, thick pink line: -lines(myGxy[igraph::get_diameter(myG),], lwd=10, col="#ff63a788") - -# == Centralization scores - -?igraph::centralize -# replot our graph, and color by log_betweenness: - -bC <- igraph::centr_betw(myG) # calculate betweenness centrality -nodeBetw <- bC$res -nodeBetw <- round(log(nodeBetw +1)) + 1 - -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myG, - layout = myGxy, - rescale = FALSE, - xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), - ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), - vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], - vertex.size = 40 + (15 * igraph::degree(myG)), - vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), - vertex.label = igraph::V(myG)$name, - vertex.label.family = "sans") -par(oPar) - -# Note that the betweenness - the number of shortest paths that pass through a -# node, is in general higher for high-degree nodes - but not always: Eqr2 has -# higher betweenness than Itv7: this measure really depends on the detailed -# local topology of the graph." - -# Can you use centr_eigen() and centr_degree() to calculate the respective -# values? That's something I would expect you to be able to do. -# -# Lets plot betweenness centrality for our random geometric graph: - -bCmyGRG <- igraph::centr_betw(myGRG) # calculate betweenness centrality - -nodeBetw <- bCmyGRG$res -nodeBetw <- round((log(nodeBetw +1))^2.5) + 1 - -# colours and size proportional to betweenness -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myGRG, - layout = cbind(rGAM$x, rGAM$y), # use our node coordinates for layout, - rescale = FALSE, - xlim = c(min(rGAM$x) * 0.9, max(rGAM$x) * 1.1), - ylim = c(min(rGAM$y) * 0.9, max(rGAM$y) * 1.1), - vertex.color=heat.colors(max(nodeBetw))[nodeBetw], - vertex.size = 0.1 + (0.03 * nodeBetw), - vertex.label = NA) -par(oPar) - -igraph::diameter(myGRG) -lines(rGAM$x[igraph::get_diameter(myGRG)], - rGAM$y[igraph::get_diameter(myGRG)], - lwd = 10, - col = "#ff335533") - - - -# = 5 GRAPH CLUSTERING ==================================================== - - -# Clustering finds "communities" in graphs - and depending what the edges -# represent, these could be complexes, pathways, biological systems or similar. -# There are many graph-clustering algorithms. One approach with many attractive -# properties is the Map Equation, developed by Martin Rosvall. See: -# http://www.ncbi.nlm.nih.gov/pubmed/18216267 and htttp://www.mapequation.org - - -myGRGclusters <- igraph::cluster_infomap(myGRG) -igraph::modularity(myGRGclusters) # ... measures how separated the different - # membership types are from each other -igraph::membership(myGRGclusters) # which nodes are in what cluster? -table(igraph::membership(myGRGclusters)) # how large are the clusters? - -# The largest cluster has 48 members, the second largest has 25, etc. - - -# Lets plot our graph again, coloring the nodes of the first five communities by -# their cluster membership: - -# first, make a vector with as many grey colors as we have communities ... -commColors <- rep("#f1eef6", max(igraph::membership(myGRGclusters))) -# ... then overwrite the first five with "real colors" - something like rust, -# lilac, pink, and mauve or so. -commColors[1:5] <- c("#980043", "#dd1c77", "#df65b0", "#c994c7", "#d4b9da") - - -oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off -plot(myGRG, - layout = cbind(rGAM$x, rGAM$y), - rescale = FALSE, - xlim = c(min(rGAM$x) * 0.9, max(rGAM$x) * 1.1), - ylim = c(min(rGAM$y) * 0.9, max(rGAM$y) * 1.1), - vertex.color=commColors[igraph::membership(myGRGclusters)], - vertex.size = 0.3 + (0.4 * igraph::degree(myGRG)), - vertex.label = NA) -par(oPar) - -# That's all. - - -# [END] +# tocID <- "FND-MAT-Graphs_and_networks.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the FND-MAT-Graphs_and_networks unit. +# +# Version: 1.2 +# +# Date: 2017 10 - 2019 01 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.1 Update set.seed() usage +# 1.0 First final version for learning units. +# 0.1 First code copied from 2016 material. +# +# +# TODO: Add some explicit tasks and sample solutions. +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------------------------------- +#TOC> 1 REVIEW 50 +#TOC> 2 DEGREE DISTRIBUTIONS 206 +#TOC> 2.1 Random graph 212 +#TOC> 2.2 scale-free graph (Barabasi-Albert) 260 +#TOC> 2.3 Random geometric graph 326 +#TOC> 3 A CLOSER LOOK AT THE igraph:: PACKAGE 448 +#TOC> 3.1 Basics 451 +#TOC> 3.2 Components 523 +#TOC> 4 RANDOM GRAPHS AND GRAPH METRICS 542 +#TOC> 4.1 Diameter 579 +#TOC> 5 GRAPH CLUSTERING 648 +#TOC> +#TOC> ========================================================================== + + +# = 1 REVIEW ============================================================== + +# This tutorial covers basic concepts of graph theory and analysis in R. Make +# sure you have pulled the latest version of the project from the GitHub +# repository. + +# Let's explore some of the basic ideas of graph theory by starting with a small +# random graph. + + +# To begin let's write a little function that will create random "gene" names; +# there's no particular purpose to this other than to make our graphs look a +# little more "biological" ... +makeRandomGenenames <- function(N) { + nam <- character() + while (length(nam) < N) { + a <- paste0(c(sample(LETTERS, 1), sample(letters, 2)), + collapse="") # one uppercase, two lowercase letters + n <- sample(1:9, 1) # one number + nam[length(nam) + 1] <- paste(a, n, sep="") # store in vector + nam <- unique(nam) # delete if this was a duplicate + } + return(nam) +} + +N <- 20 + +set.seed(112358) # set RNG seed for repeatable randomness +( Nnames <- makeRandomGenenames(N) ) +set.seed(NULL) # reset the RNG + +# One way to represent graphs in a computer is as an "adjacency matrix". In this +# matrix, each row and each column represents a node, and the cell at the +# intersection of a row and column contains a value/TRUE if there is an edge, +# 0/FALSE otherwise. + +# Let's create an adjacency matrix for our random graph: let's say a pair +# of nodes has probability p <- 0.09 to have an edge, and our graph is +# symmetric , i.e. it is an undirected graph, and it has neither self-edges, +# i.e. loops, nor multiple edges between the same nodes, i.e. it +# is a "simple" graph. We use the Nnames vector as node labels. + +makeRandomAM <- function(nam, p = 0.1) { + # Make a random adjacency matrix for a set of nodes with edge probability p + # Parameters: + # nam: a character vector of unique node names. + # p: probability that a random pair of nodes will have an edge. + # + # Value: an adjacency matrix for a simple, undirected graph + # + + N <- length(nam) + AM <- matrix(numeric(N * N), ncol = N) # Adjacency matrix, pre-filled with 0 + rownames(AM) <- nam + colnames(AM) <- nam + for (iRow in 1:(N-1)) { # Note how we make sure iRow != iCol - this prevents + # loops (self-edges) + for (iCol in (iRow+1):N) { + if (runif(1) < p) { # runif() creates uniform random numbers + # between 0 and 1. The expression is TRUE with + # probability p. if it is TRUE ... + AM[iRow, iCol] <- 1 # ... record an edge for the pair (iRow, iCol) + } + } + } + return(AM) +} + +set.seed(112358) # set RNG seed for repeatable randomness +( myRandAM <- makeRandomAM(Nnames, p = 0.09) ) +set.seed(NULL) # reset the RNG + + +# Listing the matrix is not very informative - we should plot this graph. The +# standard package for work with graphs in r is "igraph::". We'll go into more +# details of the igraph:: package a bit later, for now we just use it to plot: + +if (! requireNamespace("igraph", quietly = TRUE)) { + install.packages("igraph") +} +# Package information: +# library(help = igraph) # basic information +# browseVignettes("igraph") # available vignettes +# data(package = "igraph") # available datasets + + +myG <- igraph::graph_from_adjacency_matrix(myRandAM, mode = "undirected") + +set.seed(112358) # set RNG seed for repeatable randomness + # calculate layout coordinates +myGxy <- igraph::layout_with_graphopt(myG, + charge=0.0012) +set.seed(NULL) # reset the RNG + + +# The igraph:: package adds its own function to the collection of plot() +# functions; R makes the selection which plot function to use based on the class +# of the object that we request to plot. This plot function has parameters +# layout - the x,y coordinates of the nodes; +# vertex.color - which I define to color by node-degree +# vertex size - which I define to increase with node-degree +# vertex.label - which I set to combine the names of the vertices of the +# graph - names(V(iG)) - with the node degree - degree(iG). +# See ?igraph.plotting for the complete list of parameters + + +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myG, + layout = myGxy, + rescale = FALSE, + xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), + ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), + vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], + vertex.size = 1000 + (900 * igraph::degree(myG)), + vertex.label = sprintf("%s(%i)", names(igraph::V(myG)), igraph::degree(myG)), + vertex.label.family = "sans", + vertex.label.cex = 0.7) +par(oPar) # reset plot window + + +# The simplest descriptor of a graph are the number of nodes, edges, and the +# degree-distribution. In our example, the number of nodes was given: N; the +# number of edges can easily be calculated from the adjacency matrix. In our +# matrix, we have entered 1 for every edge. Thus we simply sum over the matrix: +sum(myRandAM) + +# Is that what you expect? + +# What about the degree distribution? We can get that simply by summing over the +# rows and summing over the columns and adding the two vectors. + +rowSums(myRandAM) + colSums(myRandAM) # check this against the plot! + +# The function degree() gives the same values +igraph::degree(myG) + +# Let's plot the degree distribution in a histogram: +degG <- igraph::degree(myG) +brk <- seq(min(degG)-0.5, max(degG)+0.5, by=1) # define histogram breaks +hist(degG, breaks=brk, col="#A5CCF5", + xlim = c(-1,8), xaxt = "n", + main = "Node degrees", xlab = "Degree", ylab = "Number") # plot histogram +axis(side = 1, at = 0:7) + +# Note: I don't _have_ to define breaks, the hist() function usually does so +# quite well, automatically. But for this purpose I want the columns of the +# histogram to represent exactly one node-degree difference. + +# A degree distribution is actually a very informative descriptor of graphs, +# since it is very sensitive to the generating mechanism. For biological +# networks, that is one of the key questions we are interested in: how was the +# network formed? Asking about the mechanism, the way the interactions +# support function and shape the fitness landscape in which the cell evolves, +# connects our mathematical abstraction with biological insight. + + +# = 2 DEGREE DISTRIBUTIONS ================================================ + +# Let's simulate a few graphs that are a bit bigger to get a better sense of +# their degree distributions: +# + +# == 2.1 Random graph ====================================================== + +N <- 200 + +set.seed(31415927) # set RNG seed for repeatable randomness +my200AM <- makeRandomAM(as.character(1:N), p = 0.015) +set.seed(NULL) # reset the RNG + +myG200 <- igraph::graph_from_adjacency_matrix(my200AM, mode = "undirected") +myGxy <- igraph::layout_with_graphopt(myG200, charge=0.0001) # calculate layout + # coordinates + +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off, save graphics state +plot(myG200, + layout = myGxy, + rescale = FALSE, + xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), + ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), + vertex.color=heat.colors(max(igraph::degree(myG200)+1))[igraph::degree(myG200)+1], + vertex.size = 150 + (70 * igraph::degree(myG200)), + vertex.label = NA) +par(oPar) # restore graphics state + +# This graph has thirteen singletons and one large, connected component. Many +# biological graphs look approximately like this. + +# Calculate degree distributions +dg <- igraph::degree(myG200) +brk <- seq(min(dg)-0.5, max(dg)+0.5, by=1) +hist(dg, breaks=brk, col="#A5F5CC", + xlim = c(-1,11), xaxt = "n", + main = "Node degrees", xlab = "Degree", ylab = "Number") # plot histogram +axis(side = 1, at = 0:10) + + +# Note the pronounced peak of this distribution: this is not "scale-free". +# Here is the log-log plot of frequency vs. degree-rank ... + +( freqRank <- table(dg) ) +plot(log10(as.numeric(names(freqRank)) + 1), + log10(as.numeric(freqRank)), type = "b", + pch = 21, bg = "#A5F5CC", + xlab = "log(Rank)", ylab = "log(frequency)", + main = "200 nodes in a random network") + +# ... which shows us that this does NOT correspond to the single-slope linear +# relationship that we expect for a "scale-free" graph. + +# == 2.2 scale-free graph (Barabasi-Albert) ================================ + +# What does one of those intriguing "scale-free" distributions look like? The +# iGraph:: package has a function to make random graphs according to the +# Barabasi-Albert model of scale-free graphs. It is: sample_pa(), where pa +# stands for "preferential attachment". Preferential attachment is _one_ type of +# process that will yield scale-free distributions. + +N <- 200 + +set.seed(31415927) # set RNG seed for repeatable randomness +GBA <- igraph::sample_pa(N, power = 0.8, directed = FALSE) +set.seed(NULL) # reset the RNG + +GBAxy <- igraph::layout_with_graphopt(GBA, charge=0.0001) + +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off, save graphics state +plot(GBA, + layout = GBAxy, + rescale = FALSE, + xlim = c(min(GBAxy[,1]) * 0.99, max(GBAxy[,1]) * 1.01), + ylim = c(min(GBAxy[,2]) * 0.99, max(GBAxy[,2]) * 1.01), + vertex.color=heat.colors(max(igraph::degree(GBA)+1))[igraph::degree(GBA)+1], + vertex.size = 200 + (30 * igraph::degree(GBA)), + vertex.label = NA) +par(oPar) # restore graphics state + +# This is a very obviously different graph! Some biological networks have +# features that look like that - but in my experience the hub nodes are usually +# not that distinct. But then again, that really depends on the parameter +# "power". Play with the "power" parameter and get a sense for what difference +# this makes. Also: note that the graph has only a single component - no +# singletons. + +# What's the degree distribution of this graph? +( dg <- igraph::degree(GBA) ) +brk <- seq(min(dg)-0.5, max(dg)+0.5, by=1) +hist(dg, breaks=brk, col="#DCF5B5", + xlim = c(0,max(dg)+1), xaxt = "n", + main = "Node degrees 200 nodes PA graph", + xlab = "Degree", ylab = "Number") +axis(side = 1, at = seq(0, max(dg)+1, by=5)) + +# Most nodes have a degree of 1, but one node has a degree of 19. + +(freqRank <- table(dg)) +plot(log10(as.numeric(names(freqRank)) + 1), + log10(as.numeric(freqRank)), type = "b", + pch = 21, bg = "#DCF5B5", + xlab = "log(Rank)", ylab = "log(frequency)", + main = "200 nodes in a preferential-attachment network") + +# Sort-of linear, but many of the higher ranked nodes have a frequency of only +# one. That behaviour smooths out in larger graphs - let's try 100000 nodes: +# +N <- 10000 +X <- igraph::sample_pa(N, power = 0.8, directed = FALSE) # 100,000 nodes +freqRank <- table(igraph::degree(X)) +plot(log10(as.numeric(names(freqRank)) + 1), + log10(as.numeric(freqRank)), type = "b", + xlab = "log(Rank)", ylab = "log(frequency)", + pch = 21, bg = "#A5F5CC", + main = "100,000 nodes in a random, scale-free network") +rm(X) + + +# == 2.3 Random geometric graph ============================================ + +# Finally, let's simulate a random geometric graph and look at the degree +# distribution. Remember: these graphs have a high probability to have edges +# between nodes that are "close" together - an entirely biological notion. + +# We'll randomly place our nodes in a box. Then we'll define the +# probability for two nodes to have an edge to be a function of their Euclidian +# distance in the box. + +# Here is a function that makes an adjacency matrix for such graphs. iGraph:: +# has a similar function, sample_grg(), which connects nodes that are closer +# than a cutoff, the function I give you below is a bit more interesting since +# it creates edges according to a probability that is determined by a +# generalized logistic function of the distance. This sigmoidal function gives +# a smooth cutoff and creates more "natural" graphs. Otherwise, the function is +# very similar to the random graph function, except that we output the +# "coordinates" of the nodes together with the adjacency matrix which we then +# use for the layout. list() FTW. + + +makeRandomGeometricAM <- function(nam, B = 25, Q = 0.001, t = 0.6) { + # Make an adjacency matrix for an undirected random geometric graph from + # edges connected with probabilities according to a generalized logistic + # function. + # Parameters: + # nam: a character vector of unique names + # B, Q, t: probability that a random pair (i, j) of nodes gets an + # edge determined by a generalized logistic function + # p <- 1 - 1/((1 + (Q * (exp(-B * (x-t)))))^(1 / 0.9))) + # + # Value: a list with the following components: + # AM$mat : an adjacency matrix + # AM$nam : labels for the nodes + # AM$x : x-coordinates for the nodes + # AM$y : y-coordinates for the nodes + # + nu <- 1 # probably not useful to change + AM <- list() + AM$nam <- nam + N <- length(AM$nam) + AM$mat <- matrix(numeric(N * N), ncol = N) # The adjacency matrix + rownames(AM$mat) <- AM$nam + colnames(AM$mat) <- AM$nam + AM$x <- runif(N) # Randomly place nodes into the unit square + AM$y <- runif(N) + for (iRow in 1:(N-1)) { # Same principles as in makeRandomGraph() + for (iCol in (iRow+1):N) { + # geometric distance ... + d <- sqrt((AM$x[iRow] - AM$x[iCol])^2 + + (AM$y[iRow] - AM$y[iCol])^2) # Pythagoras + # distance dependent probability + p <- 1 - 1/((1 + (Q * (exp(-B * (d-t)))))^(1 / nu)) + if (runif(1) < p) { + AM$mat[iRow, iCol] <- 1 + } + } + } + return(AM) +} + +# Getting the parameters of a generalized logistic right takes a bit of +# experimenting. If you are interested, you can try a few variations. Or you can +# look up the function at +# https://en.wikipedia.org/wiki/Generalised_logistic_function + +# This function computes generalized logistics ... +# genLog <- function(x, B = 25, Q = 0.001, t = 0.5) { +# # generalized logistic (sigmoid) +# nu <- 1 +# return(1 - 1/((1 + (Q * (exp(-B * (x-t)))))^(1 / nu))) +# } +# +# ... and this code plots p-values over the distances we could encouter between +# our nodes: from 0 to sqrt(2) i.e. the diagonal of the unit square in which we +# will place our nodes. +# x <- seq(0, sqrt(2), length.out = 50) +# plot(x, genLog(x), type="l", col="#AA0000", ylim = c(0, 1), +# xlab = "d", ylab = "p(edge)") + +# 200 node random geomteric graph +N <- 200 +set.seed(112358) # set RNG seed for repeatable randomness +rGAM <- makeRandomGeometricAM(as.character(1:N), t = 0.4) +set.seed(NULL) # reset the RNG + + +myGRG <- igraph::graph_from_adjacency_matrix(rGAM$mat, mode = "undirected") + +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myGRG, + layout = cbind(rGAM$x, rGAM$y), # use our node coordinates for layout, + rescale = FALSE, + xlim = c(min(rGAM$x) * 0.9, max(rGAM$x) * 1.1), + ylim = c(min(rGAM$y) * 0.9, max(rGAM$y) * 1.1), + vertex.color=heat.colors(max(igraph::degree(myGRG)+1))[igraph::degree(myGRG)+1], + vertex.size = 0.1 + (0.2 * igraph::degree(myGRG)), + vertex.label = NA) +par(oPar) + +# degree distribution: +(dg <- igraph::degree(myGRG)) +brk <- seq(min(dg) - 0.5, max(dg) + 0.5, by = 1) +hist(dg, breaks = brk, col = "#FCC6D2", + xlim = c(0, 25), xaxt = "n", + main = "Node degrees: 200 nodes RG graph", + xlab = "Degree", ylab = "Number") +axis(side = 1, at = c(0, min(dg):max(dg))) + +# You'll find that this is kind of in-between the random, and the scale-free +# graph. We do have hubs, but they are not as extreme as in the scale-free case; +# and we have have no singletons, in contrast to the random graph. + +(freqRank <- table(dg)) +plot(log10(as.numeric(names(freqRank)) + 1), + log10(as.numeric(freqRank)), type = "b", + pch = 21, bg = "#FCC6D2", + xlab = "log(Rank)", ylab = "log(frequency)", + main = "200 nodes in a random geometric network") + + + +# = 3 A CLOSER LOOK AT THE igraph:: PACKAGE =============================== + + +# == 3.1 Basics ============================================================ + +# The basic object of the igraph:: package is a graph object. Let's explore the +# first graph some more, the one we built with our random gene names: +summary(myG) + +# This output means: this is an IGRAPH graph, with U = UN-directed edges +# and N = named nodes, that has 20 nodes and 20 edges. For details, see +?igraph::print.igraph + +mode(myG) +class(myG) + +# This means an igraph:: graph object is a special list object; it is opaque in +# the sense that a user is never expected to modify its components directly, but +# through a variety of helper functions which the package provides. There are +# many ways to construct graphs - from adjacency matrices, as we have just done, +# from edge lists, or by producing random graphs according to a variety of +# recipes, called _games_ in this package. + +# Two basic functions retrieve nodes "Vertices", and "Edges": +igraph::V(myG) +igraph::E(myG) + +# additional properties can be retrieved from the Vertices ... +igraph::V(myG)$name + + +# As with many R objects, loading the package provides special functions that +# can be accessed via the same name as the basic R functions, for example: + +print(myG) +plot(myG) # this is the result of default plot parameters + +# ... where plot() allows the usual flexibility of fine-tuning the plot. We +# first layout the node coordinates with the Fruchtermann-Reingold algorithm - a +# force-directed layout that applies an ettractive potential along edges (which +# pulls nodes together) and a repulsive potential to nodes (so they don't +# overlap). Note the use of the degree() function to color and scale nodes and +# labels by degree and the use of the V() function to retrieve the vertex names. +# See ?plot.igraph for details." + +# Plot with some customizing parameters +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myG, + layout = igraph::layout_with_fr(myG), + vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], + vertex.size = 12 + (5 * igraph::degree(myG)), + vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), + edge.width = 2, + vertex.label = igraph::V(myG)$name, + vertex.label.family = "sans", + vertex.label.cex = 0.9) +par(oPar) + +# ... or with a different layout: +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myG, + layout = igraph::layout_in_circle(myG), + vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], + vertex.size = 12 + (5 * igraph::degree(myG)), + vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), + edge.width = 2, + vertex.label = igraph::V(myG)$name, + vertex.label.family = "sans", + vertex.label.cex = 0.9) +par(oPar) + +# igraph:: has a large number of graph-layout functions: see +# ?layout_ and try them all. + + +# == 3.2 Components ======================================================== + +# The function igrap::components() tells us whether there are components of the +# graph in which there is no path to other components. +igraph::components(myG) + +# In the _membership_ vector, nodes are annotated with the index of the +# component they are part of. Sui7 is the only node of component 2, Cyj1 is in +# the third component etc. This is perhaps more clear if we sort by component +# index +sort(igraph::components(myG)$membership, decreasing = TRUE) + +# Retrieving e.g. the members of the first component from the list can be done by subsetting: + +(sel <- igraph::components(myG)$membership == 1) # boolean vector .. +(c1 <- igraph::components(myG)$membership[sel]) +names(c1) + + +# = 4 RANDOM GRAPHS AND GRAPH METRICS ===================================== + + +# Let's explore some of the more interesting, topological graph measures. We +# start by building a somewhat bigger graph. We aren't quite sure whether +# biological graphs are small-world, or random-geometric, or +# preferential-attachment ... but igraph:: has ways to simulate the basic ones +# (and we could easily simulate our own). Look at the following help pages: + +?igraph::sample_gnm # see also sample_gnp for the Erdös-Rényi models +?igraph::sample_smallworld # for the Watts & Strogatz model +?igraph::sample_pa # for the Barabasi-Albert model + +# But note that there are many more sample_ functions. Check out the docs! + +# Let's look at betweenness measures for our first graph. Here: the nodes again +# colored by degree. Degree centrality states: nodes of higher degree are +# considered to be more central. And that's also the way the force-directed +# layout drawas them, obviously. + +set.seed(112358) # set RNG seed for repeatable randomness +myGxy <- igraph::layout_with_fr(myG) # calculate layout coordinates +set.seed(NULL) # reset the RNG + +oPar <- par(mar = rep(0, 4)) # turn margins off, save graphics state +plot(myG, + layout = myGxy, + rescale = FALSE, + xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), + ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), + vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], + vertex.size = 40 + (15 * igraph::degree(myG)), + vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), + vertex.label = igraph::V(myG)$name, + vertex.label.family = "sans") +par(oPar) # restore graphics state + +# == 4.1 Diameter ========================================================== + +igraph::diameter(myG) # The diameter of a graph is its maximum length + # shortest path. + +# let's plot this path: here are the nodes ... +igraph::get_diameter(myG) + +# ... and we can get the x, y coordinates from iGxy by subsetting with the node +# names. The we draw the diameter-path with a transparent, thick pink line: +lines(myGxy[igraph::get_diameter(myG),], lwd=10, col="#ff63a788") + +# == Centralization scores + +?igraph::centralize +# replot our graph, and color by log_betweenness: + +bC <- igraph::centr_betw(myG) # calculate betweenness centrality +nodeBetw <- bC$res +nodeBetw <- round(log(nodeBetw +1)) + 1 + +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myG, + layout = myGxy, + rescale = FALSE, + xlim = c(min(myGxy[,1]) * 0.99, max(myGxy[,1]) * 1.01), + ylim = c(min(myGxy[,2]) * 0.99, max(myGxy[,2]) * 1.01), + vertex.color=heat.colors(max(igraph::degree(myG)+1))[igraph::degree(myG)+1], + vertex.size = 40 + (15 * igraph::degree(myG)), + vertex.label.cex = 0.4 + (0.15 * igraph::degree(myG)), + vertex.label = igraph::V(myG)$name, + vertex.label.family = "sans") +par(oPar) + +# Note that the betweenness - the number of shortest paths that pass through a +# node, is in general higher for high-degree nodes - but not always: Eqr2 has +# higher betweenness than Itv7: this measure really depends on the detailed +# local topology of the graph." + +# Can you use centr_eigen() and centr_degree() to calculate the respective +# values? That's something I would expect you to be able to do. +# +# Lets plot betweenness centrality for our random geometric graph: + +bCmyGRG <- igraph::centr_betw(myGRG) # calculate betweenness centrality + +nodeBetw <- bCmyGRG$res +nodeBetw <- round((log(nodeBetw +1))^2.5) + 1 + +# colours and size proportional to betweenness +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myGRG, + layout = cbind(rGAM$x, rGAM$y), # use our node coordinates for layout, + rescale = FALSE, + xlim = c(min(rGAM$x) * 0.9, max(rGAM$x) * 1.1), + ylim = c(min(rGAM$y) * 0.9, max(rGAM$y) * 1.1), + vertex.color=heat.colors(max(nodeBetw))[nodeBetw], + vertex.size = 0.1 + (0.03 * nodeBetw), + vertex.label = NA) +par(oPar) + +igraph::diameter(myGRG) +lines(rGAM$x[igraph::get_diameter(myGRG)], + rGAM$y[igraph::get_diameter(myGRG)], + lwd = 10, + col = "#ff335533") + + + +# = 5 GRAPH CLUSTERING ==================================================== + + +# Clustering finds "communities" in graphs - and depending what the edges +# represent, these could be complexes, pathways, biological systems or similar. +# There are many graph-clustering algorithms. One approach with many attractive +# properties is the Map Equation, developed by Martin Rosvall. See: +# http://www.ncbi.nlm.nih.gov/pubmed/18216267 and htttp://www.mapequation.org + + +myGRGclusters <- igraph::cluster_infomap(myGRG) +igraph::modularity(myGRGclusters) # ... measures how separated the different + # membership types are from each other +igraph::membership(myGRGclusters) # which nodes are in what cluster? +table(igraph::membership(myGRGclusters)) # how large are the clusters? + +# The largest cluster has 48 members, the second largest has 25, etc. + + +# Lets plot our graph again, coloring the nodes of the first five communities by +# their cluster membership: + +# first, make a vector with as many grey colors as we have communities ... +commColors <- rep("#f1eef6", max(igraph::membership(myGRGclusters))) +# ... then overwrite the first five with "real colors" - something like rust, +# lilac, pink, and mauve or so. +commColors[1:5] <- c("#980043", "#dd1c77", "#df65b0", "#c994c7", "#d4b9da") + + +oPar <- par(mar= c(0, 0, 0, 0)) # Turn margins off +plot(myGRG, + layout = cbind(rGAM$x, rGAM$y), + rescale = FALSE, + xlim = c(min(rGAM$x) * 0.9, max(rGAM$x) * 1.1), + ylim = c(min(rGAM$y) * 0.9, max(rGAM$y) * 1.1), + vertex.color=commColors[igraph::membership(myGRGclusters)], + vertex.size = 0.3 + (0.4 * igraph::degree(myGRG)), + vertex.label = NA) +par(oPar) + +# That's all. + + +# [END] diff --git a/FND-STA-Information_theory.R b/FND-STA-Information_theory.R index a5eb783..230e0a7 100644 --- a/FND-STA-Information_theory.R +++ b/FND-STA-Information_theory.R @@ -1,224 +1,224 @@ -# tocID <- "FND-STA-Information_theory.R" -# -# ============================================================================== -# -# Purpose: A Bioinformatics Course: -# R code accompanying the FND-STA-Information_theory unit. -# -# Version: 0.2.1 -# -# Date: 2017 - 2021 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 0.2.1 Maintenance -# 0.2 Under development -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------- -#TOC> 1 ___Section___ 39 -#TOC> -#TOC> ========================================================================== - - -# = 1 ___Section___ ======================================================= - -# What level of information is "significant" - -# Assume the background distribution is the database frequencies of -# amino acids: - -AAref <- numeric() # Uniprot frequencies October 2017, slightly adjusted to -# sum to 1.0 -AAref["A"] <- 0.0904 -AAref["C"] <- 0.0123 -AAref["D"] <- 0.0545 -AAref["E"] <- 0.0617 -AAref["F"] <- 0.0394 -AAref["G"] <- 0.0724 -AAref["H"] <- 0.0221 -AAref["I"] <- 0.0573 -AAref["K"] <- 0.0504 -AAref["L"] <- 0.0986 -AAref["M"] <- 0.0240 -AAref["N"] <- 0.0392 -AAref["P"] <- 0.0486 -AAref["Q"] <- 0.0381 -AAref["R"] <- 0.0570 -AAref["S"] <- 0.0673 -AAref["T"] <- 0.0558 -AAref["V"] <- 0.0686 -AAref["W"] <- 0.0129 -AAref["Y"] <- 0.0294 -sum(AAref) - -# Function to calculate Shannon entropy -H <- function(pmf) { - # Calculate Shannon entropy - # Parameters: - # pmf (numeric) probability mass function: a vector of states and - # associated probabilities. Each element of - # pmf must be in (0, 1] and sum(pmf) must be 1. - # Value: - # Shannon entropy in bits. - # Examples: - # H(c(A=0.25, C=0.25, G=0.25, T=0.25)) # 2 bits entropy in a random - # # nucleotide sequence - # H(1) # If all elements are the same, entropy is zero - # - if (any(pmf <= 0 | pmf > 1) || isFALSE(all.equal(1.0, sum(pmf)))) { - stop("Input is not a discrete probability distribution.") - } - H <- -sum(pmf * (log(pmf) / log(2))) - return(H) -} - -# Why use all.equal()? Exact comparisons with floating point numbers are -# brittle. Consider for example: -1/6 + 1/6 + 1/6 + 1/6 + 1/6 + 1/6 == 1 -print(1/6 + 1/6 + 1/6 + 1/6 + 1/6 + 1/6, digits = 22) # 0.9999999999999998889777 -# all.equal() tests for _near_ equality with tolerance of ~ 1.5e-8 - - - -# Entropy of the database frequencies (in bits): -(Href <- H(AAref)) - -# for comparison: entropy if all amino acids are equiprobable -H(rep(0.05, 20)) - - -# Set up a simulation to estimate the distribution of Information values -# from random sequences drawn from AAref. This is the distribution for the -# statistical null hypothesis: -nObs <- 15 # number of observations (e.g aligned sequences) -# nObs <- 80 -nTrials <- 10000 # number of trials -IObs <- numeric(nTrials) # vector to store Information in each trial -simCounts <- numeric(20) # vector to tabulate our information ... -names(simCounts) <- names(AAref)# ... with the names of AAref - - -for (i in 1:nTrials) { # simulate ... - - # sample AAref letters, nObs times, with the probabilities of AAref: - AAobs <- sample(names(AAref), size = nObs, prob = AAref, replace = TRUE) - - x <- table(AAobs) # table simulated observations - simCounts[1:20] <- rep(0, length(simCounts)) # initialize simCounts to 0 - simCounts[names(x)] <- x # overwrite with observed counts - simCounts <- simCounts + 0.5 # add Jeffreys' pseudocounts - Hobs <- H(simCounts/sum(simCounts)) # counts to frequency, calc. H - IObs[i] <- Href - Hobs # store information -} - -# evaluate -hist(IObs, col = "#C9F4E3", xlim = c(-0.2, 1.0), breaks = 25) -abline(v = quantile(IObs, c(0.05, 0.95)), col = "#AA00CC") - -# The purple lines are drawn at the 5% quantiles of the Iobs distributions - -# i.e. an actual observation that lies outside the purple lines is deemed -# "significant"(1)(2). Of course, this is only true to the degree that the -# database frequencies are a valid model for the null-hypothesis on the -# sequence position we are considering here. - -# (1) If we use 5% quantiles, this means a value is significantly larger -# than expected, and we ignore cases when the value is < 0; if we -# consider both smaller and larger values, we need to use 2.5% quantiles, -# since 5% of all observations lie outside the 0.025 and 0.975 -# quantiles. -# -# (2) For an actual observation of counts, we calculate its observed -# _empirical_p_Value_ as (nCounts + 1)/(nTotal + 1). - - -# You can probably now appreciate that information is a bit of a shortcut for -# biological sequences, and does not really take the different inherent -# frequencies based on the character of the amino acids into account. For -# example, L is the most frequent and C is the least frequent, but if we have an -# alignment of 1000 sequences and we see that the frequencies for L and C are -# swapped, that would be _very_ surprising - nevertheless, the information would -# be 0. In order to take that into account, we should actually compute -# Kullback-Leibler divergences. - - -# Swap C and L frequencies -p <- AAref -q <- AAref -q["L"] <- AAref["C"] -q["C"] <- AAref["L"] -H(p) -H(q) - -KLdiv <- function(p, q) { - # p and q are two pmfs of discrete probability distributions - # with the same outcomes, which are nowhere 0. - # Value: Kullback-Leibler divergence sum(p * log( p / q))). - - if (length(p) != length(q)) { - stop("PANIC: input vector lengths differ!") - } - if (any(c((p == 0), (q == 0)))) { - stop("PANIC: 0's found in input vectors!") - } - - return(sum(p * log( p / q ))) -} - -KLdiv(p, p) -KLdiv(p, q) - - -nObs <- 15 # number of observations (e.g aligned sequences) -# nObs <- 80 -nTrials <- 10000 # number of trials -KLdivObs <- numeric(nTrials) # vector to store Information in each trial -simCounts <- numeric(20) # vector to tabulate our information ... -names(simCounts) <- names(AAref)# ... with the names of AAref - - -for (i in 1:nTrials) { # simulate ... - - # sample AAref letters, nObs times, with the probabilities of AAref: - AAobs <- sample(names(AAref), size = nObs, prob = AAref, replace = TRUE) - - x <- table(AAobs) # table simulated observations - simCounts[1:20] <- rep(0, length(simCounts)) # initialize simCounts to 0 - simCounts[names(x)] <- x # overwrite with observed counts - simCounts <- simCounts + 0.5 # add Jeffreys' pseudocounts - simCounts <- simCounts/sum(simCounts) # counts to frequency - KLdivObs[i] <- sum(simCounts * log( simCounts / AAref )) # store KLdiv -} - -# evaluate -hist(KLdivObs, col = "#C9F4E3", breaks = 25) -abline(v = quantile(KLdivObs, c(0.05, 0.95)), col = "#AA00CC") -quantile(KLdivObs, 0.992) - -# Running the simulation with KL does not give a fundamentally -# different behaviour - since we are just randomly sampling. But KL would be -# more sensitive in case there is biological selection, where the sampling is no -# longer random. If I run the same simulation, with nObs <- 80 but calculating -# KLdiv instead of information, I get a 5% quantile at 0.15 - but the C/L -# frequency swap gives me a KL divergence of 0.18 - this is significant at p = -# 0.008 - (remember, Information is 0 in this case). So that's actually quite a -# nice addition to the toolbox. - - -# [END] +# tocID <- "FND-STA-Information_theory.R" +# +# ============================================================================== +# +# Purpose: A Bioinformatics Course: +# R code accompanying the FND-STA-Information_theory unit. +# +# Version: 0.2.1 +# +# Date: 2017 - 2021 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 0.2.1 Maintenance +# 0.2 Under development +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------- +#TOC> 1 ___Section___ 39 +#TOC> +#TOC> ========================================================================== + + +# = 1 ___Section___ ======================================================= + +# What level of information is "significant" + +# Assume the background distribution is the database frequencies of +# amino acids: + +AAref <- numeric() # Uniprot frequencies October 2017, slightly adjusted to +# sum to 1.0 +AAref["A"] <- 0.0904 +AAref["C"] <- 0.0123 +AAref["D"] <- 0.0545 +AAref["E"] <- 0.0617 +AAref["F"] <- 0.0394 +AAref["G"] <- 0.0724 +AAref["H"] <- 0.0221 +AAref["I"] <- 0.0573 +AAref["K"] <- 0.0504 +AAref["L"] <- 0.0986 +AAref["M"] <- 0.0240 +AAref["N"] <- 0.0392 +AAref["P"] <- 0.0486 +AAref["Q"] <- 0.0381 +AAref["R"] <- 0.0570 +AAref["S"] <- 0.0673 +AAref["T"] <- 0.0558 +AAref["V"] <- 0.0686 +AAref["W"] <- 0.0129 +AAref["Y"] <- 0.0294 +sum(AAref) + +# Function to calculate Shannon entropy +H <- function(pmf) { + # Calculate Shannon entropy + # Parameters: + # pmf (numeric) probability mass function: a vector of states and + # associated probabilities. Each element of + # pmf must be in (0, 1] and sum(pmf) must be 1. + # Value: + # Shannon entropy in bits. + # Examples: + # H(c(A=0.25, C=0.25, G=0.25, T=0.25)) # 2 bits entropy in a random + # # nucleotide sequence + # H(1) # If all elements are the same, entropy is zero + # + if (any(pmf <= 0 | pmf > 1) || isFALSE(all.equal(1.0, sum(pmf)))) { + stop("Input is not a discrete probability distribution.") + } + H <- -sum(pmf * (log(pmf) / log(2))) + return(H) +} + +# Why use all.equal()? Exact comparisons with floating point numbers are +# brittle. Consider for example: +1/6 + 1/6 + 1/6 + 1/6 + 1/6 + 1/6 == 1 +print(1/6 + 1/6 + 1/6 + 1/6 + 1/6 + 1/6, digits = 22) # 0.9999999999999998889777 +# all.equal() tests for _near_ equality with tolerance of ~ 1.5e-8 + + + +# Entropy of the database frequencies (in bits): +(Href <- H(AAref)) + +# for comparison: entropy if all amino acids are equiprobable +H(rep(0.05, 20)) + + +# Set up a simulation to estimate the distribution of Information values +# from random sequences drawn from AAref. This is the distribution for the +# statistical null hypothesis: +nObs <- 15 # number of observations (e.g aligned sequences) +# nObs <- 80 +nTrials <- 10000 # number of trials +IObs <- numeric(nTrials) # vector to store Information in each trial +simCounts <- numeric(20) # vector to tabulate our information ... +names(simCounts) <- names(AAref)# ... with the names of AAref + + +for (i in 1:nTrials) { # simulate ... + + # sample AAref letters, nObs times, with the probabilities of AAref: + AAobs <- sample(names(AAref), size = nObs, prob = AAref, replace = TRUE) + + x <- table(AAobs) # table simulated observations + simCounts[1:20] <- rep(0, length(simCounts)) # initialize simCounts to 0 + simCounts[names(x)] <- x # overwrite with observed counts + simCounts <- simCounts + 0.5 # add Jeffreys' pseudocounts + Hobs <- H(simCounts/sum(simCounts)) # counts to frequency, calc. H + IObs[i] <- Href - Hobs # store information +} + +# evaluate +hist(IObs, col = "#C9F4E3", xlim = c(-0.2, 1.0), breaks = 25) +abline(v = quantile(IObs, c(0.05, 0.95)), col = "#AA00CC") + +# The purple lines are drawn at the 5% quantiles of the Iobs distributions - +# i.e. an actual observation that lies outside the purple lines is deemed +# "significant"(1)(2). Of course, this is only true to the degree that the +# database frequencies are a valid model for the null-hypothesis on the +# sequence position we are considering here. + +# (1) If we use 5% quantiles, this means a value is significantly larger +# than expected, and we ignore cases when the value is < 0; if we +# consider both smaller and larger values, we need to use 2.5% quantiles, +# since 5% of all observations lie outside the 0.025 and 0.975 +# quantiles. +# +# (2) For an actual observation of counts, we calculate its observed +# _empirical_p_Value_ as (nCounts + 1)/(nTotal + 1). + + +# You can probably now appreciate that information is a bit of a shortcut for +# biological sequences, and does not really take the different inherent +# frequencies based on the character of the amino acids into account. For +# example, L is the most frequent and C is the least frequent, but if we have an +# alignment of 1000 sequences and we see that the frequencies for L and C are +# swapped, that would be _very_ surprising - nevertheless, the information would +# be 0. In order to take that into account, we should actually compute +# Kullback-Leibler divergences. + + +# Swap C and L frequencies +p <- AAref +q <- AAref +q["L"] <- AAref["C"] +q["C"] <- AAref["L"] +H(p) +H(q) + +KLdiv <- function(p, q) { + # p and q are two pmfs of discrete probability distributions + # with the same outcomes, which are nowhere 0. + # Value: Kullback-Leibler divergence sum(p * log( p / q))). + + if (length(p) != length(q)) { + stop("PANIC: input vector lengths differ!") + } + if (any(c((p == 0), (q == 0)))) { + stop("PANIC: 0's found in input vectors!") + } + + return(sum(p * log( p / q ))) +} + +KLdiv(p, p) +KLdiv(p, q) + + +nObs <- 15 # number of observations (e.g aligned sequences) +# nObs <- 80 +nTrials <- 10000 # number of trials +KLdivObs <- numeric(nTrials) # vector to store Information in each trial +simCounts <- numeric(20) # vector to tabulate our information ... +names(simCounts) <- names(AAref)# ... with the names of AAref + + +for (i in 1:nTrials) { # simulate ... + + # sample AAref letters, nObs times, with the probabilities of AAref: + AAobs <- sample(names(AAref), size = nObs, prob = AAref, replace = TRUE) + + x <- table(AAobs) # table simulated observations + simCounts[1:20] <- rep(0, length(simCounts)) # initialize simCounts to 0 + simCounts[names(x)] <- x # overwrite with observed counts + simCounts <- simCounts + 0.5 # add Jeffreys' pseudocounts + simCounts <- simCounts/sum(simCounts) # counts to frequency + KLdivObs[i] <- sum(simCounts * log( simCounts / AAref )) # store KLdiv +} + +# evaluate +hist(KLdivObs, col = "#C9F4E3", breaks = 25) +abline(v = quantile(KLdivObs, c(0.05, 0.95)), col = "#AA00CC") +quantile(KLdivObs, 0.992) + +# Running the simulation with KL does not give a fundamentally +# different behaviour - since we are just randomly sampling. But KL would be +# more sensitive in case there is biological selection, where the sampling is no +# longer random. If I run the same simulation, with nObs <- 80 but calculating +# KLdiv instead of information, I get a 5% quantile at 0.15 - but the C/L +# frequency swap gives me a KL divergence of 0.18 - this is significant at p = +# 0.008 - (remember, Information is 0 in this case). So that's actually quite a +# nice addition to the toolbox. + + +# [END] diff --git a/FND-STA-Probability_distribution.R b/FND-STA-Probability_distribution.R index 0bd3573..60d1238 100644 --- a/FND-STA-Probability_distribution.R +++ b/FND-STA-Probability_distribution.R @@ -1,1323 +1,1323 @@ -# tocID <- "FND-STA-Probability_distribution.R" -# -# -# Purpose: A Bioinformatics Course: -# R code accompanying the FND-STA-Probability_distribution unit. -# -# Version: 1.6 -# -# Date: 2017-10 - 2020-11 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.6 Revise use of data argument to nls()/nlrob() -# 1.5 Extensive additions on Poisson and binomial distributions -# and regression fits -# 1.4 2020 Maintenance -# 1.3 Change from require() to requireNamespace(), -# use ::() idiom throughout, -# 1.2 Update set.seed() usage -# 1.1 Corrected empirical p-value -# 1.0 First code live version -# -# TODO: -# Add tasks -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------------------------------------------- -#TOC> 1 Introduction 68 -#TOC> 2 Three fundamental distributions 131 -#TOC> 2.1 The Poisson Distribution 134 -#TOC> 2.2 The hypergeometric distribution 228 -#TOC> 2.2.1 Digression: qqplot() and residuals 376 -#TOC> 2.2.2 Fitting functions 436 -#TOC> 2.2.2.1 Fit a normal distribution (using nls() ) 506 -#TOC> 2.2.2.2 Fit a normal distribution (using nlrob()) ) 525 -#TOC> 2.2.2.3 Extreme Value distributions: Gumbel 552 -#TOC> 2.2.2.4 Extreme Value distributions: Weibull 579 -#TOC> 2.2.2.5 Logistic distribution 621 -#TOC> 2.2.2.6 Log-Logistic distribution 650 -#TOC> 2.2.2.7 Fitting a negative binomial distribution 679 -#TOC> 2.2.2.8 Fitting a binomial distribution 732 -#TOC> 2.3 The uniform distribution 844 -#TOC> 2.4 The Normal Distribution 864 -#TOC> 3 quantile-quantile comparison 905 -#TOC> 3.1 qqnorm() 915 -#TOC> 3.2 qqplot() 981 -#TOC> 4 Quantifying the difference 998 -#TOC> 4.1 Chi2 test for discrete distributions 1032 -#TOC> 4.2 Kullback-Leibler divergence 1124 -#TOC> 4.2.1 An example from tossing dice 1135 -#TOC> 4.2.2 An example from lognormal distributions 1257 -#TOC> 4.3 Continuous distributions: Kolmogorov-Smirnov test 1300 -#TOC> -#TOC> ========================================================================== - - -# = 1 Introduction ======================================================== - -# The space of possible outcomes of events is called a probability distribution -# and the properties of probability distributions are crucial to our work. Many -# distributions like the (discrete) Poisson, or the (continuous) Normal -# distribution have been characterized in great detail, their behaviour is well -# understood, and they are useful for countless applications - but we also need -# to able to work with ad hoc distributions that have never been seen before. - -# Let's get a few facts about probability distributions out of the way: - -# The "support" of a probability distribution is the range of outcomes that have -# a non-zero probability. The "domain" of a probability distribution is the -# range of probabilities that the distribution can take over its support. Think -# of this as the ranges on the x- and y-axis respectively. Thus the distribution -# can be written as p = f(x). - -# The integral over a probability distribution is always 1. This means: the -# distribution reflects the situation that an event does occur, any event, but -# there is not "no event". - -# R's inbuilt probability functions always come in four flavours: -# d... for "density": this is the probability density function (p.d.f.), -# the value of f(x) at x. -# p... for "probability": this is the cumulative distribution function -# (c.d.f.). It is 0 at the left edge of the support, and 1 at -# the right edge. -# q... for "quantile": The quantile function returns the x value at which p... -# takes a requested value. -# r... for "random": produces random numbers that are distributed according -# to the p.d.f. - -# To illustrate with the "Normal Distribution" (Gaussian distribution): - -# 1000 normally distributed values with default parameters: mean 0, sd 1. -r <- rnorm(1000) - -# pastel green: histogram of 1000 random samples -hist(r, - freq = FALSE, - breaks = 30, - xlim = c(-4, 4), - ylim = c(0, 1), - main = "Normal Distribution", - xlab = "x", - ylab = "f(x)", - col = "#E6FFF6") - -# 100 equally spaced point along x -x <- seq(-4, 4, length.out = 100) - -# black: c. d. f. along x. Note that this asymptotically reaches 1 -points(x, pnorm(x), type = "l") - -# dark red: p. d. f. along x -points(x, dnorm(x), type = "l", lwd = 2, col="firebrick") - -# purple: 1% and 99% quantiles -abline(v = qnorm(c(0.01, 0.99)), lwd = 0.5, col = "#CCAAFF") - -# Study this plot well and familiarize yourself with the terms. - - -# = 2 Three fundamental distributions ===================================== - - -# == 2.1 The Poisson Distribution ========================================== - -# The Poisson distribution is a discrete probability distribution that -# characterizes how many events we expect among a given number of observations -# if the mean probability of an event is known. Assume we know that there are -# 256 transcription factors among the 6091 protein-coding genes of yeast, then -# the probability of picking a transcription factor at random from all ORFs is -# 256/6091 ~= 4.2%. How many transcription factors do we expect in a sample of -# 250 genes - like, for example, the top 250 differentially expressed genes in -# an assay? This is a frequently encountered type of question, converging on the -# information contained in a "list of genes". Once an assay has yielded a list -# of genes, what can we learn from looking at staistical features of its -# membership. In the transcription factor model, the question is: how many -# transcription factors do we expect as members of our list - and did we -# actually observe more or less than that? -# -# It would seem that the the probability of encountering _one_ transcription -# factor among our genes is 256/6091 and therefore the number of transcription -# factors we expect to choose at random is (250 * 256)/6091 i.e. 10.50731 in the -# average over many trials. Let's repeat our experiment a million times and see what we get: - -N <- 1000000 # One million trials -genes <- numeric(6091) # All genes are 0 -genes[1:256] <- 1 # TFs are 1 - -hAssays <- numeric(N) # initialize vector -set.seed(112358) -for (i in 1:N) { - pBar(i, N) - hAssays[i] <- sum(sample(genes, 250)) # sum of TFs in our sample in this trial -} -set.seed(NULL) - -# And the average is: -mean(hAssays) # 10.50293 - -# ... which is superbly close to our expectation of 10.50731 - -# All good - but we won't get 10.5 transcription factors in our assay. We'll -# observe five. Or thirteen. Or thirtysix. Or none at all ... and then we ask -# ourselves: is the number of observed transcription factors significantly -# different from what we would have expected if our experiment identified a -# transcription factor just as likely as it identified any other gene? To answer -# this, we need to consider the probability distribution of possible outcomes of -# our assay. Back to the Poisson distribution. In R it is implemented as dpois() -# and its parameters are: the number of observed events, and the probability of -# observing an event: - -dpois(0, (250 * 256) / 6091) # Probability of seeing no TFs -dpois(1, (250 * 256) / 6091) # Probability of seing one ... -dpois(2, (250 * 256) / 6091) # Probability of seing two ... -dpois(3:10, (250 * 256) / 6091) # Probability of seing from three to ten ... -sum(dpois(0:4, (250 * 256) / 6091)) # Probability of seeing four or less ... - -sum(dpois(0:250, (250*256)/6091)) # The sum over all possibilities is (for - # any probability distribution) exactly one. - -# Lets plot these probabilities ... -nMax <- 28 - -x <- dpois(0:nMax, (250 * 256) / 6091) - -barMids <- barplot(x, - col = "#FCF3CF", - names.arg = as.character(0:nMax), - cex.names = 0.5, - axes = TRUE, - ylim = c(0, 0.15), - xlab = "# of TF in set", - ylab = "p") - -# ... and add our simulated assays: - -(th <- table(factor(hAssays, levels = 0:nMax))/N) - -points(barMids - 0.55, th, type = "s", col = "firebrick") -abline(v = (((250 * 256) / 6091) * (barMids[2] - barMids[1])) + barMids[1], - col = "#5588FF") # scale to the correct position in the barplot -legend("topright", - legend = c("Poisson", "simulated", "expectation"), - pch = c(22, NA, NA), # one box, two lines only - pt.cex = 1.4, # larger, to match bar-width better - pt.bg = c("#FCF3CF", NA, NA), # bg color only for the box - lty = c(0, 1, 1), # no line for the box - col = c("#000000", "firebrick", "#5588FF"), - bty = "n") # no frame around the legend - -# NOTE: The simulation shows us that our expectations about the number of -# transcription factors in a sample are almost, but not exactly Poisson -# distributed. Can you figure out where we went wrong? Maybe the -# Poisson distribution is not quite the correct distribution to -# model our expectations? - - -# == 2.2 The hypergeometric distribution =================================== - -# With that suspicion in mind, we reconsider what we were trying to achieve at -# each point of the Poisson distribution. Assume we have observed seven -# transcription factors in our set of 250 genes. So we asked: what is the -# probability of observing seven? And concluded: - -dpois(7, (250 * 256) / 6091) # Probability of seeing seven ... - -# ... which is the probability of seven events in 250 choices if the underlying -# probability is equal to fraction of transcription factors among genes. But -# wait: we weren't careful in our simulation. Assume that our first observed -# gene was a transcription factor. Is the probability of the next sample the -# same? Not quite: one transcription factor has been observed, 249 more samples -# need to be considered, and there are now 6090 genes to choose from. I.e. the -# mean probability changes with every observation: - -(250 * 256) / 6091 # First sample, a TF: p = 10.50731 -(249 * (256 - 1)) / (6091 - 1) # Second sample: p = 10.42611 (-0.992 %) - -# This is actually noticeable: the mean probability for transcription factors -# drops by about one percent after a transcription factor is observed. But what -# if we would have observed the first transcription factor as the tenth gene? - -(239 * (256 - 1)) / (6091 - 10) # Eleventh sample: p = 10.0222 (-0.954 %) - -# This is getting complicated and we need a different way to think about this if -# we don't want to enumerate all possibilities by hand. (There are far too -# many!) Generally, the probability of observing a certain number of events in a -# series is the number of ways to realize the desired outcome, divided by the -# number of possible outcomes. So, if we code transcription factors by "1" and -# other genes by "0", seven transcription factors could be - -# 01010100100100100100000000000000000000000 ..., or -# 01110111100000000000000000000000000000000 ..., or -# 11101001000010000000100000000000000000000 ..., or any other combination. - -# But crucially, our number of trials is limited and every "success" changes the -# probability of future successes. This is sampling without replacement! And -# sampling without replacement is modeled by the so-called "hypergeometric -# distribution". This is the big difference: when we are sampling WITH -# replacement, we can model the process with a Poisson distribution. When we are -# sampling WITHOUT replacement, we use a hypergeometric distribution instead. - -# Let's first re-run our simulated assays. We put the previous run into the -# vector "hAssays" which I prefixed "h" as in "hypergeometric" because I knew -# what was coming, and that I had sampled WITHOUT replacement because that is -# the default for the sample() function. Accordingly, we call the new samples -# "pAssays", where "p" stands for Poisson: - -N <- 1000000 # One million trials -genes <- numeric(6091) # All genes are 0 -genes[1:256] <- 1 # TFs are 1 - -pAssays <- numeric(N) # initialize vector -set.seed(112358) -for (i in 1:N) { - pBar(i, N) - pAssays[i] <- sum(sample(genes, 250, replace = TRUE)) -} -set.seed(NULL) - -# Now the average is: -mean(pAssays) # 10.50312 which is essentially the same as 10.50293 - -# And the plot ... - -nMax <- 28 -barMids <- barplot(dpois(0:nMax, (250 * 256) / 6091), - names.arg = as.character(0:nMax), - cex.names = 0.5, - axes = TRUE, - ylim = c(0, 0.15), - xlab = "# of TF in set", - ylab = "p", - col = "#FCF3CF") -abline(v = (((250 * 256) / 6091) * (barMids[2] - barMids[1])) + barMids[1], - col = "#5588FF") # scale to the correct position in the barplot -th <- table(factor(hAssays, levels = 0:nMax))/N -points(barMids - 0.55, th, type = "s", col = "firebrick") - -# Here are the new assays: -tp <- table(factor(pAssays, levels = 0:nMax))/N -points(barMids - 0.55, tp, type = "s", col = "seagreen") - -legend("topright", - legend = c("Poisson", - "no replacement", - "with replacement", - "expectation"), - pch = c(22, NA, NA, NA), - pt.cex = 1.4, - pt.bg = c("#FCF3CF", NA, NA, NA), - lty = c(0, 1, 1, 1), - col = c("#000000", "firebrick", "seagreen", "#5588FF"), - bty = "n") - -# Clearly .. the "correct" simulation, the simulation that is actually -# appropriate for the Poisson distribution, matches the theoretical values -# better. Now let's see how well the hypergeometric distribution matches our -# original simulated assays. -# The function dhyper(x, m, n, k) expects the following parameters: -# x: the number of observed positive events for which to -# compute the probability -# m: the number of positive events in the population -# n: the number of negative eventsw in the population -# k: the number of observations (or trials) - - dhyper(0, 256, 6091 - 256, 250) # Probability of seeing no TFs - dhyper(1, 256, 6091 - 256, 250) # Probability of seing one ... - dhyper(2, 256, 6091 - 256, 250) # Probability of seing two ... - dhyper(3:10, 256, 6091 - 256, 250) # Probability of three to ten ... -sum(dhyper(0:4, 256, 6091 - 256, 250)) # Probability of seeing four or less ... - -sum(dhyper(0:250, 256, 6091-256, 250)) # The sum over all possibilities is (for - # any probability distribution) - # exactly one. - -# Lets plot these probabilities like we did above ... -nMax <- 28 -x <- dhyper(0:nMax, 256, 6091 - 256, 250) - -barMids <- barplot(x, col = "#E6FFF6", - names.arg = as.character(0:nMax), - cex.names = 0.5, - axes = TRUE, - ylim = c(0, 0.15), - xlab = "# of TF in set", - ylab = "p") -abline(v = (mean(hAssays) * (barMids[2] - barMids[1])) + barMids[1], - col = "#5588FF") # scale to the correct position in the barplot -points(barMids - 0.55, th, type = "s", col = "firebrick") - -legend("topright", - legend = c("Hypergeometric", - "no replacement", - "expectation"), - pch = c(22, NA, NA), - pt.cex = 1.4, - pt.bg = c("#E6FFF6", NA, NA), - lty = c(0, 1, 1, 1), - col = c("#000000", "firebrick", "#5588FF"), - bty = "n") - -# This! -# This is what a correctly simulated distribution looks like. - - -# === 2.2.1 Digression: qqplot() and residuals - -# The indication that something was wrong with our simulation versus the -# theoretical expectation came from the observation that the differences between -# the barplot and theory were not quite random: the values near the mode were -# systematically too high, the values in the tails were systematically too low. -# This is a general principle: when you see a SYSTEMATIC deviation between -# simulation and theory, something is wrong with your understanding. Either -# there is a subtle error in how you set up the simulation, or a subtle -# misunderstanding about the requirements for the particular theory to apply. R -# has a general way to examine such differences: qqplot() plots the deviations -# between theory and observation ordered as ranks, i.e. not affected by absolute -# scale. (See here for an accessible introduction to qqplot() and the -# "quantiles" that it uses: -# https://data.library.virginia.edu/understanding-q-q-plots/) - -oPar <- par(mfrow = c(1, 2)) -qqplot( dpois(0:nMax, (250 * 256) / 6091), - th, - xlab = "Poisson distribution", - ylab = "sampling with replacement", - pch = 22, bg = "#FCF3CF") -abline(lm(th ~ dpois(0:nMax, (250 * 256) / 6091)), col = "seagreen") - -qqplot( dhyper(0:nMax, 256, 6091 - 256, 250), - th, - xlab = "hypergeometric distribution", - ylab = "sampling with replacement", - pch = 22, bg = "#E6FFF6") -abline(lm(th ~ dhyper(0:nMax, 256, 6091 - 256, 250)), col = "seagreen") - -par(oPar) - -# Similar information can be obtained from a residual plot, plotting differences -# between prediction and observation: - -oPar <- par(mfrow = c(1, 2)) -plot( dpois(0:nMax, (250 * 256) / 6091) - as.numeric(th), - type = "b", - ylim = c(-0.006, 0.006), - xlab = "# observations", - ylab = "Poisson density - obs.", - pch = 22, - bg = "#FCF3CF", - col = "#000000") -abline(h = 0, col = "seagreen") - -plot( dhyper(0:nMax, 256, 6091 - 256, 250) - as.numeric(th), - type = "b", - ylim = c(-0.006, 0.006), - xlab = "# observations", - ylab = "Hypergeometric density - obs.", - pch = 22, - bg = "#E6FFF6", - col = "#000000") -abline(h = 0, col = "seagreen") - -par(oPar) - - -# === 2.2.2 Fitting functions - -# Note that there is a further subtle catch: We did not actually ask about seven -# transcription factors! We asked about the probability of seven _different_ -# transcription factors - because, implicit in the assumptions I made about the -# assay (and reasonable for most gene lists), we count duplicates only once! -# Does this actually make a difference? We can model the situation by giving -# each transcription factor a name (or a number), sampling at random, and -# counting how many unique() factors we found in our sample: - -N <- 1000000 # One million trials -genes <- numeric(6091) # All genes are initially 0 -genes[1:256] <- 1:256 # TFs get a unique "name" - -# example sample: -set.seed(11235) -x <- sample(genes, 250, replace = TRUE) # Pick 250 random genes. -x[x != 0] # Note that 189 appears twice. -length(x[x != 0]) # We picked 8 transcription factors ... -unique(x) # but only 7 are unique (plus zero). -length(unique(x)) - 1 # Ignore the zero. - -# Do this a million times -uAssays <- numeric(N) # initialize vector -set.seed(112358) -for (i in 1:N) { - pBar(i, N) - uAssays[i] <- length(unique(sample(genes, 250, replace = TRUE))) - 1 -} -set.seed(NULL) - -# plot the poisson distribution (with replacement) as our baseline -nMax <- 28 -barMids <- barplot(dpois(0:nMax, (250 * 256) / 6091), - col = "#FCF3CF", - names.arg = as.character(0:nMax), - cex.names = 0.5, - axes = TRUE, - ylim = c(0, 0.15), - xlab = "# of TF in set", - ylab = "p") - -tu <- table(factor(uAssays, levels = 0:nMax))/N -points(barMids - 0.55, tu, type = "s", col = "#EE22FF") - -legend("topright", - legend = c("Poisson", - "unique genes"), - pch = c(22, NA), - pt.cex = 1.4, - pt.bg = c("#FCF3CF", NA), - lty = c(0, 1), - col = c("#000000", "#EE22FF"), - bty = "n") - -# Clearly, the distribution does not match our model exactly. - -# So what is the "correct" distribution that we could apply in this case? There -# may or may not be one readily available. What we can do instead is to use a -# more general model and fit parameters. This takes us to the domain of -# regression analysis and curve fitting. The general approach is as follows: -# - Decide on a statistical model; -# - Express it in parametrized form; -# - Fit the parameters; -# - Analyze the coefficients; - -# Insight into the underlying process that generated our data can be obtained -# by analyzing the fitted parameters, or simply plotting the results. Let's -# look at examples of fits to the sampled distribution above: - -# ==== 2.2.2.1 Fit a normal distribution (using nls() ) - -x <- 0:28 -plot(x, tu, type="s") -fit <- nls(tu ~ ( a / (sig*sqrt(2*pi)) ) * exp( (-1/2)*((x-mu)/sig)^2 ), - data = data.frame(x = 0:28, tu = tu), - start = c(a = 1, mu = 10, sig = 3)) # starting values - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, - type = "s") - -coef(fit) -# a mu sig -# 0.9990932 10.0717835 3.0588930 - -sum(resid(fit)^2) -# [1] 0.0001613488 - - -# ==== 2.2.2.2 Fit a normal distribution (using nlrob()) ) - -# There's a bit of an art to chosing starting parameters correctly and if the -# nls() fit does not converge, more robust methods are called for. - -if (! requireNamespace("robustbase", quietly = TRUE)) { - install.packages("robustbase") -} - -x <- 0:28 -plot(x, tu, type="s") -fit <- robustbase::nlrob(tu ~ ( a / (sig*sqrt(6.2831853072)) ) * - exp( (-1/2)*((x-mu)/sig)^2 ), - data = data.frame(x = 0:28, - tu = tu), - start = c(a = 1, mu = 10, sig = 3)) # starting values - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") - -coef(fit) -# a mu sig -# 1.002162 10.059189 3.071217 - -sum(resid(fit)^2) -# [1] 0.0001630868 - - -# ==== 2.2.2.3 Extreme Value distributions: Gumbel - -# Many processes that involve "best-of" choices are better modelled with -# so-called extreme-value distributions: here is the Gumbel distribution -# from the evd package. - -if (! requireNamespace("evd", quietly = TRUE)) { - install.packages("evd") -} - -x <- 0:28 -plot(x, tu, type="s") - -fit <- robustbase::nlrob(tu ~ evd::dgumbel(x, loc = L, scale = S), - data = data.frame(tu = tu, x = 0:28), - start = c(L = 7.3, S = 2.82)) - -points(x, predict(fit), type = "s", col = "#55DD88") - -coef(fit) -# L S -# 9.322110 2.818266 - -sum(resid(fit)^2) -# [1] 0.001027447 - - -# ==== 2.2.2.4 Extreme Value distributions: Weibull - -# Weibull distributions are common in reliabilty analysis. I found the -# distribution particularly hard to fit as it is quite sensitive to inital -# parameter estimates. https://en.wikipedia.org/wiki/Weibull_distribution - -# NOTE: the parameter TH is > X -idx <- 4:28 -myX <- idx -myY <- as.numeric(tu)[idx] -plot(myX, myY, type="s") - -dWei <- function(x, th, l, k) { - a <- k/l - b <- ((x-th)/l)^(k-1) - c <- exp(-((x-th)/l)^k) - y <- a * b * c - return(y) -} - -set.seed(112358) -fit <- robustbase::nlrob(y ~ dWei(x, th = TH, l = L, k = K), - data = data.frame(y = myY, - x = myX), - lower = c(TH = 3.5, - L = 8, - K = 2.5), - upper = c(TH = 3.7, - L = 9, - K = 3), - method = "mtl") - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") - -coef(fit) -# TH L K -#3.630807 8.573898 2.795116 - -sum(resid(fit)^2) -# [1] 7.807073e-05 - - -# ==== 2.2.2.5 Logistic distribution - -# Similar to normal distribution, but with heavier tails -# https://en.wikipedia.org/wiki/Logistic_distribution - -myX <- 0:28 -myY <- as.numeric(tu) -plot(myX, myY, type="s") - -dLogi <- function(x, mu, s) { - y <- (exp(-(x-mu)/s)) / (s * (1+exp(-(x-mu)/s))^2) - return(y) -} - -fit <- robustbase::nlrob(y ~ dLogi(x, mu = M, s = S), - data = data.frame(y = myY, - x = myX), - start = c(M = 10, S = 3)) - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") - -coef(fit) -# M S -# 10.088968 1.891654 - -sum(resid(fit)^2) -# [1] 0.0004030595 - - -# ==== 2.2.2.6 Log-Logistic distribution - -# Special case of logistic, often used in survival analysis -# https://en.wikipedia.org/wiki/Log-logistic_distribution - -myX <- 0:28 -myY <- as.numeric(tu) -plot(myX, myY, type="s") - -dLogLogi <- function(x, a, b) { - y <- ((b/a)*(x/a)^(b-1)) / (1+((x/a)^b))^2 - return(y) -} - -fit <- robustbase::nlrob(y ~ dLogLogi(x, a = A, b = B), - data = data.frame(y = myY, - x = myX), - start = c(A = 9.5, B = 4.8)) - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") - -coef(fit) -# A B -# 10.310181 5.288385 - -sum(resid(fit)^2) -# [1] 0.0006343927 - - -# ==== 2.2.2.7 Fitting a negative binomial distribution - -# The negative binomial distribution is related to the Poisson distribution. -# Assume you are observing events and and counting how many successes of a -# Bernoulli process (essentially a coin-flip) we encounter before we encounter a -# failure. Unlike the Poisson, it models mean and variance separately and is therefore especially useful for overdispersed functions. (cf. https://en.wikipedia.org/wiki/Negative_binomial_distribution) -# - -x <- 0:28 -plot(x, tu, type="s") - -# Negative binomial -dNB <- function(x, r, p) { - # Note: r is an integer! - y <- choose((x + r - 1), (r - 1)) * (1-p)^x * p^r - return(y) -} - -set.seed(112358) -RR <- 104 -fit <- robustbase::nlrob(tu ~ dNB(x, r = RR, p = P), - data = data.frame(x = x, RR = RR), - lower = c(P = 0.01), - upper = c(P = 0.99), - method = "mtl") - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") - -coef(fit) -# P -# 0.9100729 - -sum(resid(fit)^2) -# [1] 0.0005669086 - -# Nb. the parameter R is not continuous: to optimize it as an integer, we try -# reasonable choices and record the best fit. -N <- 150 -R <- numeric(N) -for (thisR in 1:N) { - set.seed(112358) - fit <- robustbase::nlrob(y ~ dNB(x, r = thisR, p = P), - data = data.frame(x = x, - thisR = thisR), - lower = c(P = 0.01), - upper = c(P = 0.99), - method = "mtl") - R[thisR] <- sum(resid(fit)^2) -} -plot(R) -which(R == min(R)) - - -# ==== 2.2.2.8 Fitting a binomial distribution -# The workhorse distribution for Bernoulli proceeses -# cf. https://en.wikipedia.org/wiki/Binomial_distribution - - -myX <- 0:28 -myY <- as.numeric(tu) -plot(myX, myY, type="s") - -dBinom <- function(x, s, p) { - y <- choose(s, x) * (p^x) * ((1-p)^(s-x)) - return(y) -} - -fit <- robustbase::nlrob(y ~ dBinom(x, s = S, p = P), - data = data.frame(y = myY, - x = myX), - start = c(S = 240, P = 256/6091)) - -points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") - -coef(fit) -# S P -# 122.77746436 0.08376922 - -sum(resid(fit)^2) -# [1] 1.114272e-06 - -# Here we go: near perfect fit. But note the parameters! Can you identify the -# relationship of S and P to our model of choosing unique transcription factors -# in a random sampling process? - -# Remember what we started out with: -points(x, dBinom(x, 240, 256/6091), - col = "#00AAFF55", lwd = 2, type = "s") - -# The model has improved a lot from our starting-value guess. But how does an -# effective sample size of 122.78 relate to the actual value of 250 samples? And -# how does a probability for choosing a transcription factor of 0.0838 relate to -# having 256 transcription factors among 6091 genes (a fraction of 0.0420)? Well -# - if you stare at the numbers for a bit you might notice that the fitted -# sample size is about half of what we had, while the fitted probability is -# about twice that. Let's correct for the factor of two, and look at the fit ... - -points(x, dBinom(x, coef(fit)["S"] * 2 , coef(fit)["P"] / 2), - col = "#00FF8899", lwd = 2, type = "s") - -# interesting ... that's not so bad ... Essentially what this tells us is: our -# model is very similar to one in which our effective sample size would have -# been about 246 genes, not 250, and the number of our genes would have been -# close to 0.04188461 * 6091 ~= 255 transcription factors, not 256. Close, to - -# but not almost perfect. - -# Incidentally: would you have thought that we can -# detect the number of transcription factors in our sample +- 1 if we just -# sample frequently enough? - -# Let's examine the effect that applying various factors to size and probability -# have on our distribution: - - -z <- c(1/8:2 , 1, 2:8, 10, 20, 50) -myCols <- colorRampPalette(c("#00000022", - "#00000088", - "#DD0000DD", - "#0088FF88", - "#0088FF55", - "#0088FF22"), - alpha=TRUE)(length(z)) - -myLwd <- rep(1.25, length(z)) -myLwd[z == 1] <- 2.5 # make the actual fitted value stand out - -plot(x, y, type="s", ylim =c(0, 0.22), lwd = 5, col="#FF990077") - -for (i in seq_along(z)) { - points(x, dBinom(x, coef(fit)["S"] * z[i] , coef(fit)["P"] / z[i]), - col = myCols[i], type = "s") -} - -legend("topright", - legend = sprintf("%3.2f", z), - cex = 0.5, - col = myCols, - lwd = myLwd, - bty = "n") - -# We see how factors less than 1 applied to our actual sample size and fraction -# of transcription factors increasingly narrow the distribution; factors larger -# than one increasingly broaden the distribution but in a much slower manner. A -# factor of one (i.e. half size, double probability) hits the sweet spot and -# recaptures the essence of our observation. Clearly, this is a case of -# fortuitously cancelling errors. - - -# What is the take-home message here? -# - The standard Poisson and hypergeometric distributions apply to -# very specific models of choice processes (with/without replacement); -# - It is not trivial to choose the right statistical model for any particular -# real-world specification of a sampling process. Our model of unique -# choices is neither Poisson nor hypergeometric distributed. Once we have -# identified the parameters of a binomial distribution that models the -# process perfectly, we nevertheless note that we don't seem to be -# able to interpret the parameters easily. -# - Stochastic modeling allows us to validate whether the model is correct, -# but in case there are discrepancies it is not obvious what might be -# a more appropriate model and how to parametrize it. -# - If building an explicit stochastic model is not possible, we'll have to -# to do the best we can, in this case that would mean: choose a more -# general distribution and parametrize it. - - -# == 2.3 The uniform distribution ========================================== - -# The uniform distribution has the same probability over its entire support. R's -# runif() function takes the desired number, the min and the max as arguments. -# Let's plot a histogram of a million values between -1 and 1 to demonstrate. - -hist(runif(1e6, -1, 1), breaks = 20, col = "#FFE6F6") -abline(h = 1e6/20, col="firebrick") - -# One of the important uses of the uniform distribution is to write conditional -# expressions that are TRUE with a given probability. For example, to get TRUE -# values with a probability of 1/3, we pick a random number between 0 and 1, and -# ask whether the number is smaller than 1/3. Example: - -runif(10) < 1/3 - -#confirm with a million trials -sum(runif(1e6) < 1/3)/1e6 # should be close to 0.33333... - - -# == 2.4 The Normal Distribution =========================================== - -# The king of probability distributions. Why? That's because of the Central -# Limit Theorem (CLT) that essentially says that a process that is subject to -# small fluctuations will tend to normally distributed outcomes ... and in -# biology literally everything is subject to small fluctuations. - -# Lets simulate: Lets create a vector of 12345 numbers, choose samples of size -# 77 from that vector and calculate the mean. We do that 9999 times. I am just -# using odd numbers so it is clear in the code which number represents what. - -x <- runif(12345) -v <- numeric(9999) -for (i in 1:length(v)) { - v[i] <- mean(sample(x, 77)) -} - -hist(v, breaks = 20, col = "#F8DDFF") - -# Let's try this again, this time sampling from an exponential distribution ... -x <- rexp(12345) -v <- numeric(9999) -for (i in 1:length(v)) { - v[i] <- mean(sample(x, 77)) -} - -hist(v, breaks = 20, col = "#F8DDFF") - -# ... or from a t-distribution ... -x <- rt(12345, df = 3) -v <- numeric(9999) -for (i in 1:length(v)) { - v[i] <- mean(sample(x, 77)) -} - -hist(v, breaks = 20, col = "#F8DDFF", freq = FALSE) - -# The outcomes all give normal distributions, regardless what the details of our -# original distribution were! - - -# = 3 quantile-quantile comparison ======================================== - - -# Once we have observed a distribution of outcomes, the next task is often to -# quantify whether the values correspond to a known distribution. This can be -# done with quantile-quantile plots that plot the quantile values of one -# distribution against those of the other. Identically distributed quantiles lie -# on a straight line. - - -# == 3.1 qqnorm() ========================================================== - -# The functions qqnorm() and qqline() perform this -# comparison with the normal distribution. - -set.seed(112358) -x <- rnorm(100, mean=0, sd=1) # 100 normally distributed values -set.seed(NULL) - -qqnorm(x) -qqline(x, col = "seagreen") - -# Our variables in x appear normally distribute - which is not surprising since -# we produced them with rnorm(). What about the kind of sampling we did above? -# Let's test whether samples from an exponential distribution are normally -# distributed (previously we just visually inspected the histogram.) - -# Create a vector of sample means from the exponential distribution; use -# only a few samples for the mean -x <- rexp(12345) -v <- numeric(999) - -set.seed(112358) -for (i in 1:length(v)) { - v[i] <- mean(sample(x, 12)) -} -set.seed(NULL) - -qqnorm(v) -qqline(v, col = "turquoise") # normal - -#try with more samples -for (i in 1:length(v)) { - v[i] <- mean(sample(x, 77)) -} -qqnorm(v) -qqline(v, col = "steelblue") # normal - -#try with many samples -for (i in 1:length(v)) { - v[i] <- mean(sample(x, 374)) -} -qqnorm(v) -qqline(v, col = "plum") # normal - -# Exactly as the CLT predicts, the more often we sample - we tried -# 12, 77, and 374 samples - the more "normal" the distribution looks. - -# What does a distribution look like that is NOT normal? -# Let's try simulating an "Extreme value distribution". This type of -# distribution appears if we choose the max() of a sample - -set.seed(112358) -rEVD <- numeric(9999) -for (i in seq_along(rEVD)) { - rEVD[i] <- max(rnorm(100)) -} -set.seed(NULL) - -hist(rEVD, breaks = 20, col = "orchid") -# Note the long tail on the right! - -qqnorm(rEVD) -qqline(rEVD, col = "orchid") # Definitely not "normal"! - - -# == 3.2 qqplot() ========================================================== - -# qqplot() works like qqnorm(), except that we compare two arbitrary -# distribtutions, rather than one distribution against the normal distribution -# as we did before. Sample against sample. - -x <- seq(0, 4, length.out = 100) - -dl <- dlnorm(x) # log-normal distribution -dg <- dgamma(x, shape=1.5) # gamma distribution - -plot(dl, type="l") -points(dg, type="l", col = "maroon") - -qqplot(dl, dg) # clearly not equal - - -# = 4 Quantifying the difference ========================================== - -# Quantile-quantile plots give us a visual estimate, but how do we quantify the -# difference between distributions? Let's compare two types of extreme-value -# distributions, a lognormal distribution with the same distribution that is -# slightly shifted, and three gamma distributions with three different shape -# parameters. Let's define and visualize the distributions first, to see what -# we are comparing. - -x <- seq(0, 4, length.out = 100) - -set.seed(112358) -dl1 <- dlnorm(x) # log-normal distribution -dl2 <- dlnorm(x - 0.25) # log-normal distribution, shifted right (a bit) -dg1.2 <- dgamma(x, shape=1.2) # three gamma distributions with... -dg1.5 <- dgamma(x, shape=1.5) # ...wider, and wider... -dg1.9 <- dgamma(x, shape=1.9) # ...peak -set.seed(NULL) - -myCols <- c("black", "grey", "maroon", "turquoise", "steelblue") - -plot(dl1, type="l", lwd=2) # visualize the distributions -points(dl2, type="l", col = myCols[2]) -points(dg1.2, type="l", col = myCols[3]) -points(dg1.5, type="l", col = myCols[4]) -points(dg1.9, type="l", col = myCols[5]) -legend("topright", - legend = c("dl1", "dl2", "dg1.2", "dg1.5", "dg1.9"), - lty = 1, - lwd = c(2, 1, 1, 1, 1), - col = myCols, - bty = "n") - - -# == 4.1 Chi2 test for discrete distributions ============================== - -# The chi2 test can be used to compare discrete distributions - even though -# it is not ideal for this purpose. -# (https://stats.stackexchange.com/questions/113692) -# -# Let's draw 100 random variables according to our target distributions -N <- 100 -set.seed(112358) -rL1 <- rlnorm(N) # log-normal distribution -rL2 <- rlnorm(N, meanlog = 0.25) # log-normal distribution, shifted right -rG1.2 <- rgamma(N, shape=1.2) # three gamma distributions with... -rG1.5 <- rgamma(N, shape=1.5) # ...wider, and wider... -rG1.9 <- rgamma(N, shape=1.9) # ...peak -set.seed(NULL) - -maxX <- max(c(rL1, rL2, rG1.2, rG1.5, rG1.9)) - -myBreaks <- seq(0, 5, length.out = 10) # 9 intervals from 0 to 5... -myBreaks <- c(myBreaks, maxX) # ... and one that contains the outliers - -# It's easy to plot a histogram of one set of random deviates... -hist(rG1.5, breaks = myBreaks, col = myCols[4]) - -# ... but basic R has no inbuilt function to stack histogram bars side-by-side. -# We use the multhist() function in the plotrix package: check out the -# package information - plotrix has _many_ useful utilities to enhance -# plots or produce informative visualizations. - -if (! requireNamespace("plotrix", quietly = TRUE)) { - install.packages("plotrix") -} - -# Package information: -# library(help = plotrix) # basic information -# browseVignettes("plotrix") # available vignettes -# data(package = "plotrix") # available datasets - - -h <- plotrix::multhist(list(rL1, rL2, rG1.2, rG1.5, rG1.9 ), - breaks = myBreaks, - col = myCols) -legend("topright", - legend = c("rL1", "rL2", "rG1.2", "rG1.5", "rG1.9"), - pch=15, - col = myCols, - bty="n") - -# We have assigned the output of multihist to the variable h, which now -# contains the densities, midpoints, breaks etc. of the histogram ... -# as well as the matrix of counts: -h[[2]] - -# But using hist() or multhist() for binning is a bit of a hack - even though -# it works, of course. The "real" R function to bin data is cut(). cut() -# sorts the values of a vector into bins, and returns the bin-labels as -# integers. - -x <- cut(rL1, breaks = myBreaks, labels = FALSE) -table(x) - -countsL1 <- table(cut(rL1 , breaks = myBreaks, labels = FALSE)) -countsL2 <- table(cut(rL2 , breaks = myBreaks, labels = FALSE)) -countsG1.2 <- table(cut(rG1.2, breaks = myBreaks, labels = FALSE)) -countsG1.5 <- table(cut(rG1.5, breaks = myBreaks, labels = FALSE)) -countsG1.9 <- table(cut(rG1.9, breaks = myBreaks, labels = FALSE)) - - -chisq.test(countsL1, countsL2) - -# Note that this use of the chi2 test does not have very much power, since it -# does not assume the values for the bins are ordered, but takes them to -# be independent. Also, chisq.test() complains about the Chi-squared -# approximation to be possibly incorrect because some of the counts are small. -# In this case, rather than rely on the in-built chi-square table, we can do -# an explicit simulation to estimate the p-value for the null hypothesis. -# -chisq.test(countsL1, countsL2, simulate.p.value = TRUE, B = 10000) - -# Note that the probability that the samples came from the same distribution is -# quite high. We don't seem to be able to distinguish l1 and l2 with the chi2 -# test. - -# Let's calculate this for the other distribution too: - -chisq.test(countsL1, countsG1.2, simulate.p.value = TRUE, B = 10000) -chisq.test(countsL1, countsG1.5, simulate.p.value = TRUE, B = 10000) -chisq.test(countsL1, countsG1.9, simulate.p.value = TRUE, B = 10000) - -# As a result, we would conclude that none of these distributions are -# significantly different. - -# == 4.2 Kullback-Leibler divergence ======================================= - -# For discrete probability distributions, there is a much better statistic, the -# Kullback-Leibler divergence (or relative entropy). It is based in information -# theory, and evaluates how different the matched pairs of outcome categories -# are. Its inputs are the probability mass functions (p.m.f.) of the two -# functions to be compared. A probability mass function is the probability of -# every outcome the process can have. Kullback-Leibler divergence therefore can -# be applied to discrete distributions. But we need to talk a bit about -# converting counts to p.m.f.'s. - -# === 4.2.1 An example from tossing dice - -# The p.m.f of an honest die is (1:1/6, 2:1/6, 3:1/6, 4:1/6, 5:1/6, 6:1/6). But -# there is an issue when we convert sampled counts to frequencies, and estimate -# probabilities with these frequencies. The problem is: by chance we might not -# have observed a particular outcome! Consider this example: - -set.seed(47) -N <- 20 -(counts <- table(sample(1:6, N, replace = TRUE))) -set.seed(NULL) - -# We have not observed a "2"! -# -# Now, if we convert the counts to frequencies, and assume these to be -# probabilities, we get an observed p.m.f: -pmf <- numeric(6) -for (i in seq_along(counts)) { - outcome <- as.integer(names(counts)[i]) - pmf[outcome] <- counts[i]/N -} -names(pmf) <- 1:6 -pmf - -# This means we assign a probability of 0 to the outcome "2" - because we -# haven't observed it. But how do we compare it then? What does it mean when we -# should have 1/6 of "2"s but we have none whatsoever? Taken at face value it -# means we are comparing apples to oranges - essentially a five-faced die with a -# six-faced die - and therefore divergence is infinitely large. Obviously, that -# was just a problem caused by our limited sampling, but the question remains: -# how do we account for missing data? There are several solutions, for example, -# for ordered data one could substitute the average values of the two bracketing -# outcomes. But a simple and quite robust solution is to add "pseudocounts". -# This is called adding a Laplace prior, or a Jeffreys prior: in our case, -# simply add 0.5 to every category. - -# pmf of an honest die -pmfHD <- rep(1/6, 6) -names(pmfHD) <- 1:6 -pmfHD - -# pmf, estimated from our sampled counts with and without pseudocounts - -pmfPC <- numeric(6) + 0.5 -for (i in seq_along(counts)) { - outcome <- as.integer(names(counts)[i]) - pmfPC[outcome] <- counts[i] + pmfPC[outcome] -} -pmfPC <- pmfPC / sum(pmfPC) -names(pmfPC) <- 1:6 -pmf # before -pmfPC # after - -# The definition of a function that takes samples and returns a pmf -# with pseudocounts is straightforward, but requires a bit of juggling -# the observed values into the right slots. Here's what this can look like: - -pmfPC <- function(cts, nam) { - # Convert counts to a p.m.f, adding a pseudocount of 0.5 to all categories - # of outcomes (Jeffreys prior). - # Parameters: - # cts num raw counts - # nam names of the categories, converted to char - # Value a probability mass function - - nam <- as.character(nam) - if (!all(names(cts) %in% nam)) { - stop("PANIC: names in \"cts\" do not match \"nam\"!") - } - pmf <- numeric(length(nam)) - names(pmf) <- nam - pmf[names(cts)] <- cts[names(cts)] - pmf <- pmf + 0.5 # add pseudocounts - return(pmf/sum(pmf)) -} - - -# The definition of the Kullback-Leibler divergence itself is quite simple -# actually: for two distributions, p and q it is sum(p * log( p / q)) - -KLdiv <- function(p, q) { - # p and q are two pmfs of discrete probability distributions - # with the same outcomes, which are nowhere 0. - # Value: Kullback-Leibler divergence sum(p * log( p / q))). - - if (length(p) != length(q)) { - stop("PANIC: input vector lengths differ!") - } - if (any(c((p == 0), (q == 0)))) { - stop("PANIC: 0's found in input vectors!") - } - - return(sum(p * log( p / q ))) -} - -# Now we can calculate KL-divergences for our six-faced die example: - -KLdiv(rep(1/6, 6), pmfPC(counts, 1:6)) # p.m.f. of an honest die vs. our - # actual counts - -# Is that a lot? Let's look at the distribution of KL-divergences in our -# six-sided die scenario: p.m.f. of 20 samples each versus the theoretical -# p.m.f. - -N <- 1000 -nSample <- 20 -divs <- numeric(N) -for (i in 1:N) { - x <- table(sample(1:6, nSample, replace = TRUE)) - divs[i] <- KLdiv(rep(1/6, 6), pmfPC(x, 1:6)) -} - -hist(divs, - col = "whitesmoke", - xlab = "Kullback-Leibler divergence", - main = sprintf("%d samples of honest die", nSample)) -abline(v = KLdiv(rep(1/6, 6), pmfPC(counts, 1:6)), col="firebrick") - -# We see that our example sample (KL-divergence marked with the red line) is -# somewhat but not drastically atypical. - - -# === 4.2.2 An example from lognormal distributions - -# We had compared a set of lognormal and gamma distributions above, now we -# can use KL-divergence to quantify their similarity: - -pmfL1 <- pmfPC(countsL1, nam = 1:10) -pmfL2 <- pmfPC(countsL2, nam = 1:10) -KLdiv(pmfL1, pmfL2) # 0.1087 - -# To evaluate what this number means, we can run a simple simulation: we create -# random samples according to the rL1 distribution, calculate the Kullback -# Leibler divergence with countsL1, and compare the distribution we get with the -# value we observed as the difference with discL2. Essentially, this tells us -# the probability that countsL2 is actually a sample from the L1 function. -# Here we go: - -N <- 1000 -divs <- numeric(N) - -set.seed(31416) -for (i in 1:N) { - x <- rlnorm(100) # get random samples from our reference distributions - y <- table(cut(x, breaks = myBreaks, labels = FALSE)) # tabulate counts - q <- pmfPC(y, nam = 1:10) # convert to p.m.f. with pseudocounts - divs[i] <- KLdiv(pmfL1, q) # calculate Kullback-Leibler divergence -} -set.seed(NULL) - -hist(divs, - col = "thistle", - xlab = "Kullback-Leibler divergence", - main = sprintf("Samples from shifted lnorm()")) -abline(v = KLdiv(pmfL1, pmfL2), col="firebrick") - -# How many KL-divergences were less than the difference we observed? -sum(divs < KLdiv(pmfL1, pmfL2)) # 933 - -# Therefore the empirical p-value that the samples came from the same -# distribution is only 100 * ((N - 933) + 1) / (N + 1) (%) ... 6.8%. You see -# that this gives a much more powerful statistical approach than the chi2 test -# we used above. - - -# == 4.3 Continuous distributions: Kolmogorov-Smirnov test ================= - -# The Kolmogorov-Smirnov (KS) test is meant for continuous distributions, i.e. -# the probability it calculates assumes that the function values are all -# different. In the case of random samples, that is a reasonable assumption. KS -# is a two-sample goodness of fit test, i.e. it has a null-hypothesis that the -# samples were taken from the same (unknown) distribution, and then asks whether -# this is likely, given the actual values. It is sensitive both to differences -# in location (position of the mean), and differences in shape. R has the -# ks.test() function to calculate it. - -ks.test(dl1, dl2) # vs. shifted log-normal. -ks.test(dl1, dg1.2) # vs. the three gamma distributions -ks.test(dl1, dg1.5) -ks.test(dl1, dg1.9) -ks.test(dg1.5, dg1.9) # the two last gammas against each other - -# (The warnings about the presence of ties comes from the 0's in our function -# values). The p-value that these distributions are samples of the same -# probability distribution gets progressively smaller. - - - -# [END] +# tocID <- "FND-STA-Probability_distribution.R" +# +# +# Purpose: A Bioinformatics Course: +# R code accompanying the FND-STA-Probability_distribution unit. +# +# Version: 1.6 +# +# Date: 2017-10 - 2020-11 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.6 Revise use of data argument to nls()/nlrob() +# 1.5 Extensive additions on Poisson and binomial distributions +# and regression fits +# 1.4 2020 Maintenance +# 1.3 Change from require() to requireNamespace(), +# use ::() idiom throughout, +# 1.2 Update set.seed() usage +# 1.1 Corrected empirical p-value +# 1.0 First code live version +# +# TODO: +# Add tasks +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------------------------------------------- +#TOC> 1 Introduction 68 +#TOC> 2 Three fundamental distributions 131 +#TOC> 2.1 The Poisson Distribution 134 +#TOC> 2.2 The hypergeometric distribution 228 +#TOC> 2.2.1 Digression: qqplot() and residuals 376 +#TOC> 2.2.2 Fitting functions 436 +#TOC> 2.2.2.1 Fit a normal distribution (using nls() ) 506 +#TOC> 2.2.2.2 Fit a normal distribution (using nlrob()) ) 525 +#TOC> 2.2.2.3 Extreme Value distributions: Gumbel 552 +#TOC> 2.2.2.4 Extreme Value distributions: Weibull 579 +#TOC> 2.2.2.5 Logistic distribution 621 +#TOC> 2.2.2.6 Log-Logistic distribution 650 +#TOC> 2.2.2.7 Fitting a negative binomial distribution 679 +#TOC> 2.2.2.8 Fitting a binomial distribution 732 +#TOC> 2.3 The uniform distribution 844 +#TOC> 2.4 The Normal Distribution 864 +#TOC> 3 quantile-quantile comparison 905 +#TOC> 3.1 qqnorm() 915 +#TOC> 3.2 qqplot() 981 +#TOC> 4 Quantifying the difference 998 +#TOC> 4.1 Chi2 test for discrete distributions 1032 +#TOC> 4.2 Kullback-Leibler divergence 1124 +#TOC> 4.2.1 An example from tossing dice 1135 +#TOC> 4.2.2 An example from lognormal distributions 1257 +#TOC> 4.3 Continuous distributions: Kolmogorov-Smirnov test 1300 +#TOC> +#TOC> ========================================================================== + + +# = 1 Introduction ======================================================== + +# The space of possible outcomes of events is called a probability distribution +# and the properties of probability distributions are crucial to our work. Many +# distributions like the (discrete) Poisson, or the (continuous) Normal +# distribution have been characterized in great detail, their behaviour is well +# understood, and they are useful for countless applications - but we also need +# to able to work with ad hoc distributions that have never been seen before. + +# Let's get a few facts about probability distributions out of the way: + +# The "support" of a probability distribution is the range of outcomes that have +# a non-zero probability. The "domain" of a probability distribution is the +# range of probabilities that the distribution can take over its support. Think +# of this as the ranges on the x- and y-axis respectively. Thus the distribution +# can be written as p = f(x). + +# The integral over a probability distribution is always 1. This means: the +# distribution reflects the situation that an event does occur, any event, but +# there is not "no event". + +# R's inbuilt probability functions always come in four flavours: +# d... for "density": this is the probability density function (p.d.f.), +# the value of f(x) at x. +# p... for "probability": this is the cumulative distribution function +# (c.d.f.). It is 0 at the left edge of the support, and 1 at +# the right edge. +# q... for "quantile": The quantile function returns the x value at which p... +# takes a requested value. +# r... for "random": produces random numbers that are distributed according +# to the p.d.f. + +# To illustrate with the "Normal Distribution" (Gaussian distribution): + +# 1000 normally distributed values with default parameters: mean 0, sd 1. +r <- rnorm(1000) + +# pastel green: histogram of 1000 random samples +hist(r, + freq = FALSE, + breaks = 30, + xlim = c(-4, 4), + ylim = c(0, 1), + main = "Normal Distribution", + xlab = "x", + ylab = "f(x)", + col = "#E6FFF6") + +# 100 equally spaced point along x +x <- seq(-4, 4, length.out = 100) + +# black: c. d. f. along x. Note that this asymptotically reaches 1 +points(x, pnorm(x), type = "l") + +# dark red: p. d. f. along x +points(x, dnorm(x), type = "l", lwd = 2, col="firebrick") + +# purple: 1% and 99% quantiles +abline(v = qnorm(c(0.01, 0.99)), lwd = 0.5, col = "#CCAAFF") + +# Study this plot well and familiarize yourself with the terms. + + +# = 2 Three fundamental distributions ===================================== + + +# == 2.1 The Poisson Distribution ========================================== + +# The Poisson distribution is a discrete probability distribution that +# characterizes how many events we expect among a given number of observations +# if the mean probability of an event is known. Assume we know that there are +# 256 transcription factors among the 6091 protein-coding genes of yeast, then +# the probability of picking a transcription factor at random from all ORFs is +# 256/6091 ~= 4.2%. How many transcription factors do we expect in a sample of +# 250 genes - like, for example, the top 250 differentially expressed genes in +# an assay? This is a frequently encountered type of question, converging on the +# information contained in a "list of genes". Once an assay has yielded a list +# of genes, what can we learn from looking at staistical features of its +# membership. In the transcription factor model, the question is: how many +# transcription factors do we expect as members of our list - and did we +# actually observe more or less than that? +# +# It would seem that the the probability of encountering _one_ transcription +# factor among our genes is 256/6091 and therefore the number of transcription +# factors we expect to choose at random is (250 * 256)/6091 i.e. 10.50731 in the +# average over many trials. Let's repeat our experiment a million times and see what we get: + +N <- 1000000 # One million trials +genes <- numeric(6091) # All genes are 0 +genes[1:256] <- 1 # TFs are 1 + +hAssays <- numeric(N) # initialize vector +set.seed(112358) +for (i in 1:N) { + pBar(i, N) + hAssays[i] <- sum(sample(genes, 250)) # sum of TFs in our sample in this trial +} +set.seed(NULL) + +# And the average is: +mean(hAssays) # 10.50293 + +# ... which is superbly close to our expectation of 10.50731 + +# All good - but we won't get 10.5 transcription factors in our assay. We'll +# observe five. Or thirteen. Or thirtysix. Or none at all ... and then we ask +# ourselves: is the number of observed transcription factors significantly +# different from what we would have expected if our experiment identified a +# transcription factor just as likely as it identified any other gene? To answer +# this, we need to consider the probability distribution of possible outcomes of +# our assay. Back to the Poisson distribution. In R it is implemented as dpois() +# and its parameters are: the number of observed events, and the probability of +# observing an event: + +dpois(0, (250 * 256) / 6091) # Probability of seeing no TFs +dpois(1, (250 * 256) / 6091) # Probability of seing one ... +dpois(2, (250 * 256) / 6091) # Probability of seing two ... +dpois(3:10, (250 * 256) / 6091) # Probability of seing from three to ten ... +sum(dpois(0:4, (250 * 256) / 6091)) # Probability of seeing four or less ... + +sum(dpois(0:250, (250*256)/6091)) # The sum over all possibilities is (for + # any probability distribution) exactly one. + +# Lets plot these probabilities ... +nMax <- 28 + +x <- dpois(0:nMax, (250 * 256) / 6091) + +barMids <- barplot(x, + col = "#FCF3CF", + names.arg = as.character(0:nMax), + cex.names = 0.5, + axes = TRUE, + ylim = c(0, 0.15), + xlab = "# of TF in set", + ylab = "p") + +# ... and add our simulated assays: + +(th <- table(factor(hAssays, levels = 0:nMax))/N) + +points(barMids - 0.55, th, type = "s", col = "firebrick") +abline(v = (((250 * 256) / 6091) * (barMids[2] - barMids[1])) + barMids[1], + col = "#5588FF") # scale to the correct position in the barplot +legend("topright", + legend = c("Poisson", "simulated", "expectation"), + pch = c(22, NA, NA), # one box, two lines only + pt.cex = 1.4, # larger, to match bar-width better + pt.bg = c("#FCF3CF", NA, NA), # bg color only for the box + lty = c(0, 1, 1), # no line for the box + col = c("#000000", "firebrick", "#5588FF"), + bty = "n") # no frame around the legend + +# NOTE: The simulation shows us that our expectations about the number of +# transcription factors in a sample are almost, but not exactly Poisson +# distributed. Can you figure out where we went wrong? Maybe the +# Poisson distribution is not quite the correct distribution to +# model our expectations? + + +# == 2.2 The hypergeometric distribution =================================== + +# With that suspicion in mind, we reconsider what we were trying to achieve at +# each point of the Poisson distribution. Assume we have observed seven +# transcription factors in our set of 250 genes. So we asked: what is the +# probability of observing seven? And concluded: + +dpois(7, (250 * 256) / 6091) # Probability of seeing seven ... + +# ... which is the probability of seven events in 250 choices if the underlying +# probability is equal to fraction of transcription factors among genes. But +# wait: we weren't careful in our simulation. Assume that our first observed +# gene was a transcription factor. Is the probability of the next sample the +# same? Not quite: one transcription factor has been observed, 249 more samples +# need to be considered, and there are now 6090 genes to choose from. I.e. the +# mean probability changes with every observation: + +(250 * 256) / 6091 # First sample, a TF: p = 10.50731 +(249 * (256 - 1)) / (6091 - 1) # Second sample: p = 10.42611 (-0.992 %) + +# This is actually noticeable: the mean probability for transcription factors +# drops by about one percent after a transcription factor is observed. But what +# if we would have observed the first transcription factor as the tenth gene? + +(239 * (256 - 1)) / (6091 - 10) # Eleventh sample: p = 10.0222 (-0.954 %) + +# This is getting complicated and we need a different way to think about this if +# we don't want to enumerate all possibilities by hand. (There are far too +# many!) Generally, the probability of observing a certain number of events in a +# series is the number of ways to realize the desired outcome, divided by the +# number of possible outcomes. So, if we code transcription factors by "1" and +# other genes by "0", seven transcription factors could be + +# 01010100100100100100000000000000000000000 ..., or +# 01110111100000000000000000000000000000000 ..., or +# 11101001000010000000100000000000000000000 ..., or any other combination. + +# But crucially, our number of trials is limited and every "success" changes the +# probability of future successes. This is sampling without replacement! And +# sampling without replacement is modeled by the so-called "hypergeometric +# distribution". This is the big difference: when we are sampling WITH +# replacement, we can model the process with a Poisson distribution. When we are +# sampling WITHOUT replacement, we use a hypergeometric distribution instead. + +# Let's first re-run our simulated assays. We put the previous run into the +# vector "hAssays" which I prefixed "h" as in "hypergeometric" because I knew +# what was coming, and that I had sampled WITHOUT replacement because that is +# the default for the sample() function. Accordingly, we call the new samples +# "pAssays", where "p" stands for Poisson: + +N <- 1000000 # One million trials +genes <- numeric(6091) # All genes are 0 +genes[1:256] <- 1 # TFs are 1 + +pAssays <- numeric(N) # initialize vector +set.seed(112358) +for (i in 1:N) { + pBar(i, N) + pAssays[i] <- sum(sample(genes, 250, replace = TRUE)) +} +set.seed(NULL) + +# Now the average is: +mean(pAssays) # 10.50312 which is essentially the same as 10.50293 + +# And the plot ... + +nMax <- 28 +barMids <- barplot(dpois(0:nMax, (250 * 256) / 6091), + names.arg = as.character(0:nMax), + cex.names = 0.5, + axes = TRUE, + ylim = c(0, 0.15), + xlab = "# of TF in set", + ylab = "p", + col = "#FCF3CF") +abline(v = (((250 * 256) / 6091) * (barMids[2] - barMids[1])) + barMids[1], + col = "#5588FF") # scale to the correct position in the barplot +th <- table(factor(hAssays, levels = 0:nMax))/N +points(barMids - 0.55, th, type = "s", col = "firebrick") + +# Here are the new assays: +tp <- table(factor(pAssays, levels = 0:nMax))/N +points(barMids - 0.55, tp, type = "s", col = "seagreen") + +legend("topright", + legend = c("Poisson", + "no replacement", + "with replacement", + "expectation"), + pch = c(22, NA, NA, NA), + pt.cex = 1.4, + pt.bg = c("#FCF3CF", NA, NA, NA), + lty = c(0, 1, 1, 1), + col = c("#000000", "firebrick", "seagreen", "#5588FF"), + bty = "n") + +# Clearly .. the "correct" simulation, the simulation that is actually +# appropriate for the Poisson distribution, matches the theoretical values +# better. Now let's see how well the hypergeometric distribution matches our +# original simulated assays. +# The function dhyper(x, m, n, k) expects the following parameters: +# x: the number of observed positive events for which to +# compute the probability +# m: the number of positive events in the population +# n: the number of negative eventsw in the population +# k: the number of observations (or trials) + + dhyper(0, 256, 6091 - 256, 250) # Probability of seeing no TFs + dhyper(1, 256, 6091 - 256, 250) # Probability of seing one ... + dhyper(2, 256, 6091 - 256, 250) # Probability of seing two ... + dhyper(3:10, 256, 6091 - 256, 250) # Probability of three to ten ... +sum(dhyper(0:4, 256, 6091 - 256, 250)) # Probability of seeing four or less ... + +sum(dhyper(0:250, 256, 6091-256, 250)) # The sum over all possibilities is (for + # any probability distribution) + # exactly one. + +# Lets plot these probabilities like we did above ... +nMax <- 28 +x <- dhyper(0:nMax, 256, 6091 - 256, 250) + +barMids <- barplot(x, col = "#E6FFF6", + names.arg = as.character(0:nMax), + cex.names = 0.5, + axes = TRUE, + ylim = c(0, 0.15), + xlab = "# of TF in set", + ylab = "p") +abline(v = (mean(hAssays) * (barMids[2] - barMids[1])) + barMids[1], + col = "#5588FF") # scale to the correct position in the barplot +points(barMids - 0.55, th, type = "s", col = "firebrick") + +legend("topright", + legend = c("Hypergeometric", + "no replacement", + "expectation"), + pch = c(22, NA, NA), + pt.cex = 1.4, + pt.bg = c("#E6FFF6", NA, NA), + lty = c(0, 1, 1, 1), + col = c("#000000", "firebrick", "#5588FF"), + bty = "n") + +# This! +# This is what a correctly simulated distribution looks like. + + +# === 2.2.1 Digression: qqplot() and residuals + +# The indication that something was wrong with our simulation versus the +# theoretical expectation came from the observation that the differences between +# the barplot and theory were not quite random: the values near the mode were +# systematically too high, the values in the tails were systematically too low. +# This is a general principle: when you see a SYSTEMATIC deviation between +# simulation and theory, something is wrong with your understanding. Either +# there is a subtle error in how you set up the simulation, or a subtle +# misunderstanding about the requirements for the particular theory to apply. R +# has a general way to examine such differences: qqplot() plots the deviations +# between theory and observation ordered as ranks, i.e. not affected by absolute +# scale. (See here for an accessible introduction to qqplot() and the +# "quantiles" that it uses: +# https://data.library.virginia.edu/understanding-q-q-plots/) + +oPar <- par(mfrow = c(1, 2)) +qqplot( dpois(0:nMax, (250 * 256) / 6091), + th, + xlab = "Poisson distribution", + ylab = "sampling with replacement", + pch = 22, bg = "#FCF3CF") +abline(lm(th ~ dpois(0:nMax, (250 * 256) / 6091)), col = "seagreen") + +qqplot( dhyper(0:nMax, 256, 6091 - 256, 250), + th, + xlab = "hypergeometric distribution", + ylab = "sampling with replacement", + pch = 22, bg = "#E6FFF6") +abline(lm(th ~ dhyper(0:nMax, 256, 6091 - 256, 250)), col = "seagreen") + +par(oPar) + +# Similar information can be obtained from a residual plot, plotting differences +# between prediction and observation: + +oPar <- par(mfrow = c(1, 2)) +plot( dpois(0:nMax, (250 * 256) / 6091) - as.numeric(th), + type = "b", + ylim = c(-0.006, 0.006), + xlab = "# observations", + ylab = "Poisson density - obs.", + pch = 22, + bg = "#FCF3CF", + col = "#000000") +abline(h = 0, col = "seagreen") + +plot( dhyper(0:nMax, 256, 6091 - 256, 250) - as.numeric(th), + type = "b", + ylim = c(-0.006, 0.006), + xlab = "# observations", + ylab = "Hypergeometric density - obs.", + pch = 22, + bg = "#E6FFF6", + col = "#000000") +abline(h = 0, col = "seagreen") + +par(oPar) + + +# === 2.2.2 Fitting functions + +# Note that there is a further subtle catch: We did not actually ask about seven +# transcription factors! We asked about the probability of seven _different_ +# transcription factors - because, implicit in the assumptions I made about the +# assay (and reasonable for most gene lists), we count duplicates only once! +# Does this actually make a difference? We can model the situation by giving +# each transcription factor a name (or a number), sampling at random, and +# counting how many unique() factors we found in our sample: + +N <- 1000000 # One million trials +genes <- numeric(6091) # All genes are initially 0 +genes[1:256] <- 1:256 # TFs get a unique "name" + +# example sample: +set.seed(11235) +x <- sample(genes, 250, replace = TRUE) # Pick 250 random genes. +x[x != 0] # Note that 189 appears twice. +length(x[x != 0]) # We picked 8 transcription factors ... +unique(x) # but only 7 are unique (plus zero). +length(unique(x)) - 1 # Ignore the zero. + +# Do this a million times +uAssays <- numeric(N) # initialize vector +set.seed(112358) +for (i in 1:N) { + pBar(i, N) + uAssays[i] <- length(unique(sample(genes, 250, replace = TRUE))) - 1 +} +set.seed(NULL) + +# plot the poisson distribution (with replacement) as our baseline +nMax <- 28 +barMids <- barplot(dpois(0:nMax, (250 * 256) / 6091), + col = "#FCF3CF", + names.arg = as.character(0:nMax), + cex.names = 0.5, + axes = TRUE, + ylim = c(0, 0.15), + xlab = "# of TF in set", + ylab = "p") + +tu <- table(factor(uAssays, levels = 0:nMax))/N +points(barMids - 0.55, tu, type = "s", col = "#EE22FF") + +legend("topright", + legend = c("Poisson", + "unique genes"), + pch = c(22, NA), + pt.cex = 1.4, + pt.bg = c("#FCF3CF", NA), + lty = c(0, 1), + col = c("#000000", "#EE22FF"), + bty = "n") + +# Clearly, the distribution does not match our model exactly. + +# So what is the "correct" distribution that we could apply in this case? There +# may or may not be one readily available. What we can do instead is to use a +# more general model and fit parameters. This takes us to the domain of +# regression analysis and curve fitting. The general approach is as follows: +# - Decide on a statistical model; +# - Express it in parametrized form; +# - Fit the parameters; +# - Analyze the coefficients; + +# Insight into the underlying process that generated our data can be obtained +# by analyzing the fitted parameters, or simply plotting the results. Let's +# look at examples of fits to the sampled distribution above: + +# ==== 2.2.2.1 Fit a normal distribution (using nls() ) + +x <- 0:28 +plot(x, tu, type="s") +fit <- nls(tu ~ ( a / (sig*sqrt(2*pi)) ) * exp( (-1/2)*((x-mu)/sig)^2 ), + data = data.frame(x = 0:28, tu = tu), + start = c(a = 1, mu = 10, sig = 3)) # starting values + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, + type = "s") + +coef(fit) +# a mu sig +# 0.9990932 10.0717835 3.0588930 + +sum(resid(fit)^2) +# [1] 0.0001613488 + + +# ==== 2.2.2.2 Fit a normal distribution (using nlrob()) ) + +# There's a bit of an art to chosing starting parameters correctly and if the +# nls() fit does not converge, more robust methods are called for. + +if (! requireNamespace("robustbase", quietly = TRUE)) { + install.packages("robustbase") +} + +x <- 0:28 +plot(x, tu, type="s") +fit <- robustbase::nlrob(tu ~ ( a / (sig*sqrt(6.2831853072)) ) * + exp( (-1/2)*((x-mu)/sig)^2 ), + data = data.frame(x = 0:28, + tu = tu), + start = c(a = 1, mu = 10, sig = 3)) # starting values + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") + +coef(fit) +# a mu sig +# 1.002162 10.059189 3.071217 + +sum(resid(fit)^2) +# [1] 0.0001630868 + + +# ==== 2.2.2.3 Extreme Value distributions: Gumbel + +# Many processes that involve "best-of" choices are better modelled with +# so-called extreme-value distributions: here is the Gumbel distribution +# from the evd package. + +if (! requireNamespace("evd", quietly = TRUE)) { + install.packages("evd") +} + +x <- 0:28 +plot(x, tu, type="s") + +fit <- robustbase::nlrob(tu ~ evd::dgumbel(x, loc = L, scale = S), + data = data.frame(tu = tu, x = 0:28), + start = c(L = 7.3, S = 2.82)) + +points(x, predict(fit), type = "s", col = "#55DD88") + +coef(fit) +# L S +# 9.322110 2.818266 + +sum(resid(fit)^2) +# [1] 0.001027447 + + +# ==== 2.2.2.4 Extreme Value distributions: Weibull + +# Weibull distributions are common in reliabilty analysis. I found the +# distribution particularly hard to fit as it is quite sensitive to inital +# parameter estimates. https://en.wikipedia.org/wiki/Weibull_distribution + +# NOTE: the parameter TH is > X +idx <- 4:28 +myX <- idx +myY <- as.numeric(tu)[idx] +plot(myX, myY, type="s") + +dWei <- function(x, th, l, k) { + a <- k/l + b <- ((x-th)/l)^(k-1) + c <- exp(-((x-th)/l)^k) + y <- a * b * c + return(y) +} + +set.seed(112358) +fit <- robustbase::nlrob(y ~ dWei(x, th = TH, l = L, k = K), + data = data.frame(y = myY, + x = myX), + lower = c(TH = 3.5, + L = 8, + K = 2.5), + upper = c(TH = 3.7, + L = 9, + K = 3), + method = "mtl") + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") + +coef(fit) +# TH L K +#3.630807 8.573898 2.795116 + +sum(resid(fit)^2) +# [1] 7.807073e-05 + + +# ==== 2.2.2.5 Logistic distribution + +# Similar to normal distribution, but with heavier tails +# https://en.wikipedia.org/wiki/Logistic_distribution + +myX <- 0:28 +myY <- as.numeric(tu) +plot(myX, myY, type="s") + +dLogi <- function(x, mu, s) { + y <- (exp(-(x-mu)/s)) / (s * (1+exp(-(x-mu)/s))^2) + return(y) +} + +fit <- robustbase::nlrob(y ~ dLogi(x, mu = M, s = S), + data = data.frame(y = myY, + x = myX), + start = c(M = 10, S = 3)) + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") + +coef(fit) +# M S +# 10.088968 1.891654 + +sum(resid(fit)^2) +# [1] 0.0004030595 + + +# ==== 2.2.2.6 Log-Logistic distribution + +# Special case of logistic, often used in survival analysis +# https://en.wikipedia.org/wiki/Log-logistic_distribution + +myX <- 0:28 +myY <- as.numeric(tu) +plot(myX, myY, type="s") + +dLogLogi <- function(x, a, b) { + y <- ((b/a)*(x/a)^(b-1)) / (1+((x/a)^b))^2 + return(y) +} + +fit <- robustbase::nlrob(y ~ dLogLogi(x, a = A, b = B), + data = data.frame(y = myY, + x = myX), + start = c(A = 9.5, B = 4.8)) + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") + +coef(fit) +# A B +# 10.310181 5.288385 + +sum(resid(fit)^2) +# [1] 0.0006343927 + + +# ==== 2.2.2.7 Fitting a negative binomial distribution + +# The negative binomial distribution is related to the Poisson distribution. +# Assume you are observing events and and counting how many successes of a +# Bernoulli process (essentially a coin-flip) we encounter before we encounter a +# failure. Unlike the Poisson, it models mean and variance separately and is therefore especially useful for overdispersed functions. (cf. https://en.wikipedia.org/wiki/Negative_binomial_distribution) +# + +x <- 0:28 +plot(x, tu, type="s") + +# Negative binomial +dNB <- function(x, r, p) { + # Note: r is an integer! + y <- choose((x + r - 1), (r - 1)) * (1-p)^x * p^r + return(y) +} + +set.seed(112358) +RR <- 104 +fit <- robustbase::nlrob(tu ~ dNB(x, r = RR, p = P), + data = data.frame(x = x, RR = RR), + lower = c(P = 0.01), + upper = c(P = 0.99), + method = "mtl") + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") + +coef(fit) +# P +# 0.9100729 + +sum(resid(fit)^2) +# [1] 0.0005669086 + +# Nb. the parameter R is not continuous: to optimize it as an integer, we try +# reasonable choices and record the best fit. +N <- 150 +R <- numeric(N) +for (thisR in 1:N) { + set.seed(112358) + fit <- robustbase::nlrob(y ~ dNB(x, r = thisR, p = P), + data = data.frame(x = x, + thisR = thisR), + lower = c(P = 0.01), + upper = c(P = 0.99), + method = "mtl") + R[thisR] <- sum(resid(fit)^2) +} +plot(R) +which(R == min(R)) + + +# ==== 2.2.2.8 Fitting a binomial distribution +# The workhorse distribution for Bernoulli proceeses +# cf. https://en.wikipedia.org/wiki/Binomial_distribution + + +myX <- 0:28 +myY <- as.numeric(tu) +plot(myX, myY, type="s") + +dBinom <- function(x, s, p) { + y <- choose(s, x) * (p^x) * ((1-p)^(s-x)) + return(y) +} + +fit <- robustbase::nlrob(y ~ dBinom(x, s = S, p = P), + data = data.frame(y = myY, + x = myX), + start = c(S = 240, P = 256/6091)) + +points(x, predict(fit), col = "#CC00CC55", lwd = 2, type = "s") + +coef(fit) +# S P +# 122.77746436 0.08376922 + +sum(resid(fit)^2) +# [1] 1.114272e-06 + +# Here we go: near perfect fit. But note the parameters! Can you identify the +# relationship of S and P to our model of choosing unique transcription factors +# in a random sampling process? + +# Remember what we started out with: +points(x, dBinom(x, 240, 256/6091), + col = "#00AAFF55", lwd = 2, type = "s") + +# The model has improved a lot from our starting-value guess. But how does an +# effective sample size of 122.78 relate to the actual value of 250 samples? And +# how does a probability for choosing a transcription factor of 0.0838 relate to +# having 256 transcription factors among 6091 genes (a fraction of 0.0420)? Well +# - if you stare at the numbers for a bit you might notice that the fitted +# sample size is about half of what we had, while the fitted probability is +# about twice that. Let's correct for the factor of two, and look at the fit ... + +points(x, dBinom(x, coef(fit)["S"] * 2 , coef(fit)["P"] / 2), + col = "#00FF8899", lwd = 2, type = "s") + +# interesting ... that's not so bad ... Essentially what this tells us is: our +# model is very similar to one in which our effective sample size would have +# been about 246 genes, not 250, and the number of our genes would have been +# close to 0.04188461 * 6091 ~= 255 transcription factors, not 256. Close, to - +# but not almost perfect. + +# Incidentally: would you have thought that we can +# detect the number of transcription factors in our sample +- 1 if we just +# sample frequently enough? + +# Let's examine the effect that applying various factors to size and probability +# have on our distribution: + + +z <- c(1/8:2 , 1, 2:8, 10, 20, 50) +myCols <- colorRampPalette(c("#00000022", + "#00000088", + "#DD0000DD", + "#0088FF88", + "#0088FF55", + "#0088FF22"), + alpha=TRUE)(length(z)) + +myLwd <- rep(1.25, length(z)) +myLwd[z == 1] <- 2.5 # make the actual fitted value stand out + +plot(x, y, type="s", ylim =c(0, 0.22), lwd = 5, col="#FF990077") + +for (i in seq_along(z)) { + points(x, dBinom(x, coef(fit)["S"] * z[i] , coef(fit)["P"] / z[i]), + col = myCols[i], type = "s") +} + +legend("topright", + legend = sprintf("%3.2f", z), + cex = 0.5, + col = myCols, + lwd = myLwd, + bty = "n") + +# We see how factors less than 1 applied to our actual sample size and fraction +# of transcription factors increasingly narrow the distribution; factors larger +# than one increasingly broaden the distribution but in a much slower manner. A +# factor of one (i.e. half size, double probability) hits the sweet spot and +# recaptures the essence of our observation. Clearly, this is a case of +# fortuitously cancelling errors. + + +# What is the take-home message here? +# - The standard Poisson and hypergeometric distributions apply to +# very specific models of choice processes (with/without replacement); +# - It is not trivial to choose the right statistical model for any particular +# real-world specification of a sampling process. Our model of unique +# choices is neither Poisson nor hypergeometric distributed. Once we have +# identified the parameters of a binomial distribution that models the +# process perfectly, we nevertheless note that we don't seem to be +# able to interpret the parameters easily. +# - Stochastic modeling allows us to validate whether the model is correct, +# but in case there are discrepancies it is not obvious what might be +# a more appropriate model and how to parametrize it. +# - If building an explicit stochastic model is not possible, we'll have to +# to do the best we can, in this case that would mean: choose a more +# general distribution and parametrize it. + + +# == 2.3 The uniform distribution ========================================== + +# The uniform distribution has the same probability over its entire support. R's +# runif() function takes the desired number, the min and the max as arguments. +# Let's plot a histogram of a million values between -1 and 1 to demonstrate. + +hist(runif(1e6, -1, 1), breaks = 20, col = "#FFE6F6") +abline(h = 1e6/20, col="firebrick") + +# One of the important uses of the uniform distribution is to write conditional +# expressions that are TRUE with a given probability. For example, to get TRUE +# values with a probability of 1/3, we pick a random number between 0 and 1, and +# ask whether the number is smaller than 1/3. Example: + +runif(10) < 1/3 + +#confirm with a million trials +sum(runif(1e6) < 1/3)/1e6 # should be close to 0.33333... + + +# == 2.4 The Normal Distribution =========================================== + +# The king of probability distributions. Why? That's because of the Central +# Limit Theorem (CLT) that essentially says that a process that is subject to +# small fluctuations will tend to normally distributed outcomes ... and in +# biology literally everything is subject to small fluctuations. + +# Lets simulate: Lets create a vector of 12345 numbers, choose samples of size +# 77 from that vector and calculate the mean. We do that 9999 times. I am just +# using odd numbers so it is clear in the code which number represents what. + +x <- runif(12345) +v <- numeric(9999) +for (i in 1:length(v)) { + v[i] <- mean(sample(x, 77)) +} + +hist(v, breaks = 20, col = "#F8DDFF") + +# Let's try this again, this time sampling from an exponential distribution ... +x <- rexp(12345) +v <- numeric(9999) +for (i in 1:length(v)) { + v[i] <- mean(sample(x, 77)) +} + +hist(v, breaks = 20, col = "#F8DDFF") + +# ... or from a t-distribution ... +x <- rt(12345, df = 3) +v <- numeric(9999) +for (i in 1:length(v)) { + v[i] <- mean(sample(x, 77)) +} + +hist(v, breaks = 20, col = "#F8DDFF", freq = FALSE) + +# The outcomes all give normal distributions, regardless what the details of our +# original distribution were! + + +# = 3 quantile-quantile comparison ======================================== + + +# Once we have observed a distribution of outcomes, the next task is often to +# quantify whether the values correspond to a known distribution. This can be +# done with quantile-quantile plots that plot the quantile values of one +# distribution against those of the other. Identically distributed quantiles lie +# on a straight line. + + +# == 3.1 qqnorm() ========================================================== + +# The functions qqnorm() and qqline() perform this +# comparison with the normal distribution. + +set.seed(112358) +x <- rnorm(100, mean=0, sd=1) # 100 normally distributed values +set.seed(NULL) + +qqnorm(x) +qqline(x, col = "seagreen") + +# Our variables in x appear normally distribute - which is not surprising since +# we produced them with rnorm(). What about the kind of sampling we did above? +# Let's test whether samples from an exponential distribution are normally +# distributed (previously we just visually inspected the histogram.) + +# Create a vector of sample means from the exponential distribution; use +# only a few samples for the mean +x <- rexp(12345) +v <- numeric(999) + +set.seed(112358) +for (i in 1:length(v)) { + v[i] <- mean(sample(x, 12)) +} +set.seed(NULL) + +qqnorm(v) +qqline(v, col = "turquoise") # normal + +#try with more samples +for (i in 1:length(v)) { + v[i] <- mean(sample(x, 77)) +} +qqnorm(v) +qqline(v, col = "steelblue") # normal + +#try with many samples +for (i in 1:length(v)) { + v[i] <- mean(sample(x, 374)) +} +qqnorm(v) +qqline(v, col = "plum") # normal + +# Exactly as the CLT predicts, the more often we sample - we tried +# 12, 77, and 374 samples - the more "normal" the distribution looks. + +# What does a distribution look like that is NOT normal? +# Let's try simulating an "Extreme value distribution". This type of +# distribution appears if we choose the max() of a sample + +set.seed(112358) +rEVD <- numeric(9999) +for (i in seq_along(rEVD)) { + rEVD[i] <- max(rnorm(100)) +} +set.seed(NULL) + +hist(rEVD, breaks = 20, col = "orchid") +# Note the long tail on the right! + +qqnorm(rEVD) +qqline(rEVD, col = "orchid") # Definitely not "normal"! + + +# == 3.2 qqplot() ========================================================== + +# qqplot() works like qqnorm(), except that we compare two arbitrary +# distribtutions, rather than one distribution against the normal distribution +# as we did before. Sample against sample. + +x <- seq(0, 4, length.out = 100) + +dl <- dlnorm(x) # log-normal distribution +dg <- dgamma(x, shape=1.5) # gamma distribution + +plot(dl, type="l") +points(dg, type="l", col = "maroon") + +qqplot(dl, dg) # clearly not equal + + +# = 4 Quantifying the difference ========================================== + +# Quantile-quantile plots give us a visual estimate, but how do we quantify the +# difference between distributions? Let's compare two types of extreme-value +# distributions, a lognormal distribution with the same distribution that is +# slightly shifted, and three gamma distributions with three different shape +# parameters. Let's define and visualize the distributions first, to see what +# we are comparing. + +x <- seq(0, 4, length.out = 100) + +set.seed(112358) +dl1 <- dlnorm(x) # log-normal distribution +dl2 <- dlnorm(x - 0.25) # log-normal distribution, shifted right (a bit) +dg1.2 <- dgamma(x, shape=1.2) # three gamma distributions with... +dg1.5 <- dgamma(x, shape=1.5) # ...wider, and wider... +dg1.9 <- dgamma(x, shape=1.9) # ...peak +set.seed(NULL) + +myCols <- c("black", "grey", "maroon", "turquoise", "steelblue") + +plot(dl1, type="l", lwd=2) # visualize the distributions +points(dl2, type="l", col = myCols[2]) +points(dg1.2, type="l", col = myCols[3]) +points(dg1.5, type="l", col = myCols[4]) +points(dg1.9, type="l", col = myCols[5]) +legend("topright", + legend = c("dl1", "dl2", "dg1.2", "dg1.5", "dg1.9"), + lty = 1, + lwd = c(2, 1, 1, 1, 1), + col = myCols, + bty = "n") + + +# == 4.1 Chi2 test for discrete distributions ============================== + +# The chi2 test can be used to compare discrete distributions - even though +# it is not ideal for this purpose. +# (https://stats.stackexchange.com/questions/113692) +# +# Let's draw 100 random variables according to our target distributions +N <- 100 +set.seed(112358) +rL1 <- rlnorm(N) # log-normal distribution +rL2 <- rlnorm(N, meanlog = 0.25) # log-normal distribution, shifted right +rG1.2 <- rgamma(N, shape=1.2) # three gamma distributions with... +rG1.5 <- rgamma(N, shape=1.5) # ...wider, and wider... +rG1.9 <- rgamma(N, shape=1.9) # ...peak +set.seed(NULL) + +maxX <- max(c(rL1, rL2, rG1.2, rG1.5, rG1.9)) + +myBreaks <- seq(0, 5, length.out = 10) # 9 intervals from 0 to 5... +myBreaks <- c(myBreaks, maxX) # ... and one that contains the outliers + +# It's easy to plot a histogram of one set of random deviates... +hist(rG1.5, breaks = myBreaks, col = myCols[4]) + +# ... but basic R has no inbuilt function to stack histogram bars side-by-side. +# We use the multhist() function in the plotrix package: check out the +# package information - plotrix has _many_ useful utilities to enhance +# plots or produce informative visualizations. + +if (! requireNamespace("plotrix", quietly = TRUE)) { + install.packages("plotrix") +} + +# Package information: +# library(help = plotrix) # basic information +# browseVignettes("plotrix") # available vignettes +# data(package = "plotrix") # available datasets + + +h <- plotrix::multhist(list(rL1, rL2, rG1.2, rG1.5, rG1.9 ), + breaks = myBreaks, + col = myCols) +legend("topright", + legend = c("rL1", "rL2", "rG1.2", "rG1.5", "rG1.9"), + pch=15, + col = myCols, + bty="n") + +# We have assigned the output of multihist to the variable h, which now +# contains the densities, midpoints, breaks etc. of the histogram ... +# as well as the matrix of counts: +h[[2]] + +# But using hist() or multhist() for binning is a bit of a hack - even though +# it works, of course. The "real" R function to bin data is cut(). cut() +# sorts the values of a vector into bins, and returns the bin-labels as +# integers. + +x <- cut(rL1, breaks = myBreaks, labels = FALSE) +table(x) + +countsL1 <- table(cut(rL1 , breaks = myBreaks, labels = FALSE)) +countsL2 <- table(cut(rL2 , breaks = myBreaks, labels = FALSE)) +countsG1.2 <- table(cut(rG1.2, breaks = myBreaks, labels = FALSE)) +countsG1.5 <- table(cut(rG1.5, breaks = myBreaks, labels = FALSE)) +countsG1.9 <- table(cut(rG1.9, breaks = myBreaks, labels = FALSE)) + + +chisq.test(countsL1, countsL2) + +# Note that this use of the chi2 test does not have very much power, since it +# does not assume the values for the bins are ordered, but takes them to +# be independent. Also, chisq.test() complains about the Chi-squared +# approximation to be possibly incorrect because some of the counts are small. +# In this case, rather than rely on the in-built chi-square table, we can do +# an explicit simulation to estimate the p-value for the null hypothesis. +# +chisq.test(countsL1, countsL2, simulate.p.value = TRUE, B = 10000) + +# Note that the probability that the samples came from the same distribution is +# quite high. We don't seem to be able to distinguish l1 and l2 with the chi2 +# test. + +# Let's calculate this for the other distribution too: + +chisq.test(countsL1, countsG1.2, simulate.p.value = TRUE, B = 10000) +chisq.test(countsL1, countsG1.5, simulate.p.value = TRUE, B = 10000) +chisq.test(countsL1, countsG1.9, simulate.p.value = TRUE, B = 10000) + +# As a result, we would conclude that none of these distributions are +# significantly different. + +# == 4.2 Kullback-Leibler divergence ======================================= + +# For discrete probability distributions, there is a much better statistic, the +# Kullback-Leibler divergence (or relative entropy). It is based in information +# theory, and evaluates how different the matched pairs of outcome categories +# are. Its inputs are the probability mass functions (p.m.f.) of the two +# functions to be compared. A probability mass function is the probability of +# every outcome the process can have. Kullback-Leibler divergence therefore can +# be applied to discrete distributions. But we need to talk a bit about +# converting counts to p.m.f.'s. + +# === 4.2.1 An example from tossing dice + +# The p.m.f of an honest die is (1:1/6, 2:1/6, 3:1/6, 4:1/6, 5:1/6, 6:1/6). But +# there is an issue when we convert sampled counts to frequencies, and estimate +# probabilities with these frequencies. The problem is: by chance we might not +# have observed a particular outcome! Consider this example: + +set.seed(47) +N <- 20 +(counts <- table(sample(1:6, N, replace = TRUE))) +set.seed(NULL) + +# We have not observed a "2"! +# +# Now, if we convert the counts to frequencies, and assume these to be +# probabilities, we get an observed p.m.f: +pmf <- numeric(6) +for (i in seq_along(counts)) { + outcome <- as.integer(names(counts)[i]) + pmf[outcome] <- counts[i]/N +} +names(pmf) <- 1:6 +pmf + +# This means we assign a probability of 0 to the outcome "2" - because we +# haven't observed it. But how do we compare it then? What does it mean when we +# should have 1/6 of "2"s but we have none whatsoever? Taken at face value it +# means we are comparing apples to oranges - essentially a five-faced die with a +# six-faced die - and therefore divergence is infinitely large. Obviously, that +# was just a problem caused by our limited sampling, but the question remains: +# how do we account for missing data? There are several solutions, for example, +# for ordered data one could substitute the average values of the two bracketing +# outcomes. But a simple and quite robust solution is to add "pseudocounts". +# This is called adding a Laplace prior, or a Jeffreys prior: in our case, +# simply add 0.5 to every category. + +# pmf of an honest die +pmfHD <- rep(1/6, 6) +names(pmfHD) <- 1:6 +pmfHD + +# pmf, estimated from our sampled counts with and without pseudocounts + +pmfPC <- numeric(6) + 0.5 +for (i in seq_along(counts)) { + outcome <- as.integer(names(counts)[i]) + pmfPC[outcome] <- counts[i] + pmfPC[outcome] +} +pmfPC <- pmfPC / sum(pmfPC) +names(pmfPC) <- 1:6 +pmf # before +pmfPC # after + +# The definition of a function that takes samples and returns a pmf +# with pseudocounts is straightforward, but requires a bit of juggling +# the observed values into the right slots. Here's what this can look like: + +pmfPC <- function(cts, nam) { + # Convert counts to a p.m.f, adding a pseudocount of 0.5 to all categories + # of outcomes (Jeffreys prior). + # Parameters: + # cts num raw counts + # nam names of the categories, converted to char + # Value a probability mass function + + nam <- as.character(nam) + if (!all(names(cts) %in% nam)) { + stop("PANIC: names in \"cts\" do not match \"nam\"!") + } + pmf <- numeric(length(nam)) + names(pmf) <- nam + pmf[names(cts)] <- cts[names(cts)] + pmf <- pmf + 0.5 # add pseudocounts + return(pmf/sum(pmf)) +} + + +# The definition of the Kullback-Leibler divergence itself is quite simple +# actually: for two distributions, p and q it is sum(p * log( p / q)) + +KLdiv <- function(p, q) { + # p and q are two pmfs of discrete probability distributions + # with the same outcomes, which are nowhere 0. + # Value: Kullback-Leibler divergence sum(p * log( p / q))). + + if (length(p) != length(q)) { + stop("PANIC: input vector lengths differ!") + } + if (any(c((p == 0), (q == 0)))) { + stop("PANIC: 0's found in input vectors!") + } + + return(sum(p * log( p / q ))) +} + +# Now we can calculate KL-divergences for our six-faced die example: + +KLdiv(rep(1/6, 6), pmfPC(counts, 1:6)) # p.m.f. of an honest die vs. our + # actual counts + +# Is that a lot? Let's look at the distribution of KL-divergences in our +# six-sided die scenario: p.m.f. of 20 samples each versus the theoretical +# p.m.f. + +N <- 1000 +nSample <- 20 +divs <- numeric(N) +for (i in 1:N) { + x <- table(sample(1:6, nSample, replace = TRUE)) + divs[i] <- KLdiv(rep(1/6, 6), pmfPC(x, 1:6)) +} + +hist(divs, + col = "whitesmoke", + xlab = "Kullback-Leibler divergence", + main = sprintf("%d samples of honest die", nSample)) +abline(v = KLdiv(rep(1/6, 6), pmfPC(counts, 1:6)), col="firebrick") + +# We see that our example sample (KL-divergence marked with the red line) is +# somewhat but not drastically atypical. + + +# === 4.2.2 An example from lognormal distributions + +# We had compared a set of lognormal and gamma distributions above, now we +# can use KL-divergence to quantify their similarity: + +pmfL1 <- pmfPC(countsL1, nam = 1:10) +pmfL2 <- pmfPC(countsL2, nam = 1:10) +KLdiv(pmfL1, pmfL2) # 0.1087 + +# To evaluate what this number means, we can run a simple simulation: we create +# random samples according to the rL1 distribution, calculate the Kullback +# Leibler divergence with countsL1, and compare the distribution we get with the +# value we observed as the difference with discL2. Essentially, this tells us +# the probability that countsL2 is actually a sample from the L1 function. +# Here we go: + +N <- 1000 +divs <- numeric(N) + +set.seed(31416) +for (i in 1:N) { + x <- rlnorm(100) # get random samples from our reference distributions + y <- table(cut(x, breaks = myBreaks, labels = FALSE)) # tabulate counts + q <- pmfPC(y, nam = 1:10) # convert to p.m.f. with pseudocounts + divs[i] <- KLdiv(pmfL1, q) # calculate Kullback-Leibler divergence +} +set.seed(NULL) + +hist(divs, + col = "thistle", + xlab = "Kullback-Leibler divergence", + main = sprintf("Samples from shifted lnorm()")) +abline(v = KLdiv(pmfL1, pmfL2), col="firebrick") + +# How many KL-divergences were less than the difference we observed? +sum(divs < KLdiv(pmfL1, pmfL2)) # 933 + +# Therefore the empirical p-value that the samples came from the same +# distribution is only 100 * ((N - 933) + 1) / (N + 1) (%) ... 6.8%. You see +# that this gives a much more powerful statistical approach than the chi2 test +# we used above. + + +# == 4.3 Continuous distributions: Kolmogorov-Smirnov test ================= + +# The Kolmogorov-Smirnov (KS) test is meant for continuous distributions, i.e. +# the probability it calculates assumes that the function values are all +# different. In the case of random samples, that is a reasonable assumption. KS +# is a two-sample goodness of fit test, i.e. it has a null-hypothesis that the +# samples were taken from the same (unknown) distribution, and then asks whether +# this is likely, given the actual values. It is sensitive both to differences +# in location (position of the mean), and differences in shape. R has the +# ks.test() function to calculate it. + +ks.test(dl1, dl2) # vs. shifted log-normal. +ks.test(dl1, dg1.2) # vs. the three gamma distributions +ks.test(dl1, dg1.5) +ks.test(dl1, dg1.9) +ks.test(dg1.5, dg1.9) # the two last gammas against each other + +# (The warnings about the presence of ties comes from the 0's in our function +# values). The p-value that these distributions are samples of the same +# probability distribution gets progressively smaller. + + + +# [END] diff --git a/FND-STA-Significance.R b/FND-STA-Significance.R index d86dba9..3848e9b 100644 --- a/FND-STA-Significance.R +++ b/FND-STA-Significance.R @@ -1,351 +1,351 @@ -# tocID <- "FND-STA-Significance.R" -# -# -# Purpose: A Bioinformatics Course: -# R code accompanying the FND-STA-Significance unit. -# -# Version: 1.3 -# -# Date: 2017-09 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.3 2020 Maintenance. Add sample solution. -# 1.2 Update set.seed() usage -# 1.1 Corrected treatment of empirical p-value -# 1.0 First contents -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------------------------ -#TOC> 1 Significance and p-value 49 -#TOC> 1.1 Significance levels 60 -#TOC> 1.2 probability and p-value 77 -#TOC> 1.2.1 p-value illustrated 109 -#TOC> 2 One- or two-sided 165 -#TOC> 3 Significance by integration 209 -#TOC> 4 Significance by simulation or permutation 215 -#TOC> 5 Final tasks 327 -#TOC> 6 Sample solutions 336 -#TOC> 6.1 338 -#TOC> 6.2 342 -#TOC> 6.3 346 -#TOC> -#TOC> ========================================================================== - - -# = 1 Significance and p-value ============================================ - -# The idea of the probability of an event has a precise mathematical -# interpretation, but how is it useful to know the probability? Usually we are -# interested in whether we should accept or reject a hypothesis based on the -# observations we have. A rational way to do this is to say: if the probability -# of observing the data is very small under the null-hypothesis, then we will -# assume the observation is due to something other than the null-hypothesis. But -# what do we mean by the "probability of our observation"? And what is "very -# small"? - -# == 1.1 Significance levels =============================================== - -# A "very small" probability is purely a matter of convention - a cultural -# convention. In the biomedical field we usually call probabilities of less then -# 0.05 (5%) small enough to reject the null-hypothesis. Thus we call -# observations with a probability of less than 0.05 "significant" and if we want -# to highlight this in text or in a graph, we often mark them with an asterisk -# (*). Also we often call observations with a probability of less than 0.01 -# "highly significant" and mark them with two asterisks (**). But there is no -# special significance in these numbers, the cutoff point for significance could -# also be 0.0498631, or 0.03, or 1/(pi^3). 0.05 is just the value that the -# British statistician Ronald Fisher happened to propose for this purpose in -# 1925. Incidentally, Fisher later recommended to use different cutoffs for -# different purposes (cf. -# https://en.wikipedia.org/wiki/Statistical_significance). - - -# == 1.2 probability and p-value =========================================== - -# But what do we even mean by the probability of an observation? -# Assume I am drawing samples from a normal distribution with a mean of 0 and a -# standard deviation of 1. The sample I get is ... - -set.seed(sqrt(5)) -x <- rnorm(1) -set.seed(NULL) - -print(x, digits = 22) -# [1] -0.8969145466249813791748 - -# So what's the probability of that number? Obviously, the probability of -# getting exactly this number is very, very, very small. But also obviously, -# this does not mean that observing this number is in any way significant - we -# always observe some number. That's not what we mean in this case. There are -# several implicit assumptions when we speak of the probability of an -# observation: - -# 1: the observation can be compared to a probability distribution; -# 2: that distribution can be integrated between any specific value -# and its upper and lower bounds (or +- infinity). - -# Then what we really mean by the probability of an observation in the context -# of that distribution is: the probability of observing that value, or a value -# more extreme than the one we have. We call this the p-value. Note that we are -# not talking about an individual number anymore, we are talking about the area -# under the curve between our observation and the upper (or lower) bound of the -# curve, as a fraction of the whole. - - -# === 1.2.1 p-value illustrated - -# Let's illustrate. First we draw a million random values from our -# standard, normal distribution: - -N <- 1e6 # one million -set.seed(112358) # set RNG seed for repeatable randomness -r <- rnorm(N) # N values from a normal distribution -set.seed(NULL) # reset the RNG - -# Let's see what the distribution looks like: - -(h <- hist(r)) - -# The histogram details are now available in the list h - e.g. h$counts - -# Where is the value we have drawn previously? -abline(v = x, col = "#EE0000") - -# How many values are smaller? -sum(r < x) - -# Let's color the bars: -# first, make a vector of red and green colors for the bars with breaks -# smaller and larger then x, white for the bar that contains x ... -hCol <- rep("#EE000044", sum(h$breaks < x) - 1) -hCol <- c(hCol, "#FFFFFFFF") -hCol <- c(hCol, rep("#00EE0044", sum(h$breaks > x) - 1)) -# ... then plot the histogram, with colored bars ... -hist(r, col = hCol) -# ... add two colored rectangles into the white bar ... -idx <- sum(h$breaks < x) -xMin <- h$breaks[idx] -xMax <- h$breaks[idx + 1] -y <- h$counts[idx] -rect(xMin, 0, x, y, col = "#EE000044", border = TRUE) -rect(x, 0, xMax, y, col = "#00EE0044", border = TRUE) -# ... and a red line for our observation. -abline(v = x, col = "#EE0000", lwd = 2) - -# The p-value of our observation is the red area as a fraction of the -# whole histogram (red + green). - - -# Task: -# Explain how the expression sum(r < x) works to give us a count of values -# with the property we are looking for. E.g., examine -4:4 < x - -# Task: -# Write an expression to estimate the probability that a value -# drawn from the vector r is less-or-equal to x. The result you get -# will depend on the exact values that went into the vector r but it should -# be close to 0.185 That expression is the p-value associated with x. -# (Sample solution 6.1) - - -# = 2 One- or two-sided =================================================== - -# The shape of our histogram confirms that the rnorm() function has returned -# values that appear distributed according to a normal distribution. In a normal -# distribution, readily available tables tell us that 5% of the values (i.e. our -# significance level) lie 1.96 (or approximately 2) standard deviations away -# from the mean. Is this the case here? How many values in our vector r are -# larger than 1.96? - -sum(r > 1.96) -# [1] 24589 - -# Wait - that's about 2.5% of 1,000,000, not 5% as expected. Why? - -# The answer is: we have to be careful with two-sided distributions. 2 standard -# deviations away from the mean means either larger or smaller than 1.96 . This -# can give rise to errors. If we are simply are interested in outliers, no -# matter larger or smaller, then the 1.96 SD cutoff for significance is correct. -# But if we are specifically interested in, say, larger values, because a -# smaller value is not meaningful, then the significance cutoff, expressed as -# standard deviations, is relaxed. We can use the quantile function to see what -# the cutoff values are: - -quantile(r) -quantile(r, probs = c(0.025, 0.975)) # for the symmetric 2.5% boundaries -# close to ± 1.96, as expected -quantile(r, probs = 0.95) # for the single 5% boundary -# close to 1.64 . Check counts to confirm: -sum(r > quantile(r, probs = 0.95)) -# [1] 50000 -# which is 5%, as expected. - -# Task: -# Use abline() to add the p = 0.05 boundary for smaller values to the histogram. -# (Sample solution 6.2) - -# To summarize: when we evaluate the significance of an event, we divide a -# probability distribution into two parts at the point where the event was -# observed. We then ask whether the integral over the more extreme part is less -# or more than 5% of the whole. If it is less, we deem the event to be -# significant. -# - - -# = 3 Significance by integration ========================================= - -# If the underlying probability distribution can be analytically or numerically -# integrated, the siginificance of an observation can be directly computed. - - -# = 4 Significance by simulation or permutation =========================== - -# But whether the integration is correct, or relies on assumptions that may not -# be warranted for biological data, can be a highly technical question. -# Fortunately, we can often simply run a simulation, a random resampling, or a -# permutation and then count the number of outcomes, just as we did with our -# rnorm() samples. We call this an empirical p-value. (Actually, the "empirical -# p-value" is defined as (Nobs + 1) / (N + 1). ) - -# Here is an example. Assume you have a protein sequence and -# you speculate that positively charged residues are close to negatively charged -# residues to balance charge locally. A statistic that would capture this is the -# mean minimum distance between all D,E residues and the closest R,K,H -# residue. Let's compute this for the sequence of yeast Mbp1. - -MBP1 <- paste0("MSNQIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRILEKEVLK", - "ETHEKVQGGFGKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASPPPAPKHHHA", - "SKVDRKKAIRSASTSAIMETKRNNKKAEENQFQSSKILGNPTAAPRKRGRPVGSTRGSRR", - "KLGVNLQRSQSDMGFPRPAIPNSSISTTQLPSIRSTMGPQSPTLGILEEERHDSRQQQPQ", - "QNNSAQFKEIDLEDGLSSDVEPSQQLQQVFNQNTGFVPQQQSSLIQTQQTESMATSVSSS", - "PSLPTSPGDFADSNPFEERFPGGGTSPIISMIPRYPVTSRPQTSDINDKVNKYLSKLVDY", - "FISNEMKSNKSLPQVLLHPPPHSAPYIDAPIDPELHTAFHWACSMGNLPIAEALYEAGTS", - "IRSTNSQGQTPLMRSSLFHNSYTRRTFPRIFQLLHETVFDIDSQSQTVIHHIVKRKSTTP", - "SAVYYLDVVLSKIKDFSPQYRIELLLNTQDKNGDTALHIASKNGDVVFFNTLVKMGALTT", - "ISNKEGLTANEIMNQQYEQMMIQNGTNQHVNSSNTDLNIHVNTNNIETKNDVNSMVIMSP", - "VSPSDYITYPSQIATNISRNIPNVVNSMKQMASIYNDLHEQHDNEIKSLQKTLKSISKTK", - "IQVSLKTLEVLKESSKDENGEAQTNDDFEILSRLQEQNTKKLRKRLIRYKRLIKQKLEYR", - "QTVLLNKLIEDETQATTNNTVEKDNNTLERLELAQELTMLQLQRKNKLSSLVKKFEDNAK", - "IHKYRRIIREGTEMNIEEVDSSLDVILQTLIANNNKNKGAEQIITISNANSHA") - -# first we split this string into individual characters: -v <- unlist(strsplit(MBP1, "")) - -# and find the positions of our charged residues - -ED <- grep("[ED]", v) -RKH <- grep("[RKH]", v) - -sep <- numeric(length(ED)) # this vector will hold the distances -for (i in seq_along(ED)) { - sep[i] <- min(abs(RKH - ED[i])) -} - -# Task: read and explain this bit of code - -# Now that sep is computed, what does it look like? - -table(sep) # these are the minimum distances -# 24 of D,E residues are adjacent to R,K,H; -# the longest separation is 28 residues. - -# What is the mean separation? -mean(sep) - -# The value is 4.1 . Is this significant? Honestly, I would be hard pressed -# to solve this analytically. But by permutation it's soooo easy. - -# First, we combine what we have done above into a function: - -chSep <- function(v) { - # computes the mean minimum separation of oppositely charged residues - # Parameter: v (char) a vector of amino acids in the one-letter code - # Value: msep (numeric) mean minimum separation - - ED <- grep("[EDed]", v) - RKH <- grep("[RKHrkh]", v) - - sep <- numeric(length(ED)) - for (i in seq_along(ED)) { - sep[i] <- min(abs(RKH - ED[i])) - } - return(mean(sep)) -} - -# Execute the function to define it. - -# Confirm that the function gives the same result as the number we -# calculated above: -chSep(v) - -# Now we can produce a random permutation of v, and recalculate - -set.seed(pi) # set RNG seed for repeatable randomness -w <- sample(v, length(v)) # This shuffles the vector v. Memorize this - # code paradigm. It is very useful. -set.seed(NULL) # reset the RNG - - - -chSep(w) -# 3.773 ... that's actually less than what we had before. - -# Let's do this 10000 times and record the results (takes a few seconds): - -N <- 10000 -chs <- numeric(N) -for (i in 1:N) { - chs[i] <- chSep(sample(v, length(v))) # charge -} - -hist(chs, breaks = 50) -abline(v = chSep(v), col = "#EE0000") - -# Contrary to our expectations, the actual observed mean minimum charge -# separation seems to be larger than what we observe in randomly permuted -# sequences. But is this significant? Your task to find out. - -# Task: -# Calculate the empirical p-value for chsep(v) -# (Sample solution 6.3) - - -# = 5 Final tasks ========================================================= - -# From chs, compute the empirical p-value of a mean minimum charge separation to -# be larger or equal to the value observed for the yeast MBP1 sequence. Note -# the result in your journal. Is it significant? Also note the result of -# the following expression for validation: -seal(sum(chs)) - - -# = 6 Sample solutions ==================================================== - -# == 6.1 ================================================================== -# -sum(r <= x) / length(r) - -# == 6.2 ================================================================== -# -abline(v = quantile(r, probs = c(0.05))) - -# == 6.3 ================================================================== -# -( x <- (sum(chs >= chSep(v)) + 1) / (length(chs) + 1) ) - - -# [END] +# tocID <- "FND-STA-Significance.R" +# +# +# Purpose: A Bioinformatics Course: +# R code accompanying the FND-STA-Significance unit. +# +# Version: 1.3 +# +# Date: 2017-09 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.3 2020 Maintenance. Add sample solution. +# 1.2 Update set.seed() usage +# 1.1 Corrected treatment of empirical p-value +# 1.0 First contents +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------------------------ +#TOC> 1 Significance and p-value 49 +#TOC> 1.1 Significance levels 60 +#TOC> 1.2 probability and p-value 77 +#TOC> 1.2.1 p-value illustrated 109 +#TOC> 2 One- or two-sided 165 +#TOC> 3 Significance by integration 209 +#TOC> 4 Significance by simulation or permutation 215 +#TOC> 5 Final tasks 327 +#TOC> 6 Sample solutions 336 +#TOC> 6.1 338 +#TOC> 6.2 342 +#TOC> 6.3 346 +#TOC> +#TOC> ========================================================================== + + +# = 1 Significance and p-value ============================================ + +# The idea of the probability of an event has a precise mathematical +# interpretation, but how is it useful to know the probability? Usually we are +# interested in whether we should accept or reject a hypothesis based on the +# observations we have. A rational way to do this is to say: if the probability +# of observing the data is very small under the null-hypothesis, then we will +# assume the observation is due to something other than the null-hypothesis. But +# what do we mean by the "probability of our observation"? And what is "very +# small"? + +# == 1.1 Significance levels =============================================== + +# A "very small" probability is purely a matter of convention - a cultural +# convention. In the biomedical field we usually call probabilities of less then +# 0.05 (5%) small enough to reject the null-hypothesis. Thus we call +# observations with a probability of less than 0.05 "significant" and if we want +# to highlight this in text or in a graph, we often mark them with an asterisk +# (*). Also we often call observations with a probability of less than 0.01 +# "highly significant" and mark them with two asterisks (**). But there is no +# special significance in these numbers, the cutoff point for significance could +# also be 0.0498631, or 0.03, or 1/(pi^3). 0.05 is just the value that the +# British statistician Ronald Fisher happened to propose for this purpose in +# 1925. Incidentally, Fisher later recommended to use different cutoffs for +# different purposes (cf. +# https://en.wikipedia.org/wiki/Statistical_significance). + + +# == 1.2 probability and p-value =========================================== + +# But what do we even mean by the probability of an observation? +# Assume I am drawing samples from a normal distribution with a mean of 0 and a +# standard deviation of 1. The sample I get is ... + +set.seed(sqrt(5)) +x <- rnorm(1) +set.seed(NULL) + +print(x, digits = 22) +# [1] -0.8969145466249813791748 + +# So what's the probability of that number? Obviously, the probability of +# getting exactly this number is very, very, very small. But also obviously, +# this does not mean that observing this number is in any way significant - we +# always observe some number. That's not what we mean in this case. There are +# several implicit assumptions when we speak of the probability of an +# observation: + +# 1: the observation can be compared to a probability distribution; +# 2: that distribution can be integrated between any specific value +# and its upper and lower bounds (or +- infinity). + +# Then what we really mean by the probability of an observation in the context +# of that distribution is: the probability of observing that value, or a value +# more extreme than the one we have. We call this the p-value. Note that we are +# not talking about an individual number anymore, we are talking about the area +# under the curve between our observation and the upper (or lower) bound of the +# curve, as a fraction of the whole. + + +# === 1.2.1 p-value illustrated + +# Let's illustrate. First we draw a million random values from our +# standard, normal distribution: + +N <- 1e6 # one million +set.seed(112358) # set RNG seed for repeatable randomness +r <- rnorm(N) # N values from a normal distribution +set.seed(NULL) # reset the RNG + +# Let's see what the distribution looks like: + +(h <- hist(r)) + +# The histogram details are now available in the list h - e.g. h$counts + +# Where is the value we have drawn previously? +abline(v = x, col = "#EE0000") + +# How many values are smaller? +sum(r < x) + +# Let's color the bars: +# first, make a vector of red and green colors for the bars with breaks +# smaller and larger then x, white for the bar that contains x ... +hCol <- rep("#EE000044", sum(h$breaks < x) - 1) +hCol <- c(hCol, "#FFFFFFFF") +hCol <- c(hCol, rep("#00EE0044", sum(h$breaks > x) - 1)) +# ... then plot the histogram, with colored bars ... +hist(r, col = hCol) +# ... add two colored rectangles into the white bar ... +idx <- sum(h$breaks < x) +xMin <- h$breaks[idx] +xMax <- h$breaks[idx + 1] +y <- h$counts[idx] +rect(xMin, 0, x, y, col = "#EE000044", border = TRUE) +rect(x, 0, xMax, y, col = "#00EE0044", border = TRUE) +# ... and a red line for our observation. +abline(v = x, col = "#EE0000", lwd = 2) + +# The p-value of our observation is the red area as a fraction of the +# whole histogram (red + green). + + +# Task: +# Explain how the expression sum(r < x) works to give us a count of values +# with the property we are looking for. E.g., examine -4:4 < x + +# Task: +# Write an expression to estimate the probability that a value +# drawn from the vector r is less-or-equal to x. The result you get +# will depend on the exact values that went into the vector r but it should +# be close to 0.185 That expression is the p-value associated with x. +# (Sample solution 6.1) + + +# = 2 One- or two-sided =================================================== + +# The shape of our histogram confirms that the rnorm() function has returned +# values that appear distributed according to a normal distribution. In a normal +# distribution, readily available tables tell us that 5% of the values (i.e. our +# significance level) lie 1.96 (or approximately 2) standard deviations away +# from the mean. Is this the case here? How many values in our vector r are +# larger than 1.96? + +sum(r > 1.96) +# [1] 24589 + +# Wait - that's about 2.5% of 1,000,000, not 5% as expected. Why? + +# The answer is: we have to be careful with two-sided distributions. 2 standard +# deviations away from the mean means either larger or smaller than 1.96 . This +# can give rise to errors. If we are simply are interested in outliers, no +# matter larger or smaller, then the 1.96 SD cutoff for significance is correct. +# But if we are specifically interested in, say, larger values, because a +# smaller value is not meaningful, then the significance cutoff, expressed as +# standard deviations, is relaxed. We can use the quantile function to see what +# the cutoff values are: + +quantile(r) +quantile(r, probs = c(0.025, 0.975)) # for the symmetric 2.5% boundaries +# close to ± 1.96, as expected +quantile(r, probs = 0.95) # for the single 5% boundary +# close to 1.64 . Check counts to confirm: +sum(r > quantile(r, probs = 0.95)) +# [1] 50000 +# which is 5%, as expected. + +# Task: +# Use abline() to add the p = 0.05 boundary for smaller values to the histogram. +# (Sample solution 6.2) + +# To summarize: when we evaluate the significance of an event, we divide a +# probability distribution into two parts at the point where the event was +# observed. We then ask whether the integral over the more extreme part is less +# or more than 5% of the whole. If it is less, we deem the event to be +# significant. +# + + +# = 3 Significance by integration ========================================= + +# If the underlying probability distribution can be analytically or numerically +# integrated, the siginificance of an observation can be directly computed. + + +# = 4 Significance by simulation or permutation =========================== + +# But whether the integration is correct, or relies on assumptions that may not +# be warranted for biological data, can be a highly technical question. +# Fortunately, we can often simply run a simulation, a random resampling, or a +# permutation and then count the number of outcomes, just as we did with our +# rnorm() samples. We call this an empirical p-value. (Actually, the "empirical +# p-value" is defined as (Nobs + 1) / (N + 1). ) + +# Here is an example. Assume you have a protein sequence and +# you speculate that positively charged residues are close to negatively charged +# residues to balance charge locally. A statistic that would capture this is the +# mean minimum distance between all D,E residues and the closest R,K,H +# residue. Let's compute this for the sequence of yeast Mbp1. + +MBP1 <- paste0("MSNQIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRILEKEVLK", + "ETHEKVQGGFGKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASPPPAPKHHHA", + "SKVDRKKAIRSASTSAIMETKRNNKKAEENQFQSSKILGNPTAAPRKRGRPVGSTRGSRR", + "KLGVNLQRSQSDMGFPRPAIPNSSISTTQLPSIRSTMGPQSPTLGILEEERHDSRQQQPQ", + "QNNSAQFKEIDLEDGLSSDVEPSQQLQQVFNQNTGFVPQQQSSLIQTQQTESMATSVSSS", + "PSLPTSPGDFADSNPFEERFPGGGTSPIISMIPRYPVTSRPQTSDINDKVNKYLSKLVDY", + "FISNEMKSNKSLPQVLLHPPPHSAPYIDAPIDPELHTAFHWACSMGNLPIAEALYEAGTS", + "IRSTNSQGQTPLMRSSLFHNSYTRRTFPRIFQLLHETVFDIDSQSQTVIHHIVKRKSTTP", + "SAVYYLDVVLSKIKDFSPQYRIELLLNTQDKNGDTALHIASKNGDVVFFNTLVKMGALTT", + "ISNKEGLTANEIMNQQYEQMMIQNGTNQHVNSSNTDLNIHVNTNNIETKNDVNSMVIMSP", + "VSPSDYITYPSQIATNISRNIPNVVNSMKQMASIYNDLHEQHDNEIKSLQKTLKSISKTK", + "IQVSLKTLEVLKESSKDENGEAQTNDDFEILSRLQEQNTKKLRKRLIRYKRLIKQKLEYR", + "QTVLLNKLIEDETQATTNNTVEKDNNTLERLELAQELTMLQLQRKNKLSSLVKKFEDNAK", + "IHKYRRIIREGTEMNIEEVDSSLDVILQTLIANNNKNKGAEQIITISNANSHA") + +# first we split this string into individual characters: +v <- unlist(strsplit(MBP1, "")) + +# and find the positions of our charged residues + +ED <- grep("[ED]", v) +RKH <- grep("[RKH]", v) + +sep <- numeric(length(ED)) # this vector will hold the distances +for (i in seq_along(ED)) { + sep[i] <- min(abs(RKH - ED[i])) +} + +# Task: read and explain this bit of code + +# Now that sep is computed, what does it look like? + +table(sep) # these are the minimum distances +# 24 of D,E residues are adjacent to R,K,H; +# the longest separation is 28 residues. + +# What is the mean separation? +mean(sep) + +# The value is 4.1 . Is this significant? Honestly, I would be hard pressed +# to solve this analytically. But by permutation it's soooo easy. + +# First, we combine what we have done above into a function: + +chSep <- function(v) { + # computes the mean minimum separation of oppositely charged residues + # Parameter: v (char) a vector of amino acids in the one-letter code + # Value: msep (numeric) mean minimum separation + + ED <- grep("[EDed]", v) + RKH <- grep("[RKHrkh]", v) + + sep <- numeric(length(ED)) + for (i in seq_along(ED)) { + sep[i] <- min(abs(RKH - ED[i])) + } + return(mean(sep)) +} + +# Execute the function to define it. + +# Confirm that the function gives the same result as the number we +# calculated above: +chSep(v) + +# Now we can produce a random permutation of v, and recalculate + +set.seed(pi) # set RNG seed for repeatable randomness +w <- sample(v, length(v)) # This shuffles the vector v. Memorize this + # code paradigm. It is very useful. +set.seed(NULL) # reset the RNG + + + +chSep(w) +# 3.773 ... that's actually less than what we had before. + +# Let's do this 10000 times and record the results (takes a few seconds): + +N <- 10000 +chs <- numeric(N) +for (i in 1:N) { + chs[i] <- chSep(sample(v, length(v))) # charge +} + +hist(chs, breaks = 50) +abline(v = chSep(v), col = "#EE0000") + +# Contrary to our expectations, the actual observed mean minimum charge +# separation seems to be larger than what we observe in randomly permuted +# sequences. But is this significant? Your task to find out. + +# Task: +# Calculate the empirical p-value for chsep(v) +# (Sample solution 6.3) + + +# = 5 Final tasks ========================================================= + +# From chs, compute the empirical p-value of a mean minimum charge separation to +# be larger or equal to the value observed for the yeast MBP1 sequence. Note +# the result in your journal. Is it significant? Also note the result of +# the following expression for validation: +seal(sum(chs)) + + +# = 6 Sample solutions ==================================================== + +# == 6.1 ================================================================== +# +sum(r <= x) / length(r) + +# == 6.2 ================================================================== +# +abline(v = quantile(r, probs = c(0.05))) + +# == 6.3 ================================================================== +# +( x <- (sum(chs >= chSep(v)) + 1) / (length(chs) + 1) ) + + +# [END] diff --git a/README.md b/README.md index dd3087f..6818577 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,3 @@ -# BCH441-WORK-ABC-units - +# BCH441-WORK-ABC-units + This is a fork of the project [ABC-units](https://github.com/hyginn/ABC-units) designed for BCH441. This setup allows changes to be committed here but updates pushed to the original repository can be fetched and pulled to keep up to date. \ No newline at end of file diff --git a/RPR-Biostrings.R b/RPR-Biostrings.R index 0af5c4a..bd614f5 100644 --- a/RPR-Biostrings.R +++ b/RPR-Biostrings.R @@ -1,245 +1,245 @@ -# tocID <- "RPR-Biostrings.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Biostrings unit. -# -# Version: 1.2 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Updates -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout, -# use Biocmanager:: not biocLite() -# 1.0 2017 Revisions -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ----------------------------------------------------------------- -#TOC> 1 The Biostrings:: Package 56 -#TOC> 2 Getting Data into Biostrings:: Objects 88 -#TOC> 3 Working with Biostrings:: Objects 110 -#TOC> 3.1 Properties 127 -#TOC> 3.2 Subsetting 168 -#TOC> 3.3 Operators 180 -#TOC> 3.4 Transformations 187 -#TOC> 4 Getting Data out of Biostrings:: Objects 194 -#TOC> 5 More 203 -#TOC> 5.1 Views 205 -#TOC> 5.2 Iranges 219 -#TOC> 5.3 StringSets 225 -#TOC> -#TOC> ========================================================================== - - -# This is a very brief introduction to the Biostrings:: package, other units will -# be using more of the Biostrings:: functions. - - -# = 1 The Biostrings:: Package ============================================ - - -# First, we install and load the Biostrings:: package from bioconductor (if we -# haven't done so already). - -if (! requireNamespace("BiocManager", quietly = TRUE)) { - install.packages("BiocManager") -} -if (! requireNamespace("Biostrings", quietly = TRUE)) { - BiocManager::install("Biostrings") -} -# Examine the package information: -library(help = Biostrings) # basic information -browseVignettes("Biostrings") # available vignettes -data(package = "Biostrings") # available datasets - - -# At its core, Biostrings:: objects are "classes" of type XString (you can think -# of a "class" in R as a special kind of list), that can take on particular -# flavours for RNA, DNA or amino acid sequence information. - -class(Biostrings::RNAString("AUG")) -class(Biostrings::DNAString("ATG")) -class(Biostrings::AAString("M")) - -# An essential property of Biostrings:: objects is that they only allow letters -# from the applicable IUPAC alphabet: -Biostrings::RNAString("AUG") -Biostrings::DNAString("AUG") # Error! No "U" in IUPAC DNA codes - - -# = 2 Getting Data into Biostrings:: Objects ============================== - - -# Example: read FASTA. Extract sequence. Convert to DNAString object. -rawSeq <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa") -rawSeq <- dbSanitizeSequence(rawSeq) -biosDNAseq <- Biostrings::DNAString(rawSeq) # converts the nucleotide sequence - # into an object of class DNAstring - -# Multi FASTA files can be read directly as a "XStringSet) ... -rawMFAfile <- "./data/S288C_YDL056W_MBP1_coding.fsa" -(biosDNASet <- Biostrings::readDNAStringSet(rawMFAfile)) - -# ... and if you subset one sequence from the set, you get an XString object -# back again. -(Xseq <- biosDNASet[[1]]) - -biosDNAseq == Xseq # the comparison evaluates to TRUE ... -identical(biosDNAseq, Xseq) # ... and indeed the objects are deemed identical. - - - -# = 3 Working with Biostrings:: Objects =================================== - -# Biostrings:: is a highly engineered package that is tightly integrated into -# the Bioconductor world - unfortunately that brings with it a somewhat -# undesirable level of computational overhead and dependencies. Using the -# package as we normally do - i.e. calling required functions with their -# explicit package prefix is therefore not advisable. There are generics -# that won't be propery dispatched. If you only need a small number of -# functions for a very specific context, you will probably get away with -# Biostrings::() - but even in the demonstration code of this script -# not everything works out of the box. We'll therefore load the library, -# but we'll (redundantly) use the prefix anyway so as to emphasize where -# the functions come from. - -library(Biostrings) - - -# == 3.1 Properties ======================================================== -str(rawSeq) -str(biosDNAseq) - -length(rawSeq) # ... is 1: one string only. To get the number of - # characters in a string, you need nchar(). -length(biosDNAseq) # but the length of a "Bstring" is the number of elements -nchar(rawSeq) -nchar(biosDNAseq) # ... but nchar() works too. - -(uL <- Biostrings::uniqueLetters(biosDNAseq)) - -# Count frequencies - with strings, you would strsplit() into a character -# vector and then use table(). biost -Biostrings::alphabetFrequency(biosDNAseq) - -# letterFrequency() works with a defined alphabet - such as what uniqueLetters() -# returns. -Biostrings::letterFrequency(biosDNAseq, uL) -sum(Biostrings::letterFrequency(biosDNAseq, c("G", "C"))) / - length(biosDNAseq) # GC contents - -Biostrings::dinucleotideFrequency(biosDNAseq) -barplot(sort(Biostrings::dinucleotideFrequency(biosDNAseq)), cex.names = 0.5) - -(triNuc <- Biostrings::trinucleotideFrequency(biosDNAseq)) -barplot(sort(triNuc), col="#4499EE33") -triNuc[triNuc == max(triNuc)] -triNuc[triNuc == min(triNuc)] -max(triNuc) / min(triNuc) # AAA is more than 13 times as frequent as CGT - -# compare to a shuffled sequence: -(triNuc <- Biostrings::trinucleotideFrequency(sample(biosDNAseq))) -barplot(sort(triNuc), col="#EEEE4433", add = TRUE) -max(triNuc) -# Interpret this plot. -(triNuc <- Biostrings::trinucleotideFrequency(sample(biosDNAseq))) -barplot(sort(triNuc), col="#EEEE4433") -max(triNuc) - - -# == 3.2 Subsetting ======================================================== - -# Subsetting any XString object works as expected: -biosDNAseq[4:15] - -# ... well - maybe not expected, because rawSeq[4:15] would not work. - -# Alternatively to the "[" operator, use the subseq() function - especially for -# long sequences. This is far more efficient. -Biostrings::subseq(biosDNAseq, start = 1, end = 30) - - -# == 3.3 Operators ========================================================= - -# RNAstring() and DNAstring() objects compare U and T as equals! - Biostrings::RNAString("AUGUCUAACCAAAUAUACUCAGCGAGAUAU") == - Biostrings::DNAString("ATGTCTAACCAAATATACTCAGCGAGATAT") - - -# == 3.4 Transformations =================================================== - -biosDNAseq[4:15] -Biostrings::reverseComplement(biosDNAseq[4:15]) -Biostrings::translate(biosDNAseq[4:15]) - - -# = 4 Getting Data out of Biostrings:: Objects ============================ - -# If you need a character object, use toString(): - -Biostrings::toString(biosDNAseq[4:15]) - -# saveRDS() and readRDS() works like on all other R objects. - - -# = 5 More ================================================================ - -# == 5.1 Views ============================================================= - -# Biostring "Views" are objects that store multiple substrings of one -# Biostring object. - -(myView <- Biostrings::Views(biosDNAseq, - start = c(1, 19, 37), - end = c(15, 30, 45))) - -# Views are convenient to store feature annotations -names(myView) <- c("Feature-A", "Feature-B", "Feature-C") -cat(sprintf("\n%s\t(%d)\t%s", names(myView), width(myView), myView )) - - -# == 5.2 Iranges =========================================================== - -# Biostrings:: Iranges are like Views with a common start point. These can be -# useful for feature annotations. Instead of start/end you store start/width. - - -# == 5.3 StringSets ======================================================== - -# Biostring "StringSets" store multiple sequences. -# -ompA <- Biostrings::AAString("MKKTAIAIAVALAGFATVAQA") -sample(ompA) # sample can work directly on a Biostring object to shuffle it - -x <- Biostrings::toString(ompA) -for (i in 2:10) { - x[i] <- Biostrings::toString(sample(ompA)) -} -shuffledPeptideSet <- Biostrings::AAStringSet(x) -names(shuffledPeptideSet) <- c("ompA", paste("shuffle.", 1:9, sep="")) -shuffledPeptideSet - -length(shuffledPeptideSet) -Biostrings::width(shuffledPeptideSet) -Biostrings::alphabetFrequency(shuffledPeptideSet) - - -# [END] +# tocID <- "RPR-Biostrings.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Biostrings unit. +# +# Version: 1.2 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Updates +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout, +# use Biocmanager:: not biocLite() +# 1.0 2017 Revisions +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ----------------------------------------------------------------- +#TOC> 1 The Biostrings:: Package 56 +#TOC> 2 Getting Data into Biostrings:: Objects 88 +#TOC> 3 Working with Biostrings:: Objects 110 +#TOC> 3.1 Properties 127 +#TOC> 3.2 Subsetting 168 +#TOC> 3.3 Operators 180 +#TOC> 3.4 Transformations 187 +#TOC> 4 Getting Data out of Biostrings:: Objects 194 +#TOC> 5 More 203 +#TOC> 5.1 Views 205 +#TOC> 5.2 Iranges 219 +#TOC> 5.3 StringSets 225 +#TOC> +#TOC> ========================================================================== + + +# This is a very brief introduction to the Biostrings:: package, other units will +# be using more of the Biostrings:: functions. + + +# = 1 The Biostrings:: Package ============================================ + + +# First, we install and load the Biostrings:: package from bioconductor (if we +# haven't done so already). + +if (! requireNamespace("BiocManager", quietly = TRUE)) { + install.packages("BiocManager") +} +if (! requireNamespace("Biostrings", quietly = TRUE)) { + BiocManager::install("Biostrings") +} +# Examine the package information: +library(help = Biostrings) # basic information +browseVignettes("Biostrings") # available vignettes +data(package = "Biostrings") # available datasets + + +# At its core, Biostrings:: objects are "classes" of type XString (you can think +# of a "class" in R as a special kind of list), that can take on particular +# flavours for RNA, DNA or amino acid sequence information. + +class(Biostrings::RNAString("AUG")) +class(Biostrings::DNAString("ATG")) +class(Biostrings::AAString("M")) + +# An essential property of Biostrings:: objects is that they only allow letters +# from the applicable IUPAC alphabet: +Biostrings::RNAString("AUG") +Biostrings::DNAString("AUG") # Error! No "U" in IUPAC DNA codes + + +# = 2 Getting Data into Biostrings:: Objects ============================== + + +# Example: read FASTA. Extract sequence. Convert to DNAString object. +rawSeq <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa") +rawSeq <- dbSanitizeSequence(rawSeq) +biosDNAseq <- Biostrings::DNAString(rawSeq) # converts the nucleotide sequence + # into an object of class DNAstring + +# Multi FASTA files can be read directly as a "XStringSet) ... +rawMFAfile <- "./data/S288C_YDL056W_MBP1_coding.fsa" +(biosDNASet <- Biostrings::readDNAStringSet(rawMFAfile)) + +# ... and if you subset one sequence from the set, you get an XString object +# back again. +(Xseq <- biosDNASet[[1]]) + +biosDNAseq == Xseq # the comparison evaluates to TRUE ... +identical(biosDNAseq, Xseq) # ... and indeed the objects are deemed identical. + + + +# = 3 Working with Biostrings:: Objects =================================== + +# Biostrings:: is a highly engineered package that is tightly integrated into +# the Bioconductor world - unfortunately that brings with it a somewhat +# undesirable level of computational overhead and dependencies. Using the +# package as we normally do - i.e. calling required functions with their +# explicit package prefix is therefore not advisable. There are generics +# that won't be propery dispatched. If you only need a small number of +# functions for a very specific context, you will probably get away with +# Biostrings::() - but even in the demonstration code of this script +# not everything works out of the box. We'll therefore load the library, +# but we'll (redundantly) use the prefix anyway so as to emphasize where +# the functions come from. + +library(Biostrings) + + +# == 3.1 Properties ======================================================== +str(rawSeq) +str(biosDNAseq) + +length(rawSeq) # ... is 1: one string only. To get the number of + # characters in a string, you need nchar(). +length(biosDNAseq) # but the length of a "Bstring" is the number of elements +nchar(rawSeq) +nchar(biosDNAseq) # ... but nchar() works too. + +(uL <- Biostrings::uniqueLetters(biosDNAseq)) + +# Count frequencies - with strings, you would strsplit() into a character +# vector and then use table(). biost +Biostrings::alphabetFrequency(biosDNAseq) + +# letterFrequency() works with a defined alphabet - such as what uniqueLetters() +# returns. +Biostrings::letterFrequency(biosDNAseq, uL) +sum(Biostrings::letterFrequency(biosDNAseq, c("G", "C"))) / + length(biosDNAseq) # GC contents + +Biostrings::dinucleotideFrequency(biosDNAseq) +barplot(sort(Biostrings::dinucleotideFrequency(biosDNAseq)), cex.names = 0.5) + +(triNuc <- Biostrings::trinucleotideFrequency(biosDNAseq)) +barplot(sort(triNuc), col="#4499EE33") +triNuc[triNuc == max(triNuc)] +triNuc[triNuc == min(triNuc)] +max(triNuc) / min(triNuc) # AAA is more than 13 times as frequent as CGT + +# compare to a shuffled sequence: +(triNuc <- Biostrings::trinucleotideFrequency(sample(biosDNAseq))) +barplot(sort(triNuc), col="#EEEE4433", add = TRUE) +max(triNuc) +# Interpret this plot. +(triNuc <- Biostrings::trinucleotideFrequency(sample(biosDNAseq))) +barplot(sort(triNuc), col="#EEEE4433") +max(triNuc) + + +# == 3.2 Subsetting ======================================================== + +# Subsetting any XString object works as expected: +biosDNAseq[4:15] + +# ... well - maybe not expected, because rawSeq[4:15] would not work. + +# Alternatively to the "[" operator, use the subseq() function - especially for +# long sequences. This is far more efficient. +Biostrings::subseq(biosDNAseq, start = 1, end = 30) + + +# == 3.3 Operators ========================================================= + +# RNAstring() and DNAstring() objects compare U and T as equals! + Biostrings::RNAString("AUGUCUAACCAAAUAUACUCAGCGAGAUAU") == + Biostrings::DNAString("ATGTCTAACCAAATATACTCAGCGAGATAT") + + +# == 3.4 Transformations =================================================== + +biosDNAseq[4:15] +Biostrings::reverseComplement(biosDNAseq[4:15]) +Biostrings::translate(biosDNAseq[4:15]) + + +# = 4 Getting Data out of Biostrings:: Objects ============================ + +# If you need a character object, use toString(): + +Biostrings::toString(biosDNAseq[4:15]) + +# saveRDS() and readRDS() works like on all other R objects. + + +# = 5 More ================================================================ + +# == 5.1 Views ============================================================= + +# Biostring "Views" are objects that store multiple substrings of one +# Biostring object. + +(myView <- Biostrings::Views(biosDNAseq, + start = c(1, 19, 37), + end = c(15, 30, 45))) + +# Views are convenient to store feature annotations +names(myView) <- c("Feature-A", "Feature-B", "Feature-C") +cat(sprintf("\n%s\t(%d)\t%s", names(myView), width(myView), myView )) + + +# == 5.2 Iranges =========================================================== + +# Biostrings:: Iranges are like Views with a common start point. These can be +# useful for feature annotations. Instead of start/end you store start/width. + + +# == 5.3 StringSets ======================================================== + +# Biostring "StringSets" store multiple sequences. +# +ompA <- Biostrings::AAString("MKKTAIAIAVALAGFATVAQA") +sample(ompA) # sample can work directly on a Biostring object to shuffle it + +x <- Biostrings::toString(ompA) +for (i in 2:10) { + x[i] <- Biostrings::toString(sample(ompA)) +} +shuffledPeptideSet <- Biostrings::AAStringSet(x) +names(shuffledPeptideSet) <- c("ompA", paste("shuffle.", 1:9, sep="")) +shuffledPeptideSet + +length(shuffledPeptideSet) +Biostrings::width(shuffledPeptideSet) +Biostrings::alphabetFrequency(shuffledPeptideSet) + + +# [END] diff --git a/RPR-ChimeraX_remote.R b/RPR-ChimeraX_remote.R index 5ee4710..e50648c 100644 --- a/RPR-ChimeraX_remote.R +++ b/RPR-ChimeraX_remote.R @@ -1,165 +1,165 @@ -# tocID <- "RPR-ChimeraX_remote.R" -# -# Purpose: A Bioinformatics Course: -# R code demonstrating remote scripting of ChimeraX. -# -# Version: 1.0.1 -# -# Date: 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.0.1 2021 Minimal updates -# 1.0 First ABC units version -# -# -# TODO: -# %-encode and escape quotes, or just pass-through? -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------------ -#TOC> 1 ChimeraX REMOTE SCRIPTING 41 -#TOC> 1.1 Defining a Port 59 -#TOC> 1.2 Open ChimeraX 81 -#TOC> 2 WORKED EXAMPLE: SUPERPOSITION 113 -#TOC> -#TOC> ========================================================================== - - -# = 1 ChimeraX REMOTE SCRIPTING =========================================== - - -# One of the cool features of ChimeraX is that it can be driven by Python code, -# both within a running session and through Python scripts. What I find even -# cooler though is that ChimeraX can be driven from any programming language via -# its remote control function that can listen to commands sent from any other -# application. The interface that is used here is the standard REST (method) - -# the GET and POST verbs that ubiquitously underly the communication of clients -# and servers on the Web. - -# In order to establish the communication between this script and ChimeraX, all -# we need to do is: -# - open ChimeraX; -# - tell it to listen on a specific "port"; -# - send commands to that port via httr:: - - -# == 1.1 Defining a Port =================================================== - -# The httr:: package needs to be available - -if (! requireNamespace("httr", quietly = TRUE)) { - install.packages("httr") -} -# Package information: -# library(help = httr) # basic information -# browseVignettes("httr") # available vignettes -# data(package = "httr") # available datasets - -# We need to think od a port. Any available port number between 49152-65535 is -# fine. We'll choose 61803 because that's the fractional part of the golden -# ratio. But one could choose another. - -CXPORT <- 61803 - -# Check that our current version of R supports sockets (default since V 3.3) -capabilities("sockets") # MUST be TRUE. If not, don't continue. - - -# == 1.2 Open ChimeraX ===================================================== - -# - Open a fresh, new session of recently updated version of ChimeraX -# - type: -# -# remotecontrol rest start port 61803 -# -# ... or whatever the value of CXPORT is. - -# Now watch what happens in ChimeraX when you execute the following line: -( x <- httr::GET("http://127.0.0.1:61803/run?command=open+1BM8") ) - -# The .utilities.R script includes the function CX(), based on this principle, -# through which you can send commands to ChimeraX - -CX("camera sbs") -CX("lighting soft") -CX("color sequential #1 & protein target abc palette powderblue:orchid:white") - -# The command echos Chimera's response if the parameter "quietly" is -# FALSE (default), and we can silence output with quietly = TRUE : -CX("info models #1 attribute num_residues") -CX("info models #1 attribute num_residues", quietly = TRUE) - -# Either way, the command also returns Chimera's responses "invisibly"; -# i.e. we can use the results by assigning the output to a variable: -hBonds <- CX("hbonds #1 & protein makePseudobonds false log true", quietly=TRUE) -x <- read.table(file = textConnection(hBonds), skip = 9, - blank.lines.skip = TRUE, fill = TRUE) -hist(x[,13], main="H-bonds", xlab="D···A (Å)", ylab="counts", col="#c9dcff") - - -# = 2 WORKED EXAMPLE: SUPERPOSITION ======================================= - -# We superimpose the 1BM8 structure with the 1DUX crystal structure to be able -# to explore possible DNA binding regions in 1BM8 - -# The model for 1BM8 is already open as model 1 (#1) -CX("hide #1 cartoons") # hide model 1 cartoon representation -CX("open 1DUX") # assume this is opened as model #2 -CX("hide #2") # hide everything ... -CX("select #2/C") # chain c (protein) -CX("show sel cartoons") # ... and show cartoons of chain c (protein) -CX("color sequential sel target c palette steelblue:darkmagenta") -CX("view #2/C") # re-center the display -CX("cofr #2/C:62@CA") # set pivot to an interface residue -CX("select #2/A,B & nucleic-acid") # chains A, B are the cognate DNA -CX("style sel stick") -CX("show sel target ab") # show atoms/bonds -CX("color sequential #2/A & nucleic-acid target ab palette teal:lightcyan") -CX("color sequential #2/B & nucleic-acid target ab palette teal:lightcyan") -CX("surface sel enclose sel") # compute joint accessible surface of both chains -CX("transparency 50") -CX("select clear") - -# Now superimpose the 1BM8 chain onto 1DUX chain C -CX("show #1 cartoons") -CX("matchmaker #1/A to #2/C pairing ss") # the actual superposition - -# study the general layout, and the position of the 1mb8 secondary structure -# elements relative to 1DUX - -# Let's examine side chain orientations in more detail -CX("hide #2/C cartoons") # hide the 1DUX protein - -# select all residues in 1BM8 that are within 3.5 A of the DNA chains (a, b) -CX("select zone #2/A,B 3.5 #1 & protein residues true") -CX("~select sel & H") # de-select H atoms -CX("show sel target ab") -CX("size stickRadius 0.4") -CX("select clear") - -# The overall architecture of the Mbp1 APSES domain is a good match for the Elk -# transcription factor binding mode; the detailed conformations of side chains -# would need to change only to a minor degree. There is a very significant -# degree of structural similarity; remarkable, given that the DNA is not the -# target sequence of the Mbp1 transcription factor, AND the 1MB8 structure was -# determined without a DNA ligand. - -CX("remotecontrol rest stop") # release the socket -# Done. - - - -# [END] +# tocID <- "RPR-ChimeraX_remote.R" +# +# Purpose: A Bioinformatics Course: +# R code demonstrating remote scripting of ChimeraX. +# +# Version: 1.0.1 +# +# Date: 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.0.1 2021 Minimal updates +# 1.0 First ABC units version +# +# +# TODO: +# %-encode and escape quotes, or just pass-through? +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------------ +#TOC> 1 ChimeraX REMOTE SCRIPTING 41 +#TOC> 1.1 Defining a Port 59 +#TOC> 1.2 Open ChimeraX 81 +#TOC> 2 WORKED EXAMPLE: SUPERPOSITION 113 +#TOC> +#TOC> ========================================================================== + + +# = 1 ChimeraX REMOTE SCRIPTING =========================================== + + +# One of the cool features of ChimeraX is that it can be driven by Python code, +# both within a running session and through Python scripts. What I find even +# cooler though is that ChimeraX can be driven from any programming language via +# its remote control function that can listen to commands sent from any other +# application. The interface that is used here is the standard REST (method) - +# the GET and POST verbs that ubiquitously underly the communication of clients +# and servers on the Web. + +# In order to establish the communication between this script and ChimeraX, all +# we need to do is: +# - open ChimeraX; +# - tell it to listen on a specific "port"; +# - send commands to that port via httr:: + + +# == 1.1 Defining a Port =================================================== + +# The httr:: package needs to be available + +if (! requireNamespace("httr", quietly = TRUE)) { + install.packages("httr") +} +# Package information: +# library(help = httr) # basic information +# browseVignettes("httr") # available vignettes +# data(package = "httr") # available datasets + +# We need to think od a port. Any available port number between 49152-65535 is +# fine. We'll choose 61803 because that's the fractional part of the golden +# ratio. But one could choose another. + +CXPORT <- 61803 + +# Check that our current version of R supports sockets (default since V 3.3) +capabilities("sockets") # MUST be TRUE. If not, don't continue. + + +# == 1.2 Open ChimeraX ===================================================== + +# - Open a fresh, new session of recently updated version of ChimeraX +# - type: +# +# remotecontrol rest start port 61803 +# +# ... or whatever the value of CXPORT is. + +# Now watch what happens in ChimeraX when you execute the following line: +( x <- httr::GET("http://127.0.0.1:61803/run?command=open+1BM8") ) + +# The .utilities.R script includes the function CX(), based on this principle, +# through which you can send commands to ChimeraX + +CX("camera sbs") +CX("lighting soft") +CX("color sequential #1 & protein target abc palette powderblue:orchid:white") + +# The command echos Chimera's response if the parameter "quietly" is +# FALSE (default), and we can silence output with quietly = TRUE : +CX("info models #1 attribute num_residues") +CX("info models #1 attribute num_residues", quietly = TRUE) + +# Either way, the command also returns Chimera's responses "invisibly"; +# i.e. we can use the results by assigning the output to a variable: +hBonds <- CX("hbonds #1 & protein makePseudobonds false log true", quietly=TRUE) +x <- read.table(file = textConnection(hBonds), skip = 9, + blank.lines.skip = TRUE, fill = TRUE) +hist(x[,13], main="H-bonds", xlab="D···A (Å)", ylab="counts", col="#c9dcff") + + +# = 2 WORKED EXAMPLE: SUPERPOSITION ======================================= + +# We superimpose the 1BM8 structure with the 1DUX crystal structure to be able +# to explore possible DNA binding regions in 1BM8 + +# The model for 1BM8 is already open as model 1 (#1) +CX("hide #1 cartoons") # hide model 1 cartoon representation +CX("open 1DUX") # assume this is opened as model #2 +CX("hide #2") # hide everything ... +CX("select #2/C") # chain c (protein) +CX("show sel cartoons") # ... and show cartoons of chain c (protein) +CX("color sequential sel target c palette steelblue:darkmagenta") +CX("view #2/C") # re-center the display +CX("cofr #2/C:62@CA") # set pivot to an interface residue +CX("select #2/A,B & nucleic-acid") # chains A, B are the cognate DNA +CX("style sel stick") +CX("show sel target ab") # show atoms/bonds +CX("color sequential #2/A & nucleic-acid target ab palette teal:lightcyan") +CX("color sequential #2/B & nucleic-acid target ab palette teal:lightcyan") +CX("surface sel enclose sel") # compute joint accessible surface of both chains +CX("transparency 50") +CX("select clear") + +# Now superimpose the 1BM8 chain onto 1DUX chain C +CX("show #1 cartoons") +CX("matchmaker #1/A to #2/C pairing ss") # the actual superposition + +# study the general layout, and the position of the 1mb8 secondary structure +# elements relative to 1DUX + +# Let's examine side chain orientations in more detail +CX("hide #2/C cartoons") # hide the 1DUX protein + +# select all residues in 1BM8 that are within 3.5 A of the DNA chains (a, b) +CX("select zone #2/A,B 3.5 #1 & protein residues true") +CX("~select sel & H") # de-select H atoms +CX("show sel target ab") +CX("size stickRadius 0.4") +CX("select clear") + +# The overall architecture of the Mbp1 APSES domain is a good match for the Elk +# transcription factor binding mode; the detailed conformations of side chains +# would need to change only to a minor degree. There is a very significant +# degree of structural similarity; remarkable, given that the DNA is not the +# target sequence of the Mbp1 transcription factor, AND the 1MB8 structure was +# determined without a DNA ligand. + +CX("remotecontrol rest stop") # release the socket +# Done. + + + +# [END] diff --git a/RPR-FASTA.R b/RPR-FASTA.R index 6861439..d4d5088 100644 --- a/RPR-FASTA.R +++ b/RPR-FASTA.R @@ -1,322 +1,322 @@ -# tocID <- "RPR-FASTA.R" -# -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-FASTA unit. -# -# Version: 1.1.2 -# -# Date: 2017-10 - 2021-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.1.2 style update -# 1.1.1 bugfix - wrong function name -# 1.1 2020 Maintenance. Rewrite validation logic. Add data -# to utilities. Define AACOLS -# 1.0 New unit. -# -# -# TODO: Make a simple solution first, then extend it to error checking, and -# to handle .mfa files. -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ----------------------------------------------------- -#TOC> 1 Reading and validating FASTA 45 -#TOC> 1.1 Validating FASTA 81 -#TOC> 2 Parsing FASTA 227 -#TOC> 3 Interpreting FASTA 247 -#TOC> 4 Writing FASTA 274 -#TOC> -#TOC> ========================================================================== - - -# = 1 Reading and validating FASTA ======================================== - -# FASTA is a text based format, structured in lines that are separated by -# line-feed or paragraph-break characters. Which one of these is used, depends -# on your operating system. But R's readLines() function knows how to handle -# these correctly, accross platforms. Don't try to read such files "by hand". -# Here is the yeast Mbp1 gene, via SGD. - -file.show("./data/S288C_YDL056W_MBP1_coding.fsa") -faMBP1 <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa") - -# The warning is generated because the programmer at the NCBI who implemented -# the code to write this FASTA file neglected to place a line-break character -# after the last sequence character. While this is not technically incorrect, -# it is poor practice: the resulting file can't be distinguished from one that -# has been truncated in transmission. - -head(faMBP1) - -# Note that there are NO line-break characters ("\n") at the end of these -# strings, even though they were present in the original file. readLines() -# has "consumed" these characters while reading - but every single line is in -# a vector of its own. - -tail(faMBP1) - -# Also note that the last line has fewer characters - this means readLines() -# imported the whole line, despite it not being terminated by "\n". - -# It's very straightforward to work with such data, for example by collapsing -# everything except the first line into a single string ... - -f <- c(faMBP1[1], paste(faMBP1[-1], sep = "", collapse = "")) - -f[1] -nchar(f[2]) - -# == 1.1 Validating FASTA ================================================== - -# The code above is making the assumption that everything from line 2 until -# the end IS sequence, the whole sequence and nothing but sequence. -# That assumption can break down in many ways: -# -# - there could be more than one header line. The specification says otherwise, -# but some older files use multiple, consecutive header lines. You don't -# want that to end up in your sequence. -# - this could be not a FASTA file at all. It could be raw sequence, a -# different sequence file format, or a wholly different file altogether. -# If you look at the file, you can immediately tell, but if you are -# reading the file in a complex workflow, your could easily import wrong -# data into your analysis. -# - there could be more than one sequence in the file. Such Multi-FASTA files -# occur commonly, as downloads of ORFs from genome regions or other -# sets of genes or proteins, or as the input / output for multiple -# sequence alignment programs. -# -# Data "from the wild" can (and usually does) have the most unexpected -# variations and it is really, really important to be clear about the -# assumptions that you are making. It is possible to "fix" things, according -# to the "Robustness Principle" : -# "Be conservative in what you send, -# be liberal in what you accept". -# (cf. https://en.wikipedia.org/wiki/Robustness_principle ) -# ... but if you think about this, that's actually a really poor idea, -# which is much more likely to dilute standards, make unwarranted -# assumptions, and allow errors to pass silently and corrupt data. -# -# Let's discard this principle on the trash-heap of -# things-that-sound-like-a-good-idea-but-aren't. What we do instead is test, -# identify problems, and follow the principle: "crash early, crash often". Of -# course I can write code that would reformat any possible input as a FASTA -# file - but what good will it do me if it parses the file I receive -# from a server into FASTA format like: -# -# >404- Page Not Found -# dyh-PagentfndhpThepageyreqesteddesnteistnthisserverCheckthe -# spellingrcntacttheadministratrsdyhtml -# -# Therefore, we write ourselves a FASTA checker that will enforce the following: -# (1) a FASTA file contains one or more sequences separated by zero or -# more empty lines -# (2) a sequence contains one header line followed by -# one or more sequence lines -# (3) a sequence line contains one or more uppercase or lowercase single -# letter amino acid codes, hyphens (gap character), or * (stop). -# -# Anything else should generate an error. - -# (Case 1): Header(s) exist -fX <- c("ABC", - "defghi", - "klmnpq") -sel <- grepl("^>", fX) # "^>" is a regular expression that - # means: the exact character ">" at the - # beginning ("^") of the line. -if ( ! any(sel) ) { stop("no header lines in input.") } - - -# (Case 2) No adjacent header lines -fX <- c(">ABC", - ">123", - "defghi", - "klmnpq") -sel <- grepl("^>", fX) -sel <- sel[- length(sel)] & sel[-1] # comparing shifted vectors -if ( any(sel)) { stop("adjacent header lines in input.") } - -# (Case 3.1) all sequence lines contain only valid characters -# (constants for valid characters AAVALID, NUCVALID, and NUCAMBIG -# are defined with the .utilities.R script) -AAVALID -fX <- c(">ABC", - "def ;-) ghi", - "klmnpq") -myRegex <- sprintf("[^%s]", AAVALID) # NOT a valid character -sel <- ! grepl("^>", fX) # NOT headers -if (any(grepl(myRegex, fX[sel]))) { - stop("invalid chracter(s) outside of header lines.") -} - -# (Case 3.2) all headers are followed directly by -# at least one letter of sequence -fX <- c(">ABC", - "", - ">123", - "defghi", - "klmnpq") -sel <- grep("^>", fX) + 1 # indexes of headers + 1 -myRegex <- sprintf("[%s]+", AAVALID) # at least one valid character -if (! all(grepl(myRegex, fX[sel]))) { - stop("a header has no adjacent sequence.") -} -# Ah, you might ask - couldn't we just have dropped all empty lines, and -# then caught this in Case 2? No - for two reasons: we would still miss headers -# at the end of file, and, we would have changed the line numbering - and -# ideally our "production" function will create information about where the -# error is to be found. - - -# Now combine this into a function ... - -val <- function(fa) { - - if ( ! any(grepl("^>", fa)) ) { - stop("no header lines in input.") - } - - sel <- grepl("^>", fa) - if ( any(sel[- length(sel)] & sel[-1])) { - stop("adjacent header lines in input.") - } - - sel <- ! grepl("^>", fa) - if ( any(grepl(sprintf("[^%s]", AAVALID), fa[sel]))) { - stop("invalid chracter(s) outside of header lines.") - } - - sel <- grep("^>", fa) + 1 - if (! all(grepl(sprintf("[%s]+", AAVALID), fa[sel]))) { - stop("a header has no adjacent sequence.") - } - - return(invisible(NULL)) -} - -# Here is an example -FA <- c(">head1", - "acdef", - "ghi", - "", - ">head2", - "kl", - ">head3", - "mn", - "pqrs") -val(FA) # ... should not create an error - - -# A somewhat more elaborate validateFA() function was loaded with the -# ./utilities.R script. It needs a bit more bookkeeping, since NCBI multi- -# fasta files have space-characters in their spacer lines. Try it ... -validateFA(FA) - -# = 2 Parsing FASTA ======================================================= - -# Once we have validated our assumptions about our input, it's quite -# painless to parse it. I have put this together as a function and the function -# gets loaded from ./.utilities.R -# - -# Lets try this: -# - the first 3 elements of faMBP1: -readFASTA(faMBP1[1:3]) - -# - a multi FASTA file of aligned APSES domain sequences: - -refAPSES <- readFASTA("./data/refAPSES.mfa") - -# Subset the sequence with "P39678" in the header -refAPSES[grep("P39678", refAPSES$head) ,] - - - -# = 3 Interpreting FASTA ================================================== - - -# FASTA files are straightforward to interpret - just one thing may be of note: -# when working with strings, we can use substr(, , ) to -# extract substrings, but more often we expand the string into a vector of -# single characters with strsplit(, ""). strsplit() returns a list, -# to accommodate that could be a vector of many elements, therefore -# we usually unlist() the result if we use it only on a single string. - -# Example: How many positive charged residues in "MBP1_SACCE"? - -s <- unlist(strsplit(refAPSES$seq[grep("MBP1_SACCE", refAPSES$head)], "")) -s - -sum(grepl("[HKR]", s)) # 20 (+) charged residues. grepl() returns TRUE and FALSE - # for the characters, sum() coerces to 1 and 0 - # respectively, and that gives us the result. - -100 * sum(grepl("[HKR]", s)) / length(s) # in percent: 20.2 % - -# residue distribution -x <- factor(s, levels = names(AACOLS)) -pie(table(x)[names(AACOLS)], col = AACOLS) - - - -# = 4 Writing FASTA ======================================================= - - -# Writing FASTA files is mostly just the reverse of reading, with one -# twist: we need to break the long sequence string into chunks of the desired -# width. The FASTA specification calls for a maximum of 120 characters per line, -# but writing out much less than that is common, since it allows to comfortably -# view lines on the console, or printing them on a sheet of paper (do we still -# do that actually?). How do we break a string into chunks? A combination of -# seq(, , ) with substring(, , ) will work -# nicely. (Note that substring() is vectorized, whereas substr() is not!) As we -# loop through our FASTA object in memory, we can build the output by c()'ing -# blocks of header + sequence to each other. For VERY large objects this might -# be slow - in that case, we might want to precalculate the size of the output -# object. But that's more of a hypothetical consideration. - -( s <- refAPSES$seq[2] ) -nchar(s) -w <- 30 # width of chunk -(starts <- seq(1, nchar(s), by = w)) # starting index of chunk -(ends <- c((starts - 1)[-1], nchar(s))) # ending index of chunk - -# Task: Is this safe? What happens if nchar(s) is shorter than w? -# What happens if nchar(s) is an exact multiple of w? - -substring(s, starts, ends) -# confirm that the output contains the first and last residue, and both -# residues adjacent to the breaks - -# As always, the function has been defined in ".utilities.R" for to use -# any time... type writeFASTA to examine it. - -# Let's try this... - -writeFASTA(refAPSES, width = 40) - -# roundtrip for validation: write refAPSES with a different format, -# read it back in - the new dataframe must be identical -# to the original dataframe. -fname <- tempfile() -writeFASTA(refAPSES, fn = fname, width = 30) -identical(refAPSES, readFASTA(fname)) - -# ...works for me :-) - - -# [END] +# tocID <- "RPR-FASTA.R" +# +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-FASTA unit. +# +# Version: 1.1.2 +# +# Date: 2017-10 - 2021-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.1.2 style update +# 1.1.1 bugfix - wrong function name +# 1.1 2020 Maintenance. Rewrite validation logic. Add data +# to utilities. Define AACOLS +# 1.0 New unit. +# +# +# TODO: Make a simple solution first, then extend it to error checking, and +# to handle .mfa files. +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ----------------------------------------------------- +#TOC> 1 Reading and validating FASTA 45 +#TOC> 1.1 Validating FASTA 81 +#TOC> 2 Parsing FASTA 227 +#TOC> 3 Interpreting FASTA 247 +#TOC> 4 Writing FASTA 274 +#TOC> +#TOC> ========================================================================== + + +# = 1 Reading and validating FASTA ======================================== + +# FASTA is a text based format, structured in lines that are separated by +# line-feed or paragraph-break characters. Which one of these is used, depends +# on your operating system. But R's readLines() function knows how to handle +# these correctly, accross platforms. Don't try to read such files "by hand". +# Here is the yeast Mbp1 gene, via SGD. + +file.show("./data/S288C_YDL056W_MBP1_coding.fsa") +faMBP1 <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa") + +# The warning is generated because the programmer at the NCBI who implemented +# the code to write this FASTA file neglected to place a line-break character +# after the last sequence character. While this is not technically incorrect, +# it is poor practice: the resulting file can't be distinguished from one that +# has been truncated in transmission. + +head(faMBP1) + +# Note that there are NO line-break characters ("\n") at the end of these +# strings, even though they were present in the original file. readLines() +# has "consumed" these characters while reading - but every single line is in +# a vector of its own. + +tail(faMBP1) + +# Also note that the last line has fewer characters - this means readLines() +# imported the whole line, despite it not being terminated by "\n". + +# It's very straightforward to work with such data, for example by collapsing +# everything except the first line into a single string ... + +f <- c(faMBP1[1], paste(faMBP1[-1], sep = "", collapse = "")) + +f[1] +nchar(f[2]) + +# == 1.1 Validating FASTA ================================================== + +# The code above is making the assumption that everything from line 2 until +# the end IS sequence, the whole sequence and nothing but sequence. +# That assumption can break down in many ways: +# +# - there could be more than one header line. The specification says otherwise, +# but some older files use multiple, consecutive header lines. You don't +# want that to end up in your sequence. +# - this could be not a FASTA file at all. It could be raw sequence, a +# different sequence file format, or a wholly different file altogether. +# If you look at the file, you can immediately tell, but if you are +# reading the file in a complex workflow, your could easily import wrong +# data into your analysis. +# - there could be more than one sequence in the file. Such Multi-FASTA files +# occur commonly, as downloads of ORFs from genome regions or other +# sets of genes or proteins, or as the input / output for multiple +# sequence alignment programs. +# +# Data "from the wild" can (and usually does) have the most unexpected +# variations and it is really, really important to be clear about the +# assumptions that you are making. It is possible to "fix" things, according +# to the "Robustness Principle" : +# "Be conservative in what you send, +# be liberal in what you accept". +# (cf. https://en.wikipedia.org/wiki/Robustness_principle ) +# ... but if you think about this, that's actually a really poor idea, +# which is much more likely to dilute standards, make unwarranted +# assumptions, and allow errors to pass silently and corrupt data. +# +# Let's discard this principle on the trash-heap of +# things-that-sound-like-a-good-idea-but-aren't. What we do instead is test, +# identify problems, and follow the principle: "crash early, crash often". Of +# course I can write code that would reformat any possible input as a FASTA +# file - but what good will it do me if it parses the file I receive +# from a server into FASTA format like: +# +# >404- Page Not Found +# dyh-PagentfndhpThepageyreqesteddesnteistnthisserverCheckthe +# spellingrcntacttheadministratrsdyhtml +# +# Therefore, we write ourselves a FASTA checker that will enforce the following: +# (1) a FASTA file contains one or more sequences separated by zero or +# more empty lines +# (2) a sequence contains one header line followed by +# one or more sequence lines +# (3) a sequence line contains one or more uppercase or lowercase single +# letter amino acid codes, hyphens (gap character), or * (stop). +# +# Anything else should generate an error. + +# (Case 1): Header(s) exist +fX <- c("ABC", + "defghi", + "klmnpq") +sel <- grepl("^>", fX) # "^>" is a regular expression that + # means: the exact character ">" at the + # beginning ("^") of the line. +if ( ! any(sel) ) { stop("no header lines in input.") } + + +# (Case 2) No adjacent header lines +fX <- c(">ABC", + ">123", + "defghi", + "klmnpq") +sel <- grepl("^>", fX) +sel <- sel[- length(sel)] & sel[-1] # comparing shifted vectors +if ( any(sel)) { stop("adjacent header lines in input.") } + +# (Case 3.1) all sequence lines contain only valid characters +# (constants for valid characters AAVALID, NUCVALID, and NUCAMBIG +# are defined with the .utilities.R script) +AAVALID +fX <- c(">ABC", + "def ;-) ghi", + "klmnpq") +myRegex <- sprintf("[^%s]", AAVALID) # NOT a valid character +sel <- ! grepl("^>", fX) # NOT headers +if (any(grepl(myRegex, fX[sel]))) { + stop("invalid chracter(s) outside of header lines.") +} + +# (Case 3.2) all headers are followed directly by +# at least one letter of sequence +fX <- c(">ABC", + "", + ">123", + "defghi", + "klmnpq") +sel <- grep("^>", fX) + 1 # indexes of headers + 1 +myRegex <- sprintf("[%s]+", AAVALID) # at least one valid character +if (! all(grepl(myRegex, fX[sel]))) { + stop("a header has no adjacent sequence.") +} +# Ah, you might ask - couldn't we just have dropped all empty lines, and +# then caught this in Case 2? No - for two reasons: we would still miss headers +# at the end of file, and, we would have changed the line numbering - and +# ideally our "production" function will create information about where the +# error is to be found. + + +# Now combine this into a function ... + +val <- function(fa) { + + if ( ! any(grepl("^>", fa)) ) { + stop("no header lines in input.") + } + + sel <- grepl("^>", fa) + if ( any(sel[- length(sel)] & sel[-1])) { + stop("adjacent header lines in input.") + } + + sel <- ! grepl("^>", fa) + if ( any(grepl(sprintf("[^%s]", AAVALID), fa[sel]))) { + stop("invalid chracter(s) outside of header lines.") + } + + sel <- grep("^>", fa) + 1 + if (! all(grepl(sprintf("[%s]+", AAVALID), fa[sel]))) { + stop("a header has no adjacent sequence.") + } + + return(invisible(NULL)) +} + +# Here is an example +FA <- c(">head1", + "acdef", + "ghi", + "", + ">head2", + "kl", + ">head3", + "mn", + "pqrs") +val(FA) # ... should not create an error + + +# A somewhat more elaborate validateFA() function was loaded with the +# ./utilities.R script. It needs a bit more bookkeeping, since NCBI multi- +# fasta files have space-characters in their spacer lines. Try it ... +validateFA(FA) + +# = 2 Parsing FASTA ======================================================= + +# Once we have validated our assumptions about our input, it's quite +# painless to parse it. I have put this together as a function and the function +# gets loaded from ./.utilities.R +# + +# Lets try this: +# - the first 3 elements of faMBP1: +readFASTA(faMBP1[1:3]) + +# - a multi FASTA file of aligned APSES domain sequences: + +refAPSES <- readFASTA("./data/refAPSES.mfa") + +# Subset the sequence with "P39678" in the header +refAPSES[grep("P39678", refAPSES$head) ,] + + + +# = 3 Interpreting FASTA ================================================== + + +# FASTA files are straightforward to interpret - just one thing may be of note: +# when working with strings, we can use substr(, , ) to +# extract substrings, but more often we expand the string into a vector of +# single characters with strsplit(, ""). strsplit() returns a list, +# to accommodate that could be a vector of many elements, therefore +# we usually unlist() the result if we use it only on a single string. + +# Example: How many positive charged residues in "MBP1_SACCE"? + +s <- unlist(strsplit(refAPSES$seq[grep("MBP1_SACCE", refAPSES$head)], "")) +s + +sum(grepl("[HKR]", s)) # 20 (+) charged residues. grepl() returns TRUE and FALSE + # for the characters, sum() coerces to 1 and 0 + # respectively, and that gives us the result. + +100 * sum(grepl("[HKR]", s)) / length(s) # in percent: 20.2 % + +# residue distribution +x <- factor(s, levels = names(AACOLS)) +pie(table(x)[names(AACOLS)], col = AACOLS) + + + +# = 4 Writing FASTA ======================================================= + + +# Writing FASTA files is mostly just the reverse of reading, with one +# twist: we need to break the long sequence string into chunks of the desired +# width. The FASTA specification calls for a maximum of 120 characters per line, +# but writing out much less than that is common, since it allows to comfortably +# view lines on the console, or printing them on a sheet of paper (do we still +# do that actually?). How do we break a string into chunks? A combination of +# seq(, , ) with substring(, , ) will work +# nicely. (Note that substring() is vectorized, whereas substr() is not!) As we +# loop through our FASTA object in memory, we can build the output by c()'ing +# blocks of header + sequence to each other. For VERY large objects this might +# be slow - in that case, we might want to precalculate the size of the output +# object. But that's more of a hypothetical consideration. + +( s <- refAPSES$seq[2] ) +nchar(s) +w <- 30 # width of chunk +(starts <- seq(1, nchar(s), by = w)) # starting index of chunk +(ends <- c((starts - 1)[-1], nchar(s))) # ending index of chunk + +# Task: Is this safe? What happens if nchar(s) is shorter than w? +# What happens if nchar(s) is an exact multiple of w? + +substring(s, starts, ends) +# confirm that the output contains the first and last residue, and both +# residues adjacent to the breaks + +# As always, the function has been defined in ".utilities.R" for to use +# any time... type writeFASTA to examine it. + +# Let's try this... + +writeFASTA(refAPSES, width = 40) + +# roundtrip for validation: write refAPSES with a different format, +# read it back in - the new dataframe must be identical +# to the original dataframe. +fname <- tempfile() +writeFASTA(refAPSES, fn = fname, width = 30) +identical(refAPSES, readFASTA(fname)) + +# ...works for me :-) + + +# [END] diff --git a/RPR-GEO2R.R b/RPR-GEO2R.R index a4820c2..6d21096 100644 --- a/RPR-GEO2R.R +++ b/RPR-GEO2R.R @@ -1,674 +1,674 @@ -# tocID <- "RPR-GEO2R.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR_GEO2R unit. -# -# -# ============================================================================== -# Version: 1.3 -# -# Date: 2017-09 - 2020-09 -# Author: Boris Steipe -# -# Versions: -# 1.3 use saveRDS()/readRDS() rather than save()/load() -# 1.2 Change from require() to requireNamespace(), -# use ::() idiom throughout, -# use Biocmanager:: not biocLite() -# 1.1 Add section on GPL annotations -# 1.0 Updates for BCH441 2017 -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# TO SUBMIT FOR CREDIT.... -# -# Note: to submit tasks for credit for this unit, report on the sections -# that have "Task ..." section headers, and report on the lines that are -# identified with #TASK> comments. -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------------------------------------------- -#TOC> 1 Preparations 62 -#TOC> 2 Loading a GEO Dataset 89 -#TOC> 2.1 Task - understanding the data 155 -#TOC> 3 Column wise analysis - time points 164 -#TOC> 3.1 Task - Comparison of experiments 193 -#TOC> 3.2 Grouped Samples 226 -#TOC> 4 Row-wise Analysis: Expression Profiles 261 -#TOC> 4.1 Task - Read a table of features 296 -#TOC> 4.2 Selected Expression profiles 349 -#TOC> 5 Differential Expression 392 -#TOC> 5.1 Final task: Gene descriptions 532 -#TOC> 6 Improving on Discovery by Differential Expression 538 -#TOC> 7 Annotation data 633 -#TOC> -#TOC> ========================================================================== - - -# = 1 Preparations ======================================================== - -# To load and analyze GEO datasets we use a number of Bioconductor packages: - - -if (! requireNamespace("BiocManager", quietly = TRUE)) { - install.packages("BiocManager") -} - -if (! requireNamespace("Biobase", quietly = TRUE)) { - BiocManager::install("Biobase") -} -# Package information: -# library(help = Biobase) # basic information -# browseVignettes("Biobase") # available vignettes -# data(package = "Biobase") # available datasets - - -if (! requireNamespace("GEOquery", quietly = TRUE)) { - BiocManager::install("GEOquery") -} -# Package information: -# library(help = GEOquery) # basic information -# browseVignettes("GEOquery") # available vignettes -# data(package = "GEOquery") # available datasets - - -# = 2 Loading a GEO Dataset =============================================== - -# The R code below is adapted from the GEO2R scripts produced by GEO for GSE3635 -# for the experiment conducted in the BIN-EXPR-GEO unit - -# Version info: R 3.2.3, Biobase 2.30.0, GEOquery 2.40.0, limma 3.26.8 -# R scripts generated Wed Jan 11 17:39:46 EST 2017 - - -# Load series and platform data from GEO. The GEO server is a bit flakey and -# I have experienced outages over several hours. If the command below does -# not work for you, skip ahead to the fallback procedure. - -GSE3635 <- GEOquery::getGEO("GSE3635", GSEMatrix =TRUE, getGPL=FALSE) -# Note: GEO2R scripts call the expression data set -# "gset" throughout ... in this script I give -# it the name "GSE3635" for clarity. - -# Subset, if the data contains multiple experiments with different platforms -# since we should not be mixing data from different platforms. (That's -# unfortunately very hard to do correctly). The "platform" is the type of chip -# that was used, and what I selected online when this script was produced, so -# GEO2R knows about the correct platform ID. Technically, subsetting to just one -# platform is not necessary here because we _know_ that GSE3635 contains only -# data produced with the GPL1914 platform. But that's the way GEO2R scripts are -# setup be default since they have to be able to handle a variety of cases. -if (length(GSE3635) > 1) { - idx <- grep("GPL1914", attr(GSE3635, "names")) -} else { - idx <- 1 -} - -GSE3635 <- GSE3635[[idx]] - -# FALLBACK -# ... in case the GEO server is not working, load the "GSE3635" object from -# the data directory: -# -# GSE3635 <- readRDS(file="./data/GSE3635.rds") - - -# Checkpoint ... -if (! exists("GSE3635")) { - stop("PANIC: GSE3635 was not loaded. Can't continue.") -} - - -# GSE3635 is an "Expression Set" - cf. -# https://bioconductor.org/packages/release/bioc/vignettes/Biobase/inst/doc/ExpressionSetIntroduction.pdf - -# What does this contain? -help("ExpressionSet-class") - -# Print it -GSE3635 - -# Access contents via methods: -Biobase::featureNames(GSE3635)[1:20] # Rows. What are these features? -Biobase::sampleNames(GSE3635)[1:10] # Columns. What are these columns? - -# Access contents by subsetting: -( tmp <- GSE3635[12:17, 1:6] ) - -# Access data -Biobase::exprs(tmp) # exprs() gives us the actual expression values. - -# == 2.1 Task - understanding the data ===================================== - -#TASK> What are the data values: -#TASK> ... in each cell? -#TASK> ... in each column? -#TASK> ... in each row? - - - -# = 3 Column wise analysis - time points ================================== - -# Get an overview of the distribution of values in individual columns -summary(Biobase::exprs(GSE3635)[ , 1]) -summary(Biobase::exprs(GSE3635)[ , 4]) -summary(Biobase::exprs(GSE3635)[ , 7]) - -# This allows us to com pare the columns, comment on the quality of the data, -# and get a sense for the distribution. We need to know how exactly these -# numbers were produced: obviously, if we don't know how those numbers were -# created in the first place, we would produce a major sin of Cargo Cult -# bioinformatics if we would analyze them. - - - -# compare them in a a boxplot -cyclicPalette <- colorRampPalette(c("#14b4c9", - "#d2d1e6", - "#e66594", - "#d2d1e6", - "#14b4c9", - "#d2d1e6", - "#e66594", - "#d2d1e6", - "#14b4c9")) -tCols <- cyclicPalette(13) -boxplot(Biobase::exprs(GSE3635), col = tCols) - - -# == 3.1 Task - Comparison of experiments ================================== -#TASK> Study this boxplot. What's going on? Are these expression values? -#TASK> What do the numbers mean? (Summarize the process and computation -#TASK> that has gone i to the preprocessing. You need to understand why -#TASK> these columns all have the same mean and range.) Given what common -#TASK> sense tells you about the variability of experiments, do you -#TASK> believe your understanding is complete? - - -# Lets plot the distributions of values in a more fine-grained manner: -hT0 <- hist(Biobase::exprs(GSE3635)[ , 1], breaks = 100, col = tCols[1]) -hT3 <- hist(Biobase::exprs(GSE3635)[ , 4], breaks = 100, col = tCols[4]) -hT6 <- hist(Biobase::exprs(GSE3635)[ , 7], breaks = 100, col = tCols[7]) -hT9 <- hist(Biobase::exprs(GSE3635)[ , 10], breaks = 100, col = tCols[10]) -hT12 <- hist(Biobase::exprs(GSE3635)[ , 13], breaks = 100, col = tCols[13]) - - -plot( hT0$mids, hT0$counts, type = "l", col = tCols[1], xlim = c(-0.5, 0.5)) -points(hT3$mids, hT3$counts, type = "l", col = tCols[4]) -points(hT6$mids, hT6$counts, type = "l", col = tCols[7]) -points(hT9$mids, hT9$counts, type = "l", col = tCols[10]) -points(hT12$mids, hT12$counts, type = "l", col = tCols[13]) -legend("topright", - legend = c("hT0", "hT3", "hT6", "hT9", "hT12"), - col = tCols[c(1, 4, 7, 10, 13)], - lwd = 1) - - -#TASK> Study this plot. What does it tell you? Is there systematic, global -#TASK> change in the values over time? Within a cycle? Over the course of the -#TASK> experiment? - - -# == 3.2 Grouped Samples =================================================== - -# This is the GEO2R code that produces the histogram you saw on the NCBI -# Website if you went through the BIN-EXPR-GEO unit. - -# Group names for all samples in a series -gsms <- "0123450123450" # Each digit identifies one of the 13 columns -sml <- c() -for (i in 1:nchar(gsms)) { - sml[i] <- substr(gsms,i,i) -} -sml <- paste("G", sml, sep="") # set group names - -# order samples by group -ex <- Biobase::exprs(GSE3635)[ , order(sml)] -sml <- sml[order(sml)] -fl <- as.factor(sml) -labels <- c("t0","t10","t20","t30","t40","t50") # these are the labels we - # assigned in the BIN-EXPR-GEO - # unit - -# Set parameters and draw the plot. I changed this from the original GEO2R -# code which overwrote the global palette(). That's evil! Utility code -# should _never_ mess with global parameters! -GEOcols <- c("#dfeaf4", "#f4dfdf", "#f2cb98", "#dcdaa5", - "#dff4e4", "#f4dff4", "#AABBCC") -dev.new(width = 4 + dim(GSE3635)[[2]] / 5, height = 6) # plot into a new window -par(mar = c(2 + round(max(nchar(Biobase::sampleNames(GSE3635))) / 2), 4, 2, 1)) -title <- paste ("GSE3635", '/', Biobase::annotation(GSE3635), - " grouped samples", sep ='') -boxplot(ex, boxwex = 0.6, notch = TRUE, main = title, outline=FALSE, - las = 2, col = GEOcols[fl]) -legend("topleft", labels, fill = GEOcols, bty = "n") - - -# = 4 Row-wise Analysis: Expression Profiles ============================== - -# What we did above was column-wise analysis and it gave us an idea about how -# our experiments relate to each other. To analyze individual genes, we need to -# do row-wise analyis. - -#TASK> Try to answer the following questions: -#TASK> Are all rows genes? -#TASK> What identifiers are being used? -# (cf. https://sites.google.com/view/yeastgenome-help/community-help/nomenclature-conventions) -#TASK> Are all rows/genes unique? -#TASK> Are all yeast genes accounted for? - -# These are crucially important questions but you can't answer the last -# question because you have no information other than the gene identifiers. -# However, any biological interpretation relies absolutely on understanding -# the semantics of the data. Merely manipulating abstract identifiers and -# numbers, that would surely be Cargo Cult bioinformatics. - -# To answer these questions about the data semantics, I have provided the -# file "SGD_features.tab" in the data directory of this project. I have -# downloaded it from SGD -# (http://www.yeastgenome.org/download-data/curation), for a description of -# its contents see here: -file.show("./data/SGD_features.README.txt") -# Note: the file as downloaded from SGD actually crashed RStudio due to an -# unbalanced quotation mark which caused R to try and read the whole -# of the subsequent file into a single string. This was caused by an -# alias gene name (B"). I have removed this abomination -# by editing the file. The version in the ./data directory can be -# read without issues. - -# Leets peek into the file: -readLines("./data/SGD_features.tab", n = 5) - -# == 4.1 Task - Read a table of features =================================== - -# Note: this task asks you to write code. You MUST identify your -# sources when you draw on other's examples. - -# This data file is rather typical of datasets that you will encounter "in the -# wild". To proceed, you need to write code to read it into an R-object. Develop -# the code in your script file according to the following specification: -# -# - read "./data/SGD_features.tab" into a data frame -# called "SGD_features" -# - remove unneeded columns - keep the following data columns: -# - Primary SGDID -# - Feature type -# - Feature qualifier -# - Feature name - (the systematic name !) -# - Standard gene name -# - Description -# - give the data frame meaningful column names: -# colnames(SGD_features) <- c("SGDID", -# "type", -# "qual", -# "sysName", -# "name", -# "description") -# -# - remove all rows that don't have a systematic name. (You'll have to check -# what's in cells that don't have a systematic name) -# - check that the systematic names are unique (Hint: use the duplicated() -# function.) -# - assign the systematic names as row names -# - confirm: are all rows of the expression data set represented in -# the feature table? Hint: use setdiff() to print all that -# are not. -# Example usage of setdiff(): -# A <- c("duck", "crow", "gull", "tern") -# B <- c("gull", "rook", "tern", "kite", "myna") -# -# setdiff(A, B) # [1] "duck" "crow" -# setdiff(B, A) # [1] "rook" "kite" "myna" - -# If some of the features in the expression set are not listed in the -# systematic names, you have to be aware of that, when you try to get -# more information on them. I presume they are missing because revisions -# of the yeast genome after these experiments were done showed that these -# genes did not actually exist. - -# - confirm: how many / which genes in the feature table do not -# have expression data? - -# How should we handle rows/columns that are missing or not unique? - - -# == 4.2 Selected Expression profiles ====================================== - -# The code below assumes that you have read ./data/SGD_features.tab and assigned -# the resulting data frame to SGD_features, with columns as specified above. - -# Here is an expression profile for Mbp1. - -gName <- "MBP1" -(iFeature <- which(SGD_features$name == gName)) -(iExprs <- which(featureNames(GSE3635) == SGD_features$sysName[iFeature])) -plot(seq(0, 120, by = 10), - Biobase::exprs(GSE3635)[iExprs, ], - main = paste("Expression profile for", gName), - xlab = "time (min)", - ylab = "expression", - type = "b", - col= "maroon") -abline(h = 0, col = "#00000055") -abline(v = 60, col = "#00000055") - -# Print the description -SGD_features$description[iFeature] - -# Here is a list of gene names that may be involved in the cell cycle switch, -# and some genes that are controls (cf. BIN-SYS-Concepts): - -# Turning it on -# Cdc14, Mbp1, Swi6, Swi4, Whi5, Cdc28, Cln1, Cln2, Cln3 - -# Turning it off -# Rad53, Cdc28, Clb1, Clb2, Clb6, Nrm1 - -# Housekeeping genes -# Act1, and Alg9 - -#TASK> Plot expression profiles for these genes and study them. What do you -#TASK> expect the profiles to look like, given the role of these genes? What -#TASK> do you find? (Hint: you will make your life much easier if you define -#TASK> a function that plots and prints descriptions with a gene name as input. -#TASK> Also: are the gene names in the feature table upper case, or lower case? -#TASK> Also: note that the absolute values of change are quite different. -#TASK> Also: note that some values may be outliers i.e. failed experiments.) - -# = 5 Differential Expression ============================================= - -# GEO2R discovers the top differentially expressed expressed genes by -# using functions in the Bioconductor limma package. - -if (! requireNamespace("limma", quietly = TRUE)) { - BiocManager::install("limma") -} -# Package information: -# library(help = limma) # basic information -# browseVignettes("limma") # available vignettes -# data(package = "limma") # available datasets - -# The GEO2R limma code is virtually uncommented, and has not been written for -# clarity, but for being easily produced by a code-generator that is triggered -# by the parameters on the GEO Web-site. Most of it is actually dispensable for -# our purposes. - -# In principle, the code goes through three steps: -# 1. Prepare the data -# 2. Define groups that are to be contrasted to define "Differential" -# 3. Find genes whose expression levels are significantly different across -# the groups -# 4. Format results. - -# Biobase is a highly engineered package that is tightly integrated into -# the Bioconductor world - unfortunately that brings with it a somewhat -# undesirable level of computational overhead and dependencies. Using the -# package as we normally do - i.e. calling required functions with their -# explicit package prefix is therefore not advisable. There are generics -# that won't be propery dispatched. If you only need a small number of -# functions for a very specific context, you will probably get away with -# Biobase::() - but even in the demonstration code of this script -# not everything works out of the box. We'll therefore load the library, -# but we'll (redundantly) use the prefix anyway so as to emphasize where -# the functions come from. - -library(Biobase) - -# We are recapitulating the experiment in which we assigned the 0, 10, 60 and -# 70 minute samples to one group, the 30, 40, 90 and 100 minute samples to -# another group, and calculated differential expression values between these -# two groups. - -setA <- c(1, 2, 7, 8) # columns for set A -setB <- c(4, 5, 10, 11) # columns for set B - -# We remove columns we don't need, and for simplicity put the experiments for -# group A in the first four columns, and the group B in the next four. - -mySet <- GSE3635[ , c(setA, setB)] - -# limma needs the column descriptions as factors -mySet$description <- as.factor(c(rep("A", 4), rep("B", 4))) - -# Next we build the "design Matrix" for the statistical test: -myDesign <- model.matrix(~ description + 0, mySet) -colnames(myDesign) <- levels(mySet$description) -myDesign - -# Now we can calculate the fit of all rows to a linear model that depends -# on the two groups as specified in the design: -myFit <- limma::lmFit(mySet, myDesign) - -# Next we calculate the contrasts, given the fit ... -myCont.matrix <- limma::makeContrasts(A - B, levels = myDesign) -myFit2 <- limma::contrasts.fit(myFit, myCont.matrix) - -# ... compute appropriate probabilites from a modified t-test -# (empirical Bayes) ... -myFit2 <- limma::eBayes(myFit2, 0.01) - -# ... add the gene names to the fit - object ... -myFit2$genes <- featureNames(mySet) - -# ... and pick the top N differentially expressed genes while controlling -# for multiple testing with a False Discovery Rate (fdr) correction. GEO2R -# gave us only the top 250 genes, but we might as well do 1000, just so we -# can be reasonable sure that our gens of interest are included. -N <- 1000 -myTable <- limma::topTable(myFit2, - adjust.method = "fdr", - sort.by = "B", - number = N) - -str(myTable) -# The gene names are now in the $ID column - -# These are the top 10 -write.table(myTable[1:10 , c("ID","P.Value","B")], - file = stdout(), - row.names = FALSE, - sep="\t") - -# Let's see what we got: let's plot the full expression profiles (all 13 -# columns) for the top ten genes from exprs(GSE3635). - -plot(seq(0, 120, by = 10), - rep(0, 13), - type = "n", - ylim = c(-1, 1), - xlab = "time", - ylab = "log-ratio expression") -rect( 0, -2, 15, 2, col = "#dfeaf4", border = NA) # setA -rect( 55, -2, 75, 2, col = "#dfeaf4", border = NA) # setA -rect( 25, -2, 45, 2, col = "#f4dfdf", border = NA) # setB -rect( 85, -2, 105, 2, col = "#f4dfdf", border = NA) # setB -abline(h = 0, col = "#00000055") - -for (i in 1:10) { - thisID <- myTable$ID[i] - points(seq(0, 120, by = 10), Biobase::exprs(GSE3635)[thisID, ], type = "b") -} - -# Our guess that we might discover interesting genes by selecting groups A and B -# like we did was not bad. But limma knows nothing about the biology and though -# the expression profiles look good, there is no guarantee that these are the -# most biologically relevant genes. Significantly different in expression -# according to the groups we define is not necessarily the same as a cyclically -# varying gene, nor does it necessarily find the genes whose expression levels -# are _most_ different, i.e. if the variance of a highly, differentially -# expressed gene within a group is large, it may not be very significant. Also, -# we are not exploiting the fact that these values are time series. -# Nevertheless, we find genes for which we see a change in expression levels -# along two cell-cycles. - -# Let's superimpose some "real" cell-cycle genes: -myControls <- c("Cdc14", "Mbp1", "Swi6", "Swi4", "Whi5", "Cln1", "Cln2", "Cln3") -for (name in toupper(myControls)) { - thisID <- SGD_features$sysName[which(SGD_features$name == name)] - points(seq(0, 120, by=10), - Biobase::exprs(GSE3635)[thisID, ], - type="b", - col="#AA0000") -} - -# Indeed, the discovered gene profiles look much "cleaner" than the real cycle -# genes and this just means that differential expression in the way that we -# have performed it is an approximation to the biology. - -# == 5.1 Final task: Gene descriptions ===================================== - -#TASK> Print the descriptions of the top ten differentially expressed genes -#TASK> and comment on what they have in common (or not). - - -# = 6 Improving on Discovery by Differential Expression =================== - - -# There are many ways to improve on purely statistical methods, if we have -# better ideas about the biology. I would just like to demonstrate one -# possibility here: calculate correlation values to a sample gene - such as Cln2 -# for which we know that it is involved in the cell cycle. Let's plot it first: - -gName <- "CLN2" -(iFeature <- which(SGD_features$name == gName)) -(iExprs <- which(featureNames(GSE3635) == SGD_features$sysName[iFeature])) -Cln2Profile <- Biobase::exprs(GSE3635)[iExprs, ] -plot(seq(0, 120, by = 10), - Cln2Profile, - ylim = c(-1, 1), - main = paste("Expression profile for", gName), - xlab = "time (min)", - ylab = "expression", - type = "b", - pch = 16, - cex = 1.5, - lwd = 2, - col= "#40b886") -abline(h = 0, col = "#0000FF55") -abline(v = 60, col = "#0000FF55") - -# Set up a vector of correlation values - - -myCorrelations <- numeric(nrow(Biobase::exprs(GSE3635))) -names(myCorrelations) <- Biobase::featureNames(GSE3635) -for (i in 1:length(myCorrelations)) { - myCorrelations[i] <- cor(Cln2Profile, Biobase::exprs(GSE3635)[i, ]) -} - -nTOP <- 20 -myTopC <- order(myCorrelations, decreasing = TRUE)[1:nTOP] - -# Number 1 -(ID <- Biobase::featureNames(GSE3635)[myTopC[1]]) - -# Get information -SGD_features[which(SGD_features$sysName == ID), ] -# Of course: the highest correlation is Cln1 itself. This is our positive -# control for the experiment. - -# Let's plot the rest -myPal <- colorRampPalette(c("#82f58d", "#E0F2E2", "#f6f6f6")) - -for (i in 2:nTOP) { - ID <- Biobase::featureNames(GSE3635)[myTopC[i]] - points(seq(0, 120, by = 10), - Biobase::exprs(GSE3635)[ID, ], - type = "b", - cex = 0.8, - col= myPal(nTOP)[i]) - print(SGD_features[which(SGD_features$sysName == ID), - c("name", "description")]) -} - -# Note that all of these genes are highly correlated with a known cell cycle -# gene, but because the absolute values of expression differences are not very -# large for some of them, they might not be picked up by any algorithm that is -# focussed on large differential expression changes. Do small relative changes -# mean small biological effects? Certainly not! - -# And we haven't even looked at the anticorrelated genes yet... -nBOT <- nTOP -myBottomC <- order(myCorrelations, decreasing = FALSE)[1:nBOT] # bottom ten -myPal <- colorRampPalette(c("#ba112a", "#E3C8CC", "#ebebeb")) - -for (i in 1:nBOT) { - ID <- Biobase::featureNames(GSE3635)[myBottomC[i]] - points(seq(0, 120, by = 10), - Biobase::exprs(GSE3635)[ID, ], - type = "b", - cex = 0.8, - col= myPal(nBOT)[i]) - print(SGD_features[which(SGD_features$sysName == ID), - c("name", "description")]) -} -# ... which are very interesting in their own right. - -# What I hope you appreciate from this example is: -# - convenient general purpose methods exist that analyze expression data -# with sophisticated statistical methods; -# - the results of these methods depend on whether the statistics model -# the biology well; -# - you will draw Cargo Cult conclusions if you can't cast your biology -# of interest in terms of a model, "canned" solutions are unlikely -# to give you all the answers you need; -# - being able to write your own code gives you the freedom to experiment -# and explore. There is a learning curve - but the payoffs are -# significant. - -# = 7 Annotation data ===================================================== -# -# Loading feature data "by hand" as we've done above, is usually not necessary -# since GEO provides rich annotations in the GPL platform files, which are -# associated with its Gene Expression Sets files. In the code above, -# we used getGEO("GSE3635", GSEMatrix = TRUE, getGPL = FALSE), and the GPL -# annotations were not loaded. We could use getGPL = TRUE instead ... - -GSE3635annot <- GEOquery::getGEO("GSE3635", GSEMatrix = TRUE, getGPL = TRUE) -GSE3635annot <- GSE3635annot[[1]] - -# ... and the feature data is then available in the GSE3635@featureData@data -# slot: -str(GSE3635annot@featureData@data) -GSE3635annot@featureData@data[ 1:20 , ] - -# ... from where you can access the columns you need, e.g. spotIDs and gene -# symbols: - -myAnnot <- GSE3635annot@featureData@data[ , c("SPOT_ID", "Gene")] -str(myAnnot) - -# ... Note that this is a data frame and it is easy to find things we -# might be looking for ... -myAnnot[which(myAnnot$Gene == "MBP1"), ] - -# ... or identify rows that might give us trouble, such as probes that -# hybridize to more than one gene. - - -# Alternatively, we could have identified the GPL file for this set: -GSE3635@annotation # "GPL1914" - -# ... and downloaded it directly from NCBI: -GPL1914 <- GEOquery::getGEO("GPL1914") -str(GPL1914) - -# ... from which we can get the data - which is however NOT necessarily -# matched to the rows of our expression dataset. - - -# [END] +# tocID <- "RPR-GEO2R.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR_GEO2R unit. +# +# +# ============================================================================== +# Version: 1.3 +# +# Date: 2017-09 - 2020-09 +# Author: Boris Steipe +# +# Versions: +# 1.3 use saveRDS()/readRDS() rather than save()/load() +# 1.2 Change from require() to requireNamespace(), +# use ::() idiom throughout, +# use Biocmanager:: not biocLite() +# 1.1 Add section on GPL annotations +# 1.0 Updates for BCH441 2017 +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# TO SUBMIT FOR CREDIT.... +# +# Note: to submit tasks for credit for this unit, report on the sections +# that have "Task ..." section headers, and report on the lines that are +# identified with #TASK> comments. +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------------------------------------------- +#TOC> 1 Preparations 62 +#TOC> 2 Loading a GEO Dataset 89 +#TOC> 2.1 Task - understanding the data 155 +#TOC> 3 Column wise analysis - time points 164 +#TOC> 3.1 Task - Comparison of experiments 193 +#TOC> 3.2 Grouped Samples 226 +#TOC> 4 Row-wise Analysis: Expression Profiles 261 +#TOC> 4.1 Task - Read a table of features 296 +#TOC> 4.2 Selected Expression profiles 349 +#TOC> 5 Differential Expression 392 +#TOC> 5.1 Final task: Gene descriptions 532 +#TOC> 6 Improving on Discovery by Differential Expression 538 +#TOC> 7 Annotation data 633 +#TOC> +#TOC> ========================================================================== + + +# = 1 Preparations ======================================================== + +# To load and analyze GEO datasets we use a number of Bioconductor packages: + + +if (! requireNamespace("BiocManager", quietly = TRUE)) { + install.packages("BiocManager") +} + +if (! requireNamespace("Biobase", quietly = TRUE)) { + BiocManager::install("Biobase") +} +# Package information: +# library(help = Biobase) # basic information +# browseVignettes("Biobase") # available vignettes +# data(package = "Biobase") # available datasets + + +if (! requireNamespace("GEOquery", quietly = TRUE)) { + BiocManager::install("GEOquery") +} +# Package information: +# library(help = GEOquery) # basic information +# browseVignettes("GEOquery") # available vignettes +# data(package = "GEOquery") # available datasets + + +# = 2 Loading a GEO Dataset =============================================== + +# The R code below is adapted from the GEO2R scripts produced by GEO for GSE3635 +# for the experiment conducted in the BIN-EXPR-GEO unit + +# Version info: R 3.2.3, Biobase 2.30.0, GEOquery 2.40.0, limma 3.26.8 +# R scripts generated Wed Jan 11 17:39:46 EST 2017 + + +# Load series and platform data from GEO. The GEO server is a bit flakey and +# I have experienced outages over several hours. If the command below does +# not work for you, skip ahead to the fallback procedure. + +GSE3635 <- GEOquery::getGEO("GSE3635", GSEMatrix =TRUE, getGPL=FALSE) +# Note: GEO2R scripts call the expression data set +# "gset" throughout ... in this script I give +# it the name "GSE3635" for clarity. + +# Subset, if the data contains multiple experiments with different platforms +# since we should not be mixing data from different platforms. (That's +# unfortunately very hard to do correctly). The "platform" is the type of chip +# that was used, and what I selected online when this script was produced, so +# GEO2R knows about the correct platform ID. Technically, subsetting to just one +# platform is not necessary here because we _know_ that GSE3635 contains only +# data produced with the GPL1914 platform. But that's the way GEO2R scripts are +# setup be default since they have to be able to handle a variety of cases. +if (length(GSE3635) > 1) { + idx <- grep("GPL1914", attr(GSE3635, "names")) +} else { + idx <- 1 +} + +GSE3635 <- GSE3635[[idx]] + +# FALLBACK +# ... in case the GEO server is not working, load the "GSE3635" object from +# the data directory: +# +# GSE3635 <- readRDS(file="./data/GSE3635.rds") + + +# Checkpoint ... +if (! exists("GSE3635")) { + stop("PANIC: GSE3635 was not loaded. Can't continue.") +} + + +# GSE3635 is an "Expression Set" - cf. +# https://bioconductor.org/packages/release/bioc/vignettes/Biobase/inst/doc/ExpressionSetIntroduction.pdf + +# What does this contain? +help("ExpressionSet-class") + +# Print it +GSE3635 + +# Access contents via methods: +Biobase::featureNames(GSE3635)[1:20] # Rows. What are these features? +Biobase::sampleNames(GSE3635)[1:10] # Columns. What are these columns? + +# Access contents by subsetting: +( tmp <- GSE3635[12:17, 1:6] ) + +# Access data +Biobase::exprs(tmp) # exprs() gives us the actual expression values. + +# == 2.1 Task - understanding the data ===================================== + +#TASK> What are the data values: +#TASK> ... in each cell? +#TASK> ... in each column? +#TASK> ... in each row? + + + +# = 3 Column wise analysis - time points ================================== + +# Get an overview of the distribution of values in individual columns +summary(Biobase::exprs(GSE3635)[ , 1]) +summary(Biobase::exprs(GSE3635)[ , 4]) +summary(Biobase::exprs(GSE3635)[ , 7]) + +# This allows us to com pare the columns, comment on the quality of the data, +# and get a sense for the distribution. We need to know how exactly these +# numbers were produced: obviously, if we don't know how those numbers were +# created in the first place, we would produce a major sin of Cargo Cult +# bioinformatics if we would analyze them. + + + +# compare them in a a boxplot +cyclicPalette <- colorRampPalette(c("#14b4c9", + "#d2d1e6", + "#e66594", + "#d2d1e6", + "#14b4c9", + "#d2d1e6", + "#e66594", + "#d2d1e6", + "#14b4c9")) +tCols <- cyclicPalette(13) +boxplot(Biobase::exprs(GSE3635), col = tCols) + + +# == 3.1 Task - Comparison of experiments ================================== +#TASK> Study this boxplot. What's going on? Are these expression values? +#TASK> What do the numbers mean? (Summarize the process and computation +#TASK> that has gone i to the preprocessing. You need to understand why +#TASK> these columns all have the same mean and range.) Given what common +#TASK> sense tells you about the variability of experiments, do you +#TASK> believe your understanding is complete? + + +# Lets plot the distributions of values in a more fine-grained manner: +hT0 <- hist(Biobase::exprs(GSE3635)[ , 1], breaks = 100, col = tCols[1]) +hT3 <- hist(Biobase::exprs(GSE3635)[ , 4], breaks = 100, col = tCols[4]) +hT6 <- hist(Biobase::exprs(GSE3635)[ , 7], breaks = 100, col = tCols[7]) +hT9 <- hist(Biobase::exprs(GSE3635)[ , 10], breaks = 100, col = tCols[10]) +hT12 <- hist(Biobase::exprs(GSE3635)[ , 13], breaks = 100, col = tCols[13]) + + +plot( hT0$mids, hT0$counts, type = "l", col = tCols[1], xlim = c(-0.5, 0.5)) +points(hT3$mids, hT3$counts, type = "l", col = tCols[4]) +points(hT6$mids, hT6$counts, type = "l", col = tCols[7]) +points(hT9$mids, hT9$counts, type = "l", col = tCols[10]) +points(hT12$mids, hT12$counts, type = "l", col = tCols[13]) +legend("topright", + legend = c("hT0", "hT3", "hT6", "hT9", "hT12"), + col = tCols[c(1, 4, 7, 10, 13)], + lwd = 1) + + +#TASK> Study this plot. What does it tell you? Is there systematic, global +#TASK> change in the values over time? Within a cycle? Over the course of the +#TASK> experiment? + + +# == 3.2 Grouped Samples =================================================== + +# This is the GEO2R code that produces the histogram you saw on the NCBI +# Website if you went through the BIN-EXPR-GEO unit. + +# Group names for all samples in a series +gsms <- "0123450123450" # Each digit identifies one of the 13 columns +sml <- c() +for (i in 1:nchar(gsms)) { + sml[i] <- substr(gsms,i,i) +} +sml <- paste("G", sml, sep="") # set group names + +# order samples by group +ex <- Biobase::exprs(GSE3635)[ , order(sml)] +sml <- sml[order(sml)] +fl <- as.factor(sml) +labels <- c("t0","t10","t20","t30","t40","t50") # these are the labels we + # assigned in the BIN-EXPR-GEO + # unit + +# Set parameters and draw the plot. I changed this from the original GEO2R +# code which overwrote the global palette(). That's evil! Utility code +# should _never_ mess with global parameters! +GEOcols <- c("#dfeaf4", "#f4dfdf", "#f2cb98", "#dcdaa5", + "#dff4e4", "#f4dff4", "#AABBCC") +dev.new(width = 4 + dim(GSE3635)[[2]] / 5, height = 6) # plot into a new window +par(mar = c(2 + round(max(nchar(Biobase::sampleNames(GSE3635))) / 2), 4, 2, 1)) +title <- paste ("GSE3635", '/', Biobase::annotation(GSE3635), + " grouped samples", sep ='') +boxplot(ex, boxwex = 0.6, notch = TRUE, main = title, outline=FALSE, + las = 2, col = GEOcols[fl]) +legend("topleft", labels, fill = GEOcols, bty = "n") + + +# = 4 Row-wise Analysis: Expression Profiles ============================== + +# What we did above was column-wise analysis and it gave us an idea about how +# our experiments relate to each other. To analyze individual genes, we need to +# do row-wise analyis. + +#TASK> Try to answer the following questions: +#TASK> Are all rows genes? +#TASK> What identifiers are being used? +# (cf. https://sites.google.com/view/yeastgenome-help/community-help/nomenclature-conventions) +#TASK> Are all rows/genes unique? +#TASK> Are all yeast genes accounted for? + +# These are crucially important questions but you can't answer the last +# question because you have no information other than the gene identifiers. +# However, any biological interpretation relies absolutely on understanding +# the semantics of the data. Merely manipulating abstract identifiers and +# numbers, that would surely be Cargo Cult bioinformatics. + +# To answer these questions about the data semantics, I have provided the +# file "SGD_features.tab" in the data directory of this project. I have +# downloaded it from SGD +# (http://www.yeastgenome.org/download-data/curation), for a description of +# its contents see here: +file.show("./data/SGD_features.README.txt") +# Note: the file as downloaded from SGD actually crashed RStudio due to an +# unbalanced quotation mark which caused R to try and read the whole +# of the subsequent file into a single string. This was caused by an +# alias gene name (B"). I have removed this abomination +# by editing the file. The version in the ./data directory can be +# read without issues. + +# Leets peek into the file: +readLines("./data/SGD_features.tab", n = 5) + +# == 4.1 Task - Read a table of features =================================== + +# Note: this task asks you to write code. You MUST identify your +# sources when you draw on other's examples. + +# This data file is rather typical of datasets that you will encounter "in the +# wild". To proceed, you need to write code to read it into an R-object. Develop +# the code in your script file according to the following specification: +# +# - read "./data/SGD_features.tab" into a data frame +# called "SGD_features" +# - remove unneeded columns - keep the following data columns: +# - Primary SGDID +# - Feature type +# - Feature qualifier +# - Feature name - (the systematic name !) +# - Standard gene name +# - Description +# - give the data frame meaningful column names: +# colnames(SGD_features) <- c("SGDID", +# "type", +# "qual", +# "sysName", +# "name", +# "description") +# +# - remove all rows that don't have a systematic name. (You'll have to check +# what's in cells that don't have a systematic name) +# - check that the systematic names are unique (Hint: use the duplicated() +# function.) +# - assign the systematic names as row names +# - confirm: are all rows of the expression data set represented in +# the feature table? Hint: use setdiff() to print all that +# are not. +# Example usage of setdiff(): +# A <- c("duck", "crow", "gull", "tern") +# B <- c("gull", "rook", "tern", "kite", "myna") +# +# setdiff(A, B) # [1] "duck" "crow" +# setdiff(B, A) # [1] "rook" "kite" "myna" + +# If some of the features in the expression set are not listed in the +# systematic names, you have to be aware of that, when you try to get +# more information on them. I presume they are missing because revisions +# of the yeast genome after these experiments were done showed that these +# genes did not actually exist. + +# - confirm: how many / which genes in the feature table do not +# have expression data? + +# How should we handle rows/columns that are missing or not unique? + + +# == 4.2 Selected Expression profiles ====================================== + +# The code below assumes that you have read ./data/SGD_features.tab and assigned +# the resulting data frame to SGD_features, with columns as specified above. + +# Here is an expression profile for Mbp1. + +gName <- "MBP1" +(iFeature <- which(SGD_features$name == gName)) +(iExprs <- which(featureNames(GSE3635) == SGD_features$sysName[iFeature])) +plot(seq(0, 120, by = 10), + Biobase::exprs(GSE3635)[iExprs, ], + main = paste("Expression profile for", gName), + xlab = "time (min)", + ylab = "expression", + type = "b", + col= "maroon") +abline(h = 0, col = "#00000055") +abline(v = 60, col = "#00000055") + +# Print the description +SGD_features$description[iFeature] + +# Here is a list of gene names that may be involved in the cell cycle switch, +# and some genes that are controls (cf. BIN-SYS-Concepts): + +# Turning it on +# Cdc14, Mbp1, Swi6, Swi4, Whi5, Cdc28, Cln1, Cln2, Cln3 + +# Turning it off +# Rad53, Cdc28, Clb1, Clb2, Clb6, Nrm1 + +# Housekeeping genes +# Act1, and Alg9 + +#TASK> Plot expression profiles for these genes and study them. What do you +#TASK> expect the profiles to look like, given the role of these genes? What +#TASK> do you find? (Hint: you will make your life much easier if you define +#TASK> a function that plots and prints descriptions with a gene name as input. +#TASK> Also: are the gene names in the feature table upper case, or lower case? +#TASK> Also: note that the absolute values of change are quite different. +#TASK> Also: note that some values may be outliers i.e. failed experiments.) + +# = 5 Differential Expression ============================================= + +# GEO2R discovers the top differentially expressed expressed genes by +# using functions in the Bioconductor limma package. + +if (! requireNamespace("limma", quietly = TRUE)) { + BiocManager::install("limma") +} +# Package information: +# library(help = limma) # basic information +# browseVignettes("limma") # available vignettes +# data(package = "limma") # available datasets + +# The GEO2R limma code is virtually uncommented, and has not been written for +# clarity, but for being easily produced by a code-generator that is triggered +# by the parameters on the GEO Web-site. Most of it is actually dispensable for +# our purposes. + +# In principle, the code goes through three steps: +# 1. Prepare the data +# 2. Define groups that are to be contrasted to define "Differential" +# 3. Find genes whose expression levels are significantly different across +# the groups +# 4. Format results. + +# Biobase is a highly engineered package that is tightly integrated into +# the Bioconductor world - unfortunately that brings with it a somewhat +# undesirable level of computational overhead and dependencies. Using the +# package as we normally do - i.e. calling required functions with their +# explicit package prefix is therefore not advisable. There are generics +# that won't be propery dispatched. If you only need a small number of +# functions for a very specific context, you will probably get away with +# Biobase::() - but even in the demonstration code of this script +# not everything works out of the box. We'll therefore load the library, +# but we'll (redundantly) use the prefix anyway so as to emphasize where +# the functions come from. + +library(Biobase) + +# We are recapitulating the experiment in which we assigned the 0, 10, 60 and +# 70 minute samples to one group, the 30, 40, 90 and 100 minute samples to +# another group, and calculated differential expression values between these +# two groups. + +setA <- c(1, 2, 7, 8) # columns for set A +setB <- c(4, 5, 10, 11) # columns for set B + +# We remove columns we don't need, and for simplicity put the experiments for +# group A in the first four columns, and the group B in the next four. + +mySet <- GSE3635[ , c(setA, setB)] + +# limma needs the column descriptions as factors +mySet$description <- as.factor(c(rep("A", 4), rep("B", 4))) + +# Next we build the "design Matrix" for the statistical test: +myDesign <- model.matrix(~ description + 0, mySet) +colnames(myDesign) <- levels(mySet$description) +myDesign + +# Now we can calculate the fit of all rows to a linear model that depends +# on the two groups as specified in the design: +myFit <- limma::lmFit(mySet, myDesign) + +# Next we calculate the contrasts, given the fit ... +myCont.matrix <- limma::makeContrasts(A - B, levels = myDesign) +myFit2 <- limma::contrasts.fit(myFit, myCont.matrix) + +# ... compute appropriate probabilites from a modified t-test +# (empirical Bayes) ... +myFit2 <- limma::eBayes(myFit2, 0.01) + +# ... add the gene names to the fit - object ... +myFit2$genes <- featureNames(mySet) + +# ... and pick the top N differentially expressed genes while controlling +# for multiple testing with a False Discovery Rate (fdr) correction. GEO2R +# gave us only the top 250 genes, but we might as well do 1000, just so we +# can be reasonable sure that our gens of interest are included. +N <- 1000 +myTable <- limma::topTable(myFit2, + adjust.method = "fdr", + sort.by = "B", + number = N) + +str(myTable) +# The gene names are now in the $ID column + +# These are the top 10 +write.table(myTable[1:10 , c("ID","P.Value","B")], + file = stdout(), + row.names = FALSE, + sep="\t") + +# Let's see what we got: let's plot the full expression profiles (all 13 +# columns) for the top ten genes from exprs(GSE3635). + +plot(seq(0, 120, by = 10), + rep(0, 13), + type = "n", + ylim = c(-1, 1), + xlab = "time", + ylab = "log-ratio expression") +rect( 0, -2, 15, 2, col = "#dfeaf4", border = NA) # setA +rect( 55, -2, 75, 2, col = "#dfeaf4", border = NA) # setA +rect( 25, -2, 45, 2, col = "#f4dfdf", border = NA) # setB +rect( 85, -2, 105, 2, col = "#f4dfdf", border = NA) # setB +abline(h = 0, col = "#00000055") + +for (i in 1:10) { + thisID <- myTable$ID[i] + points(seq(0, 120, by = 10), Biobase::exprs(GSE3635)[thisID, ], type = "b") +} + +# Our guess that we might discover interesting genes by selecting groups A and B +# like we did was not bad. But limma knows nothing about the biology and though +# the expression profiles look good, there is no guarantee that these are the +# most biologically relevant genes. Significantly different in expression +# according to the groups we define is not necessarily the same as a cyclically +# varying gene, nor does it necessarily find the genes whose expression levels +# are _most_ different, i.e. if the variance of a highly, differentially +# expressed gene within a group is large, it may not be very significant. Also, +# we are not exploiting the fact that these values are time series. +# Nevertheless, we find genes for which we see a change in expression levels +# along two cell-cycles. + +# Let's superimpose some "real" cell-cycle genes: +myControls <- c("Cdc14", "Mbp1", "Swi6", "Swi4", "Whi5", "Cln1", "Cln2", "Cln3") +for (name in toupper(myControls)) { + thisID <- SGD_features$sysName[which(SGD_features$name == name)] + points(seq(0, 120, by=10), + Biobase::exprs(GSE3635)[thisID, ], + type="b", + col="#AA0000") +} + +# Indeed, the discovered gene profiles look much "cleaner" than the real cycle +# genes and this just means that differential expression in the way that we +# have performed it is an approximation to the biology. + +# == 5.1 Final task: Gene descriptions ===================================== + +#TASK> Print the descriptions of the top ten differentially expressed genes +#TASK> and comment on what they have in common (or not). + + +# = 6 Improving on Discovery by Differential Expression =================== + + +# There are many ways to improve on purely statistical methods, if we have +# better ideas about the biology. I would just like to demonstrate one +# possibility here: calculate correlation values to a sample gene - such as Cln2 +# for which we know that it is involved in the cell cycle. Let's plot it first: + +gName <- "CLN2" +(iFeature <- which(SGD_features$name == gName)) +(iExprs <- which(featureNames(GSE3635) == SGD_features$sysName[iFeature])) +Cln2Profile <- Biobase::exprs(GSE3635)[iExprs, ] +plot(seq(0, 120, by = 10), + Cln2Profile, + ylim = c(-1, 1), + main = paste("Expression profile for", gName), + xlab = "time (min)", + ylab = "expression", + type = "b", + pch = 16, + cex = 1.5, + lwd = 2, + col= "#40b886") +abline(h = 0, col = "#0000FF55") +abline(v = 60, col = "#0000FF55") + +# Set up a vector of correlation values + + +myCorrelations <- numeric(nrow(Biobase::exprs(GSE3635))) +names(myCorrelations) <- Biobase::featureNames(GSE3635) +for (i in 1:length(myCorrelations)) { + myCorrelations[i] <- cor(Cln2Profile, Biobase::exprs(GSE3635)[i, ]) +} + +nTOP <- 20 +myTopC <- order(myCorrelations, decreasing = TRUE)[1:nTOP] + +# Number 1 +(ID <- Biobase::featureNames(GSE3635)[myTopC[1]]) + +# Get information +SGD_features[which(SGD_features$sysName == ID), ] +# Of course: the highest correlation is Cln1 itself. This is our positive +# control for the experiment. + +# Let's plot the rest +myPal <- colorRampPalette(c("#82f58d", "#E0F2E2", "#f6f6f6")) + +for (i in 2:nTOP) { + ID <- Biobase::featureNames(GSE3635)[myTopC[i]] + points(seq(0, 120, by = 10), + Biobase::exprs(GSE3635)[ID, ], + type = "b", + cex = 0.8, + col= myPal(nTOP)[i]) + print(SGD_features[which(SGD_features$sysName == ID), + c("name", "description")]) +} + +# Note that all of these genes are highly correlated with a known cell cycle +# gene, but because the absolute values of expression differences are not very +# large for some of them, they might not be picked up by any algorithm that is +# focussed on large differential expression changes. Do small relative changes +# mean small biological effects? Certainly not! + +# And we haven't even looked at the anticorrelated genes yet... +nBOT <- nTOP +myBottomC <- order(myCorrelations, decreasing = FALSE)[1:nBOT] # bottom ten +myPal <- colorRampPalette(c("#ba112a", "#E3C8CC", "#ebebeb")) + +for (i in 1:nBOT) { + ID <- Biobase::featureNames(GSE3635)[myBottomC[i]] + points(seq(0, 120, by = 10), + Biobase::exprs(GSE3635)[ID, ], + type = "b", + cex = 0.8, + col= myPal(nBOT)[i]) + print(SGD_features[which(SGD_features$sysName == ID), + c("name", "description")]) +} +# ... which are very interesting in their own right. + +# What I hope you appreciate from this example is: +# - convenient general purpose methods exist that analyze expression data +# with sophisticated statistical methods; +# - the results of these methods depend on whether the statistics model +# the biology well; +# - you will draw Cargo Cult conclusions if you can't cast your biology +# of interest in terms of a model, "canned" solutions are unlikely +# to give you all the answers you need; +# - being able to write your own code gives you the freedom to experiment +# and explore. There is a learning curve - but the payoffs are +# significant. + +# = 7 Annotation data ===================================================== +# +# Loading feature data "by hand" as we've done above, is usually not necessary +# since GEO provides rich annotations in the GPL platform files, which are +# associated with its Gene Expression Sets files. In the code above, +# we used getGEO("GSE3635", GSEMatrix = TRUE, getGPL = FALSE), and the GPL +# annotations were not loaded. We could use getGPL = TRUE instead ... + +GSE3635annot <- GEOquery::getGEO("GSE3635", GSEMatrix = TRUE, getGPL = TRUE) +GSE3635annot <- GSE3635annot[[1]] + +# ... and the feature data is then available in the GSE3635@featureData@data +# slot: +str(GSE3635annot@featureData@data) +GSE3635annot@featureData@data[ 1:20 , ] + +# ... from where you can access the columns you need, e.g. spotIDs and gene +# symbols: + +myAnnot <- GSE3635annot@featureData@data[ , c("SPOT_ID", "Gene")] +str(myAnnot) + +# ... Note that this is a data frame and it is easy to find things we +# might be looking for ... +myAnnot[which(myAnnot$Gene == "MBP1"), ] + +# ... or identify rows that might give us trouble, such as probes that +# hybridize to more than one gene. + + +# Alternatively, we could have identified the GPL file for this set: +GSE3635@annotation # "GPL1914" + +# ... and downloaded it directly from NCBI: +GPL1914 <- GEOquery::getGEO("GPL1914") +str(GPL1914) + +# ... from which we can get the data - which is however NOT necessarily +# matched to the rows of our expression dataset. + + +# [END] diff --git a/RPR-Genetic_code_optimality.R b/RPR-Genetic_code_optimality.R index ef8f865..0bd5293 100644 --- a/RPR-Genetic_code_optimality.R +++ b/RPR-Genetic_code_optimality.R @@ -1,385 +1,385 @@ -# tocID <- "RPR-Genetic_code_optimality.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Genetic_code_optimality unit. -# -# Version: 1.3 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.3 2020 Maintenance -# 1.2 Change from require() to requireNamespace(), -# use ::() idiom throughout, -# use Biocmanager:: not biocLite() -# 1.1 Update set.seed() usage -# 1.0.1 Fixed two bugs discovered by Suan Chin Yeo. -# 1.0 New material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------------------------------- -#TOC> 1 Designing a computational experiment 58 -#TOC> 2 Setting up the tools 74 -#TOC> 2.1 Natural and alternative genetic codes 77 -#TOC> 2.2 Effect of mutations 135 -#TOC> 2.2.1 reverse-translate 146 -#TOC> 2.2.2 Randomly mutate 171 -#TOC> 2.2.3 Forward- translate 196 -#TOC> 2.2.4 measure effect 213 -#TOC> 3 Run the experiment 267 -#TOC> 4 Task solutions 363 -#TOC> -#TOC> ========================================================================== - - -# This unit demonstrates R code to simulate alternate genetic codes and evaluate -# their robsustness to code changes. The approaches are quite simple and you -# will be able to come up with obvious refinements; the point of this code is to -# demonstrate some R programming techniques, in preparation for more -# sophisticated questions later. - - -# = 1 Designing a computational experiment ================================ - -# Computational experiments are conducted like wet-lab experiments. We begin -# with a hypothesis, then define the observables that relate to the hypothesis, -# then define the measures we apply to observations, and finally we interpret -# our observations. If we want to learn something about the evolution of the -# genetic code ... - -# - we construct a hypothesis such as: the genetic code has evolved so as to -# minimize the effect of mutations; -# - we define the observables: the effect of mutations in -# sequences, given the natural and possible alternative codes; -# - we define the measures to quantify the effect of mutations; -# - then we compute alternatives and interpret the results. - - -# = 2 Setting up the tools ================================================ - - -# == 2.1 Natural and alternative genetic codes ============================= - -# Load genetic code tables from the Biostrings package -if (! requireNamespace("BiocManager", quietly = TRUE)) { - install.packages("BiocManager") -} -if (! requireNamespace("Biostrings", quietly = TRUE)) { - BiocManager::install("Biostrings") -} -# Package information: -# library(help = Biostrings) # basic information -# browseVignettes("Biostrings") # available vignettes -# data(package = "Biostrings") # available datasets - - -# There are many ways to generate alternative codes. The simplest way is to -# randomly assign amino acids to codons. A more sophisticated way is to keep the -# redundancy of codons intact, since it may reflect some form of symmetry -# breaking that ignores the third nucleotide of a codon for the most part; -# therefore we only replace the amino acids of the existing code with random -# others. Here are two functions that implement these two ideas about alternate -# codes. - -randomGC <- function(GC) { - # Return a genetic code with randomly assigned amino acids. - # Parameters: - # GC named chr length-64 character vector of 20 amino acid one-letter - # codes plus "*" (stop), named with the codon triplet. - # Value: named chr same vector with random amino acid assignments in which - # every amino acid and "*" is encoded at least once. - - aa <- unique(GC) # the amino acids in the input code - GC[1:64] <- sample(aa, 64, replace = TRUE) # random code - while(length(unique(GC)) < length(aa)) { # We could end up with a code that - # does not contain all amino acids, - # then we sample() again. - GC[1:64] <- sample(aa, 64, replace = TRUE) - } - return(GC) -} - -swappedGC <- function(GC) { - # Return a genetic code with randomly swapped amino acids. - # Parameters: - # GC named chr length-64 character vector of 20 amino acid one-letter - # codes plus "*" (stop), named with the codon triplet. - # Value: named chr same vector with random amino acid assignments where the - # amino acids have been swapped. - - aaOrig <- unique(GC) # the amino acids in the input code - aaSwap <- sample(aaOrig, length(aaOrig)) # shuffled - names(aaSwap) <- aaOrig # name them after the original - GC[1:64] <- aaSwap[GC] # replace original with shuffled - - return(GC) -} - - -# == 2.2 Effect of mutations =============================================== - - -# To evaluate the effects of mutations we will do the following: -# - we take an amino acid sequence (Mbp1 will do just nicely); -# - we reverse-translate it into a nucleotide sequence; -# - we mutate it randomly; -# - we translate it back to amino acids; -# - we count the number of mutations and evaluate their severity. - - -# === 2.2.1 reverse-translate - -# To reverse-translate an amino acid vector, we randomly pick one of its -# codons from a genetic code, and assemble all codons to a sequence. - -traRev <- function(s, GC) { - # Parameters: - # s chr a sequence vector - # GC chr a genetic code - # Value: - # A reverse-translated vector of codons - vC <- character(length(s)) - - for (i in seq_along(s)) { - codon <- names(GC)[GC == s[i]] # get all codons for this AA - if (length(codon) > 1) { # if there's more than one ... - codon <- sample(codon, 1) # pick one at random ... - } - vC[i] <- codon # store it - } - - return(vC) -} - - -# === 2.2.2 Randomly mutate - -# To mutate, we split a codon into it's three nucleotides, then randomly replace -# one of the three with another nucleotide. - -randMut <- function(vC) { - # Parameter: - # vC chr a vector of codons - # Value: chr a vector of codons with a single point mutation from vC - - nuc <- c("A", "C", "G", "T") - - for (i in seq_along(vC)) { - triplet <- unlist(strsplit(vC[i], "")) # split into three nucl. - iNuc <- sample(1:3, 1) # choose one of the three - mutNuc <- sample(nuc[nuc != triplet[iNuc]], 1) # chose a mutated nucleotide - triplet[iNuc] <- mutNuc # replace the original - vC[i] <- paste0(triplet, collapse = "") # collapse it to a codon - } - return(vC) - -} - - - -# === 2.2.3 Forward- translate - -traFor <- function(vC, GC) { - # Parameters: - # vC chr a codon vector - # GC chr a genetic code - # Value: - # A vector of amino acids - vAA <- character(length(vC)) - - for (i in seq_along(vC)) { - vAA[i] <- GC[vC[i]] # translate and store - } - return(vAA) -} - - -# === 2.2.4 measure effect - -# How do we evaluate the effect of the mutation? We'll take a simple ad hoc -# approach: we divide amino acids into hydrophobic, hydrophilic, and neutral -# categories, according to their free energy of transfer from water to octanol: -aaHphobic <- c("M", "I", "L", "C", "W", "Y", "F") -aaHphilic <- c("E", "D", "Q", "N", "P", "K", "R") -aaNeutral <- c("A", "H", "T", "S", "V", "G") - -# Then we will penalize as follows: -# Changes within one category: 0.1 -# Changes from hydrophobic or hydrophilic to neutral or back: 0.3 -# Changes from hydrophobic to hydrophilic or back: 1.0 -# Changes to stop-codon: 3.0 - -evalMut <- function(nat, mut) { - # Evaluate severity of mutations between amino acid sequence vectors nat and - # mut in an ad hoc approach based on hydrophobicity changes. - aaHphobic <- c("M", "I", "L", "C", "W", "Y", "F") - aaHphilic <- c("E", "D", "Q", "N", "P", "K", "R") - aaNeutral <- c("A", "H", "T", "S", "V", "G") - - penalties <- numeric(length(nat)) - lMut <- nat != mut # logical TRUE for all mutated positions - - penalties[lMut & (nat %in% aaHphobic) & (mut %in% aaHphobic)] <- 0.1 - penalties[lMut & (nat %in% aaHphobic) & (mut %in% aaHphilic)] <- 1.0 - penalties[lMut & (nat %in% aaHphobic) & (mut %in% aaNeutral)] <- 0.3 - - penalties[lMut & (nat %in% aaHphilic) & (mut %in% aaHphobic)] <- 1.0 - penalties[lMut & (nat %in% aaHphilic) & (mut %in% aaHphilic)] <- 0.1 - penalties[lMut & (nat %in% aaHphilic) & (mut %in% aaNeutral)] <- 0.3 - - penalties[lMut & (nat %in% aaNeutral) & (mut %in% aaHphobic)] <- 0.3 - penalties[lMut & (nat %in% aaNeutral) & (mut %in% aaHphilic)] <- 0.3 - penalties[lMut & (nat %in% aaNeutral) & (mut %in% aaNeutral)] <- 0.1 - - return(sum(penalties)) -} - -# A more sophisticated approach could take additional quantities into account, -# such as charge, size, or flexibility - and it could add heuristics, such as: -# proline is always bad in secondary structure, charged amino acids are terrible -# in the folded core of a protein, replacing a small by a large amino acid in -# the core is very disruptive ... etc. -# -# For our experiment, we should not use a mutation data matrix however: -# empirical mutation probabilities are superbly suited to estimate evolutionary -# relationships. Here however, as we are trying to evaluate effects of random -# mutations on genetic codes, our reasoning would be circular - we would -# discover that the natural genetic code is optimal ... because it is most -# similar to the natural genetic code. That would be Cargo Cult bioinformatics. - - -# = 3 Run the experiment ================================================== - -# Fetch the standard Genetic code from Biostrings:: - -stdCode <- Biostrings::GENETIC_CODE - -# Fetch the nucleotide sequence for MBP1: - -myDNA <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa")[-1] -myDNA <- paste0(myDNA, collapse = "") -myDNA <- as.character(Biostrings::codons(Biostrings::DNAString(myDNA))) -myDNA <- myDNA[-length(myDNA)] # drop the stop codon - -myAA <- traFor(myDNA, stdCode) - -# Mutate and evaluate -set.seed(112358) -x <- randMut(myDNA) -set.seed(NULL) -x <- traFor(x, stdCode) -evalMut(myAA, x) # 166.4 - -# Try this 200 times, and see how the values are distributed. -N <- 200 -valSTDC <- numeric(N) - -set.seed(112358) # set RNG seed for repeatable randomness -for (i in 1:N) { # this takes a few seconds ... - x <- randMut(myDNA) # mutate - x <- traFor(x, stdCode) # translate - valSTDC[i] <- evalMut(myAA, x) # evaluate -} -set.seed(NULL) # reset the RNG - -hist(valSTDC, - breaks = 15, - col = "palegoldenrod", - xlim = c(0, 400), - ylim = c(0, N/4), - main = "Standard vs. Synthetic Genetic Code", - xlab = "Mutation penalty") - -# This looks like a normal distribution. Let's assume the effect of mutations -# under the standard genetic code is the mean of this distribution: -effectSTDC <- mean(valSTDC) # 178.1 - -# Now we can look at the effects of alternate genetic codes: - -set.seed(112358) -# choose a new code -GC <- randomGC(stdCode) -set.seed(NULL) - -# reverse translate hypothetical sequence according to the new code -x <- traRev(myAA, GC) - -x <- randMut(x) # randomly mutate hypothetical nucleotide sequence -x <- traFor(x, GC) # translate back, with the new code -evalMut(myAA, x) # evaluate mutation effects: 298.5 - -# That seems a fair bit higher than what we saw as "effectUGC" -# Let's try with different genetic codes. 200 trials - but this time every trial -# is with a different, synthetic genetic code. - -N <- 200 -valXGC <- numeric(N) - -set.seed(1414214) # set RNG seed for repeatable randomness -for (i in 1:N) { - GC <- randomGC(stdCode) # Choose code - x <- traRev(myAA, GC) # reverse translate - x <- randMut(x) # mutate - x <- traFor(x, GC) # translate - valXGC[i] <- evalMut(myAA, x) # evaluate -} -set.seed(NULL) # reset the RNG - -hist(valXGC, - col = "plum", - breaks = 15, - add = TRUE) - -# These two distributions are very widely separated! - -# Task: Perform the same experiment with the swapped genetic code. -# Compare the distributions. Interpret the result. - - -# These are simple experiments, under assumptions that can be refined in -# meaningful ways. Yet, even those simple computational experiments show -# that the Universal Genetic Code has features that one would predict if -# it has evolved under selective pressure to minimize the effects of mutations. -# Gradual change under mutation is benificial to evolution, disruptive -# change is not. - - -# = 4 Task solutions ====================================================== - -N <- 200 -valSGC <- numeric(N) - -set.seed(2718282) # set RNG seed for repeatable randomness -for (i in 1:N) { - GC <- swappedGC(stdCode) # Choose code - x <- traRev(myAA, GC) # reverse translate - x <- randMut(x) # mutate - x <- traFor(x, GC) # translate - valSGC[i] <- evalMut(myAA, x) # evaluate -} -set.seed(NULL) # reset the RNG - -hist(valSGC, - col = "#6688FF88", - breaks = 15, - add = TRUE) - - - -# [END] +# tocID <- "RPR-Genetic_code_optimality.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Genetic_code_optimality unit. +# +# Version: 1.3 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.3 2020 Maintenance +# 1.2 Change from require() to requireNamespace(), +# use ::() idiom throughout, +# use Biocmanager:: not biocLite() +# 1.1 Update set.seed() usage +# 1.0.1 Fixed two bugs discovered by Suan Chin Yeo. +# 1.0 New material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------------------------------- +#TOC> 1 Designing a computational experiment 58 +#TOC> 2 Setting up the tools 74 +#TOC> 2.1 Natural and alternative genetic codes 77 +#TOC> 2.2 Effect of mutations 135 +#TOC> 2.2.1 reverse-translate 146 +#TOC> 2.2.2 Randomly mutate 171 +#TOC> 2.2.3 Forward- translate 196 +#TOC> 2.2.4 measure effect 213 +#TOC> 3 Run the experiment 267 +#TOC> 4 Task solutions 363 +#TOC> +#TOC> ========================================================================== + + +# This unit demonstrates R code to simulate alternate genetic codes and evaluate +# their robsustness to code changes. The approaches are quite simple and you +# will be able to come up with obvious refinements; the point of this code is to +# demonstrate some R programming techniques, in preparation for more +# sophisticated questions later. + + +# = 1 Designing a computational experiment ================================ + +# Computational experiments are conducted like wet-lab experiments. We begin +# with a hypothesis, then define the observables that relate to the hypothesis, +# then define the measures we apply to observations, and finally we interpret +# our observations. If we want to learn something about the evolution of the +# genetic code ... + +# - we construct a hypothesis such as: the genetic code has evolved so as to +# minimize the effect of mutations; +# - we define the observables: the effect of mutations in +# sequences, given the natural and possible alternative codes; +# - we define the measures to quantify the effect of mutations; +# - then we compute alternatives and interpret the results. + + +# = 2 Setting up the tools ================================================ + + +# == 2.1 Natural and alternative genetic codes ============================= + +# Load genetic code tables from the Biostrings package +if (! requireNamespace("BiocManager", quietly = TRUE)) { + install.packages("BiocManager") +} +if (! requireNamespace("Biostrings", quietly = TRUE)) { + BiocManager::install("Biostrings") +} +# Package information: +# library(help = Biostrings) # basic information +# browseVignettes("Biostrings") # available vignettes +# data(package = "Biostrings") # available datasets + + +# There are many ways to generate alternative codes. The simplest way is to +# randomly assign amino acids to codons. A more sophisticated way is to keep the +# redundancy of codons intact, since it may reflect some form of symmetry +# breaking that ignores the third nucleotide of a codon for the most part; +# therefore we only replace the amino acids of the existing code with random +# others. Here are two functions that implement these two ideas about alternate +# codes. + +randomGC <- function(GC) { + # Return a genetic code with randomly assigned amino acids. + # Parameters: + # GC named chr length-64 character vector of 20 amino acid one-letter + # codes plus "*" (stop), named with the codon triplet. + # Value: named chr same vector with random amino acid assignments in which + # every amino acid and "*" is encoded at least once. + + aa <- unique(GC) # the amino acids in the input code + GC[1:64] <- sample(aa, 64, replace = TRUE) # random code + while(length(unique(GC)) < length(aa)) { # We could end up with a code that + # does not contain all amino acids, + # then we sample() again. + GC[1:64] <- sample(aa, 64, replace = TRUE) + } + return(GC) +} + +swappedGC <- function(GC) { + # Return a genetic code with randomly swapped amino acids. + # Parameters: + # GC named chr length-64 character vector of 20 amino acid one-letter + # codes plus "*" (stop), named with the codon triplet. + # Value: named chr same vector with random amino acid assignments where the + # amino acids have been swapped. + + aaOrig <- unique(GC) # the amino acids in the input code + aaSwap <- sample(aaOrig, length(aaOrig)) # shuffled + names(aaSwap) <- aaOrig # name them after the original + GC[1:64] <- aaSwap[GC] # replace original with shuffled + + return(GC) +} + + +# == 2.2 Effect of mutations =============================================== + + +# To evaluate the effects of mutations we will do the following: +# - we take an amino acid sequence (Mbp1 will do just nicely); +# - we reverse-translate it into a nucleotide sequence; +# - we mutate it randomly; +# - we translate it back to amino acids; +# - we count the number of mutations and evaluate their severity. + + +# === 2.2.1 reverse-translate + +# To reverse-translate an amino acid vector, we randomly pick one of its +# codons from a genetic code, and assemble all codons to a sequence. + +traRev <- function(s, GC) { + # Parameters: + # s chr a sequence vector + # GC chr a genetic code + # Value: + # A reverse-translated vector of codons + vC <- character(length(s)) + + for (i in seq_along(s)) { + codon <- names(GC)[GC == s[i]] # get all codons for this AA + if (length(codon) > 1) { # if there's more than one ... + codon <- sample(codon, 1) # pick one at random ... + } + vC[i] <- codon # store it + } + + return(vC) +} + + +# === 2.2.2 Randomly mutate + +# To mutate, we split a codon into it's three nucleotides, then randomly replace +# one of the three with another nucleotide. + +randMut <- function(vC) { + # Parameter: + # vC chr a vector of codons + # Value: chr a vector of codons with a single point mutation from vC + + nuc <- c("A", "C", "G", "T") + + for (i in seq_along(vC)) { + triplet <- unlist(strsplit(vC[i], "")) # split into three nucl. + iNuc <- sample(1:3, 1) # choose one of the three + mutNuc <- sample(nuc[nuc != triplet[iNuc]], 1) # chose a mutated nucleotide + triplet[iNuc] <- mutNuc # replace the original + vC[i] <- paste0(triplet, collapse = "") # collapse it to a codon + } + return(vC) + +} + + + +# === 2.2.3 Forward- translate + +traFor <- function(vC, GC) { + # Parameters: + # vC chr a codon vector + # GC chr a genetic code + # Value: + # A vector of amino acids + vAA <- character(length(vC)) + + for (i in seq_along(vC)) { + vAA[i] <- GC[vC[i]] # translate and store + } + return(vAA) +} + + +# === 2.2.4 measure effect + +# How do we evaluate the effect of the mutation? We'll take a simple ad hoc +# approach: we divide amino acids into hydrophobic, hydrophilic, and neutral +# categories, according to their free energy of transfer from water to octanol: +aaHphobic <- c("M", "I", "L", "C", "W", "Y", "F") +aaHphilic <- c("E", "D", "Q", "N", "P", "K", "R") +aaNeutral <- c("A", "H", "T", "S", "V", "G") + +# Then we will penalize as follows: +# Changes within one category: 0.1 +# Changes from hydrophobic or hydrophilic to neutral or back: 0.3 +# Changes from hydrophobic to hydrophilic or back: 1.0 +# Changes to stop-codon: 3.0 + +evalMut <- function(nat, mut) { + # Evaluate severity of mutations between amino acid sequence vectors nat and + # mut in an ad hoc approach based on hydrophobicity changes. + aaHphobic <- c("M", "I", "L", "C", "W", "Y", "F") + aaHphilic <- c("E", "D", "Q", "N", "P", "K", "R") + aaNeutral <- c("A", "H", "T", "S", "V", "G") + + penalties <- numeric(length(nat)) + lMut <- nat != mut # logical TRUE for all mutated positions + + penalties[lMut & (nat %in% aaHphobic) & (mut %in% aaHphobic)] <- 0.1 + penalties[lMut & (nat %in% aaHphobic) & (mut %in% aaHphilic)] <- 1.0 + penalties[lMut & (nat %in% aaHphobic) & (mut %in% aaNeutral)] <- 0.3 + + penalties[lMut & (nat %in% aaHphilic) & (mut %in% aaHphobic)] <- 1.0 + penalties[lMut & (nat %in% aaHphilic) & (mut %in% aaHphilic)] <- 0.1 + penalties[lMut & (nat %in% aaHphilic) & (mut %in% aaNeutral)] <- 0.3 + + penalties[lMut & (nat %in% aaNeutral) & (mut %in% aaHphobic)] <- 0.3 + penalties[lMut & (nat %in% aaNeutral) & (mut %in% aaHphilic)] <- 0.3 + penalties[lMut & (nat %in% aaNeutral) & (mut %in% aaNeutral)] <- 0.1 + + return(sum(penalties)) +} + +# A more sophisticated approach could take additional quantities into account, +# such as charge, size, or flexibility - and it could add heuristics, such as: +# proline is always bad in secondary structure, charged amino acids are terrible +# in the folded core of a protein, replacing a small by a large amino acid in +# the core is very disruptive ... etc. +# +# For our experiment, we should not use a mutation data matrix however: +# empirical mutation probabilities are superbly suited to estimate evolutionary +# relationships. Here however, as we are trying to evaluate effects of random +# mutations on genetic codes, our reasoning would be circular - we would +# discover that the natural genetic code is optimal ... because it is most +# similar to the natural genetic code. That would be Cargo Cult bioinformatics. + + +# = 3 Run the experiment ================================================== + +# Fetch the standard Genetic code from Biostrings:: + +stdCode <- Biostrings::GENETIC_CODE + +# Fetch the nucleotide sequence for MBP1: + +myDNA <- readLines("./data/S288C_YDL056W_MBP1_coding.fsa")[-1] +myDNA <- paste0(myDNA, collapse = "") +myDNA <- as.character(Biostrings::codons(Biostrings::DNAString(myDNA))) +myDNA <- myDNA[-length(myDNA)] # drop the stop codon + +myAA <- traFor(myDNA, stdCode) + +# Mutate and evaluate +set.seed(112358) +x <- randMut(myDNA) +set.seed(NULL) +x <- traFor(x, stdCode) +evalMut(myAA, x) # 166.4 + +# Try this 200 times, and see how the values are distributed. +N <- 200 +valSTDC <- numeric(N) + +set.seed(112358) # set RNG seed for repeatable randomness +for (i in 1:N) { # this takes a few seconds ... + x <- randMut(myDNA) # mutate + x <- traFor(x, stdCode) # translate + valSTDC[i] <- evalMut(myAA, x) # evaluate +} +set.seed(NULL) # reset the RNG + +hist(valSTDC, + breaks = 15, + col = "palegoldenrod", + xlim = c(0, 400), + ylim = c(0, N/4), + main = "Standard vs. Synthetic Genetic Code", + xlab = "Mutation penalty") + +# This looks like a normal distribution. Let's assume the effect of mutations +# under the standard genetic code is the mean of this distribution: +effectSTDC <- mean(valSTDC) # 178.1 + +# Now we can look at the effects of alternate genetic codes: + +set.seed(112358) +# choose a new code +GC <- randomGC(stdCode) +set.seed(NULL) + +# reverse translate hypothetical sequence according to the new code +x <- traRev(myAA, GC) + +x <- randMut(x) # randomly mutate hypothetical nucleotide sequence +x <- traFor(x, GC) # translate back, with the new code +evalMut(myAA, x) # evaluate mutation effects: 298.5 + +# That seems a fair bit higher than what we saw as "effectUGC" +# Let's try with different genetic codes. 200 trials - but this time every trial +# is with a different, synthetic genetic code. + +N <- 200 +valXGC <- numeric(N) + +set.seed(1414214) # set RNG seed for repeatable randomness +for (i in 1:N) { + GC <- randomGC(stdCode) # Choose code + x <- traRev(myAA, GC) # reverse translate + x <- randMut(x) # mutate + x <- traFor(x, GC) # translate + valXGC[i] <- evalMut(myAA, x) # evaluate +} +set.seed(NULL) # reset the RNG + +hist(valXGC, + col = "plum", + breaks = 15, + add = TRUE) + +# These two distributions are very widely separated! + +# Task: Perform the same experiment with the swapped genetic code. +# Compare the distributions. Interpret the result. + + +# These are simple experiments, under assumptions that can be refined in +# meaningful ways. Yet, even those simple computational experiments show +# that the Universal Genetic Code has features that one would predict if +# it has evolved under selective pressure to minimize the effects of mutations. +# Gradual change under mutation is benificial to evolution, disruptive +# change is not. + + +# = 4 Task solutions ====================================================== + +N <- 200 +valSGC <- numeric(N) + +set.seed(2718282) # set RNG seed for repeatable randomness +for (i in 1:N) { + GC <- swappedGC(stdCode) # Choose code + x <- traRev(myAA, GC) # reverse translate + x <- randMut(x) # mutate + x <- traFor(x, GC) # translate + valSGC[i] <- evalMut(myAA, x) # evaluate +} +set.seed(NULL) # reset the RNG + +hist(valSGC, + col = "#6688FF88", + breaks = 15, + add = TRUE) + + + +# [END] diff --git a/RPR-Introduction.R b/RPR-Introduction.R index 1bedc58..e50b04b 100644 --- a/RPR-Introduction.R +++ b/RPR-Introduction.R @@ -1,50 +1,50 @@ -# tocID <- "RPR-Introduction.R" -# -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Introduction unit -# -# Version: 1.0 -# -# Date: 2020-09-18 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# V 1.0 Updtaed workflow; live -# V 0.1 First code -# -# TODO: -# -# -# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== -# -# DO NOT SIMPLY source() THESE FILES! - -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - -# === TASK: Local script -# -# - Open the file myScript.R -# -# - Create a section header with a date. -# - Enter an R-expression that will produce the first 11 powers of 2 (starting -# from 0). Not a loop - a single expression. The first number you get must -# be 1. The last number you get must be 1024. -# -# - Save the file in the myScripts folder, and close it. -# -# - Open the file again, select the expression and type Cmd+Enter (or Cmd+R) -# to execute it. -# -# - Done - -# (This task is meant to make sure that writing R expressions, saving -# them in scripts, opening script files and executing code in the file works -# for you. If there is an issue, get in touch.) - - - -# [END] +# tocID <- "RPR-Introduction.R" +# +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Introduction unit +# +# Version: 1.0 +# +# Date: 2020-09-18 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# V 1.0 Updtaed workflow; live +# V 0.1 First code +# +# TODO: +# +# +# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== +# +# DO NOT SIMPLY source() THESE FILES! + +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + +# === TASK: Local script +# +# - Open the file myScript.R +# +# - Create a section header with a date. +# - Enter an R-expression that will produce the first 11 powers of 2 (starting +# from 0). Not a loop - a single expression. The first number you get must +# be 1. The last number you get must be 1024. +# +# - Save the file in the myScripts folder, and close it. +# +# - Open the file again, select the expression and type Cmd+Enter (or Cmd+R) +# to execute it. +# +# - Done + +# (This task is meant to make sure that writing R expressions, saving +# them in scripts, opening script files and executing code in the file works +# for you. If there is an issue, get in touch.) + + + +# [END] diff --git a/RPR-PROSITE_POST.R b/RPR-PROSITE_POST.R index 1736a3d..5ca7758 100644 --- a/RPR-PROSITE_POST.R +++ b/RPR-PROSITE_POST.R @@ -1,168 +1,168 @@ -# tocID <- "RPR-PROSITE_POST.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Scripting_data_downloads unit. -# -# Version: 1.2 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Maintenance -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout, -# 1.0.1 Updates for slightly changed interfaces -# 1.0 First ABC units version -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> --------------------------------------------------------------------- -#TOC> 1 Constructing a POST command from a Web query 43 -#TOC> 1.1 Task - fetchPrositeFeatures() function 148 -#TOC> 2 Task solutions 156 -#TOC> -#TOC> ========================================================================== - - -# = 1 Constructing a POST command from a Web query ======================== - - -if (! requireNamespace("httr", quietly = TRUE)) { - install.packages("httr") -} -# Package information: -# library(help = httr) # basic information -# browseVignettes("httr") # available vignettes -# data(package = "httr") # available datasets - - - - -# We have reverse engineered the Web form for a ScanProsite request, and can -# construct a valid POST request from knowing the required field names. The POST -# command is similar to GET(), but we need an explicit request body that -# contains a list of key/value pairs - -UniProtID <- "P39678" - -URL <- "https://prosite.expasy.org/cgi-bin/prosite/PSScan.cgi" - -response <- httr::POST(URL, - body = list(meta = "opt1", - meta1_protein = "opt1", - seq = UniProtID, - skip = "on", - output = "tabular")) - -# Send off this request, and you should have a response in a few -# seconds. Let's check the status first: - -httr::status_code(response) # If this is not 200, something went wrong and it - # makes no sense to continue. If this persists, ask - # on the Discussion Board what to do. - - -# The text contents of the response is available with the -# content() function: -httr::content(response, "text") - -# ... should show you the same as the page contents that you have seen in the -# browser. Now we need to extract the data from the page. For this simple -# example we can get away with using regular expressions, but in general we need -# a real XML parser to parse HTML. We'll cover that in a later unit. Here, we -# strsplit() the response into individual lines, since each of our data elements -# is on its own line, and then capture the contents. The way Prosite has -# formatted their HTML we can simply split on the "\\n" newline character - but -# they could write the same valid HTML without any newline-characters at all. -# Understand that we are working with a bit of a "hack" here: exploting -# empirical assumptions rather than a formal specification. But sometimes quick -# and dirty is fine, because quick. - -lines <- unlist(strsplit(httr::content(response, "text"), "\\n")) -head(lines) - -# Now we define a query pattern for the lines we want: -# we can use the uID, bracketed by two "|" pipe -# characters: - -patt <- sprintf("\\|%s\\|", UniProtID) - -# ... and select only the lines that match this -# pattern: - -( lines <- lines[grep(patt, lines)] ) - -# ... captures the three lines of output. - -# Now we break the lines apart into tokens: this is another application of -# strsplit(), but this time we split either on "pipe" characters, "|" OR on tabs -# "\t". Look at the regex "\\t|\\|" in the strsplit() call: - -unlist(strsplit(lines[1], "\\t|\\|")) - -# Its parts are (\\t)=tab (|)=or (\\|)=pipe. Both "t" and "|" need to be escaped -# with a backslash. "t" has to be escaped because we want to match a tab (\t), -# not the literal character "t". And "|" has to be escaped because we mean the -# literal pipe character, not its metacharacter meaning OR. Thus sometimes the -# backslash turns a special meaning off, and sometimes it turns a special -# meaning on. Unfortunately there's no easy way to tell - you just need to -# remember the characters - or have a reference handy. The metacharacters are -# (){}[]^$?*+.|&- ... and some of them have different meanings depending on -# where in the regex they are. - -# Let's put the tokens into named slots of a data frame - -features <- data.frame() -for (line in lines) { - tokens <- unlist(strsplit(line, "\\t|\\|")) - features <- rbind(features, - data.frame(uID = tokens[2], - start = as.numeric(tokens[4]), - end = as.numeric(tokens[5]), - psID = tokens[6], - psName = tokens[7], - psSeq = tokens[11])) -} -features - -# This forms the base of a function that collects the features automatically -# from a PrositeScan result. You can write this! - - -# == 1.1 Task - fetchPrositeFeatures() function ============================ - - -# Task: write a function that takes as input a UniProt ID, fetches the -# features it contains from ScanProsite and returns a data frame as given above, or -# an empty data frame if there is an error. - - -# = 2 Task solutions ====================================================== - - -# I have placed such a function into the ABC-dbUtilities.R script: look it up by -# clicking on dbFetchPrositeFeatures() in the Environment pane. - -# Test: -dbFetchPrositeFeatures("Q5KMQ9") - - - - -# [END] +# tocID <- "RPR-PROSITE_POST.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Scripting_data_downloads unit. +# +# Version: 1.2 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Maintenance +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout, +# 1.0.1 Updates for slightly changed interfaces +# 1.0 First ABC units version +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> --------------------------------------------------------------------- +#TOC> 1 Constructing a POST command from a Web query 43 +#TOC> 1.1 Task - fetchPrositeFeatures() function 148 +#TOC> 2 Task solutions 156 +#TOC> +#TOC> ========================================================================== + + +# = 1 Constructing a POST command from a Web query ======================== + + +if (! requireNamespace("httr", quietly = TRUE)) { + install.packages("httr") +} +# Package information: +# library(help = httr) # basic information +# browseVignettes("httr") # available vignettes +# data(package = "httr") # available datasets + + + + +# We have reverse engineered the Web form for a ScanProsite request, and can +# construct a valid POST request from knowing the required field names. The POST +# command is similar to GET(), but we need an explicit request body that +# contains a list of key/value pairs + +UniProtID <- "P39678" + +URL <- "https://prosite.expasy.org/cgi-bin/prosite/PSScan.cgi" + +response <- httr::POST(URL, + body = list(meta = "opt1", + meta1_protein = "opt1", + seq = UniProtID, + skip = "on", + output = "tabular")) + +# Send off this request, and you should have a response in a few +# seconds. Let's check the status first: + +httr::status_code(response) # If this is not 200, something went wrong and it + # makes no sense to continue. If this persists, ask + # on the Discussion Board what to do. + + +# The text contents of the response is available with the +# content() function: +httr::content(response, "text") + +# ... should show you the same as the page contents that you have seen in the +# browser. Now we need to extract the data from the page. For this simple +# example we can get away with using regular expressions, but in general we need +# a real XML parser to parse HTML. We'll cover that in a later unit. Here, we +# strsplit() the response into individual lines, since each of our data elements +# is on its own line, and then capture the contents. The way Prosite has +# formatted their HTML we can simply split on the "\\n" newline character - but +# they could write the same valid HTML without any newline-characters at all. +# Understand that we are working with a bit of a "hack" here: exploting +# empirical assumptions rather than a formal specification. But sometimes quick +# and dirty is fine, because quick. + +lines <- unlist(strsplit(httr::content(response, "text"), "\\n")) +head(lines) + +# Now we define a query pattern for the lines we want: +# we can use the uID, bracketed by two "|" pipe +# characters: + +patt <- sprintf("\\|%s\\|", UniProtID) + +# ... and select only the lines that match this +# pattern: + +( lines <- lines[grep(patt, lines)] ) + +# ... captures the three lines of output. + +# Now we break the lines apart into tokens: this is another application of +# strsplit(), but this time we split either on "pipe" characters, "|" OR on tabs +# "\t". Look at the regex "\\t|\\|" in the strsplit() call: + +unlist(strsplit(lines[1], "\\t|\\|")) + +# Its parts are (\\t)=tab (|)=or (\\|)=pipe. Both "t" and "|" need to be escaped +# with a backslash. "t" has to be escaped because we want to match a tab (\t), +# not the literal character "t". And "|" has to be escaped because we mean the +# literal pipe character, not its metacharacter meaning OR. Thus sometimes the +# backslash turns a special meaning off, and sometimes it turns a special +# meaning on. Unfortunately there's no easy way to tell - you just need to +# remember the characters - or have a reference handy. The metacharacters are +# (){}[]^$?*+.|&- ... and some of them have different meanings depending on +# where in the regex they are. + +# Let's put the tokens into named slots of a data frame + +features <- data.frame() +for (line in lines) { + tokens <- unlist(strsplit(line, "\\t|\\|")) + features <- rbind(features, + data.frame(uID = tokens[2], + start = as.numeric(tokens[4]), + end = as.numeric(tokens[5]), + psID = tokens[6], + psName = tokens[7], + psSeq = tokens[11])) +} +features + +# This forms the base of a function that collects the features automatically +# from a PrositeScan result. You can write this! + + +# == 1.1 Task - fetchPrositeFeatures() function ============================ + + +# Task: write a function that takes as input a UniProt ID, fetches the +# features it contains from ScanProsite and returns a data frame as given above, or +# an empty data frame if there is an error. + + +# = 2 Task solutions ====================================================== + + +# I have placed such a function into the ABC-dbUtilities.R script: look it up by +# clicking on dbFetchPrositeFeatures() in the Environment pane. + +# Test: +dbFetchPrositeFeatures("Q5KMQ9") + + + + +# [END] diff --git a/RPR-Pipe.R b/RPR-Pipe.R index 517da92..41936d1 100644 --- a/RPR-Pipe.R +++ b/RPR-Pipe.R @@ -1,135 +1,135 @@ -# tocID <- "RPR-Pipe.R" -# -# Purpose: A Bioinformatics Course: -# Discussing pipe operators. -# -# Version: 1.0 -# -# Date: 2021 10 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.0 New code -# -# -# TODO: -# - find more interesting examples -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------ -#TOC> 1 Pipe Concept 41 -#TOC> 2 Nested Expression 73 -#TOC> 3 magrittr:: Pipe 78 -#TOC> 4 Base R Pipe 93 -#TOC> 5 Intermediate Assignment 108 -#TOC> 6 Postscript 127 -#TOC> -#TOC> ========================================================================== - - -# = 1 Pipe Concept ======================================================= - -# Pipes are actually an awesome idea for any code that implements a workflow - -# a sequence of operations, each of which transforms data in a specialized way. -# -# This principle is familiar from maths: chained functions. If have a function -# y = f(x) and want to use those results as in z = g(y), I can just write -# z = g(f(x)) -# -# On the unix command line, pipes were used from the very beginning, implemented -# with the "|" pipe character. -# -# In R, the magrittr package provided the %>% operator, and recently the |> -# operator has been introduced into base R. -# -# However there are alternatives: intermediate assignment, and nested functions -# that have always existed in base R anyway. -# -# Let us look at an example. In writing this, I found out that virtually -# ALL non-trivial examples I came up with don't translate well into this idiom -# at all. It is actually quite limited to simple filtering operations on -# data. A more interesting example might be added in the future, let me know if -# you have a good idea. -# -# A somewhat contrived example is to sort a list of files by the -# length of the file names: - -myFiles <- list.files(pattern = "\\.R$") - -# nchar() gives the number of characters in a string, order() produces indices -# that map an array to its sorted form. -# -# = 2 Nested Expression =================================================== - -myFiles[order(nchar(myFiles))] - - -# = 3 magrittr:: Pipe ===================================================== - -if (! requireNamespace("magrittr", quietly = TRUE)) { - install.packages("magrittr") -} -# Package information: -# library(help = magrittr) # basic information -# browseVignettes("magrittr") # available vignettes -# data(package = "magrittr") # available datasets - - -library(magrittr) - -myFiles %>% nchar %>% order %>% myFiles[.] - -# = 4 Base R Pipe ========================================================= - -# Since version 4.1, base R now supports a pipe operator without the need -# to load a special package. Such an introductions of external functionality -# into the language is very rare. -# -# Unfortunately it won't (yet) work with the '[' function, so we need to write -# an intermediate function for this example -extract <- function(x, v) { - return(v[x]) -} - -myFiles |> nchar() |> order() |> extract(myFiles) - - -# = 5 Intermediate Assignment ============================================= - -# So what's the problem? As you can see, the piped code may be concise and -# expressive. But there is also a large amount of implicit assignment and -# processing going on and that is usually a bad idea because it makes code hard -# to maintain. I am NOT a big fan of the nested syntax, but I don't think that -# replacing it with the pipe makes things much better. My preferred idiom is -# to use intermediate assignments. Only then is it convenient to examine -# the code step by step and validate every single step. And that is the most -# important objective at all: no code is good if it does not compute -# correctly. - - -x <- nchar(myFiles) -x <- order(x) -myFiles[x] - - - -# = 6 Postscript ========================================================== - -# I tried to write an example that strips all comments from a list of files, and -# another example that finds all files that were not yet updated this year -# (according to the "# Date: in the header). Neither examples can be well -# written without intermediate assignments, or at least sapply() functions -# that are not simpler at all than the intermediate assignment. - -# [END] +# tocID <- "RPR-Pipe.R" +# +# Purpose: A Bioinformatics Course: +# Discussing pipe operators. +# +# Version: 1.0 +# +# Date: 2021 10 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.0 New code +# +# +# TODO: +# - find more interesting examples +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------ +#TOC> 1 Pipe Concept 41 +#TOC> 2 Nested Expression 73 +#TOC> 3 magrittr:: Pipe 78 +#TOC> 4 Base R Pipe 93 +#TOC> 5 Intermediate Assignment 108 +#TOC> 6 Postscript 127 +#TOC> +#TOC> ========================================================================== + + +# = 1 Pipe Concept ======================================================= + +# Pipes are actually an awesome idea for any code that implements a workflow - +# a sequence of operations, each of which transforms data in a specialized way. +# +# This principle is familiar from maths: chained functions. If have a function +# y = f(x) and want to use those results as in z = g(y), I can just write +# z = g(f(x)) +# +# On the unix command line, pipes were used from the very beginning, implemented +# with the "|" pipe character. +# +# In R, the magrittr package provided the %>% operator, and recently the |> +# operator has been introduced into base R. +# +# However there are alternatives: intermediate assignment, and nested functions +# that have always existed in base R anyway. +# +# Let us look at an example. In writing this, I found out that virtually +# ALL non-trivial examples I came up with don't translate well into this idiom +# at all. It is actually quite limited to simple filtering operations on +# data. A more interesting example might be added in the future, let me know if +# you have a good idea. +# +# A somewhat contrived example is to sort a list of files by the +# length of the file names: + +myFiles <- list.files(pattern = "\\.R$") + +# nchar() gives the number of characters in a string, order() produces indices +# that map an array to its sorted form. +# +# = 2 Nested Expression =================================================== + +myFiles[order(nchar(myFiles))] + + +# = 3 magrittr:: Pipe ===================================================== + +if (! requireNamespace("magrittr", quietly = TRUE)) { + install.packages("magrittr") +} +# Package information: +# library(help = magrittr) # basic information +# browseVignettes("magrittr") # available vignettes +# data(package = "magrittr") # available datasets + + +library(magrittr) + +myFiles %>% nchar %>% order %>% myFiles[.] + +# = 4 Base R Pipe ========================================================= + +# Since version 4.1, base R now supports a pipe operator without the need +# to load a special package. Such an introductions of external functionality +# into the language is very rare. +# +# Unfortunately it won't (yet) work with the '[' function, so we need to write +# an intermediate function for this example +extract <- function(x, v) { + return(v[x]) +} + +myFiles |> nchar() |> order() |> extract(myFiles) + + +# = 5 Intermediate Assignment ============================================= + +# So what's the problem? As you can see, the piped code may be concise and +# expressive. But there is also a large amount of implicit assignment and +# processing going on and that is usually a bad idea because it makes code hard +# to maintain. I am NOT a big fan of the nested syntax, but I don't think that +# replacing it with the pipe makes things much better. My preferred idiom is +# to use intermediate assignments. Only then is it convenient to examine +# the code step by step and validate every single step. And that is the most +# important objective at all: no code is good if it does not compute +# correctly. + + +x <- nchar(myFiles) +x <- order(x) +myFiles[x] + + + +# = 6 Postscript ========================================================== + +# I tried to write an example that strips all comments from a list of files, and +# another example that finds all files that were not yet updated this year +# (according to the "# Date: in the header). Neither examples can be well +# written without intermediate assignments, or at least sapply() functions +# that are not simpler at all than the intermediate assignment. + +# [END] diff --git a/RPR-RegEx.R b/RPR-RegEx.R index f9f8a5b..4e49fb0 100644 --- a/RPR-RegEx.R +++ b/RPR-RegEx.R @@ -1,180 +1,180 @@ -# tocID <- "RPR-RegEx.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-RegEx unit -# -# Version: 1.0 -# -# Date: 2017-08 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# V 0.1 Maintenance 2020 -# V 0.1 First code -# -# TODO: -# -# -# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== -# -# DO NOT SIMPLY source() THESE FILES! -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ---------------------------------------------------- -#TOC> 1 A regex example 41 -#TOC> 2 Counting lines 108 -#TOC> 2.1 Counting C-alpha atoms only 126 -#TOC> 3 Code Solutions 142 -#TOC> 3.1 Counting atoms 144 -#TOC> 3.2 Counting C-alpha records 160 -#TOC> -#TOC> ========================================================================== - - -# = 1 A regex example ===================================================== - -# The canonical FASTA version of yeast Mbp1 at Uniprot -s <- ">sp|P39678|MBP1_YEAST Transcription factor MBP1 OS=Saccharomyces cerevisiae (strain ATCC 204508 / S288c) GN=MBP1 PE=1 SV=1 -MSNQIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRILEKEVLK -ETHEKVQGGFGKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASPPPAPKHHHA -SKVDRKKAIRSASTSAIMETKRNNKKAEENQFQSSKILGNPTAAPRKRGRPVGSTRGSRR -KLGVNLQRSQSDMGFPRPAIPNSSISTTQLPSIRSTMGPQSPTLGILEEERHDSRQQQPQ -QNNSAQFKEIDLEDGLSSDVEPSQQLQQVFNQNTGFVPQQQSSLIQTQQTESMATSVSSS -PSLPTSPGDFADSNPFEERFPGGGTSPIISMIPRYPVTSRPQTSDINDKVNKYLSKLVDY -FISNEMKSNKSLPQVLLHPPPHSAPYIDAPIDPELHTAFHWACSMGNLPIAEALYEAGTS -IRSTNSQGQTPLMRSSLFHNSYTRRTFPRIFQLLHETVFDIDSQSQTVIHHIVKRKSTTP -SAVYYLDVVLSKIKDFSPQYRIELLLNTQDKNGDTALHIASKNGDVVFFNTLVKMGALTT -ISNKEGLTANEIMNQQYEQMMIQNGTNQHVNSSNTDLNIHVNTNNIETKNDVNSMVIMSP -VSPSDYITYPSQIATNISRNIPNVVNSMKQMASIYNDLHEQHDNEIKSLQKTLKSISKTK -IQVSLKTLEVLKESSKDENGEAQTNDDFEILSRLQEQNTKKLRKRLIRYKRLIKQKLEYR -QTVLLNKLIEDETQATTNNTVEKDNNTLERLELAQELTMLQLQRKNKLSSLVKKFEDNAK -IHKYRRIIREGTEMNIEEVDSSLDVILQTLIANNNKNKGAEQIITISNANSHA" - -nchar(s) -# Must be 969 - -# Task: Fetch the Uniprot ID by retrieving the first string that appears between -# two vertical bars ("pipes") in the header record. -# - -# Develop the regular expression: - # Just five characters returned, so we know we are using -patt <- "^>(.{5})" # the right functions -regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] - -patt <- "^>(.*)|" # everything to the pipe character -regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] - -# Ooops - "|" is a metacharacter - we must escape it - -patt <- "^>(.*)\|" # using "\|" -# Ooops - that's not how we escape: must double the \ to send a literal -# "\" plus the character "|" to the regex engine. - -patt <- "^>(.*)\\|" # using "\\|" -regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] - -# Good. Now let's first match everything that is not a "|", then match a "|" -patt <- "^>([^|]*)\\|" -regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] - -# the same thing again, but capture the second match. And insist that there -# must be at least one character captured - -patt <- "^>[^|]*\\|([^|]+)\\|" -# Analyze this pattern: -# ^ anchor the match at the beginning of the line -# > ">" must be the first character -# [^|]* all-characters-except-a-vertical-bar, 0 or more times because -# we don't know what other versions of the string "sp" -# might appear. Note that within the brackets "|" is NOT a -# metacharacter. -# \\| "|" character: ouside of square brackets "|" is a metacharacter -# and means "OR"; we need to escape it to match a literal "|". -# ( open parenthesis: capture what comes next ... -# [^|]+ all-characters-except-a-vertical-bar, 1 or more times -# ) close parenthesis: stop capturing here -# \\| second "|" character, escaped -regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] - - -# = 2 Counting lines ====================================================== - -# Task: Write a function that returns the number of atoms in a PDB file. Call it -# atomCount(). Sample data is here: -myPDB <- readLines("./data/0TST.pdb") - -# Specification: -# Read a file from its path given as the only argument. -# Return the number of lines in that file that begin with "ATOM " -# or with "HETATM". - -# Try this. Write a function. Solution code is at the end of this file. -# Don't peek. - -atomCount("./data/0TST.pdb") # must return 6 - - - -# == 2.1 Counting C-alpha atoms only ======================================= - -# Task: write a function based on the previous one that matches only CA records, -# i.e. it can be used to count the number of amino acids. Don't get -# fooled by calcium atoms, or the string CA appearing elsewhere. -# cf. https://www.wwpdb.org/documentation/file-format-content/format33/sect9.html#ATOM - -# Specification: -# Read a file from its path given as the only argument. -# Return the number of lines in that file that have a C-alpha atom. - -# Try this. Solution code is at the end of this file. Don't peek. - -CAcount("./data/0TST.pdb") # must return 1 - - -# = 3 Code Solutions ====================================================== - -# == 3.1 Counting atoms ==================================================== - -atomCount <- function(IN) { - # count the number of atoms in a PDB formatted file - # Parameters: - # IN chr path of the file to read - # Value: - # numeric number of lines that match "^ATOM " or "^HETATM" - # Note: the regex MUST be anchored to the beginning of the line, otherwise - # it might match somewhere in a comment! - x <- readLines(IN) - patt <- "(^ATOM )|(^HETATM)" - return(length(grep(patt, x))) -} - - -# == 3.2 Counting C-alpha records ========================================== - - -CAcount <- function(IN) { - # count the number of C-alpha atoms in a PDB formatted file - # Parameters: - # IN chr path of the file to read - # Value: - # numeric number of lines that match " CA " in position 13 - 16 of - # an ATOM record. - # Note: the regex MUST be aligned into the right position, otherwise it - # might match Calcium records! - x <- readLines(IN) - patt <- "^ATOM ...... CA " - return(length(grep(patt, x))) -} - - - -# [END] +# tocID <- "RPR-RegEx.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-RegEx unit +# +# Version: 1.0 +# +# Date: 2017-08 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# V 0.1 Maintenance 2020 +# V 0.1 First code +# +# TODO: +# +# +# == HOW TO WORK WITH LEARNING UNIT FILES ====================================== +# +# DO NOT SIMPLY source() THESE FILES! +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ---------------------------------------------------- +#TOC> 1 A regex example 41 +#TOC> 2 Counting lines 108 +#TOC> 2.1 Counting C-alpha atoms only 126 +#TOC> 3 Code Solutions 142 +#TOC> 3.1 Counting atoms 144 +#TOC> 3.2 Counting C-alpha records 160 +#TOC> +#TOC> ========================================================================== + + +# = 1 A regex example ===================================================== + +# The canonical FASTA version of yeast Mbp1 at Uniprot +s <- ">sp|P39678|MBP1_YEAST Transcription factor MBP1 OS=Saccharomyces cerevisiae (strain ATCC 204508 / S288c) GN=MBP1 PE=1 SV=1 +MSNQIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRILEKEVLK +ETHEKVQGGFGKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASPPPAPKHHHA +SKVDRKKAIRSASTSAIMETKRNNKKAEENQFQSSKILGNPTAAPRKRGRPVGSTRGSRR +KLGVNLQRSQSDMGFPRPAIPNSSISTTQLPSIRSTMGPQSPTLGILEEERHDSRQQQPQ +QNNSAQFKEIDLEDGLSSDVEPSQQLQQVFNQNTGFVPQQQSSLIQTQQTESMATSVSSS +PSLPTSPGDFADSNPFEERFPGGGTSPIISMIPRYPVTSRPQTSDINDKVNKYLSKLVDY +FISNEMKSNKSLPQVLLHPPPHSAPYIDAPIDPELHTAFHWACSMGNLPIAEALYEAGTS +IRSTNSQGQTPLMRSSLFHNSYTRRTFPRIFQLLHETVFDIDSQSQTVIHHIVKRKSTTP +SAVYYLDVVLSKIKDFSPQYRIELLLNTQDKNGDTALHIASKNGDVVFFNTLVKMGALTT +ISNKEGLTANEIMNQQYEQMMIQNGTNQHVNSSNTDLNIHVNTNNIETKNDVNSMVIMSP +VSPSDYITYPSQIATNISRNIPNVVNSMKQMASIYNDLHEQHDNEIKSLQKTLKSISKTK +IQVSLKTLEVLKESSKDENGEAQTNDDFEILSRLQEQNTKKLRKRLIRYKRLIKQKLEYR +QTVLLNKLIEDETQATTNNTVEKDNNTLERLELAQELTMLQLQRKNKLSSLVKKFEDNAK +IHKYRRIIREGTEMNIEEVDSSLDVILQTLIANNNKNKGAEQIITISNANSHA" + +nchar(s) +# Must be 969 + +# Task: Fetch the Uniprot ID by retrieving the first string that appears between +# two vertical bars ("pipes") in the header record. +# + +# Develop the regular expression: + # Just five characters returned, so we know we are using +patt <- "^>(.{5})" # the right functions +regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] + +patt <- "^>(.*)|" # everything to the pipe character +regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] + +# Ooops - "|" is a metacharacter - we must escape it + +patt <- "^>(.*)\|" # using "\|" +# Ooops - that's not how we escape: must double the \ to send a literal +# "\" plus the character "|" to the regex engine. + +patt <- "^>(.*)\\|" # using "\\|" +regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] + +# Good. Now let's first match everything that is not a "|", then match a "|" +patt <- "^>([^|]*)\\|" +regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] + +# the same thing again, but capture the second match. And insist that there +# must be at least one character captured + +patt <- "^>[^|]*\\|([^|]+)\\|" +# Analyze this pattern: +# ^ anchor the match at the beginning of the line +# > ">" must be the first character +# [^|]* all-characters-except-a-vertical-bar, 0 or more times because +# we don't know what other versions of the string "sp" +# might appear. Note that within the brackets "|" is NOT a +# metacharacter. +# \\| "|" character: ouside of square brackets "|" is a metacharacter +# and means "OR"; we need to escape it to match a literal "|". +# ( open parenthesis: capture what comes next ... +# [^|]+ all-characters-except-a-vertical-bar, 1 or more times +# ) close parenthesis: stop capturing here +# \\| second "|" character, escaped +regmatches(s, regexec(patt, s, perl = TRUE))[[1]][2] + + +# = 2 Counting lines ====================================================== + +# Task: Write a function that returns the number of atoms in a PDB file. Call it +# atomCount(). Sample data is here: +myPDB <- readLines("./data/0TST.pdb") + +# Specification: +# Read a file from its path given as the only argument. +# Return the number of lines in that file that begin with "ATOM " +# or with "HETATM". + +# Try this. Write a function. Solution code is at the end of this file. +# Don't peek. + +atomCount("./data/0TST.pdb") # must return 6 + + + +# == 2.1 Counting C-alpha atoms only ======================================= + +# Task: write a function based on the previous one that matches only CA records, +# i.e. it can be used to count the number of amino acids. Don't get +# fooled by calcium atoms, or the string CA appearing elsewhere. +# cf. https://www.wwpdb.org/documentation/file-format-content/format33/sect9.html#ATOM + +# Specification: +# Read a file from its path given as the only argument. +# Return the number of lines in that file that have a C-alpha atom. + +# Try this. Solution code is at the end of this file. Don't peek. + +CAcount("./data/0TST.pdb") # must return 1 + + +# = 3 Code Solutions ====================================================== + +# == 3.1 Counting atoms ==================================================== + +atomCount <- function(IN) { + # count the number of atoms in a PDB formatted file + # Parameters: + # IN chr path of the file to read + # Value: + # numeric number of lines that match "^ATOM " or "^HETATM" + # Note: the regex MUST be anchored to the beginning of the line, otherwise + # it might match somewhere in a comment! + x <- readLines(IN) + patt <- "(^ATOM )|(^HETATM)" + return(length(grep(patt, x))) +} + + +# == 3.2 Counting C-alpha records ========================================== + + +CAcount <- function(IN) { + # count the number of C-alpha atoms in a PDB formatted file + # Parameters: + # IN chr path of the file to read + # Value: + # numeric number of lines that match " CA " in position 13 - 16 of + # an ATOM record. + # Note: the regex MUST be aligned into the right position, otherwise it + # might match Calcium records! + x <- readLines(IN) + patt <- "^ATOM ...... CA " + return(length(grep(patt, x))) +} + + + +# [END] diff --git a/RPR-SX-PDB.R b/RPR-SX-PDB.R index 14db8ca..d51e8ee 100644 --- a/RPR-SX-PDB.R +++ b/RPR-SX-PDB.R @@ -1,829 +1,829 @@ -# tocID <- "RPR-SX-PDB.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-SX-PDB unit. -# -# Version: 1.3 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.3 2020 Maintenance -# 1.2 2019 Maintenance -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.0 First live version, completely refactores 2016 code -# with remarkable speed gains. Added section on x, y, z -# (density) plots. -# 0.1 First code copied from 2016 material. -# -# TODO: -# Confirm that SS residue numbers are indices -# Set task seed from student number -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ---------------------------------------------------------- -#TOC> 1 Introduction to the bio3D package 63 -#TOC> 2 A Ramachandran plot 155 -#TOC> 3 Density plots 231 -#TOC> 3.1 Density-based colours 245 -#TOC> 3.2 Plotting with smoothScatter() 264 -#TOC> 3.3 Plotting hexbins 279 -#TOC> 3.4 Plotting density contours 307 -#TOC> 3.4.1 ... as overlay on a coloured grid 340 -#TOC> 3.4.2 ... as filled countour 357 -#TOC> 3.4.3 ... as a perspective plot 388 -#TOC> 4 cis-peptide bonds 406 -#TOC> 5 H-bond lengths 421 -#TOC> -#TOC> ========================================================================== - - -# In this example of protein structure interpretation, we ... -# - download the package bio3D:: which supports work with -# protein structure files, -# - explore some elementary functions of the package -# - explore plotting of density values with scatterplots -# - assemble a script to see whether H-bond lengths systematically differ -# between alpha-helical and beta-sheet structures. - - -# = 1 Introduction to the bio3D package =================================== - - -if (! requireNamespace("bio3d", quietly = TRUE)) { - install.packages("bio3d") -} -# Package information: -# library(help = bio3d) # basic information -# browseVignettes("bio3d") # available vignettes -# data(package = "bio3d") # available datasets - - -# bio3d:: can load molecules directly from the PDB servers, you don't _have_ to -# store them locally, but you could. -# -# But before you _load_ a file, have a look what such a file contains. I have -# packaged the 1BM8 file into the project: -file.show("./data/1BM8.pdb") - -# Have a look at the header section, the atom records, the coordinate records -# etc. -# -# Task: -# Answer the following questions: -# What is the resolution of the structure? -# Is the first residue in the SEQRES section also the first residue -# with an ATOM record? -# How many water molecules does the structure contain? -# Can you explain REMARK 525 regarding HOH 459 and HOH 473? -# Are all atoms of the N-terminal residue present? -# Are all atoms of the C-terminal residue present? - -apses <- bio3d::read.pdb("1bm8") # load a molecule directly from the PDB via - # the Internet. - -# check what we have: -apses - -# what is this actually? -str(apses) - -# bio3d's pdb objects are simple lists. Great! You know lists! - -# You see that there is a list element called $atom which is a data frame in -# which the columns arevectors of the same length - namely the number of atoms -# in the structure file. And there is a matrix of (x, y, z) triplets called xyz. -# And there is a vector that holds sequence, and two tables called helix and -# sheet. Let's pull out a few values to confirm how selection and subsetting -# works here: - -# selection by atom ... -i <- 5 -apses$atom[i,] -apses$atom[i, c("x", "y", "z")] # here we are selecting with column names! -apses$xyz[c(i*3-2, i*3-1, i*3)] # here we are selecting with row numbers - -# all atoms of a residue ... -i <- 48 -apses$atom[apses$atom[,"resno"] == i, ] - -# sequence of the first ten residues -apses$seqres[1:10] # the "A"s here identify chain "A" - -# Can we convert this to one letter code? -bio3d::aa321(apses$seqres[1:10]) - -# Lets get the implicit sequence: -bio3d::aa321((apses$atom$resid[apses$calpha])[1:10]) -# Do you understand this code? - -# Do explicit and implicit sequence have the same length? -length(apses$seqres) -length(apses$atom$resid[apses$calpha]) - -# Are the sequences the same? -any(apses$seqres != apses$atom$resid[apses$calpha]) - -# get a list of all CA atoms of arginine residues -cols <- c("eleno", "elety", "resid", "chain", "resno", "insert") -sel <- apses$atom$resid == "ARG" & apses$atom$elety == "CA" -apses$atom[sel, cols] - -# The introduction to bio3d tutorial at -# http://thegrantlab.org/bio3d/tutorials/structure-analysis -# has the following example: -bio3d::plot.bio3d(apses$atom$b[apses$calpha], - sse=apses, - typ="l", - ylab="B-factor") - -# Good for now. Let's do some real work. - -# = 2 A Ramachandran plot ================================================= - -# Calculate a Ramachandran plot for the structure. The torsion.pdb() function -# calculates all dihedral angles for backbone and sidechain bonds, NA where -# the bond does not exist in an amino acid. -tor <- bio3d::torsion.pdb(apses) -plot(tor$phi, tor$psi, - xlim = c(-180, 180), ylim = c(-180, 180), - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) -abline(h = 0, lwd = 0.5, col = "#00000044") -abline(v = 0, lwd = 0.5, col = "#00000044") -# As you can see, there are a number of points in the upper-right -# quadrant of the plot. This combination of phi-psi angles defines -# the conformation of a left-handed alpha helix and is generally -# only observed for glycine residues. Let's replot the data, but -# colour the points for glycine residues differently. First, we -# get a vector of glycine residue indices in the structure: - -mySeq <- bio3d::pdbseq(apses) - -# Explore the result object and extract the indices of GLY resiues. - mySeq == "G" - which(mySeq == "G") -iGly <- which(mySeq == "G") - -# Now plot all non-gly residues. -# Remember: negative indices exclude items from a vector -plot(tor$phi[-iGly], tor$psi[-iGly], - xlim=c(-180,180), ylim=c(-180,180), - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) -abline(h = 0, lwd = 0.5, col = "#00000044") -abline(v = 0, lwd = 0.5, col = "#00000044") - -# Now plot GLY only, but with green dots: -points(tor$phi[iGly], tor$psi[iGly], pch=21, cex=0.9, bg="#00CC00") - -# As you see, four residues in the upper-right quadrant are -# not glycine. But what residues are these? Is there an -# error in our script? Let's get their coordinate records: - -# subset CA records -CA <- apses$atom[apses$calpha, c("eleno", "elety", "resid", "chain", "resno")] - -# get index of outliers -iOutliers <- which(tor$phi > 30 & tor$phi < 90 & - tor$psi > 0 & tor$psi < 90) - -# cbind records together -(dat <- cbind(CA[iOutliers, ], - phi = tor$phi[iOutliers], - psi = tor$psi[iOutliers])) - - -# remove the glycine ... -(dat <- dat[dat$resid != "GLY", ]) - - -# let's add the residue numbers to the plot with the text function: -for (i in 1:nrow(dat)) { - points(dat$phi[i], dat$psi[i], pch=21, cex=0.9, bg="#CC0000") - text(dat$phi[i], - dat$psi[i], - labels = sprintf("%s%d", bio3d::aa321(dat$resid[i]), dat$resno[i]), - pos = 4, - offset = 0.4, - cex = 0.7) -} - -# You can check the residues in Chimera. Is there anything unusual about these -# residues? - - -# = 3 Density plots ======================================================= - -# Such x, y scatter-plots of data that is sampled from a distribution can tell -# us a lot about what shapes the distribution. The distribution is governed by -# the free energy of the phi-psi landscape in folded proteins, since folded -# proteins generally minimize the free energy of their conformations. We observe -# empirically, from comparing frequency statistics and mutation experiments, -# that this generall follows a Boltzmann distribution, where the free energy -# changes we observe in experments that change one conformation into another are -# proportional to the log-ratio of the number of times we observe each -# observation in the protein structure database (after correcting for -# observation bias). The proper way to visualize such 2D landscapes is with -# contour plots. - -# == 3.1 Density-based colours ============================================= - -# A first approximation to scatterplots that visualize the density of the -# underlying distribution is colouring via the densCols() function. -?densCols -iNA <- c(which(is.na(tor$phi)), which(is.na(tor$psi))) -phi <- tor$phi[-iNA] -psi <- tor$psi[-iNA] -plot (phi, psi, - xlim = c(-180, 180), ylim = c(-180, 180), - col=densCols(phi,psi), - pch=20, cex=2, - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) -abline(h = 0, lwd = 0.5, col = "#00000044") -abline(v = 0, lwd = 0.5, col = "#00000044") - - -# == 3.2 Plotting with smoothScatter() ===================================== - -# A better way, that spreads out the underlying density is smoothScatter() -smoothScatter(phi,psi) -smoothScatter(phi, psi, - xlim = c(-180, 180), ylim = c(-180, 180), - col = "#0033BB33", - pch = 3, cex = 0.6, - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) -abline(h = 0, lwd = 0.5, col = "#00000044") -abline(v = 0, lwd = 0.5, col = "#00000044") - - -# == 3.3 Plotting hexbins ================================================== - -# If we wish to approximate values in a histogram-like fashion, we can use -# hexbin() -if (! requireNamespace("hexbin", quietly = TRUE)) { - install.packages("hexbin") -} -# Package information: -# library(help = hexbin) # basic information -# browseVignettes("hexbin") # available vignettes -# data(package = "hexbin") # available datasets - - -myColorRamp <- colorRampPalette(c("#EEEEEE", - "#3399CC", - "#2266DD")) -hexbin::gplot.hexbin(hexbin::hexbin(phi, psi, xbins = 10), - colramp = myColorRamp, - main = "phi-psi Density Bins for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) - -# Note: -# Had we loaded hexbin with library(hexbin), the plot function would have -# been dispatched by the plot() generic, and we could simply have written: -# plot(hexbin(phi, psi, xbins = 10), ... - - -# == 3.4 Plotting density contours ========================================= - - -# The best way to handle such data is provided by the function contour(): -?contour - -# Contour plots are not produced along the haphazardly sampled values of a data -# set, but on a regular grid. This means, we need to convert observed values -# into estimated densities. Density estimation is an important topic for -# exploratory data analysis, base R has the density() function for 1D -# distributions. But for 2D data like or phi-psi plots, we need a function from -# the MASS package: kde2d() - -if (! requireNamespace("MASS", quietly = TRUE)) { - install.packages("MASS") -} -# Package information: -# library(help = MASS) # basic information -# browseVignettes("MASS") # available vignettes -# data(package = "MASS") # available datasets - -?MASS::kde2d -dPhiPsi <-MASS::kde2d(phi, psi, - n = 60, - lims = c(-180, 180, -180, 180)) - -str(dPhiPsi) -# This is a list, with gridpoints in x and y, and the estimated densities in z. - -# Generic plot with default parameters -contour(dPhiPsi) - - -# === 3.4.1 ... as overlay on a coloured grid - -image(dPhiPsi, - col = myColorRamp(100), - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) -contour(dPhiPsi, col = "royalblue", - add = TRUE, - method = "edge", - nlevels = 10, - lty = 2) -points(phi, psi, col = "#00338866", pch = 3, cex = 0.7) -abline(h = 0, lwd = 0.5, col = "#00000044") -abline(v = 0, lwd = 0.5, col = "#00000044") - - -# === 3.4.2 ... as filled countour - -filled.contour(dPhiPsi, - xlim = c(-180, 180), ylim = c(-180, 180), - nlevels = 10, - color.palette = myColorRamp, - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi)) - -# Note: we can pass additional plotting and overlay commands to the counter plot -# in a block of expressions passed via the plot.axes parameter: - -filled.contour(dPhiPsi, - xlim = c(-180, 180), ylim = c(-180, 180), - nlevels = 10, - color.palette = myColorRamp, - main = "Ramachandran plot for 1BM8", - xlab = expression(phi), - ylab = expression(psi), - plot.axes = { - contour(dPhiPsi, col = "#00000044", - add = TRUE, - method = "edge", - nlevels = 10, - lty = 2) - points(phi, psi, col = "#00338866", pch = 3, cex = 0.7) - abline(h = 0, lwd = 0.5, col = "#00000044") - abline(v = 0, lwd = 0.5, col = "#00000044") - }) - -# === 3.4.3 ... as a perspective plot - -persp(dPhiPsi, - xlab = "phi", - ylab = "psi", - zlab = "Density") - - -persp(dPhiPsi, - theta = 40, - phi = 10, - col = "#99AACC", - xlab = "phi", - ylab = "psi", - zlab = "Density") - - - -# = 4 cis-peptide bonds =================================================== - -# Are there any cis-peptide bonds in the structure? -tor$omega -#... gives us a quick answer. But wait - what values do we -# expect? And why are the values so different, ranging from -180° to 180°? -# Consider this plot: what am I doing here and why? -om <- c(360 + tor$omega[tor$omega < 0], - tor$omega[tor$omega >= 0]) -hist(om, xlim=c(0,360)) -abline(v=180, col="red") - -# Note: a cis-peptide bond will have an omega torsion angle around 0° - - -# = 5 H-bond lengths ====================================================== - -# Let's do something a little less trivial and compare -# backbone H-bond lengths between helices and strands. - -# Secondary structure is defined in the bio3d object's ...$helix and ...$strand -# list elements. -str(apses) - -# We need to -# - collect all N atoms in alpha helices resp. -# beta strands; -# - collect all O atoms in alpha helices resp. -# beta strands; -# - fetch the atom coordinates; -# - calculate all N, O distances; -# - filter them for distances that indicate H-bonds; and, -# - plot the results. - -# Secondary structure can either be obtained from definitions contained in most -# PDB files, or by running the DSSP algorithm IF(!) you have it installed on -# your machine. See the dssp() function of bio3d for instructions how to obtain -# and install DSSP and STRIDE. This is highly recommended for "real" work with -# structure coordinate files. The 1BM8 file contains secondary structure -# definitions: - -apses$helix -apses$sheet - - -# A function to collect atom indices for particular type of secondary structure - -ssSelect <- function(PDB, myChain = "A", ssType, myElety) { - # Function to retrieve specified atom types from specified secondary - # structure types in a PDB object. - # Parameters: - # PDB A bio3D PDB object - # myChain chr The chain to use. Default: chain "A". - # ssType chr A vector of keywords "helix" and/or "sheet" - # myElety chr A vector of $eletype atom types to return - # Value: num Indices of the matching atom rows in PDB$atom - - # Build a vector of $resno numbers - starts <- numeric() - ends <- numeric() - if ("helix" %in% ssType) { - sel <- PDB$helix$chain %in% myChain - starts <- c(starts, PDB$helix$start[sel]) - ends <- c(ends, PDB$helix$end[sel]) - } - if ("sheet" %in% ssType) { - sel <- PDB$sheet$chain %in% myChain - starts <- c(starts, PDB$sheet$start[sel]) - ends <- c(ends, PDB$sheet$end[sel]) - } - myResno <- numeric() - for (i in seq_along(starts)) { - myResno <- c(myResno, starts[i]:ends[i]) - } - - # get id's from PDB - - x <- bio3d::atom.select(PDB, - string = "protein", - type = "ATOM", - chain = myChain, - resno = myResno, - elety = myElety) - - return(x$atom) -} - -# Example: -ssSelect(apses, ssType = "sheet", myElety = "N") -ssSelect(apses, ssType = "sheet", myElety = "O") - -# That looks correct: O atoms should be stored three index position after N: the -# sequence of atoms in a PDB file is usually N, CA, C, O ... followed by the -# side chain coordinates. - -# Now to extract the coordinates and calculate distances. Our function needs to -# take the PDB object and two vectors of atom indices as argument, and return a -# vector of pair-distances (actually dist.xyz() returns a matrix). - -pairDist <- function(PDB, a, b) { - # Calculate pairwise distances between atoms indicated by a and b - # Parameters: - # PDB A bio3D PDB object - # a int A vector of atom indexes - # b int A vector of atom indexes - # Value: num matrix of Euclidian distances between the atoms given in a, b. - # There are as many rows as atoms in a, as many columns as - # atoms in b. - - dMat <- numeric() - if (length(a) > 0 && length(b) > 0) { - - A <- PDB$atom[a, c("x", "y", "z")] - B <- PDB$atom[b, c("x", "y", "z")] - dMat <- bio3d::dist.xyz(A, B) - - } - return(dMat) -} - -# Let's see if this looks correct. Let's look at all the pairwise distances -# between N and O atoms in both types of secondary structure: - -iN <- ssSelect(apses, ssType = c("helix", "sheet"), myElety = "N") -iO <- ssSelect(apses, ssType = c("helix", "sheet"), myElety = "O") -x <- pairDist(apses, iN, iO) -hist(x, - breaks = 80, - col = "lavenderblush", - main = "", - xlab = "N-O distances (Å)") - -# Since we are collecting distance from all secondary structure elements, we -# are just seing a big peak of (meaningless) long-distance separations. We -# need to zoom in on the shorter distances, in which we expect -# hydrogen bonds: -hist(x[x < 4.2], # restrict to N-O distance less than 4.2 Å long - breaks=seq(2.0, 4.2, 0.1), - xlim=c(2.0,4.2), - col = "lavenderblush", - main = "", - xlab = "N-O distances (Å)") - -# There is a large peak at about 2.2Å, and another -# large peak above 3.5Å. But these are not typical hydrogen -# bond distances! Rather these are (N,O) pairs in peptide -# bonds, and within residues. That's not good, because these will contaminate -# our statistics. -# We need to exclude all distances between N of a residue -# and O of a preceeding residue, and all (N,O) pairs in the -# same residue. We need a function to filter distances by residue numbers. And while we are filtering, we might as well throw away the non-H bond distances too. - -filterHB <- function(PDB, iN, iO, dMat, cutoff = 3.9) { - # Filters distances between O(i-1) and N(i), and between N(i) and O(i) - # in a distance matrix where there is one row per N-atom and one - # column per O atom. - # Parameters: - # PDB a bio3D PDB object - # iN int a vector of N atom indexes - # iO int a vector of O atom indexes - # dMat num a distance matrix created by pairDist() - # cutoff num only return distances that are shorter than "cutoff - # Value: a distance matrix in which values that do not match the - # filter criteria have bee set to NA. - - if (length(iN) > 0 && length(iO) > 0) { - - resN <- PDB$atom$resno[iN] - resO <- PDB$atom$resno[iO] - - for (i in seq_along(resN)) { # for all N atoms - for (j in seq_along(resO)) { # for all O atoms - if (dMat[i, j] > cutoff || # if: distance > cutoff, or ... - (resN[i] - 1) == resO[j] || # distance is N(i)---O(i-1), or ... - resN[i] == resO[j]) { # distance is N(i)---O(i), then: - dMat[i, j] <- NA # set this distance to NA. - } - } - } - } - return(dMat) -} - -# Inspect the result: -hist(filterHB(apses, iN, iO, x), - breaks=seq(2.0, 4.2, 0.1), - xlim=c(2.0,4.2), - col = "paleturquoise", - main = "", - xlab = "N-O distances (Å)") - - -# Finally we can calculate alpha- and beta- structure -# bonds and compare them. In this section we'll explore -# different options for histogram plots. - -# H-bonds in helices ... -iN <- ssSelect(apses, ssType = c("helix"), myElety = "N") -iO <- ssSelect(apses, ssType = c("helix"), myElety = "O") -dH <- filterHB(apses, iN, iO, pairDist(apses, iN, iO)) -dH <- dH[!is.na(dH)] - -# H-bonds in sheets. (We commonly use the letter "E" to symbolize a beta -# strand or sheet, because "E" visually evokes an extended strand with -# protruding sidechains.) -iN <- ssSelect(apses, ssType = c("sheet"), myElety = "N") -iO <- ssSelect(apses, ssType = c("sheet"), myElety = "O") -dE <- filterHB(apses, iN, iO, pairDist(apses, iN, iO)) -dE <- dE[!is.na(dE)] - -# The plain histogram functions without parameters -# give us white stacks. - -hist(dH) - -# and ... -hist(dE) - -# We can see that the histrograms look different -# but that is better visualized by showing two plots -# in the same window. We use the par() function, for -# more flexible layout, look up the layout() function. -?par -?layout - -opar <- par(no.readonly=TRUE) # store current state -par(mfrow=c(2,1)) # set graphics parameters: 2 rows, one column - -# plot two histograms -hist(dH) -hist(dE) - - -# add colour: -hist(dH, col="#DD0055") -hist(dE, col="#00AA70") - - - -# For better comparison, plot both in the -# same window (use the "add = TRUE" parameter in hist() ): - -hist(dH, col="#DD0055") -hist(dE, col="#00AA70", add = TRUE) - -# ... oops, we dind't reset the graphics parameters. You can either use -# the broom icon of the Plot tab to clear asll plots, or ... -par(opar) # ... reset the graphics parameters - -hist(dH, col = "#DD0055") -hist(dE, col = "#00AA70", add = TRUE) - -# We see that the leftmost column of the sheet bonds hides the helix bonds in -# that column. Not good. But we can make the colours transparent! We just need to -# add a fourth set of two hexadecimal-numbers to the #RRGGBB triplet. (This -# sets the transparency of the colour, it is called the "alpha channel"). Lets -# use 2/3 transparent, in hexadecimal, 1/3 of 256 is x55 - i.e. an RGB triplet -# specied as #RRGGBB55 is only 33% opaque: - -hist(dH, col = "#DD005555") -hist(dE, col = "#00AA7055", add = TRUE) - -# To finalize the plots, let's do two more things: Explicitly define the breaks, -# to make sure they match up - otherwise they would not need to... like in this -# example: - -hist(dH, col ="#DD005555") -hist(dE[dE < 3], col = "#00AA7055", add = TRUE) - -# Breaks are a parameter in hist() that can either be a scalar, to define how -# many columns you want, or a vector, that defines the actual breakpoints. -brk=seq(2.4, 4.0, 0.1) - -hist(dH, col="#DD005555", breaks=brk) -hist(dE, col="#00AA7055", breaks=brk, add=TRUE) - -# The last thing to do is to think about rescaling the plot. You notice that the -# y-axis is scaled in absolute frequency (i.e. counts). That gives us some -# impression of the relative frequency, but it is of course skewed by observing -# relatively more or less of one type of secondary structure in a protein. As -# part of the hist() function we can rescale the values so that the sum over all -# is one: set the parameter freq=FALSE. And we explicitly set y-axis limits -# to accommodate bot distributions. - -hist(dH, col="#DD005555", breaks=brk, freq=FALSE, ylim = c(0, 4)) -hist(dE, col="#00AA7055", breaks=brk, freq=FALSE, add=TRUE) - -# Adding labels and legend ... - -hH <- hist(dH, - freq=FALSE, - breaks=brk, - col="#DD005550", - xlab="(N,O) distance (Å)", - ylab="Density", - ylim=c(0,4), - main="Helix and Sheet H-bond lengths") -hE <- hist(dE, - freq=FALSE, - breaks=brk, - col="#00AA7060", - add=TRUE) - -legend("topright", - c(sprintf("alpha (N = %3d)", sum(hH$counts)), - sprintf("beta (N = %3d)", sum(hE$counts))), - fill = c("#DD005550", "#00AA7060"), bty = 'n', - border = NA) - - -# With all the functions we have defined, -# it is easy to try this with a larger protein. -# 3ugj for example is VERY large. - -pdb <- bio3d::read.pdb("3ugj") - -# helices... -iN <- ssSelect(pdb, ssType = c("helix"), myElety = "N") -iO <- ssSelect(pdb, ssType = c("helix"), myElety = "O") -dH <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) -dH <- dH[!is.na(dH)] - -# sheets -iN <- ssSelect(pdb, ssType = c("sheet"), myElety = "N") -iO <- ssSelect(pdb, ssType = c("sheet"), myElety = "O") -dE <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) -dE <- dE[!is.na(dE)] - -# histograms ... -brk=seq(2.4, 4.0, 0.1) - -hH <- hist(dH, - freq=FALSE, - breaks=brk, - col="#DD005550", - xlab="(N,O) distance (Å)", - ylab="Density", - ylim=c(0,4), - main="Helix and Sheet H-bond lengths") -hE <- hist(dE, - freq=FALSE, - breaks=brk, - col="#00AA7060", - add=TRUE) - -legend('topright', - c(paste("alpha (N = ", sum(hH$counts), ")"), - paste("beta (N = ", sum(hE$counts), ")")), - fill = c("#DD005550", "#00AA7060"), bty = 'n', - border = NA, - inset = 0.1) - -# It's apparent that the distributions are indeed different. Our sample -# is large, but derives from a single protein. To do database scale statistics, -# we should look at many more proteins. To give you a sense of how, let's do -# this for just ten proteins, randomly selected from non-homologous, -# high-resolution, single domain structures. I have provided a utility function -# for such a selection (details beyond the scope of this project). - -myPDBs <- selectPDBrep(10) -# My selection is "2OVJ", "1HQS", "3BON", "4JZX", "3BQ3", "2IUM", "2C9E", -# "4X1F", "2V3I", "3GE3". Yours will be different. - -# We are loading the files online - don't do this if you have bandwidth -# limitations. - - -dH <- c() # collect all helix H-bonds here -dE <- c() # collect all sheet H-bonds here - -for (i in seq_along(myPDBs)) { - pdb <- bio3d::read.pdb(myPDBs[i]) - - # helices... - iN <- ssSelect(pdb, ssType = c("helix"), myElety = "N") - iO <- ssSelect(pdb, ssType = c("helix"), myElety = "O") - x <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) - dH <- c(dH, x[!is.na(x)]) - - # sheets - iN <- ssSelect(pdb, ssType = c("sheet"), myElety = "N") - iO <- ssSelect(pdb, ssType = c("sheet"), myElety = "O") - x <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) - dE <- c(dE, x[!is.na(x)]) -} - -# Inspect the results - -length(dH) # 4415 (your numbers are different, but there should be many) -length(dE) # 262 - -brk=seq(2.0, 4.0, 0.1) - -hH <- hist(dH, - freq=FALSE, - breaks=brk, - col="#DD005550", - xlab="(N,O) distance (Å)", - ylab="Density", - ylim=c(0,4), - cex.main = 0.8, - main="Helix and Sheet H-bond lengths (10 representative structures)") -hE <- hist(dE, - freq=FALSE, - breaks=brk, - col="#00AA7060", - add=TRUE) - -legend('topright', - c(paste("alpha (N = ", sum(hH$counts), ")"), - paste("beta (N = ", sum(hE$counts), ")")), - fill = c("#DD005550", "#00AA7060"), bty = 'n', - border = NA, - inset = 0.1) - -# Task: -# Why do you think these distributions are different? -# At what distance do you think H-bonds have the lowest energy? -# For alpha-helices? For beta-strands? - - - - -# [END] +# tocID <- "RPR-SX-PDB.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-SX-PDB unit. +# +# Version: 1.3 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.3 2020 Maintenance +# 1.2 2019 Maintenance +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.0 First live version, completely refactores 2016 code +# with remarkable speed gains. Added section on x, y, z +# (density) plots. +# 0.1 First code copied from 2016 material. +# +# TODO: +# Confirm that SS residue numbers are indices +# Set task seed from student number +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ---------------------------------------------------------- +#TOC> 1 Introduction to the bio3D package 63 +#TOC> 2 A Ramachandran plot 155 +#TOC> 3 Density plots 231 +#TOC> 3.1 Density-based colours 245 +#TOC> 3.2 Plotting with smoothScatter() 264 +#TOC> 3.3 Plotting hexbins 279 +#TOC> 3.4 Plotting density contours 307 +#TOC> 3.4.1 ... as overlay on a coloured grid 340 +#TOC> 3.4.2 ... as filled countour 357 +#TOC> 3.4.3 ... as a perspective plot 388 +#TOC> 4 cis-peptide bonds 406 +#TOC> 5 H-bond lengths 421 +#TOC> +#TOC> ========================================================================== + + +# In this example of protein structure interpretation, we ... +# - download the package bio3D:: which supports work with +# protein structure files, +# - explore some elementary functions of the package +# - explore plotting of density values with scatterplots +# - assemble a script to see whether H-bond lengths systematically differ +# between alpha-helical and beta-sheet structures. + + +# = 1 Introduction to the bio3D package =================================== + + +if (! requireNamespace("bio3d", quietly = TRUE)) { + install.packages("bio3d") +} +# Package information: +# library(help = bio3d) # basic information +# browseVignettes("bio3d") # available vignettes +# data(package = "bio3d") # available datasets + + +# bio3d:: can load molecules directly from the PDB servers, you don't _have_ to +# store them locally, but you could. +# +# But before you _load_ a file, have a look what such a file contains. I have +# packaged the 1BM8 file into the project: +file.show("./data/1BM8.pdb") + +# Have a look at the header section, the atom records, the coordinate records +# etc. +# +# Task: +# Answer the following questions: +# What is the resolution of the structure? +# Is the first residue in the SEQRES section also the first residue +# with an ATOM record? +# How many water molecules does the structure contain? +# Can you explain REMARK 525 regarding HOH 459 and HOH 473? +# Are all atoms of the N-terminal residue present? +# Are all atoms of the C-terminal residue present? + +apses <- bio3d::read.pdb("1bm8") # load a molecule directly from the PDB via + # the Internet. + +# check what we have: +apses + +# what is this actually? +str(apses) + +# bio3d's pdb objects are simple lists. Great! You know lists! + +# You see that there is a list element called $atom which is a data frame in +# which the columns are vectors of the same length - namely the number of atoms +# in the structure file. And there is a matrix of (x, y, z) triplets called xyz. +# And there is a vector that holds sequence, and two tables called helix and +# sheet. Let's pull out a few values to confirm how selection and subsetting +# works here: + +# selection by atom ... +i <- 5 +apses$atom[i,] +apses$atom[i, c("x", "y", "z")] # here we are selecting with column names! +apses$xyz[c(i*3-2, i*3-1, i*3)] # here we are selecting with row numbers + +# all atoms of a residue ... +i <- 48 +apses$atom[apses$atom[,"resno"] == i, ] + +# sequence of the first ten residues +apses$seqres[1:10] # the "A"s here identify chain "A" + +# Can we convert this to one letter code? +bio3d::aa321(apses$seqres[1:10]) + +# Lets get the implicit sequence: +bio3d::aa321((apses$atom$resid[apses$calpha])[1:10]) +# Do you understand this code? + +# Do explicit and implicit sequence have the same length? +length(apses$seqres) +length(apses$atom$resid[apses$calpha]) + +# Are the sequences the same? +any(apses$seqres != apses$atom$resid[apses$calpha]) + +# get a list of all CA atoms of arginine residues +cols <- c("eleno", "elety", "resid", "chain", "resno", "insert") +sel <- apses$atom$resid == "ARG" & apses$atom$elety == "CA" +apses$atom[sel, cols] + +# The introduction to bio3d tutorial at +# http://thegrantlab.org/bio3d/tutorials/structure-analysis +# has the following example: +bio3d::plot.bio3d(apses$atom$b[apses$calpha], + sse=apses, + typ="l", + ylab="B-factor") + +# Good for now. Let's do some real work. + +# = 2 A Ramachandran plot ================================================= + +# Calculate a Ramachandran plot for the structure. The torsion.pdb() function +# calculates all dihedral angles for backbone and sidechain bonds, NA where +# the bond does not exist in an amino acid. +tor <- bio3d::torsion.pdb(apses) +plot(tor$phi, tor$psi, + xlim = c(-180, 180), ylim = c(-180, 180), + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) +abline(h = 0, lwd = 0.5, col = "#00000044") +abline(v = 0, lwd = 0.5, col = "#00000044") +# As you can see, there are a number of points in the upper-right +# quadrant of the plot. This combination of phi-psi angles defines +# the conformation of a left-handed alpha helix and is generally +# only observed for glycine residues. Let's replot the data, but +# colour the points for glycine residues differently. First, we +# get a vector of glycine residue indices in the structure: + +mySeq <- bio3d::pdbseq(apses) + +# Explore the result object and extract the indices of GLY resiues. + mySeq == "G" + which(mySeq == "G") +iGly <- which(mySeq == "G") + +# Now plot all non-gly residues. +# Remember: negative indices exclude items from a vector +plot(tor$phi[-iGly], tor$psi[-iGly], + xlim=c(-180,180), ylim=c(-180,180), + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) +abline(h = 0, lwd = 0.5, col = "#00000044") +abline(v = 0, lwd = 0.5, col = "#00000044") + +# Now plot GLY only, but with green dots: +points(tor$phi[iGly], tor$psi[iGly], pch=21, cex=0.9, bg="#00CC00") + +# As you see, four residues in the upper-right quadrant are +# not glycine. But what residues are these? Is there an +# error in our script? Let's get their coordinate records: + +# subset CA records +CA <- apses$atom[apses$calpha, c("eleno", "elety", "resid", "chain", "resno")] + +# get index of outliers +iOutliers <- which(tor$phi > 30 & tor$phi < 90 & + tor$psi > 0 & tor$psi < 90) + +# cbind records together +(dat <- cbind(CA[iOutliers, ], + phi = tor$phi[iOutliers], + psi = tor$psi[iOutliers])) + + +# remove the glycine ... +(dat <- dat[dat$resid != "GLY", ]) + + +# let's add the residue numbers to the plot with the text function: +for (i in 1:nrow(dat)) { + points(dat$phi[i], dat$psi[i], pch=21, cex=0.9, bg="#CC0000") + text(dat$phi[i], + dat$psi[i], + labels = sprintf("%s%d", bio3d::aa321(dat$resid[i]), dat$resno[i]), + pos = 4, + offset = 0.4, + cex = 0.7) +} + +# You can check the residues in Chimera. Is there anything unusual about these +# residues? + + +# = 3 Density plots ======================================================= + +# Such x, y scatter-plots of data that is sampled from a distribution can tell +# us a lot about what shapes the distribution. The distribution is governed by +# the free energy of the phi-psi landscape in folded proteins, since folded +# proteins generally minimize the free energy of their conformations. We observe +# empirically, from comparing frequency statistics and mutation experiments, +# that this generall follows a Boltzmann distribution, where the free energy +# changes we observe in experments that change one conformation into another are +# proportional to the log-ratio of the number of times we observe each +# observation in the protein structure database (after correcting for +# observation bias). The proper way to visualize such 2D landscapes is with +# contour plots. + +# == 3.1 Density-based colours ============================================= + +# A first approximation to scatterplots that visualize the density of the +# underlying distribution is colouring via the densCols() function. +?densCols +iNA <- c(which(is.na(tor$phi)), which(is.na(tor$psi))) +phi <- tor$phi[-iNA] +psi <- tor$psi[-iNA] +plot (phi, psi, + xlim = c(-180, 180), ylim = c(-180, 180), + col=densCols(phi,psi), + pch=20, cex=2, + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) +abline(h = 0, lwd = 0.5, col = "#00000044") +abline(v = 0, lwd = 0.5, col = "#00000044") + + +# == 3.2 Plotting with smoothScatter() ===================================== + +# A better way, that spreads out the underlying density is smoothScatter() +smoothScatter(phi,psi) +smoothScatter(phi, psi, + xlim = c(-180, 180), ylim = c(-180, 180), + col = "#0033BB33", + pch = 3, cex = 0.6, + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) +abline(h = 0, lwd = 0.5, col = "#00000044") +abline(v = 0, lwd = 0.5, col = "#00000044") + + +# == 3.3 Plotting hexbins ================================================== + +# If we wish to approximate values in a histogram-like fashion, we can use +# hexbin() +if (! requireNamespace("hexbin", quietly = TRUE)) { + install.packages("hexbin") +} +# Package information: +# library(help = hexbin) # basic information +# browseVignettes("hexbin") # available vignettes +# data(package = "hexbin") # available datasets + + +myColorRamp <- colorRampPalette(c("#EEEEEE", + "#3399CC", + "#2266DD")) +hexbin::gplot.hexbin(hexbin::hexbin(phi, psi, xbins = 10), + colramp = myColorRamp, + main = "phi-psi Density Bins for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) + +# Note: +# Had we loaded hexbin with library(hexbin), the plot function would have +# been dispatched by the plot() generic, and we could simply have written: +# plot(hexbin(phi, psi, xbins = 10), ... + + +# == 3.4 Plotting density contours ========================================= + + +# The best way to handle such data is provided by the function contour(): +?contour + +# Contour plots are not produced along the haphazardly sampled values of a data +# set, but on a regular grid. This means, we need to convert observed values +# into estimated densities. Density estimation is an important topic for +# exploratory data analysis, base R has the density() function for 1D +# distributions. But for 2D data like or phi-psi plots, we need a function from +# the MASS package: kde2d() + +if (! requireNamespace("MASS", quietly = TRUE)) { + install.packages("MASS") +} +# Package information: +# library(help = MASS) # basic information +# browseVignettes("MASS") # available vignettes +# data(package = "MASS") # available datasets + +?MASS::kde2d +dPhiPsi <-MASS::kde2d(phi, psi, + n = 60, + lims = c(-180, 180, -180, 180)) + +str(dPhiPsi) +# This is a list, with gridpoints in x and y, and the estimated densities in z. + +# Generic plot with default parameters +contour(dPhiPsi) + + +# === 3.4.1 ... as overlay on a coloured grid + +image(dPhiPsi, + col = myColorRamp(100), + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) +contour(dPhiPsi, col = "royalblue", + add = TRUE, + method = "edge", + nlevels = 10, + lty = 2) +points(phi, psi, col = "#00338866", pch = 3, cex = 0.7) +abline(h = 0, lwd = 0.5, col = "#00000044") +abline(v = 0, lwd = 0.5, col = "#00000044") + + +# === 3.4.2 ... as filled countour + +filled.contour(dPhiPsi, + xlim = c(-180, 180), ylim = c(-180, 180), + nlevels = 10, + color.palette = myColorRamp, + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi)) + +# Note: we can pass additional plotting and overlay commands to the counter plot +# in a block of expressions passed via the plot.axes parameter: + +filled.contour(dPhiPsi, + xlim = c(-180, 180), ylim = c(-180, 180), + nlevels = 10, + color.palette = myColorRamp, + main = "Ramachandran plot for 1BM8", + xlab = expression(phi), + ylab = expression(psi), + plot.axes = { + contour(dPhiPsi, col = "#00000044", + add = TRUE, + method = "edge", + nlevels = 10, + lty = 2) + points(phi, psi, col = "#00338866", pch = 3, cex = 0.7) + abline(h = 0, lwd = 0.5, col = "#00000044") + abline(v = 0, lwd = 0.5, col = "#00000044") + }) + +# === 3.4.3 ... as a perspective plot + +persp(dPhiPsi, + xlab = "phi", + ylab = "psi", + zlab = "Density") + + +persp(dPhiPsi, + theta = 40, + phi = 10, + col = "#99AACC", + xlab = "phi", + ylab = "psi", + zlab = "Density") + + + +# = 4 cis-peptide bonds =================================================== + +# Are there any cis-peptide bonds in the structure? +tor$omega +#... gives us a quick answer. But wait - what values do we +# expect? And why are the values so different, ranging from -180° to 180°? +# Consider this plot: what am I doing here and why? +om <- c(360 + tor$omega[tor$omega < 0], + tor$omega[tor$omega >= 0]) +hist(om, xlim=c(0,360)) +abline(v=180, col="red") + +# Note: a cis-peptide bond will have an omega torsion angle around 0° + + +# = 5 H-bond lengths ====================================================== + +# Let's do something a little less trivial and compare +# backbone H-bond lengths between helices and strands. + +# Secondary structure is defined in the bio3d object's ...$helix and ...$strand +# list elements. +str(apses) + +# We need to +# - collect all N atoms in alpha helices resp. +# beta strands; +# - collect all O atoms in alpha helices resp. +# beta strands; +# - fetch the atom coordinates; +# - calculate all N, O distances; +# - filter them for distances that indicate H-bonds; and, +# - plot the results. + +# Secondary structure can either be obtained from definitions contained in most +# PDB files, or by running the DSSP algorithm IF(!) you have it installed on +# your machine. See the dssp() function of bio3d for instructions how to obtain +# and install DSSP and STRIDE. This is highly recommended for "real" work with +# structure coordinate files. The 1BM8 file contains secondary structure +# definitions: + +apses$helix +apses$sheet + + +# A function to collect atom indices for particular type of secondary structure + +ssSelect <- function(PDB, myChain = "A", ssType, myElety) { + # Function to retrieve specified atom types from specified secondary + # structure types in a PDB object. + # Parameters: + # PDB A bio3D PDB object + # myChain chr The chain to use. Default: chain "A". + # ssType chr A vector of keywords "helix" and/or "sheet" + # myElety chr A vector of $eletype atom types to return + # Value: num Indices of the matching atom rows in PDB$atom + + # Build a vector of $resno numbers + starts <- numeric() + ends <- numeric() + if ("helix" %in% ssType) { + sel <- PDB$helix$chain %in% myChain + starts <- c(starts, PDB$helix$start[sel]) + ends <- c(ends, PDB$helix$end[sel]) + } + if ("sheet" %in% ssType) { + sel <- PDB$sheet$chain %in% myChain + starts <- c(starts, PDB$sheet$start[sel]) + ends <- c(ends, PDB$sheet$end[sel]) + } + myResno <- numeric() + for (i in seq_along(starts)) { + myResno <- c(myResno, starts[i]:ends[i]) + } + + # get id's from PDB + + x <- bio3d::atom.select(PDB, + string = "protein", + type = "ATOM", + chain = myChain, + resno = myResno, + elety = myElety) + + return(x$atom) +} + +# Example: +ssSelect(apses, ssType = "sheet", myElety = "N") +ssSelect(apses, ssType = "sheet", myElety = "O") + +# That looks correct: O atoms should be stored three index position after N: the +# sequence of atoms in a PDB file is usually N, CA, C, O ... followed by the +# side chain coordinates. + +# Now to extract the coordinates and calculate distances. Our function needs to +# take the PDB object and two vectors of atom indices as argument, and return a +# vector of pair-distances (actually dist.xyz() returns a matrix). + +pairDist <- function(PDB, a, b) { + # Calculate pairwise distances between atoms indicated by a and b + # Parameters: + # PDB A bio3D PDB object + # a int A vector of atom indexes + # b int A vector of atom indexes + # Value: num matrix of Euclidian distances between the atoms given in a, b. + # There are as many rows as atoms in a, as many columns as + # atoms in b. + + dMat <- numeric() + if (length(a) > 0 && length(b) > 0) { + + A <- PDB$atom[a, c("x", "y", "z")] + B <- PDB$atom[b, c("x", "y", "z")] + dMat <- bio3d::dist.xyz(A, B) + + } + return(dMat) +} + +# Let's see if this looks correct. Let's look at all the pairwise distances +# between N and O atoms in both types of secondary structure: + +iN <- ssSelect(apses, ssType = c("helix", "sheet"), myElety = "N") +iO <- ssSelect(apses, ssType = c("helix", "sheet"), myElety = "O") +x <- pairDist(apses, iN, iO) +hist(x, + breaks = 80, + col = "lavenderblush", + main = "", + xlab = "N-O distances (Å)") + +# Since we are collecting distance from all secondary structure elements, we +# are just seing a big peak of (meaningless) long-distance separations. We +# need to zoom in on the shorter distances, in which we expect +# hydrogen bonds: +hist(x[x < 4.2], # restrict to N-O distance less than 4.2 Å long + breaks=seq(2.0, 4.2, 0.1), + xlim=c(2.0,4.2), + col = "lavenderblush", + main = "", + xlab = "N-O distances (Å)") + +# There is a large peak at about 2.2Å, and another +# large peak above 3.5Å. But these are not typical hydrogen +# bond distances! Rather these are (N,O) pairs in peptide +# bonds, and within residues. That's not good, because these will contaminate +# our statistics. +# We need to exclude all distances between N of a residue +# and O of a preceeding residue, and all (N,O) pairs in the +# same residue. We need a function to filter distances by residue numbers. And while we are filtering, we might as well throw away the non-H bond distances too. + +filterHB <- function(PDB, iN, iO, dMat, cutoff = 3.9) { + # Filters distances between O(i-1) and N(i), and between N(i) and O(i) + # in a distance matrix where there is one row per N-atom and one + # column per O atom. + # Parameters: + # PDB a bio3D PDB object + # iN int a vector of N atom indexes + # iO int a vector of O atom indexes + # dMat num a distance matrix created by pairDist() + # cutoff num only return distances that are shorter than "cutoff + # Value: a distance matrix in which values that do not match the + # filter criteria have bee set to NA. + + if (length(iN) > 0 && length(iO) > 0) { + + resN <- PDB$atom$resno[iN] + resO <- PDB$atom$resno[iO] + + for (i in seq_along(resN)) { # for all N atoms + for (j in seq_along(resO)) { # for all O atoms + if (dMat[i, j] > cutoff || # if: distance > cutoff, or ... + (resN[i] - 1) == resO[j] || # distance is N(i)---O(i-1), or ... + resN[i] == resO[j]) { # distance is N(i)---O(i), then: + dMat[i, j] <- NA # set this distance to NA. + } + } + } + } + return(dMat) +} + +# Inspect the result: +hist(filterHB(apses, iN, iO, x), + breaks=seq(2.0, 4.2, 0.1), + xlim=c(2.0,4.2), + col = "paleturquoise", + main = "", + xlab = "N-O distances (Å)") + + +# Finally we can calculate alpha- and beta- structure +# bonds and compare them. In this section we'll explore +# different options for histogram plots. + +# H-bonds in helices ... +iN <- ssSelect(apses, ssType = c("helix"), myElety = "N") +iO <- ssSelect(apses, ssType = c("helix"), myElety = "O") +dH <- filterHB(apses, iN, iO, pairDist(apses, iN, iO)) +dH <- dH[!is.na(dH)] + +# H-bonds in sheets. (We commonly use the letter "E" to symbolize a beta +# strand or sheet, because "E" visually evokes an extended strand with +# protruding sidechains.) +iN <- ssSelect(apses, ssType = c("sheet"), myElety = "N") +iO <- ssSelect(apses, ssType = c("sheet"), myElety = "O") +dE <- filterHB(apses, iN, iO, pairDist(apses, iN, iO)) +dE <- dE[!is.na(dE)] + +# The plain histogram functions without parameters +# give us white stacks. + +hist(dH) + +# and ... +hist(dE) + +# We can see that the histrograms look different +# but that is better visualized by showing two plots +# in the same window. We use the par() function, for +# more flexible layout, look up the layout() function. +?par +?layout + +opar <- par(no.readonly=TRUE) # store current state +par(mfrow=c(2,1)) # set graphics parameters: 2 rows, one column + +# plot two histograms +hist(dH) +hist(dE) + + +# add colour: +hist(dH, col="#DD0055") +hist(dE, col="#00AA70") + + + +# For better comparison, plot both in the +# same window (use the "add = TRUE" parameter in hist() ): + +hist(dH, col="#DD0055") +hist(dE, col="#00AA70", add = TRUE) + +# ... oops, we dind't reset the graphics parameters. You can either use +# the broom icon of the Plot tab to clear asll plots, or ... +par(opar) # ... reset the graphics parameters + +hist(dH, col = "#DD0055") +hist(dE, col = "#00AA70", add = TRUE) + +# We see that the leftmost column of the sheet bonds hides the helix bonds in +# that column. Not good. But we can make the colours transparent! We just need to +# add a fourth set of two hexadecimal-numbers to the #RRGGBB triplet. (This +# sets the transparency of the colour, it is called the "alpha channel"). Lets +# use 2/3 transparent, in hexadecimal, 1/3 of 256 is x55 - i.e. an RGB triplet +# specied as #RRGGBB55 is only 33% opaque: + +hist(dH, col = "#DD005555") +hist(dE, col = "#00AA7055", add = TRUE) + +# To finalize the plots, let's do two more things: Explicitly define the breaks, +# to make sure they match up - otherwise they would not need to... like in this +# example: + +hist(dH, col ="#DD005555") +hist(dE[dE < 3], col = "#00AA7055", add = TRUE) + +# Breaks are a parameter in hist() that can either be a scalar, to define how +# many columns you want, or a vector, that defines the actual breakpoints. +brk=seq(2.4, 4.0, 0.1) + +hist(dH, col="#DD005555", breaks=brk) +hist(dE, col="#00AA7055", breaks=brk, add=TRUE) + +# The last thing to do is to think about rescaling the plot. You notice that the +# y-axis is scaled in absolute frequency (i.e. counts). That gives us some +# impression of the relative frequency, but it is of course skewed by observing +# relatively more or less of one type of secondary structure in a protein. As +# part of the hist() function we can rescale the values so that the sum over all +# is one: set the parameter freq=FALSE. And we explicitly set y-axis limits +# to accommodate bot distributions. + +hist(dH, col="#DD005555", breaks=brk, freq=FALSE, ylim = c(0, 4)) +hist(dE, col="#00AA7055", breaks=brk, freq=FALSE, add=TRUE) + +# Adding labels and legend ... + +hH <- hist(dH, + freq=FALSE, + breaks=brk, + col="#DD005550", + xlab="(N,O) distance (Å)", + ylab="Density", + ylim=c(0,4), + main="Helix and Sheet H-bond lengths") +hE <- hist(dE, + freq=FALSE, + breaks=brk, + col="#00AA7060", + add=TRUE) + +legend("topright", + c(sprintf("alpha (N = %3d)", sum(hH$counts)), + sprintf("beta (N = %3d)", sum(hE$counts))), + fill = c("#DD005550", "#00AA7060"), bty = 'n', + border = NA) + + +# With all the functions we have defined, +# it is easy to try this with a larger protein. +# 3ugj for example is VERY large. + +pdb <- bio3d::read.pdb("3ugj") + +# helices... +iN <- ssSelect(pdb, ssType = c("helix"), myElety = "N") +iO <- ssSelect(pdb, ssType = c("helix"), myElety = "O") +dH <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) +dH <- dH[!is.na(dH)] + +# sheets +iN <- ssSelect(pdb, ssType = c("sheet"), myElety = "N") +iO <- ssSelect(pdb, ssType = c("sheet"), myElety = "O") +dE <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) +dE <- dE[!is.na(dE)] + +# histograms ... +brk=seq(2.4, 4.0, 0.1) + +hH <- hist(dH, + freq=FALSE, + breaks=brk, + col="#DD005550", + xlab="(N,O) distance (Å)", + ylab="Density", + ylim=c(0,4), + main="Helix and Sheet H-bond lengths") +hE <- hist(dE, + freq=FALSE, + breaks=brk, + col="#00AA7060", + add=TRUE) + +legend('topright', + c(paste("alpha (N = ", sum(hH$counts), ")"), + paste("beta (N = ", sum(hE$counts), ")")), + fill = c("#DD005550", "#00AA7060"), bty = 'n', + border = NA, + inset = 0.1) + +# It's apparent that the distributions are indeed different. Our sample +# is large, but derives from a single protein. To do database scale statistics, +# we should look at many more proteins. To give you a sense of how, let's do +# this for just ten proteins, randomly selected from non-homologous, +# high-resolution, single domain structures. I have provided a utility function +# for such a selection (details beyond the scope of this project). + +myPDBs <- selectPDBrep(10) +# My selection is "2OVJ", "1HQS", "3BON", "4JZX", "3BQ3", "2IUM", "2C9E", +# "4X1F", "2V3I", "3GE3". Yours will be different. + +# We are loading the files online - don't do this if you have bandwidth +# limitations. + + +dH <- c() # collect all helix H-bonds here +dE <- c() # collect all sheet H-bonds here + +for (i in seq_along(myPDBs)) { + pdb <- bio3d::read.pdb(myPDBs[i]) + + # helices... + iN <- ssSelect(pdb, ssType = c("helix"), myElety = "N") + iO <- ssSelect(pdb, ssType = c("helix"), myElety = "O") + x <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) + dH <- c(dH, x[!is.na(x)]) + + # sheets + iN <- ssSelect(pdb, ssType = c("sheet"), myElety = "N") + iO <- ssSelect(pdb, ssType = c("sheet"), myElety = "O") + x <- filterHB(pdb, iN, iO, pairDist(pdb, iN, iO)) + dE <- c(dE, x[!is.na(x)]) +} + +# Inspect the results + +length(dH) # 4415 (your numbers are different, but there should be many) +length(dE) # 262 + +brk=seq(2.0, 4.0, 0.1) + +hH <- hist(dH, + freq=FALSE, + breaks=brk, + col="#DD005550", + xlab="(N,O) distance (Å)", + ylab="Density", + ylim=c(0,4), + cex.main = 0.8, + main="Helix and Sheet H-bond lengths (10 representative structures)") +hE <- hist(dE, + freq=FALSE, + breaks=brk, + col="#00AA7060", + add=TRUE) + +legend('topright', + c(paste("alpha (N = ", sum(hH$counts), ")"), + paste("beta (N = ", sum(hE$counts), ")")), + fill = c("#DD005550", "#00AA7060"), bty = 'n', + border = NA, + inset = 0.1) + +# Task: +# Why do you think these distributions are different? +# At what distance do you think H-bonds have the lowest energy? +# For alpha-helices? For beta-strands? + + + + +# [END] diff --git a/RPR-UniProt_GET.R b/RPR-UniProt_GET.R index 6a87854..4b6b4d4 100644 --- a/RPR-UniProt_GET.R +++ b/RPR-UniProt_GET.R @@ -1,135 +1,135 @@ -# tocID <- "RPR-UniProt_GET.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Scripting_data_downloads unit. -# -# Version: 1.2 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Maintenance. Made dbFetchUniProtSeq() vector-safe and -# added FASTA headers as attribute -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.0 First ABC units version -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ---------------------------------------------------------- -#TOC> 1 UniProt files via GET 43 -#TOC> 1.1 Task - fetchUniProtSeq() function 105 -#TOC> 2 Task solutions 118 -#TOC> -#TOC> ========================================================================== - - -# = 1 UniProt files via GET =============================================== - - -# Perhaps the simplest example of scripted download is to retrieve a protein -# FASTA sequence from UniProt. All we need is to construct an URL with the -# correct UniProt ID. - -# An interface between R scripts and Web servers is provided by the httr:: -# package. This sends and receives information via the http protocol, just like -# a Web browser. Since this is a short and simple request, the GET verb is the -# right tool: - -if (! requireNamespace("httr", quietly = TRUE)) { - install.packages("httr") -} -# Package information: -# library(help = httr) # basic information -# browseVignettes("httr") # available vignettes -# data(package = "httr") # available datasets - - -# The UniProt ID for Mbp1 is ... - -UniProtID <- "P39678" - -# and the base URL to retrieve data is ... -# http://www.uniprot.org/uniprot/ . We can construct a simple URL to -# retrieve a FASTA sequence: - -(URL <- sprintf("http://www.uniprot.org/uniprot/%s.fasta", UniProtID)) - -# the GET() function from httr will get the data. -response <- httr::GET(URL) - -str(response) # the response object is a bit complex ... -as.character(response) # ... but it is easy to pull out the data. - -# to process ... -x <- as.character(response) -x <- strsplit(x, "\n") -dbSanitizeSequence(x) - -# Simple. -# But what happens if there is an error, e.g. the uniprot ID does not exist? - -response <- httr::GET("http://www.uniprot.org/uniprot/X000000.fasta") -as.character(response) -# this is a large HTML page that tells us the URL was not found. So we need to -# check for errors. The Right Way to do this is to evaluate the staus code that -# every Web server returns for every transaction. -# -httr::status_code(response) # 404 == Page Not Found - -# There are many possible codes, but the only code we will be happy with -# is 200 - oK. -# (cf. https://en.wikipedia.org/wiki/List_of_HTTP_status_codes ) - -URL <- sprintf("http://www.uniprot.org/uniprot/%s.fasta", UniProtID) -response <- httr::GET(URL) -httr::status_code(response) - - -# == 1.1 Task - fetchUniProtSeq() function ================================= - -# Task: write a function that -# - takes as input a vector of UniProt IDs, -# - fetches the FASTA sequence for each -# - returns a vector of the same length as the input, where an element is: -# - ... the sequence, if the query was successful -# - ... NA if there was an error -# - each element has the UniProt ID as the name() -# - bonus: the output has an attribute "headers" that is a vector of the -# FASTA headers ( cf. ?attr ) - - -# = 2 Task solutions ====================================================== - - -# I have placed such a function - dbFetchUniProtSeq() - into -# "./scripts/ABC-dbUtilities.R": look it up by clicking on dbFetchUniProtSeq() -# in the Environment pane. - -# Test this: -( x <- dbFetchUniProtSeq("P39678") ) -names(x)[1] -attr(x, "headers")[1] -x[1] -cat(writeFASTA(data.frame(head = attr(x, "headers")[1], seq =x[1]), - width = 40), sep = "\n") - - - -# [END] +# tocID <- "RPR-UniProt_GET.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Scripting_data_downloads unit. +# +# Version: 1.2 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Maintenance. Made dbFetchUniProtSeq() vector-safe and +# added FASTA headers as attribute +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.0 First ABC units version +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ---------------------------------------------------------- +#TOC> 1 UniProt files via GET 43 +#TOC> 1.1 Task - fetchUniProtSeq() function 105 +#TOC> 2 Task solutions 118 +#TOC> +#TOC> ========================================================================== + + +# = 1 UniProt files via GET =============================================== + + +# Perhaps the simplest example of scripted download is to retrieve a protein +# FASTA sequence from UniProt. All we need is to construct an URL with the +# correct UniProt ID. + +# An interface between R scripts and Web servers is provided by the httr:: +# package. This sends and receives information via the http protocol, just like +# a Web browser. Since this is a short and simple request, the GET verb is the +# right tool: + +if (! requireNamespace("httr", quietly = TRUE)) { + install.packages("httr") +} +# Package information: +# library(help = httr) # basic information +# browseVignettes("httr") # available vignettes +# data(package = "httr") # available datasets + + +# The UniProt ID for Mbp1 is ... + +UniProtID <- "P39678" + +# and the base URL to retrieve data is ... +# http://www.uniprot.org/uniprot/ . We can construct a simple URL to +# retrieve a FASTA sequence: + +(URL <- sprintf("http://www.uniprot.org/uniprot/%s.fasta", UniProtID)) + +# the GET() function from httr will get the data. +response <- httr::GET(URL) + +str(response) # the response object is a bit complex ... +as.character(response) # ... but it is easy to pull out the data. + +# to process ... +x <- as.character(response) +x <- strsplit(x, "\n") +dbSanitizeSequence(x) + +# Simple. +# But what happens if there is an error, e.g. the uniprot ID does not exist? + +response <- httr::GET("http://www.uniprot.org/uniprot/X000000.fasta") +as.character(response) +# this is a large HTML page that tells us the URL was not found. So we need to +# check for errors. The Right Way to do this is to evaluate the staus code that +# every Web server returns for every transaction. +# +httr::status_code(response) # 404 == Page Not Found + +# There are many possible codes, but the only code we will be happy with +# is 200 - oK. +# (cf. https://en.wikipedia.org/wiki/List_of_HTTP_status_codes ) + +URL <- sprintf("http://www.uniprot.org/uniprot/%s.fasta", UniProtID) +response <- httr::GET(URL) +httr::status_code(response) + + +# == 1.1 Task - fetchUniProtSeq() function ================================= + +# Task: write a function that +# - takes as input a vector of UniProt IDs, +# - fetches the FASTA sequence for each +# - returns a vector of the same length as the input, where an element is: +# - ... the sequence, if the query was successful +# - ... NA if there was an error +# - each element has the UniProt ID as the name() +# - bonus: the output has an attribute "headers" that is a vector of the +# FASTA headers ( cf. ?attr ) + + +# = 2 Task solutions ====================================================== + + +# I have placed such a function - dbFetchUniProtSeq() - into +# "./scripts/ABC-dbUtilities.R": look it up by clicking on dbFetchUniProtSeq() +# in the Environment pane. + +# Test this: +( x <- dbFetchUniProtSeq("P39678") ) +names(x)[1] +attr(x, "headers")[1] +x[1] +cat(writeFASTA(data.frame(head = attr(x, "headers")[1], seq =x[1]), + width = 40), sep = "\n") + + + +# [END] diff --git a/RPR-Unit_testing.R b/RPR-Unit_testing.R index 5f4a26e..c599648 100644 --- a/RPR-Unit_testing.R +++ b/RPR-Unit_testing.R @@ -1,234 +1,234 @@ -# tocID <- "RPR-Unit_testing.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Unit_testing unit. -# -# Version: 1.2 -# -# Date: 2017 10 - 2019 01 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Updates. Discuss local tests. -# 1.1 Change from require() to requireNamespace() -# 1.0 New code -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------- -#TOC> 1 Unit Tests with testthat 42 -#TOC> 2 Organizing your tests 165 -#TOC> 2.1 Testing scripts 189 -#TOC> 2.2 Rethinking testing 202 -#TOC> 3 Task solutions 220 -#TOC> -#TOC> ========================================================================== - - -# = 1 Unit Tests with testthat ============================================ - -# The testthat package supports writing and executing unit tests in many ways. - -if (! requireNamespace("testthat", quietly = TRUE)) { - install.packages("testthat") -} -# Package information: -# library(help = testthat) # basic information -# browseVignettes("testthat") # available vignettes -# data(package = "testthat") # available datasets - -# testthat is one of those packages that we either use A LOT in a script, -# or not at all. Therefore it's more reasonable to depart from our usual -# ::() idiom, and load the entire library. In fact, if -# we author packages, it is common practice to load testthat in the part -# of the package that automates testing. - -library(testthat) - -# An atomic test consists of an expectation about the bahaviour of a function or -# the existence of an object. testthat provides a number of useful expectations: - -# At the most basic level, you can use expect_true() and expect_false(): - -expect_true(file.exists("./data/S288C_YDL056W_MBP1_coding.fsa")) -expect_true(file.exists("NO-SUCH-FILE.txt")) - -expect_false(is.integer(NA)) - -# More commonly, you will test for equality of an output with a given result. -# But you need to consider what it means for two numbers to be "equal" on a -# digital computer. Consider: - -49*(1/49) == 1 # Surprised? Read FAQ 7.31 - # https://cran.r-project.org/doc/FAQ/R-FAQ.html -49*(1/49) - 1 # NOT zero (but almost) - -# This is really unpredictable ... -0.1 + 0.05 == 0.15 -0.2 + 0.07 == 0.27 - -# It's easy to be caught on the wrong foot with numeric comparisons, therefore -# R uses the function all.equal() to test whether two numbers are equal for -# practical puposes up to machine precision. -49*(1/49) == 1 -all.equal(49*(1/49), 1) - -# The testthat function expect_equal() uses all.equal internally: -expect_equal(49*(1/49), 1) - -# ... which is reasonable, or, if things MUST be exactly the same ... -expect_identical(49*(1/49), 1) - -# ... but consider: -expect_identical(2, 2L) # one is typeof() "double", the other is integer" - -# Some very useful expectations are expect_warning(), and expect_error(), for -# constructing tests that check for erroneous output: - -as.integer(c("1", "2", "three")) -expect_warning(as.integer(c("1", "2", "three"))) # Note that the warning is NOT - # printed. -1/"x" -expect_warning(1/"x") -expect_error(1/"x") # Again: note that the error is NOT printed, as well - # code execution will continue. - -# Even better, you can check if the warning or error is what you expect it -# to be - because it could actually have occured somewhere else in your code. - -v <- c("1", "x") -log(v[1:2]) -expect_error(log(v[1:2]), "non-numeric argument to mathematical function") -expect_error(log(v[1:2]), "non-numeric") # We can abbreviate the error message. -expect_error(log(v[1,2])) # This appears oK, but ... -expect_error(log(v[1,2]), "non-numeric") # ... it's actually a different error! - -# Producing unit tests simply means: we define a function, and then we check -# whether all test pass. Consider a function that is loaded on startup from -# the .utilities.R script: - -biCode - -# We could test it like so: - -expect_equal(biCode(""), ".....") -expect_equal(biCode(" "), ".....") -expect_equal(biCode("123 12"), ".....") -expect_equal(biCode("h sapiens"), "H..SA") -expect_equal(biCode("homo sapiens"), "HOMSA") -expect_equal(biCode("[homo sapiens neanderthaliensis]"), "HOMSA") -expect_equal(biCode(c("Phascolarctos cinereus", "Macropus rufus")), - c("PHACI", "MACRU")) -expect_error(biCode(), "argument \"s\" is missing, with no default") - -# The test_that() function allows to group related tests, include an informative -# message which test is being executed, and run a number of tests that are -# passed to the function inside a code block - i.e. {...} -# test_that(", {}) - -test_that("NA values are preserved", { - # bicode() respects vector length: input and output must have the smae length. - # Therefore NA's can't be simply skipped, bust must be properly passed - # into output: - expect_true(is.na((biCode(NA)))) - expect_equal(biCode(c("first", NA, "last")), - c("FIRST", NA, "LAST.")) -}) - - -# Task: Write a function calcGC() that calculates GC content in a sequence. -# Hint: you could strsplit() the sequence into a vector, and count -# G's and C's; or you could use gsub("[AT]", "", ) to remove -# A's and T's, and use nchar() before and after to calculate the content -# from the length difference. -# Then write tests that: -# confirm that calcGC("AATT") is 0; -# confirm that calcGC("ATGC") is 0.5; -# confirm that calcGC("AC") is 0.5; -# confirm that calcGC("CGCG") is 1; - - -# = 2 Organizing your tests =============================================== - - -# Tests are only useful if they are actually executed and we need to make sure -# there are no barriers to do that. The testthat package supports automatic -# execution of tests: -# - put your tests into an R-script, -# - save your tests in a file called "test_.R" -# - execute the test with test_file("test_.R") ... -# ... or, if you are working on a project ... -# - place the file in a test-directory (e.g. the directory "test" in this -# project), -# - execute all your tests with test_dir("") - -# For example I have provided a "tests" directory with this project, and -# placed the file "test_biCode.R" inside. -file.show("./tests/test_biCode.R") - -# Execute the file ... -test_file("./tests/test_biCode.R") - -# .. or execute all the test files in the directory: -test_dir("./tests") - -# == 2.1 Testing scripts =================================================== - -# Scripts need special consideration since we do not necessarily source() them -# entirely. Therefore automated testing is not reasonable. What you can do -# instead is to place a conditional block at the end of your script, that -# never gets executed - then you can manually execute the code in the block -# whenever you wish to test your functions. For example: - -if (FALSE) { - # ... your tests go here - -} - -# == 2.2 Rethinking testing ================================================ - -# However, it is important to keep in mind that different objectives lead to -# different ideas of what works best. There is never a "best" in and of itself, -# the question is always: "Best for what?" While automated unit testing is a -# great way to assure the integrity of packages and larger software artefacts as -# they are being developed, more loosely conceived aggregates of code - like the -# scripts for this course for example - have different objectives and in this -# case I find the testthat approach to actually be inferior. The reason is its -# tendency to physically separate code and tests. Keeping assets, and functions -# that operate on those assets separated is always poor design. I have found -# over time that a more stable approach is to move individual functions into -# their individual scripts, all in one folder, one function (and its helpers) -# per file, and examples, demos and tests in an if (FALSE) { ... } block, as -# explained above. - - - -# = 3 Task solutions ====================================================== - -calcGC <- function(s) { - s <- gsub("[^agctAGCT]", "", s) - return(nchar(gsub("[atAT]", "", s)) / nchar(s)) -} - -expect_equal(calcGC("AATT"), 0) -expect_equal(calcGC("ATGC"), 0.5) -expect_equal(calcGC("AC"), 0.5) -expect_equal(calcGC("CGCG"), 1) - - - -# [END] +# tocID <- "RPR-Unit_testing.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Unit_testing unit. +# +# Version: 1.2 +# +# Date: 2017 10 - 2019 01 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Updates. Discuss local tests. +# 1.1 Change from require() to requireNamespace() +# 1.0 New code +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------- +#TOC> 1 Unit Tests with testthat 42 +#TOC> 2 Organizing your tests 165 +#TOC> 2.1 Testing scripts 189 +#TOC> 2.2 Rethinking testing 202 +#TOC> 3 Task solutions 220 +#TOC> +#TOC> ========================================================================== + + +# = 1 Unit Tests with testthat ============================================ + +# The testthat package supports writing and executing unit tests in many ways. + +if (! requireNamespace("testthat", quietly = TRUE)) { + install.packages("testthat") +} +# Package information: +# library(help = testthat) # basic information +# browseVignettes("testthat") # available vignettes +# data(package = "testthat") # available datasets + +# testthat is one of those packages that we either use A LOT in a script, +# or not at all. Therefore it's more reasonable to depart from our usual +# ::() idiom, and load the entire library. In fact, if +# we author packages, it is common practice to load testthat in the part +# of the package that automates testing. + +library(testthat) + +# An atomic test consists of an expectation about the bahaviour of a function or +# the existence of an object. testthat provides a number of useful expectations: + +# At the most basic level, you can use expect_true() and expect_false(): + +expect_true(file.exists("./data/S288C_YDL056W_MBP1_coding.fsa")) +expect_true(file.exists("NO-SUCH-FILE.txt")) + +expect_false(is.integer(NA)) + +# More commonly, you will test for equality of an output with a given result. +# But you need to consider what it means for two numbers to be "equal" on a +# digital computer. Consider: + +49*(1/49) == 1 # Surprised? Read FAQ 7.31 + # https://cran.r-project.org/doc/FAQ/R-FAQ.html +49*(1/49) - 1 # NOT zero (but almost) + +# This is really unpredictable ... +0.1 + 0.05 == 0.15 +0.2 + 0.07 == 0.27 + +# It's easy to be caught on the wrong foot with numeric comparisons, therefore +# R uses the function all.equal() to test whether two numbers are equal for +# practical puposes up to machine precision. +49*(1/49) == 1 +all.equal(49*(1/49), 1) + +# The testthat function expect_equal() uses all.equal internally: +expect_equal(49*(1/49), 1) + +# ... which is reasonable, or, if things MUST be exactly the same ... +expect_identical(49*(1/49), 1) + +# ... but consider: +expect_identical(2, 2L) # one is typeof() "double", the other is integer" + +# Some very useful expectations are expect_warning(), and expect_error(), for +# constructing tests that check for erroneous output: + +as.integer(c("1", "2", "three")) +expect_warning(as.integer(c("1", "2", "three"))) # Note that the warning is NOT + # printed. +1/"x" +expect_warning(1/"x") +expect_error(1/"x") # Again: note that the error is NOT printed, as well + # code execution will continue. + +# Even better, you can check if the warning or error is what you expect it +# to be - because it could actually have occured somewhere else in your code. + +v <- c("1", "x") +log(v[1:2]) +expect_error(log(v[1:2]), "non-numeric argument to mathematical function") +expect_error(log(v[1:2]), "non-numeric") # We can abbreviate the error message. +expect_error(log(v[1,2])) # This appears oK, but ... +expect_error(log(v[1,2]), "non-numeric") # ... it's actually a different error! + +# Producing unit tests simply means: we define a function, and then we check +# whether all test pass. Consider a function that is loaded on startup from +# the .utilities.R script: + +biCode + +# We could test it like so: + +expect_equal(biCode(""), ".....") +expect_equal(biCode(" "), ".....") +expect_equal(biCode("123 12"), ".....") +expect_equal(biCode("h sapiens"), "H..SA") +expect_equal(biCode("homo sapiens"), "HOMSA") +expect_equal(biCode("[homo sapiens neanderthaliensis]"), "HOMSA") +expect_equal(biCode(c("Phascolarctos cinereus", "Macropus rufus")), + c("PHACI", "MACRU")) +expect_error(biCode(), "argument \"s\" is missing, with no default") + +# The test_that() function allows to group related tests, include an informative +# message which test is being executed, and run a number of tests that are +# passed to the function inside a code block - i.e. {...} +# test_that(", {}) + +test_that("NA values are preserved", { + # bicode() respects vector length: input and output must have the smae length. + # Therefore NA's can't be simply skipped, bust must be properly passed + # into output: + expect_true(is.na((biCode(NA)))) + expect_equal(biCode(c("first", NA, "last")), + c("FIRST", NA, "LAST.")) +}) + + +# Task: Write a function calcGC() that calculates GC content in a sequence. +# Hint: you could strsplit() the sequence into a vector, and count +# G's and C's; or you could use gsub("[AT]", "", ) to remove +# A's and T's, and use nchar() before and after to calculate the content +# from the length difference. +# Then write tests that: +# confirm that calcGC("AATT") is 0; +# confirm that calcGC("ATGC") is 0.5; +# confirm that calcGC("AC") is 0.5; +# confirm that calcGC("CGCG") is 1; + + +# = 2 Organizing your tests =============================================== + + +# Tests are only useful if they are actually executed and we need to make sure +# there are no barriers to do that. The testthat package supports automatic +# execution of tests: +# - put your tests into an R-script, +# - save your tests in a file called "test_.R" +# - execute the test with test_file("test_.R") ... +# ... or, if you are working on a project ... +# - place the file in a test-directory (e.g. the directory "test" in this +# project), +# - execute all your tests with test_dir("") + +# For example I have provided a "tests" directory with this project, and +# placed the file "test_biCode.R" inside. +file.show("./tests/test_biCode.R") + +# Execute the file ... +test_file("./tests/test_biCode.R") + +# .. or execute all the test files in the directory: +test_dir("./tests") + +# == 2.1 Testing scripts =================================================== + +# Scripts need special consideration since we do not necessarily source() them +# entirely. Therefore automated testing is not reasonable. What you can do +# instead is to place a conditional block at the end of your script, that +# never gets executed - then you can manually execute the code in the block +# whenever you wish to test your functions. For example: + +if (FALSE) { + # ... your tests go here + +} + +# == 2.2 Rethinking testing ================================================ + +# However, it is important to keep in mind that different objectives lead to +# different ideas of what works best. There is never a "best" in and of itself, +# the question is always: "Best for what?" While automated unit testing is a +# great way to assure the integrity of packages and larger software artefacts as +# they are being developed, more loosely conceived aggregates of code - like the +# scripts for this course for example - have different objectives and in this +# case I find the testthat approach to actually be inferior. The reason is its +# tendency to physically separate code and tests. Keeping assets, and functions +# that operate on those assets separated is always poor design. I have found +# over time that a more stable approach is to move individual functions into +# their individual scripts, all in one folder, one function (and its helpers) +# per file, and examples, demos and tests in an if (FALSE) { ... } block, as +# explained above. + + + +# = 3 Task solutions ====================================================== + +calcGC <- function(s) { + s <- gsub("[^agctAGCT]", "", s) + return(nchar(gsub("[atAT]", "", s)) / nchar(s)) +} + +expect_equal(calcGC("AATT"), 0) +expect_equal(calcGC("ATGC"), 0.5) +expect_equal(calcGC("AC"), 0.5) +expect_equal(calcGC("CGCG"), 1) + + + +# [END] diff --git a/RPR-eUtils_XML.R b/RPR-eUtils_XML.R index f22f6c6..e097588 100644 --- a/RPR-eUtils_XML.R +++ b/RPR-eUtils_XML.R @@ -1,166 +1,166 @@ -# tocID <- "RPR-eUtils_XML.R" -# -# Purpose: A Bioinformatics Course: -# R code accompanying the RPR-Scripting_data_downloads unit. -# -# Version: 1.2.1 -# -# Date: 2017-10 - 2021-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2.1 2021 Maintenance -# 1.2 2020 Updates -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.0 First ABC units version -# 0.1 First code copied from 2016 material. -# -# -# TODO: -# -# -# == DO NOT SIMPLY source() THIS FILE! ======================================= -# -# If there are portions you don't understand, use R's help system, Google for an -# answer, or ask your instructor. Don't continue if you don't understand what's -# going on. That's not how it works ... -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ----------------------------------------------------------- -#TOC> 1 Working with NCBI eUtils 43 -#TOC> 1.1 Task - fetchNCBItaxData() function 145 -#TOC> 2 Task solutions 152 -#TOC> -#TOC> ========================================================================== - - -# = 1 Working with NCBI eUtils ============================================ - - -# To begin, we load the xml2 package that contains functions -# we need to receive and parse html data. NCBI's eUtils send information in -# XML format so we need to be able to parse XML. -if (! requireNamespace("xml2", quietly=TRUE)) { - install.packages("xml2") -} -# Package information: -# library(help = xml2) # basic information -# browseVignettes("xml2") # available vignettes -# data(package = "xml2") # available datasets - - - -# We will walk through the process with the refSeqID -# of yeast Mbp1 -refSeqID <- "NP_010227" - - -# First we build a query URL... -eUtilsBase <- "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/" - - -# Then we assemble an URL that will search for get the -# unique, NCBI internal identifier, -# for our refSeqID... -URL <- paste(eUtilsBase, - "esearch.fcgi?", # ...using the esearch program - # that finds an entry in an - # NCBI database - "db=protein", - "&term=", refSeqID, - sep="") -# Copy the URL and paste it into your browser to see -# what the response should look like. -URL - -# To fetch a response in R, we use the function read_xml() -# with our URL as its argument. -( myXML <- xml2::read_xml(URL) ) - -# This is XML. We can take the response apart into -# its individual components with the as_list() function. - -xml2::as_list(myXML) - -# Note how the XML "tree" is represented as a list of -# lists of lists ... -# If we know exactly what element we are looking for, -# we can extract it from this structure: -xml2::as_list(myXML)[["eSearchResult"]][["IdList"]][["Id"]][[1]] - -# But this is not very robust, it would break with the -# slightest change that the NCBI makes to their data format - -# and the NCBI changes things A LOT! - -# Somewhat more robust is to specify the type of element -# we want - its the text contained in an ... -# element, and use the XPath XML parsing language to -# retrieve it. - -xml2::xml_find_all(myXML, "//Id") # returns a "node set" - -xml2::xml_text(xml2::xml_find_all(myXML, "//Id")) # returns the contents - # of the node set - -# We will need to do this more than once, so we write a function -# for it... -node2text <- function(doc, tag) { - # an extractor function for the contents of elements - # between given tags in an XML response. - # Contents of all matching elements is returned in - # a vector of strings. - path <- paste0("//", tag) - nodes <- xml2::xml_find_all(doc, path) - return(xml2::xml_text(nodes)) -} - -# using node2text() ... -(GID <- node2text(myXML, "Id")) - -# The GI is the pivot for data requests at the -# NCBI. - -# Let's first get the associated data for this GI -URL <- paste0(eUtilsBase, - "esummary.fcgi?", - "db=protein", - "&id=", - GID, - "&version=2.0") -(myXML <- xml2::read_xml(URL)) - -(taxID <- node2text(myXML, "TaxId")) -(organism <- node2text(myXML, "Organism")) - -# This forms the base of a function that gets taxonomy data -# from an Entrez result. You can write this! - - -# == 1.1 Task - fetchNCBItaxData() function ================================ - -# Task: write a function that takes as input a RefSeq ID, fetches the taxonomy -# information, returns a list with taxID and organism, if the operation is -# successful, or a list of length 0 if there is an error. - - -# = 2 Task solutions ====================================================== - -# I have placed such a function into the dbUtilities script: look it up by -# clicking on dbFetchNCBItaxData() in the Environment pane. - -# Test: -dbFetchNCBItaxData("XP_001837394") - -# Expected outout: -# ---------------- -# taxID organism -# 1 240176 Coprinopsis cinerea okayama7#130 - - -# [END] +# tocID <- "RPR-eUtils_XML.R" +# +# Purpose: A Bioinformatics Course: +# R code accompanying the RPR-Scripting_data_downloads unit. +# +# Version: 1.2.1 +# +# Date: 2017-10 - 2021-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2.1 2021 Maintenance +# 1.2 2020 Updates +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.0 First ABC units version +# 0.1 First code copied from 2016 material. +# +# +# TODO: +# +# +# == DO NOT SIMPLY source() THIS FILE! ======================================= +# +# If there are portions you don't understand, use R's help system, Google for an +# answer, or ask your instructor. Don't continue if you don't understand what's +# going on. That's not how it works ... +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ----------------------------------------------------------- +#TOC> 1 Working with NCBI eUtils 43 +#TOC> 1.1 Task - fetchNCBItaxData() function 145 +#TOC> 2 Task solutions 152 +#TOC> +#TOC> ========================================================================== + + +# = 1 Working with NCBI eUtils ============================================ + + +# To begin, we load the xml2 package that contains functions +# we need to receive and parse html data. NCBI's eUtils send information in +# XML format so we need to be able to parse XML. +if (! requireNamespace("xml2", quietly=TRUE)) { + install.packages("xml2") +} +# Package information: +# library(help = xml2) # basic information +# browseVignettes("xml2") # available vignettes +# data(package = "xml2") # available datasets + + + +# We will walk through the process with the refSeqID +# of yeast Mbp1 +refSeqID <- "NP_010227" + + +# First we build a query URL... +eUtilsBase <- "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/" + + +# Then we assemble an URL that will search for get the +# unique, NCBI internal identifier, +# for our refSeqID... +URL <- paste(eUtilsBase, + "esearch.fcgi?", # ...using the esearch program + # that finds an entry in an + # NCBI database + "db=protein", + "&term=", refSeqID, + sep="") +# Copy the URL and paste it into your browser to see +# what the response should look like. +URL + +# To fetch a response in R, we use the function read_xml() +# with our URL as its argument. +( myXML <- xml2::read_xml(URL) ) + +# This is XML. We can take the response apart into +# its individual components with the as_list() function. + +xml2::as_list(myXML) + +# Note how the XML "tree" is represented as a list of +# lists of lists ... +# If we know exactly what element we are looking for, +# we can extract it from this structure: +xml2::as_list(myXML)[["eSearchResult"]][["IdList"]][["Id"]][[1]] + +# But this is not very robust, it would break with the +# slightest change that the NCBI makes to their data format - +# and the NCBI changes things A LOT! + +# Somewhat more robust is to specify the type of element +# we want - its the text contained in an ... +# element, and use the XPath XML parsing language to +# retrieve it. + +xml2::xml_find_all(myXML, "//Id") # returns a "node set" + +xml2::xml_text(xml2::xml_find_all(myXML, "//Id")) # returns the contents + # of the node set + +# We will need to do this more than once, so we write a function +# for it... +node2text <- function(doc, tag) { + # an extractor function for the contents of elements + # between given tags in an XML response. + # Contents of all matching elements is returned in + # a vector of strings. + path <- paste0("//", tag) + nodes <- xml2::xml_find_all(doc, path) + return(xml2::xml_text(nodes)) +} + +# using node2text() ... +(GID <- node2text(myXML, "Id")) + +# The GI is the pivot for data requests at the +# NCBI. + +# Let's first get the associated data for this GI +URL <- paste0(eUtilsBase, + "esummary.fcgi?", + "db=protein", + "&id=", + GID, + "&version=2.0") +(myXML <- xml2::read_xml(URL)) + +(taxID <- node2text(myXML, "TaxId")) +(organism <- node2text(myXML, "Organism")) + +# This forms the base of a function that gets taxonomy data +# from an Entrez result. You can write this! + + +# == 1.1 Task - fetchNCBItaxData() function ================================ + +# Task: write a function that takes as input a RefSeq ID, fetches the taxonomy +# information, returns a list with taxID and organism, if the operation is +# successful, or a list of length 0 if there is an error. + + +# = 2 Task solutions ====================================================== + +# I have placed such a function into the dbUtilities script: look it up by +# clicking on dbFetchNCBItaxData() in the Environment pane. + +# Test: +dbFetchNCBItaxData("XP_001837394") + +# Expected outout: +# ---------------- +# taxID organism +# 1 240176 Coprinopsis cinerea okayama7#130 + + +# [END] diff --git a/data/0TST.pdb b/data/0TST.pdb index ccb631c..44bf1bd 100644 --- a/data/0TST.pdb +++ b/data/0TST.pdb @@ -1,10 +1,10 @@ -HEADER TEST 0TST 0TST 1 -REMARK A CATALOGUE OF ATOM AND HETATM RECORDS 0TST 2 -ATOM 1 N GLY 1 -6.253 75.745 53.559 1.00 36.34 0TST 3 -ATOM 2 CA GLY 1 -5.789 75.223 52.264 1.00 44.94 0TST 4 -ATOM 3 C GLY 1 -5.592 73.702 52.294 1.00 32.28 0TST 5 -ATOM 4 O GLY 1 -5.140 73.148 53.304 1.00 19.32 0TST 6 -TER 5 GLY 1 0TST 7 -HETATM 6 O HOH 1 -4.169 60.050 40.145 1.00 3.00 0TST 8 -HETATM 7 CA CA 1 -1.258 -71.579 50.253 1.00 3.00 0TST 9 -END 0TST 10 +HEADER TEST 0TST 0TST 1 +REMARK A CATALOGUE OF ATOM AND HETATM RECORDS 0TST 2 +ATOM 1 N GLY 1 -6.253 75.745 53.559 1.00 36.34 0TST 3 +ATOM 2 CA GLY 1 -5.789 75.223 52.264 1.00 44.94 0TST 4 +ATOM 3 C GLY 1 -5.592 73.702 52.294 1.00 32.28 0TST 5 +ATOM 4 O GLY 1 -5.140 73.148 53.304 1.00 19.32 0TST 6 +TER 5 GLY 1 0TST 7 +HETATM 6 O HOH 1 -4.169 60.050 40.145 1.00 3.00 0TST 8 +HETATM 7 CA CA 1 -1.258 -71.579 50.253 1.00 3.00 0TST 9 +END 0TST 10 diff --git a/data/1BM8.pdb b/data/1BM8.pdb index 552801e..91daf57 100644 --- a/data/1BM8.pdb +++ b/data/1BM8.pdb @@ -1,1552 +1,1552 @@ -HEADER CELL CYCLE 29-JUL-98 1BM8 -TITLE DNA-BINDING DOMAIN OF MBP1 -COMPND MOL_ID: 1; -COMPND 2 MOLECULE: TRANSCRIPTION FACTOR MBP1; -COMPND 3 CHAIN: A; -COMPND 4 FRAGMENT: N-TERMINAL DNA-BINDING DOMAIN; -COMPND 5 SYNONYM: MCB (MLUI CELL-CYLE BOX) BINDING PROTEIN; -COMPND 6 ENGINEERED: YES -SOURCE MOL_ID: 1; -SOURCE 2 ORGANISM_SCIENTIFIC: SACCHAROMYCES CEREVISIAE; -SOURCE 3 ORGANISM_COMMON: BAKER'S YEAST; -SOURCE 4 ORGANISM_TAXID: 4932; -SOURCE 5 CELL_LINE: BL21; -SOURCE 6 EXPRESSION_SYSTEM: ESCHERICHIA COLI; -SOURCE 7 EXPRESSION_SYSTEM_TAXID: 562; -SOURCE 8 EXPRESSION_SYSTEM_STRAIN: BL21 (DE3) PLYSS; -SOURCE 9 EXPRESSION_SYSTEM_PLASMID: BL21 (DE3) PLYSS/PET43 -KEYWDS CELL CYCLE, CYCLINS, DNA SYNTHESIS, HELIX-TURN-HELIX DNA- -KEYWDS 2 BINDING DOMAIN, MULTIWAVELENGTH ANOMALOUS DIFFRACTION, -KEYWDS 3 TRANSCRIPTION FACTOR -EXPDTA X-RAY DIFFRACTION -AUTHOR R.-M.XU,C.KOCH,Y.LIU,J.R.HORTON,D.KNAPP,K.NASMYTH,X.CHENG -REVDAT 2 24-FEB-09 1BM8 1 VERSN -REVDAT 1 02-MAR-99 1BM8 0 -JRNL AUTH R.M.XU,C.KOCH,Y.LIU,J.R.HORTON,D.KNAPP,K.NASMYTH, -JRNL AUTH 2 X.CHENG -JRNL TITL CRYSTAL STRUCTURE OF THE DNA-BINDING DOMAIN OF -JRNL TITL 2 MBP1, A TRANSCRIPTION FACTOR IMPORTANT IN -JRNL TITL 3 CELL-CYCLE CONTROL OF DNA SYNTHESIS. -JRNL REF STRUCTURE V. 5 349 1997 -JRNL REFN ISSN 0969-2126 -JRNL PMID 9083114 -JRNL DOI 10.1016/S0969-2126(97)00192-5 -REMARK 1 -REMARK 2 -REMARK 2 RESOLUTION. 1.71 ANGSTROMS. -REMARK 3 -REMARK 3 REFINEMENT. -REMARK 3 PROGRAM : X-PLOR 3.851 -REMARK 3 AUTHORS : BRUNGER -REMARK 3 -REMARK 3 DATA USED IN REFINEMENT. -REMARK 3 RESOLUTION RANGE HIGH (ANGSTROMS) : 1.71 -REMARK 3 RESOLUTION RANGE LOW (ANGSTROMS) : 5.00 -REMARK 3 DATA CUTOFF (SIGMA(F)) : 0.000 -REMARK 3 DATA CUTOFF HIGH (ABS(F)) : NULL -REMARK 3 DATA CUTOFF LOW (ABS(F)) : NULL -REMARK 3 COMPLETENESS (WORKING+TEST) (%) : 93.6 -REMARK 3 NUMBER OF REFLECTIONS : 10273 -REMARK 3 -REMARK 3 FIT TO DATA USED IN REFINEMENT. -REMARK 3 CROSS-VALIDATION METHOD : NULL -REMARK 3 FREE R VALUE TEST SET SELECTION : RANDOM -REMARK 3 R VALUE (WORKING SET) : 0.197 -REMARK 3 FREE R VALUE : 0.261 -REMARK 3 FREE R VALUE TEST SET SIZE (%) : 10.000 -REMARK 3 FREE R VALUE TEST SET COUNT : NULL -REMARK 3 ESTIMATED ERROR OF FREE R VALUE : NULL -REMARK 3 -REMARK 3 FIT IN THE HIGHEST RESOLUTION BIN. -REMARK 3 TOTAL NUMBER OF BINS USED : 8 -REMARK 3 BIN RESOLUTION RANGE HIGH (A) : 1.71 -REMARK 3 BIN RESOLUTION RANGE LOW (A) : 1.78 -REMARK 3 BIN COMPLETENESS (WORKING+TEST) (%) : 34.10 -REMARK 3 REFLECTIONS IN BIN (WORKING SET) : 535 -REMARK 3 BIN R VALUE (WORKING SET) : 0.4020 -REMARK 3 BIN FREE R VALUE : 0.3350 -REMARK 3 BIN FREE R VALUE TEST SET SIZE (%) : 10.00 -REMARK 3 BIN FREE R VALUE TEST SET COUNT : NULL -REMARK 3 ESTIMATED ERROR OF BIN FREE R VALUE : NULL -REMARK 3 -REMARK 3 NUMBER OF NON-HYDROGEN ATOMS USED IN REFINEMENT. -REMARK 3 PROTEIN ATOMS : 812 -REMARK 3 NUCLEIC ACID ATOMS : 0 -REMARK 3 HETEROGEN ATOMS : 0 -REMARK 3 SOLVENT ATOMS : 66 -REMARK 3 -REMARK 3 B VALUES. -REMARK 3 FROM WILSON PLOT (A**2) : NULL -REMARK 3 MEAN B VALUE (OVERALL, A**2) : 36.00 -REMARK 3 OVERALL ANISOTROPIC B VALUE. -REMARK 3 B11 (A**2) : NULL -REMARK 3 B22 (A**2) : NULL -REMARK 3 B33 (A**2) : NULL -REMARK 3 B12 (A**2) : NULL -REMARK 3 B13 (A**2) : NULL -REMARK 3 B23 (A**2) : NULL -REMARK 3 -REMARK 3 ESTIMATED COORDINATE ERROR. -REMARK 3 ESD FROM LUZZATI PLOT (A) : NULL -REMARK 3 ESD FROM SIGMAA (A) : NULL -REMARK 3 LOW RESOLUTION CUTOFF (A) : 5.00 -REMARK 3 -REMARK 3 CROSS-VALIDATED ESTIMATED COORDINATE ERROR. -REMARK 3 ESD FROM C-V LUZZATI PLOT (A) : NULL -REMARK 3 ESD FROM C-V SIGMAA (A) : NULL -REMARK 3 -REMARK 3 RMS DEVIATIONS FROM IDEAL VALUES. -REMARK 3 BOND LENGTHS (A) : 0.009 -REMARK 3 BOND ANGLES (DEGREES) : 1.11 -REMARK 3 DIHEDRAL ANGLES (DEGREES) : 23.30 -REMARK 3 IMPROPER ANGLES (DEGREES) : 0.98 -REMARK 3 -REMARK 3 ISOTROPIC THERMAL MODEL : RESTRAINED -REMARK 3 -REMARK 3 ISOTROPIC THERMAL FACTOR RESTRAINTS. RMS SIGMA -REMARK 3 MAIN-CHAIN BOND (A**2) : NULL ; NULL -REMARK 3 MAIN-CHAIN ANGLE (A**2) : NULL ; NULL -REMARK 3 SIDE-CHAIN BOND (A**2) : NULL ; NULL -REMARK 3 SIDE-CHAIN ANGLE (A**2) : NULL ; NULL -REMARK 3 -REMARK 3 NCS MODEL : NULL -REMARK 3 -REMARK 3 NCS RESTRAINTS. RMS SIGMA/WEIGHT -REMARK 3 GROUP 1 POSITIONAL (A) : NULL ; NULL -REMARK 3 GROUP 1 B-FACTOR (A**2) : NULL ; NULL -REMARK 3 -REMARK 3 PARAMETER FILE 1 : PARHCSDX.PRO -REMARK 3 PARAMETER FILE 2 : NULL -REMARK 3 PARAMETER FILE 3 : NULL -REMARK 3 TOPOLOGY FILE 1 : TOPHCSDX.PRO -REMARK 3 TOPOLOGY FILE 2 : NULL -REMARK 3 TOPOLOGY FILE 3 : NULL -REMARK 3 -REMARK 3 OTHER REFINEMENT REMARKS: ISOTROPIC THERMAL FACTOR RESTRAINTS: -REMARK 3 36. (A**2) FOR MAIN-CHAIN BONDS AND 40.3 (A**2) FOR SIDE-CHAIN -REMARK 3 BONDS. -REMARK 4 -REMARK 4 1BM8 COMPLIES WITH FORMAT V. 3.15, 01-DEC-08 -REMARK 100 -REMARK 100 THIS ENTRY HAS BEEN PROCESSED BY BNL. -REMARK 200 -REMARK 200 EXPERIMENTAL DETAILS -REMARK 200 EXPERIMENT TYPE : X-RAY DIFFRACTION -REMARK 200 DATE OF DATA COLLECTION : JUN-96 -REMARK 200 TEMPERATURE (KELVIN) : 289 -REMARK 200 PH : 8.0 -REMARK 200 NUMBER OF CRYSTALS USED : 3 -REMARK 200 -REMARK 200 SYNCHROTRON (Y/N) : Y -REMARK 200 RADIATION SOURCE : NSLS -REMARK 200 BEAMLINE : X12C -REMARK 200 X-RAY GENERATOR MODEL : NULL -REMARK 200 MONOCHROMATIC OR LAUE (M/L) : M -REMARK 200 WAVELENGTH OR RANGE (A) : 0.96 -REMARK 200 MONOCHROMATOR : NI FILTER -REMARK 200 OPTICS : MIRRORS -REMARK 200 -REMARK 200 DETECTOR TYPE : IMAGE PLATE -REMARK 200 DETECTOR MANUFACTURER : RIGAKU RAXIS IIC -REMARK 200 INTENSITY-INTEGRATION SOFTWARE : DENZO -REMARK 200 DATA SCALING SOFTWARE : SCALEPACK -REMARK 200 -REMARK 200 NUMBER OF UNIQUE REFLECTIONS : 12811 -REMARK 200 RESOLUTION RANGE HIGH (A) : 1.700 -REMARK 200 RESOLUTION RANGE LOW (A) : 30.000 -REMARK 200 REJECTION CRITERIA (SIGMA(I)) : -3.000 -REMARK 200 -REMARK 200 OVERALL. -REMARK 200 COMPLETENESS FOR RANGE (%) : 93.6 -REMARK 200 DATA REDUNDANCY : 5.300 -REMARK 200 R MERGE (I) : 0.05200 -REMARK 200 R SYM (I) : NULL -REMARK 200 FOR THE DATA SET : 11.4000 -REMARK 200 -REMARK 200 IN THE HIGHEST RESOLUTION SHELL. -REMARK 200 HIGHEST RESOLUTION SHELL, RANGE HIGH (A) : 1.71 -REMARK 200 HIGHEST RESOLUTION SHELL, RANGE LOW (A) : 1.78 -REMARK 200 COMPLETENESS FOR SHELL (%) : 34.0 -REMARK 200 DATA REDUNDANCY IN SHELL : NULL -REMARK 200 R MERGE FOR SHELL (I) : NULL -REMARK 200 R SYM FOR SHELL (I) : NULL -REMARK 200 FOR SHELL : NULL -REMARK 200 -REMARK 200 DIFFRACTION PROTOCOL: NULL -REMARK 200 METHOD USED TO DETERMINE THE STRUCTURE: NULL -REMARK 200 SOFTWARE USED: PHASES -REMARK 200 STARTING MODEL: NULL -REMARK 200 -REMARK 200 REMARK: NULL -REMARK 280 -REMARK 280 CRYSTAL -REMARK 280 SOLVENT CONTENT, VS (%): 34.00 -REMARK 280 MATTHEWS COEFFICIENT, VM (ANGSTROMS**3/DA): 1.85 -REMARK 280 -REMARK 280 CRYSTALLIZATION CONDITIONS: PH 8.0 -REMARK 290 -REMARK 290 CRYSTALLOGRAPHIC SYMMETRY -REMARK 290 SYMMETRY OPERATORS FOR SPACE GROUP: P 41 21 2 -REMARK 290 -REMARK 290 SYMOP SYMMETRY -REMARK 290 NNNMMM OPERATOR -REMARK 290 1555 X,Y,Z -REMARK 290 2555 -X,-Y,Z+1/2 -REMARK 290 3555 -Y+1/2,X+1/2,Z+1/4 -REMARK 290 4555 Y+1/2,-X+1/2,Z+3/4 -REMARK 290 5555 -X+1/2,Y+1/2,-Z+1/4 -REMARK 290 6555 X+1/2,-Y+1/2,-Z+3/4 -REMARK 290 7555 Y,X,-Z -REMARK 290 8555 -Y,-X,-Z+1/2 -REMARK 290 -REMARK 290 WHERE NNN -> OPERATOR NUMBER -REMARK 290 MMM -> TRANSLATION VECTOR -REMARK 290 -REMARK 290 CRYSTALLOGRAPHIC SYMMETRY TRANSFORMATIONS -REMARK 290 THE FOLLOWING TRANSFORMATIONS OPERATE ON THE ATOM/HETATM -REMARK 290 RECORDS IN THIS ENTRY TO PRODUCE CRYSTALLOGRAPHICALLY -REMARK 290 RELATED MOLECULES. -REMARK 290 SMTRY1 1 1.000000 0.000000 0.000000 0.00000 -REMARK 290 SMTRY2 1 0.000000 1.000000 0.000000 0.00000 -REMARK 290 SMTRY3 1 0.000000 0.000000 1.000000 0.00000 -REMARK 290 SMTRY1 2 -1.000000 0.000000 0.000000 0.00000 -REMARK 290 SMTRY2 2 0.000000 -1.000000 0.000000 0.00000 -REMARK 290 SMTRY3 2 0.000000 0.000000 1.000000 62.11000 -REMARK 290 SMTRY1 3 0.000000 -1.000000 0.000000 21.67500 -REMARK 290 SMTRY2 3 1.000000 0.000000 0.000000 21.67500 -REMARK 290 SMTRY3 3 0.000000 0.000000 1.000000 31.05500 -REMARK 290 SMTRY1 4 0.000000 1.000000 0.000000 21.67500 -REMARK 290 SMTRY2 4 -1.000000 0.000000 0.000000 21.67500 -REMARK 290 SMTRY3 4 0.000000 0.000000 1.000000 93.16500 -REMARK 290 SMTRY1 5 -1.000000 0.000000 0.000000 21.67500 -REMARK 290 SMTRY2 5 0.000000 1.000000 0.000000 21.67500 -REMARK 290 SMTRY3 5 0.000000 0.000000 -1.000000 31.05500 -REMARK 290 SMTRY1 6 1.000000 0.000000 0.000000 21.67500 -REMARK 290 SMTRY2 6 0.000000 -1.000000 0.000000 21.67500 -REMARK 290 SMTRY3 6 0.000000 0.000000 -1.000000 93.16500 -REMARK 290 SMTRY1 7 0.000000 1.000000 0.000000 0.00000 -REMARK 290 SMTRY2 7 1.000000 0.000000 0.000000 0.00000 -REMARK 290 SMTRY3 7 0.000000 0.000000 -1.000000 0.00000 -REMARK 290 SMTRY1 8 0.000000 -1.000000 0.000000 0.00000 -REMARK 290 SMTRY2 8 -1.000000 0.000000 0.000000 0.00000 -REMARK 290 SMTRY3 8 0.000000 0.000000 -1.000000 62.11000 -REMARK 290 -REMARK 290 REMARK: NULL -REMARK 300 -REMARK 300 BIOMOLECULE: 1 -REMARK 300 SEE REMARK 350 FOR THE AUTHOR PROVIDED AND/OR PROGRAM -REMARK 300 GENERATED ASSEMBLY INFORMATION FOR THE STRUCTURE IN -REMARK 300 THIS ENTRY. THE REMARK MAY ALSO PROVIDE INFORMATION ON -REMARK 300 BURIED SURFACE AREA. -REMARK 350 -REMARK 350 COORDINATES FOR A COMPLETE MULTIMER REPRESENTING THE KNOWN -REMARK 350 BIOLOGICALLY SIGNIFICANT OLIGOMERIZATION STATE OF THE -REMARK 350 MOLECULE CAN BE GENERATED BY APPLYING BIOMT TRANSFORMATIONS -REMARK 350 GIVEN BELOW. BOTH NON-CRYSTALLOGRAPHIC AND -REMARK 350 CRYSTALLOGRAPHIC OPERATIONS ARE GIVEN. -REMARK 350 -REMARK 350 BIOMOLECULE: 1 -REMARK 350 AUTHOR DETERMINED BIOLOGICAL UNIT: MONOMERIC -REMARK 350 APPLY THE FOLLOWING TO CHAINS: A -REMARK 350 BIOMT1 1 1.000000 0.000000 0.000000 0.00000 -REMARK 350 BIOMT2 1 0.000000 1.000000 0.000000 0.00000 -REMARK 350 BIOMT3 1 0.000000 0.000000 1.000000 0.00000 -REMARK 525 -REMARK 525 SOLVENT -REMARK 525 -REMARK 525 THE SOLVENT MOLECULES HAVE CHAIN IDENTIFIERS THAT -REMARK 525 INDICATE THE POLYMER CHAIN WITH WHICH THEY ARE MOST -REMARK 525 CLOSELY ASSOCIATED. THE REMARK LISTS ALL THE SOLVENT -REMARK 525 MOLECULES WHICH ARE MORE THAN 5A AWAY FROM THE -REMARK 525 NEAREST POLYMER CHAIN (M = MODEL NUMBER; -REMARK 525 RES=RESIDUE NAME; C=CHAIN IDENTIFIER; SSEQ=SEQUENCE -REMARK 525 NUMBER; I=INSERTION CODE): -REMARK 525 -REMARK 525 M RES CSSEQI -REMARK 525 HOH A 459 DISTANCE = 6.67 ANGSTROMS -REMARK 525 HOH A 473 DISTANCE = 6.70 ANGSTROMS -DBREF 1BM8 A 4 102 UNP P39678 MBP1_YEAST 4 102 -SEQRES 1 A 99 GLN ILE TYR SER ALA ARG TYR SER GLY VAL ASP VAL TYR -SEQRES 2 A 99 GLU PHE ILE HIS SER THR GLY SER ILE MET LYS ARG LYS -SEQRES 3 A 99 LYS ASP ASP TRP VAL ASN ALA THR HIS ILE LEU LYS ALA -SEQRES 4 A 99 ALA ASN PHE ALA LYS ALA LYS ARG THR ARG ILE LEU GLU -SEQRES 5 A 99 LYS GLU VAL LEU LYS GLU THR HIS GLU LYS VAL GLN GLY -SEQRES 6 A 99 GLY PHE GLY LYS TYR GLN GLY THR TRP VAL PRO LEU ASN -SEQRES 7 A 99 ILE ALA LYS GLN LEU ALA GLU LYS PHE SER VAL TYR ASP -SEQRES 8 A 99 GLN LEU LYS PRO LEU PHE ASP PHE -FORMUL 2 HOH *83(H2 O) -HELIX 1 1 ALA A 36 ALA A 42 1 7 -HELIX 2 2 LYS A 47 GLU A 57 1 11 -HELIX 3 3 LEU A 80 LYS A 89 1 10 -HELIX 4 4 TYR A 93 PHE A 100 1 8 -SHEET 1 A 3 ILE A 5 TYR A 10 0 -SHEET 2 A 3 VAL A 13 ILE A 19 -1 N GLU A 17 O TYR A 6 -SHEET 3 A 3 SER A 24 ARG A 28 -1 N LYS A 27 O TYR A 16 -SHEET 1 B 2 GLU A 64 VAL A 66 0 -SHEET 2 B 2 GLY A 75 TRP A 77 -1 N TRP A 77 O GLU A 64 -CRYST1 43.350 43.350 124.220 90.00 90.00 90.00 P 41 21 2 8 -ORIGX1 1.000000 0.000000 0.000000 0.00000 -ORIGX2 0.000000 1.000000 0.000000 0.00000 -ORIGX3 0.000000 0.000000 1.000000 0.00000 -SCALE1 0.023068 0.000000 0.000000 0.00000 -SCALE2 0.000000 0.023068 0.000000 0.00000 -SCALE3 0.000000 0.000000 0.008050 0.00000 -ATOM 1 N GLN A 4 -0.991 4.920 14.982 1.00 52.28 N -ATOM 2 CA GLN A 4 -0.575 5.127 16.398 1.00 51.22 C -ATOM 3 C GLN A 4 0.344 6.335 16.538 1.00 48.16 C -ATOM 4 O GLN A 4 0.893 6.823 15.540 1.00 46.43 O -ATOM 5 CB GLN A 4 0.121 3.877 16.961 1.00 53.87 C -ATOM 6 CG GLN A 4 -0.797 3.008 17.820 1.00 57.21 C -ATOM 7 CD GLN A 4 -0.029 2.066 18.730 1.00 60.18 C -ATOM 8 OE1 GLN A 4 1.135 2.325 19.071 1.00 61.12 O -ATOM 9 NE2 GLN A 4 -0.673 0.970 19.131 1.00 61.27 N -ATOM 10 H1 GLN A 4 -1.493 5.767 14.644 1.00 0.00 H -ATOM 11 H2 GLN A 4 -0.148 4.764 14.393 1.00 0.00 H -ATOM 12 H3 GLN A 4 -1.618 4.097 14.918 1.00 0.00 H -ATOM 13 HE21 GLN A 4 -0.200 0.339 19.714 1.00 0.00 H -ATOM 14 HE22 GLN A 4 -1.594 0.835 18.832 1.00 0.00 H -ATOM 15 N ILE A 5 0.487 6.801 17.778 1.00 44.78 N -ATOM 16 CA ILE A 5 1.300 7.959 18.076 1.00 42.51 C -ATOM 17 C ILE A 5 2.358 7.589 19.087 1.00 40.28 C -ATOM 18 O ILE A 5 2.041 7.137 20.170 1.00 41.33 O -ATOM 19 CB ILE A 5 0.424 9.104 18.631 1.00 42.76 C -ATOM 20 CG1 ILE A 5 -0.582 9.523 17.557 1.00 44.06 C -ATOM 21 CG2 ILE A 5 1.281 10.293 19.056 1.00 43.55 C -ATOM 22 CD1 ILE A 5 -1.471 10.684 17.936 1.00 43.93 C -ATOM 23 H ILE A 5 0.039 6.338 18.519 1.00 0.00 H -ATOM 24 N TYR A 6 3.607 7.754 18.720 1.00 38.87 N -ATOM 25 CA TYR A 6 4.710 7.452 19.621 1.00 38.04 C -ATOM 26 C TYR A 6 5.273 8.733 20.218 1.00 34.53 C -ATOM 27 O TYR A 6 5.170 9.805 19.650 1.00 33.71 O -ATOM 28 CB TYR A 6 5.892 6.794 18.889 1.00 42.49 C -ATOM 29 CG TYR A 6 5.619 5.559 18.078 1.00 49.90 C -ATOM 30 CD1 TYR A 6 4.759 4.551 18.520 1.00 52.40 C -ATOM 31 CD2 TYR A 6 6.290 5.367 16.884 1.00 53.52 C -ATOM 32 CE1 TYR A 6 4.603 3.377 17.787 1.00 56.29 C -ATOM 33 CE2 TYR A 6 6.148 4.208 16.144 1.00 56.87 C -ATOM 34 CZ TYR A 6 5.307 3.211 16.595 1.00 58.22 C -ATOM 35 OH TYR A 6 5.213 2.023 15.883 1.00 62.12 O -ATOM 36 H TYR A 6 3.803 8.092 17.823 1.00 0.00 H -ATOM 37 HH TYR A 6 4.525 1.471 16.264 1.00 0.00 H -ATOM 38 N SER A 7 5.887 8.595 21.343 1.00 29.82 N -ATOM 39 CA SER A 7 6.641 9.658 21.907 1.00 27.41 C -ATOM 40 C SER A 7 8.065 9.484 21.365 1.00 25.27 C -ATOM 41 O SER A 7 8.573 8.364 21.336 1.00 24.52 O -ATOM 42 CB SER A 7 6.604 9.491 23.411 1.00 27.69 C -ATOM 43 OG SER A 7 7.393 10.446 24.052 1.00 34.18 O -ATOM 44 H SER A 7 5.839 7.737 21.817 1.00 0.00 H -ATOM 45 HG SER A 7 8.257 10.478 23.644 1.00 0.00 H -ATOM 46 N ALA A 8 8.709 10.555 20.901 1.00 23.35 N -ATOM 47 CA ALA A 8 10.071 10.423 20.364 1.00 20.99 C -ATOM 48 C ALA A 8 10.887 11.696 20.574 1.00 21.47 C -ATOM 49 O ALA A 8 10.370 12.693 21.084 1.00 21.33 O -ATOM 50 CB ALA A 8 10.016 10.075 18.875 1.00 20.24 C -ATOM 51 H ALA A 8 8.274 11.435 20.918 1.00 0.00 H -ATOM 52 N ARG A 9 12.163 11.644 20.207 1.00 21.36 N -ATOM 53 CA ARG A 9 13.054 12.817 20.318 1.00 23.94 C -ATOM 54 C ARG A 9 14.026 12.854 19.153 1.00 24.02 C -ATOM 55 O ARG A 9 14.629 11.831 18.835 1.00 22.48 O -ATOM 56 CB ARG A 9 13.864 12.818 21.615 1.00 24.91 C -ATOM 57 CG ARG A 9 14.921 13.922 21.647 1.00 28.68 C -ATOM 58 CD ARG A 9 15.735 13.904 22.931 1.00 31.98 C -ATOM 59 NE ARG A 9 14.979 14.426 24.042 1.00 35.74 N -ATOM 60 CZ ARG A 9 15.234 15.602 24.583 1.00 37.58 C -ATOM 61 NH1 ARG A 9 16.262 16.324 24.162 1.00 38.78 N -ATOM 62 NH2 ARG A 9 14.475 16.048 25.571 1.00 40.26 N -ATOM 63 H ARG A 9 12.518 10.810 19.832 1.00 0.00 H -ATOM 64 HE ARG A 9 14.250 13.885 24.413 1.00 0.00 H -ATOM 65 HH11 ARG A 9 16.855 15.976 23.436 1.00 0.00 H -ATOM 66 HH12 ARG A 9 16.446 17.220 24.568 1.00 0.00 H -ATOM 67 HH21 ARG A 9 13.711 15.495 25.906 1.00 0.00 H -ATOM 68 HH22 ARG A 9 14.657 16.944 25.977 1.00 0.00 H -ATOM 69 N TYR A 10 14.154 14.035 18.532 1.00 24.15 N -ATOM 70 CA TYR A 10 15.034 14.236 17.379 1.00 26.92 C -ATOM 71 C TYR A 10 15.730 15.585 17.504 1.00 28.93 C -ATOM 72 O TYR A 10 15.085 16.571 17.814 1.00 29.46 O -ATOM 73 CB TYR A 10 14.234 14.252 16.072 1.00 23.90 C -ATOM 74 CG TYR A 10 13.510 12.977 15.778 1.00 24.39 C -ATOM 75 CD1 TYR A 10 14.171 11.907 15.185 1.00 25.27 C -ATOM 76 CD2 TYR A 10 12.174 12.813 16.148 1.00 25.41 C -ATOM 77 CE1 TYR A 10 13.521 10.695 14.967 1.00 27.01 C -ATOM 78 CE2 TYR A 10 11.520 11.609 15.936 1.00 27.17 C -ATOM 79 CZ TYR A 10 12.196 10.556 15.346 1.00 26.47 C -ATOM 80 OH TYR A 10 11.540 9.379 15.101 1.00 27.96 O -ATOM 81 H TYR A 10 13.640 14.801 18.866 1.00 0.00 H -ATOM 82 HH TYR A 10 12.100 8.804 14.574 1.00 0.00 H -ATOM 83 N SER A 11 17.029 15.630 17.266 1.00 30.98 N -ATOM 84 CA SER A 11 17.751 16.893 17.349 1.00 32.54 C -ATOM 85 C SER A 11 17.509 17.599 18.695 1.00 32.28 C -ATOM 86 O SER A 11 17.377 18.827 18.737 1.00 33.57 O -ATOM 87 CB SER A 11 17.299 17.821 16.212 1.00 34.50 C -ATOM 88 OG SER A 11 17.469 17.220 14.934 1.00 39.12 O -ATOM 89 H SER A 11 17.508 14.810 17.019 1.00 0.00 H -ATOM 90 HG SER A 11 18.388 16.968 14.813 1.00 0.00 H -ATOM 91 N GLY A 12 17.410 16.826 19.780 1.00 30.27 N -ATOM 92 CA GLY A 12 17.187 17.403 21.099 1.00 27.72 C -ATOM 93 C GLY A 12 15.760 17.867 21.361 1.00 26.67 C -ATOM 94 O GLY A 12 15.474 18.436 22.414 1.00 28.11 O -ATOM 95 H GLY A 12 17.494 15.856 19.690 1.00 0.00 H -ATOM 96 N VAL A 13 14.855 17.590 20.434 1.00 25.00 N -ATOM 97 CA VAL A 13 13.459 18.045 20.539 1.00 22.39 C -ATOM 98 C VAL A 13 12.471 16.877 20.723 1.00 22.62 C -ATOM 99 O VAL A 13 12.494 15.913 19.959 1.00 21.65 O -ATOM 100 CB VAL A 13 13.075 18.819 19.253 1.00 21.97 C -ATOM 101 CG1 VAL A 13 11.652 19.334 19.343 1.00 18.81 C -ATOM 102 CG2 VAL A 13 14.057 19.964 19.042 1.00 22.24 C -ATOM 103 H VAL A 13 15.123 17.070 19.648 1.00 0.00 H -ATOM 104 N ASP A 14 11.617 16.976 21.734 1.00 21.41 N -ATOM 105 CA ASP A 14 10.622 15.950 22.003 1.00 21.86 C -ATOM 106 C ASP A 14 9.377 16.206 21.197 1.00 21.71 C -ATOM 107 O ASP A 14 8.837 17.312 21.204 1.00 20.60 O -ATOM 108 CB ASP A 14 10.237 15.913 23.494 1.00 24.96 C -ATOM 109 CG ASP A 14 11.414 15.636 24.396 1.00 25.52 C -ATOM 110 OD1 ASP A 14 12.057 14.597 24.232 1.00 27.41 O -ATOM 111 OD2 ASP A 14 11.704 16.473 25.257 1.00 30.85 O -ATOM 112 H ASP A 14 11.653 17.765 22.313 1.00 0.00 H -ATOM 113 N VAL A 15 8.897 15.168 20.550 1.00 21.11 N -ATOM 114 CA VAL A 15 7.740 15.281 19.686 1.00 20.99 C -ATOM 115 C VAL A 15 6.819 14.096 19.900 1.00 23.45 C -ATOM 116 O VAL A 15 7.178 13.132 20.595 1.00 24.63 O -ATOM 117 CB VAL A 15 8.149 15.282 18.166 1.00 19.89 C -ATOM 118 CG1 VAL A 15 9.103 16.420 17.854 1.00 16.46 C -ATOM 119 CG2 VAL A 15 8.795 13.934 17.785 1.00 18.59 C -ATOM 120 H VAL A 15 9.323 14.292 20.662 1.00 0.00 H -ATOM 121 N TYR A 16 5.632 14.216 19.339 1.00 24.96 N -ATOM 122 CA TYR A 16 4.726 13.114 19.215 1.00 26.21 C -ATOM 123 C TYR A 16 4.746 12.756 17.744 1.00 26.48 C -ATOM 124 O TYR A 16 4.631 13.643 16.884 1.00 25.01 O -ATOM 125 CB TYR A 16 3.314 13.507 19.644 1.00 29.28 C -ATOM 126 CG TYR A 16 3.170 13.632 21.144 1.00 32.30 C -ATOM 127 CD1 TYR A 16 3.375 12.530 21.959 1.00 34.32 C -ATOM 128 CD2 TYR A 16 2.859 14.843 21.746 1.00 33.14 C -ATOM 129 CE1 TYR A 16 3.272 12.625 23.332 1.00 36.05 C -ATOM 130 CE2 TYR A 16 2.755 14.950 23.125 1.00 35.60 C -ATOM 131 CZ TYR A 16 2.962 13.832 23.907 1.00 37.33 C -ATOM 132 OH TYR A 16 2.870 13.922 25.273 1.00 42.80 O -ATOM 133 H TYR A 16 5.364 15.082 18.983 1.00 0.00 H -ATOM 134 HH TYR A 16 3.304 13.159 25.678 1.00 0.00 H -ATOM 135 N GLU A 17 4.950 11.483 17.454 1.00 27.52 N -ATOM 136 CA GLU A 17 5.040 11.030 16.074 1.00 29.95 C -ATOM 137 C GLU A 17 3.841 10.167 15.709 1.00 30.66 C -ATOM 138 O GLU A 17 3.533 9.205 16.390 1.00 27.27 O -ATOM 139 CB GLU A 17 6.349 10.268 15.880 1.00 29.55 C -ATOM 140 CG GLU A 17 6.689 9.958 14.439 1.00 32.47 C -ATOM 141 CD GLU A 17 8.068 9.340 14.291 1.00 34.84 C -ATOM 142 OE1 GLU A 17 8.917 9.552 15.182 1.00 36.30 O -ATOM 143 OE2 GLU A 17 8.307 8.643 13.282 1.00 38.82 O -ATOM 144 H GLU A 17 5.048 10.834 18.179 1.00 0.00 H -ATOM 145 N PHE A 18 3.157 10.574 14.657 1.00 34.09 N -ATOM 146 CA PHE A 18 1.992 9.874 14.154 1.00 38.16 C -ATOM 147 C PHE A 18 2.404 9.093 12.906 1.00 40.68 C -ATOM 148 O PHE A 18 3.066 9.635 12.005 1.00 38.31 O -ATOM 149 CB PHE A 18 0.911 10.908 13.837 1.00 39.21 C -ATOM 150 CG PHE A 18 -0.309 10.396 13.139 1.00 43.44 C -ATOM 151 CD1 PHE A 18 -1.285 9.683 13.838 1.00 45.30 C -ATOM 152 CD2 PHE A 18 -0.520 10.684 11.789 1.00 45.30 C -ATOM 153 CE1 PHE A 18 -2.451 9.269 13.205 1.00 45.73 C -ATOM 154 CE2 PHE A 18 -1.682 10.275 11.146 1.00 46.28 C -ATOM 155 CZ PHE A 18 -2.651 9.568 11.854 1.00 46.51 C -ATOM 156 H PHE A 18 3.446 11.386 14.198 1.00 0.00 H -ATOM 157 N ILE A 19 2.060 7.813 12.875 1.00 43.87 N -ATOM 158 CA ILE A 19 2.451 6.970 11.756 1.00 47.64 C -ATOM 159 C ILE A 19 1.361 6.905 10.701 1.00 50.18 C -ATOM 160 O ILE A 19 0.316 6.280 10.907 1.00 50.83 O -ATOM 161 CB ILE A 19 2.787 5.548 12.208 1.00 48.13 C -ATOM 162 CG1 ILE A 19 3.734 5.597 13.406 1.00 49.26 C -ATOM 163 CG2 ILE A 19 3.425 4.793 11.061 1.00 48.27 C -ATOM 164 CD1 ILE A 19 5.016 6.356 13.140 1.00 51.27 C -ATOM 165 H ILE A 19 1.535 7.436 13.609 1.00 0.00 H -ATOM 166 N HIS A 20 1.623 7.574 9.587 1.00 52.47 N -ATOM 167 CA HIS A 20 0.710 7.602 8.461 1.00 54.63 C -ATOM 168 C HIS A 20 1.325 6.738 7.359 1.00 54.62 C -ATOM 169 O HIS A 20 2.518 6.415 7.424 1.00 54.75 O -ATOM 170 CB HIS A 20 0.553 9.056 7.990 1.00 57.40 C -ATOM 171 CG HIS A 20 -0.664 9.340 7.157 1.00 60.64 C -ATOM 172 ND1 HIS A 20 -0.604 9.703 5.820 1.00 61.69 N -ATOM 173 CD2 HIS A 20 -1.991 9.341 7.470 1.00 61.84 C -ATOM 174 CE1 HIS A 20 -1.811 9.917 5.323 1.00 62.25 C -ATOM 175 NE2 HIS A 20 -2.653 9.699 6.317 1.00 63.47 N -ATOM 176 H HIS A 20 2.472 8.058 9.517 1.00 0.00 H -ATOM 177 HD1 HIS A 20 0.226 9.797 5.306 1.00 0.00 H -ATOM 178 HE2 HIS A 20 -3.628 9.768 6.238 1.00 0.00 H -ATOM 179 N SER A 21 0.535 6.358 6.354 1.00 54.36 N -ATOM 180 CA SER A 21 1.057 5.528 5.265 1.00 52.80 C -ATOM 181 C SER A 21 2.204 6.221 4.504 1.00 52.38 C -ATOM 182 O SER A 21 3.242 5.606 4.237 1.00 51.68 O -ATOM 183 CB SER A 21 -0.081 5.142 4.322 1.00 51.54 C -ATOM 184 OG SER A 21 -0.940 6.237 4.107 1.00 51.51 O -ATOM 185 H SER A 21 -0.408 6.625 6.348 1.00 0.00 H -ATOM 186 HG SER A 21 -1.720 5.940 3.628 1.00 0.00 H -ATOM 187 N THR A 22 2.030 7.509 4.195 1.00 52.22 N -ATOM 188 CA THR A 22 3.058 8.284 3.475 1.00 52.84 C -ATOM 189 C THR A 22 4.294 8.548 4.334 1.00 50.76 C -ATOM 190 O THR A 22 5.358 8.913 3.827 1.00 50.70 O -ATOM 191 CB THR A 22 2.503 9.648 3.031 1.00 54.77 C -ATOM 192 OG1 THR A 22 1.746 10.224 4.115 1.00 57.43 O -ATOM 193 CG2 THR A 22 1.604 9.504 1.816 1.00 56.57 C -ATOM 194 H THR A 22 1.193 7.951 4.445 1.00 0.00 H -ATOM 195 HG1 THR A 22 1.603 11.155 3.928 1.00 0.00 H -ATOM 196 N GLY A 23 4.142 8.376 5.635 1.00 49.11 N -ATOM 197 CA GLY A 23 5.238 8.640 6.541 1.00 45.68 C -ATOM 198 C GLY A 23 4.739 9.133 7.876 1.00 43.53 C -ATOM 199 O GLY A 23 3.521 9.157 8.138 1.00 42.97 O -ATOM 200 H GLY A 23 3.287 8.054 5.988 1.00 0.00 H -ATOM 201 N SER A 24 5.655 9.533 8.719 1.00 40.66 N -ATOM 202 CA SER A 24 5.279 10.004 10.026 1.00 38.67 C -ATOM 203 C SER A 24 5.066 11.517 10.046 1.00 36.42 C -ATOM 204 O SER A 24 5.714 12.267 9.291 1.00 34.95 O -ATOM 205 CB SER A 24 6.335 9.598 11.029 1.00 39.09 C -ATOM 206 OG SER A 24 7.622 9.743 10.472 1.00 44.40 O -ATOM 207 H SER A 24 6.597 9.521 8.458 1.00 0.00 H -ATOM 208 HG SER A 24 7.777 9.032 9.837 1.00 0.00 H -ATOM 209 N ILE A 25 4.129 11.946 10.890 1.00 32.56 N -ATOM 210 CA ILE A 25 3.824 13.356 11.064 1.00 29.27 C -ATOM 211 C ILE A 25 4.108 13.725 12.516 1.00 27.24 C -ATOM 212 O ILE A 25 3.698 13.017 13.431 1.00 26.25 O -ATOM 213 CB ILE A 25 2.354 13.628 10.682 1.00 30.38 C -ATOM 214 CG1 ILE A 25 2.172 13.204 9.219 1.00 33.50 C -ATOM 215 CG2 ILE A 25 2.011 15.105 10.843 1.00 28.01 C -ATOM 216 CD1 ILE A 25 0.746 13.027 8.780 1.00 35.33 C -ATOM 217 H ILE A 25 3.628 11.287 11.414 1.00 0.00 H -ATOM 218 N MET A 26 4.821 14.815 12.713 1.00 24.03 N -ATOM 219 CA MET A 26 5.282 15.188 14.040 1.00 22.95 C -ATOM 220 C MET A 26 4.649 16.463 14.576 1.00 23.00 C -ATOM 221 O MET A 26 4.398 17.426 13.832 1.00 19.80 O -ATOM 222 CB MET A 26 6.800 15.397 14.034 1.00 22.54 C -ATOM 223 CG MET A 26 7.632 14.152 13.821 1.00 22.25 C -ATOM 224 SD MET A 26 9.393 14.520 13.783 1.00 27.59 S -ATOM 225 CE MET A 26 10.026 13.008 13.046 1.00 27.15 C -ATOM 226 H MET A 26 5.012 15.401 11.961 1.00 0.00 H -ATOM 227 N LYS A 27 4.443 16.453 15.891 1.00 23.73 N -ATOM 228 CA LYS A 27 3.998 17.625 16.632 1.00 23.46 C -ATOM 229 C LYS A 27 4.942 17.793 17.828 1.00 22.79 C -ATOM 230 O LYS A 27 5.244 16.813 18.522 1.00 22.50 O -ATOM 231 CB LYS A 27 2.550 17.459 17.133 1.00 24.99 C -ATOM 232 CG LYS A 27 2.055 18.665 17.923 1.00 27.08 C -ATOM 233 CD LYS A 27 0.574 18.594 18.223 1.00 29.52 C -ATOM 234 CE LYS A 27 0.272 17.523 19.243 1.00 32.06 C -ATOM 235 NZ LYS A 27 -1.178 17.499 19.580 1.00 35.59 N -ATOM 236 H LYS A 27 4.599 15.620 16.384 1.00 0.00 H -ATOM 237 HZ1 LYS A 27 -1.732 17.319 18.719 1.00 0.00 H -ATOM 238 HZ2 LYS A 27 -1.359 16.745 20.272 1.00 0.00 H -ATOM 239 HZ3 LYS A 27 -1.452 18.414 19.986 1.00 0.00 H -ATOM 240 N ARG A 28 5.455 19.003 18.033 1.00 21.34 N -ATOM 241 CA ARG A 28 6.361 19.253 19.141 1.00 21.22 C -ATOM 242 C ARG A 28 5.615 19.292 20.464 1.00 20.99 C -ATOM 243 O ARG A 28 4.534 19.902 20.557 1.00 20.62 O -ATOM 244 CB ARG A 28 7.090 20.582 18.971 1.00 20.55 C -ATOM 245 CG ARG A 28 8.119 20.580 17.884 1.00 23.75 C -ATOM 246 CD ARG A 28 9.092 21.725 18.053 1.00 24.37 C -ATOM 247 NE ARG A 28 8.452 23.024 17.897 1.00 22.21 N -ATOM 248 CZ ARG A 28 8.906 23.947 17.062 1.00 22.16 C -ATOM 249 NH1 ARG A 28 9.932 23.686 16.260 1.00 21.40 N -ATOM 250 NH2 ARG A 28 8.314 25.124 17.006 1.00 22.10 N -ATOM 251 H ARG A 28 5.216 19.737 17.429 1.00 0.00 H -ATOM 252 HE ARG A 28 7.659 23.223 18.432 1.00 0.00 H -ATOM 253 HH11 ARG A 28 10.372 22.788 16.284 1.00 0.00 H -ATOM 254 HH12 ARG A 28 10.278 24.394 15.642 1.00 0.00 H -ATOM 255 HH21 ARG A 28 7.520 25.312 17.581 1.00 0.00 H -ATOM 256 HH22 ARG A 28 8.657 25.824 16.379 1.00 0.00 H -ATOM 257 N LYS A 29 6.215 18.701 21.488 1.00 20.40 N -ATOM 258 CA LYS A 29 5.601 18.678 22.813 1.00 22.71 C -ATOM 259 C LYS A 29 5.623 20.043 23.491 1.00 22.45 C -ATOM 260 O LYS A 29 4.669 20.397 24.190 1.00 21.87 O -ATOM 261 CB LYS A 29 6.298 17.668 23.723 1.00 25.87 C -ATOM 262 CG LYS A 29 6.214 16.228 23.225 1.00 31.52 C -ATOM 263 CD LYS A 29 6.749 15.268 24.259 1.00 32.96 C -ATOM 264 CE LYS A 29 6.701 13.831 23.781 1.00 33.83 C -ATOM 265 NZ LYS A 29 7.106 12.908 24.868 1.00 35.21 N -ATOM 266 H LYS A 29 7.088 18.274 21.356 1.00 0.00 H -ATOM 267 HZ1 LYS A 29 6.552 13.117 25.721 1.00 0.00 H -ATOM 268 HZ2 LYS A 29 6.929 11.933 24.575 1.00 0.00 H -ATOM 269 HZ3 LYS A 29 8.116 13.033 25.071 1.00 0.00 H -ATOM 270 N LYS A 30 6.693 20.822 23.275 1.00 21.91 N -ATOM 271 CA LYS A 30 6.818 22.108 23.970 1.00 22.50 C -ATOM 272 C LYS A 30 5.797 23.154 23.535 1.00 22.00 C -ATOM 273 O LYS A 30 5.348 23.925 24.374 1.00 21.27 O -ATOM 274 CB LYS A 30 8.230 22.683 23.839 1.00 23.91 C -ATOM 275 CG LYS A 30 8.602 23.159 22.448 1.00 30.91 C -ATOM 276 CD LYS A 30 10.047 23.652 22.422 1.00 35.19 C -ATOM 277 CE LYS A 30 10.510 24.019 21.007 1.00 36.53 C -ATOM 278 NZ LYS A 30 9.871 25.274 20.519 1.00 36.17 N -ATOM 279 H LYS A 30 7.397 20.528 22.662 1.00 0.00 H -ATOM 280 HZ1 LYS A 30 8.838 25.181 20.585 1.00 0.00 H -ATOM 281 HZ2 LYS A 30 10.185 26.073 21.106 1.00 0.00 H -ATOM 282 HZ3 LYS A 30 10.142 25.441 19.531 1.00 0.00 H -ATOM 283 N ASP A 31 5.401 23.183 22.245 1.00 18.95 N -ATOM 284 CA ASP A 31 4.499 24.232 21.794 1.00 20.45 C -ATOM 285 C ASP A 31 3.382 23.785 20.872 1.00 21.56 C -ATOM 286 O ASP A 31 2.634 24.636 20.361 1.00 23.45 O -ATOM 287 CB ASP A 31 5.298 25.339 21.113 1.00 21.42 C -ATOM 288 CG ASP A 31 6.231 24.825 20.027 1.00 26.39 C -ATOM 289 OD1 ASP A 31 6.013 23.695 19.518 1.00 25.20 O -ATOM 290 OD2 ASP A 31 7.181 25.546 19.686 1.00 24.41 O -ATOM 291 H ASP A 31 5.715 22.499 21.621 1.00 0.00 H -ATOM 292 N ASP A 32 3.265 22.484 20.634 1.00 21.07 N -ATOM 293 CA ASP A 32 2.221 21.961 19.749 1.00 21.22 C -ATOM 294 C ASP A 32 2.374 22.381 18.293 1.00 20.57 C -ATOM 295 O ASP A 32 1.426 22.253 17.511 1.00 22.37 O -ATOM 296 CB ASP A 32 0.809 22.358 20.226 1.00 23.08 C -ATOM 297 CG ASP A 32 0.375 21.651 21.495 1.00 25.24 C -ATOM 298 OD1 ASP A 32 1.027 20.663 21.882 1.00 26.63 O -ATOM 299 OD2 ASP A 32 -0.615 22.083 22.104 1.00 26.97 O -ATOM 300 H ASP A 32 3.881 21.858 21.068 1.00 0.00 H -ATOM 301 N TRP A 33 3.525 22.886 17.903 1.00 18.75 N -ATOM 302 CA TRP A 33 3.708 23.213 16.488 1.00 20.17 C -ATOM 303 C TRP A 33 3.768 21.917 15.706 1.00 20.21 C -ATOM 304 O TRP A 33 4.182 20.893 16.259 1.00 20.80 O -ATOM 305 CB TRP A 33 4.991 24.009 16.266 1.00 20.31 C -ATOM 306 CG TRP A 33 4.872 25.450 16.661 1.00 22.77 C -ATOM 307 CD1 TRP A 33 4.129 25.972 17.696 1.00 23.36 C -ATOM 308 CD2 TRP A 33 5.470 26.570 15.984 1.00 23.95 C -ATOM 309 NE1 TRP A 33 4.240 27.334 17.673 1.00 22.96 N -ATOM 310 CE2 TRP A 33 5.046 27.743 16.657 1.00 22.56 C -ATOM 311 CE3 TRP A 33 6.318 26.696 14.877 1.00 22.29 C -ATOM 312 CZ2 TRP A 33 5.442 29.023 16.257 1.00 24.90 C -ATOM 313 CZ3 TRP A 33 6.702 27.969 14.481 1.00 25.00 C -ATOM 314 CH2 TRP A 33 6.268 29.117 15.169 1.00 24.02 C -ATOM 315 H TRP A 33 4.245 23.030 18.542 1.00 0.00 H -ATOM 316 HE1 TRP A 33 3.780 27.938 18.295 1.00 0.00 H -ATOM 317 N VAL A 34 3.368 21.950 14.440 1.00 20.68 N -ATOM 318 CA VAL A 34 3.355 20.734 13.613 1.00 18.96 C -ATOM 319 C VAL A 34 4.219 20.947 12.371 1.00 20.18 C -ATOM 320 O VAL A 34 4.331 22.074 11.871 1.00 18.53 O -ATOM 321 CB VAL A 34 1.892 20.385 13.183 1.00 20.63 C -ATOM 322 CG1 VAL A 34 1.843 19.102 12.349 1.00 17.40 C -ATOM 323 CG2 VAL A 34 1.006 20.252 14.422 1.00 19.03 C -ATOM 324 H VAL A 34 3.075 22.803 14.050 1.00 0.00 H -ATOM 325 N ASN A 35 4.858 19.876 11.891 1.00 18.57 N -ATOM 326 CA ASN A 35 5.684 19.962 10.692 1.00 18.84 C -ATOM 327 C ASN A 35 4.771 20.026 9.459 1.00 19.27 C -ATOM 328 O ASN A 35 4.149 19.040 9.101 1.00 20.41 O -ATOM 329 CB ASN A 35 6.607 18.737 10.627 1.00 18.29 C -ATOM 330 CG ASN A 35 7.711 18.858 9.586 1.00 19.87 C -ATOM 331 OD1 ASN A 35 7.497 19.373 8.481 1.00 23.76 O -ATOM 332 ND2 ASN A 35 8.909 18.410 9.922 1.00 17.21 N -ATOM 333 H ASN A 35 4.769 19.017 12.356 1.00 0.00 H -ATOM 334 N ALA A 36 4.686 21.185 8.820 1.00 18.30 N -ATOM 335 CA ALA A 36 3.779 21.366 7.681 1.00 20.19 C -ATOM 336 C ALA A 36 4.218 20.577 6.451 1.00 20.67 C -ATOM 337 O ALA A 36 3.395 20.256 5.596 1.00 21.70 O -ATOM 338 CB ALA A 36 3.662 22.854 7.326 1.00 20.68 C -ATOM 339 H ALA A 36 5.227 21.939 9.126 1.00 0.00 H -ATOM 340 N THR A 37 5.520 20.304 6.337 1.00 20.05 N -ATOM 341 CA THR A 37 6.027 19.490 5.233 1.00 21.46 C -ATOM 342 C THR A 37 5.430 18.061 5.316 1.00 23.26 C -ATOM 343 O THR A 37 5.035 17.455 4.301 1.00 22.30 O -ATOM 344 CB THR A 37 7.565 19.411 5.296 1.00 22.61 C -ATOM 345 OG1 THR A 37 8.110 20.735 5.383 1.00 21.49 O -ATOM 346 CG2 THR A 37 8.117 18.703 4.063 1.00 24.86 C -ATOM 347 H THR A 37 6.144 20.670 6.994 1.00 0.00 H -ATOM 348 HG1 THR A 37 7.816 21.252 4.621 1.00 0.00 H -ATOM 349 N HIS A 38 5.356 17.534 6.551 1.00 22.61 N -ATOM 350 CA HIS A 38 4.747 16.236 6.788 1.00 22.32 C -ATOM 351 C HIS A 38 3.266 16.262 6.404 1.00 23.66 C -ATOM 352 O HIS A 38 2.720 15.268 5.928 1.00 24.58 O -ATOM 353 CB HIS A 38 4.859 15.863 8.257 1.00 20.45 C -ATOM 354 CG HIS A 38 6.246 15.623 8.731 1.00 20.07 C -ATOM 355 ND1 HIS A 38 6.563 15.505 10.070 1.00 19.75 N -ATOM 356 CD2 HIS A 38 7.419 15.519 8.069 1.00 20.62 C -ATOM 357 CE1 HIS A 38 7.858 15.336 10.243 1.00 21.58 C -ATOM 358 NE2 HIS A 38 8.380 15.347 9.033 1.00 21.07 N -ATOM 359 H HIS A 38 5.719 18.035 7.308 1.00 0.00 H -ATOM 360 HD1 HIS A 38 5.914 15.546 10.794 1.00 0.00 H -ATOM 361 HE2 HIS A 38 9.344 15.267 8.845 1.00 0.00 H -ATOM 362 N ILE A 39 2.600 17.377 6.659 1.00 22.79 N -ATOM 363 CA ILE A 39 1.189 17.509 6.277 1.00 25.79 C -ATOM 364 C ILE A 39 1.049 17.441 4.739 1.00 27.01 C -ATOM 365 O ILE A 39 0.113 16.832 4.209 1.00 27.50 O -ATOM 366 CB ILE A 39 0.593 18.857 6.784 1.00 25.78 C -ATOM 367 CG1 ILE A 39 0.451 18.822 8.308 1.00 25.82 C -ATOM 368 CG2 ILE A 39 -0.753 19.136 6.133 1.00 25.83 C -ATOM 369 CD1 ILE A 39 -0.033 20.127 8.900 1.00 26.05 C -ATOM 370 H ILE A 39 3.050 18.121 7.112 1.00 0.00 H -ATOM 371 N LEU A 40 1.986 18.075 4.038 1.00 27.04 N -ATOM 372 CA LEU A 40 1.953 18.101 2.581 1.00 28.05 C -ATOM 373 C LEU A 40 2.329 16.742 1.996 1.00 28.75 C -ATOM 374 O LEU A 40 1.788 16.329 0.960 1.00 29.82 O -ATOM 375 CB LEU A 40 2.879 19.202 2.054 1.00 27.15 C -ATOM 376 CG LEU A 40 2.515 20.627 2.472 1.00 27.87 C -ATOM 377 CD1 LEU A 40 3.470 21.612 1.841 1.00 26.87 C -ATOM 378 CD2 LEU A 40 1.078 20.936 2.072 1.00 27.13 C -ATOM 379 H LEU A 40 2.709 18.541 4.512 1.00 0.00 H -ATOM 380 N LYS A 41 3.242 16.043 2.643 1.00 29.67 N -ATOM 381 CA LYS A 41 3.570 14.693 2.203 1.00 32.88 C -ATOM 382 C LYS A 41 2.353 13.772 2.380 1.00 32.92 C -ATOM 383 O LYS A 41 2.113 12.887 1.562 1.00 33.65 O -ATOM 384 CB LYS A 41 4.764 14.129 2.980 1.00 35.05 C -ATOM 385 CG LYS A 41 6.078 14.828 2.690 1.00 40.79 C -ATOM 386 CD LYS A 41 7.262 14.033 3.222 1.00 45.43 C -ATOM 387 CE LYS A 41 8.571 14.734 2.889 1.00 49.42 C -ATOM 388 NZ LYS A 41 9.755 13.979 3.371 1.00 52.09 N -ATOM 389 H LYS A 41 3.699 16.431 3.415 1.00 0.00 H -ATOM 390 HZ1 LYS A 41 9.699 13.866 4.403 1.00 0.00 H -ATOM 391 HZ2 LYS A 41 9.776 13.041 2.920 1.00 0.00 H -ATOM 392 HZ3 LYS A 41 10.619 14.502 3.124 1.00 0.00 H -ATOM 393 N ALA A 42 1.581 13.997 3.446 1.00 32.20 N -ATOM 394 CA ALA A 42 0.382 13.209 3.702 1.00 32.15 C -ATOM 395 C ALA A 42 -0.678 13.434 2.618 1.00 33.55 C -ATOM 396 O ALA A 42 -1.459 12.535 2.319 1.00 33.31 O -ATOM 397 CB ALA A 42 -0.179 13.540 5.083 1.00 31.12 C -ATOM 398 H ALA A 42 1.831 14.705 4.078 1.00 0.00 H -ATOM 399 N ALA A 43 -0.704 14.637 2.027 1.00 34.01 N -ATOM 400 CA ALA A 43 -1.639 14.935 0.940 1.00 34.26 C -ATOM 401 C ALA A 43 -1.164 14.317 -0.400 1.00 35.09 C -ATOM 402 O ALA A 43 -1.780 14.532 -1.444 1.00 36.00 O -ATOM 403 CB ALA A 43 -1.812 16.443 0.800 1.00 32.11 C -ATOM 404 H ALA A 43 -0.088 15.334 2.334 1.00 0.00 H -ATOM 405 N ASN A 44 -0.054 13.575 -0.350 1.00 35.94 N -ATOM 406 CA ASN A 44 0.485 12.867 -1.520 1.00 37.87 C -ATOM 407 C ASN A 44 1.070 13.799 -2.591 1.00 36.65 C -ATOM 408 O ASN A 44 1.132 13.449 -3.777 1.00 37.27 O -ATOM 409 CB ASN A 44 -0.587 11.961 -2.122 1.00 41.40 C -ATOM 410 CG ASN A 44 -1.094 10.943 -1.116 1.00 46.56 C -ATOM 411 OD1 ASN A 44 -2.261 10.973 -0.701 1.00 49.78 O -ATOM 412 ND2 ASN A 44 -0.215 10.039 -0.707 1.00 48.00 N -ATOM 413 H ASN A 44 0.421 13.500 0.500 1.00 0.00 H -ATOM 414 HD21 ASN A 44 -0.504 9.368 -0.057 1.00 0.00 H -ATOM 415 HD22 ASN A 44 0.693 10.076 -1.076 1.00 0.00 H -ATOM 416 N PHE A 45 1.542 14.961 -2.165 1.00 33.67 N -ATOM 417 CA PHE A 45 2.126 15.914 -3.079 1.00 31.23 C -ATOM 418 C PHE A 45 3.596 15.632 -3.306 1.00 31.80 C -ATOM 419 O PHE A 45 4.332 15.338 -2.381 1.00 32.20 O -ATOM 420 CB PHE A 45 1.945 17.322 -2.540 1.00 31.12 C -ATOM 421 CG PHE A 45 0.517 17.781 -2.553 1.00 33.41 C -ATOM 422 CD1 PHE A 45 -0.390 17.273 -3.496 1.00 32.61 C -ATOM 423 CD2 PHE A 45 0.076 18.765 -1.663 1.00 33.98 C -ATOM 424 CE1 PHE A 45 -1.696 17.732 -3.548 1.00 32.35 C -ATOM 425 CE2 PHE A 45 -1.239 19.230 -1.713 1.00 34.17 C -ATOM 426 CZ PHE A 45 -2.122 18.716 -2.658 1.00 33.76 C -ATOM 427 H PHE A 45 1.504 15.175 -1.209 1.00 0.00 H -ATOM 428 N ALA A 46 4.016 15.712 -4.549 1.00 31.48 N -ATOM 429 CA ALA A 46 5.402 15.509 -4.899 1.00 30.26 C -ATOM 430 C ALA A 46 6.235 16.683 -4.414 1.00 30.35 C -ATOM 431 O ALA A 46 5.724 17.782 -4.212 1.00 28.10 O -ATOM 432 CB ALA A 46 5.546 15.368 -6.420 1.00 30.02 C -ATOM 433 H ALA A 46 3.373 15.924 -5.256 1.00 0.00 H -ATOM 434 N LYS A 47 7.531 16.442 -4.304 1.00 32.10 N -ATOM 435 CA LYS A 47 8.483 17.418 -3.792 1.00 32.24 C -ATOM 436 C LYS A 47 8.395 18.800 -4.429 1.00 30.73 C -ATOM 437 O LYS A 47 8.277 19.801 -3.722 1.00 30.50 O -ATOM 438 CB LYS A 47 9.899 16.853 -3.944 1.00 37.40 C -ATOM 439 CG LYS A 47 10.972 17.841 -3.565 1.00 42.56 C -ATOM 440 CD LYS A 47 12.341 17.207 -3.556 1.00 46.91 C -ATOM 441 CE LYS A 47 13.321 18.163 -2.910 1.00 50.20 C -ATOM 442 NZ LYS A 47 12.820 18.645 -1.584 1.00 52.19 N -ATOM 443 H LYS A 47 7.867 15.565 -4.578 1.00 0.00 H -ATOM 444 HZ1 LYS A 47 12.666 17.831 -0.956 1.00 0.00 H -ATOM 445 HZ2 LYS A 47 13.522 19.283 -1.159 1.00 0.00 H -ATOM 446 HZ3 LYS A 47 11.922 19.155 -1.715 1.00 0.00 H -ATOM 447 N ALA A 48 8.475 18.884 -5.757 1.00 29.18 N -ATOM 448 CA ALA A 48 8.416 20.192 -6.406 1.00 27.07 C -ATOM 449 C ALA A 48 7.120 20.934 -6.061 1.00 26.43 C -ATOM 450 O ALA A 48 7.125 22.153 -5.856 1.00 26.30 O -ATOM 451 CB ALA A 48 8.549 20.032 -7.907 1.00 27.43 C -ATOM 452 H ALA A 48 8.573 18.072 -6.295 1.00 0.00 H -ATOM 453 N LYS A 49 6.004 20.204 -5.990 1.00 25.81 N -ATOM 454 CA LYS A 49 4.739 20.835 -5.644 1.00 25.14 C -ATOM 455 C LYS A 49 4.708 21.228 -4.149 1.00 26.02 C -ATOM 456 O LYS A 49 4.271 22.333 -3.807 1.00 26.28 O -ATOM 457 CB LYS A 49 3.557 19.911 -5.998 1.00 23.26 C -ATOM 458 CG LYS A 49 2.204 20.550 -5.749 1.00 21.88 C -ATOM 459 CD LYS A 49 1.068 19.673 -6.205 1.00 21.75 C -ATOM 460 CE LYS A 49 -0.261 20.341 -5.886 1.00 23.25 C -ATOM 461 NZ LYS A 49 -1.431 19.580 -6.417 1.00 25.36 N -ATOM 462 H LYS A 49 6.035 19.244 -6.171 1.00 0.00 H -ATOM 463 HZ1 LYS A 49 -1.317 19.440 -7.442 1.00 0.00 H -ATOM 464 HZ2 LYS A 49 -1.486 18.656 -5.945 1.00 0.00 H -ATOM 465 HZ3 LYS A 49 -2.302 20.115 -6.235 1.00 0.00 H -ATOM 466 N ARG A 50 5.175 20.346 -3.257 1.00 26.65 N -ATOM 467 CA ARG A 50 5.214 20.698 -1.829 1.00 28.25 C -ATOM 468 C ARG A 50 6.004 21.993 -1.639 1.00 29.71 C -ATOM 469 O ARG A 50 5.571 22.889 -0.911 1.00 29.79 O -ATOM 470 CB ARG A 50 5.861 19.596 -0.974 1.00 28.86 C -ATOM 471 CG ARG A 50 5.095 18.281 -0.903 1.00 29.69 C -ATOM 472 CD ARG A 50 5.631 17.384 0.212 1.00 31.10 C -ATOM 473 NE ARG A 50 7.081 17.183 0.132 1.00 33.71 N -ATOM 474 CZ ARG A 50 7.649 16.086 -0.374 1.00 32.93 C -ATOM 475 NH1 ARG A 50 6.913 15.086 -0.812 1.00 33.08 N -ATOM 476 NH2 ARG A 50 8.962 15.997 -0.433 1.00 34.05 N -ATOM 477 H ARG A 50 5.491 19.468 -3.555 1.00 0.00 H -ATOM 478 HE ARG A 50 7.666 17.894 0.470 1.00 0.00 H -ATOM 479 HH11 ARG A 50 5.915 15.141 -0.768 1.00 0.00 H -ATOM 480 HH12 ARG A 50 7.351 14.268 -1.183 1.00 0.00 H -ATOM 481 HH21 ARG A 50 9.530 16.754 -0.109 1.00 0.00 H -ATOM 482 HH22 ARG A 50 9.390 15.182 -0.821 1.00 0.00 H -ATOM 483 N THR A 51 7.156 22.103 -2.293 1.00 30.60 N -ATOM 484 CA THR A 51 7.940 23.328 -2.202 1.00 34.13 C -ATOM 485 C THR A 51 7.126 24.546 -2.664 1.00 36.23 C -ATOM 486 O THR A 51 7.116 25.572 -1.989 1.00 37.79 O -ATOM 487 CB THR A 51 9.229 23.248 -3.045 1.00 34.90 C -ATOM 488 OG1 THR A 51 10.012 22.129 -2.618 1.00 37.41 O -ATOM 489 CG2 THR A 51 10.053 24.516 -2.883 1.00 34.97 C -ATOM 490 H THR A 51 7.478 21.356 -2.840 1.00 0.00 H -ATOM 491 HG1 THR A 51 10.112 22.153 -1.662 1.00 0.00 H -ATOM 492 N ARG A 52 6.437 24.426 -3.808 1.00 36.91 N -ATOM 493 CA ARG A 52 5.643 25.532 -4.334 1.00 37.18 C -ATOM 494 C ARG A 52 4.606 25.971 -3.336 1.00 36.76 C -ATOM 495 O ARG A 52 4.440 27.160 -3.082 1.00 36.25 O -ATOM 496 CB ARG A 52 4.936 25.144 -5.645 1.00 40.06 C -ATOM 497 CG ARG A 52 5.789 25.346 -6.882 1.00 46.55 C -ATOM 498 CD ARG A 52 5.012 25.112 -8.177 1.00 50.64 C -ATOM 499 NE ARG A 52 4.800 23.686 -8.469 1.00 54.17 N -ATOM 500 CZ ARG A 52 3.586 23.152 -8.595 1.00 55.29 C -ATOM 501 NH1 ARG A 52 2.510 23.914 -8.453 1.00 55.77 N -ATOM 502 NH2 ARG A 52 3.448 21.863 -8.859 1.00 54.72 N -ATOM 503 H ARG A 52 6.465 23.577 -4.298 1.00 0.00 H -ATOM 504 HE ARG A 52 5.582 23.107 -8.573 1.00 0.00 H -ATOM 505 HH11 ARG A 52 2.609 24.886 -8.243 1.00 0.00 H -ATOM 506 HH12 ARG A 52 1.601 23.516 -8.532 1.00 0.00 H -ATOM 507 HH21 ARG A 52 4.256 21.283 -8.962 1.00 0.00 H -ATOM 508 HH22 ARG A 52 2.534 21.466 -8.949 1.00 0.00 H -ATOM 509 N ILE A 53 3.911 25.007 -2.763 1.00 35.47 N -ATOM 510 CA ILE A 53 2.880 25.315 -1.797 1.00 34.72 C -ATOM 511 C ILE A 53 3.469 25.944 -0.519 1.00 36.40 C -ATOM 512 O ILE A 53 2.917 26.915 0.007 1.00 35.83 O -ATOM 513 CB ILE A 53 2.060 24.063 -1.457 1.00 32.23 C -ATOM 514 CG1 ILE A 53 1.312 23.604 -2.722 1.00 29.11 C -ATOM 515 CG2 ILE A 53 1.091 24.371 -0.326 1.00 31.92 C -ATOM 516 CD1 ILE A 53 0.519 22.328 -2.562 1.00 26.86 C -ATOM 517 H ILE A 53 4.101 24.073 -2.991 1.00 0.00 H -ATOM 518 N LEU A 54 4.593 25.421 -0.035 1.00 37.08 N -ATOM 519 CA LEU A 54 5.218 26.007 1.135 1.00 40.29 C -ATOM 520 C LEU A 54 5.580 27.455 0.843 1.00 44.75 C -ATOM 521 O LEU A 54 5.191 28.352 1.593 1.00 46.69 O -ATOM 522 CB LEU A 54 6.455 25.213 1.570 1.00 36.32 C -ATOM 523 CG LEU A 54 6.184 23.848 2.250 1.00 35.63 C -ATOM 524 CD1 LEU A 54 7.482 23.082 2.415 1.00 35.47 C -ATOM 525 CD2 LEU A 54 5.495 24.031 3.599 1.00 32.30 C -ATOM 526 H LEU A 54 4.995 24.636 -0.465 1.00 0.00 H -ATOM 527 N GLU A 55 6.255 27.694 -0.278 1.00 48.95 N -ATOM 528 CA GLU A 55 6.653 29.057 -0.641 1.00 53.87 C -ATOM 529 C GLU A 55 5.475 30.011 -0.879 1.00 55.01 C -ATOM 530 O GLU A 55 5.632 31.220 -0.716 1.00 56.05 O -ATOM 531 CB GLU A 55 7.559 29.061 -1.867 1.00 56.02 C -ATOM 532 CG GLU A 55 8.998 28.661 -1.574 1.00 61.71 C -ATOM 533 CD GLU A 55 9.913 28.817 -2.782 1.00 65.77 C -ATOM 534 OE1 GLU A 55 9.578 29.620 -3.692 1.00 67.68 O -ATOM 535 OE2 GLU A 55 10.972 28.141 -2.825 1.00 67.99 O -ATOM 536 H GLU A 55 6.487 26.949 -0.871 1.00 0.00 H -ATOM 537 N LYS A 56 4.300 29.504 -1.233 1.00 56.16 N -ATOM 538 CA LYS A 56 3.190 30.407 -1.512 1.00 57.49 C -ATOM 539 C LYS A 56 2.177 30.484 -0.374 1.00 57.70 C -ATOM 540 O LYS A 56 1.709 31.565 -0.027 1.00 58.88 O -ATOM 541 CB LYS A 56 2.462 30.010 -2.805 1.00 59.37 C -ATOM 542 CG LYS A 56 3.353 29.694 -4.000 1.00 60.92 C -ATOM 543 CD LYS A 56 4.379 30.776 -4.270 1.00 62.11 C -ATOM 544 CE LYS A 56 5.349 30.325 -5.346 1.00 62.44 C -ATOM 545 NZ LYS A 56 6.619 31.101 -5.312 1.00 63.21 N -ATOM 546 H LYS A 56 4.182 28.533 -1.316 1.00 0.00 H -ATOM 547 HZ1 LYS A 56 6.413 32.110 -5.451 1.00 0.00 H -ATOM 548 HZ2 LYS A 56 7.083 30.968 -4.390 1.00 0.00 H -ATOM 549 HZ3 LYS A 56 7.249 30.768 -6.070 1.00 0.00 H -ATOM 550 N GLU A 57 1.827 29.347 0.196 1.00 57.07 N -ATOM 551 CA GLU A 57 0.797 29.311 1.235 1.00 56.65 C -ATOM 552 C GLU A 57 1.332 29.368 2.684 1.00 54.52 C -ATOM 553 O GLU A 57 0.620 29.824 3.598 1.00 54.61 O -ATOM 554 CB GLU A 57 -0.062 28.043 1.078 1.00 59.13 C -ATOM 555 CG GLU A 57 -1.132 28.102 -0.004 1.00 63.67 C -ATOM 556 CD GLU A 57 -0.571 28.357 -1.387 1.00 67.30 C -ATOM 557 OE1 GLU A 57 -0.072 27.402 -2.017 1.00 69.12 O -ATOM 558 OE2 GLU A 57 -0.632 29.519 -1.849 1.00 70.26 O -ATOM 559 H GLU A 57 2.257 28.521 -0.082 1.00 0.00 H -ATOM 560 N VAL A 58 2.570 28.937 2.917 1.00 49.63 N -ATOM 561 CA VAL A 58 3.017 28.786 4.292 1.00 44.43 C -ATOM 562 C VAL A 58 4.100 29.778 4.744 1.00 42.78 C -ATOM 563 O VAL A 58 4.065 30.242 5.888 1.00 40.70 O -ATOM 564 CB VAL A 58 3.470 27.322 4.534 1.00 43.06 C -ATOM 565 CG1 VAL A 58 3.795 27.092 5.998 1.00 40.87 C -ATOM 566 CG2 VAL A 58 2.370 26.369 4.086 1.00 40.46 C -ATOM 567 H VAL A 58 3.172 28.726 2.171 1.00 0.00 H -ATOM 568 N LEU A 59 5.045 30.125 3.873 1.00 39.75 N -ATOM 569 CA LEU A 59 6.126 31.020 4.281 1.00 38.99 C -ATOM 570 C LEU A 59 5.649 32.438 4.643 1.00 38.81 C -ATOM 571 O LEU A 59 6.371 33.182 5.311 1.00 38.40 O -ATOM 572 CB LEU A 59 7.220 31.083 3.218 1.00 40.26 C -ATOM 573 CG LEU A 59 8.011 29.793 2.935 1.00 42.18 C -ATOM 574 CD1 LEU A 59 9.048 30.068 1.854 1.00 43.46 C -ATOM 575 CD2 LEU A 59 8.705 29.285 4.187 1.00 40.89 C -ATOM 576 H LEU A 59 5.019 29.775 2.957 1.00 0.00 H -ATOM 577 N LYS A 60 4.442 32.824 4.220 1.00 37.98 N -ATOM 578 CA LYS A 60 3.900 34.140 4.604 1.00 38.59 C -ATOM 579 C LYS A 60 3.195 34.061 5.973 1.00 36.39 C -ATOM 580 O LYS A 60 2.649 35.028 6.474 1.00 35.79 O -ATOM 581 CB LYS A 60 2.940 34.673 3.522 1.00 41.34 C -ATOM 582 CG LYS A 60 1.766 33.760 3.171 1.00 47.49 C -ATOM 583 CD LYS A 60 0.876 34.407 2.102 1.00 50.85 C -ATOM 584 CE LYS A 60 -0.508 33.757 2.010 1.00 53.27 C -ATOM 585 NZ LYS A 60 -0.459 32.368 1.466 1.00 54.66 N -ATOM 586 H LYS A 60 3.915 32.232 3.649 1.00 0.00 H -ATOM 587 HZ1 LYS A 60 0.153 31.784 2.070 1.00 0.00 H -ATOM 588 HZ2 LYS A 60 -1.418 31.967 1.451 1.00 0.00 H -ATOM 589 HZ3 LYS A 60 -0.076 32.388 0.500 1.00 0.00 H -ATOM 590 N GLU A 61 3.241 32.884 6.559 1.00 35.74 N -ATOM 591 CA GLU A 61 2.635 32.606 7.849 1.00 34.60 C -ATOM 592 C GLU A 61 3.719 32.560 8.935 1.00 30.62 C -ATOM 593 O GLU A 61 4.924 32.542 8.646 1.00 28.48 O -ATOM 594 CB GLU A 61 1.990 31.214 7.782 1.00 39.66 C -ATOM 595 CG GLU A 61 0.636 31.096 8.418 1.00 45.92 C -ATOM 596 CD GLU A 61 -0.377 31.877 7.639 1.00 48.95 C -ATOM 597 OE1 GLU A 61 -0.692 31.467 6.495 1.00 51.19 O -ATOM 598 OE2 GLU A 61 -0.850 32.904 8.161 1.00 51.71 O -ATOM 599 H GLU A 61 3.711 32.155 6.108 1.00 0.00 H -ATOM 600 N THR A 62 3.293 32.544 10.171 1.00 27.25 N -ATOM 601 CA THR A 62 4.222 32.307 11.253 1.00 25.63 C -ATOM 602 C THR A 62 4.784 30.874 11.059 1.00 24.77 C -ATOM 603 O THR A 62 4.029 29.932 10.840 1.00 25.37 O -ATOM 604 CB THR A 62 3.489 32.435 12.612 1.00 24.97 C -ATOM 605 OG1 THR A 62 3.032 33.783 12.735 1.00 26.20 O -ATOM 606 CG2 THR A 62 4.398 32.117 13.789 1.00 21.20 C -ATOM 607 H THR A 62 2.346 32.689 10.363 1.00 0.00 H -ATOM 608 HG1 THR A 62 2.683 34.075 11.886 1.00 0.00 H -ATOM 609 N HIS A 63 6.090 30.727 11.103 1.00 22.46 N -ATOM 610 CA HIS A 63 6.689 29.428 10.867 1.00 21.88 C -ATOM 611 C HIS A 63 8.151 29.435 11.272 1.00 22.48 C -ATOM 612 O HIS A 63 8.745 30.495 11.513 1.00 21.68 O -ATOM 613 CB HIS A 63 6.608 29.071 9.366 1.00 20.21 C -ATOM 614 CG HIS A 63 7.519 29.918 8.512 1.00 20.30 C -ATOM 615 ND1 HIS A 63 7.125 31.124 7.953 1.00 21.50 N -ATOM 616 CD2 HIS A 63 8.845 29.800 8.198 1.00 20.65 C -ATOM 617 CE1 HIS A 63 8.126 31.727 7.333 1.00 20.90 C -ATOM 618 NE2 HIS A 63 9.169 30.942 7.478 1.00 21.55 N -ATOM 619 H HIS A 63 6.663 31.500 11.309 1.00 0.00 H -ATOM 620 HD1 HIS A 63 6.209 31.477 7.991 1.00 0.00 H -ATOM 621 HE2 HIS A 63 10.052 31.147 7.133 1.00 0.00 H -ATOM 622 N GLU A 64 8.738 28.251 11.238 1.00 22.95 N -ATOM 623 CA GLU A 64 10.138 28.055 11.535 1.00 23.61 C -ATOM 624 C GLU A 64 10.697 27.100 10.460 1.00 24.98 C -ATOM 625 O GLU A 64 10.132 26.021 10.254 1.00 24.19 O -ATOM 626 CB GLU A 64 10.199 27.431 12.901 1.00 25.13 C -ATOM 627 CG GLU A 64 11.558 27.257 13.499 1.00 33.54 C -ATOM 628 CD GLU A 64 11.474 26.481 14.804 1.00 36.59 C -ATOM 629 OE1 GLU A 64 10.501 26.685 15.558 1.00 36.12 O -ATOM 630 OE2 GLU A 64 12.376 25.665 15.070 1.00 41.18 O -ATOM 631 H GLU A 64 8.200 27.468 10.997 1.00 0.00 H -ATOM 632 N LYS A 65 11.739 27.531 9.737 1.00 24.36 N -ATOM 633 CA LYS A 65 12.353 26.718 8.693 1.00 28.24 C -ATOM 634 C LYS A 65 13.510 25.954 9.251 1.00 28.33 C -ATOM 635 O LYS A 65 14.585 26.503 9.412 1.00 28.08 O -ATOM 636 CB LYS A 65 12.896 27.587 7.556 1.00 31.73 C -ATOM 637 CG LYS A 65 12.049 27.649 6.299 1.00 36.91 C -ATOM 638 CD LYS A 65 12.165 29.023 5.643 1.00 40.14 C -ATOM 639 CE LYS A 65 11.933 30.111 6.681 1.00 39.32 C -ATOM 640 NZ LYS A 65 11.630 31.435 6.088 1.00 36.54 N -ATOM 641 H LYS A 65 12.110 28.420 9.924 1.00 0.00 H -ATOM 642 HZ1 LYS A 65 12.425 31.734 5.487 1.00 0.00 H -ATOM 643 HZ2 LYS A 65 10.766 31.367 5.511 1.00 0.00 H -ATOM 644 HZ3 LYS A 65 11.487 32.131 6.847 1.00 0.00 H -ATOM 645 N VAL A 66 13.291 24.696 9.552 1.00 31.01 N -ATOM 646 CA VAL A 66 14.358 23.851 10.050 1.00 34.94 C -ATOM 647 C VAL A 66 14.962 23.049 8.896 1.00 39.67 C -ATOM 648 O VAL A 66 14.428 22.006 8.483 1.00 37.52 O -ATOM 649 CB VAL A 66 13.862 22.887 11.168 1.00 34.61 C -ATOM 650 CG1 VAL A 66 14.973 21.935 11.594 1.00 33.81 C -ATOM 651 CG2 VAL A 66 13.401 23.687 12.375 1.00 34.49 C -ATOM 652 H VAL A 66 12.388 24.323 9.443 1.00 0.00 H -ATOM 653 N GLN A 67 16.040 23.586 8.332 1.00 46.01 N -ATOM 654 CA GLN A 67 16.763 22.891 7.275 1.00 53.84 C -ATOM 655 C GLN A 67 18.179 22.570 7.732 1.00 58.95 C -ATOM 656 O GLN A 67 19.013 22.109 6.948 1.00 60.26 O -ATOM 657 CB GLN A 67 16.784 23.703 5.985 1.00 53.89 C -ATOM 658 CG GLN A 67 15.426 23.779 5.294 1.00 59.07 C -ATOM 659 CD GLN A 67 14.657 22.452 5.300 1.00 60.32 C -ATOM 660 OE1 GLN A 67 15.031 21.480 4.629 1.00 62.98 O -ATOM 661 NE2 GLN A 67 13.571 22.404 6.053 1.00 59.66 N -ATOM 662 H GLN A 67 16.348 24.470 8.627 1.00 0.00 H -ATOM 663 HE21 GLN A 67 13.049 21.578 6.062 1.00 0.00 H -ATOM 664 HE22 GLN A 67 13.328 23.200 6.571 1.00 0.00 H -ATOM 665 N GLY A 68 18.428 22.811 9.025 1.00 63.66 N -ATOM 666 CA GLY A 68 19.718 22.513 9.608 1.00 67.82 C -ATOM 667 C GLY A 68 19.631 21.327 10.546 1.00 70.65 C -ATOM 668 O GLY A 68 20.590 20.563 10.690 1.00 72.02 O -ATOM 669 H GLY A 68 17.727 23.193 9.587 1.00 0.00 H -ATOM 670 N GLY A 69 18.484 21.187 11.208 1.00 72.32 N -ATOM 671 CA GLY A 69 18.274 20.048 12.083 1.00 73.41 C -ATOM 672 C GLY A 69 18.041 18.789 11.270 1.00 73.97 C -ATOM 673 O GLY A 69 16.899 18.441 10.969 1.00 75.24 O -ATOM 674 H GLY A 69 17.778 21.853 11.102 1.00 0.00 H -ATOM 675 N PHE A 70 19.137 18.135 10.900 1.00 73.39 N -ATOM 676 CA PHE A 70 19.106 16.920 10.080 1.00 72.45 C -ATOM 677 C PHE A 70 18.165 15.833 10.606 1.00 69.47 C -ATOM 678 O PHE A 70 18.036 15.622 11.819 1.00 69.28 O -ATOM 679 CB PHE A 70 20.534 16.352 9.963 1.00 77.03 C -ATOM 680 CG PHE A 70 20.600 14.896 9.586 1.00 79.94 C -ATOM 681 CD1 PHE A 70 20.367 14.492 8.269 1.00 81.63 C -ATOM 682 CD2 PHE A 70 20.858 13.920 10.561 1.00 80.76 C -ATOM 683 CE1 PHE A 70 20.384 13.141 7.933 1.00 82.97 C -ATOM 684 CE2 PHE A 70 20.875 12.571 10.232 1.00 81.33 C -ATOM 685 CZ PHE A 70 20.638 12.181 8.917 1.00 82.90 C -ATOM 686 H PHE A 70 20.007 18.487 11.182 1.00 0.00 H -ATOM 687 N GLY A 71 17.534 15.127 9.666 1.00 65.37 N -ATOM 688 CA GLY A 71 16.681 14.014 10.024 1.00 60.61 C -ATOM 689 C GLY A 71 15.251 14.174 9.548 1.00 56.43 C -ATOM 690 O GLY A 71 14.949 15.071 8.766 1.00 56.11 O -ATOM 691 H GLY A 71 17.632 15.378 8.724 1.00 0.00 H -ATOM 692 N LYS A 72 14.367 13.295 10.036 1.00 51.93 N -ATOM 693 CA LYS A 72 12.939 13.359 9.704 1.00 47.12 C -ATOM 694 C LYS A 72 12.312 14.620 10.322 1.00 42.99 C -ATOM 695 O LYS A 72 11.172 14.976 10.019 1.00 41.22 O -ATOM 696 CB LYS A 72 12.214 12.127 10.263 1.00 47.52 C -ATOM 697 CG LYS A 72 12.828 10.789 9.890 1.00 47.51 C -ATOM 698 CD LYS A 72 13.208 9.975 11.122 1.00 45.89 C -ATOM 699 CE LYS A 72 12.024 9.749 12.053 1.00 45.99 C -ATOM 700 NZ LYS A 72 10.946 8.941 11.439 1.00 43.61 N -ATOM 701 H LYS A 72 14.682 12.587 10.635 1.00 0.00 H -ATOM 702 HZ1 LYS A 72 10.620 9.405 10.566 1.00 0.00 H -ATOM 703 HZ2 LYS A 72 11.311 7.995 11.214 1.00 0.00 H -ATOM 704 HZ3 LYS A 72 10.153 8.856 12.105 1.00 0.00 H -ATOM 705 N TYR A 73 13.084 15.252 11.211 1.00 38.82 N -ATOM 706 CA TYR A 73 12.666 16.439 11.926 1.00 35.13 C -ATOM 707 C TYR A 73 12.654 17.679 11.023 1.00 33.18 C -ATOM 708 O TYR A 73 11.879 18.607 11.253 1.00 30.17 O -ATOM 709 CB TYR A 73 13.600 16.649 13.125 1.00 32.68 C -ATOM 710 CG TYR A 73 13.198 17.796 14.018 1.00 32.41 C -ATOM 711 CD1 TYR A 73 12.116 17.691 14.884 1.00 31.25 C -ATOM 712 CD2 TYR A 73 13.835 19.025 13.921 1.00 32.40 C -ATOM 713 CE1 TYR A 73 11.679 18.785 15.613 1.00 30.72 C -ATOM 714 CE2 TYR A 73 13.400 20.120 14.644 1.00 32.39 C -ATOM 715 CZ TYR A 73 12.317 19.993 15.478 1.00 30.86 C -ATOM 716 OH TYR A 73 11.840 21.094 16.130 1.00 32.23 O -ATOM 717 H TYR A 73 13.974 14.893 11.393 1.00 0.00 H -ATOM 718 HH TYR A 73 12.352 21.867 15.869 1.00 0.00 H -ATOM 719 N GLN A 74 13.525 17.690 10.013 1.00 31.23 N -ATOM 720 CA GLN A 74 13.605 18.814 9.066 1.00 29.72 C -ATOM 721 C GLN A 74 12.254 19.162 8.468 1.00 26.23 C -ATOM 722 O GLN A 74 11.409 18.291 8.229 1.00 24.41 O -ATOM 723 CB GLN A 74 14.535 18.475 7.902 1.00 33.74 C -ATOM 724 CG GLN A 74 16.010 18.494 8.213 1.00 41.63 C -ATOM 725 CD GLN A 74 16.825 17.988 7.039 1.00 47.74 C -ATOM 726 OE1 GLN A 74 17.535 16.971 7.143 1.00 52.12 O -ATOM 727 NE2 GLN A 74 16.728 18.678 5.908 1.00 49.67 N -ATOM 728 H GLN A 74 14.129 16.927 9.898 1.00 0.00 H -ATOM 729 HE21 GLN A 74 17.240 18.365 5.133 1.00 0.00 H -ATOM 730 HE22 GLN A 74 16.152 19.471 5.887 1.00 0.00 H -ATOM 731 N GLY A 75 12.066 20.432 8.182 1.00 24.61 N -ATOM 732 CA GLY A 75 10.849 20.850 7.522 1.00 22.59 C -ATOM 733 C GLY A 75 10.439 22.235 7.929 1.00 22.00 C -ATOM 734 O GLY A 75 11.189 22.944 8.595 1.00 20.96 O -ATOM 735 H GLY A 75 12.741 21.096 8.433 1.00 0.00 H -ATOM 736 N THR A 76 9.267 22.641 7.507 1.00 22.18 N -ATOM 737 CA THR A 76 8.739 23.926 7.925 1.00 23.13 C -ATOM 738 C THR A 76 7.705 23.707 9.012 1.00 21.22 C -ATOM 739 O THR A 76 6.677 23.047 8.785 1.00 20.41 O -ATOM 740 CB THR A 76 8.129 24.677 6.750 1.00 22.98 C -ATOM 741 OG1 THR A 76 9.172 24.951 5.823 1.00 23.34 O -ATOM 742 CG2 THR A 76 7.529 25.993 7.203 1.00 22.12 C -ATOM 743 H THR A 76 8.743 22.073 6.908 1.00 0.00 H -ATOM 744 HG1 THR A 76 9.671 24.146 5.648 1.00 0.00 H -ATOM 745 N TRP A 77 8.007 24.190 10.198 1.00 18.01 N -ATOM 746 CA TRP A 77 7.115 24.000 11.334 1.00 19.61 C -ATOM 747 C TRP A 77 6.172 25.179 11.495 1.00 20.15 C -ATOM 748 O TRP A 77 6.569 26.324 11.307 1.00 21.17 O -ATOM 749 CB TRP A 77 7.954 23.797 12.587 1.00 18.45 C -ATOM 750 CG TRP A 77 8.738 22.517 12.563 1.00 16.73 C -ATOM 751 CD1 TRP A 77 9.924 22.262 11.889 1.00 19.52 C -ATOM 752 CD2 TRP A 77 8.383 21.314 13.246 1.00 16.18 C -ATOM 753 NE1 TRP A 77 10.287 20.964 12.134 1.00 18.03 N -ATOM 754 CE2 TRP A 77 9.378 20.351 12.952 1.00 18.24 C -ATOM 755 CE3 TRP A 77 7.303 20.950 14.076 1.00 15.09 C -ATOM 756 CZ2 TRP A 77 9.333 19.052 13.464 1.00 17.80 C -ATOM 757 CZ3 TRP A 77 7.263 19.657 14.586 1.00 16.17 C -ATOM 758 CH2 TRP A 77 8.271 18.728 14.275 1.00 16.88 C -ATOM 759 H TRP A 77 8.844 24.682 10.320 1.00 0.00 H -ATOM 760 HE1 TRP A 77 11.083 20.525 11.763 1.00 0.00 H -ATOM 761 N VAL A 78 4.940 24.916 11.848 1.00 19.79 N -ATOM 762 CA VAL A 78 3.960 25.992 11.977 1.00 21.20 C -ATOM 763 C VAL A 78 3.102 25.800 13.232 1.00 22.23 C -ATOM 764 O VAL A 78 3.039 24.692 13.785 1.00 20.52 O -ATOM 765 CB VAL A 78 3.014 26.045 10.738 1.00 20.50 C -ATOM 766 CG1 VAL A 78 3.805 26.352 9.464 1.00 19.09 C -ATOM 767 CG2 VAL A 78 2.264 24.722 10.594 1.00 19.19 C -ATOM 768 H VAL A 78 4.670 23.993 12.035 1.00 0.00 H -ATOM 769 N PRO A 79 2.461 26.879 13.729 1.00 22.62 N -ATOM 770 CA PRO A 79 1.579 26.796 14.902 1.00 23.25 C -ATOM 771 C PRO A 79 0.479 25.793 14.613 1.00 23.88 C -ATOM 772 O PRO A 79 0.126 25.577 13.452 1.00 22.74 O -ATOM 773 CB PRO A 79 1.009 28.217 15.030 1.00 22.80 C -ATOM 774 CG PRO A 79 2.089 29.063 14.441 1.00 23.48 C -ATOM 775 CD PRO A 79 2.583 28.279 13.243 1.00 21.77 C -ATOM 776 N LEU A 80 -0.081 25.221 15.664 1.00 25.83 N -ATOM 777 CA LEU A 80 -1.142 24.222 15.543 1.00 26.16 C -ATOM 778 C LEU A 80 -2.338 24.712 14.733 1.00 28.51 C -ATOM 779 O LEU A 80 -2.846 23.991 13.849 1.00 27.56 O -ATOM 780 CB LEU A 80 -1.606 23.815 16.940 1.00 25.96 C -ATOM 781 CG LEU A 80 -2.660 22.728 17.020 1.00 26.73 C -ATOM 782 CD1 LEU A 80 -2.142 21.452 16.363 1.00 25.64 C -ATOM 783 CD2 LEU A 80 -3.028 22.488 18.480 1.00 29.49 C -ATOM 784 H LEU A 80 0.229 25.469 16.557 1.00 0.00 H -ATOM 785 N ASN A 81 -2.811 25.922 15.016 1.00 30.41 N -ATOM 786 CA ASN A 81 -3.989 26.411 14.305 1.00 33.34 C -ATOM 787 C ASN A 81 -3.726 26.541 12.797 1.00 33.24 C -ATOM 788 O ASN A 81 -4.593 26.200 11.979 1.00 32.55 O -ATOM 789 CB ASN A 81 -4.522 27.720 14.912 1.00 36.72 C -ATOM 790 CG ASN A 81 -3.615 28.898 14.707 1.00 41.39 C -ATOM 791 OD1 ASN A 81 -2.520 28.954 15.254 1.00 45.06 O -ATOM 792 ND2 ASN A 81 -4.064 29.855 13.912 1.00 44.46 N -ATOM 793 H ASN A 81 -2.379 26.474 15.701 1.00 0.00 H -ATOM 794 HD21 ASN A 81 -3.494 30.640 13.765 1.00 0.00 H -ATOM 795 HD22 ASN A 81 -4.947 29.746 13.504 1.00 0.00 H -ATOM 796 N ILE A 82 -2.509 26.970 12.436 1.00 33.12 N -ATOM 797 CA ILE A 82 -2.133 27.108 11.022 1.00 33.42 C -ATOM 798 C ILE A 82 -1.996 25.751 10.338 1.00 33.66 C -ATOM 799 O ILE A 82 -2.344 25.611 9.172 1.00 33.06 O -ATOM 800 CB ILE A 82 -0.820 27.882 10.878 1.00 34.68 C -ATOM 801 CG1 ILE A 82 -1.027 29.318 11.381 1.00 35.90 C -ATOM 802 CG2 ILE A 82 -0.364 27.862 9.424 1.00 32.30 C -ATOM 803 CD1 ILE A 82 0.246 30.062 11.708 1.00 36.35 C -ATOM 804 H ILE A 82 -1.856 27.193 13.129 1.00 0.00 H -ATOM 805 N ALA A 83 -1.487 24.751 11.078 1.00 33.47 N -ATOM 806 CA ALA A 83 -1.385 23.383 10.547 1.00 32.68 C -ATOM 807 C ALA A 83 -2.796 22.798 10.314 1.00 32.07 C -ATOM 808 O ALA A 83 -3.034 22.097 9.335 1.00 30.79 O -ATOM 809 CB ALA A 83 -0.586 22.496 11.509 1.00 31.27 C -ATOM 810 H ALA A 83 -1.184 24.937 11.992 1.00 0.00 H -ATOM 811 N LYS A 84 -3.729 23.093 11.215 1.00 33.43 N -ATOM 812 CA LYS A 84 -5.093 22.639 11.041 1.00 35.11 C -ATOM 813 C LYS A 84 -5.693 23.212 9.756 1.00 36.73 C -ATOM 814 O LYS A 84 -6.318 22.491 8.974 1.00 36.83 O -ATOM 815 CB LYS A 84 -5.948 23.050 12.228 1.00 37.36 C -ATOM 816 CG LYS A 84 -5.607 22.354 13.530 1.00 40.04 C -ATOM 817 CD LYS A 84 -6.871 22.073 14.319 1.00 42.74 C -ATOM 818 CE LYS A 84 -6.559 21.578 15.716 1.00 45.28 C -ATOM 819 NZ LYS A 84 -6.384 22.711 16.664 1.00 49.86 N -ATOM 820 H LYS A 84 -3.489 23.619 12.006 1.00 0.00 H -ATOM 821 HZ1 LYS A 84 -5.641 23.348 16.311 1.00 0.00 H -ATOM 822 HZ2 LYS A 84 -7.280 23.233 16.744 1.00 0.00 H -ATOM 823 HZ3 LYS A 84 -6.113 22.344 17.598 1.00 0.00 H -ATOM 824 N GLN A 85 -5.504 24.510 9.535 1.00 37.40 N -ATOM 825 CA GLN A 85 -5.981 25.141 8.298 1.00 38.47 C -ATOM 826 C GLN A 85 -5.414 24.411 7.065 1.00 37.19 C -ATOM 827 O GLN A 85 -6.144 24.015 6.168 1.00 36.76 O -ATOM 828 CB GLN A 85 -5.550 26.617 8.243 1.00 41.65 C -ATOM 829 CG GLN A 85 -6.176 27.513 9.302 1.00 47.67 C -ATOM 830 CD GLN A 85 -5.653 28.953 9.274 1.00 52.44 C -ATOM 831 OE1 GLN A 85 -4.985 29.379 8.321 1.00 53.70 O -ATOM 832 NE2 GLN A 85 -5.956 29.710 10.327 1.00 54.30 N -ATOM 833 H GLN A 85 -5.029 25.050 10.201 1.00 0.00 H -ATOM 834 HE21 GLN A 85 -5.645 30.638 10.336 1.00 0.00 H -ATOM 835 HE22 GLN A 85 -6.483 29.308 11.051 1.00 0.00 H -ATOM 836 N LEU A 86 -4.107 24.239 7.050 1.00 35.90 N -ATOM 837 CA LEU A 86 -3.427 23.593 5.952 1.00 35.57 C -ATOM 838 C LEU A 86 -3.973 22.187 5.705 1.00 36.04 C -ATOM 839 O LEU A 86 -4.216 21.789 4.568 1.00 35.67 O -ATOM 840 CB LEU A 86 -1.940 23.522 6.282 1.00 35.24 C -ATOM 841 CG LEU A 86 -0.979 23.392 5.104 1.00 37.99 C -ATOM 842 CD1 LEU A 86 -1.046 24.641 4.236 1.00 37.21 C -ATOM 843 CD2 LEU A 86 0.434 23.187 5.623 1.00 37.56 C -ATOM 844 H LEU A 86 -3.579 24.563 7.810 1.00 0.00 H -ATOM 845 N ALA A 87 -4.167 21.440 6.774 1.00 37.61 N -ATOM 846 CA ALA A 87 -4.658 20.075 6.672 1.00 40.07 C -ATOM 847 C ALA A 87 -6.071 20.045 6.108 1.00 42.25 C -ATOM 848 O ALA A 87 -6.423 19.123 5.387 1.00 44.08 O -ATOM 849 CB ALA A 87 -4.614 19.402 8.041 1.00 37.62 C -ATOM 850 H ALA A 87 -3.984 21.816 7.658 1.00 0.00 H -ATOM 851 N GLU A 88 -6.881 21.042 6.453 1.00 44.94 N -ATOM 852 CA GLU A 88 -8.250 21.137 5.934 1.00 47.72 C -ATOM 853 C GLU A 88 -8.249 21.462 4.446 1.00 46.92 C -ATOM 854 O GLU A 88 -8.935 20.809 3.652 1.00 46.82 O -ATOM 855 CB GLU A 88 -9.029 22.238 6.647 1.00 51.27 C -ATOM 856 CG GLU A 88 -9.499 21.887 8.035 1.00 58.64 C -ATOM 857 CD GLU A 88 -10.532 22.873 8.532 1.00 63.08 C -ATOM 858 OE1 GLU A 88 -11.497 23.154 7.774 1.00 65.53 O -ATOM 859 OE2 GLU A 88 -10.381 23.370 9.674 1.00 64.92 O -ATOM 860 H GLU A 88 -6.554 21.730 7.069 1.00 0.00 H -ATOM 861 N LYS A 89 -7.484 22.490 4.087 1.00 45.19 N -ATOM 862 CA LYS A 89 -7.401 22.930 2.722 1.00 45.73 C -ATOM 863 C LYS A 89 -7.064 21.776 1.802 1.00 45.59 C -ATOM 864 O LYS A 89 -7.728 21.571 0.792 1.00 46.84 O -ATOM 865 CB LYS A 89 -6.346 24.019 2.592 1.00 46.57 C -ATOM 866 CG LYS A 89 -6.374 24.759 1.269 1.00 49.11 C -ATOM 867 CD LYS A 89 -5.470 25.976 1.314 1.00 52.19 C -ATOM 868 CE LYS A 89 -5.826 26.963 0.216 1.00 55.10 C -ATOM 869 NZ LYS A 89 -5.139 28.274 0.395 1.00 56.62 N -ATOM 870 H LYS A 89 -6.963 22.959 4.773 1.00 0.00 H -ATOM 871 HZ1 LYS A 89 -4.109 28.127 0.406 1.00 0.00 H -ATOM 872 HZ2 LYS A 89 -5.390 28.905 -0.391 1.00 0.00 H -ATOM 873 HZ3 LYS A 89 -5.437 28.704 1.294 1.00 0.00 H -ATOM 874 N PHE A 90 -6.055 21.001 2.163 1.00 44.53 N -ATOM 875 CA PHE A 90 -5.631 19.900 1.314 1.00 44.24 C -ATOM 876 C PHE A 90 -6.275 18.576 1.716 1.00 44.45 C -ATOM 877 O PHE A 90 -5.737 17.496 1.463 1.00 44.80 O -ATOM 878 CB PHE A 90 -4.099 19.837 1.283 1.00 43.69 C -ATOM 879 CG PHE A 90 -3.510 21.100 0.707 1.00 43.58 C -ATOM 880 CD1 PHE A 90 -3.664 21.403 -0.642 1.00 44.38 C -ATOM 881 CD2 PHE A 90 -2.881 22.034 1.523 1.00 44.26 C -ATOM 882 CE1 PHE A 90 -3.212 22.610 -1.165 1.00 43.38 C -ATOM 883 CE2 PHE A 90 -2.425 23.246 1.011 1.00 43.71 C -ATOM 884 CZ PHE A 90 -2.592 23.535 -0.337 1.00 43.90 C -ATOM 885 H PHE A 90 -5.588 21.170 3.009 1.00 0.00 H -ATOM 886 N SER A 91 -7.444 18.690 2.345 1.00 45.17 N -ATOM 887 CA SER A 91 -8.282 17.543 2.686 1.00 45.85 C -ATOM 888 C SER A 91 -7.553 16.348 3.290 1.00 45.16 C -ATOM 889 O SER A 91 -7.662 15.229 2.790 1.00 45.12 O -ATOM 890 CB SER A 91 -9.061 17.113 1.441 1.00 48.12 C -ATOM 891 OG SER A 91 -9.727 18.233 0.864 1.00 51.11 O -ATOM 892 H SER A 91 -7.764 19.584 2.580 1.00 0.00 H -ATOM 893 HG SER A 91 -10.205 17.955 0.079 1.00 0.00 H -ATOM 894 N VAL A 92 -6.811 16.583 4.361 1.00 44.55 N -ATOM 895 CA VAL A 92 -6.196 15.487 5.129 1.00 44.43 C -ATOM 896 C VAL A 92 -6.451 15.690 6.627 1.00 43.59 C -ATOM 897 O VAL A 92 -5.911 14.975 7.471 1.00 42.35 O -ATOM 898 CB VAL A 92 -4.657 15.344 4.880 1.00 44.50 C -ATOM 899 CG1 VAL A 92 -4.413 14.652 3.553 1.00 44.93 C -ATOM 900 CG2 VAL A 92 -3.972 16.697 4.904 1.00 43.55 C -ATOM 901 H VAL A 92 -6.657 17.507 4.637 1.00 0.00 H -ATOM 902 N TYR A 93 -7.311 16.652 6.938 1.00 44.06 N -ATOM 903 CA TYR A 93 -7.606 16.994 8.321 1.00 46.56 C -ATOM 904 C TYR A 93 -8.156 15.815 9.115 1.00 47.20 C -ATOM 905 O TYR A 93 -7.747 15.568 10.249 1.00 45.84 O -ATOM 906 CB TYR A 93 -8.590 18.172 8.392 1.00 48.04 C -ATOM 907 CG TYR A 93 -8.880 18.600 9.814 1.00 51.15 C -ATOM 908 CD1 TYR A 93 -8.058 19.512 10.466 1.00 52.01 C -ATOM 909 CD2 TYR A 93 -9.901 17.996 10.550 1.00 51.74 C -ATOM 910 CE1 TYR A 93 -8.234 19.796 11.806 1.00 53.05 C -ATOM 911 CE2 TYR A 93 -10.083 18.274 11.891 1.00 52.13 C -ATOM 912 CZ TYR A 93 -9.243 19.172 12.513 1.00 53.58 C -ATOM 913 OH TYR A 93 -9.405 19.442 13.848 1.00 56.47 O -ATOM 914 H TYR A 93 -7.753 17.146 6.220 1.00 0.00 H -ATOM 915 HH TYR A 93 -10.182 18.981 14.176 1.00 0.00 H -ATOM 916 N ASP A 94 -9.076 15.086 8.529 1.00 48.64 N -ATOM 917 CA ASP A 94 -9.678 13.962 9.232 1.00 50.01 C -ATOM 918 C ASP A 94 -8.697 12.805 9.419 1.00 49.07 C -ATOM 919 O ASP A 94 -8.827 12.031 10.370 1.00 48.92 O -ATOM 920 CB ASP A 94 -10.964 13.515 8.517 1.00 53.54 C -ATOM 921 CG ASP A 94 -12.120 14.474 8.796 1.00 54.92 C -ATOM 922 OD1 ASP A 94 -12.762 14.329 9.852 1.00 57.73 O -ATOM 923 OD2 ASP A 94 -12.379 15.377 7.969 1.00 56.24 O -ATOM 924 H ASP A 94 -9.357 15.301 7.615 1.00 0.00 H -ATOM 925 N GLN A 95 -7.712 12.698 8.520 1.00 49.21 N -ATOM 926 CA GLN A 95 -6.664 11.678 8.659 1.00 49.95 C -ATOM 927 C GLN A 95 -5.677 12.029 9.780 1.00 48.73 C -ATOM 928 O GLN A 95 -5.206 11.146 10.495 1.00 48.14 O -ATOM 929 CB GLN A 95 -5.871 11.526 7.358 1.00 51.32 C -ATOM 930 CG GLN A 95 -6.617 10.859 6.227 1.00 54.77 C -ATOM 931 CD GLN A 95 -5.805 10.848 4.952 1.00 57.17 C -ATOM 932 OE1 GLN A 95 -4.715 10.277 4.905 1.00 57.65 O -ATOM 933 NE2 GLN A 95 -6.325 11.483 3.912 1.00 58.76 N -ATOM 934 H GLN A 95 -7.694 13.305 7.752 1.00 0.00 H -ATOM 935 HE21 GLN A 95 -5.808 11.509 3.079 1.00 0.00 H -ATOM 936 HE22 GLN A 95 -7.202 11.904 4.016 1.00 0.00 H -ATOM 937 N LEU A 96 -5.360 13.327 9.908 1.00 48.04 N -ATOM 938 CA LEU A 96 -4.374 13.800 10.893 1.00 46.14 C -ATOM 939 C LEU A 96 -5.003 14.231 12.202 1.00 45.87 C -ATOM 940 O LEU A 96 -4.285 14.496 13.166 1.00 44.88 O -ATOM 941 CB LEU A 96 -3.579 14.981 10.323 1.00 43.86 C -ATOM 942 CG LEU A 96 -3.107 14.825 8.881 1.00 43.10 C -ATOM 943 CD1 LEU A 96 -2.080 15.892 8.542 1.00 40.00 C -ATOM 944 CD2 LEU A 96 -2.533 13.432 8.681 1.00 42.10 C -ATOM 945 H LEU A 96 -5.794 13.981 9.318 1.00 0.00 H -ATOM 946 N LYS A 97 -6.332 14.297 12.237 1.00 47.18 N -ATOM 947 CA LYS A 97 -7.053 14.723 13.436 1.00 47.61 C -ATOM 948 C LYS A 97 -6.528 14.080 14.736 1.00 45.43 C -ATOM 949 O LYS A 97 -6.293 14.784 15.717 1.00 44.43 O -ATOM 950 CB LYS A 97 -8.568 14.489 13.291 1.00 50.67 C -ATOM 951 CG LYS A 97 -9.336 15.078 14.463 1.00 56.31 C -ATOM 952 CD LYS A 97 -10.823 15.199 14.216 1.00 59.48 C -ATOM 953 CE LYS A 97 -11.463 16.020 15.331 1.00 61.13 C -ATOM 954 NZ LYS A 97 -12.926 16.202 15.134 1.00 63.44 N -ATOM 955 H LYS A 97 -6.842 14.065 11.432 1.00 0.00 H -ATOM 956 HZ1 LYS A 97 -13.098 16.675 14.224 1.00 0.00 H -ATOM 957 HZ2 LYS A 97 -13.392 15.273 15.137 1.00 0.00 H -ATOM 958 HZ3 LYS A 97 -13.309 16.784 15.906 1.00 0.00 H -ATOM 959 N PRO A 98 -6.334 12.753 14.803 1.00 44.31 N -ATOM 960 CA PRO A 98 -5.818 12.119 16.014 1.00 45.37 C -ATOM 961 C PRO A 98 -4.589 12.847 16.590 1.00 46.45 C -ATOM 962 O PRO A 98 -4.526 13.091 17.795 1.00 47.44 O -ATOM 963 CB PRO A 98 -5.497 10.687 15.575 1.00 43.63 C -ATOM 964 CG PRO A 98 -5.537 10.749 14.086 1.00 44.43 C -ATOM 965 CD PRO A 98 -6.611 11.744 13.777 1.00 43.98 C -ATOM 966 N LEU A 99 -3.638 13.217 15.725 1.00 46.20 N -ATOM 967 CA LEU A 99 -2.427 13.892 16.177 1.00 45.20 C -ATOM 968 C LEU A 99 -2.731 15.288 16.672 1.00 46.29 C -ATOM 969 O LEU A 99 -2.212 15.707 17.705 1.00 45.15 O -ATOM 970 CB LEU A 99 -1.386 13.979 15.053 1.00 42.84 C -ATOM 971 CG LEU A 99 -0.093 14.741 15.389 1.00 41.15 C -ATOM 972 CD1 LEU A 99 0.804 13.895 16.275 1.00 38.20 C -ATOM 973 CD2 LEU A 99 0.626 15.131 14.117 1.00 39.05 C -ATOM 974 H LEU A 99 -3.759 13.036 14.770 1.00 0.00 H -ATOM 975 N PHE A 100 -3.564 16.007 15.933 1.00 48.58 N -ATOM 976 CA PHE A 100 -3.896 17.372 16.305 1.00 52.20 C -ATOM 977 C PHE A 100 -4.517 17.429 17.688 1.00 56.06 C -ATOM 978 O PHE A 100 -4.089 18.213 18.537 1.00 56.52 O -ATOM 979 CB PHE A 100 -4.865 18.008 15.296 1.00 50.34 C -ATOM 980 CG PHE A 100 -4.309 18.236 13.913 1.00 48.52 C -ATOM 981 CD1 PHE A 100 -2.950 18.478 13.717 1.00 46.65 C -ATOM 982 CD2 PHE A 100 -5.158 18.231 12.803 1.00 47.63 C -ATOM 983 CE1 PHE A 100 -2.447 18.713 12.445 1.00 46.95 C -ATOM 984 CE2 PHE A 100 -4.662 18.466 11.530 1.00 46.65 C -ATOM 985 CZ PHE A 100 -3.304 18.707 11.350 1.00 46.70 C -ATOM 986 H PHE A 100 -3.954 15.615 15.124 1.00 0.00 H -ATOM 987 N ASP A 101 -5.517 16.594 17.924 1.00 60.72 N -ATOM 988 CA ASP A 101 -6.204 16.632 19.205 1.00 66.29 C -ATOM 989 C ASP A 101 -5.449 15.864 20.289 1.00 68.12 C -ATOM 990 O ASP A 101 -5.728 16.047 21.477 1.00 69.45 O -ATOM 991 CB ASP A 101 -7.653 16.132 19.071 1.00 68.88 C -ATOM 992 CG ASP A 101 -7.782 14.625 19.028 1.00 72.53 C -ATOM 993 OD1 ASP A 101 -7.085 13.994 18.212 1.00 74.44 O -ATOM 994 OD2 ASP A 101 -8.584 14.071 19.818 1.00 73.84 O -ATOM 995 H ASP A 101 -5.795 15.955 17.233 1.00 0.00 H -ATOM 996 N PHE A 102 -4.497 15.014 19.881 1.00 69.09 N -ATOM 997 CA PHE A 102 -3.676 14.272 20.835 1.00 69.65 C -ATOM 998 C PHE A 102 -3.031 15.235 21.825 1.00 70.64 C -ATOM 999 O PHE A 102 -2.775 14.878 22.974 1.00 72.94 O -ATOM 1000 CB PHE A 102 -2.583 13.502 20.091 1.00 70.00 C -ATOM 1001 CG PHE A 102 -1.745 12.597 20.951 1.00 71.29 C -ATOM 1002 CD1 PHE A 102 -0.639 13.089 21.637 1.00 71.76 C -ATOM 1003 CD2 PHE A 102 -2.053 11.238 21.062 1.00 72.61 C -ATOM 1004 CE1 PHE A 102 0.139 12.248 22.414 1.00 72.74 C -ATOM 1005 CE2 PHE A 102 -1.274 10.387 21.838 1.00 72.58 C -ATOM 1006 CZ PHE A 102 -0.177 10.895 22.516 1.00 73.27 C -ATOM 1007 H PHE A 102 -4.346 14.884 18.921 1.00 0.00 H -TER 1008 PHE A 102 -HETATM 1009 O HOH A 401 11.442 26.376 18.419 1.00 38.23 O -HETATM 1010 H1 HOH A 401 12.360 26.094 18.365 1.00 0.00 H -HETATM 1011 H2 HOH A 401 11.489 27.267 18.767 1.00 0.00 H -HETATM 1012 O HOH A 402 8.649 28.512 17.527 1.00 47.94 O -HETATM 1013 H1 HOH A 402 9.202 27.788 17.213 1.00 0.00 H -HETATM 1014 H2 HOH A 402 7.878 28.486 16.957 1.00 0.00 H -HETATM 1015 O HOH A 403 7.263 28.403 19.944 1.00 38.55 O -HETATM 1016 H1 HOH A 403 7.266 27.444 19.925 1.00 0.00 H -HETATM 1017 H2 HOH A 403 7.891 28.655 19.252 1.00 0.00 H -HETATM 1018 O HOH A 404 13.823 23.249 15.906 1.00 61.76 O -HETATM 1019 H1 HOH A 404 14.758 23.159 15.681 1.00 0.00 H -HETATM 1020 H2 HOH A 404 13.741 24.157 16.204 1.00 0.00 H -HETATM 1021 O HOH A 405 8.756 28.493 22.514 1.00 66.03 O -HETATM 1022 H1 HOH A 405 8.339 28.510 21.650 1.00 0.00 H -HETATM 1023 H2 HOH A 405 8.556 29.355 22.893 1.00 0.00 H -HETATM 1024 O HOH A 406 9.224 19.780 22.203 1.00 22.24 O -HETATM 1025 H1 HOH A 406 9.276 19.201 21.436 1.00 0.00 H -HETATM 1026 H2 HOH A 406 9.990 19.533 22.736 1.00 0.00 H -HETATM 1027 O HOH A 407 11.643 19.276 23.871 1.00 44.82 O -HETATM 1028 H1 HOH A 407 12.275 19.960 23.620 1.00 0.00 H -HETATM 1029 H2 HOH A 407 11.978 18.952 24.712 1.00 0.00 H -HETATM 1030 O HOH A 408 7.638 19.412 26.856 1.00 66.34 O -HETATM 1031 H1 HOH A 408 7.334 19.672 27.732 1.00 0.00 H -HETATM 1032 H2 HOH A 408 8.293 18.736 27.024 1.00 0.00 H -HETATM 1033 O HOH A 409 9.788 12.718 23.881 1.00 35.90 O -HETATM 1034 H1 HOH A 409 10.485 13.349 24.074 1.00 0.00 H -HETATM 1035 H2 HOH A 409 9.534 12.912 22.975 1.00 0.00 H -HETATM 1036 O HOH A 410 -7.039 27.560 12.371 1.00 76.53 O -HETATM 1037 H1 HOH A 410 -7.871 27.092 12.461 1.00 0.00 H -HETATM 1038 H2 HOH A 410 -6.381 26.862 12.283 1.00 0.00 H -HETATM 1039 O HOH A 411 10.636 15.015 28.679 1.00 79.82 O -HETATM 1040 H1 HOH A 411 10.754 14.224 29.205 1.00 0.00 H -HETATM 1041 H2 HOH A 411 9.685 15.085 28.566 1.00 0.00 H -HETATM 1042 O HOH A 412 -5.406 19.815 21.604 1.00 67.01 O -HETATM 1043 H1 HOH A 412 -5.059 20.294 22.359 1.00 0.00 H -HETATM 1044 H2 HOH A 412 -5.402 18.897 21.884 1.00 0.00 H -HETATM 1045 O HOH A 413 0.948 26.025 18.289 1.00 28.37 O -HETATM 1046 H1 HOH A 413 1.360 25.442 18.933 1.00 0.00 H -HETATM 1047 H2 HOH A 413 1.280 26.901 18.518 1.00 0.00 H -HETATM 1048 O HOH A 414 2.348 27.103 21.691 1.00 40.51 O -HETATM 1049 H1 HOH A 414 2.244 26.285 21.195 1.00 0.00 H -HETATM 1050 H2 HOH A 414 2.771 27.701 21.073 1.00 0.00 H -HETATM 1051 O HOH A 415 1.783 28.751 19.142 1.00 45.14 O -HETATM 1052 H1 HOH A 415 2.466 29.079 19.741 1.00 0.00 H -HETATM 1053 H2 HOH A 415 1.057 29.370 19.247 1.00 0.00 H -HETATM 1054 O HOH A 416 -1.813 27.629 17.603 1.00 63.33 O -HETATM 1055 H1 HOH A 416 -0.906 27.508 17.899 1.00 0.00 H -HETATM 1056 H2 HOH A 416 -1.823 28.521 17.231 1.00 0.00 H -HETATM 1057 O HOH A 417 0.364 33.475 10.829 1.00 43.72 O -HETATM 1058 H1 HOH A 417 -0.450 33.139 10.448 1.00 0.00 H -HETATM 1059 H2 HOH A 417 0.123 33.712 11.729 1.00 0.00 H -HETATM 1060 O HOH A 418 3.290 35.799 10.789 1.00 45.96 O -HETATM 1061 H1 HOH A 418 2.521 35.871 11.354 1.00 0.00 H -HETATM 1062 H2 HOH A 418 2.954 36.032 9.910 1.00 0.00 H -HETATM 1063 O HOH A 419 8.914 16.633 -7.731 1.00 47.58 O -HETATM 1064 H1 HOH A 419 8.580 16.211 -8.527 1.00 0.00 H -HETATM 1065 H2 HOH A 419 9.739 17.055 -8.014 1.00 0.00 H -HETATM 1066 O HOH A 420 16.804 28.181 7.657 1.00 52.61 O -HETATM 1067 H1 HOH A 420 17.349 28.921 7.925 1.00 0.00 H -HETATM 1068 H2 HOH A 420 17.428 27.548 7.300 1.00 0.00 H -HETATM 1069 O HOH A 421 4.841 5.174 7.671 1.00 54.02 O -HETATM 1070 H1 HOH A 421 4.992 4.811 6.796 1.00 0.00 H -HETATM 1071 H2 HOH A 421 3.969 5.585 7.610 1.00 0.00 H -HETATM 1072 O HOH A 422 6.123 12.466 6.644 1.00 38.59 O -HETATM 1073 H1 HOH A 422 6.354 11.569 6.880 1.00 0.00 H -HETATM 1074 H2 HOH A 422 5.242 12.393 6.258 1.00 0.00 H -HETATM 1075 O HOH A 423 3.623 12.224 6.231 1.00 46.24 O -HETATM 1076 H1 HOH A 423 3.260 11.491 6.732 1.00 0.00 H -HETATM 1077 H2 HOH A 423 3.150 12.995 6.560 1.00 0.00 H -HETATM 1078 O HOH A 424 8.696 11.998 9.005 1.00 59.93 O -HETATM 1079 H1 HOH A 424 7.734 12.042 9.009 1.00 0.00 H -HETATM 1080 H2 HOH A 424 8.947 12.160 9.914 1.00 0.00 H -HETATM 1081 O HOH A 425 8.405 9.129 7.648 1.00 61.20 O -HETATM 1082 H1 HOH A 425 9.210 8.614 7.550 1.00 0.00 H -HETATM 1083 H2 HOH A 425 8.701 9.956 8.049 1.00 0.00 H -HETATM 1084 O HOH A 426 18.447 13.535 15.604 1.00 34.60 O -HETATM 1085 H1 HOH A 426 18.325 12.712 16.083 1.00 0.00 H -HETATM 1086 H2 HOH A 426 17.838 13.470 14.861 1.00 0.00 H -HETATM 1087 O HOH A 427 12.794 20.256 3.954 1.00 62.89 O -HETATM 1088 H1 HOH A 427 13.638 20.705 4.102 1.00 0.00 H -HETATM 1089 H2 HOH A 427 13.034 19.453 3.487 1.00 0.00 H -HETATM 1090 O HOH A 428 8.847 19.809 0.651 1.00 65.07 O -HETATM 1091 H1 HOH A 428 8.427 19.180 1.242 1.00 0.00 H -HETATM 1092 H2 HOH A 428 8.764 20.651 1.101 1.00 0.00 H -HETATM 1093 O HOH A 429 -2.878 19.586 20.641 1.00 55.95 O -HETATM 1094 H1 HOH A 429 -3.712 19.246 20.304 1.00 0.00 H -HETATM 1095 H2 HOH A 429 -2.949 20.533 20.530 1.00 0.00 H -HETATM 1096 O HOH A 430 -3.389 10.814 2.153 1.00 68.44 O -HETATM 1097 H1 HOH A 430 -3.370 10.574 1.223 1.00 0.00 H -HETATM 1098 H2 HOH A 430 -2.731 11.518 2.225 1.00 0.00 H -HETATM 1099 O HOH A 431 7.974 6.841 9.094 1.00 81.57 O -HETATM 1100 H1 HOH A 431 7.873 7.036 8.159 1.00 0.00 H -HETATM 1101 H2 HOH A 431 7.642 5.943 9.185 1.00 0.00 H -HETATM 1102 O HOH A 432 8.985 13.925 -7.061 1.00 46.17 O -HETATM 1103 H1 HOH A 432 9.892 13.636 -6.937 1.00 0.00 H -HETATM 1104 H2 HOH A 432 9.045 14.887 -7.113 1.00 0.00 H -HETATM 1105 O HOH A 433 11.459 17.807 -8.216 1.00 61.98 O -HETATM 1106 H1 HOH A 433 12.207 17.850 -7.615 1.00 0.00 H -HETATM 1107 H2 HOH A 433 11.478 18.651 -8.675 1.00 0.00 H -HETATM 1108 O HOH A 434 -10.484 15.879 5.891 1.00 49.08 O -HETATM 1109 H1 HOH A 434 -10.763 16.064 4.990 1.00 0.00 H -HETATM 1110 H2 HOH A 434 -11.213 16.190 6.431 1.00 0.00 H -HETATM 1111 O HOH A 435 12.930 13.009 26.185 1.00 43.86 O -HETATM 1112 H1 HOH A 435 12.963 13.330 27.087 1.00 0.00 H -HETATM 1113 H2 HOH A 435 13.476 13.625 25.694 1.00 0.00 H -HETATM 1114 O HOH A 436 -3.464 25.858 19.747 1.00 63.70 O -HETATM 1115 H1 HOH A 436 -3.471 26.403 18.954 1.00 0.00 H -HETATM 1116 H2 HOH A 436 -2.587 25.992 20.114 1.00 0.00 H -HETATM 1117 O HOH A 437 6.235 16.677 28.203 1.00 68.03 O -HETATM 1118 H1 HOH A 437 6.291 17.517 28.663 1.00 0.00 H -HETATM 1119 H2 HOH A 437 5.340 16.667 27.835 1.00 0.00 H -HETATM 1120 O HOH A 438 7.423 17.512 -10.650 1.00 57.40 O -HETATM 1121 H1 HOH A 438 7.010 16.951 -9.986 1.00 0.00 H -HETATM 1122 H2 HOH A 438 7.702 16.894 -11.334 1.00 0.00 H -HETATM 1123 O HOH A 439 -5.355 10.866 19.619 1.00 51.92 O -HETATM 1124 H1 HOH A 439 -6.252 10.945 19.294 1.00 0.00 H -HETATM 1125 H2 HOH A 439 -4.871 11.550 19.149 1.00 0.00 H -HETATM 1126 O HOH A 440 -8.867 11.724 17.801 1.00 59.09 O -HETATM 1127 H1 HOH A 440 -8.909 12.448 18.427 1.00 0.00 H -HETATM 1128 H2 HOH A 440 -9.457 11.061 18.162 1.00 0.00 H -HETATM 1129 O HOH A 441 13.107 15.120 7.186 1.00 56.17 O -HETATM 1130 H1 HOH A 441 12.362 15.432 7.708 1.00 0.00 H -HETATM 1131 H2 HOH A 441 13.869 15.225 7.770 1.00 0.00 H -HETATM 1132 O HOH A 442 -2.200 10.629 25.072 1.00 84.96 O -HETATM 1133 H1 HOH A 442 -1.698 11.431 25.238 1.00 0.00 H -HETATM 1134 H2 HOH A 442 -3.040 10.942 24.729 1.00 0.00 H -HETATM 1135 O HOH A 444 1.798 36.196 8.660 1.00 69.55 O -HETATM 1136 H1 HOH A 444 2.171 36.075 7.775 1.00 0.00 H -HETATM 1137 H2 HOH A 444 1.186 35.465 8.757 1.00 0.00 H -HETATM 1138 O HOH A 446 12.829 16.619 28.388 1.00 76.91 O -HETATM 1139 H1 HOH A 446 12.031 17.139 28.283 1.00 0.00 H -HETATM 1140 H2 HOH A 446 12.511 15.764 28.684 1.00 0.00 H -HETATM 1141 O HOH A 447 -1.714 7.995 25.869 1.00 53.32 O -HETATM 1142 H1 HOH A 447 -1.215 7.807 25.076 1.00 0.00 H -HETATM 1143 H2 HOH A 447 -1.895 8.941 25.818 1.00 0.00 H -HETATM 1144 O HOH A 449 17.342 21.354 17.381 1.00 78.08 O -HETATM 1145 H1 HOH A 449 17.257 20.526 17.868 1.00 0.00 H -HETATM 1146 H2 HOH A 449 17.020 22.020 17.988 1.00 0.00 H -HETATM 1147 O HOH A 450 17.554 22.356 21.606 1.00 81.11 O -HETATM 1148 H1 HOH A 450 17.863 21.463 21.445 1.00 0.00 H -HETATM 1149 H2 HOH A 450 18.333 22.902 21.491 1.00 0.00 H -HETATM 1150 O HOH A 451 21.261 19.604 17.525 1.00 60.20 O -HETATM 1151 H1 HOH A 451 21.971 20.078 17.088 1.00 0.00 H -HETATM 1152 H2 HOH A 451 20.490 20.166 17.407 1.00 0.00 H -HETATM 1153 O HOH A 452 20.618 19.027 20.159 1.00 71.08 O -HETATM 1154 H1 HOH A 452 20.831 19.188 19.232 1.00 0.00 H -HETATM 1155 H2 HOH A 452 21.279 18.398 20.447 1.00 0.00 H -HETATM 1156 O HOH A 454 3.691 16.091 27.806 1.00 75.85 O -HETATM 1157 H1 HOH A 454 3.113 15.469 27.354 1.00 0.00 H -HETATM 1158 H2 HOH A 454 3.644 15.832 28.729 1.00 0.00 H -HETATM 1159 O HOH A 456 17.778 15.979 4.727 1.00 87.15 O -HETATM 1160 H1 HOH A 456 17.578 15.048 4.815 1.00 0.00 H -HETATM 1161 H2 HOH A 456 17.841 16.297 5.638 1.00 0.00 H -HETATM 1162 O HOH A 457 2.784 6.732 0.413 1.00 58.64 O -HETATM 1163 H1 HOH A 457 3.270 6.190 1.038 1.00 0.00 H -HETATM 1164 H2 HOH A 457 2.569 6.134 -0.304 1.00 0.00 H -HETATM 1165 O HOH A 458 6.812 6.267 3.872 1.00 78.10 O -HETATM 1166 H1 HOH A 458 6.068 6.869 3.796 1.00 0.00 H -HETATM 1167 H2 HOH A 458 7.515 6.697 3.386 1.00 0.00 H -HETATM 1168 O HOH A 459 11.360 23.250 27.379 1.00 91.15 O -HETATM 1169 H1 HOH A 459 10.875 24.075 27.257 1.00 0.00 H -HETATM 1170 H2 HOH A 459 11.895 23.176 26.588 1.00 0.00 H -HETATM 1171 O HOH A 460 11.533 21.478 -4.909 1.00 61.19 O -HETATM 1172 H1 HOH A 460 11.125 21.466 -4.035 1.00 0.00 H -HETATM 1173 H2 HOH A 460 11.171 22.260 -5.324 1.00 0.00 H -HETATM 1174 O HOH A 461 -2.761 38.231 3.181 1.00 84.62 O -HETATM 1175 H1 HOH A 461 -1.871 38.468 3.455 1.00 0.00 H -HETATM 1176 H2 HOH A 461 -2.645 37.814 2.327 1.00 0.00 H -HETATM 1177 O HOH A 462 -5.015 39.320 4.311 1.00 88.70 O -HETATM 1178 H1 HOH A 462 -4.698 40.216 4.219 1.00 0.00 H -HETATM 1179 H2 HOH A 462 -4.298 38.779 3.950 1.00 0.00 H -HETATM 1180 O HOH A 463 10.179 21.307 3.687 1.00 49.11 O -HETATM 1181 H1 HOH A 463 9.722 21.057 4.495 1.00 0.00 H -HETATM 1182 H2 HOH A 463 11.079 20.973 3.815 1.00 0.00 H -HETATM 1183 O HOH A 464 -1.283 31.486 14.715 1.00 75.28 O -HETATM 1184 H1 HOH A 464 -0.458 31.251 14.289 1.00 0.00 H -HETATM 1185 H2 HOH A 464 -1.540 30.684 15.190 1.00 0.00 H -HETATM 1186 O HOH A 465 -3.174 28.185 6.783 1.00 76.66 O -HETATM 1187 H1 HOH A 465 -3.814 28.666 7.321 1.00 0.00 H -HETATM 1188 H2 HOH A 465 -3.169 28.650 5.944 1.00 0.00 H -HETATM 1189 O HOH A 466 -5.798 24.608 20.375 1.00 86.02 O -HETATM 1190 H1 HOH A 466 -5.419 23.785 20.680 1.00 0.00 H -HETATM 1191 H2 HOH A 466 -5.032 25.168 20.192 1.00 0.00 H -HETATM 1192 O HOH A 467 -10.433 22.178 -0.029 1.00 70.77 O -HETATM 1193 H1 HOH A 467 -10.696 21.582 0.672 1.00 0.00 H -HETATM 1194 H2 HOH A 467 -9.472 22.144 -0.019 1.00 0.00 H -HETATM 1195 O HOH A 468 -12.736 19.373 14.748 1.00 67.61 O -HETATM 1196 H1 HOH A 468 -13.404 19.567 14.089 1.00 0.00 H -HETATM 1197 H2 HOH A 468 -12.581 20.211 15.186 1.00 0.00 H -HETATM 1198 O HOH A 469 -12.719 15.279 19.686 1.00 72.04 O -HETATM 1199 H1 HOH A 469 -11.938 15.746 19.984 1.00 0.00 H -HETATM 1200 H2 HOH A 469 -12.734 14.477 20.208 1.00 0.00 H -HETATM 1201 O HOH A 470 14.152 20.306 23.565 1.00 67.11 O -HETATM 1202 H1 HOH A 470 14.822 20.685 24.137 1.00 0.00 H -HETATM 1203 H2 HOH A 470 14.616 19.594 23.101 1.00 0.00 H -HETATM 1204 O HOH A 471 13.538 23.641 18.923 1.00 71.61 O -HETATM 1205 H1 HOH A 471 13.182 23.149 18.177 1.00 0.00 H -HETATM 1206 H2 HOH A 471 13.920 22.968 19.489 1.00 0.00 H -HETATM 1207 O HOH A 472 -2.426 22.296 24.456 1.00 58.68 O -HETATM 1208 H1 HOH A 472 -1.824 21.550 24.486 1.00 0.00 H -HETATM 1209 H2 HOH A 472 -2.172 22.837 25.206 1.00 0.00 H -HETATM 1210 O HOH A 473 -4.196 19.616 27.496 1.00 73.73 O -HETATM 1211 H1 HOH A 473 -4.186 20.369 28.087 1.00 0.00 H -HETATM 1212 H2 HOH A 473 -3.490 19.052 27.815 1.00 0.00 H -HETATM 1213 O HOH A 474 -3.309 5.980 5.845 1.00 68.19 O -HETATM 1214 H1 HOH A 474 -3.838 5.345 6.332 1.00 0.00 H -HETATM 1215 H2 HOH A 474 -3.906 6.325 5.178 1.00 0.00 H -HETATM 1216 O HOH A 475 17.838 23.280 1.198 1.00 77.31 O -HETATM 1217 H1 HOH A 475 18.005 22.946 2.080 1.00 0.00 H -HETATM 1218 H2 HOH A 475 16.886 23.249 1.107 1.00 0.00 H -HETATM 1219 O HOH A 476 10.307 16.081 6.990 1.00 59.61 O -HETATM 1220 H1 HOH A 476 10.750 16.852 7.367 1.00 0.00 H -HETATM 1221 H2 HOH A 476 10.894 15.787 6.290 1.00 0.00 H -HETATM 1222 O HOH A 477 11.355 23.439 4.466 1.00 66.34 O -HETATM 1223 H1 HOH A 477 10.901 22.829 3.870 1.00 0.00 H -HETATM 1224 H2 HOH A 477 12.059 23.808 3.935 1.00 0.00 H -HETATM 1225 O HOH A 478 17.221 12.554 13.119 1.00 53.33 O -HETATM 1226 H1 HOH A 478 17.675 13.340 12.793 1.00 0.00 H -HETATM 1227 H2 HOH A 478 17.910 11.893 13.189 1.00 0.00 H -HETATM 1228 O HOH A 479 6.483 28.190 5.603 1.00 90.05 O -HETATM 1229 H1 HOH A 479 6.350 28.405 4.680 1.00 0.00 H -HETATM 1230 H2 HOH A 479 6.782 27.278 5.595 1.00 0.00 H -HETATM 1231 O HOH A 480 -1.050 28.108 4.394 1.00 85.46 O -HETATM 1232 H1 HOH A 480 -0.904 27.942 5.328 1.00 0.00 H -HETATM 1233 H2 HOH A 480 -0.405 28.792 4.169 1.00 0.00 H -HETATM 1234 O HOH A 481 7.764 6.413 14.803 1.00 47.44 O -HETATM 1235 H1 HOH A 481 7.927 7.153 15.390 1.00 0.00 H -HETATM 1236 H2 HOH A 481 7.543 6.819 13.965 1.00 0.00 H -HETATM 1237 O HOH A 482 -1.304 30.550 17.203 1.00 47.05 O -HETATM 1238 H1 HOH A 482 -2.121 30.831 17.619 1.00 0.00 H -HETATM 1239 H2 HOH A 482 -0.966 31.348 16.785 1.00 0.00 H -HETATM 1240 O HOH A 484 3.582 11.825 -5.019 1.00 54.04 O -HETATM 1241 H1 HOH A 484 4.118 12.609 -4.883 1.00 0.00 H -HETATM 1242 H2 HOH A 484 2.776 12.157 -5.424 1.00 0.00 H -HETATM 1243 O HOH A 485 10.477 17.818 1.534 1.00 52.39 O -HETATM 1244 H1 HOH A 485 10.080 18.415 0.889 1.00 0.00 H -HETATM 1245 H2 HOH A 485 11.050 18.380 2.054 1.00 0.00 H -HETATM 1246 O HOH A 486 8.350 13.220 -2.518 1.00 51.86 O -HETATM 1247 H1 HOH A 486 7.500 12.811 -2.685 1.00 0.00 H -HETATM 1248 H2 HOH A 486 8.871 13.018 -3.295 1.00 0.00 H -HETATM 1249 O HOH A 487 10.766 31.335 -1.067 1.00 53.16 O -HETATM 1250 H1 HOH A 487 9.819 31.209 -0.984 1.00 0.00 H -HETATM 1251 H2 HOH A 487 11.147 30.557 -0.661 1.00 0.00 H -HETATM 1252 O HOH A 488 -1.322 36.803 5.890 1.00 51.31 O -HETATM 1253 H1 HOH A 488 -2.260 36.695 6.053 1.00 0.00 H -HETATM 1254 H2 HOH A 488 -0.911 36.077 6.358 1.00 0.00 H -HETATM 1255 O HOH A 489 -8.558 12.902 5.180 1.00 53.15 O -HETATM 1256 H1 HOH A 489 -8.421 13.507 4.441 1.00 0.00 H -HETATM 1257 H2 HOH A 489 -9.446 12.564 5.045 1.00 0.00 H -MASTER 234 0 0 4 5 0 0 6 1256 1 0 8 -END +HEADER CELL CYCLE 29-JUL-98 1BM8 +TITLE DNA-BINDING DOMAIN OF MBP1 +COMPND MOL_ID: 1; +COMPND 2 MOLECULE: TRANSCRIPTION FACTOR MBP1; +COMPND 3 CHAIN: A; +COMPND 4 FRAGMENT: N-TERMINAL DNA-BINDING DOMAIN; +COMPND 5 SYNONYM: MCB (MLUI CELL-CYLE BOX) BINDING PROTEIN; +COMPND 6 ENGINEERED: YES +SOURCE MOL_ID: 1; +SOURCE 2 ORGANISM_SCIENTIFIC: SACCHAROMYCES CEREVISIAE; +SOURCE 3 ORGANISM_COMMON: BAKER'S YEAST; +SOURCE 4 ORGANISM_TAXID: 4932; +SOURCE 5 CELL_LINE: BL21; +SOURCE 6 EXPRESSION_SYSTEM: ESCHERICHIA COLI; +SOURCE 7 EXPRESSION_SYSTEM_TAXID: 562; +SOURCE 8 EXPRESSION_SYSTEM_STRAIN: BL21 (DE3) PLYSS; +SOURCE 9 EXPRESSION_SYSTEM_PLASMID: BL21 (DE3) PLYSS/PET43 +KEYWDS CELL CYCLE, CYCLINS, DNA SYNTHESIS, HELIX-TURN-HELIX DNA- +KEYWDS 2 BINDING DOMAIN, MULTIWAVELENGTH ANOMALOUS DIFFRACTION, +KEYWDS 3 TRANSCRIPTION FACTOR +EXPDTA X-RAY DIFFRACTION +AUTHOR R.-M.XU,C.KOCH,Y.LIU,J.R.HORTON,D.KNAPP,K.NASMYTH,X.CHENG +REVDAT 2 24-FEB-09 1BM8 1 VERSN +REVDAT 1 02-MAR-99 1BM8 0 +JRNL AUTH R.M.XU,C.KOCH,Y.LIU,J.R.HORTON,D.KNAPP,K.NASMYTH, +JRNL AUTH 2 X.CHENG +JRNL TITL CRYSTAL STRUCTURE OF THE DNA-BINDING DOMAIN OF +JRNL TITL 2 MBP1, A TRANSCRIPTION FACTOR IMPORTANT IN +JRNL TITL 3 CELL-CYCLE CONTROL OF DNA SYNTHESIS. +JRNL REF STRUCTURE V. 5 349 1997 +JRNL REFN ISSN 0969-2126 +JRNL PMID 9083114 +JRNL DOI 10.1016/S0969-2126(97)00192-5 +REMARK 1 +REMARK 2 +REMARK 2 RESOLUTION. 1.71 ANGSTROMS. +REMARK 3 +REMARK 3 REFINEMENT. +REMARK 3 PROGRAM : X-PLOR 3.851 +REMARK 3 AUTHORS : BRUNGER +REMARK 3 +REMARK 3 DATA USED IN REFINEMENT. +REMARK 3 RESOLUTION RANGE HIGH (ANGSTROMS) : 1.71 +REMARK 3 RESOLUTION RANGE LOW (ANGSTROMS) : 5.00 +REMARK 3 DATA CUTOFF (SIGMA(F)) : 0.000 +REMARK 3 DATA CUTOFF HIGH (ABS(F)) : NULL +REMARK 3 DATA CUTOFF LOW (ABS(F)) : NULL +REMARK 3 COMPLETENESS (WORKING+TEST) (%) : 93.6 +REMARK 3 NUMBER OF REFLECTIONS : 10273 +REMARK 3 +REMARK 3 FIT TO DATA USED IN REFINEMENT. +REMARK 3 CROSS-VALIDATION METHOD : NULL +REMARK 3 FREE R VALUE TEST SET SELECTION : RANDOM +REMARK 3 R VALUE (WORKING SET) : 0.197 +REMARK 3 FREE R VALUE : 0.261 +REMARK 3 FREE R VALUE TEST SET SIZE (%) : 10.000 +REMARK 3 FREE R VALUE TEST SET COUNT : NULL +REMARK 3 ESTIMATED ERROR OF FREE R VALUE : NULL +REMARK 3 +REMARK 3 FIT IN THE HIGHEST RESOLUTION BIN. +REMARK 3 TOTAL NUMBER OF BINS USED : 8 +REMARK 3 BIN RESOLUTION RANGE HIGH (A) : 1.71 +REMARK 3 BIN RESOLUTION RANGE LOW (A) : 1.78 +REMARK 3 BIN COMPLETENESS (WORKING+TEST) (%) : 34.10 +REMARK 3 REFLECTIONS IN BIN (WORKING SET) : 535 +REMARK 3 BIN R VALUE (WORKING SET) : 0.4020 +REMARK 3 BIN FREE R VALUE : 0.3350 +REMARK 3 BIN FREE R VALUE TEST SET SIZE (%) : 10.00 +REMARK 3 BIN FREE R VALUE TEST SET COUNT : NULL +REMARK 3 ESTIMATED ERROR OF BIN FREE R VALUE : NULL +REMARK 3 +REMARK 3 NUMBER OF NON-HYDROGEN ATOMS USED IN REFINEMENT. +REMARK 3 PROTEIN ATOMS : 812 +REMARK 3 NUCLEIC ACID ATOMS : 0 +REMARK 3 HETEROGEN ATOMS : 0 +REMARK 3 SOLVENT ATOMS : 66 +REMARK 3 +REMARK 3 B VALUES. +REMARK 3 FROM WILSON PLOT (A**2) : NULL +REMARK 3 MEAN B VALUE (OVERALL, A**2) : 36.00 +REMARK 3 OVERALL ANISOTROPIC B VALUE. +REMARK 3 B11 (A**2) : NULL +REMARK 3 B22 (A**2) : NULL +REMARK 3 B33 (A**2) : NULL +REMARK 3 B12 (A**2) : NULL +REMARK 3 B13 (A**2) : NULL +REMARK 3 B23 (A**2) : NULL +REMARK 3 +REMARK 3 ESTIMATED COORDINATE ERROR. +REMARK 3 ESD FROM LUZZATI PLOT (A) : NULL +REMARK 3 ESD FROM SIGMAA (A) : NULL +REMARK 3 LOW RESOLUTION CUTOFF (A) : 5.00 +REMARK 3 +REMARK 3 CROSS-VALIDATED ESTIMATED COORDINATE ERROR. +REMARK 3 ESD FROM C-V LUZZATI PLOT (A) : NULL +REMARK 3 ESD FROM C-V SIGMAA (A) : NULL +REMARK 3 +REMARK 3 RMS DEVIATIONS FROM IDEAL VALUES. +REMARK 3 BOND LENGTHS (A) : 0.009 +REMARK 3 BOND ANGLES (DEGREES) : 1.11 +REMARK 3 DIHEDRAL ANGLES (DEGREES) : 23.30 +REMARK 3 IMPROPER ANGLES (DEGREES) : 0.98 +REMARK 3 +REMARK 3 ISOTROPIC THERMAL MODEL : RESTRAINED +REMARK 3 +REMARK 3 ISOTROPIC THERMAL FACTOR RESTRAINTS. RMS SIGMA +REMARK 3 MAIN-CHAIN BOND (A**2) : NULL ; NULL +REMARK 3 MAIN-CHAIN ANGLE (A**2) : NULL ; NULL +REMARK 3 SIDE-CHAIN BOND (A**2) : NULL ; NULL +REMARK 3 SIDE-CHAIN ANGLE (A**2) : NULL ; NULL +REMARK 3 +REMARK 3 NCS MODEL : NULL +REMARK 3 +REMARK 3 NCS RESTRAINTS. RMS SIGMA/WEIGHT +REMARK 3 GROUP 1 POSITIONAL (A) : NULL ; NULL +REMARK 3 GROUP 1 B-FACTOR (A**2) : NULL ; NULL +REMARK 3 +REMARK 3 PARAMETER FILE 1 : PARHCSDX.PRO +REMARK 3 PARAMETER FILE 2 : NULL +REMARK 3 PARAMETER FILE 3 : NULL +REMARK 3 TOPOLOGY FILE 1 : TOPHCSDX.PRO +REMARK 3 TOPOLOGY FILE 2 : NULL +REMARK 3 TOPOLOGY FILE 3 : NULL +REMARK 3 +REMARK 3 OTHER REFINEMENT REMARKS: ISOTROPIC THERMAL FACTOR RESTRAINTS: +REMARK 3 36. (A**2) FOR MAIN-CHAIN BONDS AND 40.3 (A**2) FOR SIDE-CHAIN +REMARK 3 BONDS. +REMARK 4 +REMARK 4 1BM8 COMPLIES WITH FORMAT V. 3.15, 01-DEC-08 +REMARK 100 +REMARK 100 THIS ENTRY HAS BEEN PROCESSED BY BNL. +REMARK 200 +REMARK 200 EXPERIMENTAL DETAILS +REMARK 200 EXPERIMENT TYPE : X-RAY DIFFRACTION +REMARK 200 DATE OF DATA COLLECTION : JUN-96 +REMARK 200 TEMPERATURE (KELVIN) : 289 +REMARK 200 PH : 8.0 +REMARK 200 NUMBER OF CRYSTALS USED : 3 +REMARK 200 +REMARK 200 SYNCHROTRON (Y/N) : Y +REMARK 200 RADIATION SOURCE : NSLS +REMARK 200 BEAMLINE : X12C +REMARK 200 X-RAY GENERATOR MODEL : NULL +REMARK 200 MONOCHROMATIC OR LAUE (M/L) : M +REMARK 200 WAVELENGTH OR RANGE (A) : 0.96 +REMARK 200 MONOCHROMATOR : NI FILTER +REMARK 200 OPTICS : MIRRORS +REMARK 200 +REMARK 200 DETECTOR TYPE : IMAGE PLATE +REMARK 200 DETECTOR MANUFACTURER : RIGAKU RAXIS IIC +REMARK 200 INTENSITY-INTEGRATION SOFTWARE : DENZO +REMARK 200 DATA SCALING SOFTWARE : SCALEPACK +REMARK 200 +REMARK 200 NUMBER OF UNIQUE REFLECTIONS : 12811 +REMARK 200 RESOLUTION RANGE HIGH (A) : 1.700 +REMARK 200 RESOLUTION RANGE LOW (A) : 30.000 +REMARK 200 REJECTION CRITERIA (SIGMA(I)) : -3.000 +REMARK 200 +REMARK 200 OVERALL. +REMARK 200 COMPLETENESS FOR RANGE (%) : 93.6 +REMARK 200 DATA REDUNDANCY : 5.300 +REMARK 200 R MERGE (I) : 0.05200 +REMARK 200 R SYM (I) : NULL +REMARK 200 FOR THE DATA SET : 11.4000 +REMARK 200 +REMARK 200 IN THE HIGHEST RESOLUTION SHELL. +REMARK 200 HIGHEST RESOLUTION SHELL, RANGE HIGH (A) : 1.71 +REMARK 200 HIGHEST RESOLUTION SHELL, RANGE LOW (A) : 1.78 +REMARK 200 COMPLETENESS FOR SHELL (%) : 34.0 +REMARK 200 DATA REDUNDANCY IN SHELL : NULL +REMARK 200 R MERGE FOR SHELL (I) : NULL +REMARK 200 R SYM FOR SHELL (I) : NULL +REMARK 200 FOR SHELL : NULL +REMARK 200 +REMARK 200 DIFFRACTION PROTOCOL: NULL +REMARK 200 METHOD USED TO DETERMINE THE STRUCTURE: NULL +REMARK 200 SOFTWARE USED: PHASES +REMARK 200 STARTING MODEL: NULL +REMARK 200 +REMARK 200 REMARK: NULL +REMARK 280 +REMARK 280 CRYSTAL +REMARK 280 SOLVENT CONTENT, VS (%): 34.00 +REMARK 280 MATTHEWS COEFFICIENT, VM (ANGSTROMS**3/DA): 1.85 +REMARK 280 +REMARK 280 CRYSTALLIZATION CONDITIONS: PH 8.0 +REMARK 290 +REMARK 290 CRYSTALLOGRAPHIC SYMMETRY +REMARK 290 SYMMETRY OPERATORS FOR SPACE GROUP: P 41 21 2 +REMARK 290 +REMARK 290 SYMOP SYMMETRY +REMARK 290 NNNMMM OPERATOR +REMARK 290 1555 X,Y,Z +REMARK 290 2555 -X,-Y,Z+1/2 +REMARK 290 3555 -Y+1/2,X+1/2,Z+1/4 +REMARK 290 4555 Y+1/2,-X+1/2,Z+3/4 +REMARK 290 5555 -X+1/2,Y+1/2,-Z+1/4 +REMARK 290 6555 X+1/2,-Y+1/2,-Z+3/4 +REMARK 290 7555 Y,X,-Z +REMARK 290 8555 -Y,-X,-Z+1/2 +REMARK 290 +REMARK 290 WHERE NNN -> OPERATOR NUMBER +REMARK 290 MMM -> TRANSLATION VECTOR +REMARK 290 +REMARK 290 CRYSTALLOGRAPHIC SYMMETRY TRANSFORMATIONS +REMARK 290 THE FOLLOWING TRANSFORMATIONS OPERATE ON THE ATOM/HETATM +REMARK 290 RECORDS IN THIS ENTRY TO PRODUCE CRYSTALLOGRAPHICALLY +REMARK 290 RELATED MOLECULES. +REMARK 290 SMTRY1 1 1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY2 1 0.000000 1.000000 0.000000 0.00000 +REMARK 290 SMTRY3 1 0.000000 0.000000 1.000000 0.00000 +REMARK 290 SMTRY1 2 -1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY2 2 0.000000 -1.000000 0.000000 0.00000 +REMARK 290 SMTRY3 2 0.000000 0.000000 1.000000 62.11000 +REMARK 290 SMTRY1 3 0.000000 -1.000000 0.000000 21.67500 +REMARK 290 SMTRY2 3 1.000000 0.000000 0.000000 21.67500 +REMARK 290 SMTRY3 3 0.000000 0.000000 1.000000 31.05500 +REMARK 290 SMTRY1 4 0.000000 1.000000 0.000000 21.67500 +REMARK 290 SMTRY2 4 -1.000000 0.000000 0.000000 21.67500 +REMARK 290 SMTRY3 4 0.000000 0.000000 1.000000 93.16500 +REMARK 290 SMTRY1 5 -1.000000 0.000000 0.000000 21.67500 +REMARK 290 SMTRY2 5 0.000000 1.000000 0.000000 21.67500 +REMARK 290 SMTRY3 5 0.000000 0.000000 -1.000000 31.05500 +REMARK 290 SMTRY1 6 1.000000 0.000000 0.000000 21.67500 +REMARK 290 SMTRY2 6 0.000000 -1.000000 0.000000 21.67500 +REMARK 290 SMTRY3 6 0.000000 0.000000 -1.000000 93.16500 +REMARK 290 SMTRY1 7 0.000000 1.000000 0.000000 0.00000 +REMARK 290 SMTRY2 7 1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY3 7 0.000000 0.000000 -1.000000 0.00000 +REMARK 290 SMTRY1 8 0.000000 -1.000000 0.000000 0.00000 +REMARK 290 SMTRY2 8 -1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY3 8 0.000000 0.000000 -1.000000 62.11000 +REMARK 290 +REMARK 290 REMARK: NULL +REMARK 300 +REMARK 300 BIOMOLECULE: 1 +REMARK 300 SEE REMARK 350 FOR THE AUTHOR PROVIDED AND/OR PROGRAM +REMARK 300 GENERATED ASSEMBLY INFORMATION FOR THE STRUCTURE IN +REMARK 300 THIS ENTRY. THE REMARK MAY ALSO PROVIDE INFORMATION ON +REMARK 300 BURIED SURFACE AREA. +REMARK 350 +REMARK 350 COORDINATES FOR A COMPLETE MULTIMER REPRESENTING THE KNOWN +REMARK 350 BIOLOGICALLY SIGNIFICANT OLIGOMERIZATION STATE OF THE +REMARK 350 MOLECULE CAN BE GENERATED BY APPLYING BIOMT TRANSFORMATIONS +REMARK 350 GIVEN BELOW. BOTH NON-CRYSTALLOGRAPHIC AND +REMARK 350 CRYSTALLOGRAPHIC OPERATIONS ARE GIVEN. +REMARK 350 +REMARK 350 BIOMOLECULE: 1 +REMARK 350 AUTHOR DETERMINED BIOLOGICAL UNIT: MONOMERIC +REMARK 350 APPLY THE FOLLOWING TO CHAINS: A +REMARK 350 BIOMT1 1 1.000000 0.000000 0.000000 0.00000 +REMARK 350 BIOMT2 1 0.000000 1.000000 0.000000 0.00000 +REMARK 350 BIOMT3 1 0.000000 0.000000 1.000000 0.00000 +REMARK 525 +REMARK 525 SOLVENT +REMARK 525 +REMARK 525 THE SOLVENT MOLECULES HAVE CHAIN IDENTIFIERS THAT +REMARK 525 INDICATE THE POLYMER CHAIN WITH WHICH THEY ARE MOST +REMARK 525 CLOSELY ASSOCIATED. THE REMARK LISTS ALL THE SOLVENT +REMARK 525 MOLECULES WHICH ARE MORE THAN 5A AWAY FROM THE +REMARK 525 NEAREST POLYMER CHAIN (M = MODEL NUMBER; +REMARK 525 RES=RESIDUE NAME; C=CHAIN IDENTIFIER; SSEQ=SEQUENCE +REMARK 525 NUMBER; I=INSERTION CODE): +REMARK 525 +REMARK 525 M RES CSSEQI +REMARK 525 HOH A 459 DISTANCE = 6.67 ANGSTROMS +REMARK 525 HOH A 473 DISTANCE = 6.70 ANGSTROMS +DBREF 1BM8 A 4 102 UNP P39678 MBP1_YEAST 4 102 +SEQRES 1 A 99 GLN ILE TYR SER ALA ARG TYR SER GLY VAL ASP VAL TYR +SEQRES 2 A 99 GLU PHE ILE HIS SER THR GLY SER ILE MET LYS ARG LYS +SEQRES 3 A 99 LYS ASP ASP TRP VAL ASN ALA THR HIS ILE LEU LYS ALA +SEQRES 4 A 99 ALA ASN PHE ALA LYS ALA LYS ARG THR ARG ILE LEU GLU +SEQRES 5 A 99 LYS GLU VAL LEU LYS GLU THR HIS GLU LYS VAL GLN GLY +SEQRES 6 A 99 GLY PHE GLY LYS TYR GLN GLY THR TRP VAL PRO LEU ASN +SEQRES 7 A 99 ILE ALA LYS GLN LEU ALA GLU LYS PHE SER VAL TYR ASP +SEQRES 8 A 99 GLN LEU LYS PRO LEU PHE ASP PHE +FORMUL 2 HOH *83(H2 O) +HELIX 1 1 ALA A 36 ALA A 42 1 7 +HELIX 2 2 LYS A 47 GLU A 57 1 11 +HELIX 3 3 LEU A 80 LYS A 89 1 10 +HELIX 4 4 TYR A 93 PHE A 100 1 8 +SHEET 1 A 3 ILE A 5 TYR A 10 0 +SHEET 2 A 3 VAL A 13 ILE A 19 -1 N GLU A 17 O TYR A 6 +SHEET 3 A 3 SER A 24 ARG A 28 -1 N LYS A 27 O TYR A 16 +SHEET 1 B 2 GLU A 64 VAL A 66 0 +SHEET 2 B 2 GLY A 75 TRP A 77 -1 N TRP A 77 O GLU A 64 +CRYST1 43.350 43.350 124.220 90.00 90.00 90.00 P 41 21 2 8 +ORIGX1 1.000000 0.000000 0.000000 0.00000 +ORIGX2 0.000000 1.000000 0.000000 0.00000 +ORIGX3 0.000000 0.000000 1.000000 0.00000 +SCALE1 0.023068 0.000000 0.000000 0.00000 +SCALE2 0.000000 0.023068 0.000000 0.00000 +SCALE3 0.000000 0.000000 0.008050 0.00000 +ATOM 1 N GLN A 4 -0.991 4.920 14.982 1.00 52.28 N +ATOM 2 CA GLN A 4 -0.575 5.127 16.398 1.00 51.22 C +ATOM 3 C GLN A 4 0.344 6.335 16.538 1.00 48.16 C +ATOM 4 O GLN A 4 0.893 6.823 15.540 1.00 46.43 O +ATOM 5 CB GLN A 4 0.121 3.877 16.961 1.00 53.87 C +ATOM 6 CG GLN A 4 -0.797 3.008 17.820 1.00 57.21 C +ATOM 7 CD GLN A 4 -0.029 2.066 18.730 1.00 60.18 C +ATOM 8 OE1 GLN A 4 1.135 2.325 19.071 1.00 61.12 O +ATOM 9 NE2 GLN A 4 -0.673 0.970 19.131 1.00 61.27 N +ATOM 10 H1 GLN A 4 -1.493 5.767 14.644 1.00 0.00 H +ATOM 11 H2 GLN A 4 -0.148 4.764 14.393 1.00 0.00 H +ATOM 12 H3 GLN A 4 -1.618 4.097 14.918 1.00 0.00 H +ATOM 13 HE21 GLN A 4 -0.200 0.339 19.714 1.00 0.00 H +ATOM 14 HE22 GLN A 4 -1.594 0.835 18.832 1.00 0.00 H +ATOM 15 N ILE A 5 0.487 6.801 17.778 1.00 44.78 N +ATOM 16 CA ILE A 5 1.300 7.959 18.076 1.00 42.51 C +ATOM 17 C ILE A 5 2.358 7.589 19.087 1.00 40.28 C +ATOM 18 O ILE A 5 2.041 7.137 20.170 1.00 41.33 O +ATOM 19 CB ILE A 5 0.424 9.104 18.631 1.00 42.76 C +ATOM 20 CG1 ILE A 5 -0.582 9.523 17.557 1.00 44.06 C +ATOM 21 CG2 ILE A 5 1.281 10.293 19.056 1.00 43.55 C +ATOM 22 CD1 ILE A 5 -1.471 10.684 17.936 1.00 43.93 C +ATOM 23 H ILE A 5 0.039 6.338 18.519 1.00 0.00 H +ATOM 24 N TYR A 6 3.607 7.754 18.720 1.00 38.87 N +ATOM 25 CA TYR A 6 4.710 7.452 19.621 1.00 38.04 C +ATOM 26 C TYR A 6 5.273 8.733 20.218 1.00 34.53 C +ATOM 27 O TYR A 6 5.170 9.805 19.650 1.00 33.71 O +ATOM 28 CB TYR A 6 5.892 6.794 18.889 1.00 42.49 C +ATOM 29 CG TYR A 6 5.619 5.559 18.078 1.00 49.90 C +ATOM 30 CD1 TYR A 6 4.759 4.551 18.520 1.00 52.40 C +ATOM 31 CD2 TYR A 6 6.290 5.367 16.884 1.00 53.52 C +ATOM 32 CE1 TYR A 6 4.603 3.377 17.787 1.00 56.29 C +ATOM 33 CE2 TYR A 6 6.148 4.208 16.144 1.00 56.87 C +ATOM 34 CZ TYR A 6 5.307 3.211 16.595 1.00 58.22 C +ATOM 35 OH TYR A 6 5.213 2.023 15.883 1.00 62.12 O +ATOM 36 H TYR A 6 3.803 8.092 17.823 1.00 0.00 H +ATOM 37 HH TYR A 6 4.525 1.471 16.264 1.00 0.00 H +ATOM 38 N SER A 7 5.887 8.595 21.343 1.00 29.82 N +ATOM 39 CA SER A 7 6.641 9.658 21.907 1.00 27.41 C +ATOM 40 C SER A 7 8.065 9.484 21.365 1.00 25.27 C +ATOM 41 O SER A 7 8.573 8.364 21.336 1.00 24.52 O +ATOM 42 CB SER A 7 6.604 9.491 23.411 1.00 27.69 C +ATOM 43 OG SER A 7 7.393 10.446 24.052 1.00 34.18 O +ATOM 44 H SER A 7 5.839 7.737 21.817 1.00 0.00 H +ATOM 45 HG SER A 7 8.257 10.478 23.644 1.00 0.00 H +ATOM 46 N ALA A 8 8.709 10.555 20.901 1.00 23.35 N +ATOM 47 CA ALA A 8 10.071 10.423 20.364 1.00 20.99 C +ATOM 48 C ALA A 8 10.887 11.696 20.574 1.00 21.47 C +ATOM 49 O ALA A 8 10.370 12.693 21.084 1.00 21.33 O +ATOM 50 CB ALA A 8 10.016 10.075 18.875 1.00 20.24 C +ATOM 51 H ALA A 8 8.274 11.435 20.918 1.00 0.00 H +ATOM 52 N ARG A 9 12.163 11.644 20.207 1.00 21.36 N +ATOM 53 CA ARG A 9 13.054 12.817 20.318 1.00 23.94 C +ATOM 54 C ARG A 9 14.026 12.854 19.153 1.00 24.02 C +ATOM 55 O ARG A 9 14.629 11.831 18.835 1.00 22.48 O +ATOM 56 CB ARG A 9 13.864 12.818 21.615 1.00 24.91 C +ATOM 57 CG ARG A 9 14.921 13.922 21.647 1.00 28.68 C +ATOM 58 CD ARG A 9 15.735 13.904 22.931 1.00 31.98 C +ATOM 59 NE ARG A 9 14.979 14.426 24.042 1.00 35.74 N +ATOM 60 CZ ARG A 9 15.234 15.602 24.583 1.00 37.58 C +ATOM 61 NH1 ARG A 9 16.262 16.324 24.162 1.00 38.78 N +ATOM 62 NH2 ARG A 9 14.475 16.048 25.571 1.00 40.26 N +ATOM 63 H ARG A 9 12.518 10.810 19.832 1.00 0.00 H +ATOM 64 HE ARG A 9 14.250 13.885 24.413 1.00 0.00 H +ATOM 65 HH11 ARG A 9 16.855 15.976 23.436 1.00 0.00 H +ATOM 66 HH12 ARG A 9 16.446 17.220 24.568 1.00 0.00 H +ATOM 67 HH21 ARG A 9 13.711 15.495 25.906 1.00 0.00 H +ATOM 68 HH22 ARG A 9 14.657 16.944 25.977 1.00 0.00 H +ATOM 69 N TYR A 10 14.154 14.035 18.532 1.00 24.15 N +ATOM 70 CA TYR A 10 15.034 14.236 17.379 1.00 26.92 C +ATOM 71 C TYR A 10 15.730 15.585 17.504 1.00 28.93 C +ATOM 72 O TYR A 10 15.085 16.571 17.814 1.00 29.46 O +ATOM 73 CB TYR A 10 14.234 14.252 16.072 1.00 23.90 C +ATOM 74 CG TYR A 10 13.510 12.977 15.778 1.00 24.39 C +ATOM 75 CD1 TYR A 10 14.171 11.907 15.185 1.00 25.27 C +ATOM 76 CD2 TYR A 10 12.174 12.813 16.148 1.00 25.41 C +ATOM 77 CE1 TYR A 10 13.521 10.695 14.967 1.00 27.01 C +ATOM 78 CE2 TYR A 10 11.520 11.609 15.936 1.00 27.17 C +ATOM 79 CZ TYR A 10 12.196 10.556 15.346 1.00 26.47 C +ATOM 80 OH TYR A 10 11.540 9.379 15.101 1.00 27.96 O +ATOM 81 H TYR A 10 13.640 14.801 18.866 1.00 0.00 H +ATOM 82 HH TYR A 10 12.100 8.804 14.574 1.00 0.00 H +ATOM 83 N SER A 11 17.029 15.630 17.266 1.00 30.98 N +ATOM 84 CA SER A 11 17.751 16.893 17.349 1.00 32.54 C +ATOM 85 C SER A 11 17.509 17.599 18.695 1.00 32.28 C +ATOM 86 O SER A 11 17.377 18.827 18.737 1.00 33.57 O +ATOM 87 CB SER A 11 17.299 17.821 16.212 1.00 34.50 C +ATOM 88 OG SER A 11 17.469 17.220 14.934 1.00 39.12 O +ATOM 89 H SER A 11 17.508 14.810 17.019 1.00 0.00 H +ATOM 90 HG SER A 11 18.388 16.968 14.813 1.00 0.00 H +ATOM 91 N GLY A 12 17.410 16.826 19.780 1.00 30.27 N +ATOM 92 CA GLY A 12 17.187 17.403 21.099 1.00 27.72 C +ATOM 93 C GLY A 12 15.760 17.867 21.361 1.00 26.67 C +ATOM 94 O GLY A 12 15.474 18.436 22.414 1.00 28.11 O +ATOM 95 H GLY A 12 17.494 15.856 19.690 1.00 0.00 H +ATOM 96 N VAL A 13 14.855 17.590 20.434 1.00 25.00 N +ATOM 97 CA VAL A 13 13.459 18.045 20.539 1.00 22.39 C +ATOM 98 C VAL A 13 12.471 16.877 20.723 1.00 22.62 C +ATOM 99 O VAL A 13 12.494 15.913 19.959 1.00 21.65 O +ATOM 100 CB VAL A 13 13.075 18.819 19.253 1.00 21.97 C +ATOM 101 CG1 VAL A 13 11.652 19.334 19.343 1.00 18.81 C +ATOM 102 CG2 VAL A 13 14.057 19.964 19.042 1.00 22.24 C +ATOM 103 H VAL A 13 15.123 17.070 19.648 1.00 0.00 H +ATOM 104 N ASP A 14 11.617 16.976 21.734 1.00 21.41 N +ATOM 105 CA ASP A 14 10.622 15.950 22.003 1.00 21.86 C +ATOM 106 C ASP A 14 9.377 16.206 21.197 1.00 21.71 C +ATOM 107 O ASP A 14 8.837 17.312 21.204 1.00 20.60 O +ATOM 108 CB ASP A 14 10.237 15.913 23.494 1.00 24.96 C +ATOM 109 CG ASP A 14 11.414 15.636 24.396 1.00 25.52 C +ATOM 110 OD1 ASP A 14 12.057 14.597 24.232 1.00 27.41 O +ATOM 111 OD2 ASP A 14 11.704 16.473 25.257 1.00 30.85 O +ATOM 112 H ASP A 14 11.653 17.765 22.313 1.00 0.00 H +ATOM 113 N VAL A 15 8.897 15.168 20.550 1.00 21.11 N +ATOM 114 CA VAL A 15 7.740 15.281 19.686 1.00 20.99 C +ATOM 115 C VAL A 15 6.819 14.096 19.900 1.00 23.45 C +ATOM 116 O VAL A 15 7.178 13.132 20.595 1.00 24.63 O +ATOM 117 CB VAL A 15 8.149 15.282 18.166 1.00 19.89 C +ATOM 118 CG1 VAL A 15 9.103 16.420 17.854 1.00 16.46 C +ATOM 119 CG2 VAL A 15 8.795 13.934 17.785 1.00 18.59 C +ATOM 120 H VAL A 15 9.323 14.292 20.662 1.00 0.00 H +ATOM 121 N TYR A 16 5.632 14.216 19.339 1.00 24.96 N +ATOM 122 CA TYR A 16 4.726 13.114 19.215 1.00 26.21 C +ATOM 123 C TYR A 16 4.746 12.756 17.744 1.00 26.48 C +ATOM 124 O TYR A 16 4.631 13.643 16.884 1.00 25.01 O +ATOM 125 CB TYR A 16 3.314 13.507 19.644 1.00 29.28 C +ATOM 126 CG TYR A 16 3.170 13.632 21.144 1.00 32.30 C +ATOM 127 CD1 TYR A 16 3.375 12.530 21.959 1.00 34.32 C +ATOM 128 CD2 TYR A 16 2.859 14.843 21.746 1.00 33.14 C +ATOM 129 CE1 TYR A 16 3.272 12.625 23.332 1.00 36.05 C +ATOM 130 CE2 TYR A 16 2.755 14.950 23.125 1.00 35.60 C +ATOM 131 CZ TYR A 16 2.962 13.832 23.907 1.00 37.33 C +ATOM 132 OH TYR A 16 2.870 13.922 25.273 1.00 42.80 O +ATOM 133 H TYR A 16 5.364 15.082 18.983 1.00 0.00 H +ATOM 134 HH TYR A 16 3.304 13.159 25.678 1.00 0.00 H +ATOM 135 N GLU A 17 4.950 11.483 17.454 1.00 27.52 N +ATOM 136 CA GLU A 17 5.040 11.030 16.074 1.00 29.95 C +ATOM 137 C GLU A 17 3.841 10.167 15.709 1.00 30.66 C +ATOM 138 O GLU A 17 3.533 9.205 16.390 1.00 27.27 O +ATOM 139 CB GLU A 17 6.349 10.268 15.880 1.00 29.55 C +ATOM 140 CG GLU A 17 6.689 9.958 14.439 1.00 32.47 C +ATOM 141 CD GLU A 17 8.068 9.340 14.291 1.00 34.84 C +ATOM 142 OE1 GLU A 17 8.917 9.552 15.182 1.00 36.30 O +ATOM 143 OE2 GLU A 17 8.307 8.643 13.282 1.00 38.82 O +ATOM 144 H GLU A 17 5.048 10.834 18.179 1.00 0.00 H +ATOM 145 N PHE A 18 3.157 10.574 14.657 1.00 34.09 N +ATOM 146 CA PHE A 18 1.992 9.874 14.154 1.00 38.16 C +ATOM 147 C PHE A 18 2.404 9.093 12.906 1.00 40.68 C +ATOM 148 O PHE A 18 3.066 9.635 12.005 1.00 38.31 O +ATOM 149 CB PHE A 18 0.911 10.908 13.837 1.00 39.21 C +ATOM 150 CG PHE A 18 -0.309 10.396 13.139 1.00 43.44 C +ATOM 151 CD1 PHE A 18 -1.285 9.683 13.838 1.00 45.30 C +ATOM 152 CD2 PHE A 18 -0.520 10.684 11.789 1.00 45.30 C +ATOM 153 CE1 PHE A 18 -2.451 9.269 13.205 1.00 45.73 C +ATOM 154 CE2 PHE A 18 -1.682 10.275 11.146 1.00 46.28 C +ATOM 155 CZ PHE A 18 -2.651 9.568 11.854 1.00 46.51 C +ATOM 156 H PHE A 18 3.446 11.386 14.198 1.00 0.00 H +ATOM 157 N ILE A 19 2.060 7.813 12.875 1.00 43.87 N +ATOM 158 CA ILE A 19 2.451 6.970 11.756 1.00 47.64 C +ATOM 159 C ILE A 19 1.361 6.905 10.701 1.00 50.18 C +ATOM 160 O ILE A 19 0.316 6.280 10.907 1.00 50.83 O +ATOM 161 CB ILE A 19 2.787 5.548 12.208 1.00 48.13 C +ATOM 162 CG1 ILE A 19 3.734 5.597 13.406 1.00 49.26 C +ATOM 163 CG2 ILE A 19 3.425 4.793 11.061 1.00 48.27 C +ATOM 164 CD1 ILE A 19 5.016 6.356 13.140 1.00 51.27 C +ATOM 165 H ILE A 19 1.535 7.436 13.609 1.00 0.00 H +ATOM 166 N HIS A 20 1.623 7.574 9.587 1.00 52.47 N +ATOM 167 CA HIS A 20 0.710 7.602 8.461 1.00 54.63 C +ATOM 168 C HIS A 20 1.325 6.738 7.359 1.00 54.62 C +ATOM 169 O HIS A 20 2.518 6.415 7.424 1.00 54.75 O +ATOM 170 CB HIS A 20 0.553 9.056 7.990 1.00 57.40 C +ATOM 171 CG HIS A 20 -0.664 9.340 7.157 1.00 60.64 C +ATOM 172 ND1 HIS A 20 -0.604 9.703 5.820 1.00 61.69 N +ATOM 173 CD2 HIS A 20 -1.991 9.341 7.470 1.00 61.84 C +ATOM 174 CE1 HIS A 20 -1.811 9.917 5.323 1.00 62.25 C +ATOM 175 NE2 HIS A 20 -2.653 9.699 6.317 1.00 63.47 N +ATOM 176 H HIS A 20 2.472 8.058 9.517 1.00 0.00 H +ATOM 177 HD1 HIS A 20 0.226 9.797 5.306 1.00 0.00 H +ATOM 178 HE2 HIS A 20 -3.628 9.768 6.238 1.00 0.00 H +ATOM 179 N SER A 21 0.535 6.358 6.354 1.00 54.36 N +ATOM 180 CA SER A 21 1.057 5.528 5.265 1.00 52.80 C +ATOM 181 C SER A 21 2.204 6.221 4.504 1.00 52.38 C +ATOM 182 O SER A 21 3.242 5.606 4.237 1.00 51.68 O +ATOM 183 CB SER A 21 -0.081 5.142 4.322 1.00 51.54 C +ATOM 184 OG SER A 21 -0.940 6.237 4.107 1.00 51.51 O +ATOM 185 H SER A 21 -0.408 6.625 6.348 1.00 0.00 H +ATOM 186 HG SER A 21 -1.720 5.940 3.628 1.00 0.00 H +ATOM 187 N THR A 22 2.030 7.509 4.195 1.00 52.22 N +ATOM 188 CA THR A 22 3.058 8.284 3.475 1.00 52.84 C +ATOM 189 C THR A 22 4.294 8.548 4.334 1.00 50.76 C +ATOM 190 O THR A 22 5.358 8.913 3.827 1.00 50.70 O +ATOM 191 CB THR A 22 2.503 9.648 3.031 1.00 54.77 C +ATOM 192 OG1 THR A 22 1.746 10.224 4.115 1.00 57.43 O +ATOM 193 CG2 THR A 22 1.604 9.504 1.816 1.00 56.57 C +ATOM 194 H THR A 22 1.193 7.951 4.445 1.00 0.00 H +ATOM 195 HG1 THR A 22 1.603 11.155 3.928 1.00 0.00 H +ATOM 196 N GLY A 23 4.142 8.376 5.635 1.00 49.11 N +ATOM 197 CA GLY A 23 5.238 8.640 6.541 1.00 45.68 C +ATOM 198 C GLY A 23 4.739 9.133 7.876 1.00 43.53 C +ATOM 199 O GLY A 23 3.521 9.157 8.138 1.00 42.97 O +ATOM 200 H GLY A 23 3.287 8.054 5.988 1.00 0.00 H +ATOM 201 N SER A 24 5.655 9.533 8.719 1.00 40.66 N +ATOM 202 CA SER A 24 5.279 10.004 10.026 1.00 38.67 C +ATOM 203 C SER A 24 5.066 11.517 10.046 1.00 36.42 C +ATOM 204 O SER A 24 5.714 12.267 9.291 1.00 34.95 O +ATOM 205 CB SER A 24 6.335 9.598 11.029 1.00 39.09 C +ATOM 206 OG SER A 24 7.622 9.743 10.472 1.00 44.40 O +ATOM 207 H SER A 24 6.597 9.521 8.458 1.00 0.00 H +ATOM 208 HG SER A 24 7.777 9.032 9.837 1.00 0.00 H +ATOM 209 N ILE A 25 4.129 11.946 10.890 1.00 32.56 N +ATOM 210 CA ILE A 25 3.824 13.356 11.064 1.00 29.27 C +ATOM 211 C ILE A 25 4.108 13.725 12.516 1.00 27.24 C +ATOM 212 O ILE A 25 3.698 13.017 13.431 1.00 26.25 O +ATOM 213 CB ILE A 25 2.354 13.628 10.682 1.00 30.38 C +ATOM 214 CG1 ILE A 25 2.172 13.204 9.219 1.00 33.50 C +ATOM 215 CG2 ILE A 25 2.011 15.105 10.843 1.00 28.01 C +ATOM 216 CD1 ILE A 25 0.746 13.027 8.780 1.00 35.33 C +ATOM 217 H ILE A 25 3.628 11.287 11.414 1.00 0.00 H +ATOM 218 N MET A 26 4.821 14.815 12.713 1.00 24.03 N +ATOM 219 CA MET A 26 5.282 15.188 14.040 1.00 22.95 C +ATOM 220 C MET A 26 4.649 16.463 14.576 1.00 23.00 C +ATOM 221 O MET A 26 4.398 17.426 13.832 1.00 19.80 O +ATOM 222 CB MET A 26 6.800 15.397 14.034 1.00 22.54 C +ATOM 223 CG MET A 26 7.632 14.152 13.821 1.00 22.25 C +ATOM 224 SD MET A 26 9.393 14.520 13.783 1.00 27.59 S +ATOM 225 CE MET A 26 10.026 13.008 13.046 1.00 27.15 C +ATOM 226 H MET A 26 5.012 15.401 11.961 1.00 0.00 H +ATOM 227 N LYS A 27 4.443 16.453 15.891 1.00 23.73 N +ATOM 228 CA LYS A 27 3.998 17.625 16.632 1.00 23.46 C +ATOM 229 C LYS A 27 4.942 17.793 17.828 1.00 22.79 C +ATOM 230 O LYS A 27 5.244 16.813 18.522 1.00 22.50 O +ATOM 231 CB LYS A 27 2.550 17.459 17.133 1.00 24.99 C +ATOM 232 CG LYS A 27 2.055 18.665 17.923 1.00 27.08 C +ATOM 233 CD LYS A 27 0.574 18.594 18.223 1.00 29.52 C +ATOM 234 CE LYS A 27 0.272 17.523 19.243 1.00 32.06 C +ATOM 235 NZ LYS A 27 -1.178 17.499 19.580 1.00 35.59 N +ATOM 236 H LYS A 27 4.599 15.620 16.384 1.00 0.00 H +ATOM 237 HZ1 LYS A 27 -1.732 17.319 18.719 1.00 0.00 H +ATOM 238 HZ2 LYS A 27 -1.359 16.745 20.272 1.00 0.00 H +ATOM 239 HZ3 LYS A 27 -1.452 18.414 19.986 1.00 0.00 H +ATOM 240 N ARG A 28 5.455 19.003 18.033 1.00 21.34 N +ATOM 241 CA ARG A 28 6.361 19.253 19.141 1.00 21.22 C +ATOM 242 C ARG A 28 5.615 19.292 20.464 1.00 20.99 C +ATOM 243 O ARG A 28 4.534 19.902 20.557 1.00 20.62 O +ATOM 244 CB ARG A 28 7.090 20.582 18.971 1.00 20.55 C +ATOM 245 CG ARG A 28 8.119 20.580 17.884 1.00 23.75 C +ATOM 246 CD ARG A 28 9.092 21.725 18.053 1.00 24.37 C +ATOM 247 NE ARG A 28 8.452 23.024 17.897 1.00 22.21 N +ATOM 248 CZ ARG A 28 8.906 23.947 17.062 1.00 22.16 C +ATOM 249 NH1 ARG A 28 9.932 23.686 16.260 1.00 21.40 N +ATOM 250 NH2 ARG A 28 8.314 25.124 17.006 1.00 22.10 N +ATOM 251 H ARG A 28 5.216 19.737 17.429 1.00 0.00 H +ATOM 252 HE ARG A 28 7.659 23.223 18.432 1.00 0.00 H +ATOM 253 HH11 ARG A 28 10.372 22.788 16.284 1.00 0.00 H +ATOM 254 HH12 ARG A 28 10.278 24.394 15.642 1.00 0.00 H +ATOM 255 HH21 ARG A 28 7.520 25.312 17.581 1.00 0.00 H +ATOM 256 HH22 ARG A 28 8.657 25.824 16.379 1.00 0.00 H +ATOM 257 N LYS A 29 6.215 18.701 21.488 1.00 20.40 N +ATOM 258 CA LYS A 29 5.601 18.678 22.813 1.00 22.71 C +ATOM 259 C LYS A 29 5.623 20.043 23.491 1.00 22.45 C +ATOM 260 O LYS A 29 4.669 20.397 24.190 1.00 21.87 O +ATOM 261 CB LYS A 29 6.298 17.668 23.723 1.00 25.87 C +ATOM 262 CG LYS A 29 6.214 16.228 23.225 1.00 31.52 C +ATOM 263 CD LYS A 29 6.749 15.268 24.259 1.00 32.96 C +ATOM 264 CE LYS A 29 6.701 13.831 23.781 1.00 33.83 C +ATOM 265 NZ LYS A 29 7.106 12.908 24.868 1.00 35.21 N +ATOM 266 H LYS A 29 7.088 18.274 21.356 1.00 0.00 H +ATOM 267 HZ1 LYS A 29 6.552 13.117 25.721 1.00 0.00 H +ATOM 268 HZ2 LYS A 29 6.929 11.933 24.575 1.00 0.00 H +ATOM 269 HZ3 LYS A 29 8.116 13.033 25.071 1.00 0.00 H +ATOM 270 N LYS A 30 6.693 20.822 23.275 1.00 21.91 N +ATOM 271 CA LYS A 30 6.818 22.108 23.970 1.00 22.50 C +ATOM 272 C LYS A 30 5.797 23.154 23.535 1.00 22.00 C +ATOM 273 O LYS A 30 5.348 23.925 24.374 1.00 21.27 O +ATOM 274 CB LYS A 30 8.230 22.683 23.839 1.00 23.91 C +ATOM 275 CG LYS A 30 8.602 23.159 22.448 1.00 30.91 C +ATOM 276 CD LYS A 30 10.047 23.652 22.422 1.00 35.19 C +ATOM 277 CE LYS A 30 10.510 24.019 21.007 1.00 36.53 C +ATOM 278 NZ LYS A 30 9.871 25.274 20.519 1.00 36.17 N +ATOM 279 H LYS A 30 7.397 20.528 22.662 1.00 0.00 H +ATOM 280 HZ1 LYS A 30 8.838 25.181 20.585 1.00 0.00 H +ATOM 281 HZ2 LYS A 30 10.185 26.073 21.106 1.00 0.00 H +ATOM 282 HZ3 LYS A 30 10.142 25.441 19.531 1.00 0.00 H +ATOM 283 N ASP A 31 5.401 23.183 22.245 1.00 18.95 N +ATOM 284 CA ASP A 31 4.499 24.232 21.794 1.00 20.45 C +ATOM 285 C ASP A 31 3.382 23.785 20.872 1.00 21.56 C +ATOM 286 O ASP A 31 2.634 24.636 20.361 1.00 23.45 O +ATOM 287 CB ASP A 31 5.298 25.339 21.113 1.00 21.42 C +ATOM 288 CG ASP A 31 6.231 24.825 20.027 1.00 26.39 C +ATOM 289 OD1 ASP A 31 6.013 23.695 19.518 1.00 25.20 O +ATOM 290 OD2 ASP A 31 7.181 25.546 19.686 1.00 24.41 O +ATOM 291 H ASP A 31 5.715 22.499 21.621 1.00 0.00 H +ATOM 292 N ASP A 32 3.265 22.484 20.634 1.00 21.07 N +ATOM 293 CA ASP A 32 2.221 21.961 19.749 1.00 21.22 C +ATOM 294 C ASP A 32 2.374 22.381 18.293 1.00 20.57 C +ATOM 295 O ASP A 32 1.426 22.253 17.511 1.00 22.37 O +ATOM 296 CB ASP A 32 0.809 22.358 20.226 1.00 23.08 C +ATOM 297 CG ASP A 32 0.375 21.651 21.495 1.00 25.24 C +ATOM 298 OD1 ASP A 32 1.027 20.663 21.882 1.00 26.63 O +ATOM 299 OD2 ASP A 32 -0.615 22.083 22.104 1.00 26.97 O +ATOM 300 H ASP A 32 3.881 21.858 21.068 1.00 0.00 H +ATOM 301 N TRP A 33 3.525 22.886 17.903 1.00 18.75 N +ATOM 302 CA TRP A 33 3.708 23.213 16.488 1.00 20.17 C +ATOM 303 C TRP A 33 3.768 21.917 15.706 1.00 20.21 C +ATOM 304 O TRP A 33 4.182 20.893 16.259 1.00 20.80 O +ATOM 305 CB TRP A 33 4.991 24.009 16.266 1.00 20.31 C +ATOM 306 CG TRP A 33 4.872 25.450 16.661 1.00 22.77 C +ATOM 307 CD1 TRP A 33 4.129 25.972 17.696 1.00 23.36 C +ATOM 308 CD2 TRP A 33 5.470 26.570 15.984 1.00 23.95 C +ATOM 309 NE1 TRP A 33 4.240 27.334 17.673 1.00 22.96 N +ATOM 310 CE2 TRP A 33 5.046 27.743 16.657 1.00 22.56 C +ATOM 311 CE3 TRP A 33 6.318 26.696 14.877 1.00 22.29 C +ATOM 312 CZ2 TRP A 33 5.442 29.023 16.257 1.00 24.90 C +ATOM 313 CZ3 TRP A 33 6.702 27.969 14.481 1.00 25.00 C +ATOM 314 CH2 TRP A 33 6.268 29.117 15.169 1.00 24.02 C +ATOM 315 H TRP A 33 4.245 23.030 18.542 1.00 0.00 H +ATOM 316 HE1 TRP A 33 3.780 27.938 18.295 1.00 0.00 H +ATOM 317 N VAL A 34 3.368 21.950 14.440 1.00 20.68 N +ATOM 318 CA VAL A 34 3.355 20.734 13.613 1.00 18.96 C +ATOM 319 C VAL A 34 4.219 20.947 12.371 1.00 20.18 C +ATOM 320 O VAL A 34 4.331 22.074 11.871 1.00 18.53 O +ATOM 321 CB VAL A 34 1.892 20.385 13.183 1.00 20.63 C +ATOM 322 CG1 VAL A 34 1.843 19.102 12.349 1.00 17.40 C +ATOM 323 CG2 VAL A 34 1.006 20.252 14.422 1.00 19.03 C +ATOM 324 H VAL A 34 3.075 22.803 14.050 1.00 0.00 H +ATOM 325 N ASN A 35 4.858 19.876 11.891 1.00 18.57 N +ATOM 326 CA ASN A 35 5.684 19.962 10.692 1.00 18.84 C +ATOM 327 C ASN A 35 4.771 20.026 9.459 1.00 19.27 C +ATOM 328 O ASN A 35 4.149 19.040 9.101 1.00 20.41 O +ATOM 329 CB ASN A 35 6.607 18.737 10.627 1.00 18.29 C +ATOM 330 CG ASN A 35 7.711 18.858 9.586 1.00 19.87 C +ATOM 331 OD1 ASN A 35 7.497 19.373 8.481 1.00 23.76 O +ATOM 332 ND2 ASN A 35 8.909 18.410 9.922 1.00 17.21 N +ATOM 333 H ASN A 35 4.769 19.017 12.356 1.00 0.00 H +ATOM 334 N ALA A 36 4.686 21.185 8.820 1.00 18.30 N +ATOM 335 CA ALA A 36 3.779 21.366 7.681 1.00 20.19 C +ATOM 336 C ALA A 36 4.218 20.577 6.451 1.00 20.67 C +ATOM 337 O ALA A 36 3.395 20.256 5.596 1.00 21.70 O +ATOM 338 CB ALA A 36 3.662 22.854 7.326 1.00 20.68 C +ATOM 339 H ALA A 36 5.227 21.939 9.126 1.00 0.00 H +ATOM 340 N THR A 37 5.520 20.304 6.337 1.00 20.05 N +ATOM 341 CA THR A 37 6.027 19.490 5.233 1.00 21.46 C +ATOM 342 C THR A 37 5.430 18.061 5.316 1.00 23.26 C +ATOM 343 O THR A 37 5.035 17.455 4.301 1.00 22.30 O +ATOM 344 CB THR A 37 7.565 19.411 5.296 1.00 22.61 C +ATOM 345 OG1 THR A 37 8.110 20.735 5.383 1.00 21.49 O +ATOM 346 CG2 THR A 37 8.117 18.703 4.063 1.00 24.86 C +ATOM 347 H THR A 37 6.144 20.670 6.994 1.00 0.00 H +ATOM 348 HG1 THR A 37 7.816 21.252 4.621 1.00 0.00 H +ATOM 349 N HIS A 38 5.356 17.534 6.551 1.00 22.61 N +ATOM 350 CA HIS A 38 4.747 16.236 6.788 1.00 22.32 C +ATOM 351 C HIS A 38 3.266 16.262 6.404 1.00 23.66 C +ATOM 352 O HIS A 38 2.720 15.268 5.928 1.00 24.58 O +ATOM 353 CB HIS A 38 4.859 15.863 8.257 1.00 20.45 C +ATOM 354 CG HIS A 38 6.246 15.623 8.731 1.00 20.07 C +ATOM 355 ND1 HIS A 38 6.563 15.505 10.070 1.00 19.75 N +ATOM 356 CD2 HIS A 38 7.419 15.519 8.069 1.00 20.62 C +ATOM 357 CE1 HIS A 38 7.858 15.336 10.243 1.00 21.58 C +ATOM 358 NE2 HIS A 38 8.380 15.347 9.033 1.00 21.07 N +ATOM 359 H HIS A 38 5.719 18.035 7.308 1.00 0.00 H +ATOM 360 HD1 HIS A 38 5.914 15.546 10.794 1.00 0.00 H +ATOM 361 HE2 HIS A 38 9.344 15.267 8.845 1.00 0.00 H +ATOM 362 N ILE A 39 2.600 17.377 6.659 1.00 22.79 N +ATOM 363 CA ILE A 39 1.189 17.509 6.277 1.00 25.79 C +ATOM 364 C ILE A 39 1.049 17.441 4.739 1.00 27.01 C +ATOM 365 O ILE A 39 0.113 16.832 4.209 1.00 27.50 O +ATOM 366 CB ILE A 39 0.593 18.857 6.784 1.00 25.78 C +ATOM 367 CG1 ILE A 39 0.451 18.822 8.308 1.00 25.82 C +ATOM 368 CG2 ILE A 39 -0.753 19.136 6.133 1.00 25.83 C +ATOM 369 CD1 ILE A 39 -0.033 20.127 8.900 1.00 26.05 C +ATOM 370 H ILE A 39 3.050 18.121 7.112 1.00 0.00 H +ATOM 371 N LEU A 40 1.986 18.075 4.038 1.00 27.04 N +ATOM 372 CA LEU A 40 1.953 18.101 2.581 1.00 28.05 C +ATOM 373 C LEU A 40 2.329 16.742 1.996 1.00 28.75 C +ATOM 374 O LEU A 40 1.788 16.329 0.960 1.00 29.82 O +ATOM 375 CB LEU A 40 2.879 19.202 2.054 1.00 27.15 C +ATOM 376 CG LEU A 40 2.515 20.627 2.472 1.00 27.87 C +ATOM 377 CD1 LEU A 40 3.470 21.612 1.841 1.00 26.87 C +ATOM 378 CD2 LEU A 40 1.078 20.936 2.072 1.00 27.13 C +ATOM 379 H LEU A 40 2.709 18.541 4.512 1.00 0.00 H +ATOM 380 N LYS A 41 3.242 16.043 2.643 1.00 29.67 N +ATOM 381 CA LYS A 41 3.570 14.693 2.203 1.00 32.88 C +ATOM 382 C LYS A 41 2.353 13.772 2.380 1.00 32.92 C +ATOM 383 O LYS A 41 2.113 12.887 1.562 1.00 33.65 O +ATOM 384 CB LYS A 41 4.764 14.129 2.980 1.00 35.05 C +ATOM 385 CG LYS A 41 6.078 14.828 2.690 1.00 40.79 C +ATOM 386 CD LYS A 41 7.262 14.033 3.222 1.00 45.43 C +ATOM 387 CE LYS A 41 8.571 14.734 2.889 1.00 49.42 C +ATOM 388 NZ LYS A 41 9.755 13.979 3.371 1.00 52.09 N +ATOM 389 H LYS A 41 3.699 16.431 3.415 1.00 0.00 H +ATOM 390 HZ1 LYS A 41 9.699 13.866 4.403 1.00 0.00 H +ATOM 391 HZ2 LYS A 41 9.776 13.041 2.920 1.00 0.00 H +ATOM 392 HZ3 LYS A 41 10.619 14.502 3.124 1.00 0.00 H +ATOM 393 N ALA A 42 1.581 13.997 3.446 1.00 32.20 N +ATOM 394 CA ALA A 42 0.382 13.209 3.702 1.00 32.15 C +ATOM 395 C ALA A 42 -0.678 13.434 2.618 1.00 33.55 C +ATOM 396 O ALA A 42 -1.459 12.535 2.319 1.00 33.31 O +ATOM 397 CB ALA A 42 -0.179 13.540 5.083 1.00 31.12 C +ATOM 398 H ALA A 42 1.831 14.705 4.078 1.00 0.00 H +ATOM 399 N ALA A 43 -0.704 14.637 2.027 1.00 34.01 N +ATOM 400 CA ALA A 43 -1.639 14.935 0.940 1.00 34.26 C +ATOM 401 C ALA A 43 -1.164 14.317 -0.400 1.00 35.09 C +ATOM 402 O ALA A 43 -1.780 14.532 -1.444 1.00 36.00 O +ATOM 403 CB ALA A 43 -1.812 16.443 0.800 1.00 32.11 C +ATOM 404 H ALA A 43 -0.088 15.334 2.334 1.00 0.00 H +ATOM 405 N ASN A 44 -0.054 13.575 -0.350 1.00 35.94 N +ATOM 406 CA ASN A 44 0.485 12.867 -1.520 1.00 37.87 C +ATOM 407 C ASN A 44 1.070 13.799 -2.591 1.00 36.65 C +ATOM 408 O ASN A 44 1.132 13.449 -3.777 1.00 37.27 O +ATOM 409 CB ASN A 44 -0.587 11.961 -2.122 1.00 41.40 C +ATOM 410 CG ASN A 44 -1.094 10.943 -1.116 1.00 46.56 C +ATOM 411 OD1 ASN A 44 -2.261 10.973 -0.701 1.00 49.78 O +ATOM 412 ND2 ASN A 44 -0.215 10.039 -0.707 1.00 48.00 N +ATOM 413 H ASN A 44 0.421 13.500 0.500 1.00 0.00 H +ATOM 414 HD21 ASN A 44 -0.504 9.368 -0.057 1.00 0.00 H +ATOM 415 HD22 ASN A 44 0.693 10.076 -1.076 1.00 0.00 H +ATOM 416 N PHE A 45 1.542 14.961 -2.165 1.00 33.67 N +ATOM 417 CA PHE A 45 2.126 15.914 -3.079 1.00 31.23 C +ATOM 418 C PHE A 45 3.596 15.632 -3.306 1.00 31.80 C +ATOM 419 O PHE A 45 4.332 15.338 -2.381 1.00 32.20 O +ATOM 420 CB PHE A 45 1.945 17.322 -2.540 1.00 31.12 C +ATOM 421 CG PHE A 45 0.517 17.781 -2.553 1.00 33.41 C +ATOM 422 CD1 PHE A 45 -0.390 17.273 -3.496 1.00 32.61 C +ATOM 423 CD2 PHE A 45 0.076 18.765 -1.663 1.00 33.98 C +ATOM 424 CE1 PHE A 45 -1.696 17.732 -3.548 1.00 32.35 C +ATOM 425 CE2 PHE A 45 -1.239 19.230 -1.713 1.00 34.17 C +ATOM 426 CZ PHE A 45 -2.122 18.716 -2.658 1.00 33.76 C +ATOM 427 H PHE A 45 1.504 15.175 -1.209 1.00 0.00 H +ATOM 428 N ALA A 46 4.016 15.712 -4.549 1.00 31.48 N +ATOM 429 CA ALA A 46 5.402 15.509 -4.899 1.00 30.26 C +ATOM 430 C ALA A 46 6.235 16.683 -4.414 1.00 30.35 C +ATOM 431 O ALA A 46 5.724 17.782 -4.212 1.00 28.10 O +ATOM 432 CB ALA A 46 5.546 15.368 -6.420 1.00 30.02 C +ATOM 433 H ALA A 46 3.373 15.924 -5.256 1.00 0.00 H +ATOM 434 N LYS A 47 7.531 16.442 -4.304 1.00 32.10 N +ATOM 435 CA LYS A 47 8.483 17.418 -3.792 1.00 32.24 C +ATOM 436 C LYS A 47 8.395 18.800 -4.429 1.00 30.73 C +ATOM 437 O LYS A 47 8.277 19.801 -3.722 1.00 30.50 O +ATOM 438 CB LYS A 47 9.899 16.853 -3.944 1.00 37.40 C +ATOM 439 CG LYS A 47 10.972 17.841 -3.565 1.00 42.56 C +ATOM 440 CD LYS A 47 12.341 17.207 -3.556 1.00 46.91 C +ATOM 441 CE LYS A 47 13.321 18.163 -2.910 1.00 50.20 C +ATOM 442 NZ LYS A 47 12.820 18.645 -1.584 1.00 52.19 N +ATOM 443 H LYS A 47 7.867 15.565 -4.578 1.00 0.00 H +ATOM 444 HZ1 LYS A 47 12.666 17.831 -0.956 1.00 0.00 H +ATOM 445 HZ2 LYS A 47 13.522 19.283 -1.159 1.00 0.00 H +ATOM 446 HZ3 LYS A 47 11.922 19.155 -1.715 1.00 0.00 H +ATOM 447 N ALA A 48 8.475 18.884 -5.757 1.00 29.18 N +ATOM 448 CA ALA A 48 8.416 20.192 -6.406 1.00 27.07 C +ATOM 449 C ALA A 48 7.120 20.934 -6.061 1.00 26.43 C +ATOM 450 O ALA A 48 7.125 22.153 -5.856 1.00 26.30 O +ATOM 451 CB ALA A 48 8.549 20.032 -7.907 1.00 27.43 C +ATOM 452 H ALA A 48 8.573 18.072 -6.295 1.00 0.00 H +ATOM 453 N LYS A 49 6.004 20.204 -5.990 1.00 25.81 N +ATOM 454 CA LYS A 49 4.739 20.835 -5.644 1.00 25.14 C +ATOM 455 C LYS A 49 4.708 21.228 -4.149 1.00 26.02 C +ATOM 456 O LYS A 49 4.271 22.333 -3.807 1.00 26.28 O +ATOM 457 CB LYS A 49 3.557 19.911 -5.998 1.00 23.26 C +ATOM 458 CG LYS A 49 2.204 20.550 -5.749 1.00 21.88 C +ATOM 459 CD LYS A 49 1.068 19.673 -6.205 1.00 21.75 C +ATOM 460 CE LYS A 49 -0.261 20.341 -5.886 1.00 23.25 C +ATOM 461 NZ LYS A 49 -1.431 19.580 -6.417 1.00 25.36 N +ATOM 462 H LYS A 49 6.035 19.244 -6.171 1.00 0.00 H +ATOM 463 HZ1 LYS A 49 -1.317 19.440 -7.442 1.00 0.00 H +ATOM 464 HZ2 LYS A 49 -1.486 18.656 -5.945 1.00 0.00 H +ATOM 465 HZ3 LYS A 49 -2.302 20.115 -6.235 1.00 0.00 H +ATOM 466 N ARG A 50 5.175 20.346 -3.257 1.00 26.65 N +ATOM 467 CA ARG A 50 5.214 20.698 -1.829 1.00 28.25 C +ATOM 468 C ARG A 50 6.004 21.993 -1.639 1.00 29.71 C +ATOM 469 O ARG A 50 5.571 22.889 -0.911 1.00 29.79 O +ATOM 470 CB ARG A 50 5.861 19.596 -0.974 1.00 28.86 C +ATOM 471 CG ARG A 50 5.095 18.281 -0.903 1.00 29.69 C +ATOM 472 CD ARG A 50 5.631 17.384 0.212 1.00 31.10 C +ATOM 473 NE ARG A 50 7.081 17.183 0.132 1.00 33.71 N +ATOM 474 CZ ARG A 50 7.649 16.086 -0.374 1.00 32.93 C +ATOM 475 NH1 ARG A 50 6.913 15.086 -0.812 1.00 33.08 N +ATOM 476 NH2 ARG A 50 8.962 15.997 -0.433 1.00 34.05 N +ATOM 477 H ARG A 50 5.491 19.468 -3.555 1.00 0.00 H +ATOM 478 HE ARG A 50 7.666 17.894 0.470 1.00 0.00 H +ATOM 479 HH11 ARG A 50 5.915 15.141 -0.768 1.00 0.00 H +ATOM 480 HH12 ARG A 50 7.351 14.268 -1.183 1.00 0.00 H +ATOM 481 HH21 ARG A 50 9.530 16.754 -0.109 1.00 0.00 H +ATOM 482 HH22 ARG A 50 9.390 15.182 -0.821 1.00 0.00 H +ATOM 483 N THR A 51 7.156 22.103 -2.293 1.00 30.60 N +ATOM 484 CA THR A 51 7.940 23.328 -2.202 1.00 34.13 C +ATOM 485 C THR A 51 7.126 24.546 -2.664 1.00 36.23 C +ATOM 486 O THR A 51 7.116 25.572 -1.989 1.00 37.79 O +ATOM 487 CB THR A 51 9.229 23.248 -3.045 1.00 34.90 C +ATOM 488 OG1 THR A 51 10.012 22.129 -2.618 1.00 37.41 O +ATOM 489 CG2 THR A 51 10.053 24.516 -2.883 1.00 34.97 C +ATOM 490 H THR A 51 7.478 21.356 -2.840 1.00 0.00 H +ATOM 491 HG1 THR A 51 10.112 22.153 -1.662 1.00 0.00 H +ATOM 492 N ARG A 52 6.437 24.426 -3.808 1.00 36.91 N +ATOM 493 CA ARG A 52 5.643 25.532 -4.334 1.00 37.18 C +ATOM 494 C ARG A 52 4.606 25.971 -3.336 1.00 36.76 C +ATOM 495 O ARG A 52 4.440 27.160 -3.082 1.00 36.25 O +ATOM 496 CB ARG A 52 4.936 25.144 -5.645 1.00 40.06 C +ATOM 497 CG ARG A 52 5.789 25.346 -6.882 1.00 46.55 C +ATOM 498 CD ARG A 52 5.012 25.112 -8.177 1.00 50.64 C +ATOM 499 NE ARG A 52 4.800 23.686 -8.469 1.00 54.17 N +ATOM 500 CZ ARG A 52 3.586 23.152 -8.595 1.00 55.29 C +ATOM 501 NH1 ARG A 52 2.510 23.914 -8.453 1.00 55.77 N +ATOM 502 NH2 ARG A 52 3.448 21.863 -8.859 1.00 54.72 N +ATOM 503 H ARG A 52 6.465 23.577 -4.298 1.00 0.00 H +ATOM 504 HE ARG A 52 5.582 23.107 -8.573 1.00 0.00 H +ATOM 505 HH11 ARG A 52 2.609 24.886 -8.243 1.00 0.00 H +ATOM 506 HH12 ARG A 52 1.601 23.516 -8.532 1.00 0.00 H +ATOM 507 HH21 ARG A 52 4.256 21.283 -8.962 1.00 0.00 H +ATOM 508 HH22 ARG A 52 2.534 21.466 -8.949 1.00 0.00 H +ATOM 509 N ILE A 53 3.911 25.007 -2.763 1.00 35.47 N +ATOM 510 CA ILE A 53 2.880 25.315 -1.797 1.00 34.72 C +ATOM 511 C ILE A 53 3.469 25.944 -0.519 1.00 36.40 C +ATOM 512 O ILE A 53 2.917 26.915 0.007 1.00 35.83 O +ATOM 513 CB ILE A 53 2.060 24.063 -1.457 1.00 32.23 C +ATOM 514 CG1 ILE A 53 1.312 23.604 -2.722 1.00 29.11 C +ATOM 515 CG2 ILE A 53 1.091 24.371 -0.326 1.00 31.92 C +ATOM 516 CD1 ILE A 53 0.519 22.328 -2.562 1.00 26.86 C +ATOM 517 H ILE A 53 4.101 24.073 -2.991 1.00 0.00 H +ATOM 518 N LEU A 54 4.593 25.421 -0.035 1.00 37.08 N +ATOM 519 CA LEU A 54 5.218 26.007 1.135 1.00 40.29 C +ATOM 520 C LEU A 54 5.580 27.455 0.843 1.00 44.75 C +ATOM 521 O LEU A 54 5.191 28.352 1.593 1.00 46.69 O +ATOM 522 CB LEU A 54 6.455 25.213 1.570 1.00 36.32 C +ATOM 523 CG LEU A 54 6.184 23.848 2.250 1.00 35.63 C +ATOM 524 CD1 LEU A 54 7.482 23.082 2.415 1.00 35.47 C +ATOM 525 CD2 LEU A 54 5.495 24.031 3.599 1.00 32.30 C +ATOM 526 H LEU A 54 4.995 24.636 -0.465 1.00 0.00 H +ATOM 527 N GLU A 55 6.255 27.694 -0.278 1.00 48.95 N +ATOM 528 CA GLU A 55 6.653 29.057 -0.641 1.00 53.87 C +ATOM 529 C GLU A 55 5.475 30.011 -0.879 1.00 55.01 C +ATOM 530 O GLU A 55 5.632 31.220 -0.716 1.00 56.05 O +ATOM 531 CB GLU A 55 7.559 29.061 -1.867 1.00 56.02 C +ATOM 532 CG GLU A 55 8.998 28.661 -1.574 1.00 61.71 C +ATOM 533 CD GLU A 55 9.913 28.817 -2.782 1.00 65.77 C +ATOM 534 OE1 GLU A 55 9.578 29.620 -3.692 1.00 67.68 O +ATOM 535 OE2 GLU A 55 10.972 28.141 -2.825 1.00 67.99 O +ATOM 536 H GLU A 55 6.487 26.949 -0.871 1.00 0.00 H +ATOM 537 N LYS A 56 4.300 29.504 -1.233 1.00 56.16 N +ATOM 538 CA LYS A 56 3.190 30.407 -1.512 1.00 57.49 C +ATOM 539 C LYS A 56 2.177 30.484 -0.374 1.00 57.70 C +ATOM 540 O LYS A 56 1.709 31.565 -0.027 1.00 58.88 O +ATOM 541 CB LYS A 56 2.462 30.010 -2.805 1.00 59.37 C +ATOM 542 CG LYS A 56 3.353 29.694 -4.000 1.00 60.92 C +ATOM 543 CD LYS A 56 4.379 30.776 -4.270 1.00 62.11 C +ATOM 544 CE LYS A 56 5.349 30.325 -5.346 1.00 62.44 C +ATOM 545 NZ LYS A 56 6.619 31.101 -5.312 1.00 63.21 N +ATOM 546 H LYS A 56 4.182 28.533 -1.316 1.00 0.00 H +ATOM 547 HZ1 LYS A 56 6.413 32.110 -5.451 1.00 0.00 H +ATOM 548 HZ2 LYS A 56 7.083 30.968 -4.390 1.00 0.00 H +ATOM 549 HZ3 LYS A 56 7.249 30.768 -6.070 1.00 0.00 H +ATOM 550 N GLU A 57 1.827 29.347 0.196 1.00 57.07 N +ATOM 551 CA GLU A 57 0.797 29.311 1.235 1.00 56.65 C +ATOM 552 C GLU A 57 1.332 29.368 2.684 1.00 54.52 C +ATOM 553 O GLU A 57 0.620 29.824 3.598 1.00 54.61 O +ATOM 554 CB GLU A 57 -0.062 28.043 1.078 1.00 59.13 C +ATOM 555 CG GLU A 57 -1.132 28.102 -0.004 1.00 63.67 C +ATOM 556 CD GLU A 57 -0.571 28.357 -1.387 1.00 67.30 C +ATOM 557 OE1 GLU A 57 -0.072 27.402 -2.017 1.00 69.12 O +ATOM 558 OE2 GLU A 57 -0.632 29.519 -1.849 1.00 70.26 O +ATOM 559 H GLU A 57 2.257 28.521 -0.082 1.00 0.00 H +ATOM 560 N VAL A 58 2.570 28.937 2.917 1.00 49.63 N +ATOM 561 CA VAL A 58 3.017 28.786 4.292 1.00 44.43 C +ATOM 562 C VAL A 58 4.100 29.778 4.744 1.00 42.78 C +ATOM 563 O VAL A 58 4.065 30.242 5.888 1.00 40.70 O +ATOM 564 CB VAL A 58 3.470 27.322 4.534 1.00 43.06 C +ATOM 565 CG1 VAL A 58 3.795 27.092 5.998 1.00 40.87 C +ATOM 566 CG2 VAL A 58 2.370 26.369 4.086 1.00 40.46 C +ATOM 567 H VAL A 58 3.172 28.726 2.171 1.00 0.00 H +ATOM 568 N LEU A 59 5.045 30.125 3.873 1.00 39.75 N +ATOM 569 CA LEU A 59 6.126 31.020 4.281 1.00 38.99 C +ATOM 570 C LEU A 59 5.649 32.438 4.643 1.00 38.81 C +ATOM 571 O LEU A 59 6.371 33.182 5.311 1.00 38.40 O +ATOM 572 CB LEU A 59 7.220 31.083 3.218 1.00 40.26 C +ATOM 573 CG LEU A 59 8.011 29.793 2.935 1.00 42.18 C +ATOM 574 CD1 LEU A 59 9.048 30.068 1.854 1.00 43.46 C +ATOM 575 CD2 LEU A 59 8.705 29.285 4.187 1.00 40.89 C +ATOM 576 H LEU A 59 5.019 29.775 2.957 1.00 0.00 H +ATOM 577 N LYS A 60 4.442 32.824 4.220 1.00 37.98 N +ATOM 578 CA LYS A 60 3.900 34.140 4.604 1.00 38.59 C +ATOM 579 C LYS A 60 3.195 34.061 5.973 1.00 36.39 C +ATOM 580 O LYS A 60 2.649 35.028 6.474 1.00 35.79 O +ATOM 581 CB LYS A 60 2.940 34.673 3.522 1.00 41.34 C +ATOM 582 CG LYS A 60 1.766 33.760 3.171 1.00 47.49 C +ATOM 583 CD LYS A 60 0.876 34.407 2.102 1.00 50.85 C +ATOM 584 CE LYS A 60 -0.508 33.757 2.010 1.00 53.27 C +ATOM 585 NZ LYS A 60 -0.459 32.368 1.466 1.00 54.66 N +ATOM 586 H LYS A 60 3.915 32.232 3.649 1.00 0.00 H +ATOM 587 HZ1 LYS A 60 0.153 31.784 2.070 1.00 0.00 H +ATOM 588 HZ2 LYS A 60 -1.418 31.967 1.451 1.00 0.00 H +ATOM 589 HZ3 LYS A 60 -0.076 32.388 0.500 1.00 0.00 H +ATOM 590 N GLU A 61 3.241 32.884 6.559 1.00 35.74 N +ATOM 591 CA GLU A 61 2.635 32.606 7.849 1.00 34.60 C +ATOM 592 C GLU A 61 3.719 32.560 8.935 1.00 30.62 C +ATOM 593 O GLU A 61 4.924 32.542 8.646 1.00 28.48 O +ATOM 594 CB GLU A 61 1.990 31.214 7.782 1.00 39.66 C +ATOM 595 CG GLU A 61 0.636 31.096 8.418 1.00 45.92 C +ATOM 596 CD GLU A 61 -0.377 31.877 7.639 1.00 48.95 C +ATOM 597 OE1 GLU A 61 -0.692 31.467 6.495 1.00 51.19 O +ATOM 598 OE2 GLU A 61 -0.850 32.904 8.161 1.00 51.71 O +ATOM 599 H GLU A 61 3.711 32.155 6.108 1.00 0.00 H +ATOM 600 N THR A 62 3.293 32.544 10.171 1.00 27.25 N +ATOM 601 CA THR A 62 4.222 32.307 11.253 1.00 25.63 C +ATOM 602 C THR A 62 4.784 30.874 11.059 1.00 24.77 C +ATOM 603 O THR A 62 4.029 29.932 10.840 1.00 25.37 O +ATOM 604 CB THR A 62 3.489 32.435 12.612 1.00 24.97 C +ATOM 605 OG1 THR A 62 3.032 33.783 12.735 1.00 26.20 O +ATOM 606 CG2 THR A 62 4.398 32.117 13.789 1.00 21.20 C +ATOM 607 H THR A 62 2.346 32.689 10.363 1.00 0.00 H +ATOM 608 HG1 THR A 62 2.683 34.075 11.886 1.00 0.00 H +ATOM 609 N HIS A 63 6.090 30.727 11.103 1.00 22.46 N +ATOM 610 CA HIS A 63 6.689 29.428 10.867 1.00 21.88 C +ATOM 611 C HIS A 63 8.151 29.435 11.272 1.00 22.48 C +ATOM 612 O HIS A 63 8.745 30.495 11.513 1.00 21.68 O +ATOM 613 CB HIS A 63 6.608 29.071 9.366 1.00 20.21 C +ATOM 614 CG HIS A 63 7.519 29.918 8.512 1.00 20.30 C +ATOM 615 ND1 HIS A 63 7.125 31.124 7.953 1.00 21.50 N +ATOM 616 CD2 HIS A 63 8.845 29.800 8.198 1.00 20.65 C +ATOM 617 CE1 HIS A 63 8.126 31.727 7.333 1.00 20.90 C +ATOM 618 NE2 HIS A 63 9.169 30.942 7.478 1.00 21.55 N +ATOM 619 H HIS A 63 6.663 31.500 11.309 1.00 0.00 H +ATOM 620 HD1 HIS A 63 6.209 31.477 7.991 1.00 0.00 H +ATOM 621 HE2 HIS A 63 10.052 31.147 7.133 1.00 0.00 H +ATOM 622 N GLU A 64 8.738 28.251 11.238 1.00 22.95 N +ATOM 623 CA GLU A 64 10.138 28.055 11.535 1.00 23.61 C +ATOM 624 C GLU A 64 10.697 27.100 10.460 1.00 24.98 C +ATOM 625 O GLU A 64 10.132 26.021 10.254 1.00 24.19 O +ATOM 626 CB GLU A 64 10.199 27.431 12.901 1.00 25.13 C +ATOM 627 CG GLU A 64 11.558 27.257 13.499 1.00 33.54 C +ATOM 628 CD GLU A 64 11.474 26.481 14.804 1.00 36.59 C +ATOM 629 OE1 GLU A 64 10.501 26.685 15.558 1.00 36.12 O +ATOM 630 OE2 GLU A 64 12.376 25.665 15.070 1.00 41.18 O +ATOM 631 H GLU A 64 8.200 27.468 10.997 1.00 0.00 H +ATOM 632 N LYS A 65 11.739 27.531 9.737 1.00 24.36 N +ATOM 633 CA LYS A 65 12.353 26.718 8.693 1.00 28.24 C +ATOM 634 C LYS A 65 13.510 25.954 9.251 1.00 28.33 C +ATOM 635 O LYS A 65 14.585 26.503 9.412 1.00 28.08 O +ATOM 636 CB LYS A 65 12.896 27.587 7.556 1.00 31.73 C +ATOM 637 CG LYS A 65 12.049 27.649 6.299 1.00 36.91 C +ATOM 638 CD LYS A 65 12.165 29.023 5.643 1.00 40.14 C +ATOM 639 CE LYS A 65 11.933 30.111 6.681 1.00 39.32 C +ATOM 640 NZ LYS A 65 11.630 31.435 6.088 1.00 36.54 N +ATOM 641 H LYS A 65 12.110 28.420 9.924 1.00 0.00 H +ATOM 642 HZ1 LYS A 65 12.425 31.734 5.487 1.00 0.00 H +ATOM 643 HZ2 LYS A 65 10.766 31.367 5.511 1.00 0.00 H +ATOM 644 HZ3 LYS A 65 11.487 32.131 6.847 1.00 0.00 H +ATOM 645 N VAL A 66 13.291 24.696 9.552 1.00 31.01 N +ATOM 646 CA VAL A 66 14.358 23.851 10.050 1.00 34.94 C +ATOM 647 C VAL A 66 14.962 23.049 8.896 1.00 39.67 C +ATOM 648 O VAL A 66 14.428 22.006 8.483 1.00 37.52 O +ATOM 649 CB VAL A 66 13.862 22.887 11.168 1.00 34.61 C +ATOM 650 CG1 VAL A 66 14.973 21.935 11.594 1.00 33.81 C +ATOM 651 CG2 VAL A 66 13.401 23.687 12.375 1.00 34.49 C +ATOM 652 H VAL A 66 12.388 24.323 9.443 1.00 0.00 H +ATOM 653 N GLN A 67 16.040 23.586 8.332 1.00 46.01 N +ATOM 654 CA GLN A 67 16.763 22.891 7.275 1.00 53.84 C +ATOM 655 C GLN A 67 18.179 22.570 7.732 1.00 58.95 C +ATOM 656 O GLN A 67 19.013 22.109 6.948 1.00 60.26 O +ATOM 657 CB GLN A 67 16.784 23.703 5.985 1.00 53.89 C +ATOM 658 CG GLN A 67 15.426 23.779 5.294 1.00 59.07 C +ATOM 659 CD GLN A 67 14.657 22.452 5.300 1.00 60.32 C +ATOM 660 OE1 GLN A 67 15.031 21.480 4.629 1.00 62.98 O +ATOM 661 NE2 GLN A 67 13.571 22.404 6.053 1.00 59.66 N +ATOM 662 H GLN A 67 16.348 24.470 8.627 1.00 0.00 H +ATOM 663 HE21 GLN A 67 13.049 21.578 6.062 1.00 0.00 H +ATOM 664 HE22 GLN A 67 13.328 23.200 6.571 1.00 0.00 H +ATOM 665 N GLY A 68 18.428 22.811 9.025 1.00 63.66 N +ATOM 666 CA GLY A 68 19.718 22.513 9.608 1.00 67.82 C +ATOM 667 C GLY A 68 19.631 21.327 10.546 1.00 70.65 C +ATOM 668 O GLY A 68 20.590 20.563 10.690 1.00 72.02 O +ATOM 669 H GLY A 68 17.727 23.193 9.587 1.00 0.00 H +ATOM 670 N GLY A 69 18.484 21.187 11.208 1.00 72.32 N +ATOM 671 CA GLY A 69 18.274 20.048 12.083 1.00 73.41 C +ATOM 672 C GLY A 69 18.041 18.789 11.270 1.00 73.97 C +ATOM 673 O GLY A 69 16.899 18.441 10.969 1.00 75.24 O +ATOM 674 H GLY A 69 17.778 21.853 11.102 1.00 0.00 H +ATOM 675 N PHE A 70 19.137 18.135 10.900 1.00 73.39 N +ATOM 676 CA PHE A 70 19.106 16.920 10.080 1.00 72.45 C +ATOM 677 C PHE A 70 18.165 15.833 10.606 1.00 69.47 C +ATOM 678 O PHE A 70 18.036 15.622 11.819 1.00 69.28 O +ATOM 679 CB PHE A 70 20.534 16.352 9.963 1.00 77.03 C +ATOM 680 CG PHE A 70 20.600 14.896 9.586 1.00 79.94 C +ATOM 681 CD1 PHE A 70 20.367 14.492 8.269 1.00 81.63 C +ATOM 682 CD2 PHE A 70 20.858 13.920 10.561 1.00 80.76 C +ATOM 683 CE1 PHE A 70 20.384 13.141 7.933 1.00 82.97 C +ATOM 684 CE2 PHE A 70 20.875 12.571 10.232 1.00 81.33 C +ATOM 685 CZ PHE A 70 20.638 12.181 8.917 1.00 82.90 C +ATOM 686 H PHE A 70 20.007 18.487 11.182 1.00 0.00 H +ATOM 687 N GLY A 71 17.534 15.127 9.666 1.00 65.37 N +ATOM 688 CA GLY A 71 16.681 14.014 10.024 1.00 60.61 C +ATOM 689 C GLY A 71 15.251 14.174 9.548 1.00 56.43 C +ATOM 690 O GLY A 71 14.949 15.071 8.766 1.00 56.11 O +ATOM 691 H GLY A 71 17.632 15.378 8.724 1.00 0.00 H +ATOM 692 N LYS A 72 14.367 13.295 10.036 1.00 51.93 N +ATOM 693 CA LYS A 72 12.939 13.359 9.704 1.00 47.12 C +ATOM 694 C LYS A 72 12.312 14.620 10.322 1.00 42.99 C +ATOM 695 O LYS A 72 11.172 14.976 10.019 1.00 41.22 O +ATOM 696 CB LYS A 72 12.214 12.127 10.263 1.00 47.52 C +ATOM 697 CG LYS A 72 12.828 10.789 9.890 1.00 47.51 C +ATOM 698 CD LYS A 72 13.208 9.975 11.122 1.00 45.89 C +ATOM 699 CE LYS A 72 12.024 9.749 12.053 1.00 45.99 C +ATOM 700 NZ LYS A 72 10.946 8.941 11.439 1.00 43.61 N +ATOM 701 H LYS A 72 14.682 12.587 10.635 1.00 0.00 H +ATOM 702 HZ1 LYS A 72 10.620 9.405 10.566 1.00 0.00 H +ATOM 703 HZ2 LYS A 72 11.311 7.995 11.214 1.00 0.00 H +ATOM 704 HZ3 LYS A 72 10.153 8.856 12.105 1.00 0.00 H +ATOM 705 N TYR A 73 13.084 15.252 11.211 1.00 38.82 N +ATOM 706 CA TYR A 73 12.666 16.439 11.926 1.00 35.13 C +ATOM 707 C TYR A 73 12.654 17.679 11.023 1.00 33.18 C +ATOM 708 O TYR A 73 11.879 18.607 11.253 1.00 30.17 O +ATOM 709 CB TYR A 73 13.600 16.649 13.125 1.00 32.68 C +ATOM 710 CG TYR A 73 13.198 17.796 14.018 1.00 32.41 C +ATOM 711 CD1 TYR A 73 12.116 17.691 14.884 1.00 31.25 C +ATOM 712 CD2 TYR A 73 13.835 19.025 13.921 1.00 32.40 C +ATOM 713 CE1 TYR A 73 11.679 18.785 15.613 1.00 30.72 C +ATOM 714 CE2 TYR A 73 13.400 20.120 14.644 1.00 32.39 C +ATOM 715 CZ TYR A 73 12.317 19.993 15.478 1.00 30.86 C +ATOM 716 OH TYR A 73 11.840 21.094 16.130 1.00 32.23 O +ATOM 717 H TYR A 73 13.974 14.893 11.393 1.00 0.00 H +ATOM 718 HH TYR A 73 12.352 21.867 15.869 1.00 0.00 H +ATOM 719 N GLN A 74 13.525 17.690 10.013 1.00 31.23 N +ATOM 720 CA GLN A 74 13.605 18.814 9.066 1.00 29.72 C +ATOM 721 C GLN A 74 12.254 19.162 8.468 1.00 26.23 C +ATOM 722 O GLN A 74 11.409 18.291 8.229 1.00 24.41 O +ATOM 723 CB GLN A 74 14.535 18.475 7.902 1.00 33.74 C +ATOM 724 CG GLN A 74 16.010 18.494 8.213 1.00 41.63 C +ATOM 725 CD GLN A 74 16.825 17.988 7.039 1.00 47.74 C +ATOM 726 OE1 GLN A 74 17.535 16.971 7.143 1.00 52.12 O +ATOM 727 NE2 GLN A 74 16.728 18.678 5.908 1.00 49.67 N +ATOM 728 H GLN A 74 14.129 16.927 9.898 1.00 0.00 H +ATOM 729 HE21 GLN A 74 17.240 18.365 5.133 1.00 0.00 H +ATOM 730 HE22 GLN A 74 16.152 19.471 5.887 1.00 0.00 H +ATOM 731 N GLY A 75 12.066 20.432 8.182 1.00 24.61 N +ATOM 732 CA GLY A 75 10.849 20.850 7.522 1.00 22.59 C +ATOM 733 C GLY A 75 10.439 22.235 7.929 1.00 22.00 C +ATOM 734 O GLY A 75 11.189 22.944 8.595 1.00 20.96 O +ATOM 735 H GLY A 75 12.741 21.096 8.433 1.00 0.00 H +ATOM 736 N THR A 76 9.267 22.641 7.507 1.00 22.18 N +ATOM 737 CA THR A 76 8.739 23.926 7.925 1.00 23.13 C +ATOM 738 C THR A 76 7.705 23.707 9.012 1.00 21.22 C +ATOM 739 O THR A 76 6.677 23.047 8.785 1.00 20.41 O +ATOM 740 CB THR A 76 8.129 24.677 6.750 1.00 22.98 C +ATOM 741 OG1 THR A 76 9.172 24.951 5.823 1.00 23.34 O +ATOM 742 CG2 THR A 76 7.529 25.993 7.203 1.00 22.12 C +ATOM 743 H THR A 76 8.743 22.073 6.908 1.00 0.00 H +ATOM 744 HG1 THR A 76 9.671 24.146 5.648 1.00 0.00 H +ATOM 745 N TRP A 77 8.007 24.190 10.198 1.00 18.01 N +ATOM 746 CA TRP A 77 7.115 24.000 11.334 1.00 19.61 C +ATOM 747 C TRP A 77 6.172 25.179 11.495 1.00 20.15 C +ATOM 748 O TRP A 77 6.569 26.324 11.307 1.00 21.17 O +ATOM 749 CB TRP A 77 7.954 23.797 12.587 1.00 18.45 C +ATOM 750 CG TRP A 77 8.738 22.517 12.563 1.00 16.73 C +ATOM 751 CD1 TRP A 77 9.924 22.262 11.889 1.00 19.52 C +ATOM 752 CD2 TRP A 77 8.383 21.314 13.246 1.00 16.18 C +ATOM 753 NE1 TRP A 77 10.287 20.964 12.134 1.00 18.03 N +ATOM 754 CE2 TRP A 77 9.378 20.351 12.952 1.00 18.24 C +ATOM 755 CE3 TRP A 77 7.303 20.950 14.076 1.00 15.09 C +ATOM 756 CZ2 TRP A 77 9.333 19.052 13.464 1.00 17.80 C +ATOM 757 CZ3 TRP A 77 7.263 19.657 14.586 1.00 16.17 C +ATOM 758 CH2 TRP A 77 8.271 18.728 14.275 1.00 16.88 C +ATOM 759 H TRP A 77 8.844 24.682 10.320 1.00 0.00 H +ATOM 760 HE1 TRP A 77 11.083 20.525 11.763 1.00 0.00 H +ATOM 761 N VAL A 78 4.940 24.916 11.848 1.00 19.79 N +ATOM 762 CA VAL A 78 3.960 25.992 11.977 1.00 21.20 C +ATOM 763 C VAL A 78 3.102 25.800 13.232 1.00 22.23 C +ATOM 764 O VAL A 78 3.039 24.692 13.785 1.00 20.52 O +ATOM 765 CB VAL A 78 3.014 26.045 10.738 1.00 20.50 C +ATOM 766 CG1 VAL A 78 3.805 26.352 9.464 1.00 19.09 C +ATOM 767 CG2 VAL A 78 2.264 24.722 10.594 1.00 19.19 C +ATOM 768 H VAL A 78 4.670 23.993 12.035 1.00 0.00 H +ATOM 769 N PRO A 79 2.461 26.879 13.729 1.00 22.62 N +ATOM 770 CA PRO A 79 1.579 26.796 14.902 1.00 23.25 C +ATOM 771 C PRO A 79 0.479 25.793 14.613 1.00 23.88 C +ATOM 772 O PRO A 79 0.126 25.577 13.452 1.00 22.74 O +ATOM 773 CB PRO A 79 1.009 28.217 15.030 1.00 22.80 C +ATOM 774 CG PRO A 79 2.089 29.063 14.441 1.00 23.48 C +ATOM 775 CD PRO A 79 2.583 28.279 13.243 1.00 21.77 C +ATOM 776 N LEU A 80 -0.081 25.221 15.664 1.00 25.83 N +ATOM 777 CA LEU A 80 -1.142 24.222 15.543 1.00 26.16 C +ATOM 778 C LEU A 80 -2.338 24.712 14.733 1.00 28.51 C +ATOM 779 O LEU A 80 -2.846 23.991 13.849 1.00 27.56 O +ATOM 780 CB LEU A 80 -1.606 23.815 16.940 1.00 25.96 C +ATOM 781 CG LEU A 80 -2.660 22.728 17.020 1.00 26.73 C +ATOM 782 CD1 LEU A 80 -2.142 21.452 16.363 1.00 25.64 C +ATOM 783 CD2 LEU A 80 -3.028 22.488 18.480 1.00 29.49 C +ATOM 784 H LEU A 80 0.229 25.469 16.557 1.00 0.00 H +ATOM 785 N ASN A 81 -2.811 25.922 15.016 1.00 30.41 N +ATOM 786 CA ASN A 81 -3.989 26.411 14.305 1.00 33.34 C +ATOM 787 C ASN A 81 -3.726 26.541 12.797 1.00 33.24 C +ATOM 788 O ASN A 81 -4.593 26.200 11.979 1.00 32.55 O +ATOM 789 CB ASN A 81 -4.522 27.720 14.912 1.00 36.72 C +ATOM 790 CG ASN A 81 -3.615 28.898 14.707 1.00 41.39 C +ATOM 791 OD1 ASN A 81 -2.520 28.954 15.254 1.00 45.06 O +ATOM 792 ND2 ASN A 81 -4.064 29.855 13.912 1.00 44.46 N +ATOM 793 H ASN A 81 -2.379 26.474 15.701 1.00 0.00 H +ATOM 794 HD21 ASN A 81 -3.494 30.640 13.765 1.00 0.00 H +ATOM 795 HD22 ASN A 81 -4.947 29.746 13.504 1.00 0.00 H +ATOM 796 N ILE A 82 -2.509 26.970 12.436 1.00 33.12 N +ATOM 797 CA ILE A 82 -2.133 27.108 11.022 1.00 33.42 C +ATOM 798 C ILE A 82 -1.996 25.751 10.338 1.00 33.66 C +ATOM 799 O ILE A 82 -2.344 25.611 9.172 1.00 33.06 O +ATOM 800 CB ILE A 82 -0.820 27.882 10.878 1.00 34.68 C +ATOM 801 CG1 ILE A 82 -1.027 29.318 11.381 1.00 35.90 C +ATOM 802 CG2 ILE A 82 -0.364 27.862 9.424 1.00 32.30 C +ATOM 803 CD1 ILE A 82 0.246 30.062 11.708 1.00 36.35 C +ATOM 804 H ILE A 82 -1.856 27.193 13.129 1.00 0.00 H +ATOM 805 N ALA A 83 -1.487 24.751 11.078 1.00 33.47 N +ATOM 806 CA ALA A 83 -1.385 23.383 10.547 1.00 32.68 C +ATOM 807 C ALA A 83 -2.796 22.798 10.314 1.00 32.07 C +ATOM 808 O ALA A 83 -3.034 22.097 9.335 1.00 30.79 O +ATOM 809 CB ALA A 83 -0.586 22.496 11.509 1.00 31.27 C +ATOM 810 H ALA A 83 -1.184 24.937 11.992 1.00 0.00 H +ATOM 811 N LYS A 84 -3.729 23.093 11.215 1.00 33.43 N +ATOM 812 CA LYS A 84 -5.093 22.639 11.041 1.00 35.11 C +ATOM 813 C LYS A 84 -5.693 23.212 9.756 1.00 36.73 C +ATOM 814 O LYS A 84 -6.318 22.491 8.974 1.00 36.83 O +ATOM 815 CB LYS A 84 -5.948 23.050 12.228 1.00 37.36 C +ATOM 816 CG LYS A 84 -5.607 22.354 13.530 1.00 40.04 C +ATOM 817 CD LYS A 84 -6.871 22.073 14.319 1.00 42.74 C +ATOM 818 CE LYS A 84 -6.559 21.578 15.716 1.00 45.28 C +ATOM 819 NZ LYS A 84 -6.384 22.711 16.664 1.00 49.86 N +ATOM 820 H LYS A 84 -3.489 23.619 12.006 1.00 0.00 H +ATOM 821 HZ1 LYS A 84 -5.641 23.348 16.311 1.00 0.00 H +ATOM 822 HZ2 LYS A 84 -7.280 23.233 16.744 1.00 0.00 H +ATOM 823 HZ3 LYS A 84 -6.113 22.344 17.598 1.00 0.00 H +ATOM 824 N GLN A 85 -5.504 24.510 9.535 1.00 37.40 N +ATOM 825 CA GLN A 85 -5.981 25.141 8.298 1.00 38.47 C +ATOM 826 C GLN A 85 -5.414 24.411 7.065 1.00 37.19 C +ATOM 827 O GLN A 85 -6.144 24.015 6.168 1.00 36.76 O +ATOM 828 CB GLN A 85 -5.550 26.617 8.243 1.00 41.65 C +ATOM 829 CG GLN A 85 -6.176 27.513 9.302 1.00 47.67 C +ATOM 830 CD GLN A 85 -5.653 28.953 9.274 1.00 52.44 C +ATOM 831 OE1 GLN A 85 -4.985 29.379 8.321 1.00 53.70 O +ATOM 832 NE2 GLN A 85 -5.956 29.710 10.327 1.00 54.30 N +ATOM 833 H GLN A 85 -5.029 25.050 10.201 1.00 0.00 H +ATOM 834 HE21 GLN A 85 -5.645 30.638 10.336 1.00 0.00 H +ATOM 835 HE22 GLN A 85 -6.483 29.308 11.051 1.00 0.00 H +ATOM 836 N LEU A 86 -4.107 24.239 7.050 1.00 35.90 N +ATOM 837 CA LEU A 86 -3.427 23.593 5.952 1.00 35.57 C +ATOM 838 C LEU A 86 -3.973 22.187 5.705 1.00 36.04 C +ATOM 839 O LEU A 86 -4.216 21.789 4.568 1.00 35.67 O +ATOM 840 CB LEU A 86 -1.940 23.522 6.282 1.00 35.24 C +ATOM 841 CG LEU A 86 -0.979 23.392 5.104 1.00 37.99 C +ATOM 842 CD1 LEU A 86 -1.046 24.641 4.236 1.00 37.21 C +ATOM 843 CD2 LEU A 86 0.434 23.187 5.623 1.00 37.56 C +ATOM 844 H LEU A 86 -3.579 24.563 7.810 1.00 0.00 H +ATOM 845 N ALA A 87 -4.167 21.440 6.774 1.00 37.61 N +ATOM 846 CA ALA A 87 -4.658 20.075 6.672 1.00 40.07 C +ATOM 847 C ALA A 87 -6.071 20.045 6.108 1.00 42.25 C +ATOM 848 O ALA A 87 -6.423 19.123 5.387 1.00 44.08 O +ATOM 849 CB ALA A 87 -4.614 19.402 8.041 1.00 37.62 C +ATOM 850 H ALA A 87 -3.984 21.816 7.658 1.00 0.00 H +ATOM 851 N GLU A 88 -6.881 21.042 6.453 1.00 44.94 N +ATOM 852 CA GLU A 88 -8.250 21.137 5.934 1.00 47.72 C +ATOM 853 C GLU A 88 -8.249 21.462 4.446 1.00 46.92 C +ATOM 854 O GLU A 88 -8.935 20.809 3.652 1.00 46.82 O +ATOM 855 CB GLU A 88 -9.029 22.238 6.647 1.00 51.27 C +ATOM 856 CG GLU A 88 -9.499 21.887 8.035 1.00 58.64 C +ATOM 857 CD GLU A 88 -10.532 22.873 8.532 1.00 63.08 C +ATOM 858 OE1 GLU A 88 -11.497 23.154 7.774 1.00 65.53 O +ATOM 859 OE2 GLU A 88 -10.381 23.370 9.674 1.00 64.92 O +ATOM 860 H GLU A 88 -6.554 21.730 7.069 1.00 0.00 H +ATOM 861 N LYS A 89 -7.484 22.490 4.087 1.00 45.19 N +ATOM 862 CA LYS A 89 -7.401 22.930 2.722 1.00 45.73 C +ATOM 863 C LYS A 89 -7.064 21.776 1.802 1.00 45.59 C +ATOM 864 O LYS A 89 -7.728 21.571 0.792 1.00 46.84 O +ATOM 865 CB LYS A 89 -6.346 24.019 2.592 1.00 46.57 C +ATOM 866 CG LYS A 89 -6.374 24.759 1.269 1.00 49.11 C +ATOM 867 CD LYS A 89 -5.470 25.976 1.314 1.00 52.19 C +ATOM 868 CE LYS A 89 -5.826 26.963 0.216 1.00 55.10 C +ATOM 869 NZ LYS A 89 -5.139 28.274 0.395 1.00 56.62 N +ATOM 870 H LYS A 89 -6.963 22.959 4.773 1.00 0.00 H +ATOM 871 HZ1 LYS A 89 -4.109 28.127 0.406 1.00 0.00 H +ATOM 872 HZ2 LYS A 89 -5.390 28.905 -0.391 1.00 0.00 H +ATOM 873 HZ3 LYS A 89 -5.437 28.704 1.294 1.00 0.00 H +ATOM 874 N PHE A 90 -6.055 21.001 2.163 1.00 44.53 N +ATOM 875 CA PHE A 90 -5.631 19.900 1.314 1.00 44.24 C +ATOM 876 C PHE A 90 -6.275 18.576 1.716 1.00 44.45 C +ATOM 877 O PHE A 90 -5.737 17.496 1.463 1.00 44.80 O +ATOM 878 CB PHE A 90 -4.099 19.837 1.283 1.00 43.69 C +ATOM 879 CG PHE A 90 -3.510 21.100 0.707 1.00 43.58 C +ATOM 880 CD1 PHE A 90 -3.664 21.403 -0.642 1.00 44.38 C +ATOM 881 CD2 PHE A 90 -2.881 22.034 1.523 1.00 44.26 C +ATOM 882 CE1 PHE A 90 -3.212 22.610 -1.165 1.00 43.38 C +ATOM 883 CE2 PHE A 90 -2.425 23.246 1.011 1.00 43.71 C +ATOM 884 CZ PHE A 90 -2.592 23.535 -0.337 1.00 43.90 C +ATOM 885 H PHE A 90 -5.588 21.170 3.009 1.00 0.00 H +ATOM 886 N SER A 91 -7.444 18.690 2.345 1.00 45.17 N +ATOM 887 CA SER A 91 -8.282 17.543 2.686 1.00 45.85 C +ATOM 888 C SER A 91 -7.553 16.348 3.290 1.00 45.16 C +ATOM 889 O SER A 91 -7.662 15.229 2.790 1.00 45.12 O +ATOM 890 CB SER A 91 -9.061 17.113 1.441 1.00 48.12 C +ATOM 891 OG SER A 91 -9.727 18.233 0.864 1.00 51.11 O +ATOM 892 H SER A 91 -7.764 19.584 2.580 1.00 0.00 H +ATOM 893 HG SER A 91 -10.205 17.955 0.079 1.00 0.00 H +ATOM 894 N VAL A 92 -6.811 16.583 4.361 1.00 44.55 N +ATOM 895 CA VAL A 92 -6.196 15.487 5.129 1.00 44.43 C +ATOM 896 C VAL A 92 -6.451 15.690 6.627 1.00 43.59 C +ATOM 897 O VAL A 92 -5.911 14.975 7.471 1.00 42.35 O +ATOM 898 CB VAL A 92 -4.657 15.344 4.880 1.00 44.50 C +ATOM 899 CG1 VAL A 92 -4.413 14.652 3.553 1.00 44.93 C +ATOM 900 CG2 VAL A 92 -3.972 16.697 4.904 1.00 43.55 C +ATOM 901 H VAL A 92 -6.657 17.507 4.637 1.00 0.00 H +ATOM 902 N TYR A 93 -7.311 16.652 6.938 1.00 44.06 N +ATOM 903 CA TYR A 93 -7.606 16.994 8.321 1.00 46.56 C +ATOM 904 C TYR A 93 -8.156 15.815 9.115 1.00 47.20 C +ATOM 905 O TYR A 93 -7.747 15.568 10.249 1.00 45.84 O +ATOM 906 CB TYR A 93 -8.590 18.172 8.392 1.00 48.04 C +ATOM 907 CG TYR A 93 -8.880 18.600 9.814 1.00 51.15 C +ATOM 908 CD1 TYR A 93 -8.058 19.512 10.466 1.00 52.01 C +ATOM 909 CD2 TYR A 93 -9.901 17.996 10.550 1.00 51.74 C +ATOM 910 CE1 TYR A 93 -8.234 19.796 11.806 1.00 53.05 C +ATOM 911 CE2 TYR A 93 -10.083 18.274 11.891 1.00 52.13 C +ATOM 912 CZ TYR A 93 -9.243 19.172 12.513 1.00 53.58 C +ATOM 913 OH TYR A 93 -9.405 19.442 13.848 1.00 56.47 O +ATOM 914 H TYR A 93 -7.753 17.146 6.220 1.00 0.00 H +ATOM 915 HH TYR A 93 -10.182 18.981 14.176 1.00 0.00 H +ATOM 916 N ASP A 94 -9.076 15.086 8.529 1.00 48.64 N +ATOM 917 CA ASP A 94 -9.678 13.962 9.232 1.00 50.01 C +ATOM 918 C ASP A 94 -8.697 12.805 9.419 1.00 49.07 C +ATOM 919 O ASP A 94 -8.827 12.031 10.370 1.00 48.92 O +ATOM 920 CB ASP A 94 -10.964 13.515 8.517 1.00 53.54 C +ATOM 921 CG ASP A 94 -12.120 14.474 8.796 1.00 54.92 C +ATOM 922 OD1 ASP A 94 -12.762 14.329 9.852 1.00 57.73 O +ATOM 923 OD2 ASP A 94 -12.379 15.377 7.969 1.00 56.24 O +ATOM 924 H ASP A 94 -9.357 15.301 7.615 1.00 0.00 H +ATOM 925 N GLN A 95 -7.712 12.698 8.520 1.00 49.21 N +ATOM 926 CA GLN A 95 -6.664 11.678 8.659 1.00 49.95 C +ATOM 927 C GLN A 95 -5.677 12.029 9.780 1.00 48.73 C +ATOM 928 O GLN A 95 -5.206 11.146 10.495 1.00 48.14 O +ATOM 929 CB GLN A 95 -5.871 11.526 7.358 1.00 51.32 C +ATOM 930 CG GLN A 95 -6.617 10.859 6.227 1.00 54.77 C +ATOM 931 CD GLN A 95 -5.805 10.848 4.952 1.00 57.17 C +ATOM 932 OE1 GLN A 95 -4.715 10.277 4.905 1.00 57.65 O +ATOM 933 NE2 GLN A 95 -6.325 11.483 3.912 1.00 58.76 N +ATOM 934 H GLN A 95 -7.694 13.305 7.752 1.00 0.00 H +ATOM 935 HE21 GLN A 95 -5.808 11.509 3.079 1.00 0.00 H +ATOM 936 HE22 GLN A 95 -7.202 11.904 4.016 1.00 0.00 H +ATOM 937 N LEU A 96 -5.360 13.327 9.908 1.00 48.04 N +ATOM 938 CA LEU A 96 -4.374 13.800 10.893 1.00 46.14 C +ATOM 939 C LEU A 96 -5.003 14.231 12.202 1.00 45.87 C +ATOM 940 O LEU A 96 -4.285 14.496 13.166 1.00 44.88 O +ATOM 941 CB LEU A 96 -3.579 14.981 10.323 1.00 43.86 C +ATOM 942 CG LEU A 96 -3.107 14.825 8.881 1.00 43.10 C +ATOM 943 CD1 LEU A 96 -2.080 15.892 8.542 1.00 40.00 C +ATOM 944 CD2 LEU A 96 -2.533 13.432 8.681 1.00 42.10 C +ATOM 945 H LEU A 96 -5.794 13.981 9.318 1.00 0.00 H +ATOM 946 N LYS A 97 -6.332 14.297 12.237 1.00 47.18 N +ATOM 947 CA LYS A 97 -7.053 14.723 13.436 1.00 47.61 C +ATOM 948 C LYS A 97 -6.528 14.080 14.736 1.00 45.43 C +ATOM 949 O LYS A 97 -6.293 14.784 15.717 1.00 44.43 O +ATOM 950 CB LYS A 97 -8.568 14.489 13.291 1.00 50.67 C +ATOM 951 CG LYS A 97 -9.336 15.078 14.463 1.00 56.31 C +ATOM 952 CD LYS A 97 -10.823 15.199 14.216 1.00 59.48 C +ATOM 953 CE LYS A 97 -11.463 16.020 15.331 1.00 61.13 C +ATOM 954 NZ LYS A 97 -12.926 16.202 15.134 1.00 63.44 N +ATOM 955 H LYS A 97 -6.842 14.065 11.432 1.00 0.00 H +ATOM 956 HZ1 LYS A 97 -13.098 16.675 14.224 1.00 0.00 H +ATOM 957 HZ2 LYS A 97 -13.392 15.273 15.137 1.00 0.00 H +ATOM 958 HZ3 LYS A 97 -13.309 16.784 15.906 1.00 0.00 H +ATOM 959 N PRO A 98 -6.334 12.753 14.803 1.00 44.31 N +ATOM 960 CA PRO A 98 -5.818 12.119 16.014 1.00 45.37 C +ATOM 961 C PRO A 98 -4.589 12.847 16.590 1.00 46.45 C +ATOM 962 O PRO A 98 -4.526 13.091 17.795 1.00 47.44 O +ATOM 963 CB PRO A 98 -5.497 10.687 15.575 1.00 43.63 C +ATOM 964 CG PRO A 98 -5.537 10.749 14.086 1.00 44.43 C +ATOM 965 CD PRO A 98 -6.611 11.744 13.777 1.00 43.98 C +ATOM 966 N LEU A 99 -3.638 13.217 15.725 1.00 46.20 N +ATOM 967 CA LEU A 99 -2.427 13.892 16.177 1.00 45.20 C +ATOM 968 C LEU A 99 -2.731 15.288 16.672 1.00 46.29 C +ATOM 969 O LEU A 99 -2.212 15.707 17.705 1.00 45.15 O +ATOM 970 CB LEU A 99 -1.386 13.979 15.053 1.00 42.84 C +ATOM 971 CG LEU A 99 -0.093 14.741 15.389 1.00 41.15 C +ATOM 972 CD1 LEU A 99 0.804 13.895 16.275 1.00 38.20 C +ATOM 973 CD2 LEU A 99 0.626 15.131 14.117 1.00 39.05 C +ATOM 974 H LEU A 99 -3.759 13.036 14.770 1.00 0.00 H +ATOM 975 N PHE A 100 -3.564 16.007 15.933 1.00 48.58 N +ATOM 976 CA PHE A 100 -3.896 17.372 16.305 1.00 52.20 C +ATOM 977 C PHE A 100 -4.517 17.429 17.688 1.00 56.06 C +ATOM 978 O PHE A 100 -4.089 18.213 18.537 1.00 56.52 O +ATOM 979 CB PHE A 100 -4.865 18.008 15.296 1.00 50.34 C +ATOM 980 CG PHE A 100 -4.309 18.236 13.913 1.00 48.52 C +ATOM 981 CD1 PHE A 100 -2.950 18.478 13.717 1.00 46.65 C +ATOM 982 CD2 PHE A 100 -5.158 18.231 12.803 1.00 47.63 C +ATOM 983 CE1 PHE A 100 -2.447 18.713 12.445 1.00 46.95 C +ATOM 984 CE2 PHE A 100 -4.662 18.466 11.530 1.00 46.65 C +ATOM 985 CZ PHE A 100 -3.304 18.707 11.350 1.00 46.70 C +ATOM 986 H PHE A 100 -3.954 15.615 15.124 1.00 0.00 H +ATOM 987 N ASP A 101 -5.517 16.594 17.924 1.00 60.72 N +ATOM 988 CA ASP A 101 -6.204 16.632 19.205 1.00 66.29 C +ATOM 989 C ASP A 101 -5.449 15.864 20.289 1.00 68.12 C +ATOM 990 O ASP A 101 -5.728 16.047 21.477 1.00 69.45 O +ATOM 991 CB ASP A 101 -7.653 16.132 19.071 1.00 68.88 C +ATOM 992 CG ASP A 101 -7.782 14.625 19.028 1.00 72.53 C +ATOM 993 OD1 ASP A 101 -7.085 13.994 18.212 1.00 74.44 O +ATOM 994 OD2 ASP A 101 -8.584 14.071 19.818 1.00 73.84 O +ATOM 995 H ASP A 101 -5.795 15.955 17.233 1.00 0.00 H +ATOM 996 N PHE A 102 -4.497 15.014 19.881 1.00 69.09 N +ATOM 997 CA PHE A 102 -3.676 14.272 20.835 1.00 69.65 C +ATOM 998 C PHE A 102 -3.031 15.235 21.825 1.00 70.64 C +ATOM 999 O PHE A 102 -2.775 14.878 22.974 1.00 72.94 O +ATOM 1000 CB PHE A 102 -2.583 13.502 20.091 1.00 70.00 C +ATOM 1001 CG PHE A 102 -1.745 12.597 20.951 1.00 71.29 C +ATOM 1002 CD1 PHE A 102 -0.639 13.089 21.637 1.00 71.76 C +ATOM 1003 CD2 PHE A 102 -2.053 11.238 21.062 1.00 72.61 C +ATOM 1004 CE1 PHE A 102 0.139 12.248 22.414 1.00 72.74 C +ATOM 1005 CE2 PHE A 102 -1.274 10.387 21.838 1.00 72.58 C +ATOM 1006 CZ PHE A 102 -0.177 10.895 22.516 1.00 73.27 C +ATOM 1007 H PHE A 102 -4.346 14.884 18.921 1.00 0.00 H +TER 1008 PHE A 102 +HETATM 1009 O HOH A 401 11.442 26.376 18.419 1.00 38.23 O +HETATM 1010 H1 HOH A 401 12.360 26.094 18.365 1.00 0.00 H +HETATM 1011 H2 HOH A 401 11.489 27.267 18.767 1.00 0.00 H +HETATM 1012 O HOH A 402 8.649 28.512 17.527 1.00 47.94 O +HETATM 1013 H1 HOH A 402 9.202 27.788 17.213 1.00 0.00 H +HETATM 1014 H2 HOH A 402 7.878 28.486 16.957 1.00 0.00 H +HETATM 1015 O HOH A 403 7.263 28.403 19.944 1.00 38.55 O +HETATM 1016 H1 HOH A 403 7.266 27.444 19.925 1.00 0.00 H +HETATM 1017 H2 HOH A 403 7.891 28.655 19.252 1.00 0.00 H +HETATM 1018 O HOH A 404 13.823 23.249 15.906 1.00 61.76 O +HETATM 1019 H1 HOH A 404 14.758 23.159 15.681 1.00 0.00 H +HETATM 1020 H2 HOH A 404 13.741 24.157 16.204 1.00 0.00 H +HETATM 1021 O HOH A 405 8.756 28.493 22.514 1.00 66.03 O +HETATM 1022 H1 HOH A 405 8.339 28.510 21.650 1.00 0.00 H +HETATM 1023 H2 HOH A 405 8.556 29.355 22.893 1.00 0.00 H +HETATM 1024 O HOH A 406 9.224 19.780 22.203 1.00 22.24 O +HETATM 1025 H1 HOH A 406 9.276 19.201 21.436 1.00 0.00 H +HETATM 1026 H2 HOH A 406 9.990 19.533 22.736 1.00 0.00 H +HETATM 1027 O HOH A 407 11.643 19.276 23.871 1.00 44.82 O +HETATM 1028 H1 HOH A 407 12.275 19.960 23.620 1.00 0.00 H +HETATM 1029 H2 HOH A 407 11.978 18.952 24.712 1.00 0.00 H +HETATM 1030 O HOH A 408 7.638 19.412 26.856 1.00 66.34 O +HETATM 1031 H1 HOH A 408 7.334 19.672 27.732 1.00 0.00 H +HETATM 1032 H2 HOH A 408 8.293 18.736 27.024 1.00 0.00 H +HETATM 1033 O HOH A 409 9.788 12.718 23.881 1.00 35.90 O +HETATM 1034 H1 HOH A 409 10.485 13.349 24.074 1.00 0.00 H +HETATM 1035 H2 HOH A 409 9.534 12.912 22.975 1.00 0.00 H +HETATM 1036 O HOH A 410 -7.039 27.560 12.371 1.00 76.53 O +HETATM 1037 H1 HOH A 410 -7.871 27.092 12.461 1.00 0.00 H +HETATM 1038 H2 HOH A 410 -6.381 26.862 12.283 1.00 0.00 H +HETATM 1039 O HOH A 411 10.636 15.015 28.679 1.00 79.82 O +HETATM 1040 H1 HOH A 411 10.754 14.224 29.205 1.00 0.00 H +HETATM 1041 H2 HOH A 411 9.685 15.085 28.566 1.00 0.00 H +HETATM 1042 O HOH A 412 -5.406 19.815 21.604 1.00 67.01 O +HETATM 1043 H1 HOH A 412 -5.059 20.294 22.359 1.00 0.00 H +HETATM 1044 H2 HOH A 412 -5.402 18.897 21.884 1.00 0.00 H +HETATM 1045 O HOH A 413 0.948 26.025 18.289 1.00 28.37 O +HETATM 1046 H1 HOH A 413 1.360 25.442 18.933 1.00 0.00 H +HETATM 1047 H2 HOH A 413 1.280 26.901 18.518 1.00 0.00 H +HETATM 1048 O HOH A 414 2.348 27.103 21.691 1.00 40.51 O +HETATM 1049 H1 HOH A 414 2.244 26.285 21.195 1.00 0.00 H +HETATM 1050 H2 HOH A 414 2.771 27.701 21.073 1.00 0.00 H +HETATM 1051 O HOH A 415 1.783 28.751 19.142 1.00 45.14 O +HETATM 1052 H1 HOH A 415 2.466 29.079 19.741 1.00 0.00 H +HETATM 1053 H2 HOH A 415 1.057 29.370 19.247 1.00 0.00 H +HETATM 1054 O HOH A 416 -1.813 27.629 17.603 1.00 63.33 O +HETATM 1055 H1 HOH A 416 -0.906 27.508 17.899 1.00 0.00 H +HETATM 1056 H2 HOH A 416 -1.823 28.521 17.231 1.00 0.00 H +HETATM 1057 O HOH A 417 0.364 33.475 10.829 1.00 43.72 O +HETATM 1058 H1 HOH A 417 -0.450 33.139 10.448 1.00 0.00 H +HETATM 1059 H2 HOH A 417 0.123 33.712 11.729 1.00 0.00 H +HETATM 1060 O HOH A 418 3.290 35.799 10.789 1.00 45.96 O +HETATM 1061 H1 HOH A 418 2.521 35.871 11.354 1.00 0.00 H +HETATM 1062 H2 HOH A 418 2.954 36.032 9.910 1.00 0.00 H +HETATM 1063 O HOH A 419 8.914 16.633 -7.731 1.00 47.58 O +HETATM 1064 H1 HOH A 419 8.580 16.211 -8.527 1.00 0.00 H +HETATM 1065 H2 HOH A 419 9.739 17.055 -8.014 1.00 0.00 H +HETATM 1066 O HOH A 420 16.804 28.181 7.657 1.00 52.61 O +HETATM 1067 H1 HOH A 420 17.349 28.921 7.925 1.00 0.00 H +HETATM 1068 H2 HOH A 420 17.428 27.548 7.300 1.00 0.00 H +HETATM 1069 O HOH A 421 4.841 5.174 7.671 1.00 54.02 O +HETATM 1070 H1 HOH A 421 4.992 4.811 6.796 1.00 0.00 H +HETATM 1071 H2 HOH A 421 3.969 5.585 7.610 1.00 0.00 H +HETATM 1072 O HOH A 422 6.123 12.466 6.644 1.00 38.59 O +HETATM 1073 H1 HOH A 422 6.354 11.569 6.880 1.00 0.00 H +HETATM 1074 H2 HOH A 422 5.242 12.393 6.258 1.00 0.00 H +HETATM 1075 O HOH A 423 3.623 12.224 6.231 1.00 46.24 O +HETATM 1076 H1 HOH A 423 3.260 11.491 6.732 1.00 0.00 H +HETATM 1077 H2 HOH A 423 3.150 12.995 6.560 1.00 0.00 H +HETATM 1078 O HOH A 424 8.696 11.998 9.005 1.00 59.93 O +HETATM 1079 H1 HOH A 424 7.734 12.042 9.009 1.00 0.00 H +HETATM 1080 H2 HOH A 424 8.947 12.160 9.914 1.00 0.00 H +HETATM 1081 O HOH A 425 8.405 9.129 7.648 1.00 61.20 O +HETATM 1082 H1 HOH A 425 9.210 8.614 7.550 1.00 0.00 H +HETATM 1083 H2 HOH A 425 8.701 9.956 8.049 1.00 0.00 H +HETATM 1084 O HOH A 426 18.447 13.535 15.604 1.00 34.60 O +HETATM 1085 H1 HOH A 426 18.325 12.712 16.083 1.00 0.00 H +HETATM 1086 H2 HOH A 426 17.838 13.470 14.861 1.00 0.00 H +HETATM 1087 O HOH A 427 12.794 20.256 3.954 1.00 62.89 O +HETATM 1088 H1 HOH A 427 13.638 20.705 4.102 1.00 0.00 H +HETATM 1089 H2 HOH A 427 13.034 19.453 3.487 1.00 0.00 H +HETATM 1090 O HOH A 428 8.847 19.809 0.651 1.00 65.07 O +HETATM 1091 H1 HOH A 428 8.427 19.180 1.242 1.00 0.00 H +HETATM 1092 H2 HOH A 428 8.764 20.651 1.101 1.00 0.00 H +HETATM 1093 O HOH A 429 -2.878 19.586 20.641 1.00 55.95 O +HETATM 1094 H1 HOH A 429 -3.712 19.246 20.304 1.00 0.00 H +HETATM 1095 H2 HOH A 429 -2.949 20.533 20.530 1.00 0.00 H +HETATM 1096 O HOH A 430 -3.389 10.814 2.153 1.00 68.44 O +HETATM 1097 H1 HOH A 430 -3.370 10.574 1.223 1.00 0.00 H +HETATM 1098 H2 HOH A 430 -2.731 11.518 2.225 1.00 0.00 H +HETATM 1099 O HOH A 431 7.974 6.841 9.094 1.00 81.57 O +HETATM 1100 H1 HOH A 431 7.873 7.036 8.159 1.00 0.00 H +HETATM 1101 H2 HOH A 431 7.642 5.943 9.185 1.00 0.00 H +HETATM 1102 O HOH A 432 8.985 13.925 -7.061 1.00 46.17 O +HETATM 1103 H1 HOH A 432 9.892 13.636 -6.937 1.00 0.00 H +HETATM 1104 H2 HOH A 432 9.045 14.887 -7.113 1.00 0.00 H +HETATM 1105 O HOH A 433 11.459 17.807 -8.216 1.00 61.98 O +HETATM 1106 H1 HOH A 433 12.207 17.850 -7.615 1.00 0.00 H +HETATM 1107 H2 HOH A 433 11.478 18.651 -8.675 1.00 0.00 H +HETATM 1108 O HOH A 434 -10.484 15.879 5.891 1.00 49.08 O +HETATM 1109 H1 HOH A 434 -10.763 16.064 4.990 1.00 0.00 H +HETATM 1110 H2 HOH A 434 -11.213 16.190 6.431 1.00 0.00 H +HETATM 1111 O HOH A 435 12.930 13.009 26.185 1.00 43.86 O +HETATM 1112 H1 HOH A 435 12.963 13.330 27.087 1.00 0.00 H +HETATM 1113 H2 HOH A 435 13.476 13.625 25.694 1.00 0.00 H +HETATM 1114 O HOH A 436 -3.464 25.858 19.747 1.00 63.70 O +HETATM 1115 H1 HOH A 436 -3.471 26.403 18.954 1.00 0.00 H +HETATM 1116 H2 HOH A 436 -2.587 25.992 20.114 1.00 0.00 H +HETATM 1117 O HOH A 437 6.235 16.677 28.203 1.00 68.03 O +HETATM 1118 H1 HOH A 437 6.291 17.517 28.663 1.00 0.00 H +HETATM 1119 H2 HOH A 437 5.340 16.667 27.835 1.00 0.00 H +HETATM 1120 O HOH A 438 7.423 17.512 -10.650 1.00 57.40 O +HETATM 1121 H1 HOH A 438 7.010 16.951 -9.986 1.00 0.00 H +HETATM 1122 H2 HOH A 438 7.702 16.894 -11.334 1.00 0.00 H +HETATM 1123 O HOH A 439 -5.355 10.866 19.619 1.00 51.92 O +HETATM 1124 H1 HOH A 439 -6.252 10.945 19.294 1.00 0.00 H +HETATM 1125 H2 HOH A 439 -4.871 11.550 19.149 1.00 0.00 H +HETATM 1126 O HOH A 440 -8.867 11.724 17.801 1.00 59.09 O +HETATM 1127 H1 HOH A 440 -8.909 12.448 18.427 1.00 0.00 H +HETATM 1128 H2 HOH A 440 -9.457 11.061 18.162 1.00 0.00 H +HETATM 1129 O HOH A 441 13.107 15.120 7.186 1.00 56.17 O +HETATM 1130 H1 HOH A 441 12.362 15.432 7.708 1.00 0.00 H +HETATM 1131 H2 HOH A 441 13.869 15.225 7.770 1.00 0.00 H +HETATM 1132 O HOH A 442 -2.200 10.629 25.072 1.00 84.96 O +HETATM 1133 H1 HOH A 442 -1.698 11.431 25.238 1.00 0.00 H +HETATM 1134 H2 HOH A 442 -3.040 10.942 24.729 1.00 0.00 H +HETATM 1135 O HOH A 444 1.798 36.196 8.660 1.00 69.55 O +HETATM 1136 H1 HOH A 444 2.171 36.075 7.775 1.00 0.00 H +HETATM 1137 H2 HOH A 444 1.186 35.465 8.757 1.00 0.00 H +HETATM 1138 O HOH A 446 12.829 16.619 28.388 1.00 76.91 O +HETATM 1139 H1 HOH A 446 12.031 17.139 28.283 1.00 0.00 H +HETATM 1140 H2 HOH A 446 12.511 15.764 28.684 1.00 0.00 H +HETATM 1141 O HOH A 447 -1.714 7.995 25.869 1.00 53.32 O +HETATM 1142 H1 HOH A 447 -1.215 7.807 25.076 1.00 0.00 H +HETATM 1143 H2 HOH A 447 -1.895 8.941 25.818 1.00 0.00 H +HETATM 1144 O HOH A 449 17.342 21.354 17.381 1.00 78.08 O +HETATM 1145 H1 HOH A 449 17.257 20.526 17.868 1.00 0.00 H +HETATM 1146 H2 HOH A 449 17.020 22.020 17.988 1.00 0.00 H +HETATM 1147 O HOH A 450 17.554 22.356 21.606 1.00 81.11 O +HETATM 1148 H1 HOH A 450 17.863 21.463 21.445 1.00 0.00 H +HETATM 1149 H2 HOH A 450 18.333 22.902 21.491 1.00 0.00 H +HETATM 1150 O HOH A 451 21.261 19.604 17.525 1.00 60.20 O +HETATM 1151 H1 HOH A 451 21.971 20.078 17.088 1.00 0.00 H +HETATM 1152 H2 HOH A 451 20.490 20.166 17.407 1.00 0.00 H +HETATM 1153 O HOH A 452 20.618 19.027 20.159 1.00 71.08 O +HETATM 1154 H1 HOH A 452 20.831 19.188 19.232 1.00 0.00 H +HETATM 1155 H2 HOH A 452 21.279 18.398 20.447 1.00 0.00 H +HETATM 1156 O HOH A 454 3.691 16.091 27.806 1.00 75.85 O +HETATM 1157 H1 HOH A 454 3.113 15.469 27.354 1.00 0.00 H +HETATM 1158 H2 HOH A 454 3.644 15.832 28.729 1.00 0.00 H +HETATM 1159 O HOH A 456 17.778 15.979 4.727 1.00 87.15 O +HETATM 1160 H1 HOH A 456 17.578 15.048 4.815 1.00 0.00 H +HETATM 1161 H2 HOH A 456 17.841 16.297 5.638 1.00 0.00 H +HETATM 1162 O HOH A 457 2.784 6.732 0.413 1.00 58.64 O +HETATM 1163 H1 HOH A 457 3.270 6.190 1.038 1.00 0.00 H +HETATM 1164 H2 HOH A 457 2.569 6.134 -0.304 1.00 0.00 H +HETATM 1165 O HOH A 458 6.812 6.267 3.872 1.00 78.10 O +HETATM 1166 H1 HOH A 458 6.068 6.869 3.796 1.00 0.00 H +HETATM 1167 H2 HOH A 458 7.515 6.697 3.386 1.00 0.00 H +HETATM 1168 O HOH A 459 11.360 23.250 27.379 1.00 91.15 O +HETATM 1169 H1 HOH A 459 10.875 24.075 27.257 1.00 0.00 H +HETATM 1170 H2 HOH A 459 11.895 23.176 26.588 1.00 0.00 H +HETATM 1171 O HOH A 460 11.533 21.478 -4.909 1.00 61.19 O +HETATM 1172 H1 HOH A 460 11.125 21.466 -4.035 1.00 0.00 H +HETATM 1173 H2 HOH A 460 11.171 22.260 -5.324 1.00 0.00 H +HETATM 1174 O HOH A 461 -2.761 38.231 3.181 1.00 84.62 O +HETATM 1175 H1 HOH A 461 -1.871 38.468 3.455 1.00 0.00 H +HETATM 1176 H2 HOH A 461 -2.645 37.814 2.327 1.00 0.00 H +HETATM 1177 O HOH A 462 -5.015 39.320 4.311 1.00 88.70 O +HETATM 1178 H1 HOH A 462 -4.698 40.216 4.219 1.00 0.00 H +HETATM 1179 H2 HOH A 462 -4.298 38.779 3.950 1.00 0.00 H +HETATM 1180 O HOH A 463 10.179 21.307 3.687 1.00 49.11 O +HETATM 1181 H1 HOH A 463 9.722 21.057 4.495 1.00 0.00 H +HETATM 1182 H2 HOH A 463 11.079 20.973 3.815 1.00 0.00 H +HETATM 1183 O HOH A 464 -1.283 31.486 14.715 1.00 75.28 O +HETATM 1184 H1 HOH A 464 -0.458 31.251 14.289 1.00 0.00 H +HETATM 1185 H2 HOH A 464 -1.540 30.684 15.190 1.00 0.00 H +HETATM 1186 O HOH A 465 -3.174 28.185 6.783 1.00 76.66 O +HETATM 1187 H1 HOH A 465 -3.814 28.666 7.321 1.00 0.00 H +HETATM 1188 H2 HOH A 465 -3.169 28.650 5.944 1.00 0.00 H +HETATM 1189 O HOH A 466 -5.798 24.608 20.375 1.00 86.02 O +HETATM 1190 H1 HOH A 466 -5.419 23.785 20.680 1.00 0.00 H +HETATM 1191 H2 HOH A 466 -5.032 25.168 20.192 1.00 0.00 H +HETATM 1192 O HOH A 467 -10.433 22.178 -0.029 1.00 70.77 O +HETATM 1193 H1 HOH A 467 -10.696 21.582 0.672 1.00 0.00 H +HETATM 1194 H2 HOH A 467 -9.472 22.144 -0.019 1.00 0.00 H +HETATM 1195 O HOH A 468 -12.736 19.373 14.748 1.00 67.61 O +HETATM 1196 H1 HOH A 468 -13.404 19.567 14.089 1.00 0.00 H +HETATM 1197 H2 HOH A 468 -12.581 20.211 15.186 1.00 0.00 H +HETATM 1198 O HOH A 469 -12.719 15.279 19.686 1.00 72.04 O +HETATM 1199 H1 HOH A 469 -11.938 15.746 19.984 1.00 0.00 H +HETATM 1200 H2 HOH A 469 -12.734 14.477 20.208 1.00 0.00 H +HETATM 1201 O HOH A 470 14.152 20.306 23.565 1.00 67.11 O +HETATM 1202 H1 HOH A 470 14.822 20.685 24.137 1.00 0.00 H +HETATM 1203 H2 HOH A 470 14.616 19.594 23.101 1.00 0.00 H +HETATM 1204 O HOH A 471 13.538 23.641 18.923 1.00 71.61 O +HETATM 1205 H1 HOH A 471 13.182 23.149 18.177 1.00 0.00 H +HETATM 1206 H2 HOH A 471 13.920 22.968 19.489 1.00 0.00 H +HETATM 1207 O HOH A 472 -2.426 22.296 24.456 1.00 58.68 O +HETATM 1208 H1 HOH A 472 -1.824 21.550 24.486 1.00 0.00 H +HETATM 1209 H2 HOH A 472 -2.172 22.837 25.206 1.00 0.00 H +HETATM 1210 O HOH A 473 -4.196 19.616 27.496 1.00 73.73 O +HETATM 1211 H1 HOH A 473 -4.186 20.369 28.087 1.00 0.00 H +HETATM 1212 H2 HOH A 473 -3.490 19.052 27.815 1.00 0.00 H +HETATM 1213 O HOH A 474 -3.309 5.980 5.845 1.00 68.19 O +HETATM 1214 H1 HOH A 474 -3.838 5.345 6.332 1.00 0.00 H +HETATM 1215 H2 HOH A 474 -3.906 6.325 5.178 1.00 0.00 H +HETATM 1216 O HOH A 475 17.838 23.280 1.198 1.00 77.31 O +HETATM 1217 H1 HOH A 475 18.005 22.946 2.080 1.00 0.00 H +HETATM 1218 H2 HOH A 475 16.886 23.249 1.107 1.00 0.00 H +HETATM 1219 O HOH A 476 10.307 16.081 6.990 1.00 59.61 O +HETATM 1220 H1 HOH A 476 10.750 16.852 7.367 1.00 0.00 H +HETATM 1221 H2 HOH A 476 10.894 15.787 6.290 1.00 0.00 H +HETATM 1222 O HOH A 477 11.355 23.439 4.466 1.00 66.34 O +HETATM 1223 H1 HOH A 477 10.901 22.829 3.870 1.00 0.00 H +HETATM 1224 H2 HOH A 477 12.059 23.808 3.935 1.00 0.00 H +HETATM 1225 O HOH A 478 17.221 12.554 13.119 1.00 53.33 O +HETATM 1226 H1 HOH A 478 17.675 13.340 12.793 1.00 0.00 H +HETATM 1227 H2 HOH A 478 17.910 11.893 13.189 1.00 0.00 H +HETATM 1228 O HOH A 479 6.483 28.190 5.603 1.00 90.05 O +HETATM 1229 H1 HOH A 479 6.350 28.405 4.680 1.00 0.00 H +HETATM 1230 H2 HOH A 479 6.782 27.278 5.595 1.00 0.00 H +HETATM 1231 O HOH A 480 -1.050 28.108 4.394 1.00 85.46 O +HETATM 1232 H1 HOH A 480 -0.904 27.942 5.328 1.00 0.00 H +HETATM 1233 H2 HOH A 480 -0.405 28.792 4.169 1.00 0.00 H +HETATM 1234 O HOH A 481 7.764 6.413 14.803 1.00 47.44 O +HETATM 1235 H1 HOH A 481 7.927 7.153 15.390 1.00 0.00 H +HETATM 1236 H2 HOH A 481 7.543 6.819 13.965 1.00 0.00 H +HETATM 1237 O HOH A 482 -1.304 30.550 17.203 1.00 47.05 O +HETATM 1238 H1 HOH A 482 -2.121 30.831 17.619 1.00 0.00 H +HETATM 1239 H2 HOH A 482 -0.966 31.348 16.785 1.00 0.00 H +HETATM 1240 O HOH A 484 3.582 11.825 -5.019 1.00 54.04 O +HETATM 1241 H1 HOH A 484 4.118 12.609 -4.883 1.00 0.00 H +HETATM 1242 H2 HOH A 484 2.776 12.157 -5.424 1.00 0.00 H +HETATM 1243 O HOH A 485 10.477 17.818 1.534 1.00 52.39 O +HETATM 1244 H1 HOH A 485 10.080 18.415 0.889 1.00 0.00 H +HETATM 1245 H2 HOH A 485 11.050 18.380 2.054 1.00 0.00 H +HETATM 1246 O HOH A 486 8.350 13.220 -2.518 1.00 51.86 O +HETATM 1247 H1 HOH A 486 7.500 12.811 -2.685 1.00 0.00 H +HETATM 1248 H2 HOH A 486 8.871 13.018 -3.295 1.00 0.00 H +HETATM 1249 O HOH A 487 10.766 31.335 -1.067 1.00 53.16 O +HETATM 1250 H1 HOH A 487 9.819 31.209 -0.984 1.00 0.00 H +HETATM 1251 H2 HOH A 487 11.147 30.557 -0.661 1.00 0.00 H +HETATM 1252 O HOH A 488 -1.322 36.803 5.890 1.00 51.31 O +HETATM 1253 H1 HOH A 488 -2.260 36.695 6.053 1.00 0.00 H +HETATM 1254 H2 HOH A 488 -0.911 36.077 6.358 1.00 0.00 H +HETATM 1255 O HOH A 489 -8.558 12.902 5.180 1.00 53.15 O +HETATM 1256 H1 HOH A 489 -8.421 13.507 4.441 1.00 0.00 H +HETATM 1257 H2 HOH A 489 -9.446 12.564 5.045 1.00 0.00 H +MASTER 234 0 0 4 5 0 0 6 1256 1 0 8 +END diff --git a/data/2F1C.fa b/data/2F1C.fa index f7eac38..5281bb4 100644 --- a/data/2F1C.fa +++ b/data/2F1C.fa @@ -1,5 +1,5 @@ ->2F1C:X|PDBID|CHAIN|SEQUENCE -EERNDWHFNIGAMYEIENVEGYGEDMDGLAEPSVYFNAANGPWRIALAYYQEGPVDYSAGKRGTWFDRPELEVHYQFLEN -DDFSFGLTGGFRNYGYHYVDEPGKDTANMQRWKIAPDWDVKLTDDLRFNGWLSMYKFANDLNTTGYADTRVETETGLQYT -FNETVALRVNYYLERGFNMDDSRNNGEFSTQEIRAYLPLTLGNHSVTPYTRIGLDRWSNWDWQDDIEREGHDFNRVGLFY +>2F1C:X|PDBID|CHAIN|SEQUENCE +EERNDWHFNIGAMYEIENVEGYGEDMDGLAEPSVYFNAANGPWRIALAYYQEGPVDYSAGKRGTWFDRPELEVHYQFLEN +DDFSFGLTGGFRNYGYHYVDEPGKDTANMQRWKIAPDWDVKLTDDLRFNGWLSMYKFANDLNTTGYADTRVETETGLQYT +FNETVALRVNYYLERGFNMDDSRNNGEFSTQEIRAYLPLTLGNHSVTPYTRIGLDRWSNWDWQDDIEREGHDFNRVGLFY GYDFQNGLSVSLEYAFEWQDHDEGDSDKFHYAGVGVNYSFHHHHHH \ No newline at end of file diff --git a/data/3FG7.fa b/data/3FG7.fa index aa22c46..5fb7df0 100644 --- a/data/3FG7.fa +++ b/data/3FG7.fa @@ -1,6 +1,6 @@ ->3FG7:A|PDBID|CHAIN|SEQUENCE -MAEEHHHHHHHHLEVLFQGPGRPKTHTVGSVAKVEQVKFDATSMHVKPQVAAQQKMVDDGSGEVQVWRIENLELVPVDSK -WLGHFYGGDCYLLLYTYLIGEKQHYLLYVWQGSQASQDEITASAYQAVILDQKYNGEPVQIRVPMGKEPPHLMSIFKGRM -VVYQGGTSRTNNLETGPSTRLFQVQGTGANNTKAFEVPARANFLNSNDVFVLKTQSCCYLWCGKGCSGDEREMAKMVADT -ISRTEKQVVVEGQEPANFWMALGGKAPYANTKRLQEENLVITPRLFECSNKTGRFLATEIPDFNQDDLEEDDVFLLDVWD -QVFFWIGKHANEEEKKAAATTAQEYLKTHPSGRDPETPIIVVKQGHEPPTFTGWFLAWDPFKWSGIHVVPNLSPLSNN +>3FG7:A|PDBID|CHAIN|SEQUENCE +MAEEHHHHHHHHLEVLFQGPGRPKTHTVGSVAKVEQVKFDATSMHVKPQVAAQQKMVDDGSGEVQVWRIENLELVPVDSK +WLGHFYGGDCYLLLYTYLIGEKQHYLLYVWQGSQASQDEITASAYQAVILDQKYNGEPVQIRVPMGKEPPHLMSIFKGRM +VVYQGGTSRTNNLETGPSTRLFQVQGTGANNTKAFEVPARANFLNSNDVFVLKTQSCCYLWCGKGCSGDEREMAKMVADT +ISRTEKQVVVEGQEPANFWMALGGKAPYANTKRLQEENLVITPRLFECSNKTGRFLATEIPDFNQDDLEEDDVFLLDVWD +QVFFWIGKHANEEEKKAAATTAQEYLKTHPSGRDPETPIIVVKQGHEPPTFTGWFLAWDPFKWSGIHVVPNLSPLSNN diff --git a/data/MBP1_SACCE.json b/data/MBP1_SACCE.json index 56e91a3..46c695f 100644 --- a/data/MBP1_SACCE.json +++ b/data/MBP1_SACCE.json @@ -1,20 +1,20 @@ -[ - { "name" : "MBP1_SACCE", - "RefSeqID" : "NP_010227", - "UniProtID" : "P39678", - "taxonomyID" : 559292, - "sequence" : [ - "MSNQIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRILEKEVLKETHEKVQGGF", - "GKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASPPPAPKHHHASKVDRKKAIRSASTSAIMET", - "KRNNKKAEENQFQSSKILGNPTAAPRKRGRPVGSTRGSRRKLGVNLQRSQSDMGFPRPAIPNSSISTTQL", - "PSIRSTMGPQSPTLGILEEERHDSRQQQPQQNNSAQFKEIDLEDGLSSDVEPSQQLQQVFNQNTGFVPQQ", - "QSSLIQTQQTESMATSVSSSPSLPTSPGDFADSNPFEERFPGGGTSPIISMIPRYPVTSRPQTSDINDKV", - "NKYLSKLVDYFISNEMKSNKSLPQVLLHPPPHSAPYIDAPIDPELHTAFHWACSMGNLPIAEALYEAGTS", - "IRSTNSQGQTPLMRSSLFHNSYTRRTFPRIFQLLHETVFDIDSQSQTVIHHIVKRKSTTPSAVYYLDVVL", - "SKIKDFSPQYRIELLLNTQDKNGDTALHIASKNGDVVFFNTLVKMGALTTISNKEGLTANEIMNQQYEQM", - "MIQNGTNQHVNSSNTDLNIHVNTNNIETKNDVNSMVIMSPVSPSDYITYPSQIATNISRNIPNVVNSMKQ", - "MASIYNDLHEQHDNEIKSLQKTLKSISKTKIQVSLKTLEVLKESSKDENGEAQTNDDFEILSRLQEQNTK", - "KLRKRLIRYKRLIKQKLEYRQTVLLNKLIEDETQATTNNTVEKDNNTLERLELAQELTMLQLQRKNKLSS", - "LVKKFEDNAKIHKYRRIIREGTEMNIEEVDSSLDVILQTLIANNNKNKGAEQIITISNANSHA"] - } -] +[ + { "name" : "MBP1_SACCE", + "RefSeqID" : "NP_010227", + "UniProtID" : "P39678", + "taxonomyID" : 559292, + "sequence" : [ + "MSNQIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRILEKEVLKETHEKVQGGF", + "GKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASPPPAPKHHHASKVDRKKAIRSASTSAIMET", + "KRNNKKAEENQFQSSKILGNPTAAPRKRGRPVGSTRGSRRKLGVNLQRSQSDMGFPRPAIPNSSISTTQL", + "PSIRSTMGPQSPTLGILEEERHDSRQQQPQQNNSAQFKEIDLEDGLSSDVEPSQQLQQVFNQNTGFVPQQ", + "QSSLIQTQQTESMATSVSSSPSLPTSPGDFADSNPFEERFPGGGTSPIISMIPRYPVTSRPQTSDINDKV", + "NKYLSKLVDYFISNEMKSNKSLPQVLLHPPPHSAPYIDAPIDPELHTAFHWACSMGNLPIAEALYEAGTS", + "IRSTNSQGQTPLMRSSLFHNSYTRRTFPRIFQLLHETVFDIDSQSQTVIHHIVKRKSTTPSAVYYLDVVL", + "SKIKDFSPQYRIELLLNTQDKNGDTALHIASKNGDVVFFNTLVKMGALTTISNKEGLTANEIMNQQYEQM", + "MIQNGTNQHVNSSNTDLNIHVNTNNIETKNDVNSMVIMSPVSPSDYITYPSQIATNISRNIPNVVNSMKQ", + "MASIYNDLHEQHDNEIKSLQKTLKSISKTKIQVSLKTLEVLKESSKDENGEAQTNDDFEILSRLQEQNTK", + "KLRKRLIRYKRLIKQKLEYRQTVLLNKLIEDETQATTNNTVEKDNNTLERLELAQELTMLQLQRKNKLSS", + "LVKKFEDNAKIHKYRRIIREGTEMNIEEVDSSLDVILQTLIANNNKNKGAEQIITISNANSHA"] + } +] diff --git a/data/PTPN5_HSa_coding.fa b/data/PTPN5_HSa_coding.fa index 4a11b7e..3337caf 100644 --- a/data/PTPN5_HSa_coding.fa +++ b/data/PTPN5_HSa_coding.fa @@ -1,30 +1,30 @@ ->PTPN5-201 cds:protein_coding (ENST00000358540.7) -ATGAATTATGAGGGAGCCAGGAGTGAGAGAGAGAACCACGCTGCTGATGACTCCGAGGGA -GGGGCCCTGGACATGTGCTGCAGTGAGAGGCTACCGGGTCTCCCCCAGCCGATAGTGATG -GAGGCACTGGACGAGGCTGAAGGGCTCCAGGACTCACAGAGAGAGATGCCGCCACCCCCT -CCTCCCTCGCCGCCCTCAGATCCAGCTCAGAAGCCACCACCTCGAGGCGCTGGGAGCCAC -TCCCTCACTGTCAGGAGCAGCCTGTGCCTGTTCGCTGCCTCACAGTTCCTGCTTGCCTGT -GGGGTGCTCTGGTTCAGCGGTTATGGCCACATCTGGTCACAGAACGCCACAAACCTCGTC -TCCTCTTTGCTGACGCTCCTGAAACAGCTGGAACCCACGGCCTGGCTTGACTCTGGGACG -TGGGGAGTCCCCAGTCTGCTGCTGGTCTTTCTGTCCGTGGGCCTGGTCCTCGTTACCACC -CTGGTGTGGCACCTCCTGAGGACACCCCCAGAGCCACCCACCCCACTGCCCCCTGAGGAC -AGGCGCCAGTCAGTGAGCCGCCAGCCCTCCTTCACCTACTCAGAGTGGATGGAGGAGAAG -ATCGAGGATGACTTCCTGGACCTCGACCCGGTGCCCGAGACTCCTGTGTTTGATTGTGTG -ATGGACATCAAGCCTGAGGCTGACCCCACCTCACTCACCGTCAAGTCCATGGGTCTGCAG -GAGAGGAGGGGTTCCAATGTCTCCCTGACCCTGGACATGTGCACTCCGGGCTGCAACGAG -GAGGGCTTTGGCTATCTCATGTCCCCACGTGAGGAGTCCGCCCGCGAGTACCTGCTCAGC -GCCTCCCGTGTCCTCCAAGCAGAAGAGCTTCATGAAAAGGCCCTGGACCCTTTCCTGCTG -CAGGCGGAATTCTTTGAAATCCCCATGAACTTTGTGGATCCGAAAGAGTACGACATCCCT -GGGCTGGTGCGGAAGAACCGGTACAAAACCATACTTCCCAACCCTCACAGCAGAGTGTGT -CTGACCTCACCAGACCCTGACGACCCTCTGAGTTCCTACATCAATGCCAACTACATCCGG -GGCTATGGTGGGGAGGAGAAGGTGTACATCGCCACTCAGGGACCCATCGTCAGCACGGTC -GCCGACTTCTGGCGCATGGTGTGGCAGGAGCACACGCCCATCATTGTCATGATCACCAAC -ATCGAGGAGATGAACGAGAAATGCACCGAGTATTGGCCGGAGGAGCAGGTGGCGTACGAC -GGTGTTGAGATCACTGTGCAGAAAGTCATTCACACGGAGGATTACCGGCTGCGACTCATC -TCCCTCAAGAGTGGGACTGAGGAGCGAGGCCTGAAGCATTACTGGTTCACATCCTGGCCC -GACCAGAAGACCCCAGACCGGGCCCCCCCACTCCTGCACCTGGTGCGGGAGGTGGAGGAG -GCAGCCCAGCAGGAGGGGCCCCACTGTGCCCCCATCATCGTCCACTGCAGTGCAGGGATT -GGGAGGACCGGCTGCTTCATTGCCACCAGCATCTGCTGCCAGCAGCTGCGGCAGGAGGGT -GTGGTGGACATCCTGAAGACCACGTGCCAGCTCCGTCAGGACAGGGGCGGCATGATCCAG -ACATGCGAGCAGTACCAGTTTGTGCACCACGTCATGAGCCTCTACGAAAAGCAGCTGTCC -CACCAGTCCCCAGAATGA +>PTPN5-201 cds:protein_coding (ENST00000358540.7) +ATGAATTATGAGGGAGCCAGGAGTGAGAGAGAGAACCACGCTGCTGATGACTCCGAGGGA +GGGGCCCTGGACATGTGCTGCAGTGAGAGGCTACCGGGTCTCCCCCAGCCGATAGTGATG +GAGGCACTGGACGAGGCTGAAGGGCTCCAGGACTCACAGAGAGAGATGCCGCCACCCCCT +CCTCCCTCGCCGCCCTCAGATCCAGCTCAGAAGCCACCACCTCGAGGCGCTGGGAGCCAC +TCCCTCACTGTCAGGAGCAGCCTGTGCCTGTTCGCTGCCTCACAGTTCCTGCTTGCCTGT +GGGGTGCTCTGGTTCAGCGGTTATGGCCACATCTGGTCACAGAACGCCACAAACCTCGTC +TCCTCTTTGCTGACGCTCCTGAAACAGCTGGAACCCACGGCCTGGCTTGACTCTGGGACG +TGGGGAGTCCCCAGTCTGCTGCTGGTCTTTCTGTCCGTGGGCCTGGTCCTCGTTACCACC +CTGGTGTGGCACCTCCTGAGGACACCCCCAGAGCCACCCACCCCACTGCCCCCTGAGGAC +AGGCGCCAGTCAGTGAGCCGCCAGCCCTCCTTCACCTACTCAGAGTGGATGGAGGAGAAG +ATCGAGGATGACTTCCTGGACCTCGACCCGGTGCCCGAGACTCCTGTGTTTGATTGTGTG +ATGGACATCAAGCCTGAGGCTGACCCCACCTCACTCACCGTCAAGTCCATGGGTCTGCAG +GAGAGGAGGGGTTCCAATGTCTCCCTGACCCTGGACATGTGCACTCCGGGCTGCAACGAG +GAGGGCTTTGGCTATCTCATGTCCCCACGTGAGGAGTCCGCCCGCGAGTACCTGCTCAGC +GCCTCCCGTGTCCTCCAAGCAGAAGAGCTTCATGAAAAGGCCCTGGACCCTTTCCTGCTG +CAGGCGGAATTCTTTGAAATCCCCATGAACTTTGTGGATCCGAAAGAGTACGACATCCCT +GGGCTGGTGCGGAAGAACCGGTACAAAACCATACTTCCCAACCCTCACAGCAGAGTGTGT +CTGACCTCACCAGACCCTGACGACCCTCTGAGTTCCTACATCAATGCCAACTACATCCGG +GGCTATGGTGGGGAGGAGAAGGTGTACATCGCCACTCAGGGACCCATCGTCAGCACGGTC +GCCGACTTCTGGCGCATGGTGTGGCAGGAGCACACGCCCATCATTGTCATGATCACCAAC +ATCGAGGAGATGAACGAGAAATGCACCGAGTATTGGCCGGAGGAGCAGGTGGCGTACGAC +GGTGTTGAGATCACTGTGCAGAAAGTCATTCACACGGAGGATTACCGGCTGCGACTCATC +TCCCTCAAGAGTGGGACTGAGGAGCGAGGCCTGAAGCATTACTGGTTCACATCCTGGCCC +GACCAGAAGACCCCAGACCGGGCCCCCCCACTCCTGCACCTGGTGCGGGAGGTGGAGGAG +GCAGCCCAGCAGGAGGGGCCCCACTGTGCCCCCATCATCGTCCACTGCAGTGCAGGGATT +GGGAGGACCGGCTGCTTCATTGCCACCAGCATCTGCTGCCAGCAGCTGCGGCAGGAGGGT +GTGGTGGACATCCTGAAGACCACGTGCCAGCTCCGTCAGGACAGGGGCGGCATGATCCAG +ACATGCGAGCAGTACCAGTTTGTGCACCACGTCATGAGCCTCTACGAAAAGCAGCTGTCC +CACCAGTCCCCAGAATGA diff --git a/data/RAB39B_HSa_coding.fa b/data/RAB39B_HSa_coding.fa index 2e6e3d8..4d0dd37 100644 --- a/data/RAB39B_HSa_coding.fa +++ b/data/RAB39B_HSa_coding.fa @@ -1,12 +1,12 @@ ->RAB39B cds:protein_coding (ENST00000369454.4) -ATGGAGGCCATCTGGCTGTACCAGTTCCGGCTCATTGTCATCGGGGATTCCACAGTGGGC -AAGTCCTGCCTGATCCGCCGCTTCACCGAGGGTCGCTTTGCCCAGGTTTCTGACCCCACC -GTGGGGGTGGATTTTTTCTCCCGCTTGGTGGAGATCGAGCCAGGAAAACGCATCAAGCTC -CAGATCTGGGATACCGCGGGTCAAGAGAGGTTCAGATCCATCACTCGCGCCTACTACAGG -AACTCAGTAGGTGGTCTTCTCTTATTTGACATTACCAACCGCAGGTCCTTCCAGAATGTC -CATGAGTGGTTAGAAGAGACCAAAGTACACGTTCAGCCCTACCAAATTGTATTTGTTCTG -GTGGGTCACAAGTGTGACCTGGATACACAGAGGCAAGTGACTCGCCACGAGGCCGAGAAA -CTGGCTGCTGCATACGGCATGAAGTACATTGAAACGTCAGCCCGAGATGCCATTAATGTG -GAGAAAGCCTTCACAGACCTGACAAGAGACATATATGAGCTGGTTAAAAGGGGGGAGATT -ACAATCCAGGAGGGCTGGGAAGGGGTGAAGAGTGGATTTGTACCAAATGTGGTTCACTCT -TCAGAAGAGGTTGTCAAATCAGAGAGGAGATGTTTGTGCTAG +>RAB39B cds:protein_coding (ENST00000369454.4) +ATGGAGGCCATCTGGCTGTACCAGTTCCGGCTCATTGTCATCGGGGATTCCACAGTGGGC +AAGTCCTGCCTGATCCGCCGCTTCACCGAGGGTCGCTTTGCCCAGGTTTCTGACCCCACC +GTGGGGGTGGATTTTTTCTCCCGCTTGGTGGAGATCGAGCCAGGAAAACGCATCAAGCTC +CAGATCTGGGATACCGCGGGTCAAGAGAGGTTCAGATCCATCACTCGCGCCTACTACAGG +AACTCAGTAGGTGGTCTTCTCTTATTTGACATTACCAACCGCAGGTCCTTCCAGAATGTC +CATGAGTGGTTAGAAGAGACCAAAGTACACGTTCAGCCCTACCAAATTGTATTTGTTCTG +GTGGGTCACAAGTGTGACCTGGATACACAGAGGCAAGTGACTCGCCACGAGGCCGAGAAA +CTGGCTGCTGCATACGGCATGAAGTACATTGAAACGTCAGCCCGAGATGCCATTAATGTG +GAGAAAGCCTTCACAGACCTGACAAGAGACATATATGAGCTGGTTAAAAGGGGGGAGATT +ACAATCCAGGAGGGCTGGGAAGGGGTGAAGAGTGGATTTGTACCAAATGTGGTTCACTCT +TCAGAAGAGGTTGTCAAATCAGAGAGGAGATGTTTGTGCTAG diff --git a/data/RandomPhobiaPage.txt b/data/RandomPhobiaPage.txt index 75153c9..57296cb 100644 --- a/data/RandomPhobiaPage.txt +++ b/data/RandomPhobiaPage.txt @@ -1,131 +1,131 @@ - - -```{css, echo = FALSE} - -.striped tr:nth-child(even) { - background: #eaf1ff; -} -.striped { - padding: 5px; -} -``` -Random Phobias - .Rmd sample code for BCH441 at the University of Toronto. (c) Boris Steipe 2020 --> - - -```{r setup, include=FALSE} -knitr::opts_chunk$set(echo = TRUE) -``` - -## Phobias! ## -We all have some, but we could always use more. How to know them all? With this code we access the [Wikipedia list of phobias](https://en.wikipedia.org/wiki/List_of_phobias), scrape the contents and assemble a dataframe. Then we write a function to retrieve a random phobia, which we can subsequently ponder on - either to delight in the fact that we don't have that fear, or to add to our daily quota of anxieties (like our well-founded [fear of bad programming practice](http://xkcd.com/292/)). - -To load the list, we will "screenscrape" the contents of Wikipedia's [List of Phobias](https://en.wikipedia.org/wiki/List_of_phobias). First, we install the `rvest` library and the `xml2` library from CRAN, if we don't have it. -```{r packages} -if (! requireNamespace("rvest", quietly=TRUE)) { - install.packages("rvest") -} -if (! requireNamespace("xml2", quietly=TRUE)) { - install.packages("xml2") -} -``` -As we customarily do, we avoid using the `library()` function to make the package contents accessible, but use the `package::` syntax instead. This makes our code more explicit and maintainable. - -`xml2` handles reading and parsing of documents. The `rvest` package was designed for screenscraping and has functions to make our life very easy: it accesses the response of an `xml2` query, looks for all HTML formatted tables, parses them with an XPATH expression and returns them as lists from which we can get data frames. - -```{r getPageData, cache=TRUE} -webPage <- xml2::read_html("https://en.wikipedia.org/wiki/List_of_phobias") -allTables <- rvest::html_table(webPage, fill = TRUE) -``` - -There are ```r length(allTables)``` tables in the list, but the ones we are interested in are data frames with two columns named `Phobia` and `Condition`. - -```{r collateTables, cache=TRUE} -phobiaTable <- data.frame(Phobia = character(), Condition = character()) -for (i in seq_along(allTables)) { - df <- allTables[[i]] - if (all(colnames(df) == c("Phobia", "Condition"))) { - phobiaTable <- rbind(phobiaTable, df) - } -} -``` - -Done, we collected ```r nrow(phobiaTable)``` phobias. Let's randomly select a few and print them. - -

  -

- -```{r , ref.label="randRow", echo=FALSE} -``` - -**Table**: seven random phobias
-```{r renderPhobiaTable, echo=FALSE, results='asis'} -sel <- sample(1:nrow(phobiaTable), 7) -knitr::kable(phobiaTable[sel, ], table.attr = "class=\"striped\"", format = "html") -``` - -

  -

-To pick a single random phobia from the list, we take a (pseudo) random sample of size 1 from the number of rows in the `phobiaFrame` object. Our function thus returns a random row from a matrix or dataframe, and it uses an optional argument: `seed`. This can either be Boolean `FALSE` (the default), or an integer that is used in R's `set.seed()` function. - -```{r randRow} -randRow <- function(M, seed = FALSE) { - # Return a random row from a dataframe M. - if (seed) { - oldseed <- .Random.seed # play nice and save the RNG state ... - set.seed(as.integer(seed)) - } - r <- M[sample(1:nrow(M), 1), ] # fetch one random row - if (seed) { .Random.seed <- oldseed } # ... restore the RNG state - return(r) -} -``` -

  -

-With this useful tool we can ponder on our favourite phobia of the day. For today, let it be **`r randRow(phobiaTable, seed=1123581321)[2]`**, the `r randRow(phobiaTable, seed=1123581321)[1]`. - -_`r randRow(phobiaTable, seed=1123581321)[1]`_! Really!!? Awful. - -

  -

- -Finally: let's plot a histogram of phobia name lengths just to illustrate plots. A little preprocessing is required, since some names collate synonyms, like _"Hypnophobia, somniphobia"_. We'll break these up. - -```{r preProcess} - -# select only single-word phobias that end with "phobia" -sel <- ! grepl(" ", phobiaTable$Phobia) & grepl(".phobia$", phobiaTable$Phobia) -names <- phobiaTable$Phobia[sel] - -# extract the ones we did _not_ select -x <- phobiaTable$Phobia[! sel] -# use strsplit() to split them apart and flatten the resulting list -x <- unlist(strsplit(x, ", ")) -x <- unlist(strsplit(x, " ")) -x <- unlist(strsplit(x, "/")) -# use the same selection as above, and append the result to our "names"" -sel <- ! grepl(" ", x) & grepl(".phobia$", x) -names <- c(names, x[sel]) - -``` - -Done, we collected ```r length(names)``` names for phobias. Here is a histogram of their lengths. - -```{r showHist} - -x <- nchar(names) -pShort <- names[which(x == min(x))[1]] # pull out the shortest name ... -pLong <- names[which(x == max(x))[1]] # ... and the longest name too. -hist(x, - main = "Length of phobia-names", - sub = sprintf("Shortest: %s (%d), Longest: %s (%d)", - pShort, nchar(pShort), pLong, nchar(pLong)), - cex.sub = 0.8, - xlab = "name", - ylab = "counts", - col ="#aef5ee") - -``` - -That's all. - - + + +```{css, echo = FALSE} + +.striped tr:nth-child(even) { + background: #eaf1ff; +} +.striped { + padding: 5px; +} +``` +Random Phobias - .Rmd sample code for BCH441 at the University of Toronto. (c) Boris Steipe 2020 --> + + +```{r setup, include=FALSE} +knitr::opts_chunk$set(echo = TRUE) +``` + +## Phobias! ## +We all have some, but we could always use more. How to know them all? With this code we access the [Wikipedia list of phobias](https://en.wikipedia.org/wiki/List_of_phobias), scrape the contents and assemble a dataframe. Then we write a function to retrieve a random phobia, which we can subsequently ponder on - either to delight in the fact that we don't have that fear, or to add to our daily quota of anxieties (like our well-founded [fear of bad programming practice](http://xkcd.com/292/)). + +To load the list, we will "screenscrape" the contents of Wikipedia's [List of Phobias](https://en.wikipedia.org/wiki/List_of_phobias). First, we install the `rvest` library and the `xml2` library from CRAN, if we don't have it. +```{r packages} +if (! requireNamespace("rvest", quietly=TRUE)) { + install.packages("rvest") +} +if (! requireNamespace("xml2", quietly=TRUE)) { + install.packages("xml2") +} +``` +As we customarily do, we avoid using the `library()` function to make the package contents accessible, but use the `package::` syntax instead. This makes our code more explicit and maintainable. + +`xml2` handles reading and parsing of documents. The `rvest` package was designed for screenscraping and has functions to make our life very easy: it accesses the response of an `xml2` query, looks for all HTML formatted tables, parses them with an XPATH expression and returns them as lists from which we can get data frames. + +```{r getPageData, cache=TRUE} +webPage <- xml2::read_html("https://en.wikipedia.org/wiki/List_of_phobias") +allTables <- rvest::html_table(webPage, fill = TRUE) +``` + +There are ```r length(allTables)``` tables in the list, but the ones we are interested in are data frames with two columns named `Phobia` and `Condition`. + +```{r collateTables, cache=TRUE} +phobiaTable <- data.frame(Phobia = character(), Condition = character()) +for (i in seq_along(allTables)) { + df <- allTables[[i]] + if (all(colnames(df) == c("Phobia", "Condition"))) { + phobiaTable <- rbind(phobiaTable, df) + } +} +``` + +Done, we collected ```r nrow(phobiaTable)``` phobias. Let's randomly select a few and print them. + +

  +

+ +```{r , ref.label="randRow", echo=FALSE} +``` + +**Table**: seven random phobias
+```{r renderPhobiaTable, echo=FALSE, results='asis'} +sel <- sample(1:nrow(phobiaTable), 7) +knitr::kable(phobiaTable[sel, ], table.attr = "class=\"striped\"", format = "html") +``` + +

  +

+To pick a single random phobia from the list, we take a (pseudo) random sample of size 1 from the number of rows in the `phobiaFrame` object. Our function thus returns a random row from a matrix or dataframe, and it uses an optional argument: `seed`. This can either be Boolean `FALSE` (the default), or an integer that is used in R's `set.seed()` function. + +```{r randRow} +randRow <- function(M, seed = FALSE) { + # Return a random row from a dataframe M. + if (seed) { + oldseed <- .Random.seed # play nice and save the RNG state ... + set.seed(as.integer(seed)) + } + r <- M[sample(1:nrow(M), 1), ] # fetch one random row + if (seed) { .Random.seed <- oldseed } # ... restore the RNG state + return(r) +} +``` +

  +

+With this useful tool we can ponder on our favourite phobia of the day. For today, let it be **`r randRow(phobiaTable, seed=1123581321)[2]`**, the `r randRow(phobiaTable, seed=1123581321)[1]`. + +_`r randRow(phobiaTable, seed=1123581321)[1]`_! Really!!? Awful. + +

  +

+ +Finally: let's plot a histogram of phobia name lengths just to illustrate plots. A little preprocessing is required, since some names collate synonyms, like _"Hypnophobia, somniphobia"_. We'll break these up. + +```{r preProcess} + +# select only single-word phobias that end with "phobia" +sel <- ! grepl(" ", phobiaTable$Phobia) & grepl(".phobia$", phobiaTable$Phobia) +names <- phobiaTable$Phobia[sel] + +# extract the ones we did _not_ select +x <- phobiaTable$Phobia[! sel] +# use strsplit() to split them apart and flatten the resulting list +x <- unlist(strsplit(x, ", ")) +x <- unlist(strsplit(x, " ")) +x <- unlist(strsplit(x, "/")) +# use the same selection as above, and append the result to our "names"" +sel <- ! grepl(" ", x) & grepl(".phobia$", x) +names <- c(names, x[sel]) + +``` + +Done, we collected ```r length(names)``` names for phobias. Here is a histogram of their lengths. + +```{r showHist} + +x <- nchar(names) +pShort <- names[which(x == min(x))[1]] # pull out the shortest name ... +pLong <- names[which(x == max(x))[1]] # ... and the longest name too. +hist(x, + main = "Length of phobia-names", + sub = sprintf("Shortest: %s (%d), Longest: %s (%d)", + pShort, nchar(pShort), pLong, nchar(pLong)), + cex.sub = 0.8, + xlab = "name", + ylab = "counts", + col ="#aef5ee") + +``` + +That's all. + + diff --git a/data/S288C_YDL056W_MBP1_coding.fsa b/data/S288C_YDL056W_MBP1_coding.fsa index c528751..befe459 100644 --- a/data/S288C_YDL056W_MBP1_coding.fsa +++ b/data/S288C_YDL056W_MBP1_coding.fsa @@ -1,43 +1,43 @@ ->MBP1 YDL056W SGDID:S000002214 -ATGTCTAACCAAATATACTCAGCGAGATATTCGGGGGTTGATGTTTATGAATTCATTCAT -TCTACAGGATCTATCATGAAAAGGAAAAAGGATGATTGGGTCAATGCTACACATATTTTA -AAGGCCGCCAATTTTGCCAAGGCTAAAAGAACAAGGATTCTAGAGAAGGAAGTACTTAAG -GAAACTCATGAAAAAGTTCAGGGTGGATTTGGTAAATATCAGGGTACATGGGTCCCACTG -AACATAGCGAAACAACTGGCAGAAAAATTTAGTGTCTACGATCAGCTGAAACCGTTGTTC -GACTTTACGCAAACAGATGGGTCTGCTTCTCCACCTCCTGCTCCAAAACATCACCATGCC -TCGAAGGTGGATAGGAAAAAGGCTATTAGAAGTGCAAGTACTTCCGCAATTATGGAAACA -AAAAGAAACAACAAGAAAGCCGAGGAAAATCAATTTCAAAGCAGCAAAATATTGGGAAAT -CCCACGGCTGCACCAAGGAAAAGAGGTAGACCGGTAGGATCTACGAGGGGAAGTAGGCGG -AAGTTAGGTGTCAATTTACAACGTTCTCAAAGTGATATGGGATTTCCTAGACCGGCGATA -CCGAATTCTTCAATATCGACAACGCAACTTCCCTCTATTAGATCCACCATGGGACCACAA -TCCCCTACATTGGGTATTCTGGAAGAAGAAAGGCACGATTCTCGACAGCAGCAGCCGCAA -CAAAATAATTCTGCACAGTTCAAAGAAATTGATCTTGAGGACGGCTTATCAAGCGATGTG -GAACCTTCACAACAATTACAACAAGTTTTTAATCAAAATACTGGATTTGTACCCCAACAA -CAATCTTCCTTGATACAGACACAGCAAACAGAATCAATGGCCACGTCCGTATCTTCCTCT -CCTTCATTACCTACGTCACCGGGCGATTTTGCCGATAGTAATCCATTTGAAGAGCGATTT -CCCGGTGGTGGAACATCTCCTATTATTTCCATGATCCCGCGTTATCCTGTAACTTCAAGG -CCTCAAACATCGGATATTAATGATAAAGTTAACAAATACCTTTCAAAATTGGTTGATTAT -TTTATTTCCAATGAAATGAAGTCAAATAAGTCCCTACCACAAGTGTTATTGCACCCACCT -CCACACAGCGCTCCCTATATAGATGCTCCAATCGATCCAGAATTACATACTGCCTTCCAT -TGGGCTTGTTCTATGGGTAATTTACCAATTGCTGAGGCGTTGTACGAAGCCGGAACAAGT -ATCAGATCGACAAATTCTCAAGGCCAAACTCCATTGATGAGAAGTTCCTTATTCCACAAT -TCATACACTAGAAGAACTTTCCCTAGAATTTTCCAGCTACTGCACGAGACCGTATTTGAT -ATCGATTCGCAATCACAAACAGTAATTCACCATATTGTGAAACGAAAATCAACAACACCT -TCTGCAGTTTATTATCTTGATGTTGTGCTATCTAAGATCAAGGATTTTTCCCCACAGTAT -AGAATTGAATTACTTTTAAACACACAAGACAAAAATGGCGATACCGCACTTCATATTGCT -TCTAAAAATGGAGATGTTGTTTTTTTTAATACACTGGTCAAAATGGGTGCATTAACTACT -ATTTCCAATAAGGAAGGATTAACCGCCAATGAAATAATGAATCAACAATATGAGCAAATG -ATGATACAAAATGGTACAAATCAACATGTCAATTCTTCAAACACGGACTTGAATATCCAC -GTTAATACAAACAACATTGAAACGAAAAATGATGTTAATTCAATGGTAATCATGTCGCCT -GTTTCTCCTTCGGATTACATAACCTATCCATCTCAAATTGCCACCAATATATCAAGAAAT -ATTCCAAATGTAGTGAATTCTATGAAGCAAATGGCTAGCATATACAACGATCTTCATGAA -CAGCATGACAACGAAATAAAAAGTTTGCAAAAAACTTTAAAAAGCATTTCTAAGACGAAA -ATACAGGTAAGCCTAAAAACTTTAGAGGTATTGAAAGAGAGCAGTAAAGATGAAAACGGC -GAAGCTCAGACTAATGATGACTTCGAAATTTTATCTCGTCTACAAGAACAAAATACTAAG -AAATTGAGAAAAAGGCTCATACGATACAAACGGTTGATAAAACAAAAGCTGGAATACAGG -CAAACGGTTTTATTGAACAAATTAATAGAAGATGAAACTCAGGCTACCACCAATAACACA -GTTGAGAAAGATAATAATACGCTGGAAAGGTTGGAATTGGCTCAAGAACTAACGATGTTG -CAATTACAAAGGAAAAACAAATTGAGTTCCTTGGTGAAGAAATTTGAAGACAATGCCAAG -ATTCATAAATATAGACGGATTATCAGGGAAGGTACGGAAATGAATATTGAAGAAGTAGAT -AGTTCGCTGGATGTAATACTACAGACATTGATAGCCAACAATAATAAAAATAAGGGCGCA +>MBP1 YDL056W SGDID:S000002214 +ATGTCTAACCAAATATACTCAGCGAGATATTCGGGGGTTGATGTTTATGAATTCATTCAT +TCTACAGGATCTATCATGAAAAGGAAAAAGGATGATTGGGTCAATGCTACACATATTTTA +AAGGCCGCCAATTTTGCCAAGGCTAAAAGAACAAGGATTCTAGAGAAGGAAGTACTTAAG +GAAACTCATGAAAAAGTTCAGGGTGGATTTGGTAAATATCAGGGTACATGGGTCCCACTG +AACATAGCGAAACAACTGGCAGAAAAATTTAGTGTCTACGATCAGCTGAAACCGTTGTTC +GACTTTACGCAAACAGATGGGTCTGCTTCTCCACCTCCTGCTCCAAAACATCACCATGCC +TCGAAGGTGGATAGGAAAAAGGCTATTAGAAGTGCAAGTACTTCCGCAATTATGGAAACA +AAAAGAAACAACAAGAAAGCCGAGGAAAATCAATTTCAAAGCAGCAAAATATTGGGAAAT +CCCACGGCTGCACCAAGGAAAAGAGGTAGACCGGTAGGATCTACGAGGGGAAGTAGGCGG +AAGTTAGGTGTCAATTTACAACGTTCTCAAAGTGATATGGGATTTCCTAGACCGGCGATA +CCGAATTCTTCAATATCGACAACGCAACTTCCCTCTATTAGATCCACCATGGGACCACAA +TCCCCTACATTGGGTATTCTGGAAGAAGAAAGGCACGATTCTCGACAGCAGCAGCCGCAA +CAAAATAATTCTGCACAGTTCAAAGAAATTGATCTTGAGGACGGCTTATCAAGCGATGTG +GAACCTTCACAACAATTACAACAAGTTTTTAATCAAAATACTGGATTTGTACCCCAACAA +CAATCTTCCTTGATACAGACACAGCAAACAGAATCAATGGCCACGTCCGTATCTTCCTCT +CCTTCATTACCTACGTCACCGGGCGATTTTGCCGATAGTAATCCATTTGAAGAGCGATTT +CCCGGTGGTGGAACATCTCCTATTATTTCCATGATCCCGCGTTATCCTGTAACTTCAAGG +CCTCAAACATCGGATATTAATGATAAAGTTAACAAATACCTTTCAAAATTGGTTGATTAT +TTTATTTCCAATGAAATGAAGTCAAATAAGTCCCTACCACAAGTGTTATTGCACCCACCT +CCACACAGCGCTCCCTATATAGATGCTCCAATCGATCCAGAATTACATACTGCCTTCCAT +TGGGCTTGTTCTATGGGTAATTTACCAATTGCTGAGGCGTTGTACGAAGCCGGAACAAGT +ATCAGATCGACAAATTCTCAAGGCCAAACTCCATTGATGAGAAGTTCCTTATTCCACAAT +TCATACACTAGAAGAACTTTCCCTAGAATTTTCCAGCTACTGCACGAGACCGTATTTGAT +ATCGATTCGCAATCACAAACAGTAATTCACCATATTGTGAAACGAAAATCAACAACACCT +TCTGCAGTTTATTATCTTGATGTTGTGCTATCTAAGATCAAGGATTTTTCCCCACAGTAT +AGAATTGAATTACTTTTAAACACACAAGACAAAAATGGCGATACCGCACTTCATATTGCT +TCTAAAAATGGAGATGTTGTTTTTTTTAATACACTGGTCAAAATGGGTGCATTAACTACT +ATTTCCAATAAGGAAGGATTAACCGCCAATGAAATAATGAATCAACAATATGAGCAAATG +ATGATACAAAATGGTACAAATCAACATGTCAATTCTTCAAACACGGACTTGAATATCCAC +GTTAATACAAACAACATTGAAACGAAAAATGATGTTAATTCAATGGTAATCATGTCGCCT +GTTTCTCCTTCGGATTACATAACCTATCCATCTCAAATTGCCACCAATATATCAAGAAAT +ATTCCAAATGTAGTGAATTCTATGAAGCAAATGGCTAGCATATACAACGATCTTCATGAA +CAGCATGACAACGAAATAAAAAGTTTGCAAAAAACTTTAAAAAGCATTTCTAAGACGAAA +ATACAGGTAAGCCTAAAAACTTTAGAGGTATTGAAAGAGAGCAGTAAAGATGAAAACGGC +GAAGCTCAGACTAATGATGACTTCGAAATTTTATCTCGTCTACAAGAACAAAATACTAAG +AAATTGAGAAAAAGGCTCATACGATACAAACGGTTGATAAAACAAAAGCTGGAATACAGG +CAAACGGTTTTATTGAACAAATTAATAGAAGATGAAACTCAGGCTACCACCAATAACACA +GTTGAGAAAGATAATAATACGCTGGAAAGGTTGGAATTGGCTCAAGAACTAACGATGTTG +CAATTACAAAGGAAAAACAAATTGAGTTCCTTGGTGAAGAAATTTGAAGACAATGCCAAG +ATTCATAAATATAGACGGATTATCAGGGAAGGTACGGAAATGAATATTGAAGAAGTAGAT +AGTTCGCTGGATGTAATACTACAGACATTGATAGCCAACAATAATAAAAATAAGGGCGCA GAACAGATCATCACAATCTCAAACGCGAATAGTCATGCATAA \ No newline at end of file diff --git a/data/SGD_features.README.txt b/data/SGD_features.README.txt index 2f527d4..5b6364d 100644 --- a/data/SGD_features.README.txt +++ b/data/SGD_features.README.txt @@ -1,47 +1,47 @@ -SGD_features.tab - -The latest version of the SGD_features.tab file is based on Genome Version R64-2-1. - -The SGD_features.tab file is updated weekly (Saturday). - -NOTE: On 4 September 2004, the SGD_features.tab file replaced the previously -used chromosomal_feature.tab file. - -File contents: - -1. Information on current chromosomal features in SGD, including Dubious ORFs. -Also contains coordinates of intron, exons, and other subfeatures that are located -within a chromosomal feature. - -2. The relationship between subfeatures and the feature in which they -are located is identified by the feature name in column #7 (parent -feature). For example, the parent feature of the intron found in -ACT1/YFL039C will be YFL039C. The parent feature of YFL039C is -chromosome 6. - -3. The coordinates of all features are in chromosomal coordinates. - - -Columns within SGD_features.tab: - -1. Primary SGDID (mandatory) -2. Feature type (mandatory) -3. Feature qualifier (optional) -4. Feature name (optional) -5. Standard gene name (optional) -6. Alias (optional, multiples separated by |) -7. Parent feature name (optional) -8. Secondary SGDID (optional, multiples separated by |) -9. Chromosome (optional) -10. Start_coordinate (optional) -11. Stop_coordinate (optional) -12. Strand (optional) -13. Genetic position (optional) -14. Coordinate version (optional) -15. Sequence version (optional) -16. Description (optional) - -Note that "chromosome 17" is the mitochondrial chromosome. - -The SGD_features.tab file is complemented by GFF3 file saccharomyces_cerevisiae.gff - +SGD_features.tab + +The latest version of the SGD_features.tab file is based on Genome Version R64-2-1. + +The SGD_features.tab file is updated weekly (Saturday). + +NOTE: On 4 September 2004, the SGD_features.tab file replaced the previously +used chromosomal_feature.tab file. + +File contents: + +1. Information on current chromosomal features in SGD, including Dubious ORFs. +Also contains coordinates of intron, exons, and other subfeatures that are located +within a chromosomal feature. + +2. The relationship between subfeatures and the feature in which they +are located is identified by the feature name in column #7 (parent +feature). For example, the parent feature of the intron found in +ACT1/YFL039C will be YFL039C. The parent feature of YFL039C is +chromosome 6. + +3. The coordinates of all features are in chromosomal coordinates. + + +Columns within SGD_features.tab: + +1. Primary SGDID (mandatory) +2. Feature type (mandatory) +3. Feature qualifier (optional) +4. Feature name (optional) +5. Standard gene name (optional) +6. Alias (optional, multiples separated by |) +7. Parent feature name (optional) +8. Secondary SGDID (optional, multiples separated by |) +9. Chromosome (optional) +10. Start_coordinate (optional) +11. Stop_coordinate (optional) +12. Strand (optional) +13. Genetic position (optional) +14. Coordinate version (optional) +15. Sequence version (optional) +16. Description (optional) + +Note that "chromosome 17" is the mitochondrial chromosome. + +The SGD_features.tab file is complemented by GFF3 file saccharomyces_cerevisiae.gff + diff --git a/data/SGD_features.tab b/data/SGD_features.tab index 7dbfb32..f9340e9 100644 --- a/data/SGD_features.tab +++ b/data/SGD_features.tab @@ -1,16454 +1,16454 @@ -S000002143 ORF Dubious YAL069W chromosome 1 1 335 649 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031098 CDS YAL069W 1 335 649 W 1996-07-31 1996-07-31 -S000028594 ORF Dubious YAL068W-A chromosome 1 1 538 792 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031372 CDS YAL068W-A 1 538 792 W 2003-07-29 2003-07-29 -S000121252 ARS ARS102 ARSI-1 chromosome 1 1 707 776 2014-11-18 2014-11-18|2007-03-07 Autonomously Replicating Sequence -S000028862 telomere TEL01L chromosome 1 1 801 1 C -64 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome I; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028864 telomeric_repeat TEL01L 1 62 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome I -S000028865 X_element TEL01L 1 801 337 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome I; contains an ARS consensus sequence, an Abf1p binding site consensus sequence and two small overlapping ORFs (YAL068W-A and YAL069W) -S000028866 X_element_combinatorial_repeat TEL01L 1 336 63 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr I; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000002142 ORF Verified YAL068C PAU8 seripauperin PAU8 chromosome 1 1 2169 1807 C 1996-07-31 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions -S000030944 CDS YAL068C 1 2169 1807 C 1996-07-31 1996-07-31 -S000028593 ORF Uncharacterized YAL067W-A chromosome 1 1 2480 2707 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031368 CDS YAL067W-A 1 2480 2707 W 2003-07-29 2003-07-29 -S000121253 ARS ARS103 ARSI-8 chromosome 1 1 7997 8547 2011-02-03 2007-03-07 Autonomously Replicating Sequence; replication origin of very weak function -S000000062 ORF Verified YAL067C SEO1 putative permease SEO1 chromosome 1 L000003363 1 9016 7235 C 2011-02-03 1996-07-31 Putative permease; member of the allantoate transporter subfamily of the major facilitator superfamily; mutation confers resistance to ethionine sulfoxide -S000029932 CDS YAL067C 1 9016 7235 C 2011-02-03 1996-07-31 -S000000061 ORF Dubious YAL066W chromosome 1 1 10091 10399 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029887 CDS YAL066W 1 10091 10399 W 2011-02-03 1996-07-31 -S000001817 ORF Uncharacterized YAL065C chromosome 1 1 11951 11565 C 2011-02-03 1996-07-31 Putative protein of unknown function; shows sequence similarity to FLO1 and other flocculins -S000037154 CDS YAL065C 1 11951 11565 C 2011-02-03 1996-07-31 -S000002141 ORF Uncharacterized YAL064W-B chromosome 1 1 12046 12426 W 2011-02-03 1999-07-17 Fungal-specific protein of unknown function -S000034793 CDS YAL064W-B 1 12046 12426 W 2011-02-03 1999-07-17 -S000002140 ORF Uncharacterized YAL064C-A TDA8 YAL065C-A chromosome 1 1 13743 13363 C 2011-02-03 1996-07-31 Putative protein of unknown function; null mutant is sensitive to expression of the top1-T722A allele; not an essential gene -S000031541 CDS YAL064C-A 1 13743 13363 C 2011-02-03 1996-07-31 -S000000060 ORF Verified YAL064W chromosome 1 1 21566 21850 W 2011-02-03 1996-07-31|2011-02-03 Protein of unknown function; may interact with ribosomes, based on co-purification experiments -S000037087 CDS YAL064W 1 21566 21850 W 2011-02-03 1996-07-31|2011-02-03 -S000006787 long_terminal_repeat YALWdelta1 chromosome 1 1 22230 22552 W 2011-02-03 2000-05-19 Ty1 LTR -S000028813 ORF Uncharacterized YAL063C-A chromosome 1 1 22685 22395 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000033613 CDS YAL063C-A 1 22685 22395 C 2011-02-03 2003-07-29 -S000000059 ORF Verified YAL063C FLO9 flocculin FLO9 chromosome 1 L000003331 1 27968 24000 C 2011-02-03 1996-07-31 Lectin-like protein with similarity to Flo1p; thought to be expressed and involved in flocculation -S000036982 CDS YAL063C 1 27968 24000 C 2011-02-03 1996-07-31 -S000118317 ARS ARS104 ARSI-31 chromosome 1 1 30946 31183 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178034 ARS_consensus_sequence ARS104 1 31002 31018 W 2014-11-18 2014-11-18 -S000000058 ORF Verified YAL062W GDH3 glutamate dehydrogenase (NADP(+)) GDH3|FUN51 chromosome 1 L000000698 1 31567 32940 W 2011-02-03 1996-07-31 NADP(+)-dependent glutamate dehydrogenase; synthesizes glutamate from ammonia and alpha-ketoglutarate; rate of alpha-ketoglutarate utilization differs from Gdh1p; expression regulated by nitrogen and carbon sources; GDH3 has a paralog, GDH1, that arose from the whole genome duplication -S000036963 CDS YAL062W 1 31567 32940 W 2011-02-03 1996-07-31 -S000000057 ORF Uncharacterized YAL061W BDH2 putative dehydrogenase BDH2 chromosome 1 1 33448 34701 W 2011-02-03 1996-07-31 Putative medium-chain alcohol dehydrogenase with similarity to BDH1; transcription induced by constitutively active PDR1 and PDR3 -S000036902 CDS YAL061W 1 33448 34701 W 2011-02-03 1996-07-31 -S000000056 ORF Verified YAL060W BDH1 (R,R)-butanediol dehydrogenase|BDH chromosome 1 1 35155 36303 W 2011-02-03 1996-07-31|2011-02-03 NAD-dependent (R,R)-butanediol dehydrogenase; catalyzes oxidation of (R,R)-2,3-butanediol to (3R)-acetoin, oxidation of meso-butanediol to (3S)-acetoin, and reduction of acetoin; enhances use of 2,3-butanediol as an aerobic carbon source -S000036089 CDS YAL060W 1 35155 36303 W 2011-02-03 1996-07-31|2011-02-03 -S000000055 ORF Verified YAL059W ECM1 chromosome 1 L000003052 1 36509 37147 W 2011-02-03 1996-07-31|2011-02-03 Pre-ribosomal factor involved in 60S ribosomal protein subunit export; associates with the pre-60S particle; shuttles between the nucleus and cytoplasm -S000035122 CDS YAL059W 1 36509 37147 W 2011-02-03 1996-07-31|2011-02-03 -S000028734 ORF Dubious YAL059C-A chromosome 1 1 36918 36496 C 2011-02-03 2003-07-29|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene ECM1/YAL059W -S000033378 CDS YAL059C-A 1 36918 36496 C 2011-02-03 2003-07-29|2011-02-03 -S000000054 ORF Verified YAL058W CNE1 calnexin|FUN48 chromosome 1 L000000373 1 37464 38972 W 2011-02-03 1996-07-31 Calnexin; integral membrane ER chaperone involved in folding and quality control of glycoproteins; chaperone activity is inhibited by Mpd1p, with which Cne1p interacts; 24% identical to mammalian calnexin; Ca+ binding not yet shown in yeast -S000034933 CDS YAL058W 1 37464 38972 W 2011-02-03 1996-07-31 -S000002139 ORF Dubious YAL056C-A YAL058C-A chromosome 1 1 39046 38696 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035879 CDS YAL056C-A 1 39046 38696 C 2011-02-03 1996-07-31 -S000000052 ORF Verified YAL056W GPB2 KRH1 chromosome 1 1 39259 41901 W 2011-02-03 2004-01-20|1996-07-31|2011-02-03 Multistep regulator of cAMP-PKA signaling; inhibits PKA downstream of Gpa2p and Cyr1p, thereby increasing cAMP dependency; inhibits Ras activity through direct interactions with Ira1p/2p; regulated by G-alpha protein Gpa2p; GPB2 has a paralog, GPB1, that arose from the whole genome duplication -S000033885 CDS YAL056W 1 39259 41901 W 2011-02-03 2004-01-20|1996-07-31|2011-02-03 -S000121254 ARS ARS105 ARSI-42 chromosome 1 1 41992 42151 2014-11-18 2014-11-18|2007-03-07 Autonomously Replicating Sequence -S000000051 ORF Verified YAL055W PEX22 ubiquitin-protein transferase activating protein PEX22|YAF5 chromosome 1 1 42177 42719 W 2011-02-03 1996-07-31 Putative peroxisomal membrane protein; required for import of peroxisomal proteins; functionally complements a Pichia pastoris pex22 mutation -S000033812 CDS YAL055W 1 42177 42719 W 2011-02-03 1996-07-31 -S000000050 ORF Verified YAL054C ACS1 acetate--CoA ligase 1|FUN44 chromosome 1 L000000024 1 45022 42881 C -63.11 2011-02-03 1996-07-31 Acetyl-coA synthetase isoform; along with Acs2p, acetyl-coA synthetase isoform is the nuclear source of acetyl-coA for histone acetylation; expressed during growth on nonfermentable carbon sources and under aerobic conditions -S000033073 CDS YAL054C 1 45022 42881 C 2011-02-03 1996-07-31 -S000000049 ORF Verified YAL053W FLC2 flavin adenine dinucleotide transporter FLC2|HUF2 chromosome 1 1 45899 48250 W 2011-02-03 1996-07-31|2011-02-03 Putative calcium channel involved in calcium release under hypotonic stress; required for uptake of FAD into endoplasmic reticulum; involved in cell wall maintenance; FLC2 has a paralog, YOR365C, that arose from the whole genome duplication -S000033037 CDS YAL053W 1 45899 48250 W 2011-02-03 1996-07-31|2011-02-03 -S000000048 ORF Verified YAL051W OAF1 oleate-activated transcription factor OAF1|YAF1 chromosome 1 L000004197 1 48564 51707 W 2011-02-03 2004-07-20|1996-07-31|2011-02-03 Oleate-activated transcription factor; subunit of a heterodimeric complex with Pip2p, which binds to oleate-response elements (ORE) in the promoter of genes involved in beta-oxidation of fatty acids, peroxisome organization and biogenesis, activating transcription in the presence of oleate; regulates chromatin silencing at telomeres; involved in diauxic shift; OAF1 has a paralog, PIP2, that arose from the whole genome duplication -S000032862 CDS YAL051W 1 48564 51707 W 2011-02-03 2004-07-20|1996-07-31|2011-02-03 -S000000047 ORF Verified YAL049C AIM2 protein AIM2 chromosome 1 1 52595 51855 C 2011-02-03 1996-07-31 Cytoplasmic protein involved in mitochondrial function or organization; null mutant displays reduced frequency of mitochondrial genome loss; potential Hsp82p interactor -S000031896 CDS YAL049C 1 52595 51855 C 2011-02-03 1996-07-31 -S000028733 ORF Dubious YAL047W-A chromosome 1 1 54584 54913 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF GEM1/YAL048C -S000033377 CDS YAL047W-A 1 54584 54913 W 2011-02-03 2003-07-29 -S000000046 ORF Verified YAL048C GEM1 ERMES complex Ca(2+)-binding regulatory GTPase GEM1|GON1 chromosome 1 1 54789 52801 C 2011-02-03 1996-07-31 Outer mitochondrial membrane GTPase, subunit of the ERMES complex; potential regulatory subunit of the ERMES complex that links the ER to mitochondria and may promote inter-organellar calcium and phospholipid exchange as well as coordinating mitochondrial DNA replication and growth; cells lacking Gem1p contain collapsed, globular, or grape-like mitochondria; ortholog of metazoan Miro GTPases -S000030895 CDS YAL048C 1 54789 52801 C 2011-02-03 1996-07-31 -S000000045 ORF Verified YAL047C SPC72 gamma-tubulin complex subunit SPC72|LDB4 chromosome 1 L000003455 1 56857 54989 C 2011-02-03 1996-07-31|2011-02-03 Gamma-tubulin small complex (gamma-TuSC) receptor; recruits the gamma-TuSC complex to the cytoplasmic side of the SPB, connecting nuclear microtubules to the SPB; involved in astral microtubule formation, stabilization, and with Stu2p, anchoring astral MTs at the cytoplasmic face of the SPB, and regulating plus-end MT dynamics; regulated by Cdc5 kinase -S000030803 CDS YAL047C 1 56857 54989 C 2011-02-03 1996-07-31|2011-02-03 -S000000044 ORF Verified YAL046C BOL3 AIM1 chromosome 1 1 57385 57029 C 2011-02-03 1996-07-31 Protein involved in Fe-S cluster transfer to mitochondrial clients; protects [4Fe-4S] clusters from damage due to oxidative stress by acting along with Nfu1p at a late step in the transfer of [4Fe-4S] clusters from the ISA complex to mitochondrial client proteins like lipoate synthase and succinate dehydrogenase; sequence similarity to human BOLA family member, BOLA3, mutations of which are associated with Multiple Mitochondria Dysfunctions Syndrome (MMDS2) -S000030666 CDS YAL046C 1 57385 57029 C 2011-02-03 1996-07-31 -S000007586 ORF Verified YAL044W-A BOL1 chromosome 1 1 57518 57850 W 2011-02-03 2001-01-30 Mitochondrial matrix protein involved in Fe-S cluster biogenesis; facilitates [4Fe-2S] cluster inception into mitochondrial proteins such as lipoate synthase and succinate dehydrogenase; interacts and may function with Grx5p at an early step in Fe-S cluster biosynthesis; forms dimeric complexes with Grx5p and Nfu1p that alter the stability of shared Fe/S clusters; sequence similarity to human BOLA family member, BOLA1 and S. pombe uvi31, a putative DNA repair protein -S000037097 CDS YAL044W-A 1 57518 57850 W 2011-02-03 2001-01-30 -S000000043 ORF Dubious YAL045C chromosome 1 1 57796 57488 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps YAL044W-A -S000030576 CDS YAL045C 1 57796 57488 C 2011-02-03 1996-07-31 -S000000042 ORF Verified YAL044C GCV3 glycine decarboxylase subunit H chromosome 1 L000003501 1 58462 57950 C 2011-02-03 2003-09-22|1996-07-31|2008-03-05 H subunit of the mitochondrial glycine decarboxylase complex; glycine decarboxylase is required for the catabolism of glycine to 5,10-methylene-THF; also required for all protein lipoylation; expression is regulated by levels of 5,10-methylene-THF -S000037751 CDS YAL044C 1 58462 57950 C 2011-02-03 2003-09-22|1996-07-31|2008-03-05 -S000000041 ORF Verified YAL043C PTA1 RNA-processing protein PTA1|FUN39 chromosome 1 L000001522 1 61052 58695 C 2011-02-03 1996-07-31 Subunit of holo-CPF; holo-CPF is a multiprotein complex and functional homolog of mammalian CPSF, required for the cleavage and polyadenylation of mRNA and snoRNA 3' ends; involved in pre-tRNA processing; binds to the phosphorylated CTD of RNAPII -S000037691 CDS YAL043C 1 61052 58695 C 2011-02-03 1996-07-31 -S000000040 ORF Verified YAL042W ERV46 FUN9 chromosome 1 L000000633 1 61316 62563 W 2011-02-03 1996-07-31 Protein localized to COPII-coated vesicles; forms a complex with Erv41p; involved in the membrane fusion stage of transport -S000037669 CDS YAL042W 1 61316 62563 W 2011-02-03 1996-07-31 -S000002138 ORF Dubious YAL042C-A YAL043C-A chromosome 1 1 61608 61231 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF ERV46/YAL042W; YAL042C-A is a non-essential gene -S000030422 CDS YAL042C-A 1 61608 61231 C 2011-02-03 1996-07-31 -S000000039 ORF Verified YAL041W CDC24 Rho family guanine nucleotide exchange factor CDC24|CLS4 chromosome 1 L000000262 1 62840 65404 W -56 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Cdc42p; required for polarity establishment and maintenance, and mutants have morphological defects in bud formation and shmooing; relocalizes from nucleus to cytoplasm upon DNA replication stress; thermosensitivity of the cdc24-4 mutant in the presence of sorbitol is functionally complemented by human CDC42 -S000037599 CDS YAL041W 1 62840 65404 W 2011-02-03 1996-07-31 -S000000038 ORF Verified YAL040C CLN3 cyclin CLN3|WHI1|FUN10|DAF1 chromosome 1 L000000359 1 67520 65778 C -56 2011-02-03 1996-07-31 G1 cyclin involved in cell cycle progression; activates Cdc28p kinase to promote G1 to S phase transition; plays a role in regulating transcription of other G1 cyclins, CLN1 and CLN2; regulated by phosphorylation and proteolysis; acetyl-CoA induces CLN3 transcription in response to nutrient repletion to promote cell-cycle entry; cell cycle arrest phenotype of the cln1 cln2 cln3 triple null mutant is complemented by any of human cyclins CCNA2, CCNB1, CCNC, CCND1, or CCNE1 -S000036825 CDS YAL040C 1 67520 65778 C 2011-02-03 1996-07-31 -S000000037 ORF Verified YAL039C CYC3 holocytochrome c synthase CYC3|CCHL chromosome 1 L000000450 1 69525 68716 C -47 2011-02-03 1996-07-31 Cytochrome c heme lyase (holocytochrome c synthase); attaches heme to apo-cytochrome c (Cyc1p or Cyc7p) in mitochondrial intermembrane space; human homolog HCCS implicated in microphthalmia with linear skin defects (MLS), and can complement yeast null mutant -S000035956 CDS YAL039C 1 69525 68716 C 2011-02-03 1996-07-31 -S000118318 ARS ARS106 ARSI-70 chromosome 1 1 70300 70469 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178035 ARS_consensus_sequence ARS106 1 70434 70418 C 2014-11-18 2014-11-18 -S000000036 ORF Verified YAL038W CDC19 pyruvate kinase CDC19|PYK1 chromosome 1 L000000258 1 71786 73288 W -45 2011-02-03 1996-07-31 Pyruvate kinase; functions as a homotetramer in glycolysis to convert phosphoenolpyruvate to pyruvate, the input for aerobic (TCA cycle) or anaerobic (glucose fermentation) respiration; regulated via allosteric activation by fructose bisphosphate; CDC19 has a paralog, PYK2, that arose from the whole genome duplication -S000035915 CDS YAL038W 1 71786 73288 W 2011-02-03 1996-07-31 -S000028592 ORF Dubious YAL037C-B chromosome 1 1 73300 72326 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031366 CDS YAL037C-B 1 73300 72326 C 2011-02-03 2003-07-29 -S000028732 ORF Uncharacterized YAL037C-A chromosome 1 1 73518 73426 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000033376 CDS YAL037C-A 1 73518 73426 C 2011-02-03 2003-07-29 -S000000035 ORF Uncharacterized YAL037W chromosome 1 1 74020 74823 W 2011-02-03 1996-07-31 Putative protein of unknown function; YAL037W has a paralog, YOR342C, that arose from the whole genome duplication -S000035798 CDS YAL037W 1 74020 74823 W 2011-02-03 1996-07-31 -S000000034 ORF Verified YAL036C RBG1 GTP-binding protein RBG1|FUN11 chromosome 1 L000000634 1 76152 75043 C 2011-02-03 1996-07-31 Member of the DRG family of GTP-binding proteins; associates with translating ribosomes; interacts with Tma46p, Ygr250cp, Gir2p and Yap1p via two-hybrid -S000034719 CDS YAL036C 1 76152 75043 C 2011-02-03 1996-07-31 -S000000033 ORF Verified YAL035W FUN12 translation initiation factor eIF5B|eIF5B|yIF2 chromosome 1 L000000635 1 76427 79435 W 2011-02-03 1996-07-31 Translation initiation factor eIF5B; GTPase that promotes Met-tRNAiMet binding to ribosomes and ribosomal subunit joining; promotes GTP-dependent maturation of 18S rRNA by Nob1p; protein abundance increases in response to DNA replication stress; homolog of bacterial IF2 -S000034678 CDS YAL035W 1 76427 79435 W 2011-02-03 1996-07-31 -S000000032 ORF Verified YAL034W-A MTW1 MIND complex subunit MTW1|NSL2|DSN3 chromosome 1 S000007418 1 79718 80587 W 2011-02-03 1996-07-31 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; critical to kinetochore assembly; complex consists of Mtw1p Including Nnf1p-Nsl1p-Dsn1p (MIND) -S000031836 CDS YAL034W-A 1 79718 80587 W 2011-02-03 1996-07-31 -S000002137 ORF Dubious YAL034C-B YAL035C-A chromosome 1 1 79842 79489 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031374 CDS YAL034C-B 1 79842 79489 C 2011-02-03 1996-07-31 -S000002134 ORF Verified YAL034C FUN19 chromosome 1 L000000637 1 81951 80710 C 2011-02-03 2003-09-22|1996-07-31 Non-essential protein of unknown function; expression induced in response to heat stress; FUN19 has a paralog, YOR338W, that arose from the whole genome duplication -S000034508 CDS YAL034C 1 81951 80710 C 2011-02-03 2003-09-22|1996-07-31 -S000000031 ORF Verified YAL033W POP5 RNA-binding protein POP5|FUN53 chromosome 1 L000004301|L000000649 1 82706 83227 W 2011-02-03 1996-07-31 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs -S000034465 CDS YAL033W 1 82706 83227 W 2011-02-03 1996-07-31 -S000000030 ORF Verified YAL032C PRP45 mRNA splicing protein PRP45|FUN20 chromosome 1 L000000638 1 84474 83335 C 2011-02-03 1996-07-31 Protein required for pre-mRNA splicing; associates with the spliceosome and interacts with splicing factors Prp22p and Prp46p; orthologous to human transcriptional coactivator SKIP and can activate transcription of a reporter gene -S000033541 CDS YAL032C 1 84474 83335 C 2011-02-03 1996-07-31 -S000028731 ORF Dubious YAL031W-A chromosome 1 1 84669 84977 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF GIP4/YAL031C -S000033375 CDS YAL031W-A 1 84669 84977 W 2011-02-03 2003-07-29 -S000000029 ORF Verified YAL031C GIP4 protein phosphatase regulator GIP4|FUN21 chromosome 1 L000000639 1 87031 84749 C 2011-02-03 1996-07-31 Cytoplasmic protein that regulates protein phosphatase 1 Glc7p; protein overexpression relocalizes Glc7p from the nucleus and prevents chromosome segregation; potential Cdc28p substrate -S000033476 CDS YAL031C 1 87031 84749 C 2011-02-03 1996-07-31 -S000000028 ORF Verified YAL030W SNC1 SNAP receptor SNC1 chromosome 1 L000001942 1 87286 87752 W 2011-02-03 1996-07-31 Vesicle membrane receptor protein (v-SNARE); involved in the fusion between Golgi-derived secretory vesicles with the plasma membrane; proposed to be involved in endocytosis; member of the synaptobrevin/VAMP family of R-type v-SNARE proteins; SNC1 has a paralog, SNC2, that arose from the whole genome duplication -S000033437 CDS YAL030W 1 87286 87387 W 2011-02-03 1996-07-31 -S000033438 CDS YAL030W 1 87501 87752 W 2011-02-03 1996-07-31 -S000033439 intron YAL030W 1 87388 87500 W 2011-02-03 1996-07-31 -S000000027 ORF Verified YAL029C MYO4 myosin 4|SHE1|FUN22 chromosome 1 L000000640|L000001224 1 92270 87855 C 2011-02-03 1996-07-31 Type V myosin motor involved in actin-based transport of cargos; required for mRNA transport, including ASH1 mRNA, and facilitating the growth and movement of ER tubules into the growing bud along with She3p; MYO4 has a paralog, MYO2, that arose from the whole genome duplication -S000033821 CDS YAL029C 1 92270 87855 C 2011-02-03 1996-07-31 -S000000026 ORF Verified YAL028W FRT2 HPH2 chromosome 1 1 92900 94486 W 2011-02-03 1996-07-31 Tail-anchored ER membrane protein of unknown function; interacts with homolog Frt1p; promotes growth in conditions of high Na+, alkaline pH, or cell wall stress, possibly via a role in posttranslational translocation; potential Cdc28p substrate; FRT2 has a paralog, FRT1, that arose from the whole genome duplication -S000033747 CDS YAL028W 1 92900 94486 W 2011-02-03 1996-07-31 -S000000025 ORF Verified YAL027W SAW1 DNA-binding protein SAW1 chromosome 1 1 94687 95472 W 2011-02-03 1996-07-31 5'- and 3'-flap DNA binding protein; recruits Rad1p-Rad10p to single-strand annealing intermediates with 3' non-homologous tails for removal during double-strand break repair; complexes with Rad1p-Rad10p and stimulates its endonuclease activity; green fluorescent protein (GFP)-fusion protein localizes to the nucleus -S000033629 CDS YAL027W 1 94687 95472 W 2011-02-03 1996-07-31 -S000028730 ORF Dubious YAL026C-A chromosome 1 1 95823 95386 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YAL027W and the verified gene DRS2 -S000033374 CDS YAL026C-A 1 95823 95386 C 2011-02-03 2003-07-29 -S000119380 ncRNA_gene HRA1 HRA1 chromosome 1 1 99305 99868 W 2011-02-03 2007-02-06|2007-05-08|2011-02-03 Non-protein-coding RNA; substrate of RNase P, possibly involved in rRNA processing, specifically maturation of 20S precursor into the mature 18S rRNA -S000120654 noncoding_exon HRA1 1 99305 99868 W 2011-02-03 2007-02-06|2007-05-08|2011-02-03 -S000000024 ORF Verified YAL026C DRS2 aminophospholipid-translocating P4-type ATPase DRS2|SWA3|FUN38 chromosome 1 L000000526 1 99697 95630 C 2011-02-03 1996-07-31|2011-02-03 Trans-golgi network aminophospholipid translocase (flippase); maintains membrane lipid asymmetry in post-Golgi secretory vesicles; contributes to clathrin-coated vesicle formation, endocytosis, protein trafficking between the Golgi and endosomal system and the cellular response to mating pheromone; autoinhibited by its C-terminal tail; localizes to the trans-Golgi network; mutations in human homolog ATP8B1 result in liver disease -S000030197 CDS YAL026C 1 99697 95630 C 2011-02-03 1996-07-31|2011-02-03 -S000000023 ORF Verified YAL025C MAK16 ribosome biosynthesis protein MAK16 chromosome 1 L000000989 1 101145 100225 C -31 2011-02-03 1996-07-31|2011-02-03 Essential nuclear protein; constituent of 66S pre-ribosomal particles; required for maturation of 25S and 5.8S rRNAs; required for maintenance of M1 satellite double-stranded RNA of the L-A virus -S000030064 CDS YAL025C 1 101145 100225 C 2011-02-03 1996-07-31|2011-02-03 -S000000022 ORF Verified YAL024C LTE1 mitotic regulator LTE1|MSI2 chromosome 1 L000000955 1 105872 101565 C -31 2011-02-03 1996-07-31 Protein similar to GDP/GTP exchange factors; without detectable GEF activity; required for asymmetric localization of Bfa1p at daughter-directed spindle pole bodies and for mitotic exit at low temperatures -S000029981 CDS YAL024C 1 105872 101565 C 2011-02-03 1996-07-31 -S000000021 ORF Verified YAL023C PMT2 dolichyl-phosphate-mannose-protein mannosyltransferase PMT2|FUN25 chromosome 1 L000000642|L000001459 1 108551 106272 C 2011-02-03 2002-12-17|1996-07-31 Protein O-mannosyltransferase of the ER membrane; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; involved in ER quality control; acts in a complex with Pmt1p, can instead interact with Pmt5p; antifungal drug target; PMT2 has a paralog, PMT3, that arose from the whole genome duplication -S000037355 CDS YAL023C 1 108551 106272 C 2011-02-03 2002-12-17|1996-07-31 -S000000020 ORF Verified YAL022C FUN26 nucleoside transmembrane transporter FUN26 chromosome 1 L000000643 1 110430 108877 C 2011-02-03 1996-07-31 High affinity, broad selectivity, nucleoside/nucleobase transporter; vacuolar membrane localized transporter which may regulate the balance of nicotinamide riboside (NmR) levels between the cytosol and vacuole, contributing to salvage of NmR for use in cytosolic NAD+ synthesis; equilibrative nucleoside transporter (ENT) family member -S000037286 CDS YAL022C 1 110430 108877 C 2011-02-03 1996-07-31 -S000000019 ORF Verified YAL021C CCR4 CCR4-NOT core exoribonuclease subunit CCR4|NUT21|FUN27 chromosome 1 L000000239 1 113359 110846 C -25 2011-02-03 1996-07-31 Component of the CCR4-NOT transcriptional complex; CCR4-NOT is involved in regulation of gene expression; component of the major cytoplasmic deadenylase, which is involved in mRNA poly(A) tail shortening -S000037200 CDS YAL021C 1 113359 110846 C 2011-02-03 1996-07-31 -S000028729 ORF Dubious YAL019W-A chromosome 1 1 114250 114819 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF ATS1/YAL020C -S000032720 CDS YAL019W-A 1 114250 114819 W 2011-02-03 2003-07-29 -S000000018 ORF Verified YAL020C ATS1 KTI13|FUN28 chromosome 1 L000000644|L000000154 1 114615 113614 C 2011-02-03 1996-07-31|2011-02-03 Protein required for modification of wobble nucleosides in tRNA; acts with Elongator complex, Kti11p, and Kti12p; has a potential role in regulatory interactions between microtubules and the cell cycle; forms a stable heterodimer with Kti11p -S000037124 CDS YAL020C 1 114615 113614 C 2011-02-03 1996-07-31|2011-02-03 -S000000017 ORF Verified YAL019W FUN30 DNA-dependent ATPase FUN30 chromosome 1 L000000645 1 114919 118314 W 2011-02-03 1996-07-31 Snf2p family member with ATP-dependent chromatin remodeling activity; has a role in silencing at the mating type locus, telomeres and centromeres; enriched at centromeres and is required for correct chromatin structure around centromeres, as well as at the boundary element of the silent HMR; recruited to DNA double-strand breaks (DSBs) where it promotes 5' strand resection of DSBs; potential Cdc28p substrate -S000037555 CDS YAL019W 1 114919 118314 W 2011-02-03 1996-07-31 -S000000016 ORF Verified YAL018C LDS1 chromosome 1 1 119541 118564 C 2011-02-03 1996-07-31 Protein Involved in spore wall assembly; localizes to lipid droplets found on or outside of the prospore membrane; shares similarity with Lds2p and Rrt8p, and a strain mutant for all 3 genes exhibits reduced dityrosine fluorescence relative to the single mutants -S000032033 CDS YAL018C 1 119541 118564 C 2011-02-03 1996-07-31 -S000000015 ORF Verified YAL017W PSK1 serine/threonine protein kinase PSK1|FUN31 chromosome 1 L000000646 1 120225 124295 W 2011-02-03 1996-07-31|2011-02-03 PAS domain-containing serine/threonine protein kinase; coordinately regulates protein synthesis and carbohydrate metabolism and storage in response to a unknown metabolite that reflects nutritional status; PSK1 has a paralog, PSK2, that arose from the whole genome duplication -S000031992 CDS YAL017W 1 120225 124295 W 2011-02-03 1996-07-31|2011-02-03 -S000118319 ARS ARS107 ARSI-125 chromosome 1 1 124349 124597 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178036 ARS_consensus_sequence ARS107 1 124479 124463 C 2014-11-18 2014-11-18 -S000028528 ORF Dubious YAL016C-B chromosome 1 1 124492 124307 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030333 CDS YAL016C-B 1 124492 124307 C 2011-02-03 2003-07-29 -S000000014 ORF Verified YAL016W TPD3 protein phosphatase 2A structural subunit TPD3|FUN32 chromosome 1 L000002325 1 124879 126786 W .5 2011-02-03 1996-07-31 Regulatory subunit A of the heterotrimeric PP2A complex; the heterotrimeric protein phosphatase 2A (PP2A) complex also contains regulatory subunit Cdc55p and either catalytic subunit Pph21p or Pph22p; required for cell morphogenesis and transcription by RNA polymerase III -S000031874 CDS YAL016W 1 124879 126786 W 2011-02-03 1996-07-31 -S000028728 ORF Dubious YAL016C-A chromosome 1 1 125069 124755 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF TPD3/YAL016W -S000032719 CDS YAL016C-A 1 125069 124755 C 2011-02-03 2003-07-29 -S000000013 ORF Verified YAL015C NTG1 bifunctional N-glycosylase/AP lyase NTG1|ogg2|SCR1|FUN33 chromosome 1 L000004114 1 128102 126903 C 2011-02-03 1996-07-31 DNA N-glycosylase and apurinic/apyrimidinic (AP) lyase; involved in base excision repair; acts in both nucleus and mitochondrion; creates a double-strand break at mtDNA origins that stimulates replication in response to oxidative stress; required for maintaining mitochondrial genome integrity; NTG1 has a paralog, NTG2, that arose from the whole genome duplication -S000036247 CDS YAL015C 1 128102 126903 C 2011-02-03 1996-07-31 -S000000012 ORF Verified YAL014C SYN8 syntaxin|SLT2|UIP2 chromosome 1 1 129019 128252 C 2011-02-03 2002-12-17|1996-07-31 Endosomal SNARE related to mammalian syntaxin 8 -S000036146 CDS YAL014C 1 129019 128252 C 2011-02-03 2002-12-17|1996-07-31 -S000000011 ORF Verified YAL013W DEP1 Rpd3L histone deacetylase complex subunit DEP1|FUN54 chromosome 1 L000000502 1 129270 130487 W 12 2011-02-03 2003-12-15|1996-07-31|2011-02-03 Component of the Rpd3L histone deacetylase complex; required for diauxic shift-induced histone H2B deposition onto rDNA genes; transcriptional modulator involved in regulation of structural phospholipid biosynthesis genes and metabolically unrelated genes, as well as maintenance of telomeres, mating efficiency, and sporulation -S000036100 CDS YAL013W 1 129270 130487 W 2011-02-03 2003-12-15|1996-07-31|2011-02-03 -S000000010 ORF Verified YAL012W CYS3 cystathionine gamma-lyase CYS3|STR1|FUN35|CYI1 chromosome 1 L000000470 1 130799 131983 W -16 2011-02-03 1996-07-31 Cystathionine gamma-lyase; catalyzes one of the two reactions involved in the transsulfuration pathway that yields cysteine from homocysteine with the intermediary formation of cystathionine; protein abundance increases in response to DNA replication stress -S000035250 CDS YAL012W 1 130799 131983 W 2011-02-03 1996-07-31 -S000000009 ORF Verified YAL011W SWC3 SWC1 chromosome 1 1 132199 134076 W 2011-02-03 2003-09-22|1996-07-31 Protein of unknown function; component of the SWR1 complex, which exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; required for formation of nuclear-associated array of smooth endoplasmic reticulum known as karmellae -S000035116 CDS YAL011W 1 132199 134076 W 2011-02-03 2003-09-22|1996-07-31 -S000000008 ORF Verified YAL010C MDM10 FUN37 chromosome 1 L000000648|L000001053 1 135665 134184 C 2011-02-03 1996-07-31|2011-02-03 Subunit of both the ERMES and the SAM complex; component of ERMES complex which acts as a molecular tether between the mitochondria and the ER, necessary for efficient phospholipid exchange between organelles and for mitophagy; SAM/TOB complex component that functions in the assembly of outer membrane beta-barrel proteins; involved in mitochondrial inheritance and morphology; ERMES complex is often co-localized with peroxisomes and concentrated areas of pyruvate dehydrogenase -S000034958 CDS YAL010C 1 135665 134184 C 2011-02-03 1996-07-31|2011-02-03 -S000000007 ORF Verified YAL009W SPO7 Nem1-Spo7 phosphatase regulatory subunit SPO7 chromosome 1 L000002000 1 135854 136633 W -4 2011-02-03 1996-07-31 Putative regulatory subunit of Nem1p-Spo7p phosphatase holoenzyme; regulates nuclear growth by controlling phospholipid biosynthesis, required for normal nuclear envelope morphology, premeiotic replication, and sporulation -S000034070 CDS YAL009W 1 135854 136633 W 2011-02-03 1996-07-31 -S000000006 ORF Verified YAL008W FUN14 MCP3 chromosome 1 L000000636 1 136914 137510 W 2011-02-03 1996-07-31 Integral mitochondrial outer membrane (MOM) protein; dosage suppressor of an MDM10 null that reduces ERMES-related phenotypes, such as alterations in mitochondrial morphology, protein complex assembly, and lipid profile; dosage suppressor of MDM12, MDM34, and MMM1 null mutant growth defects; novel mechanism of MOM import involving Tom70p, the TOM complex, and the TIM23 complex, requiring mitochondrial membrane potential and processing by the IMP complex for correct biogenesis -S000033957 CDS YAL008W 1 136914 137510 W 2011-02-03 1996-07-31 -S000000005 ORF Verified YAL007C ERP2 chromosome 1 L000004679 1 138345 137698 C 2011-02-03 1996-07-31 Member of the p24 family involved in ER to Golgi transport; similar to Emp24p and Erv25p; role in misfolded protein quality control; forms a heterotrimeric complex with Erp1p, Emp24p, and Erv25p; localized to COPII-coated vesicles; ERP2 has a paralog, ERP4, that arose from the whole genome duplication -S000033112 CDS YAL007C 1 138345 137698 C 2011-02-03 1996-07-31 -S000006786 long_terminal_repeat YALCdelta2 chromosome 1 1 138992 138831 C 2011-02-03 2000-05-19 Ty1 LTR -S000006680 tRNA_gene tP(UGG)A TRN1 chromosome 1 L000003601 1 139152 139254 W -2 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons -S000035969 intron tP(UGG)A 1 139188 139218 W 2011-02-03 2000-05-19 -S000035967 noncoding_exon tP(UGG)A 1 139152 139187 W 2011-02-03 2000-05-19 -S000035968 noncoding_exon tP(UGG)A 1 139219 139254 W 2011-02-03 2000-05-19 -S000002136 ORF Dubious YAL004W chromosome 1 1 140760 141407 W 2011-02-03 1996-07-31|2007-04-05 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene SSA1/YAL005C -S000032057 CDS YAL004W 1 140760 141407 W 2011-02-03 1996-07-31|2007-04-05 -S000000004 ORF Verified YAL005C SSA1 Hsp70 family ATPase SSA1|YG100 chromosome 1 L000002069 1 141431 139503 C -1 2011-02-03 1996-07-31|2007-04-05 ATPase involved in protein folding and NLS-directed nuclear transport; member of HSP70 family; required for ubiquitin-dependent degradation of short-lived proteins; forms chaperone complex with Ydj1p; localized to nucleus, cytoplasm, cell wall; 98% identical to paralog Ssa2p with different functional specificity in propagation of yeast [URE3] prions, vacuolar-mediated degradations of gluconeogenesis enzymes; general targeting factor of Hsp104p to prion fibrils -S000032096 CDS YAL005C 1 141431 139503 C 2011-02-03 1996-07-31|2007-04-05 -S000000003 ORF Verified YAL003W EFB1 translation elongation factor 1 subunit beta|EF-1beta|eEF1Balpha|TEF5 chromosome 1 L000000542 1 142174 143160 W 2011-02-03 1996-07-31|1999-07-17 Translation elongation factor 1 beta; stimulates nucleotide exchange to regenerate EF-1 alpha-GTP for the next elongation cycle; part of the EF-1 complex, which facilitates binding of aminoacyl-tRNA to the ribosomal A site; human homolog EEF1B2 can complement yeast efb1 mutants -S000031941 CDS YAL003W 1 142174 142253 W 2011-02-03 1999-07-17|1996-07-31 -S000031942 CDS YAL003W 1 142620 143160 W 2011-02-03 1999-07-17|1996-07-31 -S000031943 intron YAL003W 1 142254 142619 W 2011-02-03 1999-07-17|1996-07-31 -S000007500 snoRNA_gene snR18 SNR18 chromosome 1 1 142367 142468 W 2011-02-03 2000-05-19|2007-05-08 C/D box small nucleolar RNA (snoRNA); commonly referred to as U18; guides 2'-O-methylation of large subunit (LSU) rRNA at positions A649 and C650 -S000036595 noncoding_exon snR18 1 142367 142468 W 2011-02-03 2000-05-19|2007-05-08 -S000000002 ORF Verified YAL002W VPS8 CORVET complex membrane-binding subunit VPS8|VPL8|VPT8|FUN15 chromosome 1 L000003013 1 143707 147531 W 2011-02-03 2004-01-14|1996-07-31 Membrane-binding component of the CORVET complex; involved in endosomal vesicle tethering and fusion in the endosome to vacuole protein targeting pathway; interacts with Vps21p; contains RING finger motif -S000031737 CDS YAL002W 1 143707 147531 W 2011-02-03 2004-01-14|1996-07-31 -S000121255 ARS ARS108 ARSI-147 chromosome 1 1 147398 147717 2014-11-18 2014-11-18|2007-03-07 Autonomously Replicating Sequence -S000000001 ORF Verified YAL001C TFC3 transcription factor TFIIIC subunit TFC3|tau 138|TSV115|FUN24 chromosome 1 L000000641|L000002287 1 151166 147594 C -1 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; part of the TauB domain of TFIIIC that binds DNA at the BoxB promoter sites of tRNA and similar genes; cooperates with Tfc6p in DNA binding; largest of six subunits of the RNA polymerase III transcription initiation factor complex (TFIIIC) -S000030735 CDS YAL001C 1 151006 147594 C 2011-02-03 1996-07-31 -S000030734 CDS YAL001C 1 151166 151097 C 2011-02-03 1996-07-31 -S000030736 intron YAL001C 1 151096 151007 C 2011-02-03 1996-07-31 -S000006463 centromere CEN1 CEN1 chromosome 1 L000000294 1 151465 151582 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome I centromere -S000077257 centromere_DNA_Element_I CEN1 1 151465 151474 W 2011-02-03 2004-10-04 -S000077258 centromere_DNA_Element_II CEN1 1 151475 151557 W 2011-02-03 2004-10-04 -S000077259 centromere_DNA_Element_III CEN1 1 151558 151582 W 2011-02-03 2004-10-04 -S000000063 ORF Verified YAR002W NUP60 FG-nucleoporin NUP60 chromosome 1 1 152257 153876 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier and is involved in gene tethering at the nuclear periphery; relocalizes to the cytosol in response to hypoxia; both NUP1 and NUP60 are homologous to human NUP153 -S000035473 CDS YAR002W 1 152257 153876 W 2011-02-03 1996-07-31 -S000002129 ORF Verified YAR002C-A ERP1 chromosome 1 L000004678 1 154724 154065 C 2011-02-03 1999-07-17 Member of the p24 family involved in ER to Golgi transport; role in misfolded protein quality control; forms heterotrimeric complex with Erp2p, Emp24p, and Erv25p; localized to COPII-coated vesicles; ERP1 has a paralog, ERP6, that arose from the whole genome duplication -S000032940 CDS YAR002C-A 1 154724 154065 C 2011-02-03 1999-07-17 -S000000064 ORF Verified YAR003W SWD1 COMPASS subunit protein SWD1|SAF49|CPS50|FUN16 chromosome 1 1 155005 156285 W 2011-02-03 1996-07-31 Subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3 on lysine 4 and is required in transcriptional silencing near telomeres; WD40 beta propeller superfamily member with similarity to mammalian Rbbp7 -S000035547 CDS YAR003W 1 155005 156285 W 2011-02-03 1996-07-31 -S000000065 ORF Verified YAR007C RFA1 replication factor A subunit protein RFA1|RPA70|RPA1|FUN3|BUF2 chromosome 1 L000000204|L000001620 1 158619 156754 C -3 2011-02-03 1996-07-31 Subunit of heterotrimeric Replication Protein A (RPA); RPA is a highly conserved single-stranded DNA binding protein involved in DNA replication, repair, and recombination; RPA protects against inappropriate telomere recombination, and upon telomere uncapping, prevents cell proliferation by a checkpoint-independent pathway; role in DNA catenation/decatenation pathway of chromosome disentangling; relocalizes to the cytosol in response to hypoxia -S000036676 CDS YAR007C 1 158619 156754 C 2011-02-03 1996-07-31 -S000000066 ORF Verified YAR008W SEN34 tRNA splicing endonuclease subunit SEN34|FUN4 chromosome 1 L000003973 1 158966 159793 W 2011-02-03 1996-07-31 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface; Sen34p contains the active site for tRNA 3' splice site cleavage and has similarity to Sen2p and to Archaeal tRNA splicing endonuclease -S000037450 CDS YAR008W 1 158966 159793 W 2011-02-03 1996-07-31 -S000077372 ARS ARS109 ARS101 ARSI-160 chromosome 1 1 159907 160127 2011-02-03 2004-10-18|2006-09-06 ARS containing multiple redundant ORC binding sites; ORC is the acronym for origin recognition complex -S000121251 ARS_consensus_sequence ARS109 1 159945 159935 C 2011-02-03 2007-03-07 -S000118986 ARS_consensus_sequence ARS109 1 159952 159966 W 2011-02-03 2006-10-02 -S000006788 long_terminal_repeat YARCdelta3 chromosome 1 1 160237 160105 C 2011-02-03 2000-05-19 Ty1 LTR -S000006789 long_terminal_repeat YARCdelta4 chromosome 1 1 160574 160238 C 2011-02-03 2000-05-19 Ty1 LTR -S000000067 transposable_element_gene YAR009C truncated gag-pol fusion protein|YARCTyB1-1 chromosome 1 1 164187 160597 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; Gag processing produces capsid proteins, Pol is cleaved to produce protease, reverse transcriptase and integrase activities; in YARCTy1-1 TYB is mutant and probably non-functional; protein product forms cytoplasmic foci upon DNA replication stress -S000037508 CDS YAR009C 1 164187 160597 C 2011-02-03 1996-07-31 -S000000068 transposable_element_gene YAR010C gag protein|YARCTyA1-1 chromosome 1 1 165866 164544 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; Gag processing produces capsid proteins; in YARCTy1-1 TYB is mutant and probably non-functional -S000030210 CDS YAR010C 1 165866 164544 C 2011-02-03 1996-07-31 -S000006792 LTR_retrotransposon YARCTy1-1 Ty1 chromosome 1 1 166162 160238 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C -S000006790 long_terminal_repeat YARCdelta5 chromosome 1 1 166162 165826 C 2011-02-03 2000-05-19 Ty1 LTR -S000006521 tRNA_gene tA(UGC)A TGA1 chromosome 1 L000003602|S000029601|L000002292 1 166267 166339 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine -S000034842 noncoding_exon tA(UGC)A 1 166267 166339 W 2011-02-03 2000-05-19 -S000000069 ORF Verified YAR014C BUD14 protein phosphatase regulator BUD14 chromosome 1 1 168871 166742 C 2011-02-03 2004-01-27|1996-07-31|2011-02-03 Protein involved in bud-site selection; Bud14p-Glc7p complex is a cortical regulator of dynein; forms a complex with Kel1p and Kel2p that regulates Bnr1p (formin) to affect actin cable assembly, cytokinesis, and polarized growth; diploid mutants display a random budding pattern instead of the wild-type bipolar pattern; relative distribution to the nucleus increases upon DNA replication stress -S000031457 CDS YAR014C 1 168871 166742 C 2011-02-03 2004-01-27|1996-07-31|2011-02-03 -S000000070 ORF Verified YAR015W ADE1 phosphoribosylaminoimidazolesuccinocarboxamide synthase chromosome 1 L000000031 1 169375 170295 W 4 2011-02-03 1996-07-31 N-succinyl-5-aminoimidazole-4-carboxamide ribotide synthetase; required for 'de novo' purine nucleotide biosynthesis; red pigment accumulates in mutant cells deprived of adenine; protein abundance increases in response to DNA replication stress -S000031548 CDS YAR015W 1 169375 170295 W 2011-02-03 1996-07-31 -S000000071 ORF Verified YAR018C KIN3 serine/threonine protein kinase KIN3|NPK1|FUN52 chromosome 1 L000000903 1 171703 170396 C 2011-02-03 1996-07-31 Nonessential serine/threonine protein kinase; possible role in DNA damage response; influences tolerance to high levels of ethanol -S000032711 CDS YAR018C 1 171703 170396 C 2011-02-03 1996-07-31 -S000028735 ORF Dubious YAR019W-A chromosome 1 1 174998 175330 W 2011-02-03 2003-07-29|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF CDC15/YAR019C -S000033379 CDS YAR019W-A 1 174998 175330 W 2011-02-03 2003-07-29|2011-02-03 -S000000072 ORF Verified YAR019C CDC15 serine/threonine protein kinase CDC15|LYT1 chromosome 1 L000000255 1 175135 172211 C 6 2011-02-03 1996-07-31|2011-02-03 Protein kinase of the Mitotic Exit Network; localized to the spindle pole bodies at late anaphase; promotes mitotic exit by directly switching on the kinase activity of Dbf2p; required for spindle disassembly after meiosis II; relocalizes to the cytoplasm upon DNA replication stress -S000032794 CDS YAR019C 1 175135 172211 C 2011-02-03 1996-07-31|2011-02-03 -S000114488 ARS ARS110 ARS110 ARSI-176 chromosome 1 1 176157 176404 2011-02-03 2006-09-06|2006-02-28 Autonomously Replicating Sequence; originally referred to as ADE1 ARS -S000178037 ARS_consensus_sequence ARS110 1 176232 176248 W 2014-11-18 2014-11-18 -S000000073 ORF Verified YAR020C PAU7 seripauperin PAU7 chromosome 1 1 177023 176856 C 2011-02-03 1996-07-31 Member of the seripauperin multigene family; active during alcoholic fermentation, regulated by anaerobiosis, inhibited by oxygen, repressed by heme -S000034578 CDS YAR020C 1 177023 176856 C 2011-02-03 1996-07-31 -S000000074 ORF Uncharacterized YAR023C DUP240 family protein chromosome 1 1 179820 179281 C 2011-02-03 1996-07-31|2011-02-03 Putative integral membrane protein; member of DUP240 gene family -S000035643 CDS YAR023C 1 179820 179281 C 2011-02-03 1996-07-31|2011-02-03 -S000006636 tRNA_gene tL(CAA)A SUP56 chromosome 1 L000003603 1 181141 181254 W 10 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations -S000033745 intron tL(CAA)A 1 181179 181210 W 2011-02-03 2000-05-19 -S000033743 noncoding_exon tL(CAA)A 1 181141 181178 W 2011-02-03 2000-05-19 -S000033744 noncoding_exon tL(CAA)A 1 181211 181254 W 2011-02-03 2000-05-19 -S000006719 tRNA_gene tS(AGA)A chromosome 1 L000003604 1 182603 182522 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032337 noncoding_exon tS(AGA)A 1 182603 182522 C 2011-02-03 2000-05-19 -S000006795 long_terminal_repeat YARWsigma1 chromosome 1 1 182620 182959 W 2011-02-03 2000-05-19 Ty3 LTR -S000006793 long_terminal_repeat YARWdelta6 chromosome 1 1 183142 183474 W 2011-02-03 2000-05-19 Ty1 LTR -S000000075 ORF Verified YAR027W UIP3 DUP240 family protein UIP3 chromosome 1 1 183770 184477 W 2011-02-03 1996-07-31 Putative integral membrane protein of unknown function; interacts with Ulp1p at the nuclear periphery; member of DUP240 gene family -S000036855 CDS YAR027W 1 183770 184477 W 2011-02-03 1996-07-31 -S000000076 ORF Uncharacterized YAR028W DUP240 family protein chromosome 1 1 184892 185596 W 2011-02-03 1996-07-31 Putative integral membrane protein; member of DUP240 gene family; GFP-fusion protein is induced in response to the DNA-damaging agent MMS -S000036899 CDS YAR028W 1 184892 185596 W 2011-02-03 1996-07-31 -S000000077 ORF Uncharacterized YAR029W DUP240 family protein chromosome 1 1 186321 186545 W 2011-02-03 1996-07-31 Member of DUP240 gene family but contains no transmembrane domains; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000036967 CDS YAR029W 1 186321 186545 W 2011-02-03 1996-07-31 -S000000078 ORF Verified YAR031W PRM9 pheromone-regulated DUP240 family protein PRM9 chromosome 1 1 186836 187732 W 2011-02-03 1996-07-31 Pheromone-regulated protein; contains 3 predicted transmembrane segments and an FF sequence, a motif involved in COPII binding; member of DUP240 gene family; PRM9 has a paralog, PRM8, that arose from a segmental duplication -S000030609 CDS YAR031W 1 186836 187732 W 2011-02-03 1996-07-31 -S000001821 ORF Dubious YAR030C chromosome 1 1 186853 186512 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YAR029W and the verified gene PRM9 -S000036694 CDS YAR030C 1 186853 186512 C 2011-02-03 1996-07-31 -S000000079 ORF Verified YAR033W MST28 DUP240 family protein MST28 chromosome 1 1 188107 188811 W 2011-02-03 1996-07-31 Putative integral membrane protein, involved in vesicle formation; forms complex with Mst27p; member of DUP240 gene family; binds COPI and COPII vesicles; MST28 has a paralog, MST27, that arose from a segmental duplication -S000030819 CDS YAR033W 1 188107 188811 W 2011-02-03 1996-07-31 -S000006794 long_terminal_repeat YARWdelta7 chromosome 1 1 189426 189757 W 2011-02-03 2000-05-19 Ty2 LTR -S000000080 ORF Verified YAR035W YAT1 carnitine O-acetyltransferase YAT1 chromosome 1 L000002497 1 190193 192256 W 2011-02-03 1996-07-31 Outer mitochondrial carnitine acetyltransferase; minor ethanol-inducible enzyme involved in transport of activated acyl groups from the cytoplasm into the mitochondrial matrix; phosphorylated -S000031976 CDS YAR035W 1 190193 192256 W 2011-02-03 1996-07-31 -S000028595 ORF Uncharacterized YAR035C-A chromosome 1 1 192417 192337 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; predicted to have a role in cell budding based on computational "guilt by association" analysis -S000031375 CDS YAR035C-A 1 192417 192337 C 2011-02-03 2003-07-29 -S000000081 ORF Verified YAR042W SWH1 oxysterol-binding protein related protein SWH1|OSH1|YAR044W chromosome 1 L000002249 1 192619 196185 W 2011-02-03 2003-09-27|2006-01-19|1996-07-31 Protein similar to mammalian oxysterol-binding protein; contains ankyrin repeats and FFAT motif; interacts with ER anchor Scs2p at the nucleus-vacuole junction; regulated by sterol binding; SWH1 has a paralog, OSH2, that arose from the whole genome duplication -S000035065 CDS YAR042W 1 192619 196185 W 2011-02-03 2003-09-27|2006-01-19|1996-07-31 -S000000083 ORF Dubious YAR047C chromosome 1 1 201787 201467 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031684 CDS YAR047C 1 201787 201467 C 2011-02-03 1996-07-31 -S000000084 ORF Verified YAR050W FLO1 flocculin FLO1|FLO4|FLO2 chromosome 1 L000000617|L000000616 1 203403 208016 W 44 2011-02-03 1998-09-02|1996-07-31 Lectin-like protein involved in flocculation; cell wall protein that binds mannose chains on the surface of other cells, confers floc-forming ability that is chymotrypsin sensitive and heat resistant; important for co-flocculation with other yeasts, mediating interaction with specific species; FLO1 has a paralog, FLO5, that arose from a segmental duplication -S000036444 CDS YAR050W 1 203403 208016 W 2011-02-03 1998-09-02|1996-07-31 -S000000085 ORF Dubious YAR053W chromosome 1 1 208367 208663 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037285 CDS YAR053W 1 208367 208663 W 2011-02-03 1996-07-31 -S000006791 long_terminal_repeat YARCdelta8 chromosome 1 1 209778 209448 C 2011-02-03 2000-05-19 Ty1 LTR -S000121256 ARS ARS111 ARSI-215 chromosome 1 1 214888 215644 2011-02-03 2007-03-07 Autonomously Replicating Sequence -S000178038 ARS_consensus_sequence ARS111 1 215028 215012 C 2014-11-18 2014-11-18 -S000000086 ORF Dubious YAR060C chromosome 1 1 217492 217157 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YAR060C has a paralog, YHR212C, that arose from a segmental duplication -S000032661 CDS YAR060C 1 217492 217157 C 2011-02-03 1996-07-31 -S000000087 pseudogene YAR061W YAR062W chromosome 1 1 218140 219145 W 2014-11-18 1996-07-31|2014-11-18 Pseudogenic fragment with similarity to flocculins; YAR061W has a paralog, YHR212W-A, that arose from a segmental duplication -S000033393 CDS YAR061W 1 218140 219145 W 2014-11-18 1996-07-31|2014-11-18 -S000000089 ORF Uncharacterized YAR064W chromosome 1 1 220198 220497 W 2011-02-03 1996-07-31 Pseudogenic fragment with similarity to flocculins; YAR064W has a paralog, YHR213W-B, that arose from a segmental duplication -S000033577 CDS YAR064W 1 220198 220497 W 2011-02-03 1996-07-31 -S000002144 ORF Uncharacterized YAR066W chromosome 1 1 221049 221660 W 2011-02-03 1996-07-31 Putative GPI protein; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; YAR066W has a paralog, YHR214W, that arose from a segmental duplication -S000034603 CDS YAR066W 1 221049 221660 W 2011-02-03 1996-07-31 -S000000091 ORF Uncharacterized YAR068W chromosome 1 1 222406 222891 W 2011-02-03 1996-07-31 Fungal-specific protein of unknown function; induced in respiratory-deficient cells; YAR068W has a paralog, YHR214W-A, that arose from a segmental duplication -S000035691 CDS YAR068W 1 222406 222891 W 2011-02-03 1996-07-31 -S000121257 ARS ARS112 ARSI-223 chromosome 1 1 222880 224046 2011-02-03 2007-03-07 Autonomously Replicating Sequence -S000000092 ORF Dubious YAR069C chromosome 1 1 224304 224011 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; YAR069C has a paralog, YHR214C-D, that arose from a segmental duplication -S000035758 CDS YAR069C 1 224304 224011 C 2011-02-03 1996-07-31 -S000000093 ORF Dubious YAR070C chromosome 1 1 224862 224563 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; YAR070C has a paralog, YHR214C-B, that arose from a segmental duplication -S000036733 CDS YAR070C 1 224862 224563 C 2011-02-03 1996-07-31 -S000000094 ORF Verified YAR071W PHO11 acid phosphatase PHO11 chromosome 1 L000001423 1 225460 226863 W 48 2011-02-03 1996-07-31 One of three repressible acid phosphatases; glycoprotein that is transported to the cell surface by the secretory pathway; induced by phosphate starvation and coordinately regulated by PHO4 and PHO2; PHO11 has a paralog, PHO12, that arose from a segmental duplication -S000036824 CDS YAR071W 1 225460 226863 W 2011-02-03 1996-07-31 -S000000095 ORF Dubious YAR073W IMD1 chromosome 1 1 227742 228953 W 2011-02-03 1996-07-31 Nonfunctional protein with homology to IMP dehydrogenase; blocked reading frame, located close to the telomere; not expressed at detectable levels; YAR073W and YAR075W comprise a continuous reading frame in most strains of S. cerevisiae; YAR073W/YAR075W together have a paralog, IMD2, that arose from a segmental duplication -S000037618 CDS YAR073W 1 227742 228953 W 2011-02-03 1996-07-31 -S000002145 ORF Dubious YAR075W chromosome 1 1 228844 229317 W 2011-02-03 1996-07-31 Non-functional protein with homology IMP dehydrogenase; YAR073W/IMD1 and YAR075W comprise a continuous reading frame in most strains of S. cerevisiae; YAR073W/YAR075W together have a paralog, IMD2, that arose from a segmental duplication -S000037740 CDS YAR075W 1 228844 229317 W 2011-02-03 1996-07-31 -S000028937 telomere TEL01R chromosome 1 1 229411 230218 W 51 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the right arm of Chromosome I; composed of an X element core sequence and a short terminal stretch of telomeric repeats -S000028938 telomeric_repeat TEL01R 1 230121 230218 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome I -S000028939 X_element TEL01R 1 229411 229871 W 2011-02-03 2003-09-09|2011-02-03 Telomeric X element Core sequence on the right arm of Chromosome I; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028438 ARS ARS1001 chromosome 10 10 65 577 2002-12-16 2002-12-16 Autonomously Replicating Sequence -S000028665 ORF Dubious YJL225W-A chromosome 10 10 829 1311 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene YJL225C -S000032490 CDS YJL225W-A 10 829 1311 W 2003-07-29 2003-07-29 -S000003760 ORF Uncharacterized YJL225C Y' element ATP-dependent helicase chromosome 10 10 6130 466 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase -S000033322 CDS YJL225C 10 4581 466 C 1996-07-31 1996-07-31 -S000033321 CDS YJL225C 10 6130 4970 C 1996-07-31 1996-07-31 -S000033323 intron YJL225C 10 4969 4582 C 1996-07-31 1996-07-31 -S000028439 ARS ARS1002 chromosome 10 10 7445 7943 2002-12-16 2002-12-16 Autonomously Replicating Sequence -S000028901 telomere TEL10L chromosome 10 10 7767 1 C -125 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome X; composed of an X element core sequence, X element combinatorial repeats, a long Y' element, and a short terminal stretch of telomeric repeats -S000028902 telomeric_repeat TEL10L 10 60 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome X -S000028903 X_element TEL10L 10 7767 7305 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome X; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028904 X_element_combinatorial_repeat TEL10L 10 7304 6932 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr X; contains a repeat of the D type with a group I mitochondrial bI4 intron insertion; formerly called SubTelomeric Repeats -S000028905 Y_prime_element TEL10L 10 6931 61 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome X; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YJL225C and YJL225W-A -S000003759 ORF Verified YJL223C PAU1 seripauperin PAU1 chromosome 10 L000001343 10 9138 8776 C 1996-07-31 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole; active during alcoholic fermentation; regulated by anaerobiosis, negatively regulated by oxygen; repressed by heme; identical to Pau14p -S000032445 CDS YJL223C 10 9138 8776 C 1996-07-31 1996-07-31 -S000028664 ORF Dubious YJL222W-B chromosome 10 10 9346 9483 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032489 CDS YJL222W-B 10 9346 9483 W 2003-07-29 2003-07-29 -S000028663 ORF Dubious YJL222W-A chromosome 10 10 9452 9679 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032488 CDS YJL222W-A 10 9452 9679 W 2003-07-29 2003-07-29 -S000003758 ORF Verified YJL222W VTH2 signal sequence-binding protein chromosome 10 10 11475 16124 W 1996-07-31 1996-07-31 Putative membrane glycoprotein; has strong similarity to Vth1p and Pep1p/Vps10p; may be involved in vacuolar protein sorting -S000032381 CDS YJL222W 10 11475 16124 W 1996-07-31 1996-07-31 -S000028440 ARS ARS1003 chromosome 10 10 16124 16762 2002-12-16 2002-12-16 Autonomously Replicating Sequence -S000003756 ORF Dubious YJL220W chromosome 10 10 18243 18695 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL221C/FSP2 -S000032208 CDS YJL220W 10 18243 18695 W 1996-07-31 1996-07-31 -S000003757 ORF Verified YJL221C IMA4 oligo-1,6-glucosidase IMA4|FSP2 chromosome 10 L000002901 10 18536 16767 C 1996-07-31 1996-07-31 Alpha-glucosidase; weak, but broad substrate specificity for alpha-1,4- and alpha-1,6-glucosides; member of IMA isomaltase family; not required for isomaltose utilization, but Ima4p overexpression allows the ima1 null mutant to grow on isomaltose; identical to IMA3 -S000032237 CDS YJL221C 10 18536 16767 C 1996-07-31 1996-07-31 -S000003755 ORF Verified YJL219W HXT9 hexose transporter HXT9 chromosome 10 L000000843 10 19497 21200 W 1996-07-31 1996-07-31 Putative hexose transporter that is nearly identical to Hxt11p; has similarity to major facilitator superfamily (MFS) transporters, expression of HXT9 is regulated by transcription factors Pdr1p and Pdr3p -S000031251 CDS YJL219W 10 19497 21200 W 1996-07-31 1996-07-31 -S000003754 ORF Uncharacterized YJL218W acetyltransferase chromosome 10 10 21973 22563 W 1996-07-31 1996-07-31 Putative acetyltransferase; similar to bacterial galactoside O-acetyltransferases; induced by oleate in an OAF1/PIP2-dependent manner; promoter contains an oleate response element consensus sequence; non-essential gene -S000031119 CDS YJL218W 10 21973 22563 W 1996-07-31 1996-07-31 -S000003753 ORF Verified YJL217W REE1 chromosome 10 10 23133 23729 W 1996-07-31 1996-07-31 Cytoplasmic protein involved in the regulation of enolase (ENO1); mRNA expression is induced by calcium shortage, copper deficiency (via Mac1p) and the presence of galactose (via Gal4p); mRNA expression is also regulated by the cell cycle -S000030093 CDS YJL217W 10 23133 23729 W 1996-07-31 1996-07-31 -S000028441 ARS ARS1004 chromosome 10 10 23662 24158 2002-12-16 2002-12-16 Autonomously Replicating Sequence -S000178121 ARS_consensus_sequence ARS1004 10 23819 23835 W 2014-11-18 2014-11-18 -S000003752 ORF Verified YJL216C IMA5 oligo-1,6-glucosidase IMA5 chromosome 10 10 26086 24341 C 1996-07-31 1996-07-31 Alpha-glucosidase; specificity for isomaltose, maltose, and palatinose, but not alpha-methylglucoside; most distant member of the IMA isomaltase family, but with similar catalytic properties as Ima1p and Ima2p; not required for isomaltose utilization, but Ima5p overexpression allows the ima1 null mutant to grow on isomaltose; can cleave alpha-1,3 linkage of nigerose and turanose and alpha-1,5 linkage of leucrose and is very sensitive to temperature in vitro -S000029921 CDS YJL216C 10 26086 24341 C 1996-07-31 1996-07-31 -S000003751 ORF Dubious YJL215C chromosome 10 10 26771 26412 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037269 CDS YJL215C 10 26771 26412 C 1996-07-31 1996-07-31 -S000003750 ORF Verified YJL214W HXT8 hexose transporter HXT8 chromosome 10 L000000842 10 26887 28596 W 1996-07-31 1996-07-31 Protein of unknown function with similarity to hexose transporters; expression is induced by low levels of glucose and repressed by high levels of glucose -S000037229 CDS YJL214W 10 26887 28596 W 1996-07-31 1996-07-31 -S000003749 ORF Verified YJL213W chromosome 10 10 32163 33158 W 1996-07-31 1996-07-31 Protein of unknown function that may interact with ribosomes; periodically expressed during the yeast metabolic cycle; phosphorylated in vitro by the mitotic exit network (MEN) kinase complex, Dbf2p/Mob1p -S000037130 CDS YJL213W 10 32163 33158 W 1996-07-31 1996-07-31 -S000003748 ORF Verified YJL212C OPT1 oligopeptide transporter OPT1|GSH11|HGT1 chromosome 10 10 36249 33850 C 1996-07-31 1996-07-31 Proton-coupled oligopeptide transporter of the plasma membrane; also transports glutathione and phytochelatin; member of the OPT family -S000037000 CDS YJL212C 10 36249 33850 C 1996-07-31 1996-07-31 -S000003746 ORF Verified YJL210W PEX2 ubiquitin-protein ligase peroxin 2|PAS5|CRT1 chromosome 10 L000000422|L000003076 10 36919 37734 W 1996-07-31 1996-07-31 RING-finger peroxin and E3 ubiquitin ligase; peroxisomal membrane protein with a C-terminal zinc-binding RING domain, forms translocation subcomplex with Pex10p and Pex12p which functions in peroxisomal matrix protein import -S000036292 CDS YJL210W 10 36919 37734 W 1996-07-31 1996-07-31 -S000003747 ORF Dubious YJL211C chromosome 10 10 37200 36757 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL210W/PEX2 -S000036326 CDS YJL211C 10 37200 36757 C 1996-07-31 1996-07-31 -S000003745 ORF Verified YJL209W CBP1 chromosome 10 L000000224 10 38005 39969 W 1996-07-31 1996-07-31 Mitochondrial protein, regulator of COB mRNA stability and translation; interacts with the 5'-untranslated region of the COB mRNA; found in a complex at the inner membrane along with Pet309p; localizes to mitochondrial foci upon DNA replication stress -S000034944 CDS YJL209W 10 38005 39969 W 1996-07-31 1996-07-31 -S000003744 ORF Verified YJL208C NUC1 ribonuclease chromosome 10 L000001283 10 41183 40194 C 1996-07-31 1996-07-31 Major mitochondrial nuclease; has RNAse and DNA endo- and exonucleolytic activities; roles in mitochondrial recombination, apoptosis and maintenance of polyploidy; involved in fragmentation of genomic DNA during PND (programmed nuclear destruction); encodes ortholog of mammalian endoG -S000033945 CDS YJL208C 10 41183 40194 C 1996-07-31 1996-07-31 -S000003743 ORF Verified YJL207C LAA1 chromosome 10 10 47433 41389 C 1996-07-31 1996-07-31 AP-1 accessory protein; colocalizes with clathrin to the late-Golgi apparatus; involved in TGN-endosome transport; physically interacts with AP-1; similar to the mammalian p200; may interact with ribosomes; YJL207C is a non-essential gene -S000033803 CDS YJL207C 10 47433 41389 C 1996-07-31 1996-07-31 -S000003741 ORF Uncharacterized YJL206C chromosome 10 10 49935 47659 C 1996-07-31 1996-07-31 Putative protein of unknown function; similar to transcriptional regulators from the Zn[2]-Cys[6] binuclear cluster protein family; mRNA is weakly cell cycle regulated, peaking in S phase; induced rapidly upon MMS treatment -S000033077 CDS YJL206C 10 49935 47659 C 1996-07-31 1996-07-31 -S000003742 ORF Verified YJL205C NCE101 YJL205C-A|YJL206C-A|NCE1 chromosome 10 L000003097 10 50443 50139 C 1996-07-31 1996-07-31 Protein of unknown function; involved in secretion of proteins that lack classical secretory signal sequences; SWAT-GFP and mCherry fusion proteins localize to the cytosol -S000034430 CDS YJL205C 10 50268 50139 C 1996-07-31 1996-07-31 -S000034429 CDS YJL205C 10 50443 50412 C 1996-07-31 1996-07-31 -S000034431 intron YJL205C 10 50411 50269 C 1996-07-31 1996-07-31 -S000003740 ORF Verified YJL204C RCY1 chromosome 10 10 53151 50629 C 1996-07-31 1996-07-31 F-box protein involved in recycling endocytosed proteins; involved in recycling plasma membrane proteins internalized by endocytosis; localized to sites of polarized growth; direct interaction with C-terminal cytoplasmic region of Drs2p plays an important role for Drs2p function in endocytic recycling pathway -S000032878 CDS YJL204C 10 53151 50629 C 1996-07-31 1996-07-31 -S000003739 ORF Verified YJL203W PRP21 SPP91 chromosome 10 L000001507 10 53341 54183 W 1996-07-31 1996-07-31 Subunit of the SF3a splicing factor complex; required for spliceosome assembly -S000032839 CDS YJL203W 10 53341 54183 W 1996-07-31 1996-07-31 -S000003738 ORF Dubious YJL202C chromosome 10 10 54290 53943 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 3' end of essential PRP21 gene encoding a subunit of the SF3a splicing factor complex -S000031876 CDS YJL202C 10 54290 53943 C 1996-07-31 1996-07-31 -S000003737 ORF Verified YJL201W ECM25 chromosome 10 L000003897 10 54379 56178 W 1996-07-31 1996-07-31 Non-essential protein of unknown function; promoter contains a consensus binding sequence for factor Abf1p -S000031819 CDS YJL201W 10 54379 56178 W 1996-07-31 1996-07-31 -S000003736 ORF Verified YJL200C ACO2 aconitate hydratase ACO2 chromosome 10 10 58813 56444 C 1996-07-31 1996-07-31 Putative mitochondrial aconitase isozyme; similarity to Aco1p, an aconitase required for the TCA cycle; expression induced during growth on glucose, by amino acid starvation via Gcn4p, and repressed on ethanol -S000031641 CDS YJL200C 10 58813 56444 C 1996-07-31 1996-07-31 -S000006743 tRNA_gene tT(AGU)J chromosome 10 L000003628 10 59172 59100 C 2000-05-19 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000032173 noncoding_exon tT(AGU)J 10 59172 59100 C 2000-05-19 2000-05-19 -S000007027 long_terminal_repeat YJLWdelta1 chromosome 10 10 59505 59784 W 2011-02-03 2000-05-19 Ty1 LTR -S000003735 ORF Uncharacterized YJL199C MBB1 chromosome 10 10 60182 59856 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains, not conserved in closely related Saccharomyces species; protein detected in large-scale protein-protein interaction studies; YJL199C is not an essential gene -S000035098 CDS YJL199C 10 60182 59856 C 2011-02-03 1996-07-31 -S000003734 ORF Verified YJL198W PHO90 SPX domain-containing inorganic phosphate transporter chromosome 10 10 60844 63489 W 2011-02-03 1996-07-31 Low-affinity phosphate transporter; acts upstream of Pho81p in regulation of the PHO pathway; deletion of pho84, pho87, pho89, pho90, and pho91 causes synthetic lethality; transcription independent of Pi and Pho4p activity; overexpression results in vigorous growth; PHO90 has a paralog, PHO87, that arose from the whole genome duplication -S000034201 CDS YJL198W 10 60844 63489 W 2011-02-03 1996-07-31 -S000003733 ORF Verified YJL197W UBP12 putative ubiquitin-specific protease UBP12 chromosome 10 L000003033 10 63805 67569 W 2011-02-03 1996-07-31 Ubiquitin-specific protease; cleaves ubiquitin from ubiquitinated proteins; present in the nucleus and cytoplasm -S000034104 CDS YJL197W 10 63805 67569 W 2011-02-03 1996-07-31 -S000028839 ORF Dubious YJL197C-A chromosome 10 10 66086 65805 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL197C/UBP12 -S000034494 CDS YJL197C-A 10 66086 65805 C 2011-02-03 2003-07-29 -S000028442 ARS ARS1005 chromosome 10 10 67663 67736 2014-11-18 2002-12-16|2014-11-18 Autonomously Replicating Sequence -S000003732 ORF Verified YJL196C ELO1 fatty acid elongase ELO1 chromosome 10 L000003442 10 68782 67850 C 2011-02-03 1996-07-31 Elongase I, medium-chain acyl elongase; catalyzes carboxy-terminal elongation of unsaturated C12-C16 fatty acyl-CoAs to C16-C18 fatty acids; ELO1 has a paralog, ELO2, that arose from the whole genome duplication -S000033953 CDS YJL196C 10 68782 67850 C 2011-02-03 1996-07-31 -S000003730 ORF Verified YJL194W CDC6 AAA family ATPase CDC6 chromosome 10 L000000246 10 69338 70879 W -124 2011-02-03 1996-07-31 Essential ATP-binding protein required for DNA replication; component of the pre-replicative complex (pre-RC) which requires ORC to associate with chromatin and is in turn required for Mcm2-7p DNA association; homologous to S. pombe Cdc18p; relocalizes from nucleus to cytoplasm upon DNA replication stress; degraded in response to plasma membrane stress -S000033118 CDS YJL194W 10 69338 70879 W 2011-02-03 1996-07-31 -S000003731 ORF Dubious YJL195C chromosome 10 10 69942 69241 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL194W/CDC6 -S000033155 CDS YJL195C 10 69942 69241 C 2011-02-03 1996-07-31 -S000003729 ORF Uncharacterized YJL193W chromosome 10 10 71366 72574 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to encode a triose phosphate transporter subfamily member based on phylogenetic analysis; similar to YOR307C/SLY41; deletion mutant has a respiratory growth defect -S000033028 CDS YJL193W 10 71366 72574 W 2011-02-03 1996-07-31 -S000003728 ORF Verified YJL192C SOP4 EMC7 chromosome 10 10 73414 72710 C 2011-02-03 1996-07-31 ER-membrane protein; subunit of evolutionarily conserved EMC (Endoplasmic Reticulum Membrane Complex) implicated in ERAD (ER-associated degradation) and proper assembly of multi-pass transmembrane (TM) proteins; EMC acts in yeast as an ER-mitochondria tether that interacts with outer membrane protein Tom5 of TOM (Translocase of the Mitochondrial Outer Membrane) complex; suppressor of pma1-7, deletion of SOP4 slows down export of wild-type Pma1p and Pma1-7 from the ER -S000032055 CDS YJL192C 10 73414 72710 C 2011-02-03 1996-07-31 -S000003727 ORF Verified YJL191W RPS14B uS11|ribosomal 40S subunit protein S14B|S11|rp59B|S14B|CRY2 chromosome 10 L000000424 10 73787 74611 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; required for ribosome assembly and 20S pre-rRNA processing; mutations confer cryptopleurine resistance; homologous to mammalian ribosomal protein S14 and bacterial S11; RPS14B has a paralog, RPS14A, that arose from the whole genome duplication -S000032004 CDS YJL191W 10 73787 73796 W 2011-02-03 1996-07-31 -S000032005 CDS YJL191W 10 74205 74611 W 2011-02-03 1996-07-31 -S000032006 intron YJL191W 10 73797 74204 W 2011-02-03 1996-07-31 -S000003726 ORF Verified YJL190C RPS22A uS8|ribosomal 40S subunit protein S22A|S8|rp50|YS22|S24A|S22A|RPS24 chromosome 10 L000003150|L000001760 10 75302 74910 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S15A and bacterial S8; RPS22A has a paralog, RPS22B, that arose from the whole genome duplication -S000031736 CDS YJL190C 10 75302 74910 C 2011-02-03 1996-07-31 -S000003725 ORF Verified YJL189W RPL39 eL39|ribosomal 60S subunit protein L39|L39e|YL40|L46|L39|SPB2|RPL46 chromosome 10 L000001737 10 75933 76474 W 2011-02-03 1996-07-31|2011-02-03 Ribosomal 60S subunit protein L39; required for ribosome biogenesis; loss of both Rpl31p and Rpl39p confers lethality; also exhibits genetic interactions with SIS1 and PAB1; homologous to mammalian ribosomal protein L39, no bacterial homolog -S000030844 CDS YJL189W 10 75933 75938 W 2011-02-03 1996-07-31 -S000030845 CDS YJL189W 10 76325 76474 W 2011-02-03 1996-07-31 -S000030846 intron YJL189W 10 75939 76324 W 2011-02-03 1996-07-31|2011-02-03 -S000003724 ORF Dubious YJL188C BUD19 chromosome 10 10 76510 76202 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 88% of ORF overlaps the verified gene RPL39; diploid mutant displays a weak budding pattern phenotype in a systematic assay -S000037873 CDS YJL188C 10 76510 76202 C 2011-02-03 1996-07-31|2011-02-03 -S000003723 ORF Verified YJL187C SWE1 tyrosine protein kinase SWE1|WEE1 chromosome 10 L000002248 10 79262 76803 C 2011-02-03 1996-07-31 Protein kinase that regulates the G2/M transition; negative regulator of the Cdc28p kinase; morphogenesis checkpoint kinase; positive regulator of sphingolipid biosynthesis via Orm2p; phosphorylates a tyrosine residue in the N-terminus of Hsp90 in a cell-cycle associated manner, thus modulating the ability of Hsp90 to chaperone a selected clientele; localizes to the nucleus and to the daughter side of the mother-bud neck; homolog of S. pombe Wee1p; potential Cdc28p substrate -S000037770 CDS YJL187C 10 79262 76803 C 2011-02-03 1996-07-31 -S000003722 ORF Verified YJL186W MNN5 alpha-1,2-mannosyltransferase MNN5 chromosome 10 L000004918 10 80155 81915 W 2011-02-03 1996-07-31|2011-02-03 Alpha-1,2-mannosyltransferase; responsible for addition of the second alpha-1,2-linked mannose of the branches on the mannan backbone of oligosaccharides, localizes to an early Golgi compartment -S000037744 CDS YJL186W 10 80155 81915 W 2011-02-03 1996-07-31|2011-02-03 -S000003721 ORF Verified YJL185C ATG36 chromosome 10 10 82976 82095 C 2011-02-03 1996-07-31 Pex3p interacting protein, required for pexophagy; interacts with Atg8p and Atg11p; mRNA is weakly cell cycle regulated, peaking in G2 phase; YJL185C is a non-essential gene -S000036951 CDS YJL185C 10 82976 82095 C 2011-02-03 1996-07-31 -S000003720 ORF Verified YJL184W GON7 chromatin DNA-binding EKC/KEOPS complex subunit GON7|PCC2|LDB6 chromosome 10 10 83448 83819 W 2011-02-03 1996-07-31 Component of the EKC/KEOPS protein complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; implicated in osmotic stress response; other complex members are Kae1p, Cgi121p, Pcc1p, and Bud32p -S000036918 CDS YJL184W 10 83448 83819 W 2011-02-03 1996-07-31 -S000003719 ORF Verified YJL183W MNN11 alpha-1,6-mannosyltransferase chromosome 10 L000004260 10 84068 85336 W 2011-02-03 1996-07-31|2011-02-03 Subunit of a Golgi mannosyltransferase complex; this complex also contains Anp1p, Mnn9p, Mnn10p, and Hoc1p, and mediates elongation of the polysaccharide mannan backbone; has homology to Mnn10p -S000036862 CDS YJL183W 10 84068 85336 W 2011-02-03 1996-07-31|2011-02-03 -S000003717 ORF Uncharacterized YJL181W RBH1 RBH1 chromosome 10 10 85660 87495 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression is cell-cycle regulated as shown by microarray analysis; potential regulatory target of Mbp1p, which binds to the YJL181W promoter region; contains a PH-like domain; RBH1 has a paralog, RBH2, that arose from the whole genome duplication -S000035872 CDS YJL181W 10 85660 87495 W 2011-02-03 1996-07-31 -S000003718 ORF Dubious YJL182C chromosome 10 10 85752 85435 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YJL181W -S000035944 CDS YJL182C 10 85752 85435 C 2011-02-03 1996-07-31 -S000003716 ORF Verified YJL180C ATP12 ATP synthase complex assembly protein ATP12 chromosome 10 L000000149 10 88560 87583 C 2011-02-03 1996-07-31 Assembly factor for F1 sector of mitochondrial F1F0 ATP synthase; conserved protein; required for assembly of alpha and beta subunits into F1 sector of mitochondrial F1F0 ATP synthase; human homolog ATPAF2 can complement yeast atp12 mutant; mutation of human homolog reduces active ATP synthase levels and is associated with the disorder ATPAF2 deficiency -S000035717 CDS YJL180C 10 88560 87583 C 2011-02-03 1996-07-31 -S000003715 ORF Verified YJL179W PFD1 prefolding complex chaperone subunit|GIM6 chromosome 10 L000004367 10 88787 89116 W 2011-02-03 1996-07-31|2011-02-03 Subunit of heterohexameric prefoldin; prefoldin binds cytosolic chaperonin and transfers target proteins to it; involved in the biogenesis of actin and of alpha- and gamma-tubulin; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation -S000034696 CDS YJL179W 10 88787 89116 W 2011-02-03 1996-07-31|2011-02-03 -S000003714 ORF Verified YJL178C ATG27 ETF1 chromosome 10 10 90097 89282 C 2011-02-03 2004-02-12|1996-07-31 Type I membrane protein involved in autophagy and the Cvt pathway; may be involved in membrane delivery to the phagophore assembly site -S000033739 CDS YJL178C 10 90097 89282 C 2011-02-03 2004-02-12|1996-07-31 -S000003713 ORF Verified YJL177W RPL17B uL22|ribosomal 60S subunit protein L17B|L22|YL17|L20B|L17B chromosome 10 L000004457 10 90786 91657 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L17B; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; homologous to mammalian ribosomal protein L17 and bacterial L22; RPL17B has a paralog, RPL17A, that arose from the whole genome duplication -S000033683 CDS YJL177W 10 90786 91094 W 2011-02-03 1996-07-31 -S000033684 CDS YJL177W 10 91412 91657 W 2011-02-03 1996-07-31 -S000033685 intron YJL177W 10 91095 91411 W 2011-02-03 1996-07-31 -S000003711 ORF Dubious YJL175W chromosome 10 10 94049 94561 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; deletion confers resistance to cisplatin, hypersensitivity to 5-fluorouracil, and growth defect at high pH with high calcium; overlaps gene for SWI3 transcription factor -S000033497 CDS YJL175W 10 94049 94561 W 2011-02-03 1996-07-31 -S000003712 ORF Verified YJL176C SWI3 HAF2|TYE2 chromosome 10 L000002251 10 94530 92053 C 2011-02-03 1996-07-31 Subunit of the SWI/SNF chromatin remodeling complex; SWI/SNF regulates transcription by remodeling chromosomes; contains SANT domain that is required for SWI/SNF assembly; is essential for displacement of histone H2A-H2B dimers during ATP-dependent remodeling; required for transcription of many genes, including ADH1, ADH2, GAL1, HO, INO1 and SUC2; relocates to the cytosol under hypoxic conditions -S000033535 CDS YJL176C 10 94530 92053 C 2011-02-03 1996-07-31 -S000003710 ORF Verified YJL174W KRE9 chromosome 10 L000000916 10 95092 95922 W -111.26 2011-02-03 1996-07-31 Glycoprotein involved in cell wall beta-glucan assembly; null mutation leads to severe growth defects, aberrant multibudded morphology, and mating defects -S000032753 CDS YJL174W 10 95092 95922 W 2011-02-03 1996-07-31 -S000003709 ORF Verified YJL173C RFA3 RPA14|RPA3 chromosome 10 L000001622 10 96529 96161 C 2011-02-03 1996-07-31 Subunit of heterotrimeric Replication Protein A (RPA); RPA is a highly conserved single-stranded DNA binding protein complex involved in DNA replication, repair, recombination; RPA protects against inappropriate telomere recombination, and upon telomere uncapping, prevents cell proliferation by a checkpoint-independent pathway; with Sgs1p-Top2p-Rmi1p, stimulates DNA catenation/decatenation activity of Top3p; protein abundance increases in response to DNA replication stress -S000032609 CDS YJL173C 10 96529 96161 C 2011-02-03 1996-07-31 -S000003708 ORF Verified YJL172W CPS1 Gly-Xaa carboxypeptidase chromosome 10 L000000403 10 97737 99467 W 2011-02-03 1996-07-31 Vacuolar carboxypeptidase S; expression is induced under low-nitrogen conditions -S000032538 CDS YJL172W 10 97737 99467 W 2011-02-03 1996-07-31 -S000028443 ARS ARS1006 chromosome 10 10 99458 99678 2014-11-18 2002-12-16|2014-11-18|2011-02-03 Autonomously Replicating Sequence -S000178122 ARS_consensus_sequence ARS1006 10 99617 99601 C 2014-11-18 2014-11-18 -S000003707 ORF Verified YJL171C TOH1 chromosome 10 10 100894 99704 C 2011-02-03 1996-07-31|2011-02-03 GPI-anchored cell wall protein of unknown function; induced in response to cell wall damaging agents and by mutations in genes involved in cell wall biogenesis; sequence similarity to YBR162C/TOS1, a covalently bound cell wall protein; protein abundance increases in response to DNA replication stress -S000031523 CDS YJL171C 10 100894 99704 C 2011-02-03 1996-07-31|2011-02-03 -S000003706 ORF Verified YJL170C ASG7 chromosome 10 L000004055 10 101779 101150 C 2011-02-03 1996-07-31|2006-01-18 Protein that regulates signaling from G protein beta subunit Ste4p; contributes to relocalization of Ste4p within the cell; specific to a-cells and induced by alpha-factor -S000031474 CDS YJL170C 10 101779 101150 C 2011-02-03 1996-07-31|2006-01-18 -S000003705 ORF Dubious YJL169W chromosome 10 10 102099 102467 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL168C/SET2 -S000030718 CDS YJL169W 10 102099 102467 W 2011-02-03 1996-07-31|2011-02-03 -S000003704 ORF Verified YJL168C SET2 histone methyltransferase SET2|KMT3|EZL1 chromosome 10 L000003090 10 104428 102227 C 2011-02-03 1996-07-31|2011-02-03 Histone methyltransferase with a role in transcriptional elongation; methylates H3 lysine 36 (H3K36), which suppresses incorporation of acetylated histones and signals for the deacetylation of these histones within transcribed genes; associates with the C-terminal domain(CTD) of Rpo21p; H3K36me3 (trimethylation) requires Spt6p, proline 38 on H3, CTD of Rpo21p, Ctk1p, and C-terminal SRI domain of Ste2p; relocalizes to the cytosol in response to hypoxia -S000030590 CDS YJL168C 10 104428 102227 C 2011-02-03 1996-07-31|2011-02-03 -S000003703 ORF Verified YJL167W ERG20 bifunctional (2E,6E)-farnesyl diphosphate synthase/dimethylallyltranstransferase|FPP1|FDS1|BOT3 chromosome 10 L000000579 10 105014 106072 W 2011-02-03 1996-07-31 Farnesyl pyrophosphate synthetase; has both dimethylallyltranstransferase and geranyltranstransferase activities; catalyzes the formation of C15 farnesyl pyrophosphate units for isoprenoid and sterol biosynthesis -S000030519 CDS YJL167W 10 105014 106072 W 2011-02-03 1996-07-31 -S000003702 ORF Verified YJL166W QCR8 ubiquinol--cytochrome-c reductase subunit 8|COR5 chromosome 10 L000001548 10 106434 106718 W 2011-02-03 1996-07-31 Subunit 8 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; oriented facing the intermembrane space; expression is regulated by Abf1p and Cpf1p -S000030370 CDS YJL166W 10 106434 106718 W 2011-02-03 1996-07-31 -S000003701 ORF Verified YJL165C HAL5 protein kinase HAL5 chromosome 10 L000000751 10 109461 106894 C 2011-02-03 1996-07-31 Putative protein kinase; overexpression increases sodium and lithium tolerance, whereas gene disruption increases cation and low pH sensitivity and impairs potassium uptake, suggesting a role in regulation of Trk1p and/or Trk2p transporters; HAL5 has a paralog, KKQ8, that arose from the whole genome duplication -S000037517 CDS YJL165C 10 109461 106894 C 2011-02-03 1996-07-31 -S000003700 ORF Verified YJL164C TPK1 cAMP-dependent protein kinase catalytic subunit TPK1|SRA3|PKA1 chromosome 10 L000002045 10 111159 109966 C -106 2011-02-03 1996-07-31|2011-02-03 cAMP-dependent protein kinase catalytic subunit; promotes vegetative growth in response to nutrients via the Ras-cAMP signaling pathway; inhibited by regulatory subunit Bcy1p in the absence of cAMP; phosphorylates and inhibits Whi3p to promote G1/S phase passage; partially redundant with Tpk2p and Tpk3p; phosphorylates pre-Tom40p, which impairs its import into mitochondria under non-respiratory conditions; TPK1 has a paralog, TPK3, that arose from the whole genome duplication -S000037409 CDS YJL164C 10 111159 109966 C 2011-02-03 1996-07-31|2011-02-03 -S000003699 ORF Uncharacterized YJL163C chromosome 10 10 113333 111666 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000036682 CDS YJL163C 10 113333 111666 C 2011-02-03 1996-07-31 -S000028444 ARS ARS1007 chromosome 10 10 113678 113749 2014-11-18 2002-12-16|2014-11-18 Autonomously Replicating Sequence -S000178123 ARS_consensus_sequence ARS1007 10 113744 113728 C 2014-11-18 2014-11-18 -S000003698 ORF Verified YJL162C JJJ2 chromosome 10 10 115629 113878 C 2011-02-03 1996-07-31|2006-01-18 Protein of unknown function; contains a J-domain, which is a region with homology to the E. coli DnaJ protein -S000036580 CDS YJL162C 10 115629 113878 C 2011-02-03 1996-07-31|2006-01-18 -S000006557 tRNA_gene tE(UUC)J chromosome 10 L000003627 10 116010 115939 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin -S000035988 noncoding_exon tE(UUC)J 10 116010 115939 C 2011-02-03 2000-05-19 -S000003697 ORF Uncharacterized YJL161W FMP33 chromosome 10 10 117245 117787 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000036525 CDS YJL161W 10 117245 117787 W 2011-02-03 1996-07-31 -S000003696 ORF Uncharacterized YJL160C PIR5 beta-1,3-glucan linked protein chromosome 10 10 118825 117962 C 2011-02-03 2004-02-19|1996-07-31 Putative protein of unknown function; member of the PIR (Proteins with Internal Repeats) family of cell wall proteins; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, and mCherry fusion localizes to the vacuole; non-essential gene that is required for sporulation; mRNA is weakly cell cycle regulated, peaking in mitosis; YJL160C has a paralog, PIR1, that arose from the whole genome duplication -S000035585 CDS YJL160C 10 118825 117962 C 2011-02-03 2004-02-19|1996-07-31 -S000003695 ORF Verified YJL159W HSP150 heat shock protein HSP150|PIR2|ORE1|CCW7 chromosome 10 L000000824|L000001442 10 120449 121690 W 2011-02-03 2004-02-18|1996-07-31|2006-10-04 O-mannosylated heat shock protein; secreted and covalently attached to the cell wall via beta-1,3-glucan and disulfide bridges; required for cell wall stability; induced by heat shock, oxidative stress, and nitrogen limitation; HSP150 has a paralog, PIR3, that arose from the whole genome duplication -S000035769 CDS YJL159W 10 120449 121690 W 2011-02-03 2004-02-18|1996-07-31|2006-10-04 -S000003694 ORF Verified YJL158C CIS3 SCW8|CCW5|PIR4|CCW11 chromosome 10 S000029072|L000003951|L000004553|S000029439|L000004569 10 122948 122265 C 2011-02-03 1996-07-31 Mannose-containing glycoprotein constituent of the cell wall; member of the PIR (proteins with internal repeats) family -S000035606 CDS YJL158C 10 122948 122265 C 2011-02-03 1996-07-31 -S000003693 ORF Verified YJL157C FAR1 cyclin-dependent protein serine/threonine kinase inhibiting protein FAR1 chromosome 10 L000000600 10 126328 123836 C 2011-02-03 1996-07-31 CDK inhibitor and nuclear anchor; during the cell cycle Far1p sequesters the GEF Cdc24p in the nucleus; phosphorylation by Cdc28p-Cln results in SCFCdc4 complex-mediated ubiquitin-dependent degradation, releasing Cdc24p for export and activation of GTPase Cdc42p; in response to pheromone, phosphorylation of Far1p by MAPK Fus3p results in association with, and inhibition of Cdc28p-Cln, as well as Msn5p mediated nuclear export of Far1p-Cdc24p, targeting Cdc24p to polarity sites -S000035524 CDS YJL157C 10 126328 123836 C 2011-02-03 1996-07-31 -S000007613 ORF Dubious YJL156W-A chromosome 10 10 126604 126825 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037190 CDS YJL156W-A 10 126604 126825 W 2011-02-03 2001-02-26 -S000003692 ORF Verified YJL156C SSY5 RAA3 chromosome 10 L000003187|S000029401|L000004045 10 128952 126853 C 2011-02-03 1996-07-31|2009-02-18 Serine protease of SPS plasma membrane amino acid sensor system; contains an inhibitory domain that dissociates in response to extracellular amino acids, freeing a catalytic domain to activate transcription factor Stp1p; other members are Ssy1p and Ptr3p -S000034507 CDS YJL156C 10 128952 126853 C 2011-02-03 1996-07-31|2009-02-18 -S000003691 ORF Verified YJL155C FBP26 fructose-2,6-bisphosphatase chromosome 10 L000000606 10 130643 129285 C 2011-02-03 1996-07-31 Fructose-2,6-bisphosphatase, required for glucose metabolism; protein abundance increases in response to DNA replication stress -S000034402 CDS YJL155C 10 130643 129285 C 2011-02-03 1996-07-31 -S000003690 ORF Verified YJL154C VPS35 retromer subunit VPS35|VPT7|GRD9 chromosome 10 L000002477 10 133935 131101 C -102 2011-02-03 1996-07-31 Endosomal subunit of membrane-associated retromer complex; required for retrograde transport; receptor that recognizes retrieval signals on cargo proteins, forms subcomplex with Vps26p and Vps29p that selects cargo proteins for retrieval; interacts with Ypt7p; overexpression of wild-type human VPS35 or Parkinson's-associated vps35-D686N or vps35-P299S variants complements Ni2+ resistance and Cd2+ sensitivity of yeast vps35 null mutant -S000034312 CDS YJL154C 10 133935 131101 C 2011-02-03 1996-07-31 -S000003689 ORF Verified YJL153C INO1 inositol-3-phosphate synthase INO1|APR1 chromosome 10 L000000867 10 135933 134332 C -101 2011-02-03 2003-09-22|1996-07-31 Inositol-3-phosphate synthase; involved in synthesis of inositol phosphates and inositol-containing phospholipids; transcription is coregulated with other phospholipid biosynthetic genes by Ino2p and Ino4p, which bind the UASINO DNA element -S000033398 CDS YJL153C 10 135933 134332 C 2011-02-03 2003-09-22|1996-07-31 -S000003688 ORF Dubious YJL152W chromosome 10 10 136174 136533 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033364 CDS YJL152W 10 136174 136533 W 2011-02-03 1996-07-31 -S000003687 ORF Verified YJL151C SNA3 chromosome 10 10 136773 136372 C 2011-02-03 1996-07-31 Protein involved in efficient MVB sorting of proteins to the vacuole; may function as an RSP5 adapter protein for MVB cargos; integral membrane protein localized to vacuolar intralumenal vesicles -S000033267 CDS YJL151C 10 136773 136372 C 2011-02-03 1996-07-31 -S000003686 ORF Dubious YJL150W chromosome 10 10 137123 137425 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033233 CDS YJL150W 10 137123 137425 W 2011-02-03 1996-07-31 -S000003685 ORF Verified YJL149W DAS1 DUH1|SCF ubiquitin ligase complex subunit DAS1 chromosome 10 10 137379 139370 W 2011-02-03 1996-07-31 Putative SCF ubiquitin ligase F-box protein; interacts physically with both Cdc53p and Skp1 and genetically with CDC34; similar to putative F-box protein YDR131C -S000032472 CDS YJL149W 10 137379 139370 W 2011-02-03 1996-07-31 -S000006508 snoRNA_gene snR128 SNR128 U14 chromosome 10 L000001975 10 139691 139566 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); referred to as U14; essential gene required for cleavage of 35S primary rRNA transcript to release the precursor to the 18S rRNA; guides 2'-O-methylation of small subunit (SSU) rRNA at position C414 -S000035225 noncoding_exon snR128 10 139691 139566 C 2011-02-03 2000-05-19 -S000006509 snoRNA_gene snR190 SNR190 chromosome 10 L000001977 10 139950 139761 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); predicted to guide 2'-O-methylation of large subunit (LSU) rRNA at position G2395; not shown to be active -S000030414 noncoding_exon snR190 10 139950 139761 C 2011-02-03 2000-05-19 -S000003684 ORF Verified YJL148W RPA34 DNA-directed RNA polymerase I subunit RPA34|CST21|A34.5 chromosome 10 L000004132|L000003000|S000029123 10 140437 141138 W 2011-02-03 1996-07-31 RNA polymerase I subunit A34.5; essential for nucleolar assembly and for high polymerase loading rate; nucleolar localization depends on Rpa49p -S000032342 CDS YJL148W 10 140437 141138 W 2011-02-03 1996-07-31 -S000003683 ORF Uncharacterized YJL147C MRX5 chromosome 10 10 142567 141419 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; homozygous diploid deletion strain has a sporulation defect characterized by elevated dityrosine in the soluble fraction; expression induced by calcium shortage; YJL147W is a non-essential gene -S000031289 CDS YJL147C 10 142567 141419 C 2011-02-03 1996-07-31 -S000003682 ORF Verified YJL146W IDS2 chromosome 10 L000000853 10 143292 144701 W 2011-02-03 1996-07-31 Protein involved in modulation of Ime2p activity during meiosis; appears to act indirectly to promote Ime2p-mediated late meiotic functions; found in growing cells and degraded during sporulation -S000031249 CDS YJL146W 10 143292 144701 W 2011-02-03 1996-07-31 -S000003681 ORF Verified YJL145W SFH5 chromosome 10 10 145160 146044 W 2011-02-03 1996-07-31 Non-classical phosphatidylinositol transfer protein (PITP); exhibits PI- but not PC-transfer activity; localizes to the peripheral endoplasmic reticulum, cytosol and microsomes; similar to Sec14p; partially relocalizes to the plasma membrane upon DNA replication stress -S000031116 CDS YJL145W 10 145160 146044 W 2011-02-03 1996-07-31 -S000003680 ORF Verified YJL144W chromosome 10 10 146359 146673 W 2011-02-03 1996-07-31 Cytoplasmic hydrophilin essential in desiccation-rehydration process; expression induced by osmotic stress, starvation and during stationary phase; protein abundance increases in response to DNA replication stress -S000030090 CDS YJL144W 10 146359 146673 W 2011-02-03 1996-07-31 -S000003679 ORF Verified YJL143W TIM17 protein transporter TIM17|SMS1|MPI2|MIM17 chromosome 10 L000001139 10 147101 147577 W 2011-02-03 1996-07-31 Essential component of the TIM23 complex; with Tim23p, contributes to the architecture and function of the import channel; may link the import motor to the core Translocase of the Inner Mitochondrial membrane (TIM23 complex) -S000029979 CDS YJL143W 10 147101 147577 W 2011-02-03 1996-07-31 -S000003678 ORF Dubious YJL142C IRC9 chromosome 10 10 148211 147819 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene YJL141C; null mutant displays increased levels of spontaneous Rad52p foci -S000037267 CDS YJL142C 10 148211 147819 C 2011-02-03 1996-07-31 -S000003677 ORF Verified YJL141C YAK1 serine/threonine protein kinase YAK1 chromosome 10 L000002490 10 150390 147967 C 2011-02-03 1996-07-31 Serine-threonine protein kinase; component of a glucose-sensing system that inhibits growth in response to glucose availability; upon nutrient deprivation Yak1p phosphorylates Pop2p to regulate mRNA deadenylation, the co-repressor Crf1p to inhibit transcription of ribosomal genes, and the stress-responsive transcription factors Hsf1p and Msn2p; nuclear localization negatively regulated by the Ras/PKA signaling pathway in the presence of glucose -S000037175 CDS YJL141C 10 150390 147967 C 2011-02-03 1996-07-31 -S000003676 ORF Verified YJL140W RPB4 DNA-directed RNA polymerase II subunit RPB4|B32|CTF15 chromosome 10 L000001678 10 150961 151626 W 2011-02-03 1996-07-31 RNA polymerase II subunit B32; forms dissociable heterodimer with Rpb7p; Rpb4/7 dissociates from RNAPII as Ser2 CTD phosphorylation increases; Rpb4/7 regulates cellular lifespan via mRNA decay process; involved in recruitment of 3'-end processing factors to transcribing RNAPII complex, export of mRNA to cytoplasm under stress conditions; also involved in translation initiation -S000037123 CDS YJL140W 10 150961 151626 W 2011-02-03 1996-07-31 -S000003675 ORF Verified YJL139C YUR1 mannosyltransferase YUR1 chromosome 10 L000002566 10 152999 151713 C -90.66 2011-02-03 1996-07-31 Mannosyltransferase involved in protein N-glycosylation; member of the KTR1 family; located in the Golgi apparatus; YUR1 has a paralog, KTR2, that arose from the whole genome duplication -S000035317 CDS YJL139C 10 152999 151713 C 2011-02-03 1996-07-31 -S000003674 ORF Verified YJL138C TIF2 translation initiation factor eIF4A|eIF4A chromosome 10 L000002303 10 154691 153504 C -92 2011-02-03 1996-07-31 Translation initiation factor eIF4A; DEA(D/H)-box RNA helicase that couples ATPase activity to RNA binding and unwinding; forms a dumbbell structure of two compact domains connected by a linker; interacts with eIF4G; protein abundance increases in response to DNA replication stress; TIF2 has a paralog, TIF1, that arose from the whole genome duplication -S000035154 CDS YJL138C 10 154691 153504 C 2011-02-03 1996-07-31 -S000003673 ORF Verified YJL137C GLG2 glycogenin glucosyltransferase GLG2 chromosome 10 L000003159 10 156127 154985 C 2011-02-03 1996-07-31 Glycogenin glucosyltransferase; self-glucosylating initiator of glycogen synthesis, also glucosylates n-dodecyl-beta-D-maltoside; similar to mammalian glycogenin; GLG2 has a paralog, GLG1, that arose from the whole genome duplication -S000035008 CDS YJL137C 10 156127 154985 C 2011-02-03 1996-07-31 -S000028806 ORF Uncharacterized YJL136W-A chromosome 10 10 156169 156252 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE -S000033589 CDS YJL136W-A 10 156169 156252 W 2011-02-03 2003-07-29 -S000003672 ORF Verified YJL136C RPS21B eS21|ribosomal 40S subunit protein S21B|S21e|YS25|S26B|S21B chromosome 10 L000003031 10 157273 156550 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S21, no bacterial homolog; RPS21B has a paralog, RPS21A, that arose from the whole genome duplication -S000034084 CDS YJL136C 10 156789 156550 C 2011-02-03 1996-07-31 -S000034083 CDS YJL136C 10 157273 157250 C 2011-02-03 1996-07-31 -S000034085 intron YJL136C 10 157249 156790 C 2011-02-03 1996-07-31 -S000003671 ORF Dubious YJL135W chromosome 10 10 157877 158194 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified genes YJL134W/LCB3 -S000034027 CDS YJL135W 10 157877 158194 W 2011-02-03 1996-07-31 -S000003670 ORF Verified YJL134W LCB3 sphinganine kinase LCB3|YSR2|LBP1 chromosome 10 L000004101 10 158188 159417 W 2011-02-03 1996-07-31 Long-chain base-1-phosphate phosphatase; specific for dihydrosphingosine-1-phosphate, regulates ceramide and long-chain base phosphates levels, involved in incorporation of exogenous long chain bases in sphingolipids; LCB3 has a paralog, YSR3, that arose from the whole genome duplication -S000033888 CDS YJL134W 10 158188 159417 W 2011-02-03 1996-07-31 -S000028805 ORF Uncharacterized YJL133C-A chromosome 10 10 159847 159623 C 2011-02-03 2003-07-29 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033587 CDS YJL133C-A 10 159847 159623 C 2011-02-03 2003-07-29 -S000003669 ORF Verified YJL133W MRS3 Fe(2+) transporter chromosome 10 L000001179 10 160619 161563 W 2011-02-03 1996-07-31 Iron transporter, mediates Fe2+ transport across inner mito membrane; mitochondrial carrier family member; active under low-iron conditions; may transport other cations; MRS3 has a paralog, MRS4, that arose from the whole genome duplication -S000033746 CDS YJL133W 10 160619 161563 W 2011-02-03 1996-07-31 -S000003668 ORF Uncharacterized YJL132W chromosome 10 10 161914 164166 W 2011-02-03 1996-07-31 Putative protein of unknown function; localizes to the membrane fraction; possible Zap1p-regulated target gene induced by zinc deficiency; YJL132W is a non-essential gene -S000033018 CDS YJL132W 10 161914 164166 W 2011-02-03 1996-07-31 -S000003667 ORF Verified YJL131C AIM23 chromosome 10 10 165348 164278 C 2011-02-03 1996-07-31 Mitochondrial translation initiation factor 3 (IF3, mIF3); evolutionarily conserved; binds to E. coli ribosomes in vitro; null mutant displays severe respiratory growth defect and elevated frequency of mitochondrial genome loss -S000032877 CDS YJL131C 10 165348 164278 C 2011-02-03 1996-07-31 -S000003666 ORF Verified YJL130C URA2 bifunctional carbamoylphosphate synthetase/aspartate transcarbamylase chromosome 10 L000002431 10 172367 165723 C -89 2011-02-03 1996-07-31|2011-02-03 Bifunctional carbamoylphosphate synthetase/aspartate transcarbamylase; catalyzes the first two enzymatic steps in the de novo biosynthesis of pyrimidines; both activities are subject to feedback inhibition by UTP -S000031969 CDS YJL130C 10 172367 165723 C 2011-02-03 1996-07-31|2011-02-03 -S000122104 five_prime_UTR_intron YJL130C 10 172752 172433 C 2011-02-03 2007-04-04 -S000003665 ORF Verified YJL129C TRK1 chromosome 10 L000002334 10 177306 173599 C 2011-02-03 1996-07-31 Component of the Trk1p-Trk2p potassium transport system; 180 kDa high affinity potassium transporter; phosphorylated in vivo and interacts physically with the phosphatase Ppz1p, suggesting Trk1p acitivy is regulated by phosphorylation; TRK1 has a paralog, TRK2, that arose from the whole genome duplication -S000032672 CDS YJL129C 10 177306 173599 C 2011-02-03 1996-07-31 -S000003664 ORF Verified YJL128C PBS2 mitogen-activated protein kinase kinase PBS2|SSK4|SFS4|HOG4 chromosome 10 L000001346|L000001874 10 180103 178097 C -85 2011-02-03 1996-07-31|2011-02-03 MAP kinase kinase of the HOG signaling pathway; activated under severe osmotic stress; mitophagy-specific regulator; plays a role in regulating Ty1 transposition -S000031693 CDS YJL128C 10 180103 178097 C 2011-02-03 1996-07-31|2011-02-03 -S000007612 ORF Dubious YJL127W-A YJL127W-B chromosome 10 10 180194 180310 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037189 CDS YJL127W-A 10 180194 180310 W 2011-02-03 2001-02-26 -S000028522 ORF Uncharacterized YJL127C-B YJL127C-A chromosome 10 10 181709 181551 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified based on homology to the filamentous fungus, Ashbya gossypii; SWAT-GFP and seamless-GFP fusion proteins localize to the mitochondria -S000030318 CDS YJL127C-B 10 181709 181551 C 2011-02-03 2003-07-29 -S000003663 ORF Verified YJL127C SPT10 SUD1|CRE1 chromosome 10 L000002035 10 184220 182298 C -87 2011-02-03 1996-07-31 Histone H3 acetylase with a role in transcriptional regulation; sequence-specific activator of histone genes, binds specifically and cooperatively to pairs of UAS elements in core histone promoters, functions at or near TATA box; involved in S phase-specific acetylation of H3K56 at histone promoters, which is required for recruitment of SWI/SNF nucleosome remodeling complex and subsequent transcription -S000031537 CDS YJL127C 10 184220 182298 C 2011-02-03 1996-07-31 -S000003662 ORF Verified YJL126W NIT2 putative hydrolase chromosome 10 L000004212 10 184501 185424 W 2011-02-03 1996-07-31 Nit protein; one of two proteins in S. cerevisiae with similarity to the Nit domain of NitFhit from fly and worm and to the mouse and human Nit protein which interacts with the Fhit tumor suppressor; nitrilase superfamily member -S000031498 CDS YJL126W 10 184501 185424 W 2011-02-03 1996-07-31 -S000003661 ORF Verified YJL125C GCD14 tRNA 1-methyladenosine methyltransferase subunit GCD14|TRM61 chromosome 10 L000002902 10 186679 185528 C 2011-02-03 1996-07-31 Subunit of tRNA (1-methyladenosine) methyltransferase; required, along with Gcd10p, for the modification of the adenine at position 58 in tRNAs, especially tRNAi-Met; first identified as a negative regulator of GCN4 expression -S000030509 CDS YJL125C 10 186679 185528 C 2011-02-03 1996-07-31 -S000003660 ORF Verified YJL124C LSM1 SPB8 chromosome 10 L000004427 10 187644 187126 C 2011-02-03 1996-07-31 Lsm (Like Sm) protein; forms heteroheptameric complex (with Lsm2p, Lsm3p, Lsm4p, Lsm5p, Lsm6p, and Lsm7p) involved in degradation of cytoplasmic mRNAs; also enters the nucleus and positively regulates transcription initiation; unlike most Sm-like proteins, Lsm1p requires both its SM-domain and C-terminal domain for RNA-binding; binds to mRNAs under glucose starvation, most often in the 3' UTR; forms cytoplasmic foci upon DNA replication stress -S000030388 CDS YJL124C 10 187644 187126 C 2011-02-03 1996-07-31 -S000003659 ORF Verified YJL123C MTC1 chromosome 10 10 189440 188004 C 2011-02-03 1996-07-31 Protein of unknown function that may interact with ribosomes; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to COPI-coated vesicles (early Golgi); mtc1 is synthetically lethal with cdc13-1 -S000030206 CDS YJL123C 10 189440 188004 C 2011-02-03 1996-07-31 -S000003658 ORF Verified YJL122W ALB1 chromosome 10 10 189716 190243 W 2011-02-03 1996-07-31 Shuttling pre-60S factor; involved in the biogenesis of ribosomal large subunit; interacts directly with Arx1p; responsible for Tif6p recycling defects in absence of Rei1p -S000037544 CDS YJL122W 10 189716 190243 W 2011-02-03 1996-07-31 -S000003656 ORF Dubious YJL120W chromosome 10 10 191022 191345 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL121C/RPE1; deletion confers sensitivity to GSAO -S000037326 CDS YJL120W 10 191022 191345 W 2011-02-03 1996-07-31 -S000003657 ORF Verified YJL121C RPE1 ribulose-phosphate 3-epimerase RPE1|POS18|EPI1 chromosome 10 L000004023|L000002588 10 191090 190374 C 2011-02-03 1996-07-31 D-ribulose-5-phosphate 3-epimerase; catalyzes a reaction in the non-oxidative part of the pentose-phosphate pathway; mutants are sensitive to oxidative stress -S000037363 CDS YJL121C 10 191090 190374 C 2011-02-03 1996-07-31 -S000003654 ORF Verified YJL118W chromosome 10 10 191639 192298 W 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; YJL118W is a non-essential gene; deletion enhances the toxicity of heterologously expressed human alpha-synuclein -S000035604 CDS YJL118W 10 191639 192298 W 2011-02-03 1996-07-31 -S000003655 ORF Dubious YJL119C chromosome 10 10 191895 191572 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035622 CDS YJL119C 10 191895 191572 C 2011-02-03 1996-07-31 -S000003653 ORF Verified YJL117W PHO86 chromosome 10 L000002945 10 192531 193466 W 2011-02-03 1996-07-31 Endoplasmic reticulum (ER) resident protein; required for ER exit of the high-affinity phosphate transporter Pho84p, specifically required for packaging of Pho84p into COPII vesicles; protein abundance increases in response to DNA replication stress -S000035509 CDS YJL117W 10 192531 193466 W 2011-02-03 1996-07-31 -S000003652 ORF Verified YJL116C NCA3 SUN family protein NCA3 chromosome 10 L000002936 10 194873 193860 C 2011-02-03 1996-07-31 Protein involved in mitochondrion organization; functions with Nca2p to regulate mitochondrial expression of subunits 6 (Atp6p) and 8 (Atp8p) of the Fo-F1 ATP synthase; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the vacuole; member of the SUN family; expression induced in cells treated with the mycotoxin patulin; NCA3 has a paralog, UTH1, that arose from the whole genome duplication -S000034420 CDS YJL116C 10 194873 193860 C 2011-02-03 1996-07-31 -S000003651 ORF Verified YJL115W ASF1 nucleosome assembly factor ASF1|CIA1 chromosome 10 L000000126 10 196287 197126 W -80.06 2011-02-03 1996-07-31 Nucleosome assembly factor; involved in chromatin assembly, disassembly; required for recovery after DSB repair; role in H3K56 acetylation required for expression homeostasis, buffering mRNA synthesis rate against gene dosage changes in S phase; anti-silencing protein, derepresses silent loci when overexpressed; role in regulating Ty1 transposition; relocalizes to cytosol under hypoxia; growth defect of asf1 null is functionally complemented by either human ASF1A or ASF1B -S000034387 CDS YJL115W 10 196287 197126 W 2011-02-03 1996-07-31 -S000006514 tRNA_gene tA(AGC)J chromosome 10 L000003626 10 197385 197313 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032283 noncoding_exon tA(AGC)J 10 197385 197313 C 2011-02-03 2000-05-19 -S000007035 long_terminal_repeat YJLWsigma1 chromosome 10 10 197401 197494 W 2011-02-03 2000-05-19 Ty3 LTR -S000007036 long_terminal_repeat YJLWtau1 chromosome 10 10 197545 197915 W 2011-02-03 2000-05-19 Ty4 LTR -S000007039 LTR_retrotransposon YJLWTy4-1 Ty4 chromosome 10 10 197545 203768 W 2011-02-03 2000-05-19|2011-02-03 Ty4 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000003650 transposable_element_gene YJL114W gag protein chromosome 10 10 197915 198595 W 2011-02-03 1996-07-31|2011-02-03 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034265 CDS YJL114W 10 197915 198595 W 2011-02-03 1996-07-31|2011-02-03 -S000003649 transposable_element_gene YJL113W gag-pol fusion protein chromosome 10 10 198678 203325 W 2011-02-03 1996-07-31|2011-02-03 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034131 CDS YJL113W 10 198678 198998 W 2011-02-03 1996-07-31|2011-02-03 -S000034132 CDS YJL113W 10 199000 203325 W 2011-02-03 1996-07-31 -S000034133 plus_1_translational_frameshift YJL113W 10 198999 198999 W 2011-02-03 1996-07-31 -S000007037 long_terminal_repeat YJLWtau2 chromosome 10 10 203398 203768 W 2011-02-03 2000-05-19 Ty4 LTR -S000028445 ARS ARS1008 chromosome 10 10 204029 204917 2011-02-03 2002-12-16|2011-02-03 Autonomously Replicating Sequence -S000178124 ARS_consensus_sequence ARS1008 10 204241 204225 C 2014-11-18 2014-11-18 -S000007022 long_terminal_repeat YJLCdelta3 chromosome 10 10 204114 203783 C 2011-02-03 2000-05-19 Ty1 LTR -S000006536 tRNA_gene tD(GUC)J1 chromosome 10 L000003605 10 204735 204806 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030769 noncoding_exon tD(GUC)J1 10 204735 204806 W 2011-02-03 2000-05-19 -S000003648 ORF Verified YJL112W MDV1 NET2|GAG3|FIS2 chromosome 10 10 205305 207449 W 2011-02-03 1996-07-31|2011-02-03 Peripheral protein of cytosolic face of mitochondrial outer membrane; required for mitochondrial fission; interacts with Fis1p and with the self-assembled oligomeric form of the dynamin-related GTPase Dnm1p; contains WD repeats; MDV1 has a paralog, CAF4, that arose from the whole genome duplication -S000033273 CDS YJL112W 10 205305 207449 W 2011-02-03 1996-07-31|2011-02-03 -S000003647 ORF Verified YJL111W CCT7 chaperonin-containing T-complex subunit CCT7|TCP7 chromosome 10 L000002763 10 207877 209529 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo; mutant has increased aneuploidy tolerance -S000033222 CDS YJL111W 10 207877 209529 W 2011-02-03 1996-07-31 -S000003646 ORF Verified YJL110C GZF3 NIL2|DEH1 chromosome 10 L000002858|L000003382 10 211577 209922 C 2011-02-03 1996-07-31 GATA zinc finger protein; negatively regulates nitrogen catabolic gene expression by competing with Gat1p for GATA site binding; function requires a repressive carbon source; dimerizes with Dal80p and binds to Tor1p; GZF3 has a paralog, DAL80, that arose from the whole genome duplication -S000033132 CDS YJL110C 10 211577 209922 C 2011-02-03 1996-07-31 -S000003645 ORF Verified YJL109C UTP10 snoRNA-binding rRNA-processing protein UTP10 chromosome 10 10 217309 212000 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA; mutant has increased aneuploidy tolerance -S000032396 CDS YJL109C 10 217309 212000 C 2011-02-03 1996-07-31 -S000003644 ORF Verified YJL108C PRM10 pheromone-regulated protein PRM10 chromosome 10 10 218856 217705 C 2011-02-03 1996-07-31 Pheromone-regulated protein; proposed to be involved in mating; predicted to have 5 transmembrane segments; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000032288 CDS YJL108C 10 218856 217705 C 2011-02-03 1996-07-31 -S000003643 ORF Uncharacterized YJL107C chromosome 10 10 220016 218853 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression is induced by activation of the HOG1 mitogen-activated signaling pathway and this induction is Hog1p/Pbs2p dependent; YJL107C and adjacent ORF, YJL108C are merged in related fungi -S000031290 CDS YJL107C 10 220016 218853 C 2011-02-03 1996-07-31 -S000003642 ORF Verified YJL106W IME2 protein kinase IME2|SME1 chromosome 10 L000000862 10 221390 223327 W 2011-02-03 1996-07-31 Serine/threonine protein kinase involved in activation of meiosis; associates with Ime1p and mediates its stability, activates Ndt80p; IME2 expression is positively regulated by Ime1p; human CDK2 can complement ime2 null mutant -S000031252 CDS YJL106W 10 221390 223327 W 2011-02-03 1996-07-31 -S000003641 ORF Verified YJL105W SET4 chromosome 10 10 225055 226737 W 2011-02-03 1996-07-31 Protein of unknown function, contains a SET domain; SET4 has a paralog, SET3, that arose from the whole genome duplication -S000031110 CDS YJL105W 10 225055 226737 W 2011-02-03 1996-07-31 -S000003640 ORF Verified YJL104W PAM16 import motor complex subunit PAM16|TIM16|MIA1 chromosome 10 10 227327 227776 W 2011-02-03 1996-07-31 Subunit of the import motor (PAM complex); the PAM complex is a component of the Translocase of the Inner Mitochondrial membrane (TIM23 complex); forms a 1:1 subcomplex with Pam18p and inhibits its cochaperone activity; contains a J-like domain -S000031000 CDS YJL104W 10 227327 227776 W 2011-02-03 1996-07-31 -S000006501 snoRNA_gene snR37 SNR37 chromosome 10 L000003502 10 228479 228094 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2944 -S000036767 noncoding_exon snR37 10 228479 228094 C 2011-02-03 2000-05-19 -S000028446 ARS ARS1009 chromosome 10 10 228552 229043 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000178125 ARS_consensus_sequence ARS1009 10 228575 228559 C 2014-11-18 2014-11-18 -S000003639 ORF Verified YJL103C GSM1 chromosome 10 10 230881 229025 C 2011-02-03 1996-07-31 Putative zinc cluster protein of unknown function; proposed to be involved in the regulation of energy metabolism, based on patterns of expression and sequence analysis -S000029933 CDS YJL103C 10 230881 229025 C 2011-02-03 1996-07-31 -S000003638 ORF Verified YJL102W MEF2 chromosome 10 L000001058 10 231301 233760 W 2011-02-03 1996-07-31 Mitochondrial elongation factor involved in translational elongation -S000029898 CDS YJL102W 10 231301 233760 W 2011-02-03 1996-07-31 -S000006702 tRNA_gene tR(ACG)J chromosome 10 L000003606 10 233939 234011 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030405 noncoding_exon tR(ACG)J 10 233939 234011 W 2011-02-03 2000-05-19 -S000003637 ORF Verified YJL101C GSH1 glutamate--cysteine ligase chromosome 10 L000000735 10 236356 234320 C 2011-02-03 1996-07-31 Gamma glutamylcysteine synthetase; catalyzes the first step in glutathione (GSH) biosynthesis; expression induced by oxidants, cadmium, and mercury; protein abundance increases in response to DNA replication stress -S000037157 CDS YJL101C 10 236356 234320 C 2011-02-03 1996-07-31 -S000003636 ORF Verified YJL100W LSB6 1-phosphatidylinositol 4-kinase LSB6 chromosome 10 10 237263 239086 W 2011-02-03 1996-07-31 Type II phosphatidylinositol 4-kinase; binds Las17p, a homolog of human Wiskott-Aldrich Syndrome protein involved in actin patch assembly and actin polymerization -S000037110 CDS YJL100W 10 237263 239086 W 2011-02-03 1996-07-31 -S000003635 ORF Verified YJL099W CHS6 CSD3 chromosome 10 L000000334 10 239414 241654 W 2011-02-03 1996-07-31 Member of the ChAPs (Chs5p-Arf1p-binding proteins) family; part of the exomer complex that mediates export of specific cargo proteins, including Chs3p, from the Golgi to the plasma membrane; primary component of the Chs5/6 complex that binds directly to membranes; CHS6 has a paralog, BCH2, that arose from the whole genome duplication -S000031796 CDS YJL099W 10 239414 241654 W 2011-02-03 1996-07-31 -S000003634 ORF Verified YJL098W SAP185 chromosome 10 L000003246 10 242082 245258 W 2011-02-03 1996-07-31 Protein that forms a complex with the Sit4p protein phosphatase; required for Sit4p function; member of a family of similar proteins including Sap4p, Sap155p, and Sap190p; SAP185 has a paralog, SAP190, that arose from the whole genome duplication -S000031694 CDS YJL098W 10 242082 245258 W 2011-02-03 1996-07-31 -S000003633 ORF Verified YJL097W PHS1 enoyl-CoA hydratase PHS1 chromosome 10 10 245591 246244 W 2011-02-03 1996-07-31 Essential 3-hydroxyacyl-CoA dehydratase of the ER membrane; involved in elongation of very long-chain fatty acids; evolutionarily conserved, similar to mammalian PTPLA and PTPLB; involved in sphingolipid biosynthesis and protein trafficking -S000031576 CDS YJL097W 10 245591 246244 W 2011-02-03 1996-07-31 -S000003632 ORF Verified YJL096W MRPL49 mitochondrial 54S ribosomal protein YmL49|YmL49 chromosome 10 10 246490 246975 W 2011-02-03 2003-09-22|1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000030716 CDS YJL096W 10 246490 246975 W 2011-02-03 2003-09-22|1996-07-31 -S000077074 matrix_attachment_site ETC3 ETC3 chromosome 10 10 247060 247082 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; located between MRPL49 and BCK1 -S000003631 ORF Verified YJL095W BCK1 mitogen-activated protein kinase kinase kinase BCK1|SSP31|SLK1|SAP3|LAS3 chromosome 10 L000000162 10 247255 251691 W -64 2011-02-03 1996-07-31 MAPKKK acting in the protein kinase C signaling pathway; the kinase C signaling pathway controls cell integrity; upon activation by Pkc1p phosphorylates downstream kinases Mkk1p and Mkk2p; MAPKKK is an acronym for mitogen-activated protein (MAP) kinase kinase kinase -S000030629 CDS YJL095W 10 247255 251691 W 2011-02-03 1996-07-31 -S000003630 ORF Verified YJL094C KHA1 chromosome 10 10 254442 251821 C 2011-02-03 1996-07-31 Putative K+/H+ antiporter; has a probable role in intracellular cation homeostasis; localized to Golgi vesicles and detected in highly purified mitochondria in high-throughput studies -S000030439 CDS YJL094C 10 254442 251821 C 2011-02-03 1996-07-31 -S000003629 ORF Verified YJL093C TOK1 YPK1|YORK|YKC1|DUK1 chromosome 10 L000003009 10 256812 254737 C 2011-02-03 1996-07-31 Outward-rectifier potassium channel of the plasma membrane; has two pore domains in tandem, each of which forms a functional channel permeable to potassium; carboxy tail functions to prevent inner gate closures; target of K1 toxin -S000037648 CDS YJL093C 10 256812 254737 C 2011-02-03 1996-07-31 -S000003628 ORF Verified YJL092W SRS2 DNA helicase SRS2|HPR5|RADH1|RADH chromosome 10 L000000809|L000001578 10 257423 260947 W -61 2011-02-03 1996-07-31 DNA helicase and DNA-dependent ATPase; involved in DNA repair and checkpoint recovery, needed for proper timing of commitment to meiotic recombination and transition from Meiosis I to II; blocks trinucleotide repeat expansion; affects genome stability; disassembles Rad51p nucleoprotein filaments during meiotic recombination; stimulates activity of the Mus81p-Mms4p endonuclease, independently of Srs2p catalytic activity; functional homolog of human RTEL1 -S000037603 CDS YJL092W 10 257423 260947 W 2011-02-03 1996-07-31 -S000003627 ORF Verified YJL091C GWT1 glucosaminyl-phosphotidylinositol O-acyltransferase chromosome 10 10 262552 261080 C 2011-02-03 2003-09-22|1996-07-31 Protein involved in the inositol acylation of GlcN-PI; the inositol acylation of glucosaminyl phosphatidylinositol (GlcN-PI) forms glucosaminyl(acyl)phosphatidylinositol (GlcN(acyl)PI), an intermediate in the biosynthesis of glycosylphosphatidylinositol (GPI) anchors -S000037407 CDS YJL091C 10 262552 261080 C 2011-02-03 2003-09-22|1996-07-31 -S000003626 ORF Verified YJL090C DPB11 protein kinase activating protein DPB11 chromosome 10 L000003001 10 265051 262757 C 2011-02-03 1996-07-31 DNA replication initiation protein; loads DNA pol epsilon onto pre-replication complexes at origins; checkpoint sensor recruited to stalled replication forks by the checkpoint clamp complex where it activates Mec1p; along with Rfa1p, binds to ultrafine anaphase bridges in mitotic cells and prevents accumulation of chromatin bridges by stimulating the Mec1p kinase and suppressing homologous recombination; ortholog of human TopBP1; forms nuclear foci upon DNA replication stress -S000036680 CDS YJL090C 10 265051 262757 C 2011-02-03 1996-07-31 -S000003625 ORF Verified YJL089W SIP4 chromosome 10 L000001893 10 265926 268415 W 2011-02-03 1996-07-31 C6 zinc cluster transcriptional activator; binds to the carbon source-responsive element (CSRE) of gluconeogenic genes; involved in the positive regulation of gluconeogenesis; regulated by Snf1p protein kinase; localized to the nucleus -S000036795 CDS YJL089W 10 265926 268415 W 2011-02-03 1996-07-31 -S000003624 ORF Verified YJL088W ARG3 ornithine carbamoyltransferase|argF chromosome 10 L000000108 10 268799 269815 W -61 2011-02-03 1999-02-28|1996-07-31 Ornithine carbamoyltransferase; also known as carbamoylphosphate:L-ornithine carbamoyltransferase; catalyzes the biosynthesis of the arginine precursor citrulline -S000036728 CDS YJL088W 10 268799 269815 W 2011-02-03 1999-02-28|1996-07-31 -S000003623 ORF Verified YJL087C TRL1 tRNA ligase|RLG1|LIG1 chromosome 10 L000002336 10 272485 270002 C 2011-02-03 1996-07-31 tRNA ligase; required for tRNA splicing and for both splicing and translation of HAC1 mRNA in the UPR; has phosphodiesterase, polynucleotide kinase, and ligase activities; localized at the inner nuclear envelope and partially to polysomes -S000036631 CDS YJL087C 10 272485 270002 C 2011-02-03 1996-07-31 -S000003621 ORF Verified YJL085W EXO70 GTP-Rho binding exocyst subunit EXO70 chromosome 10 L000003349 10 272827 274698 W 2011-02-03 1996-07-31 Subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis prior to SNARE-mediated fusion; PtdIns[4,5]P2-binding protein that localizes to exocytic sites in an actin-independent manner, targeting and anchoring the exocyst with Sec3p; involved in exocyst assembly; direct downstream effector of Rho3p and Cdc42p; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000035634 CDS YJL085W 10 272827 274698 W 2011-02-03 1996-07-31 -S000003622 ORF Dubious YJL086C chromosome 10 10 272846 272478 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified genes YJL085W/EXO70 and YJL087C/TRL1 -S000035697 CDS YJL086C 10 272846 272478 C 2011-02-03 1996-07-31 -S000003620 ORF Verified YJL084C ALY2 ART3 chromosome 10 10 278002 274862 C 2011-02-03 1997-07-27|1996-07-31 Alpha arrestin; controls nutrient-mediated intracellular sorting of permease Gap1p; interacts with AP-1 subunit Apl4p; phosphorylated by Npr1p and also by cyclin-CDK complex Pcl7p-Pho85p; promotes endocytosis of plasma membrane proteins; ALY2 has a paralog, ALY1, that arose from the whole genome duplication -S000035516 CDS YJL084C 10 278002 274862 C 2011-02-03 1997-07-27|1996-07-31 -S000003619 ORF Verified YJL083W TAX4 chromosome 10 10 278841 280655 W 2011-02-03 1996-07-31 EH domain-containing protein; involved in regulating phosphatidylinositol 4,5-bisphosphate levels and autophagy; Irs4p and Tax4p bind and activate the PtdIns phosphatase Inp51p; Irs4p and Tax4p are involved in localizing Atg17p to the PAS; TAX4 has a paralog, IRS4, that arose from the whole genome duplication -S000034560 CDS YJL083W 10 278841 280655 W 2011-02-03 1996-07-31 -S000003618 ORF Verified YJL082W IML2 chromosome 10 10 281185 283380 W 2011-02-03 1996-07-31 Protein required for clearance of inclusion bodies; localizes to the inclusion bodies formed under protein misfolding stress; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress; IML2 has a paralog, YKR018C, that arose from the whole genome duplication -S000034438 CDS YJL082W 10 281185 283380 W 2011-02-03 1996-07-31 -S000003617 ORF Verified YJL081C ARP4 ACT3 chromosome 10 L000000027 10 285271 283802 C 2011-02-03 1996-07-31 Nuclear actin-related protein involved in chromatin remodeling; component of chromatin-remodeling enzyme complexes -S000034308 CDS YJL081C 10 285271 283802 C 2011-02-03 1996-07-31 -S000003616 ORF Verified YJL080C SCP160 chromosome 10 L000001817 10 289226 285558 C 2011-02-03 1996-07-31 Essential RNA-binding G protein effector of mating response pathway; ligand-activated RNA-binding protein that delivers RNAs involved in polarization and perpetualizing mating signal to shmoo tip during pheromone signaling; Scp160p-mediated RNA trafficking essential for chemotropism and successful mating; mainly associated with nuclear envelope and ER, interacts in mRNA-dependent manner with translating ribosomes via multiple KH domains, similar to vertebrate vigilins -S000033394 CDS YJL080C 10 289226 285558 C 2011-02-03 1996-07-31 -S000003615 ORF Verified YJL079C PRY1 sterol-binding protein chromosome 10 L000003216 10 290774 289875 C 2011-02-03 1996-07-31 Sterol binding protein involved in the export of acetylated sterols; secreted glycoprotein and member of the CAP protein superfamily (cysteine-rich secretory proteins (CRISP), antigen 5, and pathogenesis related 1 proteins); sterol export function is redundant with that of PRY2; may be involved in detoxification of hydrophobic compounds; PRY1 has a paralog, PRY2, that arose from the whole genome duplication -S000033334 CDS YJL079C 10 290774 289875 C 2011-02-03 1996-07-31 -S000003614 ORF Verified YJL078C PRY3 chromosome 10 L000003218 10 293981 291336 C 2011-02-03 1996-07-31 Cell wall-associated protein involved in export of acetylated sterols; member of the CAP protein superfamily (cysteine-rich secretory proteins (CRISP), antigen 5, and pathogenesis related 1 proteins); role in mating efficiency; expression of full-length transcript is daughter cell-specific; in response to alpha factor, a short transcript starting at +452 is expressed and the long form is repressed by Ste12p -S000032582 CDS YJL078C 10 293981 291336 C 2011-02-03 1996-07-31 -S000028662 ORF Uncharacterized YJL077W-B chromosome 10 10 294047 294145 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032487 CDS YJL077W-B 10 294047 294145 W 2011-02-03 2003-07-29 -S000028661 ORF Uncharacterized YJL077W-A chromosome 10 10 294799 294885 W 2011-02-03 2003-07-29 Protein of unknown function; mRNA identified as translated by ribosome profiling data; completely overlaps the verified gene YJL077C/ICS3 -S000032486 CDS YJL077W-A 10 294799 294885 W 2011-02-03 2003-07-29 -S000003613 ORF Verified YJL077C ICS3 chromosome 10 10 295061 294666 C 2011-02-03 1996-07-31 Protein with a role in copper homeostasis; possible role in vacuolar sorting and processing of secretory proteins; null mutants are hypersensitive to sortin2 -S000032502 CDS YJL077C 10 295061 294666 C 2011-02-03 1996-07-31 -S000003612 ORF Verified YJL076W NET1 SRM8|CFI1|ESC5 chromosome 10 L000004425 10 295245 298814 W 2011-02-03 1996-07-31 Core subunit of the RENT complex; involved in nucleolar silencing and telophase exit; stimulates transcription by RNA polymerase I and regulates nucleolar structure; NET1 has a paralog, TOF2, that arose from the whole genome duplication -S000032450 CDS YJL076W 10 295245 298814 W 2011-02-03 1996-07-31 -S000003611 ORF Dubious YJL075C APQ13 chromosome 10 10 298876 298460 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 85% of ORF overlaps the verified gene NET1; null mutant is sensitive to sorbate -S000031391 CDS YJL075C 10 298876 298460 C 2011-02-03 1996-07-31 -S000028447 ARS ARS1010 chromosome 10 10 298981 299245 2014-11-18 2002-12-16|2014-11-18 Autonomously Replicating Sequence -S000003610 ORF Verified YJL074C SMC3 cohesin subunit SMC3 chromosome 10 L000003992 10 302849 299157 C 2011-02-03 1996-07-31 Subunit of the multiprotein cohesin complex; required for sister chromatid cohesion in mitotic cells; also required, with Rec8p, for cohesion and recombination during meiosis; phylogenetically conserved SMC chromosomal ATPase family member -S000031287 CDS YJL074C 10 302849 299157 C 2011-02-03 1996-07-31 -S000003609 ORF Verified YJL073W JEM1 KAR8 chromosome 10 L000003533 10 303181 305118 W 2011-02-03 1997-10-20|1996-07-31 DnaJ-like chaperone required for nuclear membrane fusion during mating; localizes to the ER membrane; exhibits genetic interactions with KAR2 -S000031229 CDS YJL073W 10 303181 305118 W 2011-02-03 1997-10-20|1996-07-31 -S000003608 ORF Verified YJL072C PSF2 DNA replication protein PSF2|CDC102 chromosome 10 10 305862 305221 C 2011-02-03 1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery -S000030195 CDS YJL072C 10 305862 305221 C 2011-02-03 1996-07-31 -S000003607 ORF Verified YJL071W ARG2 acetyl-CoA:L-glutamate N-acetyltransferase|HRB574 chromosome 10 L000003263 10 306132 307856 W 2011-02-03 1996-07-31 Acetylglutamate synthase (glutamate N-acetyltransferase); mitochondrial enzyme that catalyzes the first step in the biosynthesis of the arginine precursor ornithine; forms a complex with Arg5,6p -S000030084 CDS YJL071W 10 306132 307856 W 2011-02-03 1996-07-31 -S000003606 ORF Uncharacterized YJL070C metallo-dependent hydrolase superfamily protein chromosome 10 10 310637 307971 C 2011-02-03 1996-07-31 Putative metallo-dependent hydrolase superfamily protein; similar to AMP deaminases but lacks key catalytic residues and does not rescue purine nucleotide metabolic defect of quadruple aah1 ade8 amd1 his1 mutant; may regulate purine nucleotide homeostasis as overexpression in an AMD1 strain grown in adenine results in greatly reduced GDP and GTP intracellular levels; not an essential gene; YJL070C has a paralog, YBR284W, that arose from the whole genome duplication -S000029919 CDS YJL070C 10 310637 307971 C 2011-02-03 1996-07-31 -S000003605 ORF Verified YJL069C UTP18 chromosome 10 10 312706 310922 C 2011-02-03 1996-07-31 Small-subunit processome protein involved in pre-18S rRNA maturation; part of a subunit of the 90S preribosomal particle capable of interacting directly with the 5' ETS of the 35S pre-rRNA; contains WD40 repeats -S000036438 CDS YJL069C 10 312706 310922 C 2011-02-03 1996-07-31 -S000003604 ORF Verified YJL068C S-formylglutathione hydrolase|SFGH chromosome 10 10 313915 313016 C 2011-02-03 1996-07-31 Esterase that can function as an S-formylglutathione hydrolase; non-essential intracellular esterase; may be involved in the detoxification of formaldehyde, which can be metabolized to S-formylglutathione; similar to human esterase D -S000036339 CDS YJL068C 10 313915 313016 C 2011-02-03 1996-07-31 -S000003603 ORF Dubious YJL067W chromosome 10 10 314084 314434 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036295 CDS YJL067W 10 314084 314434 W 2011-02-03 1996-07-31 -S000003602 ORF Verified YJL066C MPM1 chromosome 10 10 314872 314114 C 2011-02-03 1996-07-31 Mitochondrial intermembrane space protein of unknown function -S000035314 CDS YJL066C 10 314872 314114 C 2011-02-03 1996-07-31 -S000003600 ORF Dubious YJL064W chromosome 10 10 315175 315570 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL065C/DLS1 -S000035084 CDS YJL064W 10 315175 315570 W 2011-02-03 1996-07-31 -S000003601 ORF Verified YJL065C DLS1 chromosome 10 10 315557 315054 C 2011-02-03 1996-07-31 Subunit of ISW2/yCHRAC chromatin accessibility complex; ISW2/yCHRAC also includes Itc1p, Isw2p, and Dpb4p; involved in inheritance of telomeric silencing; DLS1 has a paralog, DPB3, that arose from the whole genome duplication -S000035150 CDS YJL065C 10 315557 315054 C 2011-02-03 1996-07-31 -S000003599 ORF Verified YJL063C MRPL8 mitochondrial 54S ribosomal protein YmL8|YmL8|HRD238 chromosome 10 L000001162|L000002524 10 316475 315759 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000034082 CDS YJL063C 10 316475 315759 C 2011-02-03 1996-07-31 -S000007611 ORF Verified YJL062W-A COA3 COX25|RRG10 chromosome 10 10 316723 316980 W 2011-02-03 2001-02-26 Mitochondrial protein required for cytochrome c oxidase assembly; also involved in translational regulation of Cox1p and prevention of Cox1p aggregation before assembly; located in the mitochondrial inner membrane -S000037188 CDS YJL062W-A 10 316723 316980 W 2011-02-03 2001-02-26 -S000003598 ORF Verified YJL062W LAS21 mannose-ethanolamine phosphotransferase LAS21|GPI7 chromosome 10 L000004283|L000004818 10 317284 319776 W 2011-02-03 1996-07-31 Integral plasma membrane protein; involved in the synthesis of the glycosylphosphatidylinositol (GPI) core structure; mutations affect cell wall integrity -S000034026 CDS YJL062W 10 317284 319776 W 2011-02-03 1996-07-31 -S000003597 ORF Verified YJL061W NUP82 linker nucleoporin NUP82|HRB187 chromosome 10 L000002941 10 320016 322157 W 2011-02-03 1996-07-31 Linker nucleoporin component of the nuclear pore complex (NPC); also part of the NPC cytoplasmic filaments; contributes to nucleocytoplasmic transport and NPC biogenesis; forms stable associations with three FG-nucleoporins (Nsp1p, Nup159p, and Nup116p); relocalizes to the cytosol in response to hypoxia -S000033873 CDS YJL061W 10 320016 322157 W 2011-02-03 1996-07-31 -S000003596 ORF Verified YJL060W BNA3 kynurenine--oxoglutarate transaminase chromosome 10 10 323386 324720 W 2011-02-03 1996-07-31 Kynurenine aminotransferase; catalyzes formation of kynurenic acid from kynurenine; potential Cdc28p substrate -S000033737 CDS YJL060W 10 323386 324720 W 2011-02-03 1996-07-31 -S000003595 ORF Verified YJL059W YHC3 amino acid transporter YHC3|BTN1 chromosome 10 L000003332|L000003284 10 324964 326190 W 2011-02-03 1996-07-31 Protein required for the ATP-dependent transport of arginine; vacuolar membrane protein; involved in the ATP-dependent transport of arginine into the vacuole and possibly in balancing ion homeostasis; human homolog CLN3 involved in Batten disease (juvenile onset neuronal ceroid lipofuscinosis) can complement yeast null mutant -S000034862 CDS YJL059W 10 324964 326190 W 2011-02-03 1996-07-31 -S000003594 ORF Verified YJL058C BIT61 chromosome 10 10 327873 326242 C 2011-02-03 1996-07-31 Subunit of TORC2 membrane-associated complex; involved in regulation of cell cycle-dependent actin cytoskeletal dynamics during polarized growth and cell wall integrity; BIT61 has a paralog, BIT2, that arose from the whole genome duplication -S000032844 CDS YJL058C 10 327873 326242 C 2011-02-03 1996-07-31 -S000003593 ORF Verified YJL057C IKS1 protein kinase IKS1 chromosome 10 L000004209 10 330121 328118 C 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; putative serine/threonine kinase; expression is induced during mild heat stress; deletion mutants are hypersensitive to copper sulphate and resistant to sorbate; interacts with an N-terminal fragment of Sst2p -S000032730 CDS YJL057C 10 330121 328118 C 2011-02-03 1996-07-31 -S000003592 ORF Verified YJL056C ZAP1 ZRG10 chromosome 10 L000003321 10 333073 330431 C 2011-02-03 1996-07-31 Zinc-regulated transcription factor; binds to zinc-responsive promoters to induce transcription of certain genes in presence of zinc, represses other genes in low zinc; regulates its own transcription; contains seven zinc-finger domains -S000032670 CDS YJL056C 10 333073 330431 C 2011-02-03 1996-07-31 -S000003591 ORF Uncharacterized YJL055W chromosome 10 10 333357 334094 W 2011-02-03 1996-07-31 Putative protein of unknown function; functions together with HAM1 to mediate resistance to 5-FU; specifically reduces the incorporation of 5-FU into RNA, without affecting uptake or incorporation of uracil into RNA; proposed to be involved in the metabolism of purine and pyrimidine base analogues; deletion mutants are sensitive to HAP and AHA -S000032627 CDS YJL055W 10 333357 334094 W 2011-02-03 1996-07-31 -S000003590 ORF Verified YJL054W TIM54 chromosome 10 L000004342 10 334265 335701 W 2011-02-03 1996-07-31 Component of the mitochondrial TIM22 complex; involved in insertion of polytopic proteins into the inner membrane -S000031626 CDS YJL054W 10 334265 335701 W 2011-02-03 1996-07-31 -S000003589 ORF Verified YJL053W PEP8 retromer subunit PEP8|VPT4|VPS26|GRD6 chromosome 10 L000001378 10 335898 337037 W 2011-02-03 1996-07-31 Vacuolar protein component of the retromer; forms part of the multimeric membrane-associated retromer complex involved in vacuolar protein sorting along with Vps35p, Vps29p, Vps17p, and Vps5p; essential for endosome-to-Golgi retrograde protein transport; interacts with Ypt7p; protein abundance increases in response to DNA replication stress -S000031497 CDS YJL053W 10 335898 337037 W 2011-02-03 1996-07-31 -S000028448 ARS ARS1011 ARSX-337 chromosome 10 10 337281 337529 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000007610 ORF Uncharacterized YJL052C-A chromosome 10 10 338003 337884 C 2011-02-03 2001-02-26 Putative protein of unknown function; identified based on comparison to related yeast species; mCherry fusion protein localizes to the vacuole -S000037187 CDS YJL052C-A 10 338003 337884 C 2011-02-03 2001-02-26 -S000003588 ORF Verified YJL052W TDH1 glyceraldehyde-3-phosphate dehydrogenase (phosphorylating) TDH1|GAPDH|GLD3 chromosome 10 L000002272 10 338271 339269 W 2011-02-03 1996-07-31 Glyceraldehyde-3-phosphate dehydrogenase (GAPDH), isozyme 1; involved in glycolysis and gluconeogenesis; tetramer that catalyzes the reaction of glyceraldehyde-3-phosphate to 1,3 bis-phosphoglycerate; detected in the cytoplasm and cell wall; protein abundance increases in response to DNA replication stress; GAPDH-derived antimicrobial peptides secreted by S. cerevisiae are active against a wide variety of wine-related yeasts and bateria -S000031373 CDS YJL052W 10 338271 339269 W 2011-02-03 1996-07-31 -S000003587 ORF Verified YJL051W IRC8 chromosome 10 10 339787 342255 W 2011-02-03 1996-07-31 Bud tip localized protein of unknown function; mRNA is targeted to the bud by a She2p dependent transport system; mRNA is cell cycle regulated via Fkh2p, peaking in G2/M phase; null mutant displays increased levels of spontaneous Rad52p foc -S000030449 CDS YJL051W 10 339787 342255 W 2011-02-03 1996-07-31 -S000003586 ORF Verified YJL050W MTR4 ATP-dependent RNA helicase MTR4|DOB1 chromosome 10 L000004110 10 342522 345743 W 2011-02-03 1996-07-31 ATP-dependent 3'-5' RNA helicase of the DExD/H family; involved in nuclear RNA processing and degradation both as a component of TRAMP complex and in TRAMP-independent processes; TRAMP unwinds RNA duplexes, with Mtr4p unwinding activity stimulated by Pap2p/Air2p but not dependent on ongoing polyadenylation; contains an arch domain, with two coiled-coil arms/stalks and a globular fist/KOW domain, which has RNA binding activity and is required for 5.8S rRNA processing -S000030313 CDS YJL050W 10 342522 345743 W 2011-02-03 1996-07-31 -S000003585 ORF Uncharacterized YJL049W CHM7 chromosome 10 10 345973 347325 W 2011-02-03 1996-07-31 Yeast homolog of human CHMP7, localizes to the endoplasmic reticulum presumably as part of an ESCRT-III like complex; null mutant has growth defect at 37 C in an apq12 deletion background; non-essential gene -S000036773 CDS YJL049W 10 345973 347325 W 2011-02-03 1996-07-31 -S000003584 ORF Verified YJL048C UBX6 CUI2 chromosome 10 10 348637 347447 C 2011-02-03 1996-07-31 UBX (ubiquitin regulatory X) domain-containing protein; interacts with Cdc48p, transcription is repressed when cells are grown in media containing inositol and choline; UBX6 has a paralog, UBX7, that arose from the whole genome duplication -S000036634 CDS YJL048C 10 348637 347447 C 2011-02-03 1996-07-31 -S000028804 ORF Uncharacterized YJL047C-A chromosome 10 10 349178 349044 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000033585 CDS YJL047C-A 10 349178 349044 C 2011-02-03 2003-07-29 -S000006451 snoRNA_gene snR60 SNR60 chromosome 10 L000004529 10 349233 349130 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions A817 and G908 -S000030821 noncoding_exon snR60 10 349233 349130 C 2011-02-03 2000-05-19 -S000003583 ORF Verified YJL047C RTT101 cullin RTT101|CULC|CUL8 chromosome 10 L000004737 10 352108 349580 C 2011-02-03 1996-07-31 Cullin subunit of a Roc1p-dependent E3 ubiquitin ligase complex; role in anaphase progression; required for recovery after DSB repair; implicated in Mms22-dependent DNA repair; involved with Mms1p in nonfunctional rRNA decay; modified by the ubiquitin-like protein, Rub1p -S000036565 CDS YJL047C 10 352108 349580 C 2011-02-03 1996-07-31 -S000003582 ORF Verified YJL046W AIM22 putative lipoate--protein ligase|RRG3|LIP3 chromosome 10 10 352386 353615 W 2011-02-03 1996-07-31|2005-12-01 Putative lipoate-protein ligase; required along with Lip2 and Lip5 for lipoylation of Lat1p and Kgd2p; similar to E. coli LplA; null mutant displays reduced frequency of mitochondrial genome loss -S000036505 CDS YJL046W 10 352386 353615 W 2011-02-03 1996-07-31|2005-12-01 -S000006781 tRNA_gene tY(GUA)J1 SUP7 chromosome 10 L000003607|L000002186 10 354244 354332 W -32 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000032080 intron tY(GUA)J1 10 354283 354296 W 2011-02-03 2000-05-19 -S000032078 noncoding_exon tY(GUA)J1 10 354244 354282 W 2011-02-03 2000-05-19 -S000032079 noncoding_exon tY(GUA)J1 10 354297 354332 W 2011-02-03 2000-05-19 -S000007024 long_terminal_repeat YJLCdelta5 chromosome 10 10 355175 354844 C 2011-02-03 2000-05-19 Ty1 LTR -S000007023 long_terminal_repeat YJLCdelta4 chromosome 10 10 355204 354538 C 2011-02-03 2000-05-19 Ty1 LTR -S000006714 tRNA_gene tR(UCU)J1 chromosome 10 L000003608 10 355374 355445 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030321 noncoding_exon tR(UCU)J1 10 355374 355445 W 2011-02-03 2000-05-19 -S000006537 tRNA_gene tD(GUC)J2 chromosome 10 L000003609 10 355456 355527 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030790 noncoding_exon tD(GUC)J2 10 355456 355527 W 2011-02-03 2000-05-19 -S000003581 ORF Verified YJL045W succinate dehydrogenase SDH1b|SDH1b chromosome 10 10 356024 357928 W 2011-02-03 1996-07-31 Minor succinate dehydrogenase isozyme; participates in oxidation of succinate and transfer of electrons to ubiquinone; induced during the diauxic shift in a Cat8p-dependent manner; YJL045W has a paralog, SDH1, that arose from the whole genome duplication -S000035600 CDS YJL045W 10 356024 357928 W 2011-02-03 1996-07-31 -S000003580 ORF Verified YJL044C GYP6 chromosome 10 L000000748 10 359676 358300 C 2011-02-03 1996-07-31 GTPase-activating protein (GAP) for yeast Rab family member Ypt6p; involved in vesicle mediated protein transport -S000035463 CDS YJL044C 10 359676 358300 C 2011-02-03 1996-07-31 -S000003579 ORF Uncharacterized YJL043W chromosome 10 10 360130 360903 W 2011-02-03 1996-07-31 Putative protein of unknown function; YJL043W is a non-essential gene -S000035409 CDS YJL043W 10 360130 360903 W 2011-02-03 1996-07-31 -S000003578 ORF Verified YJL042W MHP1 chromosome 10 L000002720 10 361249 365445 W 2011-02-03 1996-07-31 Microtubule-associated protein involved in microtubule organization; involved in assembly and stabilization of microtubules; overproduction results in cell cycle arrest at G2 phase; similar to Drosophila protein MAP and to mammalian MAP4 proteins -S000034384 CDS YJL042W 10 361249 365445 W 2011-02-03 1996-07-31 -S000003577 ORF Verified YJL041W NSP1 FG-nucleoporin NSP1 chromosome 10 L000001277 10 365784 368373 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; also part of the nuclear pore complex (NPC) nuclear basket; contributes directly to nucleocytoplasmic transport and maintenance of the NPC permeability barrier; found in stable complex with Nup82p, Gle2p and two other FG-nucleoporins (Nup159p and Nup116p); also found in stable complex with Nic96p and two other FG-nucleoproteins (Nup49p and Nup57p) -S000034258 CDS YJL041W 10 365784 365784 W 2011-02-03 1996-07-31 -S000034259 CDS YJL041W 10 365903 368373 W 2011-02-03 1996-07-31 -S000034260 intron YJL041W 10 365785 365902 W 2011-02-03 1996-07-31 -S000003576 ORF Verified YJL039C NUP192 chromosome 10 S000007465 10 373799 368748 C 2011-02-03 1996-07-31 Essential subunit of inner ring of nuclear pore complex (NPC); plays a role in modulating transport through the NPC; homologous to human NUP205 -S000034602 CDS YJL039C 10 373799 368748 C 2011-02-03 1996-07-31 -S000006538 tRNA_gene tD(GUC)J3 chromosome 10 L000003625 10 374495 374424 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030793 noncoding_exon tD(GUC)J3 10 374495 374424 C 2011-02-03 2000-05-19 -S000006715 tRNA_gene tR(UCU)J2 chromosome 10 L000003624 10 374577 374506 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030328 noncoding_exon tR(UCU)J2 10 374577 374506 C 2011-02-03 2000-05-19 -S000028449 ARS ARS1012 ARSX-375 chromosome 10 10 374880 375122 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000007025 long_terminal_repeat YJLCdelta6 chromosome 10 10 374935 374844 C 2011-02-03 2000-05-19 Ty1 LTR -S000028450 ARS ARS1013 chromosome 10 10 375706 376227 2011-02-03 2002-12-16 Autonomously Replicating Sequence; inefficient as chromosomal replication origin; replication capacity dependent upon Sum1p -S000003575 ORF Verified YJL038C LOH1 OSW4 chromosome 10 10 375774 375115 C 2011-02-03 1996-07-31 Protein involved in outer spore wall assembly; likely involved directly in dityrosine layer assembly; induced during sporulation; repressed during vegetative growth by Sum1p and Hst1p; sequence similar to adjacent ORF, IRC18/YJL037W, and the irc18 loh1 double mutant exhibits reduced dityrosine fluorescence relative to the single mutants; SWAT-GFP and mCherry fusion proteins localize to the cytosol; proposed role in maintenance of genome integrity -S000034497 CDS YJL038C 10 375774 375115 C 2011-02-03 1996-07-31 -S000003574 ORF Verified YJL037W IRC18 OSW6 chromosome 10 10 376662 377336 W 2011-02-03 1996-07-31 Protein involved in outer spore wall assembly; possible role in assembly of the dityrosine layer; similar to adjacent ORF, LOH1; irc18 loh1 double mutant exhibits reduced dityrosine fluorescence relative to single mutants; SWAT-GFP fusion protein localizes to the ER and vacuole, while mCherry fusion localizes to the vacuole; expression induced in respiratory-deficient cells and carbon-limited chemostat culture; null mutant displays increased levels of spontaneous Rad52p foci -S000034457 CDS YJL037W 10 376662 377336 W 2011-02-03 1996-07-31 -S000007026 long_terminal_repeat YJLCdelta7 chromosome 10 10 377870 377598 C 2011-02-03 2000-05-19 Ty1 LTR -S000006759 tRNA_gene tV(AAC)J chromosome 10 L000003610 10 378360 378433 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000032964 noncoding_exon tV(AAC)J 10 378360 378433 W 2011-02-03 2000-05-19 -S000003573 ORF Verified YJL036W SNX4 ATG24|CVT13 chromosome 10 S000007467|L000004764 10 378825 380096 W 2011-02-03 1996-07-31 Sorting nexin; involved in retrieval of late-Golgi SNAREs from post-Golgi endosomes to the trans-Golgi network and in cytoplasm to vacuole transport; contains a PX phosphoinositide-binding domain; forms complexes with Snx41p and with Atg20p -S000032435 CDS YJL036W 10 378825 380096 W 2011-02-03 1996-07-31 -S000003572 ORF Verified YJL035C TAD2 tRNA(adenine34) deaminase chromosome 10 S000007489 10 381001 380249 C 2011-02-03 1996-07-31 Subunit of tRNA-specific adenosine-34 deaminase; forms a heterodimer with Tad3p that converts adenosine to inosine at the wobble position of several tRNAs -S000032286 CDS YJL035C 10 381001 380249 C 2011-02-03 1996-07-31 -S000003571 ORF Verified YJL034W KAR2 Hsp70 family ATPase KAR2|BIP|GRP78 chromosome 10 L000000887 10 381327 383375 W 2011-02-03 1996-07-31 ATPase involved in protein import into the ER; also acts as a chaperone to mediate protein folding in the ER and may play a role in ER export of soluble proteins; regulates the unfolded protein response via interaction with Ire1p -S000032230 CDS YJL034W 10 381327 383375 W 2011-02-03 1996-07-31 -S000003570 ORF Verified YJL033W HCA4 RNA-dependent ATPase HCA4|ECM24|DBP4 chromosome 10 L000003421 10 383837 386149 W 2011-02-03 1996-07-31 DEAD box RNA helicase; component of the SSU; interacts with Bfr2p and Enp2p; high-copy number suppression of a U14 snoRNA processing mutant suggests an involvement in 18S rRNA synthesis -S000031248 CDS YJL033W 10 383837 386149 W 2011-02-03 1996-07-31 -S000003569 ORF Dubious YJL032W chromosome 10 10 386348 386662 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 3' end of essential BET4 gene encoding the alpha subunit of Type II geranylgeranyltransferase -S000031093 CDS YJL032W 10 386348 386662 W 2011-02-03 1996-07-31 -S000003568 ORF Verified YJL031C BET4 Rab geranylgeranyltransferase BET4 chromosome 10 L000000173 10 387438 386368 C 2011-02-03 2004-01-27|1996-07-31 Alpha subunit of Type II geranylgeranyltransferase; required for vesicular transport between the endoplasmic reticulum and the Golgi; provides a membrane attachment moiety to Rab-like proteins Ypt1p and Sec4p -S000030060 CDS YJL031C 10 387348 386368 C 2011-02-03 2004-01-27 -S000030059 CDS YJL031C 10 387438 387436 C 2011-02-03 2004-01-27|1996-07-31 -S000030061 intron YJL031C 10 387435 387349 C 2011-02-03 2004-01-27 -S000003567 ORF Verified YJL030W MAD2 spindle checkpoint protein MAD2 chromosome 10 L000000975 10 387657 388247 W 2011-02-03 1996-07-31 Component of the spindle-assembly checkpoint complex; delays onset of anaphase in cells with defects in mitotic spindle assembly; forms a complex with Mad1p; regulates APC/C activity during prometaphase and metaphase of meiosis I; gene dosage imbalance between MAD1 and MAD2 leads to chromosome instability -S000030009 CDS YJL030W 10 387657 388247 W 2011-02-03 1996-07-31 -S000003566 ORF Verified YJL029C VPS53 chromosome 10 10 390853 388385 C 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; required for vacuolar protein sorting; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p; human ortholog is implicated in progressive cerebello-cerebral atrophy type 2 (PCCA2) -S000030293 CDS YJL029C 10 390853 388385 C 2011-02-03 1996-07-31 -S000006661 tRNA_gene tM(CAU)J1 EMT5 chromosome 10 L000000555|L000003623 10 391115 391043 C 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis -S000029920 noncoding_exon tM(CAU)J1 10 391115 391043 C 2011-02-03 2000-05-19 -S000003565 ORF Verified YJL028W chromosome 10 10 391311 391646 W 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments -S000030214 CDS YJL028W 10 391311 391646 W 2011-02-03 1996-07-31 -S000003564 ORF Uncharacterized YJL027C chromosome 10 10 392249 391833 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000036407 CDS YJL027C 10 392249 391833 C 2011-02-03 1996-07-31 -S000003563 ORF Verified YJL026W RNR2 ribonucleotide-diphosphate reductase subunit RNR2|CRT6 chromosome 10 L000001656 10 392404 393603 W 0 2011-02-03 1996-07-31 Ribonucleotide-diphosphate reductase (RNR), small subunit; the RNR complex catalyzes the rate-limiting step in dNTP synthesis and is regulated by DNA replication and DNA damage checkpoint pathways via localization of the small subunits; RNR2 has a paralog, RNR4, that arose from the whole genome duplication -S000036365 CDS YJL026W 10 392404 393603 W 2011-02-03 1996-07-31 -S000028660 ORF Dubious YJL026C-A chromosome 10 10 393287 393066 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL026W/RNR2 -S000032485 CDS YJL026C-A 10 393287 393066 C 2011-02-03 2003-07-29 -S000003562 ORF Verified YJL025W RRN7 chromosome 10 L000001773 10 393967 395511 W 2011-02-03 1996-07-31 Component of the core factor (CF) rDNA transcription factor complex; CF is required for transcription of 35S rRNA genes by RNA polymerase I and is composed of Rrn6p, Rrn7p, and Rrn11p -S000036283 CDS YJL025W 10 393967 395511 W 2011-02-03 1996-07-31 -S000003561 ORF Verified YJL024C APS3 YKS7 chromosome 10 L000003174 10 396592 395931 C 2011-02-03 1996-07-31 Small subunit of the clathrin-associated adaptor complex AP-3; involved in vacuolar protein sorting; related to the sigma subunit of the mammalian clathrin AP-3 complex; suppressor of loss of casein kinase 1 function; protein abundance increases in response to DNA replication stress -S000036076 CDS YJL024C 10 396493 395931 C 2011-02-03 1996-07-31 -S000036075 CDS YJL024C 10 396592 396571 C 2011-02-03 1996-07-31 -S000036077 intron YJL024C 10 396570 396494 C 2011-02-03 1996-07-31 -S000006583 tRNA_gene tG(GCC)J1 chromosome 10 L000003622 10 396796 396726 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000030415 noncoding_exon tG(GCC)J1 10 396796 396726 C 2011-02-03 2000-05-19 -S000003559 ORF Dubious YJL022W chromosome 10 10 398109 398417 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene PET130 -S000035121 CDS YJL022W 10 398109 398417 W 2011-02-03 1996-07-31 -S000003560 ORF Verified YJL023C PET130 chromosome 10 L000003025 10 398398 397355 C 2011-02-03 1996-07-31 Protein required for respiratory growth; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000035183 CDS YJL023C 10 398398 397355 C 2011-02-03 1996-07-31 -S000028659 ORF Dubious YJL020W-A chromosome 10 10 400981 401238 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL020C/BBC1 -S000032463 CDS YJL020W-A 10 400981 401238 W 2011-02-03 2003-07-29 -S000003557 ORF Verified YJL020C BBC1 YJL021C|MTI1 chromosome 10 10 402410 398937 C 2011-02-03 2001-06-28|1996-07-31 Protein possibly involved in assembly of actin patches; interacts with an actin assembly factor Las17p and with the SH3 domains of Type I myosins Myo3p and Myo5p; localized predominantly to cortical actin patches -S000033969 CDS YJL020C 10 402410 398937 C 2011-02-03 2001-06-28|1996-07-31 -S000003556 ORF Verified YJL019W MPS3 YJL018W|NEP98 chromosome 10 10 402897 404945 W 2011-02-03 2003-01-02|1996-07-31 Nuclear envelope protein; required for SPB insertion, SPB duplication, Kar5p localization near the SPB and nuclear fusion; interacts with Mps2p to tether half-bridge to core SPB; N-terminal acetylation by Eco1p regulates its role in nuclear organization; localizes to the SPB half bridge and telomeres during meiosis; required with Ndj1p and Csm4p for meiotic bouquet formation and telomere-led rapid prophase movement; member of the SUN protein family (Sad1-UNC-84 homology) -S000035368 CDS YJL019W 10 402897 404945 W 2011-02-03 2003-01-02|1996-07-31 -S000003553 ORF Uncharacterized YJL016W TPH3 YJL017W chromosome 10 10 405588 407273 W 2011-02-03 2003-09-29|1996-07-31 Putative protein of unknown function; GFP-fusion protein localizes to the cytoplasm; contains two adjacent PH-like domains; conserved in closely related Saccharomyces species -S000034286 CDS YJL016W 10 405588 407273 W 2011-02-03 2003-09-29|1996-07-31 -S000003552 ORF Dubious YJL015C chromosome 10 10 407426 407142 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame unlikely to encode a functional protein; expression if heat-inducible; located in promoter region of essential CCT3 gene encoding a subunit of the cytosolic chaperonin Cct ring complex, overlaps ORF YJL016W -S000034109 CDS YJL015C 10 407426 407142 C 2011-02-03 1996-07-31|2011-02-03 -S000003551 ORF Verified YJL014W CCT3 chaperonin-containing T-complex subunit CCT3|TCP3|BIN2 chromosome 10 L000002270 10 407558 409162 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo; capable of binding Q/N rich proteins and mediating their folding -S000034079 CDS YJL014W 10 407558 409162 W 2011-02-03 1996-07-31 -S000003550 ORF Verified YJL013C MAD3 chromosome 10 L000003179 10 411040 409493 C 2011-02-03 1996-07-31 Subunit of spindle-assembly checkpoint complex; involved in delaying anaphase onset in cells with defects in mitotic spindle assembly; pseudosubstrate inhibitor of APC(Cdc20), the anaphase promoting complex involved in securin (Pds1p) turnover; MAD3 has a paralog, BUB1, that arose from the whole genome duplication -S000032025 CDS YJL013C 10 411040 409493 C 2011-02-03 1996-07-31 -S000003549 ORF Verified YJL012C VTC4 YJL012C-A|PHM3 chromosome 10 S000007513 10 413399 411234 C 2011-02-03 2004-02-19|1996-07-31 Vacuolar membrane polyphosphate polymerase; subunit of the vacuolar transporter chaperone (VTC) complex involved in synthesis and transfer of polyP to the vacuole; regulates membrane trafficking; role in non-autophagic vacuolar fusion; protein abundance increases in response to DNA replication stress -S000031895 CDS YJL012C 10 413399 411234 C 2011-02-03 2004-02-19|1996-07-31 -S000003548 ORF Verified YJL011C RPC17 DNA-directed RNA polymerase III subunit RPC17|C17 chromosome 10 10 414770 414285 C 2011-02-03 1996-07-31|2011-02-03 RNA polymerase III subunit C17; physically interacts with C31, C11, and TFIIIB70; may be involved in the recruitment of pol III by the preinitiation complex; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia -S000030894 CDS YJL011C 10 414770 414285 C 2011-02-03 1996-07-31|2011-02-03 -S000006625 tRNA_gene tK(CUU)J chromosome 10 L000003611 10 414966 415038 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000036030 noncoding_exon tK(CUU)J 10 414966 415038 W 2011-02-03 2000-05-19 -S000006773 tRNA_gene tW(CCA)J chromosome 10 L000003621 10 416036 415931 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis -S000033314 intron tW(CCA)J 10 416000 415967 C 2011-02-03 2000-05-19 -S000033313 noncoding_exon tW(CCA)J 10 415966 415931 C 2011-02-03 2000-05-19 -S000033312 noncoding_exon tW(CCA)J 10 416036 416001 C 2011-02-03 2000-05-19 -S000007047 long_terminal_repeat YJLWtau3 YJRWtau3 chromosome 10 10 416266 416441 W 2011-02-03 2000-05-19 Ty4 LTR -S000007029 long_terminal_repeat YJLWdelta8 chromosome 10 10 416506 416650 W 2011-02-03 2000-05-19 Ty1 LTR -S000007030 long_terminal_repeat YJLWdelta9 chromosome 10 10 416899 417026 W 2011-02-03 2000-05-19 Ty1 LTR -S000028451 ARS ARS1014 ARSX-417 chromosome 10 10 417195 417440 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000003547 ORF Verified YJL010C NOP9 RNA-binding RNA processing protein NOP9 chromosome 10 10 419562 417562 C 2011-02-03 1996-07-31 Essential subunit of U3-containing 90S preribosome; involved in production of 18S rRNA and assembly of small ribosomal subunit; also part of pre-40S ribosome and required for its export into cytoplasm; binds RNA and contains pumilio domain -S000030801 CDS YJL010C 10 419562 417562 C 2011-02-03 1996-07-31 -S000003546 ORF Dubious YJL009W chromosome 10 10 419855 420181 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps CCT8/YJL008C, a verified gene encoding a subunit of the cytosolic chaperonin Cct ring complex -S000031233 CDS YJL009W 10 419855 420181 W 2011-02-03 1996-07-31 -S000003545 ORF Verified YJL008C CCT8 chaperonin-containing T-complex subunit CCT8 chromosome 10 L000002764 10 421663 419957 C 2011-02-03 1996-07-31|2011-02-03 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo -S000031107 CDS YJL008C 10 421663 419957 C 2011-02-03 1996-07-31|2011-02-03 -S000007038 long_terminal_repeat YJLWtau4 chromosome 10 10 421946 422295 W 2011-02-03 2000-05-19|2011-02-03 Ty4 LTR -S000007031 long_terminal_repeat YJLWdelta10 chromosome 10 10 422601 422887 W 2011-02-03 2000-05-19 Ty1 LTR -S000006662 tRNA_gene tM(CAU)J2 EMT3 chromosome 10 L000000553|L000003612 10 422937 423009 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis -S000029922 noncoding_exon tM(CAU)J2 10 422937 423009 W 2011-02-03 2000-05-19 -S000003544 ORF Dubious YJL007C chromosome 10 10 423012 422698 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031008 CDS YJL007C 10 423012 422698 C 2011-02-03 1996-07-31 -S000003543 ORF Verified YJL006C CTK2 chromosome 10 L000003011 10 424109 423138 C 2011-02-03 1996-07-31 Beta subunit of C-terminal domain kinase I (CTDK-I); which phosphorylates both RNA pol II subunit Rpo21p to affect transcription and pre-mRNA 3' end processing, and ribosomal protein Rps2p to increase translational fidelity; relocalizes to the cytosol in response to hypoxia -S000030929 CDS YJL006C 10 424109 423138 C 2011-02-03 1996-07-31 -S000006650 tRNA_gene tL(UAA)J SUP51 SUP52 chromosome 10 L000002209|L000003620 10 424515 424432 C 0 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations -S000037406 noncoding_exon tL(UAA)J 10 424515 424432 C 2011-02-03 2000-05-19 -S000003542 ORF Verified YJL005W CYR1 adenylate cyclase|FIL1|TSM0185|SRA4|HSR1|CDC35 chromosome 10 L000000467 10 425157 431237 W 2 2011-02-03 1996-07-31 Adenylate cyclase; required for cAMP production and cAMP-dependent protein kinase signaling; the cAMP pathway controls a variety of cellular processes, including metabolism, cell cycle, stress response, stationary phase, and sporulation -S000029993 CDS YJL005W 10 425157 431237 W 2011-02-03 1996-07-31 -S000003541 ORF Verified YJL004C SYS1 chromosome 10 L000004153 10 432200 431589 C 2011-02-03 1996-07-31 Integral membrane protein of the Golgi; required for targeting of the Arf-like GTPase Arl3p to the Golgi; multicopy suppressor of ypt6 null mutation -S000037910 CDS YJL004C 10 432200 431589 C 2011-02-03 1996-07-31 -S000003540 ORF Verified YJL003W COX16 chromosome 10 10 432644 433000 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; required for assembly of cytochrome c oxidase -S000037880 CDS YJL003W 10 432644 433000 W 2011-02-03 1996-07-31 -S000003539 ORF Verified YJL002C OST1 dolichyl-diphosphooligosaccharide--protein glycotransferase subunit OST1|NLT1 chromosome 10 L000002649 10 434651 433221 C 2011-02-03 1996-07-31 Alpha subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins -S000035955 CDS YJL002C 10 434651 433221 C 2011-02-03 1996-07-31 -S000003538 ORF Verified YJL001W PRE3 proteasome core particle subunit beta 1|CRL21 chromosome 10 L000000418|L000001485 10 435163 435926 W 2011-02-03 1996-07-31 Beta 1 subunit of the 20S proteasome; responsible for cleavage after acidic residues in peptides -S000035909 CDS YJL001W 10 435163 435227 W 2011-02-03 1996-07-31 -S000035910 CDS YJL001W 10 435344 435926 W 2011-02-03 1996-07-31 -S000035911 intron YJL001W 10 435228 435343 W 2011-02-03 1996-07-31 -S000006471 centromere CEN10 CEN10 chromosome 10 L000000303 10 436425 436307 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome X centromere -S000077296 centromere_DNA_Element_I CEN10 10 436425 436416 C 2011-02-03 2004-10-08 -S000077297 centromere_DNA_Element_II CEN10 10 436415 436332 C 2011-02-03 2004-10-08 -S000077298 centromere_DNA_Element_III CEN10 10 436331 436307 C 2011-02-03 2004-10-08 -S000003761 ORF Verified YJR001W AVT1 chromosome 10 10 436802 438610 W 2011-02-03 1996-07-31 Vacuolar transporter; imports large neutral amino acids into the vacuole; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters -S000033093 CDS YJR001W 10 436802 438610 W 2011-02-03 1996-07-31 -S000003762 ORF Verified YJR002W MPP10 rRNA-processing protein MPP10 chromosome 10 L000004335 10 438865 440646 W 2011-02-03 1996-07-31 Component of the SSU processome and 90S preribosome; required for pre-18S rRNA processing, interacts with and controls the stability of Imp3p and Imp4p, essential for viability; similar to human Mpp10p -S000033184 CDS YJR002W 10 438865 440646 W 2011-02-03 1996-07-31 -S000003763 ORF Uncharacterized YJR003C MRX12 chromosome 10 10 442553 440994 C 2011-02-03 1996-07-31|2006-05-09 Protein that associates with mitochondrial ribosome; detected in highly purified mitochondria in high-throughput studies; predicted to be involved in ribosome biogenesis -S000033209 CDS YJR003C 10 442553 440994 C 2011-02-03 1996-07-31|2006-05-09 -S000028452 ARS ARS1015 chromosome 10 10 442556 442965 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000003764 ORF Verified YJR004C SAG1 AG(ALPHA)1 chromosome 10 L000001796 10 444861 442909 C 2 2011-02-03 1996-07-31 Alpha-agglutinin of alpha-cells; binds to Aga1p during agglutination, N-terminal half is homologous to the immunoglobulin superfamily and contains binding site for a-agglutinin, C-terminal half is highly glycosylated and contains GPI anchor -S000034030 CDS YJR004C 10 444861 442909 C 2011-02-03 1996-07-31 -S000003765 ORF Verified YJR005W APL1 YAP80 chromosome 10 L000002495 10 445923 448025 W 2011-02-03 1996-07-31 Beta-adaptin; large subunit of the clathrin associated protein complex (AP-2); involved in vesicle mediated transport; similar to mammalian beta-chain of the clathrin associated protein complex -S000034176 CDS YJR005W 10 445923 448025 W 2011-02-03 1996-07-31 -S000028523 ORF Verified YJR005C-A LSO1 chromosome 10 10 448758 448477 C 2011-02-03 2003-07-29 Protein with a potential role in response to iron deprivation; transcription increases during iron deprivation and during treatment with 2-(6-benzyl-2-pyridyl)quinazoline (BPQ) and copper; regulated by Aft1p and, to a lesser extent, by Aft2p; originally identified as a syntenic homolog of an Ashbya gossypii gene; localizes to nucleus and cytoplasm, and nuclear localization is enhanced under iron-replete conditions -S000030322 CDS YJR005C-A 10 448758 448477 C 2011-02-03 2003-07-29 -S000003766 ORF Verified YJR006W POL31 DNA-directed DNA polymerase delta subunit POL31|HYS2|SDP5|HUS2 chromosome 10 L000002981 10 449202 450665 W 2011-02-03 1996-07-31 Subunit of DNA polymerase delta (polymerase III); essential for cell viability; involved in DNA replication and DNA repair; forms a complex with Rev3p, Rev7p and Pol32p; relocalizes to the cytosol in response to hypoxia -S000035159 CDS YJR006W 10 449202 450665 W 2011-02-03 1996-07-31 -S000003767 ORF Verified YJR007W SUI2 translation initiation factor eIF2 subunit alpha chromosome 10 L000002178 10 451020 451934 W 2 2011-02-03 1996-07-31 Alpha subunit of the translation initiation factor eIF2; eIF2 is involved in identification of the start codon; phosphorylation of Ser51 is required for regulation of translation by inhibiting the exchange of GDP for GTP; protein abundance increases in response to DNA replication stress -S000035254 CDS YJR007W 10 451020 451934 W 2011-02-03 1996-07-31 -S000003768 ORF Verified YJR008W MHO1 chromosome 10 10 452430 453446 W 2011-02-03 1996-07-31 Protein of unknown function; inhibits haploid invasive growth when overexpressed; synthetically lethal with phospholipase C (PLC1); expression induced by mild heat-stress on a non-fermentable carbon source, upon entry into stationary phase and upon nitrogen deprivation; repressed by inosine and choline in an Opi1p-dependent manner; highly conserved from bacteria to human; Memo, the human homolog, is an ErbB2 interacting protein with an essential function in cell motility -S000035336 CDS YJR008W 10 452430 453446 W 2011-02-03 1996-07-31 -S000028453 ARS ARS1016 chromosome 10 10 454584 455555 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000003769 ORF Verified YJR009C TDH2 glyceraldehyde-3-phosphate dehydrogenase (phosphorylating) TDH2|GAPDH|GLD2 chromosome 10 L000002273 10 454681 453683 C 2.95 2011-02-03 1996-07-31 Glyceraldehyde-3-phosphate dehydrogenase (GAPDH), isozyme 2; involved in glycolysis and gluconeogenesis; tetramer that catalyzes reaction of glyceraldehyde-3-phosphate to 1,3 bis-phosphoglycerate; detected in cytoplasm and cell wall; protein abundance increases in response to DNA replication stress; GAPDH-derived antimicrobial peptides are active against a wide variety of wine-related yeasts and bateria; TDH2 has a paralog, TDH3, that arose from the whole genome duplication -S000035380 CDS YJR009C 10 454681 453683 C 2011-02-03 1996-07-31 -S000003771 ORF Verified YJR010W MET3 sulfate adenylyltransferase chromosome 10 L000001078 10 456239 457774 W 3 2011-02-03 1996-07-31 ATP sulfurylase; catalyzes the primary step of intracellular sulfate activation, essential for assimilatory reduction of sulfate to sulfide, involved in methionine metabolism; human homolog PAPSS2 complements yeast null mutant -S000031767 CDS YJR010W 10 456239 457774 W 2011-02-03 1996-07-31 -S000003770 ORF Verified YJR010C-A SPC1 signal peptidase complex subunit SPC1 chromosome 10 L000003006 10 458361 458077 C 2011-02-03 1996-07-31 Subunit of the signal peptidase complex (SPC); SPC cleaves the signal sequence from proteins targeted to the endoplasmic reticulum (ER); homolog of the SPC12 subunit of mammalian signal peptidase complex; protein abundance increases in response to DNA replication stress -S000037612 CDS YJR010C-A 10 458361 458077 C 2011-02-03 1996-07-31 -S000028454 ARS ARS1017 chromosome 10 10 459337 459895 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000003772 ORF Uncharacterized YJR011C chromosome 10 10 459426 458641 C 2011-02-03 1996-07-31 Putative protein of unknown function; GFP-fusion protein expression is induced in response to the DNA-damaging agent MMS -S000031827 CDS YJR011C 10 459426 458641 C 2011-02-03 1996-07-31 -S000003774 ORF Verified YJR013W GPI14 glycosylphosphatidylinositol-alpha 1,4 mannosyltransferase I|PMH1 chromosome 10 10 460382 461593 W 2011-02-03 2004-02-12|1996-07-31 Glycosylphosphatidylinositol-alpha 1,4 mannosyltransferase I; involved in GPI anchor biosynthesis, requires Pbn1p for function; homolog of mammalian PIG-M -S000037491 CDS YJR013W 10 460382 461593 W 2011-02-03 2004-02-12|1996-07-31 -S000003773 ORF Uncharacterized YJR012C chromosome 10 10 460418 459795 C 2011-02-03 1996-07-31 Essential protein of unknown function; proposed involvement in transport based on mass spectrometry analysis of copurifying proteins; partially overlaps neighboring ORF, GPI14/YJR013W -S000031960 CDS YJR012C 10 460418 459795 C 2011-02-03 1996-07-31 -S000003775 ORF Verified YJR014W TMA22 RBF22 chromosome 10 10 461829 462425 W 2011-02-03 1996-07-31 Protein of unknown function; associates with ribosomes and has a putative RNA binding domain; interacts with Tma20p; similar to human GRAP and human DRP1, which interacts with human Tma20p homolog MCT-1; protein abundance increases in response to DNA replication stress -S000037578 CDS YJR014W 10 461829 462425 W 2011-02-03 1996-07-31 -S000003776 ORF Uncharacterized YJR015W chromosome 10 10 462721 464253 W 2011-02-03 1996-07-31 Putative protein of unknown function; localizes to endoplasmic reticulum and cytoplasm; predicted to encode a membrane transporter based on phylogenetic analysis; not an essential gene; YJR015W has a paralog, SNG1, that arose from the whole genome duplication -S000037660 CDS YJR015W 10 462721 464253 W 2011-02-03 1996-07-31 -S000003777 ORF Verified YJR016C ILV3 dihydroxy-acid dehydratase ILV3 chromosome 10 L000000859 10 466208 464451 C 10 2011-02-03 1996-07-31 Dihydroxyacid dehydratase; catalyzes third step in the common pathway leading to biosynthesis of branched-chain amino acids -S000037686 CDS YJR016C 10 466208 464451 C 2011-02-03 1996-07-31 -S000003779 ORF Dubious YJR018W chromosome 10 10 466786 467148 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030641 CDS YJR018W 10 466786 467148 W 2011-02-03 1996-07-31 -S000003778 ORF Verified YJR017C ESS1 peptidylprolyl isomerase ESS1|PIN1|PTF1 chromosome 10 L000000587 10 467033 466521 C 17 2011-02-03 2003-09-22|1996-07-31 Peptidylprolyl-cis/trans-isomerase (PPIase); specific for phosphorylated S/T residues N-terminal to proline; regulates phosphorylation of RNAPII large subunit (Rpo21p) C-terminal domain (CTD) at Ser7; associates with phospho-Ser5 form of RNAPII in vivo; present along entire coding length of genes; represses initiation of CUTs; required for efficient termination of mRNA transcription, trimethylation of histone H3; human ortholog PIN1 can complement yeast null and ts mutants -S000030503 CDS YJR017C 10 467033 466521 C 2011-02-03 2003-09-22|1996-07-31 -S000003781 ORF Dubious YJR020W chromosome 10 10 468001 468333 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030190 CDS YJR020W 10 468001 468333 W 2011-02-03 1996-07-31 -S000003780 ORF Verified YJR019C TES1 PTE1 chromosome 10 L000003343 10 468281 467232 C 2011-02-03 1996-07-31 Peroxisomal acyl-CoA thioesterase; likely to be involved in fatty acid oxidation rather than fatty acid synthesis; conserved protein also found in human peroxisomes; TES1 mRNA levels increase during growth on fatty acids -S000030681 CDS YJR019C 10 468281 467232 C 2011-02-03 1996-07-31 -S000003782 ORF Verified YJR021C REC107 MER2 chromosome 10 L000001606 10 469579 468555 C 2011-02-03 1996-07-31 Protein involved in early stages of meiotic recombination; involved in coordination between the initiation of recombination and the first division of meiosis; part of a complex (Rec107p-Mei4p-Rec114p) required for ds break formation -S000030251 CDS YJR021C 10 469183 468555 C 2011-02-03 1996-07-31 -S000030250 CDS YJR021C 10 469579 469264 C 2011-02-03 1996-07-31 -S000030252 intron YJR021C 10 469263 469184 C 2011-02-03 1996-07-31 -S000003783 ORF Verified YJR022W LSM8 U4/U6-U5 snRNP complex subunit LSM8 chromosome 10 L000004687 10 469784 470113 W 2011-02-03 2003-09-22|1996-07-31 Lsm (Like Sm) protein; forms heteroheptameric complex (with Lsm2p, Lsm3p, Lsm4p, Lsm5p, Lsm6p, and Lsm7p) that is part of spliceosomal U6 snRNP and is also implicated in processing of pre-tRNA, pre-snoRNA, and pre-rRNA -S000033657 CDS YJR022W 10 469784 470113 W 2011-02-03 2003-09-22|1996-07-31 -S000003784 ORF Dubious YJR023C chromosome 10 10 470205 469804 C 2011-02-03 1996-07-31 Putative protein of unknown function; open reading frame overlaps LSM8/YJR022W encoding an essential snRNP protein required for RNA processing and splicing -S000033704 CDS YJR023C 10 470205 469804 C 2011-02-03 1996-07-31 -S000003785 ORF Verified YJR024C MDE1 methylthioribulose 1-phosphate dehydratase MDE1 chromosome 10 10 470964 470230 C 2011-02-03 1996-07-31 5'-methylthioribulose-1-phosphate dehydratase; acts in the methionine salvage pathway; potential Smt3p sumoylation substrate; expression downregulated by caspofungin and deletion mutant is caspofungin resistant -S000033856 CDS YJR024C 10 470964 470230 C 2011-02-03 1996-07-31 -S000003786 ORF Verified YJR025C BNA1 3-hydroxyanthranilate 3,4-dioxygenase|HAD1 chromosome 10 L000003490 10 471671 471138 C 2011-02-03 1996-07-31 3-hydroxyanthranilic acid dioxygenase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p -S000033981 CDS YJR025C 10 471671 471138 C 2011-02-03 1996-07-31 -S000007040 long_terminal_repeat YJRWdelta11 chromosome 10 10 472463 472800 W 2011-02-03 2000-05-19 Ty1 LTR -S000007048 LTR_retrotransposon YJRWTy1-1 Ty1 chromosome 10 10 472463 478384 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000003787 transposable_element_gene YJR026W gag protein chromosome 10 10 472760 474082 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034898 CDS YJR026W 10 472760 474082 W 2011-02-03 1996-07-31 -S000003788 transposable_element_gene YJR027W gag-pol fusion protein chromosome 10 10 472760 478028 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000035049 CDS YJR027W 10 472760 474061 W 2011-02-03 1996-07-31 -S000035050 CDS YJR027W 10 474063 478028 W 2011-02-03 1996-07-31 -S000035051 plus_1_translational_frameshift YJR027W 10 474062 474062 W 2011-02-03 1996-07-31 -S000007041 long_terminal_repeat YJRWdelta12 chromosome 10 10 478051 478384 W 2011-02-03 2000-05-19 Ty1 LTR -S000007049 LTR_retrotransposon YJRWTy1-2 Ty1 chromosome 10 10 478051 483972 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000003789 transposable_element_gene YJR028W gag protein chromosome 10 10 478344 479666 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035151 CDS YJR028W 10 478344 479666 W 2011-02-03 1996-07-31 -S000003790 transposable_element_gene YJR029W gag-pol fusion protein chromosome 10 10 478344 483612 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000036043 CDS YJR029W 10 478344 479644 W 2011-02-03 1996-07-31 -S000036044 CDS YJR029W 10 479646 483612 W 2011-02-03 1996-07-31 -S000036045 plus_1_translational_frameshift YJR029W 10 479645 479645 W 2011-02-03 1996-07-31 -S000007042 long_terminal_repeat YJRWdelta13 chromosome 10 10 483635 483972 W 2011-02-03 2000-05-19 Ty1 LTR -S000003791 ORF Uncharacterized YJR030C RBH2 RBH2 chromosome 10 10 486196 483959 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression repressed in carbon limited vs carbon replete chemostat cultures; non-essential gene; contains a PH-like domain; RBH2 has a paralog, RBH1, that arose from the whole genome duplication -S000034642 CDS YJR030C 10 486196 483959 C 2011-02-03 1996-07-31 -S000003792 ORF Verified YJR031C GEA1 Arf family guanine nucleotide exchange factor GEA1 chromosome 10 L000004312 10 490812 486586 C 2011-02-03 1996-07-31 Guanine nucleotide exchange factor for ADP ribosylation factors (ARFs); involved in vesicular transport between the Golgi and ER, Golgi organization, and actin cytoskeleton organization; GEA1 has a paralog, GEA2, that arose from the whole genome duplication -S000034771 CDS YJR031C 10 490812 486586 C 2011-02-03 1996-07-31 -S000003793 ORF Verified YJR032W CPR7 peptidylprolyl isomerase CPR7 chromosome 10 L000003230 10 491081 492262 W 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; binds to Hsp82p and contributes to chaperone activity; plays a role in determining prion variants -S000035830 CDS YJR032W 10 491081 492262 W 2011-02-03 1996-07-31 -S000003794 ORF Verified YJR033C RAV1 SOI3 chromosome 10 S000029472|L000002969 10 496451 492378 C 2011-02-03 1996-07-31 Subunit of RAVE complex (Rav1p, Rav2p, Skp1p); the RAVE complex promotes assembly of the V-ATPase holoenzyme; required for transport between the early and late endosome/PVC and for localization of TGN membrane proteins; potential Cdc28p substrate -S000035875 CDS YJR033C 10 496451 492378 C 2011-02-03 1996-07-31 -S000003795 ORF Verified YJR034W PET191 chromosome 10 L000001400 10 496683 497009 W 2011-02-03 1996-07-31 Protein required for assembly of cytochrome c oxidase; exists as an oligomer; described as both an integral mitochondrial inner membrane protein facing the intermembrane space (IMS) and as a soluble IMS protein; contains a twin Cx9C motif; imported into the IMS via the MIA import machinery -S000037813 CDS YJR034W 10 496683 497009 W 2011-02-03 1996-07-31 -S000003796 ORF Verified YJR035W RAD26 DNA-dependent ATPase RAD26 chromosome 10 L000001569 10 497355 500612 W 2011-02-03 1996-07-31 Protein involved in transcription-coupled nucleotide excision repair; repairs UV-induced DNA lesions; recruitment to DNA lesions is dependent on an elongating RNA polymerase II; homolog of human CSB protein -S000037907 CDS YJR035W 10 497355 500612 W 2011-02-03 1996-07-31 -S000003798 ORF Dubious YJR037W chromosome 10 10 503102 503485 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene HUL4/YJR036C; deletion mutant has decreased spore survival in Drosophila feces -S000030927 CDS YJR037W 10 503102 503485 W 2011-02-03 1996-07-31 -S000003797 ORF Verified YJR036C HUL4 putative E3 ubiquitin-protein ligase HUL4 chromosome 10 10 503391 500713 C 2011-02-03 1996-07-31 Protein with similarity to hect domain E3 ubiquitin-protein ligases; not essential for viability; found in association with Trf4 in TRAMP complex -S000029850 CDS YJR036C 10 503391 500713 C 2011-02-03 1996-07-31 -S000003800 ORF Uncharacterized YJR039W chromosome 10 10 503936 507301 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000031105 CDS YJR039W 10 503936 507301 W 2011-02-03 1996-07-31 -S000003799 ORF Dubious YJR038C chromosome 10 10 504072 503710 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030967 CDS YJR038C 10 504072 503710 C 2011-02-03 1996-07-31 -S000003801 ORF Verified YJR040W GEF1 CLC chromosome 10 L000000701 10 507746 510085 W 2011-02-03 1996-07-31 Voltage-gated chloride channel; localized to the golgi, the endosomal system, and plasma membrane; involved in cation homeostasis; highly homologous to vertebrate voltage-gated chloride channels; modulates TBSV model (+) RNA virus replication by regulating copper metabolism -S000030664 CDS YJR040W 10 507746 510085 W 2011-02-03 1996-07-31 -S000003802 ORF Verified YJR041C URB2 NPA2 chromosome 10 10 513763 510239 C 2011-02-03 1996-07-31 Protein required for normal metabolism of the rRNA primary transcript; nucleolar protein; proposed to be involved in ribosome biogenesis -S000030713 CDS YJR041C 10 513763 510239 C 2011-02-03 1996-07-31 -S000003803 ORF Verified YJR042W NUP85 RAT9 chromosome 10 L000003023 10 514055 516289 W 2011-02-03 1996-07-31 Subunit of the Nup84p subcomplex of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport and NPC biogenesis and is involved in establishment of a normal nucleocytoplasmic concentration gradient of the GTPase Gsp1p; also plays roles in several processes that may require localization of genes or chromosomes at the nuclear periphery, including double-strand break repair, transcription and chromatin silencing; homologous to human NUP85 aka NUP75 -S000030892 CDS YJR042W 10 514055 516289 W 2011-02-03 1996-07-31 -S000003804 ORF Verified YJR043C POL32 DNA polymerase delta subunit POL32|REV5 chromosome 10 L000004337|S000029416|L000001617 10 517513 516461 C 2011-02-03 1996-07-31 Third subunit of DNA polymerase delta; involved in chromosomal DNA replication; required for error-prone DNA synthesis in the presence of DNA damage and processivity; forms a complex with Rev3p, Rev7p and Pol31p; interacts with Hys2p, PCNA (Pol30p), and Pol1p -S000031802 CDS YJR043C 10 517513 516461 C 2011-02-03 1996-07-31 -S000006663 tRNA_gene tM(CAU)J3 IMT3 chromosome 10 L000003619 10 517884 517813 C 2011-02-03 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation -S000029924 noncoding_exon tM(CAU)J3 10 517884 517813 C 2011-02-03 2000-05-19 -S000007043 long_terminal_repeat YJRWdelta14 chromosome 10 10 517959 518099 W 2011-02-03 2000-05-19 Ty1 LTR -S000003805 ORF Verified YJR044C VPS55 chromosome 10 10 519185 518763 C 2011-02-03 1996-07-31 Late endosomal protein involved in late endosome to vacuole transport; functional homolog of human obesity receptor gene-related protein (OB-RGRP) -S000031950 CDS YJR044C 10 519185 518763 C 2011-02-03 1996-07-31 -S000003806 ORF Verified YJR045C SSC1 Hsp70 family ATPase SSC1|mtHSP70|ENS1 chromosome 10 L000000561 10 521602 519638 C 2011-02-03 1996-07-31 Hsp70 family ATPase; constituent of the import motor component of the Translocase of the Inner Mitochondrial membrane (TIM23 complex); involved in protein translocation and folding; subunit of SceI endonuclease; SSC1 has a paralog, ECM10, that arose from the whole genome duplication -S000032104 CDS YJR045C 10 521602 519638 C 2011-02-03 1996-07-31 -S000003807 ORF Verified YJR046W TAH11 CDT1|SID2 chromosome 10 L000004733 10 522048 523862 W 2011-02-03 1996-07-31 DNA replication licensing factor; required for pre-replication complex assembly -S000034108 CDS YJR046W 10 522048 523862 W 2011-02-03 1996-07-31 -S000006727 tRNA_gene tS(AGA)J chromosome 10 L000003618 10 524093 524012 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032380 noncoding_exon tS(AGA)J 10 524093 524012 C 2011-02-03 2000-05-19 -S000003808 ORF Verified YJR047C ANB1 translation elongation factor eIF-5A|eIF-5A|eIF5A|TIF51B|HYP1 chromosome 10 L000000085|L000000846|L000002308 10 525381 524908 C 2011-02-03 1996-07-31 Translation elongation factor eIF-5A; previously thought to function in translation initiation; undergoes an essential hypusination modification; expressed under anaerobic conditions; ANB1 has a paralog, HYP2, that arose from the whole genome duplication; human EIF5A complements the inviability of the yeast hyp2 anb1 double null mutant -S000034179 CDS YJR047C 10 525381 524908 C 2011-02-03 1996-07-31 -S000003809 ORF Verified YJR048W CYC1 cytochrome c isoform 1 chromosome 10 L000000448 10 526335 526664 W 34 2011-02-03 1996-07-31 Cytochrome c, isoform 1; also known as iso-1-cytochrome c; electron carrier of mitochondrial intermembrane space that transfers electrons from ubiquinone-cytochrome c oxidoreductase to cytochrome c oxidase during cellular respiration; CYC1 has a paralog, CYC7, that arose from the whole genome duplication; human homolog CYC1 can complement yeast null mutant; mutations in human CYC1 cause insulin-responsive hyperglycemia -S000034309 CDS YJR048W 10 526335 526664 W 2011-02-03 1996-07-31 -S000003810 ORF Verified YJR049C UTR1 NADH/NAD(+) kinase chromosome 10 L000002680 10 528476 526884 C 2011-02-03 1996-07-31 ATP-NADH kinase; phosphorylates both NAD and NADH; active as a hexamer; enhances the activity of ferric reductase (Fre1p); UTR1 has a paralog, YEF1, that arose from the whole genome duplication -S000034337 CDS YJR049C 10 528476 526884 C 2011-02-03 1996-07-31 -S000003811 ORF Verified YJR050W ISY1 NTC30|UTR3 chromosome 10 L000002730 10 528697 529404 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); NTC contains Prp19p and stabilizes U6 snRNA in catalytic forms of spliceosome containing U2, U5, and U6 snRNAs; interacts with Prp16p to modulate splicing fidelity; isy1 syf2 cells have defective spindles -S000033850 CDS YJR050W 10 528697 529404 W 2011-02-03 1996-07-31 -S000003812 ORF Verified YJR051W OSM1 fumarate reductase|FRDS2 chromosome 10 L000001317 10 529861 531366 W 34 2011-02-03 1996-07-31 Fumarate reductase, catalyzes the reduction of fumarate to succinate; required for the reoxidation of intracellular NADH under anaerobic conditions; mutations cause osmotic sensitivity; has two translation start sites, one at the annotated start codon which produces an ER-targeted form required for anaerobic growth, and one at codon 32 which produces a mitochondrially-targeted form; OSM1 has a paralog, FRD1, that arose from the whole genome duplication -S000033966 CDS YJR051W 10 529861 531366 W 2011-02-03 1996-07-31 -S000007032 long_terminal_repeat YJRCdelta15 YJLWdelta15 chromosome 10 10 531675 531516 C 2011-02-03 2000-05-19|2007-04-04 Ty1 LTR -S000006584 tRNA_gene tG(GCC)J2 SUF23 chromosome 10 L000003613|S000029541|L000002170 10 531828 531898 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly); can mutate to suppress +1 frameshift mutations -S000030417 noncoding_exon tG(GCC)J2 10 531828 531898 W 2011-02-03 2000-05-19 -S000003813 ORF Verified YJR052W RAD7 UV-damaged DNA-binding protein RAD7 chromosome 10 L000001561 10 532062 533759 W 35 2011-02-03 1996-07-31 Nucleotide excision repair (NER) protein; binds damaged DNA during NER; binds DNA in an ATP-dependent manner (with Rad16p) during NER; required for repair of non-transcribed chromatin; subunit of Nucleotide Excision Repair Factor 4 (NEF4) and the Elongin-Cullin-Socs (ECS) ligase complex -S000034844 CDS YJR052W 10 532062 533759 W 2011-02-03 1996-07-31 -S000003814 ORF Verified YJR053W BFA1 IBD1 chromosome 10 10 534027 535751 W 2011-02-03 1996-07-31 Subunit of a two-component GTPase-activating protein, Bfa1p-Bub2p; contributes to GAP activity, inactivating Tem1 by stimulating GTP hydrolysis following damage or misalignment of the mitotic spindle; functions as a guanine-nucleotide exchange inhibitor (GDI) for Tem1p; involved in multiple cell cycle checkpoint pathways that control mitotic exit; required when telomeres are damaged, but not for all types of chromosomal DNA damage; phosphorylated by the Polo-like kinase Cdc5p -S000034983 CDS YJR053W 10 534027 535751 W 2011-02-03 1996-07-31 -S000003815 ORF Verified YJR054W KCH1 ERM6 chromosome 10 10 536056 537549 W 2011-02-03 1996-07-31 Potassium transporter that mediates K+ influx; activates high-affinity Ca2+ influx system (HACS) during mating pheromone response; expression up-regulated in response to alpha factor; localized to sites of polarized growth; member of a fungal-specific gene family; potential Cdc28p substrate; KCH1 has a paralog, PRM6, that arose from the whole genome duplication -S000035180 CDS YJR054W 10 536056 537549 W 2011-02-03 1996-07-31 -S000007033 long_terminal_repeat YJRCdelta16 YJLWdelta16 chromosome 10 10 538041 537741 C 2011-02-03 2000-05-19|2007-04-04 Ty1 LTR -S000007044 long_terminal_repeat YJRWdelta17 chromosome 10 10 538103 538434 W 2011-02-03 2000-05-19 Ty1 LTR -S000006707 tRNA_gene tR(CCU)J HSX1 chromosome 10 10 538555 538626 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; low abundance tRNA required for growth on nonfermentable carbon sources at high temperatures, for synthesis of heat shock protein Ssc1p, and for Ty1 retrotransposition through the regulation of translational frameshifting -S000032860 noncoding_exon tR(CCU)J 10 538555 538626 W 2011-02-03 2000-05-19 -S000003816 ORF Verified YJR055W HIT1 chromosome 10 L000000786 10 538772 539266 W 2011-02-03 1996-07-31 Protein involved in C/D snoRNP assembly; regulates abundance of Rsa1p; required for growth at high temperature; similar to human ZNHIT3 -S000036066 CDS YJR055W 10 538772 539266 W 2011-02-03 1996-07-31 -S000028455 ARS ARS1018 ARSX-540 chromosome 10 10 540546 540780 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000007045 long_terminal_repeat YJRWdelta18 chromosome 10 10 540766 541087 W 2011-02-03 2000-05-19 Ty1 LTR -S000007034 long_terminal_repeat YJRCdelta19 YJLWdelta19 chromosome 10 10 541427 541095 C 2011-02-03 2000-05-19|2007-04-04 Ty1 LTR -S000006539 tRNA_gene tD(GUC)J4 chromosome 10 L000003615 10 541508 541579 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030795 noncoding_exon tD(GUC)J4 10 541508 541579 W 2011-02-03 2000-05-19 -S000003817 ORF Verified YJR056C chromosome 10 10 542502 541792 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus; relative distribution to the nucleus increases upon DNA replication stress -S000036154 CDS YJR056C 10 542502 541792 C 2011-02-03 1996-07-31 -S000006782 tRNA_gene tY(GUA)J2 SUP4 chromosome 10 L000003617|L000002183 10 543044 542956 C 36 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000032087 intron tY(GUA)J2 10 543005 542992 C 2011-02-03 2000-05-19 -S000032086 noncoding_exon tY(GUA)J2 10 542991 542956 C 2011-02-03 2000-05-19 -S000032085 noncoding_exon tY(GUA)J2 10 543044 543006 C 2011-02-03 2000-05-19 -S000007046 long_terminal_repeat YJRWdelta20 chromosome 10 10 543448 543770 W 2011-02-03 2000-05-19 Ty1 LTR -S000003818 ORF Verified YJR057W CDC8 bifunctional thymidylate/uridylate kinase chromosome 10 L000000248 10 544062 544712 W 36 2011-02-03 1996-07-31 Thymidylate and uridylate kinase; functions in de novo biosynthesis of pyrimidine deoxyribonucleotides; converts dTMP to dTDP and dUMP to dUTP; essential for mitotic and meiotic DNA replication; homologous to S. pombe tmp1; human homolog DTYMK can complement yeast cdc8 null mutant -S000036320 CDS YJR057W 10 544062 544712 W 2011-02-03 1996-07-31 -S000003819 ORF Verified YJR058C APS2 YAP17 chromosome 10 L000002492 10 545175 544732 C 2011-02-03 1996-07-31 Small subunit of the clathrin-associated adaptor complex AP-2; AP-2 is involved in protein sorting at the plasma membrane; related to the sigma subunit of the mammalian plasma membrane clathrin-associated protein (AP-2) complex -S000036359 CDS YJR058C 10 545175 544732 C 2011-02-03 1996-07-31 -S000003820 ORF Verified YJR059W PTK2 protein kinase PTK2|STK2 chromosome 10 L000003492 10 545787 548243 W 2011-02-03 1996-07-31 Serine/threonine protein kinase; involved in regulation of ion transport across plasma membrane; carboxyl terminus is essential for glucose-dependent Pma1p activation via phosphorylation of Pma1p-Ser899; enhances spermine uptake; PTK2 has a paralog, PTK1, that arose from the whole genome duplication -S000030117 CDS YJR059W 10 545787 548243 W 2011-02-03 1996-07-31 -S000003821 ORF Verified YJR060W CBF1 GFII|CP1|CPF1|CEP1 chromosome 10 L000000311|L000000401 10 548759 549814 W 40 2011-02-03 1996-07-31 Basic helix-loop-helix (bHLH) protein; forms homodimer to bind E-box consensus sequence CACGTG present at MET gene promoters and centromere DNA element I (CDEI); affects nucleosome positioning at this motif; associates with other transcription factors such as Met4p and Isw1p to mediate transcriptional activation or repression; associates with kinetochore proteins, required for chromosome segregation; protein abundance increases in response to DNA replication stress -S000037892 CDS YJR060W 10 548759 549814 W 2011-02-03 1996-07-31 -S000003822 ORF Uncharacterized YJR061W chromosome 10 10 550511 553318 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; transcription repressed by Rm101p; YJR061W has a paralog, MNN4, that arose from the whole genome duplication -S000029930 CDS YJR061W 10 550511 553318 W 2011-02-03 1996-07-31 -S000003823 ORF Verified YJR062C NTA1 amidase|DEA1 chromosome 10 L000001279 10 554849 553476 C 2011-02-03 1996-07-31 Amidase; removes the amide group from N-terminal asparagine and glutamine residues to generate proteins with N-terminal aspartate and glutamate residues that are targets of ubiquitin-mediated degradation -S000029976 CDS YJR062C 10 554849 553476 C 2011-02-03 1996-07-31 -S000003824 ORF Verified YJR063W RPA12 DNA-directed RNA polymerase I core subunit RPA12|A12.2|RRN4 chromosome 10 L000001672 10 555195 555572 W 2011-02-03 1996-07-31 RNA polymerase I subunit A12.2; contains two zinc binding domains, and the N terminal domain is responsible for anchoring to the RNA pol I complex; physically interacts with transcriptional activator Msn4p, to regulate transcription of AYR1, a gene involved in lipid metabolism -S000031049 CDS YJR063W 10 555195 555572 W 2011-02-03 1996-07-31 -S000003825 ORF Verified YJR064W CCT5 chaperonin-containing T-complex subunit CCT5|TCP5 chromosome 10 L000002717 10 555914 557602 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo -S000031152 CDS YJR064W 10 555914 557602 W 2011-02-03 1996-07-31 -S000003826 ORF Verified YJR065C ARP3 actin-related protein 3|ACT4 chromosome 10 L000003198 10 559158 557809 C 2011-02-03 1996-07-31 Essential component of the Arp2/3 complex; Arp2/3 is a highly conserved actin nucleation center required for the motility and integrity of actin patches; involved in endocytosis and membrane growth and polarity -S000031207 CDS YJR065C 10 559158 557809 C 2011-02-03 1996-07-31 -S000003827 ORF Verified YJR066W TOR1 phosphatidylinositol kinase-related protein kinase TOR1|DRR1 chromosome 10 L000002322 10 559416 566828 W 44.84 2011-02-03 1996-07-31 PIK-related protein kinase and rapamycin target; subunit of TORC1, a complex that controls growth in response to nutrients by regulating translation, transcription, ribosome biogenesis, nutrient transport and autophagy; involved in meiosis; TOR1 has a paralog, TOR2, that arose from the whole genome duplication -S000032272 CDS YJR066W 10 559416 566828 W 2011-02-03 1996-07-31 -S000003828 ORF Verified YJR067C YAE1 chromosome 10 L000004159 10 567444 567019 C 2011-02-03 1996-07-31 Protein that forms a complex with Lto1p and Rli1p; essential for growth under standard (aerobic) conditions but not under anaerobic conditions; may have a role in protection of ribosomal assembly and function from damage due to reactive oxygen species -S000032323 CDS YJR067C 10 567444 567019 C 2011-02-03 1996-07-31 -S000003829 ORF Verified YJR068W RFC2 replication factor C subunit 2 chromosome 10 L000001623 10 567643 568704 W 2011-02-03 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); RF-C is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon -S000032475 CDS YJR068W 10 567643 568704 W 2011-02-03 1996-07-31 -S000003830 ORF Verified YJR069C HAM1 nucleoside triphosphate pyrophosphohydrolase HAM1 chromosome 10 L000003233 10 569399 568806 C 2011-02-03 1996-07-31 Nucleoside triphosphate pyrophosphohydrolase; active against various substrates including ITP, dITP and XTP; mediates exclusion of non canonical purines, pyrimidines from dNTP pools; functions with YJL055W to mediate resistance to 5-FU; specifically reduces the incorporation of 5-FU into RNA without affecting uptake or incorporation of uracil into RNA; protein abundance increases in response to DNA replication stress; yeast HAM1 can complement knockdown of human homolog ITPA -S000034432 CDS YJR069C 10 569399 568806 C 2011-02-03 1996-07-31 -S000003832 ORF Dubious YJR071W chromosome 10 10 570405 570773 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033295 CDS YJR071W 10 570405 570773 W 2011-02-03 1996-07-31 -S000003831 ORF Verified YJR070C LIA1 MMD1 chromosome 10 10 570598 569621 C 2011-02-03 1996-07-31 Deoxyhypusine hydroxylase; HEAT-repeat containing metalloenzyme that catalyzes hypusine formation; binds to and is required for the modification of Hyp2p (eIF5A); complements S. pombe mmd1 mutants defective in mitochondrial positioning; protein abundance increases in response to DNA replication stress -S000033205 CDS YJR070C 10 570598 569621 C 2011-02-03 1996-07-31 -S000003833 ORF Verified YJR072C NPA3 GTPase NPA3|GPN1|EPA1 chromosome 10 10 572124 570967 C 2011-02-03 1996-07-31 Member of the conserved GPN-loop GTPase family; has a role in transport of RNA polymerase II to the nucleus; exhibits GTP-dependent binding to PolII; has ATPase activity; involved in sister chromatid cohesion; phosphorylated by the Pcl1p-Pho85p kinase complex; human homolog XAB1 interacts with human RNA polymerase II; protein abundance increases in response to DNA replication stress -S000034114 CDS YJR072C 10 572124 570967 C 2011-02-03 1996-07-31 -S000003834 ORF Verified YJR073C OPI3 bifunctional phosphatidyl-N-methylethanolamine N-methyltransferase/phosphatidyl-N-dimethylethanolamine N-methyltransferase|PEM2 chromosome 10 L000001304 10 572935 572315 C 2011-02-03 1996-07-31 Methylene-fatty-acyl-phospholipid synthase; catalyzes the last two steps in phosphatidylcholine biosynthesis; also known as phospholipid methyltransferase -S000034233 CDS YJR073C 10 572935 572315 C 2011-02-03 1996-07-31 -S000003835 ORF Verified YJR074W MOG1 Ran GTPase-binding protein MOG1 chromosome 10 L000004615 10 573095 573751 W 2011-02-03 1996-07-31 Conserved nuclear protein that interacts with GTP-Gsp1p; stimulates nucleotide release from Gsp1p; involved in nuclear protein import; nucleotide release is inhibited by Yrb1p -S000034411 CDS YJR074W 10 573095 573751 W 2011-02-03 1996-07-31 -S000003836 ORF Verified YJR075W HOC1 alpha-1,6-mannosyltransferase chromosome 10 L000003274 10 573981 575171 W 2011-02-03 1996-07-31 Alpha-1,6-mannosyltransferase; involved in cell wall mannan biosynthesis; subunit of a Golgi-localized complex that also contains Anp1p, Mnn9p, Mnn11p, and Mnn10p; identified as a suppressor of a cell lysis sensitive pkc1-371 allele -S000035455 CDS YJR075W 10 573981 575171 W 2011-02-03 1996-07-31 -S000003837 ORF Verified YJR076C CDC11 septin CDC11|PSL9 chromosome 10 L000000251 10 576601 575354 C 54 2011-02-03 1996-07-31 Component of the septin ring that is required for cytokinesis; present at the ends of rod-like septin hetero-oligomers; C-terminal extension is important for recruitment of Bni5p to the mother-bud neck, which in turn is required for Myo1p recruitment and cytokinesis; septin rings at the mother-bud neck act as scaffolds for recruiting cell division factors and as barriers to prevent diffusion of specific proteins between mother and daughter cells -S000035494 CDS YJR076C 10 576601 575354 C 2011-02-03 1996-07-31 -S000003838 ORF Verified YJR077C MIR1 PTP chromosome 10 L000001114 10 578190 577255 C 2011-02-03 1996-07-31 Mitochondrial phosphate carrier; imports inorganic phosphate into mitochondria; functionally redundant with Pic2p but more abundant than Pic2p under normal conditions; phosphorylated -S000035596 CDS YJR077C 10 578190 577255 C 2011-02-03 1996-07-31 -S000003839 ORF Verified YJR078W BNA2 dioxygenase BNA2 chromosome 10 10 578860 580221 W 2011-02-03 1996-07-31 Tryptophan 2,3-dioxygenase or indoleamine 2,3-dioxygenase; required for de novo biosynthesis of NAD from tryptophan via kynurenine; interacts genetically with telomere capping gene CDC13; regulated by Hst1p and Aftp -S000036561 CDS YJR078W 10 578860 580221 W 2011-02-03 1996-07-31 -S000003840 ORF Uncharacterized YJR079W chromosome 10 10 580205 581239 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutation results in impaired mitochondrial respiration -S000036624 CDS YJR079W 10 580205 580347 W 2011-02-03 1996-07-31 -S000036625 CDS YJR079W 10 581053 581239 W 2011-02-03 1996-07-31 -S000036626 intron YJR079W 10 580348 581052 W 2011-02-03 1996-07-31 -S000003841 ORF Verified YJR080C AIM24 FMP26 chromosome 10 10 581616 580432 C 2011-02-03 1996-07-31 Protein with a role in determining mitochondrial architecture; inner membrane protein that interacts physically and genetically with the MICOS complex and is required for its integrity -S000037402 CDS YJR080C 10 581616 580432 C 2011-02-03 1996-07-31 -S000003842 ORF Verified YJR082C EAF6 chromosome 10 10 582255 581914 C 2011-02-03 1996-07-31 Subunit of the NuA4 acetyltransferase complex; this complex acetylates histone H4 and NuA3 acetyltransferase complex that acetylates histone H3 -S000030287 CDS YJR082C 10 582255 581914 C 2011-02-03 1996-07-31 -S000003843 ORF Verified YJR083C ACF4 chromosome 10 10 583537 582608 C 2011-02-03 1996-07-31 Protein of unknown function; computational analysis of large-scale protein-protein interaction data suggests a possible role in actin cytoskeleton organization; potential Cdc28p substrate -S000030434 CDS YJR083C 10 583537 582608 C 2011-02-03 1996-07-31 -S000003844 ORF Verified YJR084W CSN12 chromosome 10 S000007581 10 583733 585004 W 2011-02-03 1996-07-31 Protein that forms a complex with Thp3p; may have a role in transcription elongation and/or mRNA splicing; identified as a COP9 signalosome component but phenotype and interactions suggest it may not be involved with the signalosome -S000031409 CDS YJR084W 10 583733 585004 W 2011-02-03 1996-07-31 -S000003845 ORF Verified YJR085C chromosome 10 10 585437 585120 C 2011-02-03 1996-07-31 Protein of unknown function; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress -S000031477 CDS YJR085C 10 585437 585120 C 2011-02-03 1996-07-31 -S000003846 ORF Verified YJR086W STE18 chromosome 10 L000002122 10 586068 586400 W 59 2011-02-03 1996-07-31 G protein gamma subunit; forms a dimer with Ste4p to activate the mating signaling pathway, forms a heterotrimer with Gpa1p and Ste4p to dampen signaling; C-terminus is palmitoylated and farnesylated, which are required for normal signaling -S000031665 CDS YJR086W 10 586068 586400 W 2011-02-03 1996-07-31 -S000003847 ORF Dubious YJR087W chromosome 10 10 586400 586750 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified genes STE18 and ECM2 -S000032646 CDS YJR087W 10 586400 586750 W 2011-02-03 1996-07-31 -S000003848 ORF Verified YJR088C EMC2 chromosome 10 10 587373 586495 C 2011-02-03 1996-07-31 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; homologous to worm Y57G7A.10/EMC-2, fly CG17556, human TTC35 -S000032686 CDS YJR088C 10 587373 586495 C 2011-02-03 1996-07-31 -S000003849 ORF Verified YJR089W BIR1 chromosome 10 L000004754 10 587718 590582 W 2011-02-03 1996-07-31 Subunit of chromosomal passenger complex (CPC); CPC is comprised of Ipl1p-Sli15p-Bir1p-Nbl1p and regulates chromosome segregation; required for chromosome bi-orientation and for spindle assembly checkpoint activation upon reduced sister kinetochore tension; relative distribution to shortened microtubules increases upon DNA replication stress; sumoylated in an Mms21p-dependent manner; human survivin homolog -S000032816 CDS YJR089W 10 587718 590582 W 2011-02-03 1996-07-31 -S000003850 ORF Verified YJR090C GRR1 SCF ubiquitin ligase complex subunit GRR1|SDC1|SSU2|COT2|CAT80 chromosome 10 L000000730 10 594327 590872 C 60 2011-02-03 1996-07-31 F-box protein component of an SCF ubiquitin-ligase complex; modular substrate specificity factor which associates with core SCF (Cdc53p, Skp1p and Hrt1p/Rbx1p) to form the SCF(Grr1) complex; SCF(Grr1) acts as a ubiquitin-protein ligase directing ubiquitination of substrates such as: Gic2p, Mks1p, Mth1p, Cln1p, Cln2p and Cln3p; involved in carbon catabolite repression, glucose-dependent divalent cation transport, glucose transport, morphogenesis, and sulfite detoxification -S000032905 CDS YJR090C 10 594327 590872 C 2011-02-03 1996-07-31 -S000003851 ORF Verified YJR091C JSN1 PUF1 chromosome 10 L000002964 10 598336 595061 C 2011-02-03 1996-07-31 Member of the Puf family of RNA-binding proteins; interacts with mRNAs encoding membrane-associated proteins; involved in localizing the Arp2/3 complex to mitochondria; overexpression causes increased sensitivity to benomyl; JSN1 has a paralog, PUF2, that arose from the whole genome duplication -S000033011 CDS YJR091C 10 598336 595061 C 2011-02-03 1996-07-31 -S000003852 ORF Verified YJR092W BUD4 chromosome 10 L000000201 10 598735 603078 W 2011-02-03 2004-04-20|1996-07-31|1997-07-27|2008-06-04 Anillin-like protein involved in bud-site selection; required for the axial budding pattern; required for the formation and disassembly of the double septin ring structure, and generally for septin organization; functions as a platform linking the cytokinesis tag septins to the axial landmark through its multiple domains; in vivo substrate of Cdc28p/Clb2p -S000033797 CDS YJR092W 10 598735 603078 W 2011-02-03 2004-04-20|1996-07-31|1997-07-27|2008-06-04 -S000003853 ORF Verified YJR093C FIP1 cleavage polyadenylation factor subunit FIP1 chromosome 10 L000002775 10 604203 603220 C 2011-02-03 1996-07-31 Subunit of cleavage polyadenylation factor (CPF); interacts directly with poly(A) polymerase (Pap1p) to regulate its activity; bridging factor that links Pap1p and the CPF complex via Yth1p -S000033863 CDS YJR093C 10 604203 603220 C 2011-02-03 1996-07-31 -S000003854 ORF Verified YJR094C IME1 transcription factor IME1 chromosome 10 L000000861 10 605651 604569 C 2011-02-03 1996-07-31 Master regulator of meiosis that is active only during meiotic events; activates transcription of early meiotic genes through interaction with Ume6p; degraded by the 26S proteasome following phosphorylation by Ime2p; transcription is negatively regulated in cis by the IRT1 long noncoding antisense RNA -S000034019 CDS YJR094C 10 605651 604569 C 2011-02-03 1996-07-31 -S000178119 ncRNA_gene IRT1 IRT1 SUT643 chromosome 10 10 607424 605936 C 2014-11-18 2014-11-18 Long noncoding RNA that governs mating-type control of gametogenesis; located in the IME1 promoter; in haploids, expression of IME1, the central inducer of gametogenesis, is inhibited in cis by transcription of IRT1, which recruits the Set2p histone methyltransferase and the Set3p histone deacetylase complex to establish repressive chromatin at the IME1 promoter -S000178120 noncoding_exon IRT1 10 607424 605936 C 2014-11-18 2014-11-18 -S000003855 ORF Verified YJR094W-A RPL43B eL43|ribosomal 60S subunit protein L43B|L43e|L43B chromosome 10 L000004470 10 608305 608858 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L43B; homologous to mammalian ribosomal protein L37A, no bacterial homolog; RPL43B has a paralog, RPL43A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000034757 CDS YJR094W-A 10 608305 608306 W 2011-02-03 1996-07-31 -S000034758 CDS YJR094W-A 10 608582 608858 W 2011-02-03 1996-07-31 -S000034759 intron YJR094W-A 10 608307 608581 W 2011-02-03 1996-07-31 -S000003856 ORF Verified YJR095W SFC1 ACR1 chromosome 10 L000000023 10 609773 610741 W 2011-02-03 1996-07-31 Mitochondrial succinate-fumarate transporter; transports succinate into and fumarate out of the mitochondrion; required for ethanol and acetate utilization -S000034990 CDS YJR095W 10 609773 610741 W 2011-02-03 1996-07-31 -S000003857 ORF Verified YJR096W aldo-keto reductase superfamily protein chromosome 10 10 611195 612043 W 2011-02-03 1996-07-31 Xylose and arabinose reductase; member of the aldo-keto reductase (AKR) family; GFP-fusion protein is induced in response to the DNA-damaging agent MMS -S000035147 CDS YJR096W 10 611195 612043 W 2011-02-03 1996-07-31 -S000003858 ORF Verified YJR097W JJJ3 DPH4 chromosome 10 10 612413 612931 W 2011-02-03 1996-07-31 Protein of unknown function; contains a CSL Zn finger and a DnaJ-domain; involved in diphthamide biosynthesis; ortholog human Dph4 -S000035313 CDS YJR097W 10 612413 612931 W 2011-02-03 1996-07-31 -S000028456 ARS ARS1019 chromosome 10 10 612846 613278 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000003859 ORF Uncharacterized YJR098C chromosome 10 10 615156 613186 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000036139 CDS YJR098C 10 615156 613186 C 2011-02-03 1996-07-31|2011-02-03 -S000003860 ORF Verified YJR099W YUH1 ubiquitin-specific protease YUH1 chromosome 10 L000002565 10 615576 616286 W 57 2011-02-03 1996-07-31 Ubiquitin C-terminal hydrolase; cleaves ubiquitin-protein fusions to generate monomeric ubiquitin; hydrolyzes the peptide bond at the C-terminus of ubiquitin; also the major processing enzyme for the ubiquitin-like protein Rub1p -S000036337 CDS YJR099W 10 615576 616286 W 2011-02-03 1996-07-31 -S000003861 ORF Verified YJR100C AIM25 SLM35 chromosome 10 10 617334 616351 C 2011-02-03 1996-07-31 Mitochondria protein of unknown function; interacts genetically with TOR1 to regulate chronological lifespan, and the response to both heat shock and oxidative stress; involved in maintaining the integrity of the mitochondrial network; negative regulator of mitophagy flux; non-tagged protein is detected in purified mitochondria in high-throughput studies; null mutant is viable and displays an elevated frequency of mitochondrial genome loss; similar to murine NOR1 -S000033573 CDS YJR100C 10 617334 616351 C 2011-02-03 1996-07-31 -S000006654 tRNA_gene tL(UAG)J chromosome 10 L000003616 10 617919 618019 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000035855 intron tL(UAG)J 10 617957 617975 W 2011-02-03 2000-05-19 -S000035853 noncoding_exon tL(UAG)J 10 617919 617956 W 2011-02-03 2000-05-19 -S000035854 noncoding_exon tL(UAG)J 10 617976 618019 W 2011-02-03 2000-05-19 -S000003862 ORF Verified YJR101W RSM26 mitochondrial 37S ribosomal protein RSM26 chromosome 10 10 618234 619034 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000034505 CDS YJR101W 10 618234 619034 W 2011-02-03 1996-07-31 -S000003863 ORF Verified YJR102C VPS25 ESCRT-II subunit protein VPS25|VPL12|VPT25 chromosome 10 10 619765 619157 C 2011-02-03 1996-07-31 Component of the ESCRT-II complex; ESCRT-II is involved in ubiquitin-dependent sorting of proteins into the endosome -S000034557 CDS YJR102C 10 619765 619157 C 2011-02-03 1996-07-31 -S000003864 ORF Verified YJR103W URA8 CTP synthase URA8 chromosome 10 L000002437 10 620754 622490 W 2011-02-03 1996-07-31|2011-02-03 Minor CTP synthase isozyme (see also URA7); catalyzes the ATP-dependent transfer of the amide nitrogen from glutamine to UTP, forming CTP, the final step in de novo biosynthesis of pyrimidines; involved in phospholipid biosynthesis; capable of forming cytoplasmic filaments termed cytoophidium, especially during conditions of glucose depletion; URA8 has a paralog, URA7, that arose from the whole genome duplication -S000034718 CDS YJR103W 10 620754 622490 W 2011-02-03 1996-07-31|2011-02-03 -S000003865 ORF Verified YJR104C SOD1 superoxide dismutase SOD1|CRS4 chromosome 10 L000001978 10 623014 622550 C 2011-02-03 1996-07-31 Cytosolic copper-zinc superoxide dismutase; detoxifies superoxide; stabilizes Yck1p and Yck2p kinases in glucose to repress respiration; phosphorylated by Dun1p, enters nucleus under oxidative stress to promote transcription of stress response genes; human ortholog SOD1 implicated in ALS complements a null allele; abundance increases under DNA replication stress and during exposure to boric acid; localization to mitochondrial intermembrane space is modulated by MICOS complex -S000035647 CDS YJR104C 10 623014 622550 C 2011-02-03 1996-07-31 -S000003866 ORF Verified YJR105W ADO1 adenosine kinase chromosome 10 10 623581 624603 W 2011-02-03 1996-07-31 Adenosine kinase; required for the utilization of S-adenosylmethionine (AdoMet); may be involved in recycling adenosine produced through the methyl cycle -S000035831 CDS YJR105W 10 623581 624603 W 2011-02-03 1996-07-31 -S000003867 ORF Verified YJR106W ECM27 chromosome 10 L000003898 10 624838 627015 W 2011-02-03 1996-07-31|2011-02-03 Protein involved in calcium homeostasis and exit from quiescence; required for proper trehalose levels during quiescence; may play a role in cell wall biosynthesis, mutants are hypersensitive to antifungal, Papulacandin B; null mutants have increased plasmid loss; interacts with Pdr5p -S000035951 CDS YJR106W 10 624838 627015 W 2011-02-03 1996-07-31|2011-02-03 -S000003868 ORF Uncharacterized YJR107W LIH1 putative lipase chromosome 10 10 627340 628326 W 2011-02-03 1996-07-31|2011-02-03 Putative lipase -S000037815 CDS YJR107W 10 627340 628326 W 2011-02-03 1996-07-31|2011-02-03 -S000003869 ORF Verified YJR108W ABM1 chromosome 10 10 628712 629083 W 2011-02-03 1996-07-31 Protein of unknown function; required for normal microtubule organization -S000037909 CDS YJR108W 10 628712 629083 W 2011-02-03 1996-07-31 -S000003870 ORF Verified YJR109C CPA2 carbamoyl-phosphate synthase (glutamine-hydrolyzing) CPA2 chromosome 10 L000000400 10 632941 629585 C 2011-02-03 1996-07-31 Large subunit of carbamoyl phosphate synthetase; carbamoyl phosphate synthetase catalyzes a step in the synthesis of citrulline, an arginine precursor -S000029885 CDS YJR109C 10 632941 629585 C 2011-02-03 1996-07-31 -S000003871 ORF Verified YJR110W YMR1 phosphatidylinositol-3-phosphatase YMR1 chromosome 10 10 633615 635681 W 2011-02-03 1996-07-31 Phosphatidylinositol 3-phosphate (PI3P) phosphatase; involved in various protein sorting pathways, including CVT targeting and endosome to vacuole transport; has similarity to the conserved myotubularin dual specificity phosphatase family -S000037677 CDS YJR110W 10 633615 635681 W 2011-02-03 1996-07-31 -S000003872 ORF Verified YJR111C PXP2 chromosome 10 10 636706 635855 C 2011-02-03 1996-07-31 Peroxisomal matrix protein with naturally active promoter; well-conserved in fungi; localized to peroxisomes under physiological growth conditions; levels of some amino acids are altered upon both knockout and overexpression, suggesting potential involvement of Pxp2p in amino acid metabolism or related cellular metabolic processes (needs further study); GFP-fusion protein displays inherent dual localization with large proportion localizing to cytosol -S000037709 CDS YJR111C 10 636706 635855 C 2011-02-03 1996-07-31 -S000003873 ORF Verified YJR112W NNF1 MIND complex subunit NNF1 chromosome 10 L000003072 10 637030 637635 W 2011-02-03 1996-07-31 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; required for accurate chromosome segregation; complex consists of Mtw1p Including Nnf1p-Nsl1p-Dsn1p (MIND) -S000037783 CDS YJR112W 10 637030 637635 W 2011-02-03 1996-07-31 -S000028513 ORF Uncharacterized YJR112W-A chromosome 10 10 637790 638168 W 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; identified based on homology to Ashbya gossypii -S000030277 CDS YJR112W-A 10 637790 637809 W 2011-02-03 2003-07-29 -S000030278 CDS YJR112W-A 10 637859 638168 W 2011-02-03 2003-07-29 -S000030279 intron YJR112W-A 10 637810 637858 W 2011-02-03 2003-07-29 -S000003875 ORF Dubious YJR114W SRF2 chromosome 10 10 638659 639051 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RSM7/YJR113C -S000030784 CDS YJR114W 10 638659 639051 W 2011-02-03 1996-07-31 -S000003874 ORF Verified YJR113C RSM7 mitochondrial 37S ribosomal protein RSM7 chromosome 10 10 638975 638232 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S7 ribosomal protein -S000030623 CDS YJR113C 10 638975 638232 C 2011-02-03 1996-07-31 -S000003876 ORF Uncharacterized YJR115W chromosome 10 10 639942 640451 W 2011-02-03 1996-07-31 Putative protein of unknown function; YJR115W has a paralog, ECM13, that arose from the whole genome duplication -S000030893 CDS YJR115W 10 639942 640451 W 2011-02-03 1996-07-31 -S000003877 ORF Uncharacterized YJR116W TDA4 chromosome 10 10 640825 641664 W 2011-02-03 1996-07-31 Putative protein of unknown function; null mutant is sensitive to expression of the top1-T722A allele -S000031858 CDS YJR116W 10 640825 641664 W 2011-02-03 1996-07-31 -S000003878 ORF Verified YJR117W STE24 zinc metalloprotease|PIO2|AFC1 chromosome 10 L000003457 10 642007 643368 W 2011-02-03 1996-07-31 Highly conserved zinc metalloprotease; functions in two steps of a-factor maturation, C-terminal CAAX proteolysis and the first step of N-terminal proteolytic processing; cleaves both isoprenylated and non-prenylated oligopeptides; contains multiple transmembrane spans; human homolog ZMPSTE24 implicated in mandibuloacral dysplasia (MAD), and can complement yeast null mutant -S000032024 CDS YJR117W 10 642007 643368 W 2011-02-03 1996-07-31 -S000003879 ORF Verified YJR118C ILM1 chromosome 10 10 644101 643490 C 2011-02-03 1996-07-31 Protein of unknown function; may be involved in mitochondrial DNA maintenance; required for slowed DNA synthesis-induced filamentous growth -S000032105 CDS YJR118C 10 644101 643490 C 2011-02-03 1996-07-31 -S000003880 ORF Verified YJR119C JHD2 histone demethylase|KDM5 chromosome 10 10 646490 644304 C 2011-02-03 1996-07-31 JmjC domain family histone demethylase; promotes global demethylation of H3K4 and repression of noncoding intergenic transcription during sporulation; removes methyl groups added by Set1p methyltransferase; negatively regulated by H3K14 acetylation; protein levels regulated by Not4p polyubiquitin-mediated degradation; regulates sporulation timing by extending period of active transcription in opposition to programmed global transcriptional quiescence; regulates rDNA silencing -S000034072 CDS YJR119C 10 646490 644304 C 2011-02-03 1996-07-31 -S000003881 ORF Verified YJR120W chromosome 10 10 647126 647476 W 2011-02-03 1996-07-31 Protein of unknown function; essential for growth under anaerobic conditions; mutation causes decreased expression of ATP2, impaired respiration, defective sterol uptake, and altered levels/localization of ABC transporters Aus1p and Pdr11p -S000032979 CDS YJR120W 10 647126 647476 W 2011-02-03 1996-07-31 -S000003882 ORF Verified YJR121W ATP2 F1F0 ATP synthase subunit beta chromosome 10 L000000142 10 647607 649142 W 2011-02-03 1996-07-31 Beta subunit of the F1 sector of mitochondrial F1F0 ATP synthase; which is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated -S000033071 CDS YJR121W 10 647607 649142 W 2011-02-03 1996-07-31 -S000003883 ORF Verified YJR122W IBA57 CAF17 chromosome 10 L000003419 10 649776 651269 W 2011-02-03 1996-07-31 Protein involved in incorporating iron-sulfur clusters into proteins; mitochondrial matrix protein; involved in the incorporation of iron-sulfur clusters into mitochondrial aconitase-type proteins; activates the radical-SAM family members Bio2p and Lip5p; interacts with Ccr4p in the two-hybrid system -S000033750 CDS YJR122W 10 649776 651269 W 2011-02-03 1996-07-31 -S000003884 ORF Verified YJR123W RPS5 uS7|ribosomal 40S subunit protein S5|S7|rp14|YS8|S5|S2 chromosome 10 L000002821 10 651901 652578 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; least basic of non-acidic ribosomal proteins; phosphorylated in vivo; essential for viability; homologous to mammalian ribosomal protein S5 and bacterial S7 -S000033852 CDS YJR123W 10 651901 652578 W 2011-02-03 1996-07-31 -S000003885 ORF Uncharacterized YJR124C chromosome 10 10 654238 652892 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression induced under calcium shortage -S000033876 CDS YJR124C 10 654238 652892 C 2011-02-03 1996-07-31 -S000028457 ARS ARS1020 ARSX-654 chromosome 10 10 654375 654614 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000003886 ORF Verified YJR125C ENT3 chromosome 10 10 655963 654737 C 2011-02-03 1996-07-31 Protein containing an N-terminal epsin-like domain; involved in clathrin recruitment and traffic between the Golgi and endosomes; associates with the clathrin adaptor Gga2p -S000034017 CDS YJR125C 10 655963 654737 C 2011-02-03 1996-07-31 -S000003887 ORF Verified YJR126C VPS70 putative zinc metalloprotease chromosome 10 10 658689 656254 C 2011-02-03 1996-07-31 Protein of unknown function involved in vacuolar protein sorting; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000034920 CDS YJR126C 10 658689 656254 C 2011-02-03 1996-07-31 -S000003889 ORF Dubious YJR128W chromosome 10 10 662921 663280 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RSF2 -S000036069 CDS YJR128W 10 662921 663280 W 2011-02-03 1996-07-31 -S000003888 ORF Verified YJR127C RSF2 ZMS1 chromosome 10 L000002569 10 663059 658917 C 2011-02-03 1996-07-31 Zinc-finger protein; involved in transcriptional control of both nuclear and mitochondrial genes, many of which specify products required for glycerol-based growth, respiration, and other functions; RSF2 has a paralog, TDA9, that arose from the whole genome duplication; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000035071 CDS YJR127C 10 663059 658917 C 2011-02-03 1996-07-31 -S000006492 snoRNA_gene snR3 SNR3 chromosome 10 L000001958 10 663749 663942 W 2011-02-03 2000-05-19|2007-05-08 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U2129, U2133, and U2264 -S000034301 noncoding_exon snR3 10 663749 663942 W 2011-02-03 2000-05-19|2007-05-08 -S000003890 ORF Verified YJR129C EFM3 protein-lysine N-methyltransferase chromosome 10 10 665019 664000 C 2011-02-03 1996-07-31|2011-02-03 S-adenosylmethionine-dependent methyltransferase; seven-beta-strand lysine methyltransferase which trimethylates translation elongation factor EF2 (Eft1p and Eft2p) at lysine 509; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; ortholog of human gene FAM86A -S000036155 CDS YJR129C 10 665019 664000 C 2011-02-03 1996-07-31|2011-02-03 -S000003891 ORF Verified YJR130C STR2 cystathionine gamma-synthase chromosome 10 10 667137 665218 C 2011-02-03 1996-07-31 Cystathionine gamma-synthase, converts cysteine into cystathionine; STR2 has a paralog, YML082W, that arose from the whole genome duplication -S000036945 CDS YJR130C 10 667137 665218 C 2011-02-03 1996-07-31 -S000003892 ORF Verified YJR131W MNS1 mannosyl-oligosaccharide 1,2-alpha-mannosidase chromosome 10 L000001130 10 667644 669293 W 2011-02-03 1996-07-31 Alpha-1,2-mannosidase; involved in ER-associated protein degradation (ERAD); catalyzes the removal of one mannose residue from a glycosylated protein, converting the modification from Man9GlcNAc to Man8GlcNAc; catalyzes the last step in glycoprotein maturation in the ER and is critical for ER protein degradation -S000037068 CDS YJR131W 10 667644 669293 W 2011-02-03 1996-07-31 -S000003893 ORF Verified YJR132W NMD5 KAP119 chromosome 10 L000002939 10 669522 672668 W 2011-02-03 1996-07-31|2011-02-03 Karyopherin; a carrier protein involved in nuclear import of proteins; importin beta homolog -S000037153 CDS YJR132W 10 669522 672668 W 2011-02-03 1996-07-31|2011-02-03 -S000003894 ORF Verified YJR133W XPT1 xanthine phosphoribosyltransferase chromosome 10 10 672991 673620 W 2011-02-03 1996-07-31 Xanthine-guanine phosphoribosyl transferase; required for xanthine utilization and for optimal utilization of guanine -S000037899 CDS YJR133W 10 672991 673620 W 2011-02-03 1996-07-31 -S000003895 ORF Verified YJR134C SGM1 chromosome 10 10 675852 673729 C 2011-02-03 1996-07-31 Protein of unknown function; required for wild-type growth rate on galactose and mannose; localizes to COPI coated vesicles and the Golgi apparatus -S000029858 CDS YJR134C 10 675852 673729 C 2011-02-03 1996-07-31 -S000003896 ORF Verified YJR135C MCM22 chromosome 10 L000003999 10 676778 676059 C 2011-02-03 1996-07-31 Outer kinetochore protein and component of the Ctf3 subcomplex; binds to centromeric DNA in a Ctf19p-dependent manner; involved in chromosome segregation and minichromosome maintenance; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-K and fission yeast sim4 -S000030000 CDS YJR135C 10 676778 676059 C 2011-02-03 1996-07-31 -S000007348 ORF Verified YJR135W-A TIM8 protein transporter TIM8 chromosome 10 10 676971 677234 W 2011-02-03 1999-07-17 Mitochondrial intermembrane space protein; forms a complex with Tim13p that delivers a subset of hydrophobic proteins to the TIM22 complex for inner membrane insertion; homolog of human TIMM8A, implicated in Mohr-Tranebjaerg syndrome, also known as deafness-dystonia-optic neuronopathy (DDON) syndrome; human TIMM8A can complement yeast null mutant -S000032075 CDS YJR135W-A 10 676971 677234 W 2011-02-03 1999-07-17 -S000003897 ORF Verified YJR136C TTI2 chromosome 10 10 678706 677441 C 2011-02-03 1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; telomere length regulator involved in the stability or biogenesis of PIKKs such as TORC1; involved in the cellular stress response; similar to S. pombe Tti2p; may interact with Rsm23p; GFP-fusion protein localizes to the cytoplasm -S000030982 CDS YJR136C 10 678706 677441 C 2011-02-03 1996-07-31 -S000003898 ORF Verified YJR137C MET5 sulfite reductase (NADPH) subunit beta|ECM17 chromosome 10 L000001080|L000003892 10 683285 678957 C 84 2011-02-03 1996-07-31 Sulfite reductase beta subunit; involved in amino acid biosynthesis, transcription repressed by methionine -S000031082 CDS YJR137C 10 683285 678957 C 2011-02-03 1996-07-31 -S000007553 ARS ARS1021 ARS121 chromosome 10 10 684009 684098 2014-11-18 2000-10-17|2014-11-18 Autonomously Replicating Sequence -S000003899 ORF Verified YJR138W IML1 SEA1 chromosome 10 10 684567 689321 W 2011-02-03 1996-07-31|2011-02-03 GTPase-activating protein (GAP) subunit of the Iml1p/SEACIT complex; SEACIT (Iml1p-Npr2p-Npr3p) is a subcomplex of the SEA complex, a coatomer-related complex that associates dynamically with the vacuole; Iml1p functions in the SEACIT complex as a GAP for the Rag family GTPase Gtr1p (EGOC subunit), resulting in the inhibition of TORC1 signaling in response to amino acid deprivation; the Iml1p/SEACIT complex is required for non-nitrogen-starvation (NNS)-induced autophagy -S000031284 CDS YJR138W 10 684567 689321 W 2011-02-03 1996-07-31|2011-02-03 -S000003900 ORF Verified YJR139C HOM6 homoserine dehydrogenase|THR6 chromosome 10 L000000801 10 690524 689445 C 87 2011-02-03 1996-07-31 Homoserine dehydrogenase (L-homoserine:NADP oxidoreductase); dimeric enzyme that catalyzes the third step in the common pathway for methionine and threonine biosynthesis; enzyme has nucleotide-binding, dimerization and catalytic regions -S000032214 CDS YJR139C 10 690524 689445 C 2011-02-03 1996-07-31 -S000028666 ORF Dubious YJR140W-A chromosome 10 10 690961 691110 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene HIR3; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032491 CDS YJR140W-A 10 690961 691110 W 2011-02-03 2003-07-29 -S000003901 ORF Verified YJR140C HIR3 HPC1 chromosome 10 L000003127 10 695696 690750 C 2011-02-03 1996-07-31 Subunit of the HIR complex; a nucleosome assembly complex involved in regulation of histone gene transcription; involved in position-dependent gene silencing and nucleosome reassembly; ortholog of human CABIN1 protein -S000032216 CDS YJR140C 10 695696 690750 C 2011-02-03 1996-07-31 -S000003902 ORF Uncharacterized YJR141W IPA1 putative polyadenylation protein chromosome 10 10 695906 696949 W 2011-02-03 1996-07-31 Essential protein of unknown function -S000033127 CDS YJR141W 10 695906 696949 W 2011-02-03 1996-07-31 -S000003903 ORF Verified YJR142W chromosome 10 10 697141 698169 W 2011-02-03 1996-07-31 8-oxo-dGTP diphosphatase of the Nudix hydrolase family; converts diphosphates of damaged forms of thiamin to monophosphates; GST fusion protein is a Dbf2p-Mob1p phosphorylation target in a proteome chip analysis; synthetic lethal with PH085 deletion; plays a role in restricting Ty1 transposition -S000033186 CDS YJR142W 10 697141 698169 W 2011-02-03 1996-07-31 -S000003904 ORF Verified YJR143C PMT4 dolichyl-phosphate-mannose-protein mannosyltransferase chromosome 10 L000002623 10 700614 698326 C 2011-02-03 1996-07-31 Protein O-mannosyltransferase; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; appears to form homodimers in vivo and does not complex with other Pmt proteins; target for new antifungals -S000033214 CDS YJR143C 10 700614 698326 C 2011-02-03 1996-07-31 -S000003905 ORF Verified YJR144W MGM101 MGM9 chromosome 10 L000001104 10 700882 701691 W 2011-02-03 1996-07-31 Protein with a role in mitochondrial DNA recombinational repair; also involved in interstrand cross-link repair; binds to and catalyzes the annealing of single-stranded mtDNA; oligomerizes to form rings and filaments; related to Rad52-type recombination proteins, with limited overall similarity but sharing conserved functionally important residues; component of the mitochondrial nucleoid, required for the repair of oxidative mtDNA damage and mitochondrial genome maintenance -S000033297 CDS YJR144W 10 700882 701691 W 2011-02-03 1996-07-31 -S000003906 ORF Verified YJR145C RPS4A eS4|ribosomal 40S subunit protein S4A|S4e|rp5|YS6|S7A|S4A chromosome 10 L000001751 10 703068 702027 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; mutation affects 20S pre-rRNA processing; homologous to mammalian ribosomal protein S4, no bacterial homolog; RPS4A has a paralog, RPS4B, that arose from the whole genome duplication -S000034116 CDS YJR145C 10 702798 702027 C 2011-02-03 1996-07-31 -S000034115 CDS YJR145C 10 703068 703055 C 2011-02-03 1996-07-31 -S000034117 intron YJR145C 10 703054 702799 C 2011-02-03 1996-07-31 -S000003907 ORF Uncharacterized YJR146W chromosome 10 10 703885 704238 W 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; partially overlaps HMS2 -S000034307 CDS YJR146W 10 703885 704238 W 2011-02-03 1996-07-31 -S000003908 ORF Verified YJR147W HMS2 chromosome 10 L000004442 10 704196 705272 W 2011-02-03 1996-07-31 Protein with similarity to heat shock transcription factors; overexpression suppresses the pseudohyphal filamentation defect of a diploid mep1 mep2 homozygous null mutant; HMS2 has a paralog, SKN7, that arose from the whole genome duplication -S000034417 CDS YJR147W 10 704196 705272 W 2011-02-03 1996-07-31 -S000003909 ORF Verified YJR148W BAT2 branched-chain-amino-acid transaminase BAT2|ECA40|TWT2 chromosome 10 L000003082 10 705744 706874 W 2011-02-03 1996-07-31 Cytosolic branched-chain amino acid (BCAA) aminotransferase; preferentially involved in BCAA catabolism; homolog of murine ECA39; highly expressed during stationary phase and repressed during logarithmic phase; BAT2 has a paralog, BAT1, that arose from the whole genome duplication -S000035457 CDS YJR148W 10 705744 706874 W 2011-02-03 1996-07-31 -S000003910 ORF Uncharacterized YJR149W putative nitronate monooxygenase chromosome 10 10 707160 708374 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000035545 CDS YJR149W 10 707160 708374 W 2011-02-03 1996-07-31|2011-02-03 -S000003911 ORF Verified YJR150C DAN1 CCW13 chromosome 10 L000003381 10 709707 708811 C 2011-02-03 1996-07-31|2011-02-03 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; expressed under anaerobic conditions, completely repressed during aerobic growth -S000036513 CDS YJR150C 10 709707 708811 C 2011-02-03 1996-07-31|2011-02-03 -S000028458 ARS ARS1022 ARSX-712 chromosome 10 10 711896 712142 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000003912 ORF Verified YJR151C DAN4 chromosome 10 10 715740 712255 C 2011-02-03 1996-07-31|2011-02-03 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; expressed under anaerobic conditions, completely repressed during aerobic growth -S000036600 CDS YJR151C 10 715740 712255 C 2011-02-03 1996-07-31|2011-02-03 -S000028557 ORF Uncharacterized YJR151W-A chromosome 10 10 717580 717630 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR; predicted to have a role in transcription based on computational "guilt by association" analysis -S000031243 CDS YJR151W-A 10 717580 717630 W 2011-02-03 2003-07-29 -S000003913 ORF Verified YJR152W DAL5 allantoate permease|UREP1 chromosome 10 L000000478 10 719666 721297 W 97 2011-02-03 1996-07-31 Allantoate permease; ureidosuccinate permease; also transports dipeptides, though with lower affinity than for allantoate and ureidosuccinate; expression is constitutive but sensitive to nitrogen catabolite repression -S000037362 CDS YJR152W 10 719666 721297 W 2011-02-03 1996-07-31 -S000003914 ORF Verified YJR153W PGU1 PSM1|PGL1 chromosome 10 L000004371|L000004261 10 722815 723900 W 2011-02-03 1996-07-31 Endo-polygalacturonase; pectolytic enzyme that hydrolyzes the alpha-1,4-glycosidic bonds in the rhamnogalacturonan chains in pectins -S000037481 CDS YJR153W 10 722815 723900 W 2011-02-03 1996-07-31 -S000003915 ORF Uncharacterized YJR154W chromosome 10 10 725784 726824 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000030205 CDS YJR154W 10 725784 726824 W 2011-02-03 1996-07-31 -S000003916 ORF Verified YJR155W AAD10 putative aryl-alcohol dehydrogenase chromosome 10 L000004639 10 727405 728271 W 2011-02-03 1996-07-31 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family -S000030387 CDS YJR155W 10 727405 728271 W 2011-02-03 1996-07-31 -S000003917 ORF Verified YJR156C THI11 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 10 L000003222 10 729596 728574 C 2011-02-03 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP -S000030438 CDS YJR156C 10 729596 728574 C 2011-02-03 1996-07-31 -S000028459 ARS ARS1023 chromosome 10 10 729983 730513 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000003918 ORF Dubious YJR157W chromosome 10 10 730515 730877 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031435 CDS YJR157W 10 730515 730877 W 2011-02-03 1996-07-31 -S000003919 ORF Verified YJR158W HXT16 HLT3|hexose transporter HXT16 chromosome 10 L000003264 10 732440 734143 W 2011-02-03 1996-07-31 Putative transmembrane polyol transporter; supports growth on and uptake of sorbitol with moderate affinity and mannitol with lower affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; similarity to hexose transporters; expression is repressed by high levels of glucose -S000031532 CDS YJR158W 10 732440 734143 W 2011-02-03 1996-07-31 -S000003920 ORF Verified YJR159W SOR1 L-iditol 2-dehydrogenase SOR1|SDH1 chromosome 10 L000002753 10 736044 737117 W 2011-02-03 1996-07-31 Sorbitol dehydrogenase; protein sequence is 99% identical to the Sor2p sorbitol dehydrogenase; expression is induced in the presence of sorbitol or xylose -S000031666 CDS YJR159W 10 736044 737117 W 2011-02-03 1996-07-31 -S000028460 ARS ARS1024 ARSX-737 chromosome 10 10 737034 737275 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence -S000003921 ORF Verified YJR160C MPH3 alpha-glucoside permease chromosome 10 10 739816 738008 C 2011-02-03 1996-07-31 Alpha-glucoside permease; transports maltose, maltotriose, alpha-methylglucoside, and turanose; identical to Mph2p; encoded in a subtelomeric position in a region likely to have undergone duplication -S000031772 CDS YJR160C 10 739816 738008 C 2011-02-03 1996-07-31 -S000003922 ORF Verified YJR161C COS5 chromosome 10 L000004063 10 743999 742848 C 2011-02-03 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000031918 CDS YJR161C 10 743999 742848 C 2011-02-03 1996-07-31 -S000028461 ARS ARS1025 chromosome 10 10 744408 745008 2011-02-03 2002-12-16 Autonomously Replicating Sequence -S000178126 ARS_consensus_sequence ARS1025 10 744632 744648 W 2014-11-18 2014-11-18 -S000028974 telomere TEL10R chromosome 10 10 744902 745751 W 100 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome X; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028975 telomeric_repeat TEL10R 10 745663 745751 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome X -S000028976 X_element TEL10R 10 744902 745361 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome X; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YJR162C -S000028977 X_element_combinatorial_repeat TEL10R 10 745362 745662 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr X; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000003923 ORF Dubious YJR162C chromosome 10 10 745261 744911 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032831 CDS YJR162C 10 745261 744911 C 2011-02-03 1996-07-31 -S000001708 ORF Dubious YKL225W chromosome 11 11 451 798 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032685 CDS YKL225W 11 451 798 W 2011-02-03 1996-07-31 -S000028906 telomere TEL11L chromosome 11 11 807 1 C -162 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the left arm of Chromosome XI; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028907 telomeric_repeat TEL11L 11 67 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XI -S000028908 X_element TEL11L 11 807 347 C 2011-02-03 2003-09-09|2011-02-03 Telomeric X element Core sequence on the left arm of Chromosome XI; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YKL225W -S000028909 X_element_combinatorial_repeat TEL11L 11 346 68 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XI; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000001707 ORF Verified YKL224C PAU16 seripauperin PAU16 chromosome 11 11 2181 1810 C 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole -S000031625 CDS YKL224C 11 2181 1810 C 2011-02-03 1996-07-31 -S000001706 ORF Dubious YKL223W chromosome 11 11 2389 2721 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031556 CDS YKL223W 11 2389 2721 W 2011-02-03 1996-07-31 -S000001705 ORF Verified YKL222C chromosome 11 11 5620 3503 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; similar to transcriptional regulators from the zinc cluster (binuclear cluster) family; null mutant is sensitive to caffeine -S000031466 CDS YKL222C 11 5620 3503 C 2011-02-03 1996-07-31 -S000001704 ORF Verified YKL221W MCH2 chromosome 11 11 6107 7528 W 2011-02-03 1996-07-31|2011-02-03 Protein with similarity to mammalian monocarboxylate permeases; monocarboxylate permeases are involved in transport of monocarboxylic acids across the plasma membrane but mutant is not deficient in monocarboxylate transport -S000031419 CDS YKL221W 11 6107 7528 W 2011-02-03 1996-07-31|2011-02-03 -S000130137 ARS ARS1102 ARSXI-8 chromosome 11 11 7528 8309 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001703 ORF Verified YKL220C FRE2 ferric/cupric-chelate reductase chromosome 11 L000002805 11 11226 9091 C 2011-02-03 1996-07-31 Ferric reductase and cupric reductase; reduces siderophore-bound iron and oxidized copper prior to uptake by transporters; expression induced by low iron levels but not by low copper levels -S000031305 CDS YKL220C 11 11226 9091 C 2011-02-03 1996-07-31 -S000001702 ORF Verified YKL219W COS9 chromosome 11 L000004067 11 14485 15708 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000030515 CDS YKL219W 11 14485 15708 W 1996-07-31 1996-07-31 -S000001701 ORF Verified YKL218C SRY1 threo-3-hydroxy-L-aspartate ammonia-lyase SRY1 chromosome 11 S000007485 11 18339 17359 C 1996-07-31 1996-07-31 3-hydroxyaspartate dehydratase; deaminates L-threo-3-hydroxyaspartate to form oxaloacetate and ammonia; required in the presence of hydroxyaspartate; highly similar to mouse serine racemase (Srr) but has no serine racemase activity -S000037646 CDS YKL218C 11 18339 17359 C 1996-07-31 1996-07-31 -S000001700 ORF Verified YKL217W JEN1 chromosome 11 L000002666 11 22234 24084 W 1996-07-31 1996-07-31 Monocarboxylate/proton symporter of the plasma membrane; transport activity is dependent on the pH gradient across the membrane; mediates high-affinity uptake of carbon sources lactate, pyuvate, and acetate, and also of the micronutrient selenite, whose structure mimics that of monocarboxylates; expression and localization are tightly regulated, with transcription repression, mRNA degradation, and protein endocytosis and degradation all occurring in the presence of glucose -S000037602 CDS YKL217W 11 22234 24084 W 1996-07-31 1996-07-31 -S000001699 ORF Verified YKL216W URA1 dihydroorotate dehydrogenase chromosome 11 L000002430 11 25215 26159 W -159.7 2011-02-03 1996-07-31 Dihydroorotate dehydrogenase; catalyzes the fourth enzymatic step in the de novo biosynthesis of pyrimidines, converting dihydroorotic acid into orotic acid -S000037467 CDS YKL216W 11 25215 26159 W 2011-02-03 1996-07-31 -S000001698 ORF Verified YKL215C OXP1 5-oxoprolinase chromosome 11 11 30687 26827 C 2011-02-03 1996-07-31 5-oxoprolinase; enzyme is ATP-dependent and functions as a dimer; similar to mouse Oplah gene; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; protein abundance increases in response to DNA replication stress -S000036677 CDS YKL215C 11 30687 26827 C 2011-02-03 1996-07-31 -S000001697 ORF Verified YKL214C YRA2 chromosome 11 11 31693 31082 C 2011-02-03 1996-07-31 Member of the REF (RNA and export factor binding proteins) family; when overexpressed, can substitute for the function of Yra1p in export of poly(A)+ mRNA from the nucleus -S000036577 CDS YKL214C 11 31693 31082 C 2011-02-03 1996-07-31 -S000001696 ORF Verified YKL213C DOA1 ZZZ4|UFD3 chromosome 11 L000002961 11 34107 31960 C 2011-02-03 1996-07-31 WD repeat protein required for ubiquitin-mediated protein degradation; ubiquitin binding cofactor that complexes with Cdc48p; required for ribophagy; controls cellular ubiquitin concentration; promotes efficient NHEJ in postdiauxic/stationary phase; facilitates N-terminus-dependent proteolysis of centromeric histone H3 (Cse4p) for faithful chromosome segregation; protein increases in abundance and relocalizes from nucleus to nuclear periphery upon DNA replication stress -S000036488 CDS YKL213C 11 34107 31960 C 2011-02-03 1996-07-31 -S000001695 ORF Verified YKL212W SAC1 phosphatidylinositol-3-phosphatase SAC1|RSD1 chromosome 11 L000001790 11 34543 36414 W -153.8 2011-02-03 1996-07-31 Phosphatidylinositol phosphate (PtdInsP) phosphatase; involved in hydrolysis of PtdIns[4]P in the early and medial Golgi; regulated by interaction with Vps74p; ER localized transmembrane protein which cycles through the Golgi; involved in protein trafficking and processing, secretion, and cell wall maintenance; regulates sphingolipid biosynthesis through the modulation of PtdIns(4)P metabolism -S000036459 CDS YKL212W 11 34543 36414 W 2011-02-03 1996-07-31 -S000001694 ORF Verified YKL211C TRP3 bifunctional anthranilate synthase/indole-3-glycerol-phosphate synthase chromosome 11 L000002354 11 38153 36699 C -153.8 2011-02-03 1996-07-31 Indole-3-glycerol-phosphate synthase; forms bifunctional hetero-oligomeric anthranilate synthase:indole-3-glycerol phosphate synthase enzyme complex with Trp2p -S000035520 CDS YKL211C 11 38153 36699 C 2011-02-03 1996-07-31 -S000006455 snoRNA_gene snR64 SNR64 chromosome 11 L000004533 11 38811 38911 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2337 -S000030843 noncoding_exon snR64 11 38811 38911 W 2011-02-03 2000-05-19 -S000001693 ORF Verified YKL210W UBA1 E1 ubiquitin-activating protein UBA1 chromosome 11 L000002405 11 39163 42237 W -153.3 2011-02-03 1996-07-31 Ubiquitin activating enzyme (E1); involved in ubiquitin-mediated protein degradation and essential for viability; protein abundance increases in response to DNA replication stress -S000035493 CDS YKL210W 11 39163 42237 W 2011-02-03 1996-07-31 -S000001692 ORF Verified YKL209C STE6 ATP-binding cassette a-factor transporter STE6 chromosome 11 L000002116 11 46295 42423 C -152.3 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; required for the export of a-factor, catalyzes ATP hydrolysis coupled to a-factor transport; contains 12 transmembrane domains and two ATP binding domains; expressed only in MATa cells; human homolog ABCB1 mediates multidrug resistance in many chemotherapy-resistant tumors by effluxing toxic compounds from the cell -S000035512 CDS YKL209C 11 46295 42423 C 2011-02-03 1996-07-31 -S000006748 tRNA_gene tT(CGU)K TRT2 chromosome 11 L000003644 11 46806 46735 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis; correct folding and efficient aminoacylation require Lhp1p -S000032223 noncoding_exon tT(CGU)K 11 46806 46735 C 2011-02-03 2000-05-19 -S000001691 ORF Verified YKL208W CBT1 SOC1 chromosome 11 L000004295|S000029465|L000004597 11 47157 47972 W 2011-02-03 1996-07-31 Protein involved in 5' RNA end processing; substrates include mitochondrial COB, 15S_rRNA, and RPM1 transcripts; may also have a role in 3' end processing of the COB pre-mRNA; displays genetic interaction with cell cycle-regulated kinase Dbf2p -S000034559 CDS YKL208W 11 47157 47972 W 2011-02-03 1996-07-31 -S000001690 ORF Verified YKL207W EMC3 AIM27|LRC3 chromosome 11 11 48194 48955 W 2011-02-03 2004-02-13|1996-07-31|2006-05-08 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; required for respiratory growth; null mutant displays induction of the unfolded protein response; homologous to worm Y62E10A.10/EMC-3, fly CG6750, human TMEM111 -S000034425 CDS YKL207W 11 48194 48955 W 2011-02-03 2004-02-13|1996-07-31|2006-05-08 -S000001689 ORF Verified YKL206C ADD66 POC2|PBA2 chromosome 11 11 49809 49006 C 2011-02-03 1996-07-31 Protein involved in 20S proteasome assembly; forms a heterodimer with Pba1p that binds to proteasome precursors; interaction with Pba1p-Add66p may affect function of the mature proteasome and its role in maintaining respiratory metabolism; similar to human PAC2 constituent of the PAC1-PAC2 complex involved in proteasome assembly -S000034304 CDS YKL206C 11 49809 49006 C 2011-02-03 1996-07-31 -S000001688 ORF Verified YKL205W LOS1 Ran GTPase-binding protein LOS1 chromosome 11 L000000950 11 50051 53353 W -149.7 2011-02-03 1996-07-31 Nuclear pore protein; involved in nuclear export of pre-tRNA and in re-export of mature tRNAs after their retrograde import from the cytoplasm; deletion mutation extends replicative lifespan, as does exclusion of Los1p from the nucleus in response to caloric restriction -S000034266 CDS YKL205W 11 50051 53353 W 2011-02-03 1996-07-31 -S000001687 ORF Verified YKL204W EAP1 chromosome 11 11 53704 55602 W 2011-02-03 1996-07-31 eIF4E-associated protein, competes with eIF4G for binding to eIF4E; accelerates mRNA degradation by promoting decapping, facilitated by interaction with eIF4E; essential for Puf5p mediated repression; associates with Puf5p and Dhh1p; inhibits cap-dependent translation; functions independently of eIF4E to maintain genetic stability; plays a role in cell growth, implicated in the TOR signaling cascade -S000033363 CDS YKL204W 11 53704 55602 W 2011-02-03 1996-07-31 -S000118401 ARS ARS1103 ARSXI-56 chromosome 11 11 55671 55917 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178127 ARS_consensus_sequence ARS1103 11 55867 55851 C 2014-11-18 2014-11-18 -S000001686 ORF Verified YKL203C TOR2 phosphatidylinositol kinase-related protein kinase TOR2|DRR2 chromosome 11 L000002323 11 63359 55935 C -152.3 2011-02-03 2004-02-13|1996-07-31 PIK-related protein kinase and rapamycin target; subunit of TORC1, a complex that regulates growth in response to nutrients and TORC2, a complex that regulates cell-cycle dependent polarization of the actin cytoskeleton; involved in meiosis; TOR2 has a paralog, TOR1, that arose from the whole genome duplication -S000033266 CDS YKL203C 11 63359 55935 C 2011-02-03 2004-02-13|1996-07-31 -S000001685 ORF Dubious YKL202W chromosome 11 11 63821 64402 W 2011-02-03 2001-05-31|1996-07-31|1999-03-12 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033230 CDS YKL202W 11 63821 64402 W 2011-02-03 2001-05-31|1996-07-31|1999-03-12 -S000001684 ORF Verified YKL201C MNN4 YKL200C chromosome 11 L000001128 11 67466 63930 C -132.6 2011-02-03 2001-05-31|1996-07-31|1999-03-12 Putative positive regulator of mannosylphosphate transferase Mnn6p; involved in mannosylphosphorylation of N-linked oligosaccharides; expression increases in late-logarithmic and stationary growth phases; coding sequence contains length polymorphisms in different strains; MNN4 has a paralog, YJR061W, that arose from the whole genome duplication -S000032315 CDS YKL201C 11 67466 63930 C 2011-02-03 2001-05-31|1999-03-12|1996-07-31 -S000001681 ORF Verified YKL198C PTK1 putative serine/threonine protein kinase PTK1|POT1|YKT9|YKL199C|STK1|KKT8 chromosome 11 L000003491 11 70220 68232 C 2011-02-03 2003-01-08|1999-03-12|1996-07-31|2011-02-03 Putative serine/threonine protein kinase; regulates spermine uptake; involved in polyamine transport; possible mitochondrial protein; PTK1 has a paralog, PTK2, that arose from the whole genome duplication -S000034854 CDS YKL198C 11 70220 68232 C 2011-02-03 2003-01-08|1996-07-31|1999-03-12|2011-02-03 -S000001680 ORF Verified YKL197C PEX1 AAA family ATPase peroxin 1|PAS1 chromosome 11 L000001337 11 73865 70734 C 2011-02-03 1996-07-31 AAA-peroxin; heterodimerizes with AAA-peroxin Pex6p and participates in the recycling of peroxisomal signal receptor Pex5p from the peroxisomal membrane to the cystosol; induced by oleic acid and upregulated during anaerobiosis; mutations in human PEX1 can lead to severe peroxisomal disorders and early death -S000033983 CDS YKL197C 11 73865 70734 C 2011-02-03 1996-07-31 -S000007055 long_terminal_repeat YKLWdelta1 chromosome 11 11 74236 74518 W 2011-02-03 2000-05-19 Ty1 LTR -S000006671 tRNA_gene tN(GUU)K chromosome 11 L000003629 11 74624 74697 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000030740 noncoding_exon tN(GUU)K 11 74624 74697 W 2011-02-03 2000-05-19 -S000001679 ORF Verified YKL196C YKT6 palmitoyltransferase YKT6 chromosome 11 L000004163 11 75534 74932 C 2011-02-03 1996-07-31 Vesicle membrane protein (v-SNARE) with acyltransferase activity; involved in trafficking to and within the Golgi, endocytic trafficking to the vacuole, and vacuolar fusion; membrane localization due to prenylation at the carboxy-terminus; human homolog YKT6 can complement yeast ykt6 mutant -S000033862 CDS YKL196C 11 75534 74932 C 2011-02-03 1996-07-31 -S000001678 ORF Verified YKL195W MIA40 TIM40|FMP15 chromosome 11 11 75821 77032 W 2011-02-03 2003-09-22|1996-07-31 Import and assembly protein in mitochondrial intermembrane space; component of MIA pathway which mediates import and oxidative folding of substrates including small proteins containing twin cysteine motifs; acts in concert with Erv1p, which oxidizes the cysteine residues of Mia40p to comprise a disulfide relay system that catalyzes import; also mediates folding of Atp23p via a chaperone-like activity; forms a dimer that binds iron-sulfur cluster in vitro -S000033827 CDS YKL195W 11 75821 77032 W 2011-02-03 2003-09-22|1996-07-31 -S000001677 ORF Verified YKL194C MST1 threonine--tRNA ligase MST1 chromosome 11 L000001207 11 78646 77258 C 2011-02-03 1996-07-31 Mitochondrial threonyl-tRNA synthetase; aminoacylates both the canonical threonine tRNA tT(UGU)Q1 and the unusual threonine tRNA tT(UAG)Q2 in vitro; lacks a typical editing domain, but has pre-transfer editing activity stimulated by the unusual tRNA-Thr -S000030386 CDS YKL194C 11 78646 77258 C 2011-02-03 1996-07-31 -S000001676 ORF Verified YKL193C SDS22 type 1 protein phosphatase-activating protein SDS22|EGP1 chromosome 11 L000002590 11 79882 78866 C 2011-02-03 1996-07-31 Regulatory subunit of the type 1 protein phosphatase (PP1) Glc7p; whether it functions as a positive or negative regulator of Glc7p is controversial; involved in the regulation of Glc7p nuclear localization and function -S000030304 CDS YKL193C 11 79882 78866 C 2011-02-03 1996-07-31 -S000001675 ORF Verified YKL192C ACP1 acyl carrier protein chromosome 11 L000004843 11 80537 80160 C 2011-02-03 1996-07-31 Mitochondrial matrix acyl carrier protein; involved in biosynthesis of octanoate, which is a precursor to lipoic acid; activated by phosphopantetheinylation catalyzed by Ppt2p -S000030104 CDS YKL192C 11 80537 80160 C 2011-02-03 1996-07-31 -S000001674 ORF Verified YKL191W DPH2 chromosome 11 L000000522 11 81035 82639 W 2011-02-03 1996-07-31 Protein required for synthesis of diphthamide; required along with Dph1p, Kti11p, Jjj3p, and Dph5p; diphthamide is a modified histidine residue of translation elongation factor 2 (Eft1p or Eft2p); may act in a complex with Dph1p and Kti11p -S000030067 CDS YKL191W 11 81035 82639 W 2011-02-03 1996-07-31 -S000001673 ORF Verified YKL190W CNB1 calcineurin regulatory subunit B|YCN2|CRV1 chromosome 11 L000000371 11 82947 83550 W 2011-02-03 1996-07-31 Calcineurin B; regulatory subunit of calcineurin, a Ca++/calmodulin-regulated type 2B protein phosphatase which regulates Crz1p (stress-response transcription factor); other calcineurin subunit encoded by CNA1 and/or CMP1; regulates function of Aly1p alpha-arrestin; myristoylation by Nmt1p reduces calcineurin activity in response to submaximal Ca signals, is needed to prevent constitutive phosphatase activity; protein abundance increases in response to DNA replication stress -S000029989 CDS YKL190W 11 82947 82998 W 2011-02-03 1996-07-31 -S000029990 CDS YKL190W 11 83075 83550 W 2011-02-03 1996-07-31 -S000029991 intron YKL190W 11 82999 83074 W 2011-02-03 1996-07-31 -S000007050 long_terminal_repeat YKLCdelta2 chromosome 11 11 84115 83808 C 2011-02-03 2000-05-19 Ty1 LTR -S000006651 tRNA_gene tL(UAA)K chromosome 11 L000003630 11 84208 84291 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000037408 noncoding_exon tL(UAA)K 11 84208 84291 W 2011-02-03 2000-05-19 -S000001672 ORF Verified YKL189W HYM1 chromosome 11 L000004365 11 84704 85903 W 2011-02-03 1996-07-31 Component of the RAM signaling network; is involved in regulation of Ace2p activity and cellular morphogenesis, interacts with Kic1p and Sog2p, localizes to sites of polarized growth during budding and during the mating response -S000030561 CDS YKL189W 11 84704 85903 W 2011-02-03 1996-07-31 -S000001671 ORF Verified YKL188C PXA2 ATP-binding cassette long-chain fatty acid transporter PXA2|PAT1 chromosome 11 L000003538 11 88786 86225 C 2011-02-03 1996-07-31 Subunit of heterodimeric peroxisomal ABC transport complex, with Pxa1p; required for import of long-chain fatty acids into peroxisomes; similar to human adrenoleukodystrophy transportesr ABCD1 and ABCD2, and ALD-related proteins; mutations in ABCD1 cause X-linked adrenoleukodystrophy (X-ALD), a peroxisomal disorder; human ABCD1 and ABCD2 can each partially complement yeast pxa1 pxa2 double null mutant -S000030413 CDS YKL188C 11 88786 86225 C 2011-02-03 1996-07-31 -S000130138 ARS ARS1104 ARSXI-89 chromosome 11 11 88789 89287 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001670 ORF Verified YKL187C FAT3 chromosome 11 11 91536 89284 C 2011-02-03 1996-07-31 Protein required for fatty acid uptake; protein abundance increases in cortical patches in response to oleate exposure; the authentic, non-tagged protein is detected in a phosphorylated state in highly purified mitochondria in high-throughput studies; FAT3 has a paralog, YLR413W, that arose from the whole genome duplication -S000037608 CDS YKL187C 11 91536 89284 C 2011-02-03 1996-07-31 -S000001669 ORF Verified YKL186C MTR2 chromosome 11 L000002934 11 93298 92744 C 2011-02-03 1996-07-31 mRNA transport regulator; essential nuclear protein; Mex67p and Mtr2p form a mRNA export complex which binds to RNA -S000037550 CDS YKL186C 11 93298 92744 C 2011-02-03 1996-07-31 -S000122106 five_prime_UTR_intron YKL186C 11 93465 93312 C 2011-02-03 2007-04-04 -S000001668 ORF Verified YKL185W ASH1 DNA-binding transcription repressor ASH1 chromosome 11 L000003058 11 94499 96265 W 2011-02-03 1996-07-31 Component of the Rpd3L histone deacetylase complex; zinc-finger inhibitor of HO transcription; mRNA is localized and translated in the distal tip of anaphase cells, resulting in accumulation of Ash1p in daughter cell nuclei and inhibition of HO expression; potential Cdc28p substrate -S000037492 CDS YKL185W 11 94499 96265 W 2011-02-03 1996-07-31 -S000001667 ORF Verified YKL184W SPE1 ornithine decarboxylase SPE1|SPE10|ORD1 chromosome 11 L000001307|L000001993|L000001995 11 96757 98157 W -130.3 2011-02-03 1996-07-31 Ornithine decarboxylase; catalyzes the first step in polyamine biosynthesis; degraded in a proteasome-dependent manner in the presence of excess polyamines; deletion decreases lifespan, and increases necrotic cell death and ROS generation -S000032037 CDS YKL184W 11 96757 98157 W 2011-02-03 1996-07-31 -S000119035 ARS ARS1125 ARSXI-98|ARS1104.5 chromosome 11 11 98364 98523 2014-11-18 2014-11-18|2006-10-03 Autonomously Replicating Sequence -S000178128 ARS_consensus_sequence ARS1125 11 98385 98401 W 2014-11-18 2014-11-18 -S000028558 ORF Uncharacterized YKL183C-A chromosome 11 11 98607 98395 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031244 CDS YKL183C-A 11 98607 98395 C 2011-02-03 2003-07-29 -S000001666 ORF Verified YKL183W LOT5 chromosome 11 11 98721 99641 W 2011-02-03 1996-07-31 Protein of unknown function; gene expression increases in cultures shifted to a lower temperature; protein abundance increases in response to DNA replication stress -S000031917 CDS YKL183W 11 98721 99641 W 2011-02-03 1996-07-31 -S000001665 ORF Verified YKL182W FAS1 tetrafunctional fatty acid synthase subunit FAS1 chromosome 11 L000000601 11 100671 106826 W -116.7 2011-02-03 1996-07-31 Beta subunit of fatty acid synthetase; complex catalyzes the synthesis of long-chain saturated fatty acids; contains acetyltransacylase, dehydratase, enoyl reductase, malonyl transacylase, and palmitoyl transacylase activities -S000031771 CDS YKL182W 11 100671 106826 W 2011-02-03 1996-07-31 -S000001664 ORF Verified YKL181W PRS1 ribose phosphate diphosphokinase subunit PRS1|PRP1 chromosome 11 L000001494 11 107316 108599 W 2011-02-03 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase; synthesizes PRPP, which is required for nucleotide, histidine, and tryptophan biosynthesis; plays a key role in cell wall integrity (CWI) pathway; one of five related enzymes, which are active as heteromultimeric complexes; missense mutations in human homolog PRPS1 are associated with neuropathic Arts syndrome and Charcot-Marie Tooth (CMTX5) disease -S000029853 CDS YKL181W 11 107316 108599 W 2011-02-03 1996-07-31 -S000001663 ORF Verified YKL180W RPL17A uL22|ribosomal 60S subunit protein L17A|L22|YL17|L20A|L17A|RPL17 chromosome 11 L000001715 11 109269 110129 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L17A; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; copurifies with the Dam1 complex (aka DASH complex); homologous to mammalian ribosomal protein L17 and bacterial L22; RPL17A has a paralog, RPL17B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000036148 CDS YKL180W 11 109269 109577 W 2011-02-03 1996-07-31 -S000036149 CDS YKL180W 11 109884 110129 W 2011-02-03 1996-07-31 -S000036150 intron YKL180W 11 109578 109883 W 2011-02-03 1996-07-31 -S000001662 ORF Verified YKL179C COY1 chromosome 11 11 112503 110464 C 2011-02-03 1996-07-31 Golgi membrane protein with similarity to mammalian CASP; genetic interactions with GOS1 (encoding a Golgi snare protein) suggest a role in Golgi function -S000035207 CDS YKL179C 11 112503 110464 C 2011-02-03 1996-07-31 -S000001660 ORF Dubious YKL177W chromosome 11 11 114356 114694 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene STE3 -S000034192 CDS YKL177W 11 114356 114694 W 2011-02-03 1996-07-31 -S000001661 ORF Verified YKL178C STE3 DAF2 chromosome 11 L000002113 11 114627 113215 C 2011-02-03 1996-07-31 Receptor for a factor pheromone; couples to MAP kinase cascade to mediate pheromone response; transcribed in alpha cells and required for mating by alpha cells, ligand bound receptors endocytosed and recycled to the plasma membrane; GPCR -S000035096 CDS YKL178C 11 114627 113215 C 2011-02-03 1996-07-31 -S000001659 ORF Verified YKL176C LST4 chromosome 11 L000004354 11 117986 115500 C 2011-02-03 1996-07-31 Subunit of the Lst4p-Lst7p GTPase activating protein complex for Gtr2p; stimulates the GTPase activity of Rag family GTPase Gtr2p, within the context of the Gtr1p-Gtr2p heterodimer, after amino acid stimulation; required for activation of TORC1 in response to amino acid stimulation; recruited to the vacuolar membrane during amino acid starvation and released from the membrane by TORC1; required for the transport of amino acid permease Gap1p from the Golgi to the cell surface -S000034038 CDS YKL176C 11 117986 115500 C 2011-02-03 1996-07-31 -S000001658 ORF Verified YKL175W ZRT3 Zn(2+) transporter ZRT3 chromosome 11 11 118793 120304 W 2011-02-03 1996-07-31 Vacuolar membrane zinc transporter; transports zinc from storage in the vacuole to the cytoplasm when needed; transcription is induced under conditions of zinc deficiency -S000033999 CDS YKL175W 11 118793 120304 W 2011-02-03 1996-07-31 -S000001657 ORF Verified YKL174C TPO5 chromosome 11 11 122236 120380 C 2011-02-03 1996-07-31 Protein involved in excretion of putrescine and spermidine; putative polyamine transporter in the Golgi or post-Golgi vesicles -S000033149 CDS YKL174C 11 122236 120380 C 2011-02-03 1996-07-31 -S000001656 ORF Verified YKL173W SNU114 U5 snRNP GTPase SNU114|GIN10 chromosome 11 L000003541 11 122517 125543 W 2011-02-03 1996-07-31 GTPase component of U5 snRNP involved in mRNA splicing via spliceosome; binds directly to U5 snRNA; proposed to be involved in conformational changes of the spliceosome; similarity to ribosomal translocation factor EF-2 -S000033113 CDS YKL173W 11 122517 125543 W 2011-02-03 1996-07-31 -S000001655 ORF Verified YKL172W EBP2 chromosome 11 L000004646 11 125759 127042 W 2011-02-03 1996-07-31 Required for 25S rRNA maturation and 60S ribosomal subunit assembly; localizes to the nucleolus and in foci along nuclear periphery; constituent of 66S pre-ribosomal particles; cooperates with Rrs1p and Mps3p to mediate telomere clustering by binding Sir4p, but is not involved in telomere tethering -S000033024 CDS YKL172W 11 125759 127042 W 2011-02-03 1996-07-31 -S000001654 ORF Verified YKL171W NNK1 protein kinase NNK1 chromosome 11 11 127475 130261 W 2011-02-03 1996-07-31 Protein kinase; implicated in proteasome function; interacts with TORC1, Ure2 and Gdh2; overexpression leads to hypersensitivity to rapamycin and nuclear accumulation of Gln3; epitope-tagged protein localizes to the cytoplasm -S000032097 CDS YKL171W 11 127475 130261 W 2011-02-03 1996-07-31 -S000001653 ORF Verified YKL170W MRPL38 mitochondrial 54S ribosomal protein YmL38/YmL34|YmL38|YmL34|MRPL34 chromosome 11 S000029310|L000002693|L000001173 11 130634 131050 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; appears as two protein spots (YmL34 and YmL38) on two-dimensional SDS gels; protein abundance increases in response to DNA replication stress -S000031979 CDS YKL170W 11 130634 131050 W 2011-02-03 1996-07-31 -S000001652 ORF Dubious YKL169C chromosome 11 11 131068 130685 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene MRPL38 -S000030884 CDS YKL169C 11 131068 130685 C 2011-02-03 1996-07-31 -S000001651 ORF Verified YKL168C KKQ8 putative serine/threonine protein kinase KKQ8 chromosome 11 L000004097 11 133462 131288 C 2011-02-03 1996-07-31|2006-05-08 Putative serine/threonine protein kinase with unknown cellular role; KKQ8 has a paralog, HAL5, that arose from the whole genome duplication -S000030812 CDS YKL168C 11 133462 131288 C 2011-02-03 1996-07-31|2006-05-08 -S000001650 ORF Verified YKL167C MRP49 mitochondrial 54S ribosomal protein MRP49 chromosome 11 L000001159 11 134134 133721 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; not essential for mitochondrial translation -S000037870 CDS YKL167C 11 134134 133721 C 2011-02-03 1996-07-31 -S000001649 ORF Verified YKL166C TPK3 cAMP-dependent protein kinase catalytic subunit TPK3 chromosome 11 L000002327 11 135705 134509 C 2011-02-03 1996-07-31 cAMP-dependent protein kinase catalytic subunit; promotes vegetative growth in response to nutrients via the Ras-cAMP signaling pathway; partially redundant with Tpk1p and Tpk2p; localizes to P-bodies during stationary phase; TPK3 has a paralog, TPK1, that arose from the whole genome duplication -S000037767 CDS YKL166C 11 135705 134509 C 2011-02-03 1996-07-31 -S000007617 ORF Dubious YKL165C-A chromosome 11 11 136023 135790 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037215 CDS YKL165C-A 11 136023 135790 C 2011-02-03 2001-02-26 -S000001648 ORF Verified YKL165C MCD4 mannose-ethanolamine phosphotransferase MCD4|FSR2|SSU21|ZRG16 chromosome 11 L000003913|S000029172|L000003584 11 140691 137932 C 2011-02-03 1996-07-31 Protein involved in GPI anchor synthesis; multimembrane-spanning protein that localizes to the endoplasmic reticulum; highly conserved among eukaryotes; GPI stands for glycosylphosphatidylinositol -S000037706 CDS YKL165C 11 140691 137932 C 2011-02-03 1996-07-31 -S000006558 tRNA_gene tE(UUC)K chromosome 11 L000003643 11 141089 141018 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000036005 noncoding_exon tE(UUC)K 11 141089 141018 C 2011-02-03 2000-05-19 -S000001647 ORF Verified YKL164C PIR1 beta-1,3-glucan linked protein|CCW6 chromosome 11 L000001441 11 142819 141794 C 2011-02-03 1996-07-31 O-glycosylated protein required for cell wall stability; attached to the cell wall via beta-1,3-glucan; mediates mitochondrial translocation of Apn1p; expression regulated by the cell integrity pathway and by Swi5p during the cell cycle; PIR1 has a paralog, YJL160C, that arose from the whole genome duplication -S000036944 CDS YKL164C 11 142819 141794 C 2011-02-03 1996-07-31 -S000001646 ORF Verified YKL163W PIR3 beta-1,3-glucan linked protein|CCW8 chromosome 11 L000001443 11 144401 145378 W 2011-02-03 1996-07-31 O-glycosylated covalently-bound cell wall protein; required for cell wall stability; expression is cell cycle regulated, peaking in M/G1 and also subject to regulation by the cell integrity pathway; coding sequence contains length polymorphisms in different strains; PIR3 has a paralog, HSP150, that arose from the whole genome duplication -S000036912 CDS YKL163W 11 144401 145378 W 2011-02-03 1996-07-31 -S000007244 ORF Dubious YKL162C-A chromosome 11 11 146074 145922 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032863 CDS YKL162C-A 11 146074 145922 C 2011-02-03 1999-07-17 -S000001645 ORF Uncharacterized YKL162C chromosome 11 11 148838 147630 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion -S000036809 CDS YKL162C 11 148838 147630 C 2011-02-03 1996-07-31 -S000001644 ORF Verified YKL161C KDX1 putative protein kinase KDX1|MLP1 chromosome 11 11 150687 149386 C 2011-02-03 1996-07-31 Protein kinase; implicated in Slt2p mitogen-activated (MAP) kinase signaling pathway; interacts with numerous components in the mating pheromone and CWI MAPK pathways; associates with Rlm1p; KDX1 has a paralog, SLT2, that arose from the whole genome duplication -S000035941 CDS YKL161C 11 150687 149386 C 2011-02-03 1996-07-31 -S000118402 ARS ARS1106 ARSXI-153 chromosome 11 11 153020 153135 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178129 ARS_consensus_sequence ARS1106 11 153122 153106 C 2014-11-18 2014-11-18 -S000001643 ORF Verified YKL160W ELF1 chromosome 11 11 153269 153706 W 2011-02-03 1996-07-31 Transcription elongation factor with a conserved zinc finger domain; implicated in the maintenance of proper chromatin structure in actively transcribed regions; deletion inhibits Brome mosaic virus (BMV) gene expression -S000035865 CDS YKL160W 11 153269 153706 W 2011-02-03 1996-07-31 -S000001642 ORF Verified YKL159C RCN1 chromosome 11 S000007456 11 154451 153816 C 2011-02-03 1996-07-31 Protein involved in calcineurin regulation during calcium signaling; has similarity to H. sapiens DSCR1 which is found in the Down Syndrome candidate region -S000034776 CDS YKL159C 11 154451 153816 C 2011-02-03 1996-07-31 -S000001640 ORF Verified YKL157W APE2 metallo-aminopeptidase|YKL158W|LAP1 chromosome 11 S000001641|L000000092 11 154991 158232 W -124.8 2011-02-03 2000-07-14|1996-07-31|2011-02-03 Aminopeptidase yscII; may have a role in obtaining leucine from dipeptide substrates; APE2 has a paralog, AAP1, that arose from the whole genome duplication -S000033809 CDS YKL157W 11 154991 155271 W 2011-02-03 2000-07-14|1996-07-31 -S000033810 CDS YKL157W 11 155655 158232 W 2011-02-03 2000-07-14|2011-02-03 -S000033811 intron YKL157W 11 155272 155654 W 2011-02-03 2000-07-14 -S000001639 ORF Verified YKL156W RPS27A eS27|ribosomal 40S subunit protein S27A|S27e|rp61|YS20|S27A chromosome 11 L000002712 11 158613 159212 W 2011-02-03 1996-07-31|2011-02-03 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S27, no bacterial homolog; RPS27A has a paralog, RPS27B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000033664 CDS YKL156W 11 158613 158615 W 2011-02-03 1996-07-31 -S000033665 CDS YKL156W 11 158967 159212 W 2011-02-03 1996-07-31 -S000033666 intron YKL156W 11 158616 158966 W 2011-02-03 1996-07-31|2011-02-03 -S000028668 ORF Dubious YKL156C-A chromosome 11 11 159091 158975 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene RPS27A; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032493 CDS YKL156C-A 11 159091 158975 C 2011-02-03 2003-07-29 -S000001638 ORF Verified YKL155C RSM22 mitochondrial 37S ribosomal protein RSM22 chromosome 11 11 161342 159456 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; also predicted to be an S-adenosylmethionine-dependent RNA methyltransferase -S000033531 CDS YKL155C 11 161342 159456 C 2011-02-03 1996-07-31 -S000001637 ORF Verified YKL154W SRP102 Signal recognition particle receptor subunit beta chromosome 11 11 161601 162335 W 2011-02-03 1996-07-31 Signal recognition particle (SRP) receptor beta subunit; involved in SRP-dependent protein targeting; anchors the alpha subunit, Srp101p to the ER membrane -S000033491 CDS YKL154W 11 161601 162335 W 2011-02-03 1996-07-31 -S000006716 tRNA_gene tR(UCU)K chromosome 11 L000003642 11 162558 162487 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000037862 noncoding_exon tR(UCU)K 11 162558 162487 C 2011-02-03 2000-05-19 -S000007056 long_terminal_repeat YKLWdelta3 chromosome 11 11 162831 163169 W 2011-02-03 2000-05-19 Ty1 LTR -S000001636 ORF Dubious YKL153W chromosome 11 11 163600 164109 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription of both YLK153W and the overlapping essential gene GPM1 is reduced in the gcr1 null mutant -S000032752 CDS YKL153W 11 163600 164109 W 2011-02-03 1996-07-31 -S000001635 ORF Verified YKL152C GPM1 phosphoglycerate mutase GPM1 chromosome 11 L000000726 11 164385 163642 C 2011-02-03 1996-07-31 Tetrameric phosphoglycerate mutase; mediates the conversion of 3-phosphoglycerate to 2-phosphoglycerate during glycolysis and the reverse reaction during gluconeogenesis -S000032605 CDS YKL152C 11 164385 163642 C 2011-02-03 1996-07-31 -S000001634 ORF Verified YKL151C NNR2 NADHX dehydratase chromosome 11 11 165930 164917 C 2011-02-03 1996-07-31 Widely-conserved NADHX dehydratase; converts (S)-NADHX to NADH in ATP-dependent manner; YKL151C promoter contains STREs (stress response elements) and expression is induced by heat shock or methyl methanesulfonate; downstream intergenic region drives antisense expression and mediates coordinated regulation of YKL151C and GPM1 phosphoglycerate mutase; protein abundance increases in response to DNA replication stress; homolog of Carkd in mammals and C-terminus of YjeF in E.coli -S000031623 CDS YKL151C 11 165930 164917 C 2011-02-03 1996-07-31 -S000001633 ORF Verified YKL150W MCR1 cytochrome-b5 reductase chromosome 11 L000003134 11 166544 167452 W 2011-02-03 1996-07-31 Mitochondrial NADH-cytochrome b5 reductase; involved in ergosterol biosynthesis -S000031554 CDS YKL150W 11 166544 167452 W 2011-02-03 1996-07-31 -S000122105 five_prime_UTR_intron YKL150W 11 166400 166487 W 2011-02-03 2007-04-04 -S000001632 ORF Verified YKL149C DBR1 RNA lariat debranching enzyme|PRP26 chromosome 11 L000000495 11 168829 167612 C -106.4 2011-02-03 1996-07-31 RNA lariat debranching enzyme; catalyzes debranching of lariat introns formed during pre-mRNA splicing; required for efficient Ty1 transposition; knockdown of human homolog Dbr1 rescues toxicity of RNA-binding proteins TDP-43 and FUS which are implicated in amyotrophic lateral sclerosis (ALS), suggests potential therapeutic target for ALS and related TDP-43 proteinopathies; human homolog DBR1 can complement yeast dbr1 null mutant -S000031536 CDS YKL149C 11 168829 167612 C 2011-02-03 1996-07-31 -S000001631 ORF Verified YKL148C SDH1 succinate dehydrogenase flavoprotein subunit SDH1|SDHA chromosome 11 L000001823 11 171129 169207 C 2011-02-03 1996-07-31 Flavoprotein subunit of succinate dehydrogenase; couples the oxidation of succinate to the transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; FAD binding to Sdh1p is required for the assembly of the succinate dehydrogenase subunits; mutations in human ortholog SDHA are associated with Leigh syndrome -S000030671 CDS YKL148C 11 171129 169207 C 2011-02-03 1996-07-31 -S000001629 ORF Verified YKL146W AVT3 chromosome 11 11 171783 173861 W 2011-02-03 1996-07-31 Vacuolar transporter; exports large neutral amino acids from the vacuole; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters -S000030513 CDS YKL146W 11 171783 173861 W 2011-02-03 1996-07-31 -S000001630 ORF Dubious YKL147C chromosome 11 11 172168 171551 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified gene AVT3 -S000030585 CDS YKL147C 11 172168 171551 C 2011-02-03 1996-07-31 -S000001628 ORF Verified YKL145W RPT1 proteasome regulatory particle base subunit RPT1|YTA3|CIM5 chromosome 11 L000002557 11 174213 175616 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; required for optimal CDC20 transcription; interacts with Rpn12p and Ubr1p; mutant has aneuploidy tolerance -S000030368 CDS YKL145W 11 174213 175616 W 2011-02-03 1996-07-31 -S000028841 ORF Dubious YKL145W-A chromosome 11 11 174958 175050 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified essential gene RPT1; identified by expression profiling and mass spectrometry -S000034526 CDS YKL145W-A 11 174958 175050 W 2011-02-03 2003-07-29 -S000001627 ORF Verified YKL144C RPC25 DNA-directed RNA polymerase III subunit RPC25|C25|YKL1 chromosome 11 L000002427 11 176481 175843 C 2011-02-03 1996-07-31 RNA polymerase III subunit C25; required for transcription initiation; forms a heterodimer with Rpc17p; paralog of Rpb7p -S000037515 CDS YKL144C 11 176481 175843 C 2011-02-03 1996-07-31 -S000001626 ORF Verified YKL143W LTV1 YKL2 chromosome 11 L000000962 11 176781 178172 W 2011-02-03 1996-07-31 Component of the GSE complex; GSE is required for proper sorting of amino acid permease Gap1p; required for ribosomal small subunit export from nucleus; required for growth at low temperature -S000037465 CDS YKL143W 11 176781 178172 W 2011-02-03 1996-07-31 -S000001625 ORF Verified YKL142W MRP8 YKL3 chromosome 11 L000001156 11 178515 179174 W 2011-02-03 1996-07-31 Protein of unknown function; undergoes sumoylation; transcription induced under cell wall stress; protein levels are reduced under anaerobic conditions; protein abundance increases in response to DNA replication stress; originally thought to be a mitochondrial ribosomal protein based on sequence analysis -S000036742 CDS YKL142W 11 178515 179174 W 2011-02-03 1996-07-31 -S000001624 ORF Verified YKL141W SDH3 succinate dehydrogenase cytochrome b subunit SDH3|YKL4|CYB3 chromosome 11 L000001825 11 179667 180263 W 2011-02-03 1996-07-31 Subunit of succinate dehydrogenase and of TIM22 translocase; functions as cytochrome b subunit of succinate dehydrogenase, which couples oxidation of succinate to transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; also required for mitochondrial inner membrane protein import as part of the TIM22 complex; SDH3 has a paralog, SHH3, that arose from the whole genome duplication -S000036643 CDS YKL141W 11 179667 180263 W 2011-02-03 1996-07-31 -S000001623 ORF Verified YKL140W TGL1 YKL5 chromosome 11 L000002293 11 180779 182425 W 2011-02-03 1996-07-31 Steryl ester hydrolase; one of three gene products (Yeh1p, Yeh2p, Tgl1p) responsible for steryl ester hydrolase activity and involved in sterol homeostasis; localized to lipid particle membranes -S000036522 CDS YKL140W 11 180779 182425 W 2011-02-03 1996-07-31 -S000001622 ORF Verified YKL139W CTK1 cyclin-dependent serine/threonine protein kinase CTK1 chromosome 11 L000000432 11 182958 184544 W 2011-02-03 1996-07-31 Catalytic (alpha) subunit of C-terminal domain kinase I (CTDK-I); phosphorylates both RNA pol II subunit Rpo21p to affect transcription and pre-mRNA 3' end processing, and ribosomal protein Rps2p to increase translational fidelity; required for H3K36 trimethylation but not dimethylation by Set2p; suggested stimulatory role in 80S formation during translation initiation; similar to the Drosophila dCDK12 and human CDK12 and probably CDK13 -S000036668 CDS YKL139W 11 182958 184544 W 2011-02-03 1996-07-31 -S000028421 ORF Verified YKL138C-A HSK3 chromosome 11 S000028418 11 185012 184803 C 2011-02-03 2002-06-20 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis -S000029957 CDS YKL138C-A 11 185012 184803 C 2011-02-03 2002-06-20 -S000001621 ORF Verified YKL138C MRPL31 mitochondrial 54S ribosomal protein YmL31|YmL31 chromosome 11 L000001168|L000002529 11 185681 185286 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000035696 CDS YKL138C 11 185681 185286 C 2011-02-03 1996-07-31 -S000001620 ORF Verified YKL137W CMC1 chromosome 11 11 185957 186292 W 2011-02-03 1996-07-31|2005-12-15 Copper-binding protein of the mitochondrial intermembrane space; evolutionarily conserved; may be involved in delivering copper from the matrix to the cytochrome c oxidase complex; contains a twin CX9C motif -S000035632 CDS YKL137W 11 185957 186292 W 2011-02-03 1996-07-31|2005-12-15 -S000001619 ORF Dubious YKL136W chromosome 11 11 186416 186814 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF APL2/YKL135C -S000035555 CDS YKL136W 11 186416 186814 W 2011-02-03 1996-07-31 -S000001618 ORF Verified YKL135C APL2 chromosome 11 L000000094 11 188640 186460 C 2011-02-03 1996-07-31 Beta-adaptin subunit of the clathrin-associated protein (AP-1) complex; binds clathrin; involved in clathrin-dependent Golgi protein sorting; protein abundance increases in response to DNA replication stress -S000034478 CDS YKL135C 11 188640 186460 C 2011-02-03 1996-07-31 -S000001617 ORF Verified YKL134C OCT1 metalloendopeptidase chromosome 11 L000004860 11 191442 189124 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial intermediate peptidase; cleaves destabilizing N-terminal residues of a subset of proteins upon import, after their cleavage by mitochondrial processing peptidase (Mas1p-Mas2p); may contribute to mitochondrial iron homeostasis -S000034401 CDS YKL134C 11 191442 189124 C 2011-02-03 1996-07-31|2011-02-03 -S000001616 ORF Uncharacterized YKL133C chromosome 11 11 193070 191679 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; not required for growth of cells lacking the mitochondrial genome; SWAT-GFP and mCherry fusion proteins localize to the mitochondria; YKL133C has a paralog, MGR3, that arose from the whole genome duplication -S000034300 CDS YKL133C 11 193070 191679 C 2011-02-03 1996-07-31|2011-02-03 -S000001614 ORF Dubious YKL131W chromosome 11 11 194478 194999 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033359 CDS YKL131W 11 194478 194999 W 2011-02-03 1996-07-31 -S000001615 ORF Verified YKL132C RMA1 putative tetrahydrofolate synthase chromosome 11 11 194866 193574 C 2011-02-03 1996-07-31 Putative dihydrofolate synthetase; similar to E. coli folylpolyglutamate synthetase/dihydrofolate synthetase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; RMA1 has a paralog, FOL3, that arose from the whole genome duplication -S000033390 CDS YKL132C 11 194866 193574 C 2011-02-03 1996-07-31 -S000001613 ORF Verified YKL130C SHE2 chromosome 11 L000004571 11 196028 195288 C 2011-02-03 1996-07-31 RNA-binding protein that binds specific mRNAs and interacts with She3p; part of the mRNA localization machinery that restricts accumulation of certain proteins to the bud; binds to ER-derived membranes and targets mRNAs to cortical ER -S000033257 CDS YKL130C 11 196028 195288 C 2011-02-03 1996-07-31 -S000119036 ARS ARS1126 ARSXI-196|ARS1106.3 chromosome 11 11 196042 196287 2011-02-03 2006-10-03 Autonomously Replicating Sequence -S000001612 ORF Verified YKL129C MYO3 myosin 3 chromosome 11 L000002889 11 200167 196349 C 2011-02-03 1996-07-31|2011-02-03 One of two type I myosins; localizes to actin cortical patches; deletion of MYO3 has little effect on growth, but myo3 myo5 double deletion causes severe defects in growth and actin cytoskeleton organization; MYO3 has a paralog, MYO5, that arose from the whole genome duplication -S000032500 CDS YKL129C 11 200167 196349 C 2011-02-03 1996-07-31|2011-02-03 -S000001611 ORF Verified YKL128C PMU1 putative phosphomutase chromosome 11 L000003276 11 201771 200884 C 2011-02-03 1996-07-31 Putative phosphomutase; contains a region homologous to the active site of phosphomutases; overexpression suppresses the histidine auxotrophy of an ade3 ade16 ade17 triple mutant and the temperature sensitivity of a tps2 mutant -S000032407 CDS YKL128C 11 201771 200884 C 2011-02-03 1996-07-31 -S000007054 long_terminal_repeat YKLCsigma1 chromosome 11 11 202983 202644 C 2011-02-03 2000-05-19 Ty3 LTR -S000006626 tRNA_gene tK(CUU)K chromosome 11 L000003631 11 202999 203071 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000036035 noncoding_exon tK(CUU)K 11 202999 203071 W 2011-02-03 2000-05-19 -S000001610 ORF Verified YKL127W PGM1 phosphoglucomutase PGM1 chromosome 11 L000001412 11 203541 205253 W -108.4 2011-02-03 1996-07-31 Phosphoglucomutase, minor isoform; catalyzes the conversion from glucose-1-phosphate to glucose-6-phosphate, which is a key step in hexose metabolism; PGM1 has a paralog, PGM2, that arose from the whole genome duplication -S000032331 CDS YKL127W 11 203541 205253 W 2011-02-03 1996-07-31 -S000001609 ORF Verified YKL126W YPK1 serine/threonine protein kinase YPK1|SLI2 chromosome 11 L000002541 11 205707 207749 W -97.7 2011-02-03 1996-07-31 S/T protein kinase; phosphorylates, downregulates flippase activator Fpk1p; inactivates Orm1p and Orm2p by phosphorylation in response to compromised sphingolipid synthesis; involved in the TORC-dependent phosphorylation of ribosomal proteins Rps6a/b (S6); mutations affect receptor-mediated endocytosis and sphingolipid-mediated and cell integrity signaling pathways; human homolog SGK1 can complement a null mutant; human homolog SGK2 can complement a ypk1 ypk2 double mutant -S000031322 CDS YKL126W 11 205707 207749 W 2011-02-03 1996-07-31 -S000001608 ORF Verified YKL125W RRN3 rDNA-binding RNA polymerase I transcriptional factor chromosome 11 L000003362 11 208247 210130 W 2011-02-03 1996-07-31 Protein required for transcription of rDNA by RNA polymerase I; transcription factor independent of DNA template; involved in recruitment of RNA polymerase I to rDNA; structure reveals unique HEAT repeat fold and a surface serine patch; phosphorylation of serine patch impairs cell growth and reduces RNA polymerase I binding in vitro and RNA polymerase I recruitment to the rDNA gene in vivo -S000031219 CDS YKL125W 11 208247 210130 W 2011-02-03 1996-07-31 -S000001607 ORF Verified YKL124W SSH4 MLF4 chromosome 11 L000002951 11 210593 212332 W 2011-02-03 1996-07-31 Specificity factor required for Rsp5p-dependent ubiquitination; also required for sorting of cargo proteins at the multivesicular body; identified as a high-copy suppressor of a SHR3 deletion, increasing steady-state levels of amino acid permeases -S000031112 CDS YKL124W 11 210593 212332 W 2011-02-03 1996-07-31 -S000001606 ORF Dubious YKL123W chromosome 11 11 212043 212423 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SSH4 -S000030083 CDS YKL123W 11 212043 212423 W 2011-02-03 1996-07-31 -S000001605 ORF Verified YKL122C SRP21 signal recognition particle subunit SRP21 chromosome 11 L000002062 11 212998 212495 C 2011-02-03 1996-07-31 Subunit of the signal recognition particle (SRP); SRP functions in protein targeting to the endoplasmic reticulum membrane; not found in mammalian SRP; forms a pre-SRP structure in the nucleolus that is translocated to the cytoplasm -S000029913 CDS YKL122C 11 212998 212495 C 2011-02-03 1996-07-31 -S000119037 ARS ARS1127 ARSXI-213|ARS1106.7 chromosome 11 11 213439 213743 2011-02-03 2006-10-03 Autonomously Replicating Sequence -S000001604 ORF Uncharacterized YKL121W DGR2 chromosome 11 11 214142 216700 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant is resistant to 2-deoxy-D-glucose and displays abnormally elongated buds; DGR2 has a paralog, YMR102C, that arose from the whole genome duplication -S000029872 CDS YKL121W 11 214142 216700 W 2011-02-03 1996-07-31 -S000001603 ORF Verified YKL120W OAC1 chromosome 11 S000007413 11 217344 218318 W 2011-02-03 1996-07-31 Mitochondrial inner membrane transporter; transports oxaloacetate, sulfate, thiosulfate, and isopropylmalate; member of the mitochondrial carrier family -S000037208 CDS YKL120W 11 217344 218318 W 2011-02-03 1996-07-31 -S000001601 ORF Dubious YKL118W chromosome 11 11 219126 219437 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene VPH2 -S000036185 CDS YKL118W 11 219126 219437 W 2011-02-03 1996-07-31 -S000001602 ORF Verified YKL119C VPH2 VMA12|CLS10 chromosome 11 L000002468 11 219217 218570 C 2011-02-03 1996-07-31 Integral membrane protein required for V-ATPase function; not an actual component of the vacuolar H+-ATPase (V-ATPase) complex; functions in the assembly of the V-ATPase; localized to the endoplasmic reticulum (ER); involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner -S000036236 CDS YKL119C 11 219217 218570 C 2011-02-03 1996-07-31 -S000007051 long_terminal_repeat YKLCdelta4 chromosome 11 11 219723 219395 C 2011-02-03 2000-05-19 Ty1 LTR -S000006515 tRNA_gene tA(AGC)K1 chromosome 11 L000003632 11 219895 219967 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000036246 noncoding_exon tA(AGC)K1 11 219895 219967 W 2011-02-03 2000-05-19 -S000001600 ORF Verified YKL117W SBA1 Hsp90 cochaperone SBA1|CST18 chromosome 11 L000004284|L000002999|S000029122 11 220324 220974 W 2011-02-03 1996-07-31 Co-chaperone that binds and regulates Hsp90 family chaperones; plays a role in determining prion variants; important for pp60v-src activity in yeast; homologous to the mammalian p23 proteins, and like p23 can regulate telomerase activity; protein abundance increases in response to DNA replication stress -S000035238 CDS YKL117W 11 220324 220974 W 2011-02-03 1996-07-31 -S000001599 ORF Verified YKL116C PRR1 serine/threonine protein kinase PRR1 chromosome 11 11 222900 221344 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; inhibits pheromone induced signaling downstream of MAPK, possibly at the level of the Ste12p transcription factor -S000034995 CDS YKL116C 11 222900 221344 C 2011-02-03 1996-07-31 -S000001598 ORF Dubious YKL115C chromosome 11 11 223285 222893 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene PRR1 -S000034081 CDS YKL115C 11 223285 222893 C 2011-02-03 1996-07-31 -S000001597 ORF Verified YKL114C APN1 DNA-(apurinic or apyrimidinic site) lyase APN1 chromosome 11 L000000096 11 224455 223352 C 2011-02-03 1996-07-31 Major apurinic/apyrimidinic endonuclease; 3'-repair diesterase; involved in repair of DNA damage by oxidation and alkylating agents; also functions as a 3'-5' exonuclease to repair 7,8-dihydro-8-oxodeoxyguanosine; genetically interacts with NTG1 to maintain mitochondrial genome integrity -S000033938 CDS YKL114C 11 224455 223352 C 2011-02-03 1996-07-31 -S000001596 ORF Verified YKL113C RAD27 multifunctional nuclease RAD27|FEN1|RTH1|ERC11 chromosome 11 L000002742|L000000565 11 225875 224727 C 2011-02-03 1996-07-31 5' to 3' exonuclease, 5' flap endonuclease; required for Okazaki fragment processing and maturation, for long-patch base-excision repair and large loop repair (LLR), ribonucleotide excision repair; member of the S. pombe RAD2/FEN1 family; relocalizes to the cytosol in response to hypoxia -S000033801 CDS YKL113C 11 225875 224727 C 2011-02-03 1996-07-31 -S000001595 ORF Verified YKL112W ABF1 GFI|SBF-B|DNA-binding protein ABF1|SBF1|REB2|OBF1|BAF1 chromosome 11 L000000159 11 226570 228765 W 2011-02-03 1996-07-31 DNA binding protein with possible chromatin-reorganizing activity; involved in transcriptional activation, gene silencing, and DNA replication and repair -S000033734 CDS YKL112W 11 226570 228765 W 2011-02-03 1996-07-31 -S000001594 ORF Dubious YKL111C chromosome 11 11 228799 228464 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified essential gene ABF1 -S000032984 CDS YKL111C 11 228799 228464 C 2011-02-03 1996-07-31 -S000001593 ORF Verified YKL110C KTI12 TOT4 chromosome 11 L000000923 11 229880 228939 C 2011-02-03 1996-07-31 Protein that plays a role in modification of tRNA wobble nucleosides; protein plays role in tRNA wobble nucleoside modification with Elongator complex; involved in sensitivity to G1 arrest induced by zymocin; interacts with chromatin throughout the genome; also interacts with Cdc19p -S000032867 CDS YKL110C 11 229880 228939 C 2011-02-03 1996-07-31 -S000001592 ORF Verified YKL109W HAP4 transcription factor HAP4 chromosome 11 L000000754 11 232227 233891 W 2011-02-03 1996-07-31 Transcription factor; subunit of the heme-activated, glucose-repressed Hap2p/3p/4p/5p CCAAT-binding complex, a transcriptional activator and global regulator of respiratory gene expression; provides the principal activation function of the complex; involved in diauxic shift -S000032773 CDS YKL109W 11 232227 233891 W 2011-02-03 1996-07-31 -S000001591 ORF Verified YKL108W SLD2 DRC1 chromosome 11 L000004708 11 234426 235787 W 2011-02-03 1996-07-31 Single-stranded DNA origin-binding and annealing protein; required for initiation of DNA replication; phosphorylated in S phase by cyclin-dependent kinases (Cdks), promoting origin binding, DNA replication and Dpb11p complex formation; component of the preloading complex; binds the Mcm2-7p complex to prevent inappropriate Mcm2-7p interaction with the GINS complex in G1; required for S phase checkpoint; relative distribution to the nucleus increases upon DNA replication stress -S000032698 CDS YKL108W 11 234426 235787 W 2011-02-03 1996-07-31 -S000001590 ORF Uncharacterized YKL107W putative short-chain dehydrogenase/reductase chromosome 11 11 236141 237070 W 2011-02-03 1996-07-31 Putative short-chain dehydrogenase/reductase; proposed to be a palmitoylated membrane protein -S000032626 CDS YKL107W 11 236141 237070 W 2011-02-03 1996-07-31 -S000007616 ORF Uncharacterized YKL106C-A chromosome 11 11 237266 237147 C 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology to uncharacterized proteins in other fungi -S000037214 CDS YKL106C-A 11 237266 237147 C 2011-02-03 2001-02-26 -S000001589 ORF Verified YKL106W AAT1 aspartate transaminase AAT1 chromosome 11 L000000009 11 237536 238891 W 2011-02-03 1996-07-31 Mitochondrial aspartate aminotransferase; catalyzes the conversion of oxaloacetate to aspartate in aspartate and asparagine biosynthesis -S000031616 CDS YKL106W 11 237536 238891 W 2011-02-03 1996-07-31 -S000001588 ORF Verified YKL105C SEG2 chromosome 11 11 242583 239185 C 2011-02-03 1996-07-31 Eisosome component; likely plays only a minor role in eisosome assembly; shown to interact with Seg1p by affinity purification and mass spec; SWAT-GFP and mCherry fusion proteins localize to the cell periphery; similar to A. gossypii SEG gene which is important for stabilizing eisosomes; SEG2 has a paralog, SEG1, that arose from the whole genome duplication -S000031413 CDS YKL105C 11 242583 239185 C 2011-02-03 1996-07-31 -S000001587 ORF Verified YKL104C GFA1 glutamine--fructose-6-phosphate transaminase (isomerizing) GFA1 chromosome 11 L000000702 11 245373 243220 C 2011-02-03 1996-07-31 Glutamine-fructose-6-phosphate amidotransferase; catalyzes the formation of glucosamine-6-P and glutamate from fructose-6-P and glutamine in the first step of chitin biosynthesis; GFA1 has a paralogous region, comprising ORFs YMR084W-YMR085W, that arose from the whole genome duplication -S000030506 CDS YKL104C 11 245373 243220 C 2011-02-03 1996-07-31 -S000001586 ORF Verified YKL103C APE1 metalloaminopeptidase APE1|LAP4|API|YSC1 chromosome 11 L000000930 11 247682 246138 C -138 2011-02-03 1996-07-31 Vacuolar aminopeptidase yscI; zinc metalloproteinase that belongs to the peptidase family M18; often used as a marker protein in studies of autophagy and cytosol to vacuole targeting (CVT) pathway; protein increases in abundance and relative distribution to cytoplasmic foci increases upon DNA replication stress -S000030363 CDS YKL103C 11 247682 246138 C 2011-02-03 1996-07-31 -S000001585 ORF Dubious YKL102C chromosome 11 11 248367 248062 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; deletion confers sensitivity to citric acid; predicted protein would include a thiol-disulfide oxidoreductase active site -S000030203 CDS YKL102C 11 248367 248062 C 2011-02-03 1996-07-31 -S000001584 ORF Verified YKL101W HSL1 protein kinase HSL1|ELM2|NIK1 chromosome 11 L000003129|L000002839 11 248920 253476 W 2011-02-03 1996-07-31|2011-02-03 Nim1p-related protein kinase; septin-binding kinase that localizes to the bud neck septin ring and regulates the morphogenesis checkpoint; phosphorylates Hsl7p and cooperates with Elm1p to recruit Hsl7p to the mother-bud neck, as a prerequisite for the subsequent recruitment, phosphorylation, and degradation of Swe1p; autophosphorylation enhances interactions with Hsl7p -S000037537 CDS YKL101W 11 248920 253476 W 2011-02-03 1996-07-31|2011-02-03 -S000028840 ORF Dubious YKL100W-A chromosome 11 11 254159 254248 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034525 CDS YKL100W-A 11 254159 254248 W 2011-02-03 2003-07-29 -S000001583 ORF Verified YKL100C YPF1 aspartic endopeptidase chromosome 11 11 255460 253697 C 2011-02-03 1996-07-31 Intramembrane aspartyl protease of the perinuclear ER membrane; acts in a branch of ER-associated degradation (ERAD) that degrades functional proteins rather than misfolded proteins; regulates abundance of high-affinity plasma membrane transporters, such as Ctr1p and Zrt1p, during the starvation response; has a presenilin fold; member of the GxGD family of intramembrane proteases; closest human homolog is signal peptide peptidase (SPP) -S000037360 CDS YKL100C 11 255460 253697 C 2011-02-03 1996-07-31 -S000001582 ORF Verified YKL099C UTP11 rRNA-processing protein UTP11 chromosome 11 11 256472 255720 C 2011-02-03 1996-07-31|2005-12-15 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit -S000031999 CDS YKL099C 11 256472 255720 C 2011-02-03 1996-07-31|2005-12-15 -S000001581 ORF Verified YKL098W MTC2 chromosome 11 11 256770 257843 W 2011-02-03 1996-07-31 Protein of unknown function; mtc2 is synthetically sick with cdc13-1 -S000031070 CDS YKL098W 11 256770 257843 W 2011-02-03 1996-07-31 -S000001580 ORF Dubious YKL097C chromosome 11 11 258913 258503 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species -S000030940 CDS YKL097C 11 258913 258503 C 2011-02-03 1996-07-31 -S000028667 ORF Uncharacterized YKL096C-B chromosome 11 11 259222 259073 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032492 CDS YKL096C-B 11 259222 259073 C 2011-02-03 2003-07-29 -S000001956 ORF Verified YKL096W-A CWP2 YKL097W-A|LPR1 chromosome 11 L000000952|L000002857 11 259253 259531 W 2011-02-03 1996-07-31 Covalently linked cell wall mannoprotein; major constituent of the cell wall; plays a role in stabilizing the cell wall; involved in low pH resistance; precursor is GPI-anchored -S000037786 CDS YKL096W-A 11 259253 259531 W 2011-02-03 1996-07-31 -S000001579 ORF Verified YKL096W CWP1 YJU1 chromosome 11 L000000446|L000002512 11 261132 261851 W 2011-02-03 1996-07-31 Cell wall mannoprotein that localizes to birth scars of daughter cells; linked to a beta-1,3- and beta-1,6-glucan heteropolymer through a phosphodiester bond; required for propionic acid resistance -S000030917 CDS YKL096W 11 261132 261851 W 2011-02-03 1996-07-31 -S000001578 ORF Verified YKL095W YJU2 mRNA splicing protein YJU2|CWC16 chromosome 11 L000002513 11 262277 263113 W 2011-02-03 1996-07-31 Essential protein required for pre-mRNA splicing; associates transiently with the spliceosomal NTC ("nineteen complex") and acts after Prp2p to promote the first catalytic reaction of splicing -S000030823 CDS YKL095W 11 262277 263113 W 2011-02-03 1996-07-31 -S000001577 ORF Verified YKL094W YJU3 acylglycerol lipase chromosome 11 L000002514 11 263349 264290 W 2011-02-03 1996-07-31 Monoglyceride lipase (MGL); functional ortholog of mammalian MGL, localizes to lipid particles and membranes, also member of the eukaryotic serine hydrolase family -S000037906 CDS YKL094W 11 263349 264290 W 2011-02-03 1996-07-31 -S000001576 ORF Verified YKL093W MBR1 chromosome 11 L000001033 11 264789 265808 W 2011-02-03 1996-07-31 Protein involved in mitochondrial functions and stress response; overexpression suppresses growth defects of hap2, hap3, and hap4 mutants; MBR1 has a paralog, ISF1, that arose from the whole genome duplication -S000037808 CDS YKL093W 11 264789 265808 W 2011-02-03 1996-07-31 -S000001575 ORF Verified YKL092C BUD2 ERC25|CLA2 chromosome 11 L000000199 11 269459 266145 C 2011-02-03 1996-07-31 GTPase activating factor for Rsr1p/Bud1p; plays a role in spindle position checkpoint distinct from its role in bud site selection; required for both axial and bipolar budding patterns; mutants exhibit random budding in all cell types; contains two PH-like domains -S000037705 CDS YKL092C 11 269459 266145 C 2011-02-03 1996-07-31 -S000001574 ORF Verified YKL091C phosphatidylinositol/phosphatidylcholine-binding protein|SFH1 chromosome 11 11 270650 269718 C 2011-02-03 1996-07-31 Putative phosphatidylinositol/phosphatidylcholine transfer protein; possibly involved in lipid metabolism; localizes to the nucleus; contains a CRAL/TRIO domain and binds several lipids in a large-scale study; YKL091C has a paralog, SEC14, that arose from the whole genome duplication -S000036936 CDS YKL091C 11 270650 269718 C 2011-02-03 1996-07-31 -S000001573 ORF Verified YKL090W CUE2 chromosome 11 11 271878 273209 W 2011-02-03 1996-07-31 Protein of unknown function; has two CUE domains that bind ubiquitin, which may facilitate intramolecular monoubiquitination -S000036908 CDS YKL090W 11 271878 273209 W 2011-02-03 1996-07-31 -S000001572 ORF Verified YKL089W MIF2 chromosome 11 L000001109 11 273394 275043 W -43 2011-02-03 1996-07-31 Protein required for structural integrity of elongating spindles; localizes to the kinetochore; interacts with histones H2A, H2B, and H4; phosphorylated by Ipl1p; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-C and fission yeast cnp3 -S000036033 CDS YKL089W 11 273394 275043 W 2011-02-03 1996-07-31 -S000001571 ORF Verified YKL088W CAB3 phosphopantothenoylcysteine decarboxylase complex subunit CAB3 chromosome 11 11 275283 276998 W 2011-02-03 1996-07-31 Subunit of PPCDC and CoA-SPC complexes involved in CoA biosynthesis; subunits of the phosphopantothenoylcysteine decarboxylase (PPCDC) complex are: Cab3p, Sis2p, Vhs3p, while the subunits of the CoA-synthesizing protein complex (CoA-SPC) are: Cab2p, Cab3p, Cab4p, and Cab5p as well as Sis2p and Vhs3p; null mutant lethality is complemented by E. coli coaBC -S000035891 CDS YKL088W 11 275283 276998 W 2011-02-03 1996-07-31 -S000001570 ORF Verified YKL087C CYT2 cytochrome c1 heme lyase CYT2|CC1HL chromosome 11 L000000473 11 277863 277189 C 2011-02-03 1996-07-31 Cytochrome c1 heme lyase; involved in maturation of cytochrome c1, which is a subunit of the mitochondrial ubiquinol-cytochrome-c reductase; links heme covalently to apocytochrome c1; human homolog HCCS can complement yeast cyt2 null mutant -S000034890 CDS YKL087C 11 277863 277189 C 2011-02-03 1996-07-31 -S000001569 ORF Verified YKL086W SRX1 sulfiredoxin chromosome 11 11 278281 278664 W 2011-02-03 1996-07-31 Sulfiredoxin; contributes to oxidative stress resistance by reducing cysteine-sulfinic acid groups in the peroxiredoxin Tsa1p, which is formed upon exposure to oxidants; conserved in higher eukaryotes; protein abundance increases in response to DNA replication stress -S000034838 CDS YKL086W 11 278281 278664 W 2011-02-03 1996-07-31 -S000001568 ORF Verified YKL085W MDH1 malate dehydrogenase MDH1 chromosome 11 L000001045 11 279123 280127 W 2011-02-03 1996-07-31 Mitochondrial malate dehydrogenase; catalyzes interconversion of malate and oxaloacetate; involved in the tricarboxylic acid (TCA) cycle; phosphorylated -S000034670 CDS YKL085W 11 279123 280127 W 2011-02-03 1996-07-31 -S000001567 ORF Verified YKL084W HOT13 chromosome 11 11 280509 280859 W 2011-02-03 1996-07-31 Zinc-binding mitochondrial intermembrane space (IMS) protein; involved in a disulfide relay system for IMS import of cysteine-containing proteins; binds Mia40p and stimulates its Erv1p-dependent oxidation, probably by sequestering zinc -S000033808 CDS YKL084W 11 280509 280859 W 2011-02-03 1996-07-31 -S000001566 ORF Dubious YKL083W chromosome 11 11 280921 281535 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified essential gene RRP14 -S000033660 CDS YKL083W 11 280921 281535 W 2011-02-03 1996-07-31 -S000001565 ORF Verified YKL082C RRP14 ribosome biosynthesis protein RRP14 chromosome 11 11 282329 281025 C 2011-02-03 1996-07-31 Essential protein, constituent of 66S pre-ribosomal particles; interacts with proteins involved in ribosomal biogenesis and cell polarity; member of the SURF-6 family -S000033529 CDS YKL082C 11 282329 281025 C 2011-02-03 1996-07-31 -S000001564 ORF Verified YKL081W TEF4 translation elongation factor EF1B gamma|EFC1 chromosome 11 L000002280 11 282891 284455 W 2011-02-03 1996-07-31 Gamma subunit of translational elongation factor eEF1B; stimulates the binding of aminoacyl-tRNA (AA-tRNA) to ribosomes by releasing eEF1A (Tef1p/Tef2p) from the ribosomal complex -S000033487 CDS YKL081W 11 282891 283095 W 2011-02-03 1996-07-31 -S000033488 CDS YKL081W 11 283422 284455 W 2011-02-03 1996-07-31 -S000033489 intron YKL081W 11 283096 283421 W 2011-02-03 1996-07-31 -S000007301 snoRNA_gene snR38 SNR38 chromosome 11 L000003053 11 283185 283279 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G2815 -S000036768 noncoding_exon snR38 11 283185 283279 W 2011-02-03 2000-05-19 -S000001563 ORF Verified YKL080W VMA5 H(+)-transporting V1 sector ATPase subunit C|VAT3|CSL5 chromosome 11 L000002460 11 285030 286208 W 2011-02-03 1996-07-31 Subunit C of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; required for the V1 domain to assemble onto the vacuolar membrane; the V1 peripheral membrane domain of vacuolar H+-ATPase (V-ATPase) has eight subunits -S000032748 CDS YKL080W 11 285030 286208 W 2011-02-03 1996-07-31 -S000001562 ORF Verified YKL079W SMY1 chromosome 11 L000001940 11 286603 288573 W 2011-02-03 1996-07-31 Kinesin-like myosin passenger-protein; interacts with Myo2p and enhances its interaction with Sec4p during transport of secretory vesicles; controls actin cable structure and dynamics -S000031903 CDS YKL079W 11 286603 288573 W 2011-02-03 1996-07-31 -S000001561 ORF Verified YKL078W DHR2 RNA helicase chromosome 11 11 288845 291052 W 2011-02-03 1996-07-31 Predominantly nucleolar DEAH-box ATP-dependent RNA helicase; required for 18S rRNA synthesis -S000031760 CDS YKL078W 11 288845 291052 W 2011-02-03 1996-07-31 -S000001560 ORF Uncharacterized YKL077W chromosome 11 11 291453 292631 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole -S000031669 CDS YKL077W 11 291453 292631 W 2011-02-03 1996-07-31 -S000001559 ORF Dubious YKL076C PSY1 chromosome 11 11 293221 292838 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 69% of ORF overlaps the uncharacterized ORF YKL075C -S000031531 CDS YKL076C 11 293221 292838 C 2011-02-03 1996-07-31 -S000001558 ORF Uncharacterized YKL075C chromosome 11 11 294308 292956 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; proposed to be involved in resistance to streptozotocin and camptothecin -S000030667 CDS YKL075C 11 294308 292956 C 2011-02-03 1996-07-31 -S000001557 ORF Verified YKL074C MUD2 chromosome 11 L000002794 11 296193 294610 C 2011-02-03 1996-07-31 Protein involved in early pre-mRNA splicing; component of the pre-mRNA-U1 snRNP complex, the commitment complex; interacts with Msl5p/BBP splicing factor and Sub2p; similar to metazoan splicing factor U2AF65 -S000030581 CDS YKL074C 11 296193 294610 C 2011-02-03 1996-07-31 -S000001556 ORF Verified YKL073W LHS1 Hsp70 family chaperone LHS1|SSI1|CER1 chromosome 11 L000004102 11 296430 299075 W 2011-02-03 1996-07-31 Molecular chaperone of the endoplasmic reticulum lumen; involved in polypeptide translocation and folding; nucleotide exchange factor for the ER lumenal Hsp70 chaperone Kar2p; regulated by the unfolded protein response pathway -S000030511 CDS YKL073W 11 296430 299075 W 2011-02-03 1996-07-31 -S000001555 ORF Verified YKL072W STB6 chromosome 11 L000003369 11 299582 301882 W 2011-02-03 1996-07-31 Protein that binds Sin3p in a two-hybrid assay; STB6 has a paralog, STB2, that arose from the whole genome duplication -S000030364 CDS YKL072W 11 299582 301882 W 2011-02-03 1996-07-31 -S000007052 long_terminal_repeat YKLCdelta5 chromosome 11 11 302625 302334 C 2011-02-03 2000-05-19 Ty1 LTR -S000006774 tRNA_gene tW(CCA)K chromosome 11 L000003633 11 302918 303023 W 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis -S000033327 intron tW(CCA)K 11 302954 302987 W 2011-02-03 2000-05-19 -S000033325 noncoding_exon tW(CCA)K 11 302918 302953 W 2011-02-03 2000-05-19 -S000033326 noncoding_exon tW(CCA)K 11 302988 303023 W 2011-02-03 2000-05-19 -S000001554 ORF Uncharacterized YKL071W chromosome 11 11 305114 305884 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression induced in cells treated with the mycotoxin patulin, and also the quinone methide triterpene celastrol; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000037597 CDS YKL071W 11 305114 305884 W 2011-02-03 1996-07-31 -S000001553 ORF Uncharacterized YKL070W chromosome 11 11 306211 306720 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression induced in cells treated with mycotoxins patulin or citrinin; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000037452 CDS YKL070W 11 306211 306720 W 2011-02-03 1996-07-31 -S000001552 ORF Verified YKL069W L-methionine (R)-S-oxide reductase|fRMsr|YKG9 chromosome 11 11 307285 307827 W 2011-02-03 1996-07-31 Methionine-R-sulfoxide reductase; reduces the R enantiomer of free Met-SO, in contrast to Ycl033Cp which reduces Met-R-SO in a peptide linkage; has a role in protection against oxidative stress; relative distribution to the nucleus increases upon DNA replication stress -S000036847 CDS YKL069W 11 307285 307827 W 2011-02-03 1996-07-31 -S000006760 tRNA_gene tV(AAC)K1 chromosome 11 L000003641 11 308217 308144 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000037869 noncoding_exon tV(AAC)K1 11 308217 308144 C 2011-02-03 2000-05-19 -S000028524 ORF Uncharacterized YKL068W-A chromosome 11 11 309206 309442 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by homology to Ashbya gossypii -S000030323 CDS YKL068W-A 11 309206 309442 W 2011-02-03 2003-07-29 -S000001551 ORF Verified YKL068W NUP100 FG-nucleoporin NUP100|[NUP100+]|NSP100 chromosome 11 L000001292 11 310199 313078 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier and is involved in gene tethering at the nuclear periphery; NUP100 has a paralog, NUP116, that arose from the whole genome duplication -S000036782 CDS YKL068W 11 310199 313078 W 2011-02-03 1996-07-31 -S000006598 tRNA_gene tH(GUG)K chromosome 11 L000003640 11 313472 313401 C 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000033889 noncoding_exon tH(GUG)K 11 313472 313401 C 2011-02-03 2000-05-19 -S000007053 long_terminal_repeat YKLCdelta6 chromosome 11 11 313919 313602 C 2011-02-03 2000-05-19 Ty1 LTR -S000007057 long_terminal_repeat YKLWdelta7 chromosome 11 11 314193 314524 W 2011-02-03 2000-05-19 Ty1 LTR -S000001550 ORF Verified YKL067W YNK1 nucleoside diphosphate kinase|NDK1 chromosome 11 L000002536 11 314812 315273 W 2011-02-03 1996-07-31 Nucleoside diphosphate kinase; catalyzes the transfer of gamma phosphates from nucleoside triphosphates, usually ATP, to nucleoside diphosphates by a mechanism that involves formation of an autophosphorylated enzyme intermediate; protein abundance increases in response to DNA replication stress -S000036722 CDS YKL067W 11 314812 315273 W 2011-02-03 1996-07-31 -S000001549 ORF Dubious YKL066W chromosome 11 11 315281 315724 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified gene YNK1 -S000036665 CDS YKL066W 11 315281 315724 W 2011-02-03 1996-07-31 -S000113563 ORF Uncharacterized YKL065W-A chromosome 11 11 315954 316175 W 2011-02-03 2005-11-17 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum (ER) while mCherry fusion localizes to both the ER and vacuole -S000113565 CDS YKL065W-A 11 315954 316175 W 2011-02-03 2005-11-17 -S000001548 ORF Verified YKL065C YET1 chromosome 11 L000003484 11 317057 316437 C 2011-02-03 1996-07-31|2011-02-03 Endoplasmic reticulum transmembrane protein; may interact with ribosomes, based on co-purification experiments; homolog of human BAP31 protein; YET1 has a paralog, YET2, that arose from the whole genome duplication -S000035692 CDS YKL065C 11 317057 316437 C 2011-02-03 1996-07-31|2011-02-03 -S000001547 ORF Verified YKL064W MNR2 putative Mg(2+) transporter MNR2 chromosome 11 L000003203 11 317764 320673 W 2011-02-03 1996-07-31 Vacuolar membrane protein required for magnesium homeostasis; putative magnesium transporter; has similarity to Alr1p and Alr2p, which mediate influx of Mg2+ and other divalent cations; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs) -S000035630 CDS YKL064W 11 317764 320673 W 2011-02-03 1996-07-31 -S000001546 ORF Uncharacterized YKL063C chromosome 11 11 321518 321015 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the Golgi -S000035510 CDS YKL063C 11 321518 321015 C 2011-02-03 1996-07-31 -S000001545 ORF Verified YKL062W MSN4 stress-responsive transcriptional activator MSN4 chromosome 11 L000001199 11 323228 325120 W 2011-02-03 1996-07-31 Stress-responsive transcriptional activator; activated in stochastic pulses of nuclear localization in response to various stress conditions; binds DNA at stress response elements of responsive genes, inducing gene expression; involved in diauxic shift -S000034556 CDS YKL062W 11 323228 325120 W 2011-02-03 1996-07-31 -S000001544 ORF Verified YKL061W BLI1 chromosome 11 11 325771 326112 W 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Msb3p; green fluorescent protein (GFP)-fusion protein localizes to the endosome -S000034423 CDS YKL061W 11 325771 326112 W 2011-02-03 1996-07-31 -S000001543 ORF Verified YKL060C FBA1 fructose-bisphosphate aldolase FBA1|LOT1 chromosome 11 L000000604 11 327487 326408 C 2011-02-03 1996-07-31 Fructose 1,6-bisphosphate aldolase; required for glycolysis and gluconeogenesis; catalyzes conversion of fructose 1,6 bisphosphate to glyceraldehyde-3-P and dihydroxyacetone-P; locates to mitochondrial outer surface upon oxidative stress; N-terminally propionylated in vivo -S000034296 CDS YKL060C 11 327487 326408 C 2011-02-03 1996-07-31 -S000001542 ORF Verified YKL059C MPE1 cleavage polyadenylation factor subunit MPE1 chromosome 11 11 329443 328118 C 2011-02-03 1996-07-31 Essential conserved subunit of CPF cleavage and polyadenylation factor; plays a role in 3' end formation of mRNA via the specific cleavage and polyadenylation of pre-mRNA; contains a ubiquitin-like (UBL) domain, a RNA-binding zinc knuckle motif and a RING finger domain; both the zinc knuckle and RING finger are required for pre-mRNA binding; possible role in ubiquitination of Pap1p; relocalizes to the cytosol in response to hypoxia -S000033369 CDS YKL059C 11 329443 328118 C 2011-02-03 1996-07-31 -S000118403 ARS ARS1109 ARSXI-329 chromosome 11 11 329682 329930 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000001541 ORF Verified YKL058W TOA2 transcription initiation factor IIA subunit gamma chromosome 11 L000002317 11 330166 330534 W 2011-02-03 1996-07-31 TFIIA small subunit; involved in transcriptional activation, acts as antirepressor or as coactivator; required, along with Toa1p, for ribosomal protein gene transcription in vivo; homologous to smallest subunit of human and Drosophila TFIIA; protein abundance increases in response to DNA replication stress -S000033347 CDS YKL058W 11 330166 330534 W 2011-02-03 1996-07-31 -S000001540 ORF Verified YKL057C NUP120 RAT2 chromosome 11 L000003138 11 333969 330856 C 2011-02-03 1996-07-31 Subunit of the Nup84p subcomplex of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport and NPC biogenesis and is involved in establishment of a normal nucleocytoplasmic concentration gradient of the GTPase Gsp1p; also plays roles in several processes that may require localization of genes or chromosomes at the nuclear periphery, including double-strand break repair, transcription and chromatin silencing; homologous to human NUP160 -S000032581 CDS YKL057C 11 333969 330856 C 2011-02-03 1996-07-31 -S000001539 ORF Verified YKL056C TMA19 MMI1|RBF18 chromosome 11 11 334915 334412 C 2011-02-03 1996-07-31 Protein that associates with ribosomes; homolog of translationally controlled tumor protein; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and relocates to the mitochondrial outer surface upon oxidative stress -S000032498 CDS YKL056C 11 334915 334412 C 2011-02-03 1996-07-31 -S000001538 ORF Verified YKL055C OAR1 3-oxoacyl-[acyl-carrier-protein] reductase (NADPH) chromosome 11 11 336157 335321 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial 3-oxoacyl-[acyl-carrier-protein] reductase; may comprise a type II mitochondrial fatty acid synthase along with Mct1p; human homolog CBR4 complements yeast null mutant -S000032402 CDS YKL055C 11 336157 335321 C 2011-02-03 1996-07-31|2011-02-03 -S000001537 ORF Verified YKL054C DEF1 DNA damage-responsive RNA polymerase-degradation factor DEF1|VID31 chromosome 11 11 338753 336537 C 2011-02-03 1996-07-31 RNAPII degradation factor; forms a complex with Rad26p in chromatin, enables ubiquitination and proteolysis of RNAPII present in an elongation complex; mutant is deficient in Zip1p loading onto chromosomes during meiosis -S000031390 CDS YKL054C 11 338753 336537 C 2011-02-03 1996-07-31 -S000007243 ORF Verified YKL053C-A MDM35 chromosome 11 11 339442 339182 C 2011-02-03 1999-07-17 Mitochondrial intermembrane space protein; forms complex with Ups2p that transfers phosphatidylserine from outer membrane to inner membrane for phosphatidylethanolamine synthesis; mutation affects mitochondrial distribution and morphology; contains twin cysteine-x9-cysteine motifs; protein abundance increases in response to DNA replication stress -S000032996 CDS YKL053C-A 11 339442 339182 C 2011-02-03 1999-07-17 -S000001536 ORF Dubious YKL053W chromosome 11 11 339572 339946 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF ASK1 -S000031321 CDS YKL053W 11 339572 339946 W 2011-02-03 1996-07-31 -S000001535 ORF Verified YKL052C ASK1 chromosome 11 11 340546 339668 C 2011-02-03 1996-07-31|2008-06-03 Essential subunit of the Dam1 complex (aka DASH complex); couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; phosphorylated during the cell cycle by cyclin-dependent kinases; sumoylated in an Mms21p-dependent manner; protein abundance increases in response to DNA replication stress -S000031156 CDS YKL052C 11 340546 339668 C 2011-02-03 1996-07-31|2008-06-03 -S000001534 ORF Verified YKL051W SFK1 chromosome 11 11 341312 342373 W 2011-02-03 1996-07-31 Plasma membrane protein that may act to generate normal levels of PI4P; may act together with or upstream of Stt4p; at least partially mediates proper localization of Stt4p to the plasma membrane -S000031104 CDS YKL051W 11 341312 342373 W 2011-02-03 1996-07-31 -S000001533 ORF Verified YKL050C chromosome 11 11 345620 342852 C 2011-02-03 1996-07-31 Protein of unknown function; the YKL050W protein is a target of the SCFCdc4 ubiquitin ligase complex and YKL050W transcription is regulated by Azf1p; YKL050C has a paralog, EIS1, that arose from the whole genome duplication -S000030029 CDS YKL050C 11 345620 342852 C 2011-02-03 1996-07-31 -S000001532 ORF Verified YKL049C CSE4 centromeric DNA-binding histone H3-like protein CSE4|CSL2 chromosome 11 L000002719 11 346764 346075 C 2011-02-03 2003-01-10|1996-07-31|2003-01-08 Histone H3-like centromere protein; associated with promoters, accessible chromatin, RNAPII-bound regions; phosphorylated Cse4p associates with centromeres; required for proper kinetochore function; levels regulated by E3 ubiquitin ligase Psh1p; phosphorylation may destabilize defective kinetochores to promote bi-orientation; ubiquitination of N-terminus regulates proteolysis for faithful chromosome segregation; yeast CSE4 can complement mutations in human homolog CENPA -S000037076 CDS YKL049C 11 346764 346075 C 2011-02-03 2003-01-10|1996-07-31|2003-01-08 -S000001531 ORF Verified YKL048C ELM1 serine/threonine protein kinase ELM1|LDB9 chromosome 11 L000000548 11 349136 347214 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; regulates the orientation checkpoint, the morphogenesis checkpoint and the metabolic switch from fermentative to oxidative metabolism by phosphorylating the activation loop of Kin4p, Hsl1p and Snf4p respectively; cooperates with Hsl7p in recruiting Hsl1p to the septin ring, a prerequisite for subsequent recruitment, phosphorylation, and degradation of Swe1p; forms part of the bud neck ring; regulates cytokinesis -S000036436 CDS YKL048C 11 349136 347214 C 2011-02-03 1996-07-31 -S000001530 ORF Verified YKL047W ANR2 chromosome 11 S000114863 11 349463 351013 W 2011-02-03 1996-07-31 Protein of unknown function; may have a role in lipid metabolism, based on localization to lipid droplets; predicted to be palmitoylated -S000036411 CDS YKL047W 11 349463 351013 W 2011-02-03 1996-07-31 -S000001529 ORF Verified YKL046C DCW1 putative mannan endo-1,6-alpha-mannosidase chromosome 11 11 352624 351275 C 2011-02-03 1996-07-31 Putative mannosidase; GPI-anchored membrane protein required for cell wall biosynthesis in bud formation;homologous to Dfg5p -S000036235 CDS YKL046C 11 352624 351275 C 2011-02-03 1996-07-31 -S000001528 ORF Verified YKL045W PRI2 DNA primase subunit PRI2 chromosome 11 L000001490 11 353493 355079 W 2011-02-03 1996-07-31 Subunit of DNA primase; DNA primase is required for DNA synthesis and double-strand break repair -S000036183 CDS YKL045W 11 353493 355079 W 2011-02-03 1996-07-31 -S000001527 ORF Verified YKL044W MMO1 chromosome 11 11 356322 356642 W 2011-02-03 1996-07-31 Protein of unknown function; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the mitochondria; mRNA identified as translated by ribosome profiling data; MMO1 is a non-essential gene -S000035237 CDS YKL044W 11 356322 356642 W 2011-02-03 1996-07-31 -S000001526 ORF Verified YKL043W PHD1 chromosome 11 L000001417 11 356748 357848 W 2011-02-03 1996-07-31 Transcriptional activator that enhances pseudohyphal growth; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; regulates expression of FLO11, an adhesin required for pseudohyphal filament formation; similar to StuA, an A. nidulans developmental regulator; potential Cdc28p substrate; PHD1 has a paralog, SOK2, that arose from the whole genome duplication -S000035082 CDS YKL043W 11 356748 357848 W 2011-02-03 1996-07-31 -S000001525 ORF Verified YKL042W SPC42 chromosome 11 L000004148 11 358475 359566 W 2011-02-03 1996-07-31 Central plaque component of spindle pole body (SPB); involved in SPB duplication, may facilitate attachment of the SPB to the nuclear membrane -S000034904 CDS YKL042W 11 358475 359566 W 2011-02-03 1996-07-31 -S000001524 ORF Verified YKL041W VPS24 ESCRT-III subunit protein VPS24|VPL26|DID3 chromosome 11 L000004158 11 360143 360817 W 2011-02-03 1996-07-31 One of four subunits of the ESCRT-III complex; forms an endosomal sorting complex required for transport III (ESCRT-III) subcomplex with Did4p; involved in the sorting of transmembrane proteins into the multivesicular body (MVB) pathway -S000034024 CDS YKL041W 11 360143 360817 W 2011-02-03 1996-07-31 -S000001523 ORF Verified YKL040C NFU1 NUB1 chromosome 11 L000004771 11 361828 361058 C 2011-02-03 1996-07-31 Protein involved in Fe-S cluster transfer to mitochondrial clients; protects [4Fe-4S] clusters from damage due to oxidative stress; acts along with Bol3 at a late step in the transfer of [4Fe-4S] clusters from the ISA complex to client proteins; Fe-S loaded homodimer at steady state; similar to NifU, a bacterial protein required for Fe/S cluster maturation; ortholog of the human NFU1, mutations of which are associated with Multiple Mitochondria Dysfunctions Syndrome (MMDS1) -S000033793 CDS YKL040C 11 361828 361058 C 2011-02-03 1996-07-31 -S000001522 ORF Verified YKL039W PTM1 chromosome 11 L000001524 11 362622 364193 W 2011-02-03 1996-07-31|2005-12-15 Protein of unknown function; copurifies with late Golgi vesicles containing the v-SNARE Tlg2p; PTM1 has a paralog, YHL017W, that arose from the whole genome duplication -S000035013 CDS YKL039W 11 362622 364193 W 2011-02-03 1996-07-31|2005-12-15 -S000006460 snoRNA_gene snR69 SNR69 chromosome 11 L000004538 11 364776 364876 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2948 -S000030857 noncoding_exon snR69 11 364776 364876 W 2011-02-03 2000-05-19 -S000001521 ORF Verified YKL038W RGT1 chromosome 11 L000003482 11 365605 369117 W 2011-02-03 1996-07-31 Glucose-responsive transcription factor; regulates expression of several glucose transporter (HXT) genes in response to glucose; binds to promoters and acts both as a transcriptional activator and repressor; recruits Tup1p/Cyc8p to target gene promoters; RGT1 has a paralog, EDS1, that arose from the whole genome duplication -S000034833 CDS YKL038W 11 365605 369117 W 2011-02-03 1996-07-31 -S000001520 ORF Verified YKL037W AIM26 chromosome 11 11 369365 369721 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant is viable and displays elevated frequency of mitochondrial genome loss; null mutation confers sensitivity to tunicamycin and DTT -S000032888 CDS YKL037W 11 369365 369721 W 2011-02-03 1996-07-31 -S000001518 ORF Verified YKL035W UGP1 UTP glucose-1-phosphate uridylyltransferase chromosome 11 L000003118 11 369891 371390 W 2011-02-03 1996-07-31 UDP-glucose pyrophosphorylase (UGPase); catalyses the reversible formation of UDP-Glc from glucose 1-phosphate and UTP, involved in a wide variety of metabolic pathways, expression modulated by Pho85p through Pho4p; involved in PKA-mediated oxidative stress resistance and long-term survival in stationary phase; UGP1 has a paralog, YHL012W, that arose from the whole genome duplication -S000032697 CDS YKL035W 11 369891 371390 W 2011-02-03 1996-07-31 -S000001519 ORF Dubious YKL036C chromosome 11 11 369920 369528 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the essential gene UGP1 gene and uncharacterized ORF YKL037W -S000032729 CDS YKL036C 11 369920 369528 C 2011-02-03 1996-07-31 -S000001517 ORF Verified YKL034W TUL1 ubiquitin-protein ligase TUL1 chromosome 11 11 371829 374105 W 2011-02-03 1996-07-31 Subunit of the DSC ubiquitin ligase complex; golgi-localized RING-finger ubiquitin ligase (E3) involved in sorting polar transmembrane domain containing membrane proteins to multivesicular bodies for delivery to the vacuole; proposed involvement in the quality control of misfolded TMD containing proteins; ortholog of fission yeast dsc1 -S000032625 CDS YKL034W 11 371829 374105 W 2011-02-03 1996-07-31 -S000007242 ORF Uncharacterized YKL033W-A putative hydrolase chromosome 11 11 374505 375215 W 2011-02-03 2004-02-13|1999-07-17 Putative protein of unknown function; similar to uncharacterized proteins from other fungi -S000036238 CDS YKL033W-A 11 374505 375215 W 2011-02-03 2004-02-13|1999-07-17 -S000001516 ORF Verified YKL033W TTI1 FMP47 chromosome 11 11 375456 378572 W 2011-02-03 1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; telomere length regulator involved in the stability or biogenesis of PIKKs such as TORC1; similar to S. pombe Tti1p; detected in highly purified mitochondria in high-throughput studies -S000031614 CDS YKL033W 11 375456 378572 W 2011-02-03 1996-07-31 -S000006761 tRNA_gene tV(AAC)K2 chromosome 11 L000003634 11 379680 379753 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000037883 noncoding_exon tV(AAC)K2 11 379680 379753 W 2011-02-03 2000-05-19 -S000001515 ORF Verified YKL032C IXR1 DNA-binding transcription repressor IXR1|ORD1 chromosome 11 L000000881 11 381858 380065 C 2011-02-03 1996-07-31 Transcriptional repressor that regulates hypoxic genes during normoxia; involved in the aerobic repression of genes such as COX5b, TIR1, and HEM13; binds DNA intrastrand cross-links formed by cisplatin; HMG (high mobility group box) domain containing protein which binds and bends cisplatin-modified DNA, blocking excision repair; IXR1 has a paralog, ABF2, that arose from the whole genome duplication -S000031407 CDS YKL032C 11 381858 380065 C 2011-02-03 1996-07-31 -S000001514 ORF Dubious YKL031W chromosome 11 11 382072 382485 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species -S000031365 CDS YKL031W 11 382072 382485 W 2011-02-03 1996-07-31 -S000001513 ORF Dubious YKL030W chromosome 11 11 382498 383103 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified gene MAE1 -S000030446 CDS YKL030W 11 382498 383103 W 2011-02-03 1996-07-31 -S000001512 ORF Verified YKL029C MAE1 malate dehydrogenase (oxaloacetate-decarboxylating) chromosome 11 L000003506 11 384725 382716 C 2011-02-03 1996-07-31 Mitochondrial malic enzyme; catalyzes the oxidative decarboxylation of malate to pyruvate, which is a key intermediate in sugar metabolism and a precursor for synthesis of several amino acids -S000030570 CDS YKL029C 11 384725 382716 C 2011-02-03 1996-07-31 -S000001511 ORF Verified YKL028W TFA1 transcription factor TFIIE subunit TFA1 chromosome 11 L000002595 11 385758 387206 W 2011-02-03 1996-07-31 TFIIE large subunit; involved in recruitment of RNA polymerase II to the promoter, activation of TFIIH, and promoter opening -S000036771 CDS YKL028W 11 385758 387206 W 2011-02-03 1996-07-31 -S000001510 ORF Verified YKL027W TCD2 tRNA threonylcarbamoyladenosine dehydratase chromosome 11 11 387562 388905 W 2011-02-03 1996-07-31 tRNA threonylcarbamoyladenosine dehydratase; required for the ct6A tRNA base modification, where an adenosine at position 37 is modified to form a cyclized active ester with an oxazolone ring; localized to the mitochondrial outer membrane; TCD2 has a paralog, TCD1, that arose from the whole genome duplication -S000036685 CDS YKL027W 11 387562 388905 W 2011-02-03 1996-07-31 -S000118404 ARS ARS1112 ARSXI-389 chromosome 11 11 388970 389264 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000001509 ORF Verified YKL026C GPX1 glutathione peroxidase GPX1 chromosome 11 11 389883 389380 C 2011-02-03 1996-07-31 Phospholipid hydroperoxide glutathione peroxidase; induced by glucose starvation that protects cells from phospholipid hydroperoxides and nonphospholipid peroxides during oxidative stress; GPX1 has a paralog, HYR1, that arose from the whole genome duplication -S000036560 CDS YKL026C 11 389883 389380 C 2011-02-03 1996-07-31 -S000001508 ORF Verified YKL025C PAN3 ECM35 chromosome 11 L000003340 11 392279 390240 C 2011-02-03 1996-07-31 Essential subunit of the Pan2p-Pan3p poly(A)-ribonuclease complex; poly (A) mRNA binding subunit which recruits mRNA to the complex; the Pan2p-Pan3p complex controls poly(A) tail length and regulates the stoichiometry and activity of postreplication repair complexes -S000035620 CDS YKL025C 11 392279 390240 C 2011-02-03 1996-07-31 -S000001507 ORF Verified YKL024C URA6 bifunctional uridylate/adenylate kinase|SOC8 chromosome 11 L000002435 11 393140 392526 C 18 2011-02-03 1996-07-31 Uridylate kinase; catalyzes the seventh enzymatic step in the de novo biosynthesis of pyrimidines, converting uridine monophosphate (UMP) into uridine-5'-diphosphate (UDP) -S000035543 CDS YKL024C 11 393140 392526 C 2011-02-03 1996-07-31 -S000113559 ORF Uncharacterized YKL023C-A chromosome 11 11 393373 393146 C 2011-02-03 2005-11-17 Putative protein of unknown function -S000113560 CDS YKL023C-A 11 393373 393146 C 2011-02-03 2005-11-17 -S000001506 ORF Uncharacterized YKL023W chromosome 11 11 393721 394554 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; predicted by computational methods to be involved in mRNA degradation; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000035506 CDS YKL023W 11 393721 394554 W 2011-02-03 1996-07-31|2011-02-03 -S000001505 ORF Verified YKL022C CDC16 anaphase promoting complex subunit CDC16 chromosome 11 L000000256 11 397248 394726 C -15 2011-02-03 1996-07-31 Subunit of the anaphase-promoting complex/cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; required for sporulation; relocalizes to the cytosol in response to hypoxia -S000034410 CDS YKL022C 11 397248 394726 C 2011-02-03 1996-07-31 -S000001504 ORF Verified YKL021C MAK11 chromosome 11 L000000984 11 398750 397344 C -16 2011-02-03 1996-07-31 Protein involved in an early step of 60S ribosomal subunit biogenesis; essential for cell growth and replication of killer M1 dsRNA virus; contains four beta-transducin repeats -S000034298 CDS YKL021C 11 398750 397344 C 2011-02-03 1996-07-31 -S000001503 ORF Verified YKL020C SPT23 chromosome 11 L000002041 11 402080 398832 C 2011-02-03 1996-07-31 ER membrane protein involved in regulation of OLE1 transcription; inactive ER form dimerizes and one subunit is then activated by ubiquitin/proteasome-dependent processing followed by nuclear targeting; SPT23 has a paralog, MGA2, that arose from the whole genome duplication -S000034167 CDS YKL020C 11 402080 398832 C 2011-02-03 1996-07-31 -S000001502 ORF Verified YKL019W RAM2 bifunctional protein farnesyltransferase/protein geranylgeranyltransferase chromosome 11 L000001580 11 402568 403518 W 2011-02-03 1996-07-31 Alpha subunit of farnesyltransferase and geranylgeranyltransferase-I; farnesyltransferase (Ram2p-Ram1p heterodimer) catalyzes the addition of 15-carbon isoprenoid farnesyl to substrate proteins containing a CAAX consensus motif; type I geranylgeranyltransferase (Ram2p-Cdc43p heterodimer) catalyzes the addition of the 20-carbon isoprenoid geranylgeranyl to substrate proteins containing a CaaL consensus motif; required for membrane localization of Ras proteins and a-factor -S000034702 CDS YKL019W 11 402568 403518 W 2011-02-03 1996-07-31 -S000007615 ORF Uncharacterized YKL018C-A chromosome 11 11 403879 403580 C 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000037213 CDS YKL018C-A 11 403879 403580 C 2011-02-03 2001-02-26 -S000001501 ORF Verified YKL018W SWD2 WD-repeat containing protein SWD2|SAF37|CPS35 chromosome 11 11 404102 405091 W 2011-02-03 1996-07-31 Subunit of the COMPASS (Set1C) histone H3K4 methyltransferase complex; required for Set1C stability and optimal activity; COMPASS methylates histone H3 on lys 4 and is involved in telomeric silencing; subunit of CPF (cleavage and polyadenylation factor), a complex involved in RNAP II transcription termination -S000034635 CDS YKL018W 11 404102 405091 W 2011-02-03 1996-07-31 -S000001500 ORF Verified YKL017C HCS1 ATP-dependent 5'-3' DNA helicase HCS1|DIP1 chromosome 11 L000003087|L000004272 11 407241 405190 C 2011-02-03 1996-07-31 Hexameric DNA polymerase alpha-associated DNA helicase A; involved in lagging strand DNA synthesis; contains single-stranded DNA stimulated ATPase and dATPase activities; replication protein A stimulates helicase and ATPase activities -S000034495 CDS YKL017C 11 407241 405190 C 2011-02-03 1996-07-31 -S000001499 ORF Verified YKL016C ATP7 F1F0 ATP synthase subunit d chromosome 11 L000000146 11 407989 407465 C 2011-02-03 1996-07-31 Subunit d of the stator stalk of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis -S000032473 CDS YKL016C 11 407989 407465 C 2011-02-03 1996-07-31 -S000001498 ORF Verified YKL015W PUT3 chromosome 11 L000001537|L000001528 11 408544 411483 W -5 2011-02-03 1996-07-31 Transcriptional activator; binds specific gene recruitment sequences and is required for DNA zip code-mediated targeting of genes to nuclear periphery; regulates proline utilization genes, constitutively binds PUT1 and PUT2 promoters as a dimer, undergoes conformational change to form active state; binds other promoters only under activating conditions; differentially phosphorylated in presence of different nitrogen sources; has a Zn(2)-Cys(6) binuclear cluster domain -S000032428 CDS YKL015W 11 408544 411483 W 2011-02-03 1996-07-31 -S000001497 ORF Verified YKL014C URB1 NPA1 chromosome 11 11 416913 411619 C 2011-02-03 1996-07-31 Protein required for the normal accumulation of 25S and 5.8S rRNAs; nucleolar protein; associated with the 27SA2 pre-ribosomal particle; proposed to be involved in the biogenesis of the 60S ribosomal subunit -S000032267 CDS YKL014C 11 416913 411619 C 2011-02-03 1996-07-31 -S000118405 ARS ARS1113 ARSXI-417 chromosome 11 11 417185 417417 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000001496 ORF Verified YKL013C ARC19 chromosome 11 L000004034 11 418023 417508 C 2011-02-03 1996-07-31 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches; mutation is functionally complemented by human ARPC4 -S000031281 CDS YKL013C 11 418023 417508 C 2011-02-03 1996-07-31 -S000001495 ORF Verified YKL012W PRP40 chromosome 11 L000003078 11 418310 420061 W 2011-02-03 1996-07-31 U1 snRNP protein involved in splicing; interacts with the branchpoint-binding protein during the formation of the second commitment complex -S000031220 CDS YKL012W 11 418310 420061 W 2011-02-03 1996-07-31 -S000001494 ORF Verified YKL011C CCE1 cruciform cutting endonuclease|MGT1 chromosome 11 L000000236 11 421216 420155 C -2 2011-02-03 1996-07-31 Mitochondrial cruciform cutting endonuclease; cleaves Holliday junctions formed during recombination of mitochondrial DNA; CCE1 has a paralog, MRS1, that arose from the whole genome duplication -S000031036 CDS YKL011C 11 421216 420155 C 2011-02-03 1996-07-31 -S000001493 ORF Verified YKL010C UFD4 putative ubiquitin-protein ligase UFD4 chromosome 11 L000003509 11 425875 421424 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase (E3); interacts with Rpt4p and Rpt6p, two subunits of the 19S particle of the 26S proteasome; cytoplasmic E3 involved in the degradation of ubiquitin fusion proteins; relative distribution to the nucleus increases upon DNA replication stress -S000030049 CDS YKL010C 11 425875 421424 C 2011-02-03 1996-07-31 -S000001492 ORF Verified YKL009W MRT4 chromosome 11 L000004450 11 426242 426952 W 2011-02-03 1996-07-31 Protein involved in mRNA turnover and ribosome assembly; required at post-transcriptional step for efficient retrotransposition; localizes to the nucleolus -S000030485 CDS YKL009W 11 426242 426952 W 2011-02-03 1996-07-31 -S000001491 ORF Verified YKL008C LAC1 sphingosine N-acyltransferase LAC1|DGT1 chromosome 11 11 428551 427295 C 2011-02-03 1996-07-31 Ceramide synthase component; involved in synthesis of ceramide from C26(acyl)-coenzyme A and dihydrosphingosine or phytosphingosine, functionally equivalent to Lag1p; LAC1 has a paralog, LAG1, that arose from the whole genome duplication -S000030290 CDS YKL008C 11 428551 427295 C 2011-02-03 1996-07-31 -S000001490 ORF Verified YKL007W CAP1 chromosome 11 L000000214 11 429302 430108 W -2 2011-02-03 1996-07-31 Alpha subunit of the capping protein heterodimer (Cap1p and Cap2p); capping protein (CP) binds to the barbed ends of actin filaments preventing further polymerization; localized predominantly to cortical actin patches; protein increases in abundance and relocalizes from bud neck to plasma membrane upon DNA replication stress -S000030183 CDS YKL007W 11 429302 430108 W 2011-02-03 1996-07-31 -S000002101 ORF Verified YKL006C-A SFT1 chromosome 11 L000002949 11 430632 430198 C 2011-02-03 1996-07-31 Intra-Golgi v-SNARE; required for transport of proteins between an early and a later Golgi compartment -S000037319 CDS YKL006C-A 11 430455 430198 C 2011-02-03 1996-07-31 -S000037318 CDS YKL006C-A 11 430632 430597 C 2011-02-03 1996-07-31 -S000037320 intron YKL006C-A 11 430596 430456 C 2011-02-03 1996-07-31 -S000114301 snoRNA_gene snR87 SNR87 chromosome 11 11 431138 431030 C 2011-02-03 2006-03-02 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A436 -S000114518 noncoding_exon snR87 11 431138 431030 C 2011-02-03 2006-03-02 -S000001489 ORF Verified YKL006W RPL14A eL14|ribosomal 60S subunit protein L14A|L14e|L14A chromosome 11 L000002706 11 431906 432720 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L14A; N-terminally acetylated; homologous to mammalian ribosomal protein L14, no bacterial homolog; RPL14A has a paralog, RPL14B, that arose from the whole genome duplication -S000030075 CDS YKL006W 11 431906 432034 W 2011-02-03 1996-07-31 -S000030076 CDS YKL006W 11 432433 432720 W 2011-02-03 1996-07-31 -S000030077 intron YKL006W 11 432035 432432 W 2011-02-03 1996-07-31 -S000001488 ORF Verified YKL005C BYE1 chromosome 11 11 434877 433093 C 2011-02-03 1996-07-31 Negative regulator of transcription elongation; contains a TFIIS-like domain that associates with chromatin and a PHD domain that interacts with H3K4me3; multicopy suppressor of temperature-sensitive ess1 mutations, binds RNA polymerase II large subunit -S000036319 CDS YKL005C 11 434877 433093 C 2011-02-03 1996-07-31 -S000001487 ORF Verified YKL004W AUR1 inositol phosphorylceramide synthase chromosome 11 L000002767 11 435580 436785 W 2011-02-03 1996-07-31 Phosphatidylinositol:ceramide phosphoinositol transferase; required for sphingolipid synthesis; can mutate to confer aureobasidin A resistance; also known as IPC synthase -S000036280 CDS YKL004W 11 435580 436785 W 2011-02-03 1996-07-31 -S000001486 ORF Verified YKL003C MRP17 mitochondrial 37S ribosomal protein YmS16 chromosome 11 L000002616 11 437492 437097 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; MRP17 exhibits genetic interactions with PET122, encoding a COX3-specific translational activator -S000036065 CDS YKL003C 11 437492 437097 C 2011-02-03 1996-07-31 -S000001485 ORF Verified YKL002W DID4 ESCRT-III subunit protein DID4|VPS14|CHM2|VPS2|VPT14|VPL2|REN1|GRD7 chromosome 11 L000002955 11 437778 438544 W 2011-02-03 2000-07-22|1996-07-31 Class E Vps protein of the ESCRT-III complex; required for sorting of integral membrane proteins into lumenal vesicles of multivesicular bodies, and for delivery of newly synthesized vacuolar enzymes to the vacuole, involved in endocytosis -S000035271 CDS YKL002W 11 437778 437837 W 2011-02-03 2000-07-22|1996-07-31 -S000035272 CDS YKL002W 11 437906 438544 W 2011-02-03 2000-07-22 -S000035273 intron YKL002W 11 437838 437905 W 2011-02-03 2000-07-22 -S000001484 ORF Verified YKL001C MET14 adenylyl-sulfate kinase chromosome 11 L000001086 11 439385 438777 C .8 2011-02-03 1996-07-31 Adenylylsulfate kinase; required for sulfate assimilation and involved in methionine metabolism; human homolog PAPSS2 complements yeast null mutant -S000034979 CDS YKL001C 11 439385 438777 C 2011-02-03 1996-07-31 -S000006472 centromere CEN11 CEN11 chromosome 11 L000000304 11 440246 440129 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XI centromere -S000077299 centromere_DNA_Element_I CEN11 11 440246 440237 C 2011-02-03 2004-10-08 -S000077300 centromere_DNA_Element_II CEN11 11 440236 440154 C 2011-02-03 2004-10-08 -S000077301 centromere_DNA_Element_III CEN11 11 440153 440129 C 2011-02-03 2004-10-08 -S000001709 ORF Verified YKR001C VPS1 dynamin-like GTPase VPS1|VPT26|VPL1|SPO15|LAM1|GRD1 chromosome 11 L000002006 11 442722 440608 C -1 2011-02-03 1996-07-31 Dynamin-like GTPase required for vacuolar sorting; also involved in actin cytoskeleton organization, endocytosis, late Golgi-retention of some proteins, regulation of peroxisome biogenesis -S000030382 CDS YKR001C 11 442722 440608 C 2011-02-03 1996-07-31 -S000001710 ORF Verified YKR002W PAP1 polynucleotide adenylyltransferase PAP1 chromosome 11 L000001336 11 443232 444938 W -1 2011-02-03 1996-07-31 Poly(A) polymerase; one of three factors required for mRNA 3'-end polyadenylation, forms multiprotein complex with polyadenylation factor I (PF I), also required for mRNA nuclear export; may also polyadenylate rRNAs; required for gene looping -S000033778 CDS YKR002W 11 443232 444938 W 2011-02-03 1996-07-31 -S000001711 ORF Verified YKR003W OSH6 oxysterol-binding protein OSH6 chromosome 11 11 445381 446727 W 2011-02-03 1996-07-31 Member of an oxysterol-binding protein family; family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; GFP-fusion protein localizes to the cell periphery; overexpression extends lifespan by promoting vacuolar fusion; OSH6 has a paralog, OSH7, that arose from the whole genome duplication -S000033901 CDS YKR003W 11 445381 446727 W 2011-02-03 1996-07-31 -S000118406 ARS ARS1114 ARSXI-448 chromosome 11 11 448020 448254 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000001712 ORF Verified YKR004C ECM9 YKR004C-A chromosome 11 L000003884 11 448036 446799 C 2011-02-03 2003-09-27|1996-07-31 Non-essential protein of unknown function -S000033974 CDS YKR004C 11 447706 446799 C 2011-02-03 2003-09-27 -S000033973 CDS YKR004C 11 448036 447811 C 2011-02-03 2003-09-27|1996-07-31 -S000033975 intron YKR004C 11 447810 447707 C 2011-02-03 2003-09-27 -S000001713 ORF Uncharacterized YKR005C chromosome 11 11 450167 448521 C 2011-02-03 1996-07-31|2007-09-05 Putative protein of unknown function -S000123939 CDS YKR005C 11 449951 448521 C 2011-02-03 2007-09-05 -S000034843 CDS YKR005C 11 450167 450021 C 2011-02-03 1996-07-31|2007-09-05 -S000123938 intron YKR005C 11 450020 449952 C 2011-02-03 2007-09-05 -S000001714 ORF Verified YKR006C MRPL13 mitochondrial 54S ribosomal protein YmL13|YmL13|YK105 chromosome 11 L000001164|L000002526 11 451217 450423 C 2011-02-03 2003-09-22|1996-07-31 Mitochondrial ribosomal protein of the large subunit; not essential for mitochondrial translation -S000034952 CDS YKR006C 11 451217 450423 C 2011-02-03 2003-09-22|1996-07-31 -S000001715 ORF Verified YKR007W MEH1 GSE2|EGO1 chromosome 11 11 451434 451988 W 2011-02-03 1996-07-31 Component of the EGO and GSE complexes; EGO is involved in the regulation of microautophagy and GSE is required for proper sorting of amino acid permease Gap1p; loss results in a defect in vacuolar acidification -S000035149 CDS YKR007W 11 451434 451988 W 2011-02-03 1996-07-31 -S000001716 ORF Verified YKR008W RSC4 chromosome 11 L000004026 11 452201 454078 W 2011-02-03 1996-07-31|2011-02-03 Component of the RSC chromatin remodeling complex; found in close proximity to nucleosomal DNA; displaced from the surface of nucleosomal DNA after chromatin remodeling; acetylated (K25) by Gcn5p, altering replication stress tolerance; contains tandem bromodomains that recognize histone H3 acetylated on K14 (H3K14ac) by Gcn5p -S000036038 CDS YKR008W 11 452201 454078 W 2011-02-03 1996-07-31|2011-02-03 -S000001717 ORF Verified YKR009C FOX2 bifunctional hydroxyacyl-CoA dehydrogenase/enoyl-CoA hydratase FOX2|POX2 chromosome 11 L000000622 11 457054 454352 C 2011-02-03 1996-07-31 3-hydroxyacyl-CoA dehydrogenase and enoyl-CoA hydratase; multifunctional enzyme of the peroxisomal fatty acid beta-oxidation pathway; mutation is functionally complemented by human HSD17B4 -S000036079 CDS YKR009C 11 457054 454352 C 2011-02-03 1996-07-31 -S000007058 long_terminal_repeat YKRCdelta8 chromosome 11 11 458471 458140 C 2011-02-03 2000-05-19 Ty1 LTR -S000006642 tRNA_gene tL(CAA)K chromosome 11 L000003635 11 458557 458670 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000033792 intron tL(CAA)K 11 458595 458626 W 2011-02-03 2000-05-19 -S000033790 noncoding_exon tL(CAA)K 11 458557 458594 W 2011-02-03 2000-05-19 -S000033791 noncoding_exon tL(CAA)K 11 458627 458670 W 2011-02-03 2000-05-19 -S000001718 ORF Verified YKR010C TOF2 chromosome 11 L000004245 11 461239 458924 C 2011-02-03 1996-07-31 Protein required for rDNA silencing and mitotic rDNA condensation; stimulates Cdc14p phosphatase activity and biphasic release to promote rDNA repeat segregation; required for condensin recruitment to the replication fork barrier site; TOF2 has a paralog, NET1, that arose from the whole genome duplication -S000034767 CDS YKR010C 11 461239 458924 C 2011-02-03 1996-07-31 -S000001719 ORF Verified YKR011C TOS5 chromosome 11 11 462696 461635 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; protein abundance increases in response to DNA replication stress -S000035735 CDS YKR011C 11 462696 461635 C 2011-02-03 1996-07-31 -S000130139 ARS ARS1115 ARSXI-463 chromosome 11 11 462699 463742 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001721 ORF Verified YKR013W PRY2 sterol-binding protein|YFW12 chromosome 11 L000003217 11 463959 464948 W 2011-02-03 1996-07-31 Sterol binding protein involved in the export of acetylated sterols; secreted glycoprotein and member of the CAP protein superfamily (cysteine-rich secretory proteins (CRISP), antigen 5, and pathogenesis related 1 proteins); sterol export function is redundant with that of PRY1; may be involved in detoxification of hydrophobic compounds; PRY2 has a paralog, PRY1, that arose from the whole genome duplication -S000037809 CDS YKR013W 11 463959 464948 W 2011-02-03 1996-07-31 -S000001720 ORF Dubious YKR012C chromosome 11 11 464116 463739 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene PRY2 -S000035867 CDS YKR012C 11 464116 463739 C 2011-02-03 1996-07-31|2011-02-03 -S000001722 ORF Verified YKR014C YPT52 Rab family GTPase YPT52 chromosome 11 L000002546 11 466071 465367 C 2011-02-03 1996-07-31 Endosomal Rab family GTPase; required for vacuolar protein sorting, endocytosis and multivesicular body (MVB) biogenesis and sorting; required for localization of the CORVET complex to endosomes; involved in autophagy and ionic stress tolerance; similar to Vps21p and Ypt53p; mammalian Rab5 homolog; protein abundance increases in response to DNA replication stress -S000037843 CDS YKR014C 11 466071 465367 C 2011-02-03 1996-07-31 -S000001723 ORF Uncharacterized YKR015C chromosome 11 11 468667 466961 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000029849 CDS YKR015C 11 468667 466961 C 2011-02-03 1996-07-31 -S000001724 ORF Verified YKR016W MIC60 FCJ1|AIM28|FMP13 chromosome 11 11 469717 471339 W 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; Mic60p is also involved in import of intermembrane space (IMS) proteins, probably by positioning Mia40p relative to the TOM complex to receive incoming proteins; ortholog of mammalian mitofilin -S000030918 CDS YKR016W 11 469717 471339 W 2011-02-03 1996-07-31 -S000001725 ORF Verified YKR017C HEL1 E3 ubiquitin-protein ligase HEL1 chromosome 11 11 473349 471694 C 2011-02-03 1996-07-31 RING finger ubiquitin ligase (E3); involved in ubiquitination and degradation of excess histones; interacts with Ubc4p and Rad53p; null mutant sensitive to hydroxyurea (HU) -S000030959 CDS YKR017C 11 473349 471694 C 2011-02-03 1996-07-31 -S000001726 ORF Verified YKR018C chromosome 11 11 475900 473723 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; protein abundance increases in response to DNA replication stress; YKR018C has a paralog, IML2, that arose from the whole genome duplication -S000031035 CDS YKR018C 11 475900 473723 C 2011-02-03 1996-07-31 -S000001727 ORF Verified YKR019C IRS4 chromosome 11 L000004394 11 478063 476216 C 2011-02-03 1996-07-31 EH domain-containing protein; involved in regulating phosphatidylinositol 4,5-bisphosphate levels and autophagy; Irs4p and Tax4p bind and activate the PtdIns phosphatase Inp51p; Irs4p and Tax4p are involved in localizing Atg17p to the PAS; IRS4 has a paralog, TAX4, that arose from the whole genome duplication -S000031136 CDS YKR019C 11 478063 476216 C 2011-02-03 1996-07-31 -S000001728 ORF Verified YKR020W VPS51 VPS67|API3|WHI6 chromosome 11 11 478338 478832 W 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; links the (VFT/GARP) complex to the SNARE Tlg1p; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p -S000030781 CDS YKR020W 11 478338 478832 W 2011-02-03 1996-07-31 -S000001729 ORF Verified YKR021W ALY1 ART6 chromosome 11 11 479234 481981 W 2011-02-03 1996-07-31|2011-02-03 Alpha arrestin, substrate of calcineurin; controls nutrient-mediated intracellular sorting of permease Gap1p; interacts with AP-1 subunit Apl4p; dephosphorylation of Aly1p required for the endocytosis of Dip5p; may regulate endocytosis of plasma membrane proteins by recruiting ubiquitin ligase Rsp5p to plasma membrane targets; ALY1 has a paralog, ALY2, that arose from the whole genome duplication -S000030869 CDS YKR021W 11 479234 481981 W 2011-02-03 1996-07-31|2011-02-03 -S000001730 ORF Verified YKR022C NTR2 chromosome 11 11 483139 482171 C 2011-02-03 1996-07-31 Essential protein that forms a dimer with Ntr1p; also forms a trimer, with Ntr2p and the DExD/H-box RNA helicase Prp43p, that is involved in spliceosome disassembly -S000031793 CDS YKR022C 11 483139 482171 C 2011-02-03 1996-07-31 -S000001731 ORF Uncharacterized YKR023W chromosome 11 11 483419 485011 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032021 CDS YKR023W 11 483419 485011 W 2011-02-03 1996-07-31 -S000001732 ORF Verified YKR024C DBP7 putative ATP-dependent RNA helicase chromosome 11 L000004205 11 487372 485144 C 2011-02-03 1996-07-31 Putative ATP-dependent RNA helicase of the DEAD-box family; involved in ribosomal biogenesis; required at post-transcriptional step for efficient retrotransposition; essential for growth under anaerobic conditions -S000032100 CDS YKR024C 11 487372 485144 C 2011-02-03 1996-07-31 -S000001733 ORF Verified YKR025W RPC37 DNA-directed RNA polymerase III subunit C37|C37 chromosome 11 11 487770 488618 W 2011-02-03 1996-07-31 RNA polymerase III subunit C37 -S000034103 CDS YKR025W 11 487770 488618 W 2011-02-03 1996-07-31 -S000001734 ORF Verified YKR026C GCN3 translation initiation factor eIF2B subunit alpha|AAS2 chromosome 11 L000000682 11 489655 488738 C 7 2011-02-03 1996-07-31 Alpha subunit of translation initiation factor eIF2B; guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; positive regulator of GCN4 expression; assembles into filaments with Gcd2p, Gcd6p, Gcd7p, and Sui2p as cells approach stationary phase and under cytosolic acidification and starvation conditions; human homolog EIF2B1 can complement yeast null mutant -S000034170 CDS YKR026C 11 489655 488738 C 2011-02-03 1996-07-31 -S000007059 long_terminal_repeat YKRCdelta9 chromosome 11 11 490416 490286 C 2011-02-03 2000-05-19 Ty1 LTR -S000007062 long_terminal_repeat YKRWdelta10 chromosome 11 11 490464 490787 W 2011-02-03 2000-05-19 Ty1 LTR -S000006703 tRNA_gene tR(ACG)K chromosome 11 L000003636 11 490968 491040 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030411 noncoding_exon tR(ACG)K 11 490968 491040 W 2011-02-03 2000-05-19 -S000001735 ORF Verified YKR027W BCH2 FMP50 chromosome 11 11 491364 493661 W 2011-02-03 1996-07-31 Member of the ChAPs (Chs5p-Arf1p-binding proteins) family; part of the exomer complex with Chs5p to mediate export of specific cargo proteins, including Chs3p, from the Golgi to the plasma membrane; BCH2 has a paralog, CHS6, that arose from the whole genome duplication -S000034303 CDS YKR027W 11 491364 493661 W 2011-02-03 1996-07-31 -S000001736 ORF Verified YKR028W SAP190 chromosome 11 L000002600 11 494257 497358 W 2011-02-03 1996-07-31|2011-02-03 Protein that forms a complex with the Sit4p protein phosphatase; required for Sit4p function; member of a family of similar proteins including Sap4p, Sap155p, and Sap185p; SAP190 has a paralog, SAP185, that arose from the whole genome duplication -S000034368 CDS YKR028W 11 494257 497358 W 2011-02-03 1996-07-31|2011-02-03 -S000001737 ORF Verified YKR029C SET3 histone-binding protein SET3 chromosome 11 11 499833 497578 C 2011-02-03 1996-07-31 Defining member of the SET3 histone deacetylase complex; which is a meiosis-specific repressor of sporulation genes; necessary for efficient transcription by RNAPII; one of two yeast proteins that contains both SET and PHD domains; SET3 has a paralog, SET4, that arose from the whole genome duplication -S000035298 CDS YKR029C 11 499833 497578 C 2011-02-03 1996-07-31 -S000001738 ORF Verified YKR030W GMH1 MSG1 chromosome 11 11 500282 501103 W 2011-02-03 1996-07-31 Golgi membrane protein of unknown function; interacts with Gea1p and Gea2p; required for localization of Gea2p; computational analysis suggests a possible role in either cell wall synthesis or protein-vacuolar targeting -S000033925 CDS YKR030W 11 500282 501103 W 2011-02-03 1996-07-31 -S000001739 ORF Verified YKR031C SPO14 phospholipase D|PLD1 chromosome 11 L000002005|L000002946 11 506395 501344 C 18 2011-02-03 1996-07-31 Phospholipase D; catalyzes the hydrolysis of phosphatidylcholine, producing choline and phosphatidic acid; involved in Sec14p-independent secretion; required for meiosis and spore formation; differently regulated in secretion and meiosis; participates in transcription initiation and/or early elongation of specific genes; interacts with "foot domain" of RNA polymerase II; deletion results in abnormal CTD-Ser5 phosphorylation of RNA polymerase II at specific promoter regions -S000034013 CDS YKR031C 11 506395 501344 C 2011-02-03 1996-07-31 -S000001740 ORF Dubious YKR032W chromosome 11 11 506517 506831 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034971 CDS YKR032W 11 506517 506831 W 2011-02-03 1996-07-31 -S000001742 ORF Verified YKR034W DAL80 UGA43 chromosome 11 L000000480 11 506898 507707 W 14 2011-02-03 1996-07-31 Negative regulator of genes in multiple nitrogen degradation pathways; expression is regulated by nitrogen levels and by Gln3p; member of the GATA-binding family, forms homodimers and heterodimers with Gzf3p; DAL80 has a paralog, GZF3, that arose from the whole genome duplication -S000036062 CDS YKR034W 11 506898 507707 W 2011-02-03 1996-07-31 -S000001741 ORF Dubious YKR033C chromosome 11 11 507304 506879 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene DAL80 -S000035067 CDS YKR033C 11 507304 506879 C 2011-02-03 1996-07-31 -S000006435 ORF Verified YKR035W-A DID2 VPL30|VPS46|CHM1|FTI1 chromosome 11 L000004496 11 507939 508553 W 2011-02-03 1999-07-17 Class E protein of the vacuolar protein-sorting (Vps) pathway; binds Vps4p and directs it to dissociate ESCRT-III complexes; forms a functional and physical complex with Ist1p; human ortholog may be altered in breast tumors -S000034954 CDS YKR035W-A 11 507939 508553 W 2011-02-03 1999-07-17 -S000001743 ORF Dubious YKR035C OPI8 chromosome 11 11 508561 507920 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene DID2/YKR035W-A -S000036116 CDS YKR035C 11 508561 507920 C 2011-02-03 1996-07-31 -S000001744 ORF Verified YKR036C CAF4 chromosome 11 L000003417 11 510633 508702 C 2011-02-03 1996-07-31|2006-05-08|2011-02-03 WD40 repeat-containing protein associated with the CCR4-NOT complex; interacts in a Ccr4p-dependent manner with Ssn2p; also interacts with Fis1p, Mdv1p and Dnm1p and plays a role in mitochondrial fission; CAF4 has a paralog, MDV1, that arose from the whole genome duplication -S000036256 CDS YKR036C 11 510633 508702 C 2011-02-03 1996-07-31|2006-05-08|2011-02-03 -S000001745 ORF Verified YKR037C SPC34 chromosome 11 L000004696 11 511797 510910 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; also localized to nuclear side of spindle pole body -S000036356 CDS YKR037C 11 511797 510910 C 2011-02-03 1996-07-31 -S000001746 ORF Verified YKR038C KAE1 tRNA N6-adenosine threonylcarbamoyltransferase chromosome 11 11 513159 511999 C 2011-02-03 2003-09-22|1996-07-31 Highly conserved ATPase of HSP70/DnaK family; essential functional component of the EKC/KEOPS complex, with Bud32p, Cgi121p, Pcc1p, and Gon7p; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription -S000036434 CDS YKR038C 11 513159 511999 C 2011-02-03 2003-09-22|1996-07-31 -S000006540 tRNA_gene tD(GUC)K chromosome 11 L000003639 11 513403 513332 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000037688 noncoding_exon tD(GUC)K 11 513403 513332 C 2011-02-03 2000-05-19 -S000007060 long_terminal_repeat YKRCdelta11 chromosome 11 11 513846 513532 C 2011-02-03 2000-05-19 Ty1 LTR -S000001747 ORF Verified YKR039W GAP1 amino acid permease GAP1 chromosome 11 L000000667 11 515063 516871 W 27 2011-02-03 1996-07-31 General amino acid permease; Gap1p senses the presence of amino acid substrates to regulate localization to the plasma membrane when needed; essential for invasive growth -S000030283 CDS YKR039W 11 515063 516871 W 2011-02-03 1996-07-31 -S000118407 ARS ARS1116 ARSXI-517 chromosome 11 11 517017 517265 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000007061 long_terminal_repeat YKRCdelta12 chromosome 11 11 517784 517453 C 2011-02-03 2000-05-19 Ty1 LTR -S000006516 tRNA_gene tA(AGC)K2 chromosome 11 L000003637 11 517988 518060 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000036249 noncoding_exon tA(AGC)K2 11 517988 518060 W 2011-02-03 2000-05-19 -S000001749 ORF Verified YKR041W chromosome 11 11 518198 518950 W 2011-02-03 1996-07-31 Protein of unknown function; localizes to the mitotic spindle; overexpression of YKR041W affects endocytic protein trafficking -S000030043 CDS YKR041W 11 518198 518950 W 2011-02-03 1996-07-31 -S000001748 ORF Dubious YKR040C chromosome 11 11 518566 518063 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YKR041W -S000029852 CDS YKR040C 11 518566 518063 C 2011-02-03 1996-07-31 -S000001750 ORF Verified YKR042W UTH1 SUN family protein UTH1 chromosome 11 L000002766 11 519527 520624 W 2011-02-03 1996-07-31|2005-11-03 Mitochondrial inner membrane protein; role in mitophagy is disputed; implicated in cell wall biogenesis, the oxidative stress response, life span during starvation, and cell death; SUN family member; UTH1 has a paralog, NCA3, that arose from the whole genome duplication -S000031030 CDS YKR042W 11 519527 520624 W 2011-02-03 1996-07-31|2005-11-03 -S000001751 ORF Verified YKR043C SHB17 sedoheptulose-bisphosphatase chromosome 11 11 521712 520897 C 2011-02-03 1996-07-31 Sedoheptulose bisphosphatase involved in riboneogenesis; dephosphorylates sedoheptulose 1,7-bisphosphate, which is converted via the nonoxidative pentose phosphate pathway to ribose-5-phosphate; facilitates the conversion of glycolytic intermediates to pentose phosphate units; also has fructose 1,6-bisphosphatase activity but this is probably not biologically relevant, since deletion does not affect FBP levels; GFP-fusion protein localizes to the cytoplasm and nucleus -S000031078 CDS YKR043C 11 521712 520897 C 2011-02-03 1996-07-31 -S000001752 ORF Verified YKR044W UIP5 chromosome 11 11 522015 523346 W 2011-02-03 1996-07-31 Protein of unknown function that interacts with Ulp1p; a Ubl (ubiquitin-like protein)-specific protease for Smt3p protein conjugates -S000031276 CDS YKR044W 11 522015 523346 W 2011-02-03 1996-07-31 -S000001753 ORF Uncharacterized YKR045C chromosome 11 11 523969 523418 C 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function; epitope-tagged protein localizes to the cytoplasm -S000032206 CDS YKR045C 11 523969 523418 C 2011-02-03 2003-09-22|1996-07-31 -S000001754 ORF Verified YKR046C PET10 chromosome 11 11 525074 524223 C 2011-02-03 1996-07-31 Protein of unknown function that localizes to lipid particles; localization suggests a role in lipid metabolism; expression pattern suggests a role in respiratory growth; computational analysis of large-scale protein-protein interaction data suggests a role in ATP/ADP exchange -S000032320 CDS YKR046C 11 525074 524223 C 2011-02-03 1996-07-31 -S000001755 ORF Dubious YKR047W chromosome 11 11 525257 525562 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene NAP1 -S000032471 CDS YKR047W 11 525257 525562 W 2011-02-03 1996-07-31 -S000001756 ORF Verified YKR048C NAP1 histone chaperone NAP1 chromosome 11 L000001232 11 526640 525387 C 2011-02-03 1996-07-31 Histone chaperone; involved in histone exchange by removing and replacing histone H2A-H2B dimers or histone variant dimers from assembled nucleosomes; involved in the transport of H2A and H2B histones to the nucleus; required for the regulation of microtubule dynamics during mitosis; interacts with mitotic cyclin Clb2p; controls bud morphogenesis; phosphorylated by CK2; protein abundance increases in response to DNA replication stress -S000034427 CDS YKR048C 11 526640 525387 C 2011-02-03 1996-07-31 -S000001757 ORF Verified YKR049C FMP46 putative redox protein chromosome 11 11 527231 526830 C 2011-02-03 1996-07-31 Putative redox protein containing a thioredoxin fold; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000034545 CDS YKR049C 11 527231 526830 C 2011-02-03 1996-07-31 -S000001758 ORF Verified YKR050W TRK2 RPD2 chromosome 11 L000002335 11 527815 530484 W 15 2011-02-03 1996-07-31 Component of the Trk1p-Trk2p potassium transport system; contributes to K(+) supply and maintenance of plasma-membrane potential; TRK2 has a paralog, TRK1, that arose from the whole genome duplication -S000033289 CDS YKR050W 11 527815 530484 W 2011-02-03 1996-07-31 -S000001759 ORF Uncharacterized YKR051W chromosome 11 11 530946 532202 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000034162 CDS YKR051W 11 530946 532202 W 2011-02-03 1996-07-31 -S000001760 ORF Verified YKR052C MRS4 Fe(2+) transporter chromosome 11 L000001180 11 533464 532550 C 2011-02-03 1996-07-31 Iron transporter of the mitochondrial carrier family; mediates Fe2+ transport across the inner mitochondrial membrane; active under low-iron conditions; may transport other cations; protein abundance increases in response to DNA replication stress; MRS4 has a paralog, MRS3, that arose from the whole genome duplication -S000034228 CDS YKR052C 11 533464 532550 C 2011-02-03 1996-07-31 -S000001761 ORF Verified YKR053C YSR3 sphinganine kinase YSR3|LBP2 chromosome 11 L000004404 11 535281 534067 C 2011-02-03 1996-07-31 Dihydrosphingosine 1-phosphate phosphatase; membrane protein involved in sphingolipid metabolism; YSR3 has a paralog, LCB3, that arose from the whole genome duplication -S000034357 CDS YKR053C 11 535281 534067 C 2011-02-03 1996-07-31 -S000001762 ORF Verified YKR054C DYN1 dynein heavy chain|PAC6|DHC1 chromosome 11 L000000538 11 547925 535647 C 24.6 2011-02-03 1996-07-31 Cytoplasmic heavy chain dynein; microtubule motor protein; member of the AAA+ protein family, required for anaphase spindle elongation; involved in spindle assembly, chromosome movement, and spindle orientation during cell division, targeted to microtubule tips by Pac1p; motility along microtubules inhibited by She1p -S000035346 CDS YKR054C 11 547925 535647 C 2011-02-03 1996-07-31 -S000001763 ORF Verified YKR055W RHO4 Rho family GTPase RHO4 chromosome 11 L000001633 11 548216 549091 W 2011-02-03 1996-07-31 Non-essential small GTPase; member of the Rho/Rac subfamily of Ras-like proteins; likely to be involved in the establishment of cell polarity; has long N-terminal extension that plays an important role in Rho4p function and is shared with Rho4 homologs in other yeasts and filamentous fungi -S000035541 CDS YKR055W 11 548216 549091 W 2011-02-03 1996-07-31 -S000001764 ORF Verified YKR056W TRM2 RNC1|NUD1|NUC2 chromosome 11 L000001652|L000001284 11 549448 551367 W 2011-02-03 2004-02-13|1996-07-31 tRNA methyltransferase; 5-methylates the uridine residue at position 54 of tRNAs and may also have a role in tRNA stabilization or maturation; endo-exonuclease with a role in DNA repair -S000035618 CDS YKR056W 11 549448 551367 W 2011-02-03 2004-02-13|1996-07-31 -S000001765 ORF Verified YKR057W RPS21A eS21|ribosomal 40S subunit protein S21A|S21e|YS25|S26A|S21A|RPS25 chromosome 11 L000001761 11 551657 552242 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S21, no bacterial homolog; RPS21A has a paralog, RPS21B, that arose from the whole genome duplication -S000036538 CDS YKR057W 11 551657 551680 W 2011-02-03 1996-07-31 -S000036539 CDS YKR057W 11 552003 552242 W 2011-02-03 1996-07-31 -S000036540 intron YKR057W 11 551681 552002 W 2011-02-03 1996-07-31 -S000001766 ORF Verified YKR058W GLG1 glycogenin glucosyltransferase GLG1 chromosome 11 L000002878 11 552770 554620 W 2011-02-03 1996-07-31|2005-12-01 Glycogenin glucosyltransferase; self-glucosylating initiator of glycogen synthesis, also glucosylates n-dodecyl-beta-D-maltoside; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole respectively; similar to mammalian glycogenin; GLG1 has a paralog, GLG2, that arose from the whole genome duplication -S000036619 CDS YKR058W 11 552770 554620 W 2011-02-03 1996-07-31|2005-12-01 -S000001767 ORF Verified YKR059W TIF1 translation initiation factor eIF4A|eIF4A chromosome 11 L000002302 11 554987 556174 W 22 2011-02-03 1996-07-31 Translation initiation factor eIF4A; DEA(D/H)-box RNA helicase that couples ATPase activity to RNA binding and unwinding; forms a dumbbell structure of two compact domains connected by a linker; interacts with eIF4G; protein abundance increases in response to DNA replication stress; TIF1 has a paralog, TIF2, that arose from the whole genome duplication -S000036719 CDS YKR059W 11 554987 556174 W 2011-02-03 1996-07-31 -S000001768 ORF Verified YKR060W UTP30 chromosome 11 11 556518 557342 W 2011-02-03 1996-07-31 Putative subunit of U3-containing 90S preribosome complex; complex is involved in production of 18S rRNA and assembly of small ribosomal subunit -S000030161 CDS YKR060W 11 556518 557342 W 2011-02-03 1996-07-31 -S000001769 ORF Verified YKR061W KTR2 mannosyltransferase KTR2 chromosome 11 L000000925 11 557677 558954 W 2011-02-03 1996-07-31 Mannosyltransferase involved in N-linked protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; KTR2 has a paralog, YUR1, that arose from the whole genome duplication -S000030356 CDS YKR061W 11 557677 558954 W 2011-02-03 1996-07-31 -S000006502 snoRNA_gene snR42 SNR42 chromosome 11 L000003409 11 559366 559016 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2975 -S000030613 noncoding_exon snR42 11 559366 559016 C 2011-02-03 2000-05-19 -S000001770 ORF Verified YKR062W TFA2 transcription factor TFIIE subunit TFA2 chromosome 11 L000002596 11 559666 560652 W 2011-02-03 1996-07-31 TFIIE small subunit; involved in RNA polymerase II transcription initiation -S000030483 CDS YKR062W 11 559666 560652 W 2011-02-03 1996-07-31 -S000001771 ORF Verified YKR063C LAS1 rRNA-processing protein LAS1 chromosome 11 L000000931 11 562297 560789 C 2011-02-03 1996-07-31 Endonuclease involved in pre-rRNA processing at both ends of ITS2; functions with Grc3p in a conserved mechanism to modulate rRNA processing and ribosome biogenesis; may coordinate the action of the Rat1p-Rai1p exoRNAse; required for the G1/S cell cycle transition; human ortholog is Las1L; mutants require the SSD1-v allele for viability -S000030551 CDS YKR063C 11 562297 560789 C 2011-02-03 1996-07-31 -S000001772 ORF Verified YKR064W OAF3 chromosome 11 11 562547 565138 W 2011-02-03 1996-07-31 Putative transcriptional repressor with Zn(2)-Cys(6) finger; negatively regulates transcription in response to oleate levels, based on mutant phenotype and localization to oleate-responsive promoters; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; forms nuclear foci upon DNA replication stress -S000031527 CDS YKR064W 11 562547 565138 W 2011-02-03 1996-07-31 -S000001773 ORF Verified YKR065C PAM17 FMP18 chromosome 11 11 565892 565299 C 2011-02-03 1996-07-31 Constituent of the TIM23 complex; proposed alternatively to be a component of the import motor (PAM complex) or to interact with and modulate the core TIM23 (Translocase of the Inner mitochondrial Membrane) complex; protein abundance increases in response to DNA replication stress -S000031607 CDS YKR065C 11 565892 565299 C 2011-02-03 1996-07-31 -S000001774 ORF Verified YKR066C CCP1 cytochrome-c peroxidase chromosome 11 L000000238 11 567198 566113 C 2011-02-03 1996-07-31 Mitochondrial cytochrome-c peroxidase; degrades reactive oxygen species in mitochondria, involved in the response to oxidative stress -S000032588 CDS YKR066C 11 567198 566113 C 2011-02-03 1996-07-31 -S000001775 ORF Verified YKR067W GPT2 bifunctional glycerol-3-phosphate/glycerone-phosphate O-acyltransferase GPT2|GAT1 chromosome 11 11 567918 570149 W 2011-02-03 1996-07-31 Glycerol-3-phosphate/dihydroxyacetone phosphate sn-1 acyltransferase; located in lipid particles and the ER; involved in the stepwise acylation of glycerol-3-phosphate and dihydroxyacetone in lipid biosynthesis; the most conserved motifs and functionally relevant residues are oriented towards the ER lumen -S000032727 CDS YKR067W 11 567918 570149 W 2011-02-03 1996-07-31 -S000001776 ORF Verified YKR068C BET3 TRAPP complex core subunit BET3 chromosome 11 L000004057 11 570909 570328 C 2011-02-03 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factors for the GTPase Ypt1, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); hydrophilic homodimeric protein that acts in conjunction with SNARE proteins in targeting and fusion of ER to Golgi transport vesicles -S000032759 CDS YKR068C 11 570909 570328 C 2011-02-03 1996-07-31 -S000001777 ORF Verified YKR069W MET1 uroporphyrinogen-III C-methyltransferase|MET20 chromosome 11 L000001089 11 571612 573393 W 2011-02-03 1996-07-31 S-adenosyl-L-methionine uroporphyrinogen III transmethylase; involved in the biosynthesis of siroheme, a prosthetic group used by sulfite reductase; required for sulfate assimilation and methionine biosynthesis -S000032921 CDS YKR069W 11 571612 573393 W 2011-02-03 1996-07-31 -S000001778 ORF Uncharacterized YKR070W chromosome 11 11 573574 574632 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033052 CDS YKR070W 11 573574 574632 W 2011-02-03 1996-07-31 -S000001779 ORF Verified YKR071C DRE2 electron carrier DRE2 chromosome 11 11 575980 574934 C 2011-02-03 1996-07-31 Component of the cytosolic Fe-S protein assembly (CIA) machinery; contains an Fe-S cluster that receives electrons from NADPH via the action of Tah18p in an early step in the CIA pathway; ortholog of human Ciapin1; protein abundance increases in response to DNA replication stress; inviability of the null mutant is functionally complemented by human CIAPIN1 -S000033101 CDS YKR071C 11 575980 574934 C 2011-02-03 1996-07-31 -S000001780 ORF Verified YKR072C SIS2 phosphopantothenoylcysteine decarboxylase complex subunit SIS2|HAL3 chromosome 11 L000001899 11 578123 576435 C 57 2011-02-03 1996-07-31 Negative regulatory subunit of protein phosphatase 1 (Ppz1p); involved in coenzyme A biosynthesis; subunit of phosphopantothenoylcysteine decarboxylase (PPCDC: Cab3p, Sis2p, Vhs3p) complex and the CoA-Synthesizing Protein Complex (CoA-SPC: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p); SIS2 has a paralog, VHS3, that arose from the whole genome duplication -S000033861 CDS YKR072C 11 578123 576435 C 2011-02-03 1996-07-31 -S000001781 ORF Dubious YKR073C chromosome 11 11 578507 578187 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033995 CDS YKR073C 11 578507 578187 C 2011-02-03 1996-07-31 -S000006632 tRNA_gene tK(UUU)K chromosome 11 L000003638 11 578965 579060 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034204 intron tK(UUU)K 11 579002 579024 W 2011-02-03 2000-05-19 -S000034202 noncoding_exon tK(UUU)K 11 578965 579001 W 2011-02-03 2000-05-19 -S000034203 noncoding_exon tK(UUU)K 11 579025 579060 W 2011-02-03 2000-05-19 -S000001782 ORF Verified YKR074W AIM29 chromosome 11 11 579209 579676 W 2011-02-03 1996-07-31 Protein of unknown function; epitope-tagged protein localizes to the cytoplasm; YKR074W is not an essential gene; null mutant displays elevated frequency of mitochondrial genome loss -S000034957 CDS YKR074W 11 579209 579676 W 2011-02-03 1996-07-31 -S000028669 ORF Dubious YKR075W-A chromosome 11 11 580212 580481 W 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a protein; completely overlaps the uncharacterized gene YKR075C; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032494 CDS YKR075W-A 11 580212 580481 W 2011-02-03 2003-07-29 -S000001783 ORF Uncharacterized YKR075C chromosome 11 11 580750 579827 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Reg1p; expression regulated by glucose and Rgt1p; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; YKR075C has a paralog, YOR062C, that arose from the whole genome duplication -S000035052 CDS YKR075C 11 580750 579827 C 2011-02-03 1996-07-31 -S000118408 ARS ARS1118 ARSXI-582 chromosome 11 11 581833 582070 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000001784 ORF Verified YKR076W ECM4 S-glutathionyl-(chloro)hydroquinone reductase|GTO2 chromosome 11 L000003880 11 582283 583395 W 2011-02-03 1996-07-31 S-glutathionyl-(chloro)hydroquinone reductase (GS-HQR); glutathione transferase involved in cell-surface biosynthesis and architecture; catalyzes glutathione (GSH)-dependent reduction of GS-trichloro-p-hydroquinone to trichloro-p-hydroquinone; expression upregulated upon exposure to genotoxic agents, such as methyl methanesulfonate, cisplatin and bleomycin; not an essential gene; similar to YGR154C; green fluorescent protein (GFP)-fusion protein localizes to cytoplasm -S000035311 CDS YKR076W 11 582283 583395 W 2011-02-03 1996-07-31 -S000001785 ORF Verified YKR077W MSA2 chromosome 11 11 583653 584744 W 2011-02-03 1996-07-31 Putative transcriptional activator; interacts with G1-specific transcription factor MBF and G1-specific promoters; MSA2 has a paralog, MSA1, that arose from the whole genome duplication -S000036232 CDS YKR077W 11 583653 584744 W 2011-02-03 1996-07-31 -S000001786 ORF Verified YKR078W chromosome 11 11 584952 586709 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; potential Cdc28p substrate; contains a Phox homology (PX) domain and specifically binds phosphatidylinositol 3-phosphate (PtdIns-3-P); YKR078W has a paralog, VPS5, that arose from the whole genome duplication -S000036335 CDS YKR078W 11 584952 586709 W 2011-02-03 1996-07-31 -S000001787 ORF Verified YKR079C TRZ1 tRNase Z chromosome 11 11 589305 586789 C 2011-02-03 1996-07-31 tRNA 3'-end processing endonuclease tRNase Z; also localized to mitochondria and interacts genetically with Rex2 exonuclease; homolog of the human candidate prostate cancer susceptibility gene ELAC2 -S000036383 CDS YKR079C 11 589305 586789 C 2011-02-03 1996-07-31 -S000001788 ORF Verified YKR080W MTD1 methylenetetrahydrofolate dehydrogenase (NAD(+)) chromosome 11 L000001210 11 590395 591357 W 2011-02-03 1996-07-31 NAD-dependent 5,10-methylenetetrahydrafolate dehydrogenase; plays a catalytic role in oxidation of cytoplasmic one-carbon units; expression is regulated by Bas1p and Bas2p, repressed by adenine, and may be induced by inositol and choline -S000029910 CDS YKR080W 11 590395 591357 W 2011-02-03 1996-07-31 -S000001789 ORF Verified YKR081C RPF2 rRNA-binding ribosome biosynthesis protein RPF2 chromosome 11 11 592540 591506 C 2011-02-03 1996-07-31 Essential protein involved in rRNA maturation and ribosomal assembly; involved in the processing of pre-rRNA and the assembly of the 60S ribosomal subunit; interacts with ribosomal protein L11; localizes predominantly to the nucleolus; constituent of 66S pre-ribosomal particles -S000029955 CDS YKR081C 11 592540 591506 C 2011-02-03 1996-07-31 -S000001790 ORF Verified YKR082W NUP133 RAT3 chromosome 11 L000002620 11 592825 596298 W 2011-02-03 1996-07-31 Subunit of Nup84p subcomplex of nuclear pore complex (NPC); contributes to nucleocytoplasmic transport, NPC biogenesis; is involved in establishment of a normal nucleocytoplasmic concentration gradient of GTPase Gsp1p; also plays roles in several processes that may require localization of genes or chromosomes at nuclear periphery, including double-strand break repair, transcription and chromatin silencing; relocalizes to cytosol in response to hypoxia; homolog of human NUP133 -S000030187 CDS YKR082W 11 592825 596298 W 2011-02-03 1996-07-31 -S000001791 ORF Verified YKR083C DAD2 HSK1 chromosome 11 11 596822 596421 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis -S000031089 CDS YKR083C 11 596822 596421 C 2011-02-03 1996-07-31 -S000001792 ORF Verified YKR084C HBS1 ribosome dissociation factor GTPase HBS1 chromosome 11 L000000756 11 598890 597055 C 2011-02-03 1996-07-31 GTPase with similarity to translation release factors; together with binding partner Dom34p, facilitates ribosomal subunit dissociation and peptidyl-tRNA release when translation is stalled, particularly in 3' UTRs; genetically implicated in mRNA no-go decay; HBS1 has a paralog, SKI7, that arose from the whole genome duplication -S000031204 CDS YKR084C 11 598890 597055 C 2011-02-03 1996-07-31 -S000001793 ORF Verified YKR085C MRPL20 mitochondrial 54S ribosomal protein YmL20|YmL20 chromosome 11 L000002527|L000001166 11 599681 599094 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000031317 CDS YKR085C 11 599681 599094 C 2011-02-03 1996-07-31 -S000001794 ORF Verified YKR086W PRP16 DEAH-box RNA helicase PRP16|PRP23|RNA16 chromosome 11 L000001504 11 599857 603072 W 2011-02-03 1996-07-31 DEAH-box RNA helicase involved in second catalytic step of splicing and in exon ligation; exhibits ATP-dependent RNA unwinding activity; mediates the release of Yju2p and Cwc25p in the second step; in the absence of ATP, stabilizes the binding of Cwc25p to the spliceosome in the first catalytic step; missense mutation in human ortholog DHX38 associated with early-onset retinitis pigmentosa -S000032379 CDS YKR086W 11 599857 603072 W 2011-02-03 1996-07-31 -S000001795 ORF Verified YKR087C OMA1 metalloendopeptidase chromosome 11 11 604232 603195 C 2011-02-03 2004-07-23|1996-07-31 Metalloendopeptidase of the mitochondrial inner membrane; important for adaptive responses to various homeostatic insults, preservation of normal mitochondrial function under damage-eliciting conditions, and stability of respiratory supercomplexes; involved in turnover of membrane-embedded proteins; mediates degradation of Cox1p in coa2 mutant cells; zebrafish ortholog has a role in organ development and mouse ortholog is also required for respiratory supercomplex stability -S000032444 CDS YKR087C 11 604232 603195 C 2011-02-03 2004-07-23|1996-07-31 -S000001796 ORF Verified YKR088C TVP38 chromosome 11 11 605418 604405 C 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p; required for asymmetric localization of Kar9p during mitosis; GFP-fusion protein localizes to the cytoplasm in a punctate pattern -S000032545 CDS YKR088C 11 605418 604405 C 2011-02-03 1996-07-31 -S000001797 ORF Verified YKR089C TGL4 STC1 chromosome 11 11 608365 605633 C 2011-02-03 1996-07-31 Multifunctional lipase/hydrolase/phospholipase; triacylglycerol lipase, steryl ester hydrolase, and Ca2+-independent phospholipase A2; catalyzes acyl-CoA dependent acylation of LPA to PA; required with Tgl3p for timely bud formation; phosphorylated and activated by Cdc28p; TGL4 has a paralog, TGL5, that arose from the whole genome duplication -S000032624 CDS YKR089C 11 608365 605633 C 2011-02-03 1996-07-31 -S000001798 ORF Verified YKR090W PXL1 chromosome 11 11 608946 611066 W 2011-02-03 1996-07-31|2011-02-03 Protein that localizes to sites of polarized growth; required for selection and/or maintenance of polarized growth sites, may modulate signaling by the GTPases Cdc42p and Rho1p; contains LIM domains and has similarity to metazoan paxillin; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000033373 CDS YKR090W 11 608946 611066 W 2011-02-03 1996-07-31|2011-02-03 -S000001799 ORF Verified YKR091W SRL3 DNA-binding protein SRL3|WHI7 chromosome 11 L000004671 11 611525 612265 W 2011-02-03 2004-07-23|1996-07-31 GTB motif (G1/S transcription factor binding) containing protein; binds SBF-regulated promoters in hydroxyurea-treated cells; when overexpressed, suppresses the lethality of a rad53 null mutation; potential Cdc28p substrate; SRL3 has a paralog, WHI5, that arose from the whole genome duplication -S000034294 CDS YKR091W 11 611525 612265 W 2011-02-03 2004-07-23|1996-07-31 -S000118409 ARS ARS1120 ARSXI-612 chromosome 11 11 612378 612463 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000001800 ORF Verified YKR092C SRP40 chromosome 11 L000002063 11 613885 612665 C 2011-02-03 1996-07-31 Nucleolar serine-rich protein; role in preribosome assembly or transport; may function as a chaperone of small nucleolar ribonucleoprotein particles (snoRNPs); immunologically and structurally to rat Nopp140 -S000034345 CDS YKR092C 11 613885 612665 C 2011-02-03 1996-07-31 -S000001801 ORF Verified YKR093W PTR2 chromosome 11 L000001527 11 615730 617535 W 2011-02-03 1996-07-31 Integral membrane peptide transporter; mediates transport of di- and tri-peptides; conserved protein that contains 12 transmembrane domains; PTR2 expression is regulated by the N-end rule pathway via repression by Cup9p -S000034474 CDS YKR093W 11 615730 617535 W 2011-02-03 1996-07-31 -S000001802 ORF Verified YKR094C RPL40B eL40|ubiquitin-ribosomal 60S subunit protein L40B fusion protein|L40e|L40B|UB12|CEP52B|UBI2 chromosome 11 L000002412|L000000314 11 618750 617996 C 2011-02-03 1996-07-31|2011-02-03 Ubiquitin-ribosomal 60S subunit protein L40B fusion protein; cleaved to yield ubiquitin and ribosomal protein L40B; ubiquitin may facilitate assembly of the ribosomal protein into ribosomes; homologous to mammalian ribosomal protein L40, no bacterial homolog; RPL40B has a paralog, RPL40A, that arose from the whole genome duplication -S000034523 CDS YKR094C 11 618374 617996 C 2011-02-03 1996-07-31 -S000034522 CDS YKR094C 11 618750 618743 C 2011-02-03 1996-07-31 -S000034524 intron YKR094C 11 618742 618375 C 2011-02-03 1996-07-31|2011-02-03 -S000001803 ORF Verified YKR095W MLP1 MPL1 chromosome 11 L000001141|L000001122 11 619805 625432 W 80.3 2011-02-03 1996-07-31 Myosin-like protein associated with the nuclear envelope; nuclear basket protein that connects the nuclear pore complex with the nuclear interior; involved with Tel1p in telomere length control; involved with Pml1p and Pml39p in nuclear retention of unspliced mRNAs; MLP1 has a paralog, MLP2, that arose from the whole genome duplication -S000035599 CDS YKR095W 11 619805 625432 W 2011-02-03 1996-07-31 -S000028512 ORF Verified YKR095W-A PCC1 chromatin DNA-binding EKC/KEOPS complex subunit PCC1 chromosome 11 11 625864 626205 W 2011-02-03 2004-01-28|2003-07-29 Component of the EKC/KEOPS protein complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; other complex members are Kae1p, Gon7p, Bud32p, and Cgi121p -S000030270 CDS YKR095W-A 11 625864 625901 W 2011-02-03 2004-01-28|2003-07-29 -S000030272 CDS YKR095W-A 11 625977 626205 W 2011-02-03 2004-01-28 -S000030273 intron YKR095W-A 11 625902 625976 W 2011-02-03 2004-01-28|2003-07-29 -S000001804 ORF Verified YKR096W ESL2 chromosome 11 11 626793 630380 W 2011-02-03 1996-07-31 hEST1A/B (SMG5/6)-like protein; contributes to environment-sensing adaptive gene expression responses; Esl2p and Esl1p contain a 14-3-3-like domain and a putative PilT N-terminus ribonuclease domain; interacts with Pex14p; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and cytoplasm; ESL2 has a paralog, ESL1, that arose from the whole genome duplication -S000035688 CDS YKR096W 11 626793 630380 W 2011-02-03 1996-07-31 -S000001805 ORF Verified YKR097W PCK1 phosphoenolpyruvate carboxykinase PCK1|PPC1|JPM2 chromosome 11 L000001350 11 631152 632801 W 73.2 2011-02-03 1996-07-31 Phosphoenolpyruvate carboxykinase; key enzyme in gluconeogenesis, catalyzes early reaction in carbohydrate biosynthesis, glucose represses transcription and accelerates mRNA degradation, regulated by Mcm1p and Cat8p, located in the cytosol -S000036623 CDS YKR097W 11 631152 632801 W 2011-02-03 1996-07-31 -S000001806 ORF Verified YKR098C UBP11 ubiquitin-specific protease UBP11 chromosome 11 L000003171 11 635179 633026 C 2011-02-03 1996-07-31 Ubiquitin-specific protease; cleaves ubiquitin from ubiquitinated proteins; UBP11 has a paralog, UBP7, that arose from the whole genome duplication -S000036658 CDS YKR098C 11 635179 633026 C 2011-02-03 1996-07-31 -S000001807 ORF Verified YKR099W BAS1 chromosome 11 L000000161 11 635851 638286 W 82 2011-02-03 1996-07-31 Myb-related transcription factor; involved in regulating basal and induced expression of genes of the purine and histidine biosynthesis pathways; also involved in regulation of meiotic recombination at specific genes -S000036756 CDS YKR099W 11 635851 638286 W 2011-02-03 1996-07-31 -S000001808 ORF Verified YKR100C SKG1 YKR099C-A chromosome 11 11 639968 638901 C 2011-02-03 2004-02-13|1996-07-31 Transmembrane protein with a role in cell wall polymer composition; localizes on inner surface of plasma membrane at bud and in daughter cell; SKG1 has a paralog, AIM20, that arose from the whole genome duplication -S000033006 CDS YKR100C 11 639968 638901 C 2011-02-03 2004-02-13|1996-07-31 -S000001809 ORF Verified YKR101W SIR1 chromosome 11 L000001894 11 640540 642504 W 84 2011-02-03 1996-07-31|2009-02-20 Protein involved in silencing at mating-type loci HML and HMR; recruitment to silent chromatin requires interactions with Orc1p and with Sir4p, through a common Sir1p domain; binds to centromeric chromatin -S000033721 CDS YKR101W 11 640540 642504 W 2011-02-03 1996-07-31|2009-02-20 -S000118410 ARS ARS1123 ARSXI-642 chromosome 11 11 642727 642973 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000001810 ORF Verified YKR102W FLO10 chromosome 11 L000004081 11 646356 649865 W 2011-02-03 1996-07-31 Member of the FLO family of cell wall flocculation proteins; not expressed in most lab strains; overproduction induces flocculation that can be inhibited by mannose, sucrose, or glucose; overproduction also promotes haploid invasive growth and diploid filamentous growth -S000033847 CDS YKR102W 11 646356 649865 W 2011-02-03 1996-07-31 -S000001811 ORF Verified YKR103W NFT1 putative multidrug transporter NFT1 chromosome 11 11 653080 656736 W 2011-02-03 1996-07-31 Putative transporter of the MRP subfamily; adjacent ORFs YKR103W and YKR104W are merged in different strain backgrounds; MRP stands for multidrug resistance-associated protein -S000033929 CDS YKR103W 11 653080 656736 W 2011-02-03 1996-07-31 -S000001812 ORF Verified YKR104W NFT1 chromosome 11 11 656836 657756 W 2011-02-03 1996-07-31 Putative transporter of the MRP subfamily; contains a stop codon in S288C; adjacent ORFs YKR103W and YKR104W are merged in different strain backgrounds; MRP stands for multidrug resistance-associated protein -S000034837 CDS YKR104W 11 656836 657756 W 2011-02-03 1996-07-31 -S000001813 ORF Verified YKR105C VBA5 basic amino acid transporter chromosome 11 11 660464 658716 C 2011-02-03 1996-07-31 Plasma membrane protein of the Major Facilitator Superfamily (MFS); involved in amino acid uptake and drug sensitivity; VBA5 has a paralog, VBA3, that arose from a segmental duplication -S000034879 CDS YKR105C 11 660464 658716 C 2011-02-03 1996-07-31 -S000001814 ORF Verified YKR106W GEX2 glutathione exchanger chromosome 11 11 661442 663289 W 2011-02-03 1996-07-31 Proton:glutathione antiporter; localized to the vacuolar and plasma membranes; expressed at a very low level; potential role in resistance to oxidative stress and modulation of the PKA pathway; GEX2 has a paralog, GEX1, that arose from a segmental duplication -S000035177 CDS YKR106W 11 661442 663289 W 2011-02-03 1996-07-31 -S000007063 long_terminal_repeat YKRWomega1 chromosome 11 11 665430 665668 W 2011-02-03 2000-05-19 Ty5 LTR -S000028978 telomere TEL11R chromosome 11 11 665904 666816 W 89 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XI; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats -S000028979 telomeric_repeat TEL11R 11 666609 666816 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XI -S000028980 X_element TEL11R 11 665904 666364 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028981 X_element_combinatorial_repeat TEL11R 11 666365 666608 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XI; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000029411 gene_group RDN1 RDN1 chromosome 12 L000001595 12 105 Ribosomal DNA (rDNA); an approximately 1-2 Mb region on the right arm of chr. XII consisting of 100-200 tandem copies of a 9.1 kb repeat which contains the genes for 5S, 5.8S, 25S and 18S rRNAs (represented by the RDN37, RDN25, RDN18, RDN58, and RDN5 loci); a specific histone modification (H3K56ac) regulates RNA polymerase I transcription of the ribosomal DNA -S000028673 ORF Dubious YLL067W-A chromosome 12 12 843 1325 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps YLL067C -S000032519 CDS YLL067W-A 12 843 1325 W 2003-07-29 2003-07-29 -S000003990 ORF Uncharacterized YLL067C Y' element ATP-dependent helicase chromosome 12 12 4301 585 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase -S000034997 CDS YLL067C 12 3915 585 C 1996-07-31 1996-07-31 -S000034996 CDS YLL067C 12 4301 4015 C 1996-07-31 1996-07-31 -S000034998 intron YLL067C 12 4014 3916 C 1996-07-31 1996-07-31 -S000028672 ORF Uncharacterized YLL066W-B chromosome 12 12 5605 5775 W 2003-07-29 2003-07-29 Putative protein of unknown function; overexpression causes a cell cycle delay or arrest -S000032518 CDS YLL066W-B 12 5605 5775 W 2003-07-29 2003-07-29 -S000028671 ORF Dubious YLL066W-A chromosome 12 12 6486 6968 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized ORF YLL066C -S000032517 CDS YLL066W-A 12 6486 6968 W 2003-07-29 2003-07-29 -S000003989 ORF Uncharacterized YLL066C Y' element ATP-dependent helicase chromosome 12 12 9836 6120 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase; YLL066C is not an essential gene -S000034882 CDS YLL066C 12 9450 6120 C 1996-07-31 1996-07-31 -S000034881 CDS YLL066C 12 9836 9550 C 1996-07-31 1996-07-31 -S000034883 intron YLL066C 12 9549 9451 C 1996-07-31 1996-07-31 -S000003988 ORF Dubious YLL065W GIN11 chromosome 12 L000002674 12 11726 12076 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps chromosome XII telomeric element core sequences -S000034819 CDS YLL065W 12 11726 12076 W 1996-07-31 1996-07-31 -S000028910 telomere TEL12L chromosome 12 12 12085 1 C -33 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XII; composed of an X element core sequence, X element combinatorial repeats, and three distinct regions of telomeric repeats separated by two short Y' elements -S000028911 telomeric_repeat TEL12L 12 75 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XII -S000028912 telomeric_repeat TEL12L 12 5723 5662 C 2003-09-09 2003-09-09 Middle stretch of telomeric repeats on the left arm of Chromosome XII -S000028913 telomeric_repeat TEL12L 12 11358 11197 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome XII -S000028914 X_element TEL12L 12 12085 11626 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XII; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YLL065W -S000028915 X_element_combinatorial_repeat TEL12L 12 11625 11359 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000028916 Y_prime_element TEL12L 12 5661 76 C 2003-09-09 2003-09-09 Short telomeric Y' element on the left arm of Chromosome XII; more end-proximal of two two short telomeric Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YLL067C and YLL067W-A -S000028917 Y_prime_element TEL12L 12 11196 5724 C 2003-09-09 2003-09-09 Short Y' element in the left telomere of Chromosome XII; more centromere-proximal of two short Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YLL066C and YLL066W-A -S000003987 ORF Verified YLL064C PAU18 seripauperin PAU18 chromosome 12 12 13445 13083 C 1996-07-31 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; identical to Pau6p -S000034617 CDS YLL064C 12 13445 13083 C 1996-07-31 1996-07-31 -S000003986 ORF Verified YLL063C AYT1 acetyltransferase chromosome 12 L000004544 12 16072 14648 C 1996-07-31 1996-07-31 Acetyltransferase; catalyzes trichothecene 3-O-acetylation, suggesting a possible role in trichothecene biosynthesis -S000033720 CDS YLL063C 12 16072 14648 C 1996-07-31 1996-07-31 -S000003985 ORF Verified YLL062C MHT1 S-adenosylmethionine-homocysteine S-methyltransferase MHT1 chromosome 12 12 17613 16639 C 1996-07-31 1996-07-31 S-methylmethionine-homocysteine methyltransferase; functions along with Sam4p in the conversion of S-adenosylmethionine (AdoMet) to methionine to control the methionine/AdoMet ratio -S000033626 CDS YLL062C 12 17613 16639 C 1996-07-31 1996-07-31 -S000003984 ORF Verified YLL061W MMP1 S-methylmethionine permease MMP1 chromosome 12 L000004869 12 17956 19707 W 1996-07-31 1996-07-31 High-affinity S-methylmethionine permease; required for utilization of S-methylmethionine as a sulfur source; has similarity to S-adenosylmethionine permease Sam3p -S000033583 CDS YLL061W 12 17956 19707 W 1996-07-31 1996-07-31 -S000003983 ORF Verified YLL060C GTT2 glutathione transferase GTT2 chromosome 12 L000004613 12 21839 21138 C 1996-07-31 1996-07-31 Glutathione S-transferase capable of homodimerization; functional overlap with Gtt2p, Grx1p, and Grx2p; protein abundance increases in response to DNA replication stress -S000032819 CDS YLL060C 12 21839 21138 C 1996-07-31 1996-07-31 -S000003982 ORF Dubious YLL059C chromosome 12 12 22980 22474 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032747 CDS YLL059C 12 22980 22474 C 1996-07-31 1996-07-31 -S000003981 ORF Uncharacterized YLL058W cystathionine gamma-synthase chromosome 12 12 23569 25296 W 1996-07-31 1996-07-31 Putative protein of unknown function with similarity to Str2p; Str2p is a cystathionine gamma-synthase important in sulfur metabolism; YLL058W is not an essential gene -S000031898 CDS YLL058W 12 23569 25296 W 1996-07-31 1996-07-31 -S000003980 ORF Verified YLL057C JLP1 sulfonate dioxygenase chromosome 12 12 26994 25756 C 1996-07-31 1996-07-31 Fe(II)-dependent sulfonate/alpha-ketoglutarate dioxygenase; involved in sulfonate catabolism for use as a sulfur source; contains sequence that resembles a J domain (typified by the E. coli DnaJ protein); induced by sulphur starvation -S000031705 CDS YLL057C 12 26994 25756 C 1996-07-31 1996-07-31 -S000003979 ORF Uncharacterized YLL056C chromosome 12 12 28305 27409 C 1996-07-31 1996-07-31 Putative protein of unknown function; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p and genes involved in pleiotropic drug resistance (PDR); expression is induced in cells treated with the mycotoxin patulin; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000031618 CDS YLL056C 12 28305 27409 C 1996-07-31 1996-07-31 -S000003978 ORF Verified YLL055W YCT1 chromosome 12 12 30109 31704 W 1996-07-31 1996-07-31 High-affinity cysteine-specific transporter; has similarity to the Dal5p family of transporters; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YCT1 is not an essential gene -S000031573 CDS YLL055W 12 30109 31704 W 1996-07-31 1996-07-31 -S000130180 ARS ARS1202 chromosome 12 12 30209 31384 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000003977 ORF Uncharacterized YLL054C chromosome 12 12 35204 32673 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function with similarity to Pip2p; an oleate-specific transcriptional activator of peroxisome proliferation; YLL054C is not an essential gene -S000030665 CDS YLL054C 12 35204 32673 C 2011-02-03 1996-07-31|2011-02-03 -S000003976 ORF Uncharacterized YLL053C chromosome 12 12 35961 35503 C 2011-02-03 1996-07-31 Putative protein; in the Sigma 1278B strain background YLL053C is contiguous with AQY2 which encodes an aquaporin -S000030554 CDS YLL053C 12 35961 35503 C 2011-02-03 1996-07-31 -S000003975 ORF Verified YLL052C AQY2 chromosome 12 L000004844 12 36361 35912 C 2011-02-03 1996-07-31 Water channel that mediates water transport across cell membranes; only expressed in proliferating cells; controlled by osmotic signals; may be involved in freeze tolerance; disrupted by a stop codon in many S. cerevisiae strains -S000030412 CDS YLL052C 12 36361 35912 C 2011-02-03 1996-07-31 -S000003974 ORF Verified YLL051C FRE6 putative ferric-chelate reductase chromosome 12 L000003558 12 39471 37333 C 2011-02-03 1996-07-31 Putative ferric reductase with similarity to Fre2p; expression induced by low iron levels -S000037644 CDS YLL051C 12 39471 37333 C 2011-02-03 1996-07-31 -S000003973 ORF Verified YLL050C COF1 cofilin chromosome 12 L000000377 12 40414 39804 C 2011-02-03 1996-07-31 Cofilin, involved in pH-dependent actin filament depolarization; binds both actin monomers and filaments and severs filaments; involved in the selective sorting, export of the secretory cargo from the late golgi; genetically interacts with pmr1; thought to be regulated by phosphorylation at SER4; ubiquitous and essential in eukaryotes -S000037511 CDS YLL050C 12 40221 39804 C 2011-02-03 1996-07-31 -S000037510 CDS YLL050C 12 40414 40401 C 2011-02-03 1996-07-31 -S000037512 intron YLL050C 12 40400 40222 C 2011-02-03 1996-07-31 -S000003972 ORF Verified YLL049W LDB18 chromosome 12 12 40666 41205 W 2011-02-03 1996-07-31 Component of the dynactin complex; dynactin is required for dynein activity; null mutant exhibits defects in nuclear migration and spindle orientation and has reduced affinity for alcian blue dye; has homology to mammalian dynactin subunit p24 -S000037568 CDS YLL049W 12 40666 41205 W 2011-02-03 1996-07-31 -S000003971 ORF Verified YLL048C YBT1 bile acid-transporting ATPase YBT1|BAT1 chromosome 12 L000004345 12 46265 41280 C 2011-02-03 1996-07-31 Transporter of the ATP-binding cassette (ABC) family; involved in bile acid transport; negative regulator of vacuole fusion; regulates release of lumenal Ca2+ stores; similar to mammalian bile transporters; YBT1 has a paralog, VMR1, that arose from the whole genome duplication -S000036801 CDS YLL048C 12 46265 41280 C 2011-02-03 1996-07-31 -S000003970 ORF Dubious YLL047W chromosome 12 12 46672 47055 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene RNP1 -S000036777 CDS YLL047W 12 46672 47055 W 2011-02-03 1996-07-31 -S000003969 ORF Verified YLL046C RNP1 chromosome 12 L000001654 12 47463 46714 C 2011-02-03 1996-07-31 Ribonucleoprotein that contains two RNA recognition motifs (RRM); RNP1 has a paralog, SBP1, that arose from the whole genome duplication -S000036697 CDS YLL046C 12 47463 46714 C 2011-02-03 1996-07-31 -S000003967 ORF Dubious YLL044W chromosome 12 12 48216 48662 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription of both YLL044W and the overlapping gene RPL8B is reduced in the gcr1 null mutant -S000035737 CDS YLL044W 12 48216 48662 W 2011-02-03 1996-07-31 -S000003968 ORF Verified YLL045C RPL8B eL8|ribosomal 60S subunit protein L8B|L8e|rp6|YL5|L8B|L4B|SCL41|KRB1 chromosome 12 L000000911|L000001705 12 48629 47859 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L8B; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; L8 binds to Domain I of 25S and 5.8 S rRNAs; mutation results in decreased amounts of free 60S subunits; homologous to mammalian ribosomal protein L7A, no bacterial homolog; RPL8B has a paralog, RPL8A, that arose from the whole genome duplication -S000036622 CDS YLL045C 12 48629 47859 C 2011-02-03 1996-07-31 -S000003966 ORF Verified YLL043W FPS1 chromosome 12 L000000625 12 49938 51947 W 2011-02-03 1996-07-31 Aquaglyceroporin, plasma membrane channel; involved in efflux of glycerol and xylitol, and in uptake of acetic acid, arsenite, and antimonite; key factor in maintaining redox balance by mediating passive diffusion of glycerol; phosphorylated by Hog1p MAPK under acetate stress; deletion improves xylose fermentation; regulated by Rgc1p and Ask10p, which are regulated by Hog1p phosphorylation under osmotic stress; phosphorylation by Ypk1p required to maintain an open state -S000035628 CDS YLL043W 12 49938 51947 W 2011-02-03 1996-07-31 -S000003965 ORF Verified YLL042C ATG10 E2-like conjugating enzyme|APG10 chromosome 12 L000004785 12 52590 52087 C 2011-02-03 1996-07-31 Conserved E2-like conjugating enzyme; mediates formation of the Atg12p-Atg5p conjugate, which is a critical step in autophagy -S000035508 CDS YLL042C 12 52590 52087 C 2011-02-03 1996-07-31 -S000003964 ORF Verified YLL041C SDH2 succinate dehydrogenase iron-sulfur protein subunit SDH2|SDHB|ACN17 chromosome 12 L000001824 12 53931 53131 C 2011-02-03 1996-07-31 Iron-sulfur protein subunit of succinate dehydrogenase; the complex couples the oxidation of succinate to the transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; other members are Sdh1p, Sdh3p, and Sdh4p -S000034473 CDS YLL041C 12 53931 53131 C 2011-02-03 1996-07-31 -S000003963 ORF Verified YLL040C VPS13 membrane morphogenesis protein VPS13|VPT2|SOI1 chromosome 12 L000003510|L000002967 12 63645 54211 C 2011-02-03 1996-07-31 Protein involved in prospore membrane morphogenesis; peripheral membrane protein that localizes to the prospore membrane and at numerous membrane contact sites; involved in sporulation, vacuolar protein sorting, prospore membrane formation during sporulation, and protein-Golgi retention; required for mitochondrial integrity; contains a PH-like domain; homologous to human CHAC and COH1 which are involved in Chorea-acanthocytosis and Cohen syndrome, respectively -S000034394 CDS YLL040C 12 63645 54211 C 2011-02-03 1996-07-31 -S000003962 ORF Verified YLL039C UBI4 ubiquitin|UB14|SCD2 chromosome 12 L000002414 12 65207 64062 C 2011-02-03 1996-07-31 Ubiquitin; becomes conjugated to proteins, marking them for selective degradation via the ubiquitin-26S proteasome system; essential for the cellular stress response; encoded as a polyubiquitin precursor comprised of 5 head-to-tail repeats; protein abundance increases in response to DNA replication stress -S000033435 CDS YLL039C 12 65207 64062 C 2011-02-03 1996-07-31 -S000003961 ORF Verified YLL038C ENT4 chromosome 12 12 66518 65775 C 2011-02-03 1996-07-31 Protein of unknown function; contains an N-terminal epsin-like domain; proposed to be involved in the trafficking of Arn1p in the absence of ferrichrome -S000033366 CDS YLL038C 12 66518 65775 C 2011-02-03 1996-07-31 -S000003960 ORF Dubious YLL037W chromosome 12 12 66562 66942 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 3' end of essential PRP19 gene encoding an RNA splicing factor -S000033343 CDS YLL037W 12 66562 66942 W 2011-02-03 1996-07-31 -S000003959 ORF Verified YLL036C PRP19 E3 ubiquitin-protein ligase PRP19|PSO4 chromosome 12 L000001506 12 68256 66745 C 2011-02-03 1996-07-31 Splicing factor associated with the spliceosome; contains a U-box, a motif found in a class of ubiquitin ligases, and a WD40 domain; relocalizes to the cytosol in response to hypoxia -S000032580 CDS YLL036C 12 68256 66745 C 2011-02-03 1996-07-31 -S000003958 ORF Verified YLL035W GRC3 polynucleotide 5'-hydroxyl-kinase chromosome 12 12 68580 70478 W 2011-02-03 1996-07-31 Polynucleotide kinase present on rDNA; required for efficient transcription termination by RNA polymerase I; functions with Las1p in a conserved mechanism to modulate rRNA processing and ribosome biogenesis; required for cell growth; mRNA is cell-cycle regulated -S000032549 CDS YLL035W 12 68580 70478 W 2011-02-03 1996-07-31 -S000003957 ORF Verified YLL034C RIX7 putative AAA family ATPase RIX7 chromosome 12 12 73146 70633 C 2011-02-03 1996-07-31 Putative ATPase of the AAA family; required for export of pre-ribosomal large subunits from the nucleus; distributed between the nucleolus, nucleoplasm, and nuclear periphery depending on growth conditions -S000032376 CDS YLL034C 12 73146 70633 C 2011-02-03 1996-07-31 -S000003956 ORF Verified YLL033W IRC19 RRG4|GON2 chromosome 12 12 73409 74101 W 2011-02-03 1996-07-31 Protein of unknown function; YLL033W is not an essential gene but mutant is defective in spore formation; null mutant displays increased levels of spontaneous Rad52p foci -S000032327 CDS YLL033W 12 73409 74101 W 2011-02-03 1996-07-31 -S000003955 ORF Verified YLL032C chromosome 12 12 76747 74270 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YLL032C is not an essential gene -S000031283 CDS YLL032C 12 76747 74270 C 2011-02-03 1996-07-31 -S000003954 ORF Verified YLL031C GPI13 mannose-ethanolamine phosphotransferase GPI13|MPC1 chromosome 12 12 80205 77152 C 2011-02-03 1996-07-31 ER membrane localized phosphoryltransferase; adds phosphoethanolamine onto the third mannose residue of the glycosylphosphatidylinositol (GPI) anchor precursor; similar to human PIG-O protein -S000031131 CDS YLL031C 12 80205 77152 C 2011-02-03 1996-07-31 -S000003953 ORF Dubious YLL030C RRT7 chromosome 12 12 80697 80356 C 2011-02-03 1996-07-31 Protein of unknown function; identified in a screen for mutants with increased levels of rDNA transcription; dubious open reading frame unlikely to encode a protein, based on available experimental and comparative sequence data -S000030186 CDS YLL030C 12 80697 80356 C 2011-02-03 1996-07-31 -S000003952 ORF Verified YLL029W FRA1 RUP2 chromosome 12 12 81461 83710 W 2011-02-03 1996-07-31 Protein involved in negative regulation of iron regulon transcription; forms an iron independent complex with Fra2p, Grx3p, and Grx4p; cytosolic; mutant fails to repress transcription of iron regulon and is defective in spore formation -S000037209 CDS YLL029W 12 81461 83710 W 2011-02-03 1996-07-31 -S000003951 ORF Verified YLL028W TPO1 chromosome 12 12 84804 86564 W 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; recognizes spermine, putrescine, and spermidine; catalyzes uptake of polyamines at alkaline pH and excretion at acidic pH; during oxidative stress exports spermine, spermidine from the cell, which controls timing of expression of stress-responsive genes; phosphorylation enhances activity and sorting to the plasma membrane -S000037134 CDS YLL028W 12 84804 86564 W 2011-02-03 1996-07-31 -S000003950 ORF Verified YLL027W ISA1 Fe-binding Fe/S cluster assembly protein ISA1 chromosome 12 L000004953 12 87403 88155 W 2011-02-03 1996-07-31 Protein required for maturation of mitochondrial [4Fe-4S] proteins; functions in a complex with Isa2p and possibly Iba57p; isa1 deletion causes loss of mitochondrial DNA and respiratory deficiency; depletion reduces growth on nonfermentable carbon sources; functional ortholog of bacterial A-type ISC proteins; human ISCA1 can complement isa1 null mutant -S000036472 CDS YLL027W 12 87403 88155 W 2011-02-03 1996-07-31 -S000003949 ORF Verified YLL026W HSP104 chaperone ATPase HSP104 chromosome 12 L000000823 12 88623 91349 W 2011-02-03 1996-07-31 Disaggregase; heat shock protein that cooperates with Ydj1p (Hsp40) and Ssa1p (Hsp70) to refold and reactivate previously denatured, aggregated proteins; responsive to stresses including: heat, ethanol, and sodium arsenite; involved in [PSI+] propagation; protein becomes more abundant and forms cytoplasmic foci in response to DNA replication stress; potentiated Hsp104p variants decrease TDP-43 proteotoxicity by eliminating its cytoplasmic aggregation -S000036386 CDS YLL026W 12 88623 91349 W 2011-02-03 1996-07-31 -S000118469 ARS ARS1206 ARSXII-91 chromosome 12 12 91419 91660 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178130 ARS_consensus_sequence ARS1206 12 91466 91482 W 2014-11-18 2014-11-18 -S000007064 long_terminal_repeat YLLCdelta1 chromosome 12 12 92381 92050 C 2011-02-03 2000-05-19 Ty1 LTR -S000006683 tRNA_gene tP(UGG)L chromosome 12 L000003645 12 92548 92650 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin -S000036013 intron tP(UGG)L 12 92584 92614 W 2011-02-03 2000-05-19 -S000036011 noncoding_exon tP(UGG)L 12 92548 92583 W 2011-02-03 2000-05-19 -S000036012 noncoding_exon tP(UGG)L 12 92615 92650 W 2011-02-03 2000-05-19 -S000003948 ORF Verified YLL025W PAU17 seripauperin PAU17 chromosome 12 12 94747 95121 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole; YLL025W is not an essential gene -S000036278 CDS YLL025W 12 94747 95121 W 2011-02-03 1996-07-31 -S000003947 ORF Verified YLL024C SSA2 Hsp70 family chaperone SSA2|YG102 chromosome 12 L000002070 12 97485 95566 C 2011-02-03 1996-07-31 HSP70 family ATP-binding protein; involved in protein folding, vacuolar import of proteins; required for ubiquitin-dependent degradation of short-lived proteins; associated with chaperonin-containing T-complex; 98% identical to paralog Ssa1p with distinct functional specificity in propagation of yeast [URE3] prions and vacuolar-mediated degradation of gluconeogenesis enzymes; binds tRNA, has role in tRNA nuclear import during starvation -S000035290 CDS YLL024C 12 97485 95566 C 2011-02-03 1996-07-31 -S000003946 ORF Verified YLL023C POM33 nucleoporin POM33 chromosome 12 12 98836 97997 C 2011-02-03 1996-07-31 Transmembrane nucleoporin; involved in nuclear pore complex (NPC) distribution, assembly or stabilization; highly conserved across species, orthologous to human TMEM33 and paralogous to Per33p; protein abundance increases in response to DNA replication stress -S000035143 CDS YLL023C 12 98836 97997 C 2011-02-03 1996-07-31 -S000003945 ORF Verified YLL022C HIF1 chromosome 12 L000004439 12 100201 99044 C 2011-02-03 1996-07-31 Non-essential component of the HAT-B histone acetyltransferase complex; localized to the nucleus; has a role in telomeric silencing; other members are Hat1p and Hat2p -S000034956 CDS YLL022C 12 100201 99044 C 2011-02-03 1996-07-31 -S000003944 ORF Verified YLL021W SPA2 PPF1|PEA1|FUS6 chromosome 12 L000001989 12 100947 105347 W -28 2011-02-03 1996-07-31 Component of the polarisome; functions in actin cytoskeletal organization during polarized growth; acts as a scaffold for Mkk1p and Mpk1p cell wall integrity signaling components; potential Cdc28p substrate; coding sequence contains length polymorphisms in different strains; SPA2 has a paralog, SPH1, that arose from the whole genome duplication -S000034900 CDS YLL021W 12 100947 105347 W 2011-02-03 1996-07-31 -S000003943 ORF Dubious YLL020C chromosome 12 12 105861 105556 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene KNS1 -S000033932 CDS YLL020C 12 105861 105556 C 2011-02-03 1996-07-31 -S000028670 ORF Dubious YLL019W-A chromosome 12 12 106908 107000 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene KNS1 -S000032516 CDS YLL019W-A 12 106908 107000 W 2011-02-03 2003-07-29 -S000003942 ORF Verified YLL019C KNS1 serine/threonine protein kinase KNS1|L124 chromosome 12 L000000910 12 107899 105686 C -28 2011-02-03 1996-07-31 Protein kinase involved in negative regulation of PolIII transcription; effector kinase of the TOR signaling pathway and phosphorylates Rpc53p to regulate ribosome and tRNA biosynthesis; member of the LAMMER family of protein kinases, which are serine/threonine kinases also capable of phosphorylating tyrosine residues; capable of autophosphorylation -S000035019 CDS YLL019C 12 107899 105686 C 2011-02-03 1996-07-31 -S000007245 ORF Verified YLL018C-A COX19 chromosome 12 L000004848 12 108972 108676 C 2011-02-03 1999-07-17 Protein required for cytochrome c oxidase assembly; located in the cytosol and mitochondrial intermembrane space; putative copper metallochaperone that delivers copper to cytochrome c oxidase; contains twin cysteine-x9-cysteine motifs -S000037730 CDS YLL018C-A 12 108972 108676 C 2011-02-03 1999-07-17 -S000003941 ORF Verified YLL018C DPS1 aspartate--tRNA ligase DPS1|AspRS chromosome 12 L000002834 12 111575 109902 C 2011-02-03 1996-07-31 Aspartyl-tRNA synthetase, primarily cytoplasmic; homodimeric enzyme that catalyzes the specific aspartylation of tRNA(Asp); class II aminoacyl tRNA synthetase; binding to its own mRNA may confer autoregulation; shares five highly conserved amino acids with human that when mutated cause leukoencephalopathy characterized by hypomyelination with brain stem and spinal cord involvement and leg spasticity (HBSL) -S000034907 CDS YLL018C 12 111575 109902 C 2011-02-03 1996-07-31 -S000003940 pseudogene YLL017W Ras family guanine nucleotide exchange factor SDC25|SDC25 chromosome 12 L000002822|L000003262 12 112234 112545 W 2011-02-03 1996-07-31 Non-essential Ras guanine nucleotide exchange factor (GEF); localized to the membrane; expressed in poor nutrient conditions and on nonfermentable carbon sources; contains a stop codon in S288C, full-length gene includes YLL016W; SDC25 has a paralog, CDC25, that arose from the whole genome duplication -S000034831 CDS YLL017W 12 112234 112545 W 2011-02-03 1996-07-31 -S000003939 pseudogene YLL016W SDC25 Ras family guanine nucleotide exchange factor SDC25 chromosome 12 12 112847 115993 W -3 2011-02-03 1996-07-31 Non-essential Ras guanine nucleotide exchange factor (GEF); localized to the membrane; expressed in poor nutrient conditions and on nonfermentable carbon sources; contains a stop codon in S288C, full-length gene includes YLL017W; SDC25 has a paralog, CDC25, that arose from the whole genome duplication -S000032886 CDS YLL016W 12 112847 115993 W 2011-02-03 1996-07-31 -S000003938 ORF Verified YLL015W BPT1 ATP-binding cassette bilirubin transporter BPT1 chromosome 12 12 116432 121111 W 2011-02-03 1996-07-31 ABC type transmembrane transporter of MRP/CFTR family; found in vacuolar membrane, involved in the transport of unconjugated bilirubin and in heavy metal detoxification via glutathione conjugates, along with Ycf1p -S000032769 CDS YLL015W 12 116432 121111 W 2011-02-03 1996-07-31 -S000003937 ORF Verified YLL014W EMC6 chromosome 12 12 121322 121648 W 2011-02-03 1996-07-31 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; homologous to worm F33D4.7/EMC-6, fly CG11781, human TMEM93 -S000032696 CDS YLL014W 12 121322 121648 W 2011-02-03 1996-07-31 -S000003936 ORF Verified YLL013C PUF3 mRNA-binding protein PUF3 chromosome 12 12 124714 122075 C 2011-02-03 1996-07-31 Protein of the mitochondrial outer surface; links the Arp2/3 complex with the mitochore during anterograde mitochondrial movement; also binds to and promotes degradation of mRNAs for select nuclear-encoded mitochondrial proteins -S000031656 CDS YLL013C 12 124714 122075 C 2011-02-03 1996-07-31 -S000003935 ORF Verified YLL012W YEH1 sterol esterase chromosome 12 12 125534 127255 W 2011-02-03 1996-07-31 Steryl ester hydrolase; one of three gene products (Yeh1p, Yeh2p, Tgl1p) responsible for steryl ester hydrolase activity and involved in sterol homeostasis; localized to lipid particle membranes; YEH1 has a paralog, YEH2, that arose from the whole genome duplication -S000031612 CDS YLL012W 12 125534 127255 W 2011-02-03 1996-07-31 -S000003934 ORF Verified YLL011W SOF1 rRNA-processing protein SOF1 chromosome 12 L000001981 12 127523 128992 W 2011-02-03 1996-07-31 Protein required for biogenesis of 40S (small) ribosomal subunit; has similarity to the beta subunit of trimeric G-proteins and the splicing factor Prp4p; essential gene -S000031493 CDS YLL011W 12 127523 128992 W 2011-02-03 1996-07-31 -S000003933 ORF Verified YLL010C PSR1 phosphatase chromosome 12 12 130613 129330 C 2011-02-03 1996-07-31 Plasma membrane associated protein phosphatase; involved in the general stress response; required along with binding partner Whi2p for full activation of STRE-mediated gene expression, possibly through dephosphorylation of Msn2p; PSR1 has a paralog, PSR2, that arose from the whole genome duplication -S000030481 CDS YLL010C 12 130613 129330 C 2011-02-03 1996-07-31 -S000003932 ORF Verified YLL009C COX17 copper metallochaperone COX17 chromosome 12 L000003085 12 131414 131205 C 2011-02-03 1996-07-31 Copper metallochaperone that transfers copper to Sco1p and Cox11p; eventual delivery to cytochrome c oxidase; contains twin cysteine-x9-cysteine motifs; interacts with the MICOS complex, and interaction is promoted by copper ions; human homolog COX17 partially complements yeast null mutant -S000030695 CDS YLL009C 12 131414 131205 C 2011-02-03 1996-07-31 -S000003931 ORF Verified YLL008W DRS1 putative ATP-dependent RNA helicase chromosome 12 L000000525 12 131729 133987 W 2011-02-03 1996-07-31 Nucleolar DEAD-box protein required for ribosome assembly and function; including synthesis of 60S ribosomal subunits; constituent of 66S pre-ribosomal particles -S000030652 CDS YLL008W 12 131729 133987 W 2011-02-03 1996-07-31 -S000003930 ORF Verified YLL007C LMO1 chromosome 12 12 136299 134302 C 2011-02-03 1996-07-31 Homolog of mammalian ELMO (Engulfment and celL MOtility); upstream component for regulation through the small GTPase Rho5p; may form a complex with Dck1p that acts as a GEF for Rho5p; cytoplasmic protein that relocates to mitochondria under oxidative stress; implicated in mitophagy; not an essential protein -S000036717 CDS YLL007C 12 136299 134302 C 2011-02-03 1996-07-31 -S000028560 ORF Uncharacterized YLL006W-A chromosome 12 12 136345 136521 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031266 CDS YLL006W-A 12 136345 136521 W 2011-02-03 2003-07-29 -S000003929 ORF Verified YLL006W MMM1 ERMES complex subunit MMM1|YME6 chromosome 12 L000001124 12 136586 137866 W 2011-02-03 1996-07-31 ER integral membrane protein, ERMES complex subunit; ERMES links the ER to mitochondria and may promote inter-organellar calcium and phospholipid exchange as well as coordinating mitochondrial DNA replication and growth; required for mitophagy; ERMES complex is often co-localized with peroxisomes and with concentrated areas of pyruvate dehydrogenase -S000036667 CDS YLL006W 12 136586 137866 W 2011-02-03 1996-07-31 -S000130181 ARS ARS1207 chromosome 12 12 138185 139164 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000003928 ORF Verified YLL005C SPO75 chromosome 12 S000007654 12 140546 137940 C 2011-02-03 1996-07-31 Meiosis-specific protein of unknown function; required for spore wall formation during sporulation; dispensable for both nuclear divisions during meiosis -S000036535 CDS YLL005C 12 140546 137940 C 2011-02-03 1996-07-31 -S000003927 ORF Verified YLL004W ORC3 origin recognition complex subunit 3 chromosome 12 L000003074 12 141073 142923 W 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing -S000036499 CDS YLL004W 12 141073 142923 W 2011-02-03 1996-07-31 -S000003926 ORF Verified YLL003W SFI1 chromosome 12 L000003991 12 143201 146041 W 2011-02-03 1996-07-31 Centrin (Cdc31p)-binding protein required for SPB duplication; localizes to the half-bridge of the spindle pole body (SPB); required for progression through G(2)-M transition; phosphorylated by Cdc28p-Clb2p and by Cdc5p; dephosphorylated by Cdc14p; has similarity to Xenopus laevis XCAP-C -S000035597 CDS YLL003W 12 143201 146041 W 2011-02-03 1996-07-31 -S000003925 ORF Verified YLL002W RTT109 H3 histone acetyltransferase RTT109|KAT11|REM50|KIM2 chromosome 12 L000003932 12 146291 147601 W 2011-02-03 1996-07-31 Histone acetyltransferase; critical for cell survival in presence of DNA damage during S phase, required for recovery after DSB repair; acetylates H3K56, H3K9; H3K56 acetylation activity required for expression homeostasis, buffering of mRNA synthesis rate against changes in gene dosage during S phase; involved in non-homologous end joining and regulation of Ty1 transposition; prevents hyper-amplification of rDNA; interacts physically with Vps75p -S000035504 CDS YLL002W 12 146291 147601 W 2011-02-03 1996-07-31 -S000003924 ORF Verified YLL001W DNM1 dynamin-related GTPase DNM1 chromosome 12 L000002645 12 147890 150163 W 2011-02-03 1996-07-31 Dynamin-related GTPase involved in mitochondrial organization; required for mitochondrial fission and inheritance; self assembles on the cytoplasmic face of mitochondrial tubules at sites where division will occur; participates in endocytosis and regulates peroxisome fission along with Vps1p; mutants in the human ortholog DNM1L, which mediates mitochondrial fission, peroxisomal division, autophagy, and mitophagy, are associated with slowly progressive infantile encephalopathy -S000035377 CDS YLL001W 12 147890 150163 W 2011-02-03 1996-07-31 -S000006473 centromere CEN12 CEN12 chromosome 12 L000000305 12 150947 150828 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XII centromere -S000077287 centromere_DNA_Element_I CEN12 12 150947 150938 C 2011-02-03 2004-10-08 -S000077288 centromere_DNA_Element_II CEN12 12 150937 150853 C 2011-02-03 2004-10-08 -S000077289 centromere_DNA_Element_III CEN12 12 150852 150828 C 2011-02-03 2004-10-08 -S000114848 ARS ARS1208 ARS1208 ARSXII-151|CEN12 ARS chromosome 12 12 150947 151389 2011-02-03 2006-04-13 Autonomously Replicating Sequence -S000178131 ARS_consensus_sequence ARS1208 12 151078 151094 W 2014-11-18 2014-11-18 -S000003991 ORF Uncharacterized YLR001C chromosome 12 12 153977 151389 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; predicted to be palmitoylated -S000031754 CDS YLR001C 12 153977 151389 C 2011-02-03 1996-07-31 -S000003992 ORF Verified YLR002C NOC3 chromosome 12 12 156334 154343 C 2011-02-03 1996-07-31 Subunit of a nuclear complex with Noc2p and pre-replicative complexes; the Noc2p-Noc3p complex binds to 66S ribosomal precursors to mediate their maturation and intranuclear transport; binds to chromatin at active replication origins, and is required for pre-RC formation and maintenance during DNA replication licensing -S000031944 CDS YLR002C 12 156334 154343 C 2011-02-03 1996-07-31 -S000118470 ARS ARS1209 ARSXII-157 chromosome 12 12 156648 156884 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000003993 ORF Verified YLR003C CMS1 chromosome 12 12 157730 156855 C 2011-02-03 1996-07-31 Putative subunit of the 90S preribosome processome complex; overexpression rescues supressor mutant of mcm10; null mutant is viable; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000032071 CDS YLR003C 12 157730 156855 C 2011-02-03 1996-07-31 -S000003994 ORF Verified YLR004C THI73 chromosome 12 12 159505 157934 C 2011-02-03 1996-07-31 Putative plasma membrane permease; proposed to be involved in carboxylic acid uptake and repressed by thiamine; substrate of Dbf2p/Mob1p kinase; transcription is altered if mitochondrial dysfunction occurs -S000034068 CDS YLR004C 12 159505 157934 C 2011-02-03 1996-07-31 -S000003995 ORF Verified YLR005W SSL1 TFIIH/NER complex subunit SSL1 chromosome 12 L000002085 12 160049 161434 W 2011-02-03 1996-07-31 Subunit of the core form of RNA polymerase transcription factor TFIIH; has both protein kinase and DNA-dependent ATPase/helicase activities; essential for transcription and nucleotide excision repair; interacts with Tfb4p -S000034240 CDS YLR005W 12 160049 161434 W 2011-02-03 1996-07-31 -S000003996 ORF Verified YLR006C SSK1 mitogen-activated protein kinase kinase kinase SSK1 chromosome 12 L000002084 12 163893 161755 C 2011-02-03 1996-07-31 Cytoplasmic phosphorelay intermediate osmosensor and regulator; part of a two-component signal transducer that mediates osmosensing via a phosphorelay mechanism; required for mitophagy; dephosphorylated form is degraded by the ubiquitin-proteasome system; potential Cdc28p substrate -S000034274 CDS YLR006C 12 163893 161755 C 2011-02-03 1996-07-31 -S000003997 ORF Verified YLR007W NSE1 Smc5-Smc6 complex subunit NSE1 chromosome 12 12 164392 165402 W 2011-02-03 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair -S000034350 CDS YLR007W 12 164392 165402 W 2011-02-03 1996-07-31 -S000003998 ORF Verified YLR008C PAM18 TIM14 chromosome 12 12 166083 165577 C 2011-02-03 1996-07-31 Subunit of the import motor (PAM complex); the PAM complex is a component of the Translocase of the Inner Mitochondrial membrane (TIM23 complex); essential J-protein cochaperone that stimulates Ssc1p ATPase activity to drive import; inhibited by Pam16p -S000034382 CDS YLR008C 12 166083 165577 C 2011-02-03 1996-07-31 -S000003999 ORF Verified YLR009W RLP24 ATPase-activating ribosome biosynthesis protein chromosome 12 12 166537 167136 W 2011-02-03 1996-07-31 Essential protein required for ribosomal large subunit biogenesis; associated with pre-60S ribosomal subunits; stimulates the ATPase activity of Afg2p, which is required for release of Rlp24p from the pre-60S particle; has similarity to Rpl24Ap and Rpl24Bp -S000035399 CDS YLR009W 12 166537 167136 W 2011-02-03 1996-07-31 -S000004000 ORF Verified YLR010C TEN1 chromosome 12 12 167802 167320 C 2011-02-03 1996-07-31 Protein that regulates telomeric length; protects telomeric ends in a complex with Cdc13p and Stn1p; similar to human Ten1 which is critical for the telomeric function of the CST (Cdc13p-Stn1p-Ten1p) complex -S000034009 CDS YLR010C 12 167802 167320 C 2011-02-03 1996-07-31 -S000006728 tRNA_gene tS(AGA)L chromosome 12 L000003665 12 168025 167944 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032403 noncoding_exon tS(AGA)L 12 168025 167944 C 2011-02-03 2000-05-19 -S000007079 long_terminal_repeat YLRCsigma1 chromosome 12 12 168380 168043 C 2011-02-03 2000-05-19 Ty3 LTR -S000004001 ORF Verified YLR011W LOT6 flavin-dependent quinone reductase chromosome 12 12 169103 169678 W 2011-02-03 1996-07-31 FMN-dependent NAD(P)H:quinone reductase; role in apoptosis-like cell death; may be involved in quinone detoxification; expression elevated at low temperature; sequesters the Cin5p transcription factor in the cytoplasm in complex with the proteasome under reducing conditions -S000034963 CDS YLR011W 12 169103 169678 W 2011-02-03 1996-07-31 -S000004002 ORF Uncharacterized YLR012C chromosome 12 12 170281 169982 C 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function; YLR012C is not an essential gene -S000035029 CDS YLR012C 12 170281 169982 C 2011-02-03 2003-09-22|1996-07-31 -S000004003 ORF Verified YLR013W GAT3 chromosome 12 S000007451 12 171339 171764 W 2011-02-03 1996-07-31 Protein containing GATA family zinc finger motifs; involved in spore wall assembly; sequence similarity to GAT4, and the double mutant gat3 gat4 exhibits reduced dityrosine fluorescence relative to the single mutants -S000035278 CDS YLR013W 12 171339 171764 W 2011-02-03 1996-07-31 -S000004004 ORF Verified YLR014C PPR1 chromosome 12 L000001475 12 174982 172268 C 8 2011-02-03 1996-07-31 Zinc finger transcription factor; contains a Zn(2)-Cys(6) binuclear cluster domain, positively regulates transcription of URA1, URA3, URA4, and URA10, which are involved in de novo pyrimidine biosynthesis, in response to pyrimidine starvation; activity may be modulated by interaction with Tup1p -S000036111 CDS YLR014C 12 174982 172268 C 2011-02-03 1996-07-31 -S000004005 ORF Verified YLR015W BRE2 CPS60 chromosome 12 12 175227 176744 W 2011-02-03 1996-07-31 Subunit of COMPASS (Set1C) complex; COMPASS methylates Lys4 of histone H3 and functions in silencing at telomeres; has a C-terminal Sdc1 Dpy-30 Interaction (SDI) domain that mediates binding to Sdc1p; similar to trithorax-group protein ASH2L -S000036291 CDS YLR015W 12 175227 176744 W 2011-02-03 1996-07-31 -S000004006 ORF Verified YLR016C PML1 chromosome 12 12 177416 176802 C 2011-02-03 1996-07-31 Subunit of the RES complex; RES complex is required for nuclear retention of unspliced pre-mRNAs; acts in the same pathway as Pml39p and Mlp1p -S000036355 CDS YLR016C 12 177416 176802 C 2011-02-03 1996-07-31 -S000004007 ORF Verified YLR017W MEU1 S-methyl-5-thioadenosine phosphorylase chromosome 12 L000004106 12 177608 178621 W 2011-02-03 1996-07-31 Methylthioadenosine phosphorylase (MTAP); catalyzes the initial step in the methionine salvage pathway; affects polyamine biosynthesis through regulation of ornithine decarboxylase (Spe1p) activity; regulates ADH2 gene expression -S000030114 CDS YLR017W 12 177608 178621 W 2011-02-03 1996-07-31 -S000004008 ORF Verified YLR018C POM34 chromosome 12 12 179606 178707 C 2011-02-03 1996-07-31 Subunit of the transmembrane ring of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport, NPC biogenesis and spindle pole body duplication -S000030160 CDS YLR018C 12 179606 178707 C 2011-02-03 1996-07-31 -S000004009 ORF Verified YLR019W PSR2 putative phosphatase chromosome 12 12 180288 181481 W 2011-02-03 1996-07-31 Plasma membrane phosphatase involved in the general stress response; required with Psr1p and Whi2p for full activation of STRE-mediated gene expression, possibly through dephosphorylation of Msn2p; PSR2 has a paralog, PSR1, that arose from the whole genome duplication -S000030375 CDS YLR019W 12 180288 181481 W 2011-02-03 1996-07-31 -S000004010 ORF Verified YLR020C YEH2 sterol esterase chromosome 12 12 183405 181789 C 2011-02-03 1996-07-31 Steryl ester hydrolase; catalyzes steryl ester hydrolysis at the plasma membrane; involved in sterol metabolism; YEH2 has a paralog, YEH1, that arose from the whole genome duplication -S000029961 CDS YLR020C 12 183405 181789 C 2011-02-03 1996-07-31 -S000004011 ORF Verified YLR021W IRC25 DMP2|PBA3|POC3 chromosome 12 12 183623 184162 W 2011-02-03 1996-07-31 Component of a heterodimeric Poc4p-Irc25p chaperone; involved in assembly of alpha subunits into the 20S proteasome; may regulate formation of proteasome isoforms with alternative subunits under different conditions; upregulates proteasome assembly in response to the unfolded protein response activated by mistargeting of proteins (UPRam) -S000031024 CDS YLR021W 12 183623 184162 W 2011-02-03 1996-07-31 -S000004012 ORF Verified YLR022C SDO1 guanine nucleotide exchange factor SDO1 chromosome 12 S000029721 12 184926 184174 C 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Ria1p; essential protein involved in ribosome maturation; with Ria1p, promotes release of Tif6p from 60S ribosomal subunits in the cytoplasm so that they can assemble with 40S subunits to generate mature ribosomes; ortholog of the human protein (SBDS) responsible for autosomal recessive Shwachman-Bodian-Diamond Syndrome; highly conserved across archaea and eukaryotes -S000031066 CDS YLR022C 12 184926 184174 C 2011-02-03 1996-07-31 -S000004013 ORF Verified YLR023C IZH3 chromosome 12 12 187129 185498 C 2011-02-03 1996-07-31 Membrane protein involved in zinc ion homeostasis; member of the four-protein IZH family, expression induced by zinc deficiency; deletion reduces sensitivity to elevated zinc and shortens lag phase, overexpression reduces Zap1p activity -S000031203 CDS YLR023C 12 187129 185498 C 2011-02-03 1996-07-31 -S000004014 ORF Verified YLR024C UBR2 putative ubiquitin-protein ligase UBR2 chromosome 12 12 193281 187663 C 2011-02-03 1996-07-31|2011-02-03 Cytoplasmic ubiquitin-protein ligase (E3); component of the Mub1p-Ubr2p-Rad6p ubiquitin ligase complex required for the ubiquitination and degradation of Rpn4p; mediates formation of the ternary complex -S000032202 CDS YLR024C 12 193281 187663 C 2011-02-03 1996-07-31|2011-02-03 -S000004015 ORF Verified YLR025W SNF7 ESCRT-III subunit protein SNF7|VPL5|RNS4|VPS32|DID1 chromosome 12 L000001950 12 194452 195174 W 11.4 2011-02-03 1996-07-31 One of four subunits of the ESCRT-III complex; involved in the sorting of transmembrane proteins into the multivesicular body (MVB) pathway; recruited from the cytoplasm to endosomal membranes; ESCRT-III stands for endosomal sorting complex required for transport III -S000032371 CDS YLR025W 12 194452 195174 W 2011-02-03 1996-07-31 -S000004016 ORF Verified YLR026C SED5 t-SNARE syntaxin chromosome 12 L000001861 12 196472 195450 C 2011-02-03 1996-07-31 cis-Golgi t-SNARE syntaxin; required for vesicular transport between the ER and the Golgi complex; binds at least 9 SNARE proteins -S000032400 CDS YLR026C 12 196472 195450 C 2011-02-03 1996-07-31 -S000004017 ORF Verified YLR027C AAT2 aspartate transaminase AAT2|ASP5 chromosome 12 L000000131|L000002677 12 198085 196829 C 17 2011-02-03 2003-09-22|1996-07-31 Cytosolic aspartate aminotransferase involved in nitrogen metabolism; localizes to peroxisomes in oleate-grown cells -S000032507 CDS YLR027C 12 198085 196829 C 2011-02-03 2003-09-22|1996-07-31 -S000007497 snoRNA_gene snR30 SNR30 chromosome 12 L000001968 12 198784 199389 W 2011-02-03 2000-05-19|2007-05-09 H/ACA box small nucleolar RNA (snoRNA); essential gene required for cleavage of 35S primary rRNA transcript to release the precursor to the 18S rRNA -S000036751 noncoding_exon snR30 12 198784 199389 W 2011-02-03 2000-05-19|2007-05-09 -S000004018 ORF Verified YLR028C ADE16 bifunctional phosphoribosylaminoimidazolecarboxamide formyltransferase/IMP cyclohydrolase ADE16 chromosome 12 L000003305 12 201315 199540 C 2011-02-03 1997-07-30|1996-07-31 Enzyme of 'de novo' purine biosynthesis; contains both 5-aminoimidazole-4-carboxamide ribonucleotide transformylase and inosine monophosphate cyclohydrolase activities; ADE16 has a paralog, ADE17, that arose from the whole genome duplication; ade16 ade17 mutants require adenine and histidine -S000034542 CDS YLR028C 12 201315 199540 C 2011-02-03 1997-07-30|1996-07-31 -S000004019 ORF Verified YLR029C RPL15A eL15|ribosomal 60S subunit protein L15A|L15e|rp15R|YL10|L15A|L13A|RPL10A chromosome 12 L000002705|L000001710 12 202590 201976 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L15A; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L15, no bacterial homolog; RPL15A has a paralog, RPL15B, that arose from the whole genome duplication -S000034631 CDS YLR029C 12 202590 201976 C 2011-02-03 1996-07-31 -S000004020 ORF Uncharacterized YLR030W chromosome 12 12 203290 204081 W 2011-02-03 1996-07-31 Putative protein of unknown function; S288C contains an in-frame stop codon between ORFs YLR030W and YLR031W -S000034152 CDS YLR030W 12 203290 204081 W 2011-02-03 1996-07-31 -S000004021 ORF Uncharacterized YLR031W chromosome 12 12 204225 204785 W 2011-02-03 1996-07-31 Putative protein of unknown function; S288C contains an in-frame stop codon between ORFs YLR030W and YLR031W; YLR031W has a paralog, YMR124W, that arose from the whole genome duplication -S000034277 CDS YLR031W 12 204225 204785 W 2011-02-03 1996-07-31 -S000004022 ORF Verified YLR032W RAD5 DNA helicase RAD5|SNM2|REV2 chromosome 12 L000001559 12 204991 208500 W 22 2011-02-03 1996-07-31 DNA helicase/Ubiquitin ligase; involved in error-free DNA damage tolerance (DDT), replication fork regression during postreplication repair by template switching, error-prone translesion synthesis; promotes synthesis of free and PCNA-bound polyubiquitin chains by Ubc13p-Mms2p; forms nuclear foci upon DNA replication stress; associates with native telomeres, cooperates with homologous recombination in senescent cells; human homolog HLTF can complement yeast null mutant -S000034393 CDS YLR032W 12 204991 208500 W 2011-02-03 1996-07-31 -S000004023 ORF Verified YLR033W RSC58 chromosome 12 12 208761 210269 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; RSC functions in transcriptional regulation and elongation, chromosome stability, and establishing sister chromatid cohesion; involved in telomere maintenance -S000035450 CDS YLR033W 12 208761 210269 W 2011-02-03 1996-07-31 -S000004024 ORF Verified YLR034C SMF3 putative divalent metal ion transporter SMF3 chromosome 12 12 211933 210512 C 2011-02-03 1996-07-31|2011-02-03 Putative divalent metal ion transporter involved in iron homeostasis; transcriptionally regulated by metal ions; member of the Nramp family of metal transport proteins; protein abundance increases in response to DNA replication stress -S000035485 CDS YLR034C 12 211933 210512 C 2011-02-03 1996-07-31|2011-02-03 -S000004025 ORF Verified YLR035C MLH2 mismatch repair protein MLH2 chromosome 12 12 214456 212369 C 2011-02-03 1996-07-31 Protein involved in mismatch repair and meiotic recombination; only certain frameshift intermediates are mismatch repair substrates; forms a complex with Mlh1p -S000035575 CDS YLR035C 12 214456 212369 C 2011-02-03 1996-07-31 -S000006524 tRNA_gene tA(UGC)L chromosome 12 L000003664 12 214955 214883 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine -S000034887 noncoding_exon tA(UGC)L 12 214955 214883 C 2011-02-03 2000-05-19 -S000007065 long_terminal_repeat YLRCdelta2 chromosome 12 12 215417 215080 C 2011-02-03 2000-05-19 Ty1 LTR -S000007225 transposable_element_gene YLR035C-A gag-pol fusion protein chromosome 12 12 218907 215440 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); YLR035C-A is part of a mutant retrotransposon -S000034784 CDS YLR035C-A 12 218907 215440 C 2011-02-03 1999-07-17 -S000007066 long_terminal_repeat YLRCdelta3 chromosome 12 12 221005 220668 C 2011-02-03 2000-05-19 Ty1 LTR -S000007083 long_terminal_repeat YLRWdelta4 chromosome 12 12 221006 221266 W 2011-02-03 2000-05-19 Ty1 LTR -S000004026 ORF Uncharacterized YLR036C chromosome 12 12 222132 221521 C 2011-02-03 1996-07-31 Putative protein predicted to have transmembrane domains; interacts with HSP90 by yeast two-hybrid analysis; YLR036C is not an essential protein -S000035633 CDS YLR036C 12 222132 221521 C 2011-02-03 1996-07-31 -S000178132 ARS ARS1210 chromosome 12 12 222220 222676 2014-11-18 2014-11-18 Autonomously replicating sequence -S000004027 ORF Verified YLR037C PAU23 seripauperin PAU23|DAN2 chromosome 12 12 223059 222685 C 2011-02-03 1996-07-31 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; member of the seripauperin multigene family encoded mainly in subtelomeric regions; expressed under anaerobic conditions, completely repressed during aerobic growth -S000036588 CDS YLR037C 12 223059 222685 C 2011-02-03 1996-07-31 -S000004028 ORF Verified YLR038C COX12 cytochrome c oxidase subunit VIb chromosome 12 L000000396 12 225172 224921 C 2011-02-03 1996-07-31 Subunit VIb of cytochrome c oxidase; cytochrome c oxidase is also known as respiratory Complex IV and is the terminal member of the mitochondrial inner membrane electron transport chain; required for assembly of cytochrome c oxidase but not required for activity after assembly; phosphorylated; easily released from the intermembrane space, suggesting a loose association with Complex IV -S000036657 CDS YLR038C 12 225172 224921 C 2011-02-03 1996-07-31 -S000004029 ORF Verified YLR039C RIC1 chromosome 12 L000001638 12 228596 225426 C 2011-02-03 1996-07-31 Protein involved in retrograde transport to the cis-Golgi network; forms heterodimer with Rgp1p that acts as a GTP exchange factor for Ypt6p; involved in transcription of rRNA and ribosomal protein genes -S000036750 CDS YLR039C 12 228596 225426 C 2011-02-03 1996-07-31 -S000004031 ORF Dubious YLR041W chromosome 12 12 229377 229697 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YLR040C -S000030478 CDS YLR041W 12 229377 229697 W 2011-02-03 1996-07-31 -S000004030 ORF Verified YLR040C AFB1 chromosome 12 12 229582 228908 C 2011-02-03 1996-07-31 MATalpha-specific a-factor blocker; contributes to mating efficiency under certain conditions; localizes to the cell wall; predicted to be a GPI-attached protein; upregulated by Mcm1p-Alpha1p transcription factor; partially overlaps the dubious ORF YLR041W -S000030256 CDS YLR040C 12 229582 228908 C 2011-02-03 1996-07-31 -S000004032 ORF Verified YLR042C chromosome 12 12 230451 229966 C 2011-02-03 1996-07-31 Cell wall protein of unknown function; localizes to the cytoplasm; deletion improves xylose fermentation in industrially engineered strains; YLR042C is not an essential gene -S000030545 CDS YLR042C 12 230451 229966 C 2011-02-03 1996-07-31 -S000118471 ARS ARS1211 ARSXII-231 chromosome 12 12 231179 231421 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178133 ARS_consensus_sequence ARS1211 12 231250 231266 W 2014-11-18 2014-11-18 -S000004033 ORF Verified YLR043C TRX1 thioredoxin TRX1|LMA1 chromosome 12 L000002357 12 232013 231702 C -7 2011-02-03 1996-07-31 Cytoplasmic thioredoxin isoenzyme; part of thioredoxin system which protects cells against oxidative and reductive stress; forms LMA1 complex with Pbi2p; acts as a cofactor for Tsa1p; required for ER-Golgi transport and vacuole inheritance; with Trx2p, facilitates mitochondrial import of small Tims Tim9p, Tim10p, Tim13p by maintaining them in reduced form; abundance increases iunder DNA replication stress; TRX1 has a paralog, TRX2, that arose from the whole genome duplication -S000031467 CDS YLR043C 12 232013 231702 C 2011-02-03 1996-07-31 -S000004034 ORF Verified YLR044C PDC1 indolepyruvate decarboxylase 1 chromosome 12 L000001354 12 234081 232390 C -7 2011-02-03 1996-07-31 Major of three pyruvate decarboxylase isozymes; key enzyme in alcoholic fermentation; decarboxylates pyruvate to acetaldehyde; involved in amino acid catabolism; subject to glucose-, ethanol-, and autoregulation; activated by phosphorylation in response to glucose levels; N-terminally propionylated in vivo -S000031581 CDS YLR044C 12 234081 232390 C 2011-02-03 1996-07-31 -S000004035 ORF Verified YLR045C STU2 chromosome 12 L000003019 12 237703 235037 C 2011-02-03 1996-07-31 Microtubule-associated protein (MAP) of the XMAP215/Dis1 family; regulates microtubule dynamics during spindle orientation and metaphase chromosome alignment; interacts with spindle pole body component Spc72p -S000032584 CDS YLR045C 12 237703 235037 C 2011-02-03 1996-07-31 -S000004036 ORF Uncharacterized YLR046C RLA1 chromosome 12 12 238813 238001 C 2011-02-03 1996-07-31 Putative membrane protein; member of the fungal lipid-translocating exporter (LTE) family of proteins; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance; YLR046C has a paralog, RTA1, that arose from the whole genome duplication -S000032679 CDS YLR046C 12 238813 238001 C 2011-02-03 1996-07-31 -S000004037 ORF Verified YLR047C FRE8 putative ferric-chelate reductase chromosome 12 12 241407 239347 C 2011-02-03 1996-07-31 Protein with sequence similarity to iron/copper reductases; involved in iron homeostasis; deletion mutant has iron deficiency/accumulation growth defects; expression increased in the absence of copper-responsive transcription factor Mac1p -S000032758 CDS YLR047C 12 241407 239347 C 2011-02-03 1996-07-31 -S000004038 ORF Verified YLR048W RPS0B uS2|ribosomal 40S subunit protein S0B|S2|S0B|YST2|NAB1B chromosome 12 L000002908 12 242232 243349 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; RPS0B has a paralog, RPS0A, that arose from the whole genome duplication; required for maturation of 18S rRNA along with Rps0Ap; deletion of either RPS0 gene reduces growth rate, deletion of both genes is lethal; homologous to human ribosomal protein SA and bacterial S2 -S000032917 CDS YLR048W 12 242232 242321 W 2011-02-03 1996-07-31 -S000032918 CDS YLR048W 12 242681 243349 W 2011-02-03 1996-07-31 -S000032919 intron YLR048W 12 242322 242680 W 2011-02-03 1996-07-31 -S000004039 ORF Uncharacterized YLR049C chromosome 12 12 245172 243886 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000034828 CDS YLR049C 12 245172 243886 C 2011-02-03 1996-07-31 -S000004040 ORF Uncharacterized YLR050C chromosome 12 12 246072 245587 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YLR050C is not an essential gene -S000033086 CDS YLR050C 12 246072 245587 C 2011-02-03 1996-07-31 -S000004041 ORF Verified YLR051C FCF2 chromosome 12 12 246977 246324 C 2011-02-03 1996-07-31 Nucleolar protein involved in the early steps of 35S rRNA processing; interacts with Faf1p; member of a transcriptionally co-regulated set of genes called the RRB regulon; essential gene -S000033845 CDS YLR051C 12 246977 246324 C 2011-02-03 1996-07-31 -S000004042 ORF Verified YLR052W IES3 chromosome 12 12 247201 247953 W 2011-02-03 1996-07-31 Subunit of the INO80 chromatin remodeling complex -S000034056 CDS YLR052W 12 247201 247953 W 2011-02-03 1996-07-31 -S000004043 ORF Uncharacterized YLR053C chromosome 12 12 248426 248100 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000034893 CDS YLR053C 12 248426 248100 C 2011-02-03 1996-07-31 -S000004044 ORF Verified YLR054C OSW2 chromosome 12 12 250978 248717 C 2011-02-03 2003-09-27|1996-07-31 Protein of unknown function reputedly involved in spore wall assembly -S000035045 CDS YLR054C 12 250860 248717 C 2011-02-03 2003-09-27|1996-07-31 -S000035044 CDS YLR054C 12 250978 250948 C 2011-02-03 2003-09-27 -S000035046 intron YLR054C 12 250947 250861 C 2011-02-03 2003-09-27 -S000004045 ORF Verified YLR055C SPT8 SAGA complex subunit SPT8 chromosome 12 L000002034 12 253080 251272 C 30 2011-02-03 1996-07-31 Subunit of the SAGA transcriptional regulatory complex; not present in SAGA-like complex SLIK/SALSA; required for SAGA-mediated inhibition at some promoters -S000035199 CDS YLR055C 12 253080 251272 C 2011-02-03 1996-07-31 -S000004046 ORF Verified YLR056W ERG3 C-5 sterol desaturase|PSO6|SYR1 chromosome 12 L000000570|L000004043 12 253861 254958 W 2011-02-03 1996-07-31 C-5 sterol desaturase; glycoprotein that catalyzes the introduction of a C-5(6) double bond into episterol, a precursor in ergosterol biosynthesis; transcriptionally down-regulated when ergosterol is in excess; mutants are viable, but cannot grow on non-fermentable carbon sources; substrate of HRD ubiquitin ligase; mutation is functionally complemented by human SC5D -S000036224 CDS YLR056W 12 253861 254958 W 2011-02-03 1996-07-31 -S000004047 ORF Verified YLR057W MNL2 putative mannosidase MNL2 chromosome 12 12 255306 257855 W 2011-02-03 1996-07-31 Putative mannosidase involved in ER-associated protein degradation; localizes to the endoplasmic reticulum; sequence similarity with seven-hairpin glycosidase (GH47) family members, such as Mns1p and Mnl1p, that hydrolyze 1,2-linked alpha-D-mannose residues; non-essential gene -S000036328 CDS YLR057W 12 255306 257855 W 2011-02-03 1996-07-31 -S000004048 ORF Verified YLR058C SHM2 glycine hydroxymethyltransferase SHM2|SHMT2 chromosome 12 L000001882 12 259401 257992 C 2011-02-03 1996-07-31 Cytosolic serine hydroxymethyltransferase; converts serine to glycine plus 5,10 methylenetetrahydrofolate; major isoform involved in generating precursors for purine, pyrimidine, amino acid, and lipid biosynthesis -S000036381 CDS YLR058C 12 259401 257992 C 2011-02-03 1996-07-31 -S000004049 ORF Verified YLR059C REX2 YNT20 chromosome 12 L000003035 12 260547 259738 C 2011-02-03 1996-07-31 3'-5' RNA exonuclease; involved in 3'-end processing of U4 and U5 snRNAs, 5S and 5.8S rRNAs, and RNase P and RNase MRP RNA; localized to mitochondria and null suppresses escape of mtDNA to nucleus in yme1 yme2 mutants; RNase D exonuclease -S000036443 CDS YLR059C 12 260547 259738 C 2011-02-03 1996-07-31 -S000004050 ORF Verified YLR060W FRS1 phenylalanine--tRNA ligase subunit beta chromosome 12 L000000629 12 260979 262766 W 2011-02-03 1996-07-31 Beta subunit of cytoplasmic phenylalanyl-tRNA synthetase; forms a tetramer with Frs2p to generate active enzyme; able to hydrolyze mis-aminoacylated tRNA-Phe, which could contribute to translational quality control -S000030011 CDS YLR060W 12 260979 262766 W 2011-02-03 1996-07-31 -S000004051 ORF Verified YLR061W RPL22A eL22|ribosomal 60S subunit protein L22A|L22e|rp4|l1c|YL31|L22A chromosome 12 L000004460 12 263194 263948 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L22A; required for translation of long 5' UTR of IME1 mRNA and meiotic entry; required for the oxidative stress response, pseudohyphal and invasive growth; homologous to mammalian ribosomal protein L22, no bacterial homolog; RPL22A has a paralog, RPL22B, that arose from the whole genome duplication -S000030138 CDS YLR061W 12 263194 263205 W 2011-02-03 1996-07-31 -S000030139 CDS YLR061W 12 263595 263948 W 2011-02-03 1996-07-31 -S000030140 intron YLR061W 12 263206 263594 W 2011-02-03 1996-07-31 -S000004052 ORF Dubious YLR062C BUD28 chromosome 12 12 263954 263577 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 98% of ORF overlaps the verified gene RPL22A; diploid mutant displays a weak budding pattern phenotype in a systematic assay -S000031086 CDS YLR062C 12 263954 263577 C 2011-02-03 1996-07-31 -S000004053 ORF Verified YLR063W BMT6 25S rRNA (uracil2843-N3)-methyltransferase chromosome 12 12 264157 265254 W 2011-02-03 1996-07-31 Methyltransferase required for m3U2843 methylation of the 25S rRNA; S-adenosylmethionine-dependent; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YLR063W is not an essential gene -S000031280 CDS YLR063W 12 264157 265254 W 2011-02-03 1996-07-31 -S000004054 ORF Verified YLR064W PER33 chromosome 12 12 265456 266277 W 2011-02-03 1996-07-31 Protein that localizes to the endoplasmic reticulum; also associates with the nuclear pore complex; deletion extends chronological lifespan; highly conserved across species, orthologous to human TMEM33 and paralogous to Pom33p; protein abundance increases in response to DNA replication stress -S000031356 CDS YLR064W 12 265456 266277 W 2011-02-03 1996-07-31 -S000004055 ORF Verified YLR065C ENV10 SND2 chromosome 12 12 266918 266373 C 2011-02-03 1996-07-31 Protein involved in SRP-independent targeting of substrates to the ER; component of an alternative ER targeting pathway that has partial functional redundancy with the GET pathway; preference for substrates with downstream transmembrane domains; interacts with Snd1p, Pho88p/Snd3p, and Sec61p-translocon subunits; can compensate for loss of SRP; role in the late endosome-vacuole interface; putative role in secretory protein quality control -S000031430 CDS YLR065C 12 266918 266373 C 2011-02-03 1996-07-31 -S000004056 ORF Verified YLR066W SPC3 signal peptidase complex subunit SPC3 chromosome 12 L000003542|S000029502|L000002875 12 267169 267723 W 2011-02-03 1996-07-31 Subunit of signal peptidase complex; complex catalyzes cleavage of N-terminal signal sequences of proteins targeted to the secretory pathway; homologous to mammalian SPC22/23; other members of the complex are Spc1p, Spc2p, and Sec11p -S000032483 CDS YLR066W 12 267169 267723 W 2011-02-03 1996-07-31 -S000004057 ORF Verified YLR067C PET309 chromosome 12 L000001401 12 270710 267813 C 2011-02-03 1996-07-31 Specific translational activator for the COX1 mRNA; binds to the COX1 mRNA; also influences stability of intron-containing COX1 primary transcripts; localizes to the mitochondrial inner membrane; contains 12 pentatricopeptide repeats (PPRs) -S000032544 CDS YLR067C 12 270710 267813 C 2011-02-03 1996-07-31 -S000004058 ORF Verified YLR068W FYV7 chromosome 12 12 271008 271463 W 2011-02-03 1996-07-31 Essential protein required for maturation of 18S rRNA; required for survival upon exposure to K1 killer toxin -S000032669 CDS YLR068W 12 271008 271463 W 2011-02-03 1996-07-31 -S000004059 ORF Verified YLR069C MEF1 chromosome 12 L000001057 12 273915 271630 C 2011-02-03 1996-07-31 Mitochondrial elongation factor involved in translational elongation -S000033337 CDS YLR069C 12 273915 271630 C 2011-02-03 1996-07-31 -S000004060 ORF Verified YLR070C XYL2 D-xylulose reductase XYL2 chromosome 12 12 275211 274141 C 2011-02-03 1996-07-31 Xylitol dehydrogenase; converts xylitol to D-xylulose; expression induced by xylose, even though this pentose sugar is not well utilized by S. cerevisiae; null mutant has cell wall defect -S000033430 CDS YLR070C 12 275211 274141 C 2011-02-03 1996-07-31 -S000004061 ORF Verified YLR071C RGR1 MED14 chromosome 12 L000001629 12 278626 275378 C 70 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for glucose repression, HO repression, RME1 repression and sporulation -S000034340 CDS YLR071C 12 278626 275378 C 2011-02-03 1996-07-31 -S000004062 ORF Verified YLR072W LAM6 LTC1 chromosome 12 12 278862 280943 W 2011-02-03 1996-07-31 Sterol transporter that transfers sterols between membranes; may regulate and coordinate formation of contact sites between organelles; localizes to ER-mitochondrial contact sites in a Tom70p- and Tom71p-dependent manner; mitochondrial localization requires GRAM domain; also localizes to ER-vacuole contact sites, in a Vac8p-dependent manner; has GRAM and StART-like (VASt) domains; one of six StART-like domain-containing proteins in yeast; conserved across eukaryotes -S000034470 CDS YLR072W 12 278862 280943 W 2011-02-03 1996-07-31 -S000004063 ORF Verified YLR073C RFU1 chromosome 12 12 281621 281019 C 2011-02-03 1996-07-31 Protein that inhibits Doa4p deubiquitinating activity; contributes to ubiquitin homeostasis by regulating the conversion of free ubiquitin chains to ubiquitin monomers by Doa4p; GFP-fusion protein localizes to endosomes -S000034520 CDS YLR073C 12 281621 281019 C 2011-02-03 1996-07-31 -S000004064 ORF Verified YLR074C BUD20 chromosome 12 12 282456 281956 C 2011-02-03 1996-07-31 C2H2-type zinc finger protein required for ribosome assembly; shuttling factor which associates with pre-60S particles in the nucleus, accompanying them to the cytoplasm; cytoplasmic dissociation of Bud20p requires Drg1p; N-terminus harbors a nuclear localization signal (NLS) and a nuclear export signal (NES); cytoplasmic Bud20p is reimported by Kap123-dependent pathway; involved in bud-site selection; diploid mutants display a random budding pattern; similar to human ZNF593 -S000035544 CDS YLR074C 12 282456 281956 C 2011-02-03 1996-07-31 -S000004065 ORF Verified YLR075W RPL10 uL16|ribosomal 60S subunit protein L10|L16|L10|QSR1|GRC5 chromosome 12 L000000727 12 282927 283592 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L10; homologous to mammalian ribosomal protein L10 and bacterial L16; responsible for joining the 40S and 60S subunits; regulates translation initiation; similar to members of the QM gene family; protein abundance increases under DNA replication stress; mutations in human homolog implicated in T-cell acute lymphoblastic leukemia and also autism spectrum disorders (ASD); human RPL10 can complement yeast null mutant -S000035684 CDS YLR075W 12 282927 283592 W 2011-02-03 1996-07-31 -S000004066 ORF Dubious YLR076C chromosome 12 12 283607 283185 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential gene RPL10 which encodes the ribosomal protein L10 -S000035729 CDS YLR076C 12 283607 283185 C 2011-02-03 1996-07-31 -S000004067 ORF Verified YLR077W FMP25 BCA1 chromosome 12 12 283872 285623 W 2011-02-03 1996-07-31 Protein required for assembly of respiratory complex III; mitochondrial inner membrane protein; required for an early step in assembly of respiratory complex III (cytochrome bc1 complex); mRNA is targeted to mitochondria -S000036693 CDS YLR077W 12 283872 285623 W 2011-02-03 1996-07-31 -S000004068 ORF Verified YLR078C BOS1 SEC32 chromosome 12 L000000192 12 286559 285736 C 2011-02-03 1996-07-31 v-SNARE (vesicle specific SNAP receptor); localized to the endoplasmic reticulum membrane and necessary for vesicular transport from the ER to the Golgi; required for efficient nuclear fusion during mating -S000036710 CDS YLR078C 12 286467 285736 C 2011-02-03 1996-07-31 -S000036709 CDS YLR078C 12 286559 286557 C 2011-02-03 1996-07-31 -S000036711 intron YLR078C 12 286556 286468 C 2011-02-03 1996-07-31 -S000004069 ORF Verified YLR079W SIC1 BYC1|cyclin-dependent protein serine/threonine kinase inhibiting protein SIC1|SDB25 chromosome 12 L000001886|L000001822 12 286820 287674 W 2011-02-03 1996-07-31 Cyclin-dependent kinase inhibitor (CKI); inhibitor of Cdc28-Clb kinase complexes that controls G1/S phase transition, preventing premature S phase and ensuring genomic integrity; phosphorylated by Clb5/6-Cdk1 and Cln1/2-Cdk1 kinase which regulate timing of Sic1p degradation; phosphorylation targets Sic1p for SCF(CDC4)-dependent turnover; functional homolog of mammalian Kip1 -S000036800 CDS YLR079W 12 286820 287674 W 2011-02-03 1996-07-31 -S000004070 ORF Verified YLR080W EMP46 chromosome 12 12 287916 289250 W 2011-02-03 1996-07-31 Integral membrane component of ER-derived COPII-coated vesicles; functions in ER to Golgi transport; EMP46 has a paralog, EMP47, that arose from the whole genome duplication -S000037384 CDS YLR080W 12 287916 289250 W 2011-02-03 1996-07-31 -S000118472 ARS ARS1212 ARSXII-289 chromosome 12 12 289315 289444 2014-11-18 2014-11-18|2006-08-30 Late-firing chromosomal replication origin -S000178134 ARS_consensus_sequence ARS1212 12 289422 289406 C 2014-11-18 2014-11-18 -S000004071 ORF Verified YLR081W GAL2 galactose permease GAL2 chromosome 12 L000000659 12 290212 291936 W 44 2011-02-03 1996-07-31 Galactose permease; required for utilization of galactose; also able to transport glucose -S000037506 CDS YLR081W 12 290212 291936 W 2011-02-03 1996-07-31 -S000004072 ORF Verified YLR082C SRL2 chromosome 12 L000004670 12 293572 292394 C 2011-02-03 1996-07-31 Protein of unknown function; overexpression suppresses the lethality caused by a rad53 null mutation -S000037548 CDS YLR082C 12 293572 292394 C 2011-02-03 1996-07-31 -S000004073 ORF Verified YLR083C EMP70 TMN1|p24a chromosome 12 L000000550 12 296094 294091 C 2011-02-03 1996-07-31 Protein with a role in cellular adhesion and filamentous growth; also endosome-to-vacuole sorting; similar to Tmn3p; member of Transmembrane Nine family of proteins with 9 transmembrane segments; EMP70 has a paralog, TMN2, that arose from the whole genome duplication -S000030358 CDS YLR083C 12 296094 294091 C 2011-02-03 1996-07-31 -S000004074 ORF Verified YLR084C RAX2 chromosome 12 12 300251 296589 C 2011-02-03 1996-07-31 N-glycosylated protein; involved in the maintenance of bud site selection during bipolar budding; localization requires Rax1p; RAX2 mRNA stability is regulated by Mpt5p -S000030482 CDS YLR084C 12 300251 296589 C 2011-02-03 1996-07-31 -S000004075 ORF Verified YLR085C ARP6 chromosome 12 L000003435 12 301989 300673 C 2011-02-03 1996-07-31 Actin-related protein that binds nucleosomes; a component of the SWR1 complex, which exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A -S000030596 CDS YLR085C 12 301989 300673 C 2011-02-03 1996-07-31 -S000004076 ORF Verified YLR086W SMC4 condensin subunit SMC4 chromosome 12 L000003472 12 302243 306499 W 2011-02-03 1996-07-31 Subunit of the condensin complex; condensin reorganizes chromosomes during both mitosis and meiosis; forms a subcomplex with Smc2p that has ATP-hydrolyzing and DNA-binding activity, but other condensin subunits are required for chromatin binding; required for tRNA gene clustering at the nucleolus; potential Cdc28p substrate -S000031513 CDS YLR086W 12 302243 306499 W 2011-02-03 1996-07-31 -S000004077 ORF Verified YLR087C CSF1 chromosome 12 12 315731 306855 C 2011-02-03 1996-07-31 Protein required for fermentation at low temperature; plays a role in the maturation of secretory proteins; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000031547 CDS YLR087C 12 315731 306855 C 2011-02-03 1996-07-31 -S000004078 ORF Verified YLR088W GAA1 GPI-anchor transamidase subunit GAA1|END2 chromosome 12 L000000557 12 316107 317951 W 2011-02-03 1996-07-31 Subunit of the GPI:protein transamidase complex; removes the GPI-anchoring signal and attaches GPI (glycosylphosphatidylinositol) to proteins in the ER; human homolog GPAA1 can complement growth defects of yeast thermosensitive mutant at restrictive temperature -S000031702 CDS YLR088W 12 316107 317951 W 2011-02-03 1996-07-31 -S000004079 ORF Verified YLR089C ALT1 alanine transaminase ALT1 chromosome 12 12 320015 318237 C 2011-02-03 1996-07-31 Alanine transaminase (glutamic pyruvic transaminase); involved in alanine biosynthesis and catabolism; TOR1-independent role in determining chronological lifespan; expression is induced in the presence of alanine; repression is mediated by Nrg1p; ALT1 has a paralog, ALT2, that arose from the whole genome duplication; Alt2p is catalytically inactive -S000031709 CDS YLR089C 12 320015 318237 C 2011-02-03 1996-07-31 -S000004080 ORF Verified YLR090W XDJ1 chromosome 12 L000002487 12 320701 322080 W 2011-02-03 1996-07-31 Chaperone with a role in facilitating mitochondrial protein import; ascomycete-specific member of the DnaJ-like family, closely related to Ydj1p; predicted to be C-terminally prenylated; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032708 CDS YLR090W 12 320701 322080 W 2011-02-03 1996-07-31 -S000004081 ORF Verified YLR091W GEP5 RRG5 chromosome 12 12 322297 323178 W 2011-02-03 1996-07-31 Protein of unknown function; required for mitochondrial genome maintenance; detected in highly purified mitochondria in high-throughput studies; null mutant has decreased levels of cardiolipin and phosphatidylethanolamine -S000032790 CDS YLR091W 12 322297 323178 W 2011-02-03 1996-07-31 -S000004082 ORF Verified YLR092W SUL2 sulfate permease chromosome 12 L000003473 12 323544 326225 W 2011-02-03 1996-07-31 High affinity sulfate permease; sulfate uptake is mediated by specific sulfate transporters Sul1p and Sul2p, which control the concentration of endogenous activated sulfate intermediates -S000033523 CDS YLR092W 12 323544 326225 W 2011-02-03 1996-07-31 -S000004083 ORF Verified YLR093C NYV1 MAM2 chromosome 12 L000004690 12 327415 326513 C 2011-02-03 2000-07-14|1996-07-31 v-SNARE component of the vacuolar SNARE complex; involved in vesicle fusion; inhibits ATP-dependent Ca(2+) transport activity of Pmc1p in the vacuolar membrane -S000033559 CDS YLR093C 12 327258 326513 C 2011-02-03 2000-07-14|1996-07-31 -S000033558 CDS YLR093C 12 327415 327400 C 2011-02-03 2000-07-14 -S000033560 intron YLR093C 12 327399 327259 C 2011-02-03 2000-07-14 -S000004084 ORF Verified YLR094C GIS3 chromosome 12 L000004863 12 329238 327730 C 2011-02-03 1996-07-31 Protein of unknown function -S000033649 CDS YLR094C 12 329238 327730 C 2011-02-03 1996-07-31 -S000004085 ORF Verified YLR095C IOC2 chromosome 12 12 332115 329677 C 2011-02-03 1996-07-31 Subunit of the Isw1b complex; exhibits nucleosome-stimulated ATPase activity and acts within coding regions to coordinate transcription elongation with termination and processing; contains a PHD finger motif; other complex members are Isw1p and Ioc4p -S000033765 CDS YLR095C 12 332115 329677 C 2011-02-03 1996-07-31 -S000004086 ORF Verified YLR096W KIN2 serine/threonine protein kinase KIN2 chromosome 12 L000000902 12 332590 336033 W 2011-02-03 1996-07-31 Serine/threonine protein kinase involved in regulation of exocytosis; localizes to the cytoplasmic face of the plasma membrane; KIN2 has a paralog, KIN1, that arose from the whole genome duplication -S000034747 CDS YLR096W 12 332590 336033 W 2011-02-03 1996-07-31 -S000004087 ORF Verified YLR097C HRT3 SCF ubiquitin ligase complex subunit HRT3 chromosome 12 12 337265 336231 C 2011-02-03 1996-07-31 Putative SCF-ubiquitin ligase F-box protein; based on both genetic and physical interactions and sequence similarity; identified in association with Cdc53p, Skp1p and Ubi4 in large and small-scale studies -S000034800 CDS YLR097C 12 337265 336231 C 2011-02-03 1996-07-31 -S000004088 ORF Verified YLR098C CHA4 SIL3|SIL2 chromosome 12 L000002854 12 339473 337527 C 2011-02-03 1996-07-31 DNA binding transcriptional activator; mediates serine/threonine activation of the catabolic L-serine (L-threonine) deaminase (CHA1); Zinc-finger protein with Zn[2]-Cys[6] fungal-type binuclear cluster domain -S000034932 CDS YLR098C 12 339473 337527 C 2011-02-03 1996-07-31 -S000004089 ORF Verified YLR099C ICT1 lysophosphatidic acid acyltransferase ICT1 chromosome 12 12 340928 339744 C 2011-02-03 1996-07-31 Lysophosphatidic acid acyltransferase; responsible for enhanced phospholipid synthesis during organic solvent stress; null displays increased sensitivity to Calcofluor white; highly expressed during organic solvent stress; ICT1 has a paralog, ECM18, that arose from the whole genome duplication; human ABHD5 can complement ict1 null mutant -S000035852 CDS YLR099C 12 340928 339744 C 2011-02-03 1996-07-31 -S000007618 ORF Verified YLR099W-A MIM2 chromosome 12 12 341325 341588 W 2011-02-03 2001-02-26 Mitochondrial protein required for outer membrane protein import; involved in import of the subset of proteins with multiple alpha-helical transmembrane segments, including Ugo1p, Tom20p, and Fzo1p; component of a large protein complex in the outer membrane that includes Mim1p; not essential in W303 strain background -S000037216 CDS YLR099W-A 12 341325 341588 W 2011-02-03 2001-02-26 -S000004090 ORF Verified YLR100W ERG27 3-keto-steroid reductase chromosome 12 12 341810 342853 W 2011-02-03 1996-07-31 3-keto sterol reductase; catalyzes the last of three steps required to remove two C-4 methyl groups from an intermediate in ergosterol biosynthesis; mutants are sterol auxotrophs; mutation is functionally complemented by human HSD17B7 -S000033168 CDS YLR100W 12 341810 342853 W 2011-02-03 1996-07-31 -S000004091 ORF Dubious YLR101C chromosome 12 12 342961 342566 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified, essential ORF ERG27/YLR100W -S000033199 CDS YLR101C 12 342961 342566 C 2011-02-03 1996-07-31 -S000178135 ARS ARS1212.5 chromosome 12 12 343577 344032 2014-11-18 2014-11-18 Strong autonomously replicating sequence -S000178136 ARS_consensus_sequence ARS1212.5 12 343855 343871 W 2014-11-18 2014-11-18 -S000004092 ORF Verified YLR102C APC9 anaphase promoting complex subunit 9 chromosome 12 L000004321 12 343767 342970 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition -S000033261 CDS YLR102C 12 343767 342970 C 2011-02-03 1996-07-31 -S000004093 ORF Verified YLR103C CDC45 DNA replication initiation factor CDC45|SLD4 chromosome 12 L000003380 12 345941 343989 C 2011-02-03 1996-07-31 DNA replication initiation factor; recruited to MCM pre-RC complexes at replication origins; promotes release of MCM from Mcm10p, recruits elongation machinery; binds tightly to ssDNA, which disrupts interaction with the MCM helicase and stalls it during replication stress; mutants in human homolog may cause velocardiofacial and DiGeorge syndromes -S000033319 CDS YLR103C 12 345941 343989 C 2011-02-03 1996-07-31 -S000004094 ORF Uncharacterized YLR104W LCL2 chromosome 12 12 346585 346980 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutant is deficient in cell wall mannosylphosphate and has long chronological lifespan; genetic interactions suggest a role in ER-associated protein degradation (ERAD); SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole -S000034290 CDS YLR104W 12 346585 346980 W 2011-02-03 1996-07-31 -S000004095 ORF Verified YLR105C SEN2 tRNA splicing endonuclease subunit SEN2 chromosome 12 L000001863 12 348180 347047 C 2011-02-03 1996-07-31 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface; Sen2p contains the active site for tRNA 5' splice site cleavage and has similarity to Sen34p and to Archaeal tRNA splicing endonuclease; -S000034355 CDS YLR105C 12 348180 347047 C 2011-02-03 1996-07-31 -S000007313 snoRNA_gene snR79 SNR79 Z9 chromosome 12 L000004807 12 348510 348427 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position C1007 -S000031838 noncoding_exon snR79 12 348510 348427 C 2011-02-03 2000-05-19 -S000004096 ORF Verified YLR106C MDN1 AAA family ATPase midasin|REA1 chromosome 12 S000028419 12 363738 349006 C 2011-02-03 1996-07-31 Huge dynein-related AAA-type ATPase (midasin); forms extended pre-60S particle with the Rix1 complex (Rix1p-Ipi1p-Ipi3p); acts in removal of ribosomal biogenesis factors at successive steps of pre-60S assembly and export from nucleus -S000035344 CDS YLR106C 12 363738 349006 C 2011-02-03 1996-07-31 -S000004097 ORF Verified YLR107W REX3 RNA exonuclease chromosome 12 12 364116 365330 W 2011-02-03 1996-07-31 RNA exonuclease; required for maturation of the RNA component of RNase MRP; functions redundantly with Rnh70p and Rex2p in processing of U5 snRNA and RNase P RNA; member of RNase D family of exonucleases -S000035537 CDS YLR107W 12 364116 365330 W 2011-02-03 1996-07-31 -S000007067 long_terminal_repeat YLRCdelta5 chromosome 12 12 366144 365810 C 2011-02-03 2000-05-19 Ty1 LTR -S000006494 snRNA_gene snR6 SNR6 U6 chromosome 12 L000001961 12 366235 366346 W 2011-02-03 2000-05-19 U6 spliceosomal RNA (U6 snRNA); mediates catalysis of pre-mRNA splicing by the spliceosome; interacts with U4; homology to U6 snRNA, interacts with snr14 -S000034320 noncoding_exon snR6 12 366235 366346 W 2011-02-03 2000-05-19 -S000004098 ORF Verified YLR108C chromosome 12 12 368124 366667 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; YLR108C is not an esssential gene; protein abundance increases in response to DNA replication stress; YLR108C has a paralog, YDR132C, that arose from the whole genome duplication -S000035581 CDS YLR108C 12 368124 366667 C 2011-02-03 1996-07-31 -S000004099 ORF Verified YLR109W AHP1 thioredoxin peroxidase AHP1|cTPxIII chromosome 12 S000007480 12 368781 369311 W 2011-02-03 1996-07-31 Thiol-specific peroxiredoxin; reduces hydroperoxides to protect against oxidative damage; function in vivo requires covalent conjugation to Urm1p -S000036533 CDS YLR109W 12 368781 369311 W 2011-02-03 1996-07-31 -S000004100 ORF Verified YLR110C CCW12 chromosome 12 12 370098 369697 C 2011-02-03 1996-07-31 Cell wall mannoprotein; plays a role in maintenance of newly synthesized areas of cell wall; localizes to periphery of small buds, septum region of larger buds, and shmoo tip; CCW12 has a paralog, YDR134C, that arose from the whole genome duplication -S000037291 CDS YLR110C 12 370098 369697 C 2011-02-03 1996-07-31 -S000004101 ORF Dubious YLR111W chromosome 12 12 370391 370723 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037464 CDS YLR111W 12 370391 370723 W 2011-02-03 1996-07-31 -S000004102 ORF Dubious YLR112W chromosome 12 12 370791 371210 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030153 CDS YLR112W 12 370791 371210 W 2011-02-03 1996-07-31 -S000004103 ORF Verified YLR113W HOG1 mitogen-activated protein kinase HOG1|SSK3 chromosome 12 L000000797 12 371620 372927 W 2011-02-03 1996-07-31 Mitogen-activated protein kinase involved in osmoregulation; controls global reallocation of RNAPII during osmotic shock; mediates recruitment/activation of RNAPII at Hot1p-dependent promoters; binds calmodulin; stimulates antisense transcription to activate CDC28; defines novel S-phase checkpoint with Mrc1p that prevent replication/transcription conflicts; nuclear form represses pseudohyphal growth; autophosphorylates; protein abundance increases under DNA replication stress -S000030351 CDS YLR113W 12 371620 372927 W 2011-02-03 1996-07-31 -S000118473 ARS ARS1213 ARSXII-373 chromosome 12 12 373254 373332 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000007095 long_terminal_repeat YLRWsigma2 chromosome 12 12 373999 374338 W 2011-02-03 2000-05-19 Ty3 LTR -S000006704 tRNA_gene tR(ACG)L chromosome 12 L000003646 12 374355 374427 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030443 noncoding_exon tR(ACG)L 12 374355 374427 W 2011-02-03 2000-05-19 -S000004104 ORF Verified YLR114C AVL9 chromosome 12 S000029049|S000029007 12 377238 374944 C 2011-02-03 1996-07-31 Conserved protein involved in exocytic transport from the Golgi; mutation is synthetically lethal with apl2 vps1 double mutation; member of a protein superfamily with orthologs in diverse organisms; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000030429 CDS YLR114C 12 377238 374944 C 2011-02-03 1996-07-31 -S000004105 ORF Verified YLR115W CFT2 cleavage polyadenylation factor subunit CFT2|YDH1 chromosome 12 L000003599 12 377985 380564 W 2011-02-03 1996-07-31 Subunit of the mRNA cleavage and polyadenlylation factor (CPF); required for pre-mRNA cleavage, polyadenylation and poly(A) site recognition, 43% similarity with the mammalian CPSF-100 protein. -S000031398 CDS YLR115W 12 377985 380564 W 2011-02-03 1996-07-31 -S000004106 ORF Verified YLR116W MSL5 mRNA splicing protein MSL5|BBP chromosome 12 L000004109 12 380822 382252 W 2011-02-03 1996-07-31 Component of commitment complex; which defines first step in splicing pathway; essential protein that interacts with Mud2p and Prp40p, forming a bridge between the intron ends; also involved in nuclear retention of pre-mRNA; relocalizes to the cytosol in response to hypoxia -S000031525 CDS YLR116W 12 380822 382252 W 2011-02-03 1996-07-31 -S000004107 ORF Verified YLR117C CLF1 NTC77|SYF3 chromosome 12 L000004628 12 384534 382471 C 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; homolog of Drosophila crooked neck protein; interacts with U1 snRNP proteins -S000031606 CDS YLR117C 12 384534 382471 C 2011-02-03 1996-07-31 -S000130182 ARS ARS1214 chromosome 12 12 384534 384725 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004108 ORF Verified YLR118C palmitoyl-(protein) hydrolase|APT1 chromosome 12 12 385408 384725 C 2011-02-03 1996-07-31 Acyl-protein thioesterase responsible for depalmitoylation of Gpa1p; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and nucleus and is induced in response to the DNA-damaging agent MMS -S000032586 CDS YLR118C 12 385408 384725 C 2011-02-03 1996-07-31 -S000004109 ORF Verified YLR119W SRN2 ESCRT-I subunit protein SRN2|VPL16|VPS37|SRN10 chromosome 12 L000003103 12 385534 386175 W 2011-02-03 1996-07-31 Component of the ESCRT-I complex; ESCRT-I is involved in ubiquitin-dependent sorting of proteins into the endosome; suppressor of rna1-1 mutation; may be involved in RNA export from nucleus -S000032725 CDS YLR119W 12 385534 386175 W 2011-02-03 1996-07-31 -S000004110 ORF Verified YLR120C YPS1 aspartyl protease|YAP3 chromosome 12 L000002491 12 388220 386511 C 2011-02-03 1996-07-31 Aspartic protease; hyperglycosylated member of the yapsin family of proteases, attached to the plasma membrane via a glycosylphosphatidylinositol (GPI) anchor; involved in nutrient limitation-induced cleavage of the extracellular inhibitory domain of signaling mucin Msb2p, resulting in activation of the filamentous growth MAPK pathway; involved with other yapsins in the cell wall integrity response; role in KEX2-independent processing of the alpha factor precursor -S000032796 CDS YLR120C 12 388220 386511 C 2011-02-03 1996-07-31 -S000028674 ORF Dubious YLR120W-A chromosome 12 12 388672 388773 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YLR121C -S000032521 CDS YLR120W-A 12 388672 388773 W 2011-02-03 2003-07-29 -S000004111 ORF Verified YLR121C YPS3 aspartyl protease|YPS4 chromosome 12 L000004383 12 390270 388744 C 2011-02-03 1996-07-31 Aspartic protease; member of the yapsin family of proteases involved in cell wall growth and maintenance; attached to the plasma membrane via a glycosylphosphatidylinositol (GPI) anchor -S000032903 CDS YLR121C 12 390270 388744 C 2011-02-03 1996-07-31 -S000004112 ORF Dubious YLR122C chromosome 12 12 391331 390954 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR123C -S000033010 CDS YLR122C 12 391331 390954 C 2011-02-03 1996-07-31 -S000004113 ORF Dubious YLR123C chromosome 12 12 391407 391078 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR122C; contains characteristic aminoacyl-tRNA motif -S000033100 CDS YLR123C 12 391407 391078 C 2011-02-03 1996-07-31 -S000004114 ORF Dubious YLR124W chromosome 12 12 391600 391944 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033902 CDS YLR124W 12 391600 391944 W 2011-02-03 1996-07-31 -S000004115 ORF Uncharacterized YLR125W chromosome 12 12 393484 393894 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutant has decreased Ty3 transposition; YLR125W is not an essential gene -S000034058 CDS YLR125W 12 393484 393894 W 2011-02-03 1996-07-31 -S000004116 ORF Verified YLR126C putative amidotransferase chromosome 12 12 395520 394765 C 2011-02-03 1996-07-31 Putative glutamine amidotransferase; has Aft1p-binding motif in the promoter; may be involved in copper and iron homeostasis; YLR126C is not an essential protein; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000034899 CDS YLR126C 12 395520 394765 C 2011-02-03 1996-07-31 -S000004117 ORF Verified YLR127C APC2 anaphase promoting complex subunit 2|TID2|RSI1 chromosome 12 L000003970|L000004348 12 398319 395758 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the catalytic core of the APC/C; has similarity to cullin Cdc53p -S000035048 CDS YLR127C 12 398319 395758 C 2011-02-03 1996-07-31 -S000004118 ORF Verified YLR128W DCN1 NEDD8 ligase DCN1 chromosome 12 12 398530 399433 W 2011-02-03 1996-07-31 Scaffold-type E3 ligase; required for cullin neddylation and ubiquitin ligase activation; contains a ubiquitin-binding domain (UBA) for ubiquitin and Nedd8 (Rub1p) interaction and a PONY domain involved in cullin binding and neddylation -S000035287 CDS YLR128W 12 398530 398532 W 2011-02-03 1996-07-31 -S000035288 CDS YLR128W 12 398627 399433 W 2011-02-03 1996-07-31 -S000035289 intron YLR128W 12 398533 398626 W 2011-02-03 1996-07-31 -S000004119 ORF Verified YLR129W DIP2 snoRNA-binding rRNA-processing protein DIP2|UTP12 chromosome 12 L000003088 12 399657 402488 W 2011-02-03 1996-07-31 Nucleolar protein; specifically associated with the U3 snoRNA, part of the large ribonucleoprotein complex known as the small subunit (SSU) processome, required for 18S rRNA biogenesis, part of the active pre-rRNA processing complex -S000036230 CDS YLR129W 12 399657 402488 W 2011-02-03 1996-07-31 -S000004120 ORF Verified YLR130C ZRT2 low-affinity Zn(2+) transporter ZRT2 chromosome 12 L000004167 12 404062 402794 C 2011-02-03 1996-07-31 Low-affinity zinc transporter of the plasma membrane; transcription is induced under low-zinc conditions by the Zap1p transcription factor -S000037080 CDS YLR130C 12 404062 402794 C 2011-02-03 1996-07-31 -S000004121 ORF Verified YLR131C ACE2 DNA-binding transcription factor ACE2 chromosome 12 L000000020 12 406822 404510 C 2011-02-03 1996-07-31 Transcription factor required for septum destruction after cytokinesis; phosphorylation by Cbk1p blocks nuclear exit during M/G1 transition, causing localization to daughter cell nuclei, and also increases Ace2p activity; phosphorylation by Cdc28p and Pho85p prevents nuclear import during cell cycle phases other than cytokinesis; part of RAM network that regulates cellular polarity and morphogenesis; ACE2 has a paralog, SWI5, that arose from the whole genome duplication -S000037197 CDS YLR131C 12 406822 404510 C 2011-02-03 1996-07-31 -S000004122 ORF Verified YLR132C USB1 phosphoric diester hydrolase chromosome 12 12 408155 407283 C 2011-02-03 1996-07-31 Putative poly(U)-specific 3'-to-5' RNA exonuclease; involved in 3'-end processing of U6 snRNA removing uridines and generating a terminal 2′,3′ cyclic phosphate; essential protein that localizes to the nucleus and mitochondria; overexpression suppresses the respiratory defects of oxa1 and mtf2 mutants; homolog of S.pombe gene, mpn1 and human gene, hUSB1; mutations in hUSB1 are associated with a rare genodermatosis, poikiloderma with neutropenia (OMIM 604173) -S000037305 CDS YLR132C 12 408155 407283 C 2011-02-03 1996-07-31 -S000004123 ORF Verified YLR133W CKI1 bifunctional choline kinase/ethanolamine kinase CKI1 chromosome 12 L000000346 12 408445 410193 W 2011-02-03 1996-07-31 Choline kinase; catalyzes the first step in phosphatidylcholine synthesis via the CDP-choline (Kennedy pathway); exhibits some ethanolamine kinase activity contributing to phosphatidylethanolamine synthesis via the CDP-ethanolamine pathway; CKI1 has a paralog, EKI1, that arose from the whole genome duplication -S000030014 CDS YLR133W 12 408445 410193 W 2011-02-03 1996-07-31 -S000004124 ORF Verified YLR134W PDC5 indolepyruvate decarboxylase 5 chromosome 12 L000001356 12 410723 412414 W 2011-02-03 1996-07-31 Minor isoform of pyruvate decarboxylase; key enzyme in alcoholic fermentation, decarboxylates pyruvate to acetaldehyde, regulation is glucose- and ethanol-dependent, repressed by thiamine, involved in amino acid catabolism -S000030184 CDS YLR134W 12 410723 412414 W 2011-02-03 1996-07-31 -S000118474 ARS ARS1215 ARSXII-413 chromosome 12 12 412686 412893 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000004125 ORF Verified YLR135W SLX4 chromosome 12 12 413281 415527 W 2011-02-03 1996-07-31 Endonuclease involved in processing DNA; acts during recombination, repair; promotes template switching during break-induced replication (BIR), causing non-reciprocal translocations (NRTs); cleaves branched structures in complex with Slx1p; involved in interstrand cross-link repair, Rad1p/Rad10p-dependent removal of 3'-nonhomologous tails during DSBR via single-strand annealing; relative distribution to nuclear foci increases upon DNA replication stress; FANCP-related factor -S000031127 CDS YLR135W 12 413281 415527 W 2011-02-03 1996-07-31 -S000004126 ORF Verified YLR136C TIS11 CTH2 chromosome 12 L000002895 12 416658 415801 C 2011-02-03 1996-07-31 mRNA-binding protein expressed during iron starvation; binds to a sequence element in the 3'-untranslated regions of specific mRNAs to mediate their degradation; involved in iron homeostasis; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; TIS11 has a paralog, CTH1, that arose from the whole genome duplication -S000031183 CDS YLR136C 12 416658 415801 C 2011-02-03 1996-07-31 -S000004127 ORF Verified YLR137W RKM5 S-adenosylmethionine-dependent methyltransferase chromosome 12 12 417006 418109 W 2011-02-03 1996-07-31 Protein lysine methyltransferase; monomethylates Lys-46 of the ribosomal large subunit Rpl1a/Rpl1b; member of the seven beta-strand methyltransferase superfamily; orthologs only found among fungal species -S000031387 CDS YLR137W 12 417006 418109 W 2011-02-03 1996-07-31 -S000004128 ORF Verified YLR138W NHA1 chromosome 12 L000004113 12 418437 421394 W 2011-02-03 1996-07-31 Na+/H+ antiporter; involved in sodium and potassium efflux through the plasma membrane; required for alkali cation tolerance at acidic pH -S000032374 CDS YLR138W 12 418437 421394 W 2011-02-03 1996-07-31 -S000004129 ORF Verified YLR139C SLS1 chromosome 12 L000002656 12 423473 421542 C 2011-02-03 1996-07-31 Mitochondrial membrane protein; coordinates expression of mitochondrially-encoded genes; may facilitate delivery of mRNA to membrane-bound translation machinery -S000032442 CDS YLR139C 12 423473 421542 C 2011-02-03 1996-07-31 -S000004130 ORF Dubious YLR140W chromosome 12 12 423474 423800 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps essential RRN5 gene which encodes a member of the UAF transcription factor involved in transcription of rDNA by RNA polymerase I -S000033242 CDS YLR140W 12 423474 423800 W 2011-02-03 1996-07-31 -S000004131 ORF Verified YLR141W RRN5 chromosome 12 L000003261 12 423683 424774 W 2011-02-03 1996-07-31 Protein involved in transcription of rDNA by RNA polymerase I; transcription factor, member of UAF (upstream activation factor) family along with Rrn9p and Rrn10p -S000033304 CDS YLR141W 12 423683 424774 W 2011-02-03 1996-07-31 -S000004132 ORF Verified YLR142W PUT1 proline dehydrogenase chromosome 12 L000001535 12 425186 426616 W 73 2011-02-03 1996-07-31 Proline oxidase; nuclear-encoded mitochondrial protein involved in utilization of proline as sole nitrogen source; PUT1 transcription is induced by Put3p in the presence of proline and the absence of a preferred nitrogen source -S000033371 CDS YLR142W 12 425186 426616 W 2011-02-03 1996-07-31 -S000006541 tRNA_gene tD(GUC)L1 chromosome 12 L000003647 12 427132 427203 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000031841 noncoding_exon tD(GUC)L1 12 427132 427203 W 2011-02-03 2000-05-19 -S000004133 ORF Verified YLR143W DPH6 diphthine--ammonia ligase chromosome 12 12 427329 429386 W 2011-02-03 1996-07-31 Diphthamide synthetase; catalyzes the last amidation step of diphthamide biosynthesis using ammonium and ATP; evolutionarily conserved in eukaryotes; dph6 mutants exhibit diphthine accumulation and resistance to sordarin, which is indicative of defects in diphthamide formation on EF2; green fluorescent protein (GFP)-tagged protein localizes to the cytoplasm; DPH6/YLR143W is not an essential gene -S000034284 CDS YLR143W 12 427329 429386 W 2011-02-03 1996-07-31 -S000004134 ORF Verified YLR144C ACF2 PCA1|ENG2 chromosome 12 L000004011 12 432016 429677 C 2011-02-03 1996-07-31 Intracellular beta-1,3-endoglucanase; expression is induced during sporulation; may have a role in cortical actin cytoskeleton assembly; protein abundance increases in response to DNA replication stress -S000034344 CDS YLR144C 12 432016 429677 C 2011-02-03 1996-07-31 -S000004135 ORF Verified YLR145W RMP1 chromosome 12 12 432168 432773 W 2011-02-03 1996-07-31 Subunit of RNase MRP; RNase MRP processes pre-rRNA and has a role in cell cycle-regulated degradation of daughter cell-specific mRNAs; unlike most subunits, not shared between RNase MRP and nuclear RNase P -S000034472 CDS YLR145W 12 432168 432773 W 2011-02-03 1996-07-31 -S000004136 ORF Verified YLR146C SPE4 spermine synthase chromosome 12 L000004341 12 433725 432823 C 2011-02-03 1996-07-31 Spermine synthase; required for the biosynthesis of spermine and also involved in biosynthesis of pantothenic acid -S000034521 CDS YLR146C 12 433725 432823 C 2011-02-03 1996-07-31 -S000113566 ORF Uncharacterized YLR146W-A chromosome 12 12 433870 434058 W 2011-02-03 2005-11-17 Putative protein of unknown function -S000113567 CDS YLR146W-A 12 433870 434058 W 2011-02-03 2005-11-17 -S000004137 ORF Verified YLR147C SMD3 mRNA splicing protein SMD3|Sm D3|SLT16 chromosome 12 L000001929 12 434463 434158 C 2011-02-03 1996-07-31 Core Sm protein Sm D3; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm D3 -S000035546 CDS YLR147C 12 434463 434158 C 2011-02-03 1996-07-31 -S000004138 ORF Verified YLR148W PEP3 tethering complex subunit PEP3|VPT18|VPS18|VAM8 chromosome 12 L000001374|L000002473 12 434641 437397 W 91 2011-02-03 1996-07-31 Component of CORVET membrane tethering complex; vacuolar peripheral membrane protein that promotes vesicular docking/fusion reactions in conjunction with SNARE proteins, required for vacuolar biogenesis -S000035686 CDS YLR148W 12 434641 437397 W 2011-02-03 1996-07-31 -S000004139 ORF Verified YLR149C chromosome 12 12 439823 437631 C 2011-02-03 1996-07-31 Protein of unknown function; overexpression causes a cell cycle delay or arrest; null mutation results in a decrease in plasma membrane electron transport; YLR149C is not an essential gene; protein abundance increases in response to DNA replication stress -S000035734 CDS YLR149C 12 439823 437631 C 2011-02-03 1996-07-31 -S000007619 ORF Dubious YLR149C-A chromosome 12 12 440456 440370 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037217 CDS YLR149C-A 12 440456 440370 C 2011-02-03 2001-02-26 -S000004140 ORF Verified YLR150W STM1 MPT4 chromosome 12 L000002574 12 440467 441288 W 2011-02-03 1996-07-31 Protein required for optimal translation under nutrient stress; perturbs association of Yef3p with ribosomes; involved in TOR signaling; binds G4 quadruplex and purine motif triplex nucleic acid; helps maintain telomere structure; protein abundance increases in response to DNA replication stress; serves as a ribosome preservation factor both during quiescence and recovery -S000036485 CDS YLR150W 12 440467 441288 W 2011-02-03 1996-07-31 -S000004141 ORF Verified YLR151C PCD1 8-oxo-dGTP diphosphatase chromosome 12 12 442737 441715 C 2011-02-03 1996-07-31 8-oxo-dGTP diphosphatase; prevents spontaneous mutagenesis via sanitization of oxidized purine nucleoside triphosphates; can also act as peroxisomal pyrophosphatase with specificity for coenzyme A and CoA derivatives, may function to remove potentially toxic oxidized CoA disulfide from peroxisomes to maintain the capacity for beta-oxidation of fatty acids; nudix hydrolase family member; similar E. coli MutT and human, rat and mouse MTH1 -S000036493 CDS YLR151C 12 442737 441715 C 2011-02-03 1996-07-31 -S000004142 ORF Uncharacterized YLR152C chromosome 12 12 444688 442958 C 2011-02-03 1996-07-31 Putative protein of unknown function; YLR152C is not an essential gene -S000036614 CDS YLR152C 12 444688 442958 C 2011-02-03 1996-07-31 -S000004143 ORF Verified YLR153C ACS2 acetate--CoA ligase ACS2 chromosome 12 L000003111 12 447575 445524 C 2011-02-03 1996-07-31 Acetyl-coA synthetase isoform; along with Acs1p, acetyl-coA synthetase isoform is the nuclear source of acetyl-coA for histone acetylation; mutants affect global transcription; required for growth on glucose; expressed under anaerobic conditions -S000036713 CDS YLR153C 12 447575 445524 C 2011-02-03 1996-07-31 -S000004144 ORF Verified YLR154C RNH203 Rnh2C chromosome 12 12 448314 447982 C 2011-02-03 1996-07-31 Ribonuclease H2 subunit; required for RNase H2 activity; role in ribonucleotide excision repair; related to human AGS3 that causes Aicardi-Goutieres syndrome -S000037436 CDS YLR154C 12 448314 447982 C 2011-02-03 1996-07-31 -S000006699 tRNA_gene tQ(UUG)L chromosome 12 L000003663 12 448721 448650 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000032585 noncoding_exon tQ(UUG)L 12 448721 448650 C 2011-02-03 2000-05-19 -S000007084 long_terminal_repeat YLRWdelta6 chromosome 12 12 448842 449028 W 2011-02-03 2000-05-19 Ty1 LTR -S000118475 ARS ARS1216 ARSXII-451 chromosome 12 12 450485 450725 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178137 ARS_consensus_sequence ARS1216 12 450506 450522 W 2014-11-18 2014-11-18 -S000029718 rRNA_gene ETS2-1 ETS2-1 3' ETS chromosome 12 12 451785 451575 C 2011-02-03 2004-03-04 Non-coding region located adjacent to and downstream of RDN25; transcribed as part of the 35S rRNA precursor transcript; contains the primary rRNA transcription termination site at +93 and a secondary termination site between +211 and +250 -S000036854 external_transcribed_spacer_region ETS2-1 12 451785 451575 C 2011-02-03 2004-03-04 -S000028675 ORF Dubious YLR154W-A YLR154W-C chromosome 12 12 452438 452623 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 25S rRNA gene on the opposite strand -S000032525 CDS YLR154W-A 12 452438 452623 W 2011-02-03 2003-07-29 -S000028563 ORF Dubious YLR154W-B chromosome 12 12 454392 454556 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 25S rRNA gene on the opposite strand -S000031269 CDS YLR154W-B 12 454392 454556 W 2011-02-03 2003-07-29 -S000028422 ORF Verified YLR154W-C TAR1 YLR154W-A chromosome 12 S000007646 12 454696 455070 W 2011-02-03 2002-06-20 Protein potentially involved in regulation of respiratory metabolism; located in the mitochondria; interacts genetically with RPO41 and physically with Coq5p; encoded within the 25S rRNA gene on the opposite strand -S000029958 CDS YLR154W-C 12 454696 455070 W 2011-02-03 2002-06-20 -S000006484 rRNA_gene RDN25-1 RDN25-1 26S rRNA|RDN25 chromosome 12 12 455181 451786 C 2011-02-03 2000-05-19 25S ribosomal RNA (25S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript; formed by endonucleolytic cleavage at the C2 site of internal transcribed spacer 2 (ITS2) -S000032318 noncoding_exon RDN25-1 12 455181 451786 C 2011-02-03 2000-05-19 -S000029716 rRNA_gene ITS2-1 ITS2-1 ITS2 chromosome 12 12 455413 455182 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN25; transcribed as part of the 35S rRNA precursor transcript; forms a stem-loop structure that is required for processing of the precursor transcript -S000036852 internal_transcribed_spacer_region ITS2-1 12 455413 455182 C 2011-02-03 2004-03-04 -S000028676 ORF Dubious YLR154W-E chromosome 12 12 455433 455636 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 35S rRNA gene on the opposite strand -S000032527 CDS YLR154W-E 12 455433 455636 W 2011-02-03 2003-07-29 -S000006488 rRNA_gene RDN58-1 RDN58-1 RDN58 chromosome 12 12 455571 455414 C 2011-02-03 2000-05-19 5.8S ribosomal RNA (5.8S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript; 3' end formation involves processing by the exosome complex while 5' end is generated by Kem1p and Rat1p -S000033911 noncoding_exon RDN58-1 12 455571 455414 C 2011-02-03 2000-05-19 -S000028843 ORF Dubious YLR154W-F chromosome 12 12 455883 456023 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 35S rRNA gene on the opposite strand -S000034528 CDS YLR154W-F 12 455883 456023 W 2011-02-03 2003-07-29 -S000029715 rRNA_gene ITS1-1 ITS1-1 ITS1 chromosome 12 12 455932 455572 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN18; transcribed as part of the 35S rRNA precursor transcript; excision during transcript maturation is coupled with processing of the 3' external transcribed spacer (3'ETS) -S000036841 internal_transcribed_spacer_region ITS1-1 12 455932 455572 C 2011-02-03 2004-03-04 -S000006482 rRNA_gene RDN18-1 RDN18-1 RDN18 chromosome 12 12 457732 455933 C 2011-02-03 2000-05-19 18S ribosomal RNA (18S rRNA); component of the small (40S) ribosomal subunit; involved in codon recognition by tRNAs or the release factor eRF1 (Sup45p); encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript -S000033329 noncoding_exon RDN18-1 12 457732 455933 C 2011-02-03 2000-05-19 -S000006486 rRNA_gene RDN37-1 RDN37-1 RDN37 chromosome 12 12 458432 451575 C 2011-02-03 1997-07-30 35S ribosomal RNA (35S rRNA) transcript; encoded by the RDN1 locus; processed into the 25S, 18S and 5.8S rRNAs (represented by the RDN25, RDN18, and RDN58 loci) -S000032929 external_transcribed_spacer_region RDN37-1 12 451785 451575 C 2011-02-03 2000-05-19 -S000032923 external_transcribed_spacer_region RDN37-1 12 458432 457733 C 2011-02-03 2000-05-19 -S000032927 internal_transcribed_spacer_region RDN37-1 12 455413 455182 C 2011-02-03 2000-05-19 -S000032925 internal_transcribed_spacer_region RDN37-1 12 455932 455572 C 2011-02-03 2000-05-19 -S000032928 noncoding_exon RDN37-1 12 455181 451786 C 2011-02-03 2000-05-19 -S000032926 noncoding_exon RDN37-1 12 455571 455414 C 2011-02-03 2000-05-19 -S000032924 noncoding_exon RDN37-1 12 457732 455933 C 2011-02-03 2000-05-19 -S000029717 rRNA_gene ETS1-1 ETS1-1 5' ETS chromosome 12 12 458432 457733 C 2011-02-03 2004-03-04 Non-coding region located immediately upstream of RDN18; transcribed as part of the 35S rRNA precursor transcript; contains an essential U3 snoRNA binding site required for maturation of 18S rRNA -S000036853 external_transcribed_spacer_region ETS1-1 12 458432 457733 C 2011-02-03 2004-03-04 -S000120636 ARS ARS1200-1 ARSXII-459|ARS1216.5|rDNA ARS chromosome 12 12 458991 459097 2011-02-03 2007-02-06 Chromosomal origin of bidirectional DNA replication; an rDNA ARS is presumed to be present in each tandem rDNA repeat, but fewer than one-third of the rDNA ARSs are actually used as replication origins in a given S phase -S000120639 ARS_consensus_sequence ARS1200-1 12 459088 459078 C 2011-02-03 2007-02-06 -S000029329 rRNA_gene NTS2-1 NTS2-1 chromosome 12 L000003944 12 459675 458433 C 2011-02-03 2003-12-09 Nontranscribed region of the rDNA repeat; located between RND5 and the 5'ETS; contains RNA polymerase I termination site -S000032460 non_transcribed_region NTS2-1 12 459675 458433 C 2011-02-03 2003-12-09 -S000006479 rRNA_gene RDN5-1 RDN5-1 MOF9|RDN5 chromosome 12 L000004821|S000029304 12 459676 459796 W 2011-02-03 2000-05-19 5S ribosomal RNA (5S rRNA); only complete sequence of 6 repeated RDN5 alleles; able to support viability when provided as sole form of 5S rRNA; component of the large (60S) ribosomal subunit; localized to the nucleolus via interaction with Rpl5p; may play a role in translational frame fidelity; transcription is mediated by PolIII and activated by TFIIIA and TFIIIE -S000031406 noncoding_exon RDN5-1 12 459676 459796 W 2011-02-03 2000-05-19 -S000029714 rRNA_gene NTS1-2 NTS1-2 NTS1 chromosome 12 12 460711 459797 C 2011-02-03 2004-03-04 Non-transcribed region of the rDNA repeat between the 3' ETS and RDN5; required for rDNA repeat expansion -S000036840 non_transcribed_region NTS1-2 12 460711 459797 C 2011-02-03 2004-03-04 -S000029713 rRNA_gene ETS2-2 ETS2-2 3' ETS chromosome 12 12 460922 460712 C 2011-02-03 2004-03-04 Non-coding region located adjacent to RDN25; transcribed as part of the 35S rRNA precursor transcript; contains the primary rRNA transcription termination site at +93 and a secondary termination site between +211 and +250 -S000036839 external_transcribed_spacer_region ETS2-2 12 460922 460712 C 2011-02-03 2004-03-04 -S000028561 ORF Uncharacterized YLR154C-G chromosome 12 12 462671 462522 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; this ORF is contained within RDN25-2 and RDN37-2 -S000031267 CDS YLR154C-G 12 462671 462522 C 2011-02-03 2003-07-29 -S000006485 rRNA_gene RDN25-2 RDN25-2 26S rRNA|RDN25 chromosome 12 12 464318 460923 C 2011-02-03 2000-05-19 25S ribosomal RNA (25S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript; formed by endonucleolytic cleavage at the C2 site of internal transcribed spacer 2 (ITS2) -S000032336 noncoding_exon RDN25-2 12 464318 460923 C 2011-02-03 2000-05-19 -S000029712 rRNA_gene ITS2-2 ITS2-2 ITS2 chromosome 12 12 464550 464319 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN25; transcribed as part of the 35S rRNA precursor transcript; forms a stem-loop structure required for processing of the precursor transcript -S000036837 internal_transcribed_spacer_region ITS2-2 12 464550 464319 C 2011-02-03 2004-03-04 -S000006489 rRNA_gene RDN58-2 RDN58-2 RDN58 chromosome 12 12 464708 464551 C 2011-02-03 2000-05-19 5.8S ribosomal RNA (5.8S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) -S000033912 noncoding_exon RDN58-2 12 464708 464551 C 2011-02-03 2000-05-19 -S000029709 rRNA_gene ITS1-2 ITS1-2 ITS1 chromosome 12 12 465069 464709 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN18; transcribed as part of the 35S rRNA precursor transcript; excision during transcript maturation is coupled with processing of the 3' external transcribed spacer (3' ETS) -S000036833 internal_transcribed_spacer_region ITS1-2 12 465069 464709 C 2011-02-03 2004-03-04 -S000006483 rRNA_gene RDN18-2 RDN18-2 RDN18 chromosome 12 12 466869 465070 C 2011-02-03 2000-05-19 18S ribosomal RNA (18S rRNA); component of the small (40S) ribosomal subunit; involved in codon recognition by tRNAs or the release factor eRF1 (Sup45p); encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript -S000033332 noncoding_exon RDN18-2 12 466869 465070 C 2011-02-03 2000-05-19 -S000006487 rRNA_gene RDN37-2 RDN37-2 RDN37 chromosome 12 12 467569 460712 C 2011-02-03 1997-07-30 35S ribosomal RNA (35S rRNA) transcript; encoded by the RDN1 locus; processed into the 25S, 18S and 5.8S rRNAs (represented by the RDN25, RDN18, and RDN58 loci) -S000032939 external_transcribed_spacer_region RDN37-2 12 460922 460712 C 2011-02-03 2000-05-19 -S000032933 external_transcribed_spacer_region RDN37-2 12 467569 466870 C 2011-02-03 2000-05-19 -S000032937 internal_transcribed_spacer_region RDN37-2 12 464550 464319 C 2011-02-03 2000-05-19 -S000032935 internal_transcribed_spacer_region RDN37-2 12 465069 464709 C 2011-02-03 2000-05-19 -S000032938 noncoding_exon RDN37-2 12 464318 460923 C 2011-02-03 2000-05-19 -S000032936 noncoding_exon RDN37-2 12 464708 464551 C 2011-02-03 2000-05-19 -S000032934 noncoding_exon RDN37-2 12 466869 465070 C 2011-02-03 2000-05-19 -S000029707 rRNA_gene ETS1-2 ETS1-2 5' ETS chromosome 12 12 467569 466870 C 2011-02-03 2004-03-04 Non-coding region located immediately upstream of RDN18; transcribed as part of the 35S rRNA precursor transcript; contains an essential U3 snoRNA binding site required for maturation of 18S rRNA -S000036830 external_transcribed_spacer_region ETS1-2 12 467569 466870 C 2011-02-03 2004-03-04 -S000120655 ARS ARS1200-2 ARSXII-468|rDNA ARS chromosome 12 12 468128 468234 2011-02-03 2007-02-06 Chromosomal origin of bidirectional DNA replication; an rDNA ARS is presumed to be present in each tandem rDNA repeat, but fewer than one-third of the rDNA ARSs are actually used as replication origins in a given S phase -S000120656 ARS_consensus_sequence ARS1200-2 12 468225 468215 C 2011-02-03 2007-02-06 -S000029706 rRNA_gene NTS2-2 NTS2-2 NTS2 chromosome 12 12 468812 467570 C 2011-02-03 2004-03-04 Non-transcribed region of the rDNA repeat; located between RDN5 and the 5' ETS -S000036829 non_transcribed_region NTS2-2 12 468812 467570 C 2011-02-03 2004-03-04 -S000006480 rRNA_gene RDN5-2 RDN5-2 RDN5 chromosome 12 12 468813 468931 W 2011-02-03 1997-07-30 Variant 5S ribosomal rRNA (5S rRNA) gene; located within the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-3, RDN5-4, and RDN5-5 -S000031412 noncoding_exon RDN5-2 12 468813 468931 W 2011-02-03 2000-05-19 -S000028562 ORF Uncharacterized YLR154C-H chromosome 12 12 468958 468827 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; this ORF partially overlaps RDN5-2; YLR154C-H has a paralog, YLR157C-C, that arose from a segmental duplication -S000031268 CDS YLR154C-H 12 468958 468827 C 2011-02-03 2003-07-29 -S000004145 ORF Verified YLR155C ASP3-1 asparaginase ASP3-1|ASP3 chromosome 12 L000000130 12 470405 469317 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-1 has a paralog, ASP3-3, that arose from a segmental duplication -S000037563 CDS YLR155C 12 470405 469317 C 2011-02-03 1996-07-31 -S000004146 ORF Uncharacterized YLR156W chromosome 12 12 472113 472457 W 2011-02-03 1996-07-31 Putative protein of unknown function; exhibits a two-hybrid interaction with Jsn1p in a large-scale analysis; YLR156W has a paralog, YLR159W, that arose from a segmental duplication -S000030409 CDS YLR156W 12 472113 472457 W 2011-02-03 1996-07-31 -S000006481 rRNA_gene RDN5-3 RDN5-3 RDN5 chromosome 12 12 472465 472583 W 2011-02-03 1997-07-30 Variant 5S ribosomal RNA (5S rRNA) gene; located at a site distal to the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-2, RDN5-4, and RDN5-5 -S000031417 noncoding_exon RDN5-3 12 472465 472583 W 2011-02-03 2000-05-19 -S000028564 ORF Uncharacterized YLR156C-A chromosome 12 12 472610 472479 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; partially overlaps RND5-3; YLR156C-A has a paralog, YLR159C-A, that arose from a segmental duplication -S000031270 CDS YLR156C-A 12 472610 472479 C 2011-02-03 2003-07-29 -S000004147 ORF Verified YLR157C ASP3-2 asparaginase ASP3-2|ASP3 chromosome 12 12 474057 472969 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-2 has a paralog, ASP3-4, that arose from a segmental duplication -S000030487 CDS YLR157C 12 474057 472969 C 2011-02-03 1996-07-31 -S000028677 ORF Uncharacterized YLR157W-D YLR157W-A chromosome 12 12 475764 475976 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; YLR157W-D has a paralog, YLR161W, that arose from a segmental duplication -S000032531 CDS YLR157W-D 12 475764 475976 W 2011-02-03 2003-07-29 -S000007068 long_terminal_repeat YLRCdelta7 chromosome 12 12 476310 475976 C 2011-02-03 2000-05-19 Ty1 LTR -S000007374 transposable_element_gene YLR157C-B gag-pol fusion protein chromosome 12 12 481601 476333 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000035905 CDS YLR157C-B 12 480295 476333 C 2011-02-03 1999-07-17 -S000035904 CDS YLR157C-B 12 481601 480297 C 2011-02-03 1999-07-17 -S000035906 plus_1_translational_frameshift YLR157C-B 12 480296 480296 C 2011-02-03 1999-07-17 -S000007373 transposable_element_gene YLR157C-A gag protein chromosome 12 12 481601 480279 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035900 CDS YLR157C-A 12 481601 480279 C 2011-02-03 1999-07-17 -S000028678 ORF Uncharacterized YLR157W-E YLR157W-B|YLR157W-C chromosome 12 12 481873 482037 W 2011-02-03 2003-07-29 Putative protein of unknown function identified by gene-trapping; microarray-based expression analysis, and genome-wide homology searching; partially overlaps a Ty1 element -S000032535 CDS YLR157W-E 12 481873 482037 W 2011-02-03 2003-07-29 -S000007081 LTR_retrotransposon YLRCTy1-1 Ty1 chromosome 12 12 481897 475976 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007069 long_terminal_repeat YLRCdelta8 chromosome 12 12 481897 481563 C 2011-02-03 2000-05-19 Ty1 LTR -S000029708 rRNA_gene RDN5-4 RDN5-4 RDN5 chromosome 12 12 482045 482163 W 2011-02-03 2004-03-04 Variant 5S ribosomal rRNA (5S rRNA) gene; located at a site distal to the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-2, RDN5-3, and RDN5-5 -S000036831 noncoding_exon RDN5-4 12 482045 482163 W 2011-02-03 2004-03-04 -S000028565 ORF Uncharacterized YLR157C-C chromosome 12 12 482190 482059 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; this ORF partially overlaps RDN5-4; YLR157C-C has a paralog, YLR154C-H, that arose from a segmental duplication -S000031271 CDS YLR157C-C 12 482190 482059 C 2011-02-03 2003-07-29 -S000004148 ORF Verified YLR158C ASP3-3 asparaginase ASP3-3|ASP3 chromosome 12 12 483637 482549 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-3 has a paralog, ASP3-1, that arose from a segmental duplication -S000030598 CDS YLR158C 12 483637 482549 C 2011-02-03 1996-07-31 -S000004149 ORF Uncharacterized YLR159W chromosome 12 12 485345 485689 W 2011-02-03 1996-07-31 Putative protein of unknown function; YLR156W, YLR159W, and YLR161W are three identical open reading frames in S288C encoded near the ribosomal DNA region of chromosome 12; YLR159W has a paralog, YLR156W, that arose from a segmental duplication -S000031528 CDS YLR159W 12 485345 485689 W 2011-02-03 1996-07-31 -S000029710 rRNA_gene RDN5-5 RDN5-5 RDN5 chromosome 12 12 485697 485815 W 2011-02-03 2004-03-04 Variant 5S ribosomal rRNA (5S rRNA) gene; located at a site distal to the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-2, RDN5-3, and RDN5-4 -S000036834 noncoding_exon RDN5-5 12 485697 485815 W 2011-02-03 2004-03-04 -S000028566 ORF Uncharacterized YLR159C-A chromosome 12 12 485842 485711 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; partially overlaps RND5-5; YLR159C-A has a paralog, YLR156C-A, that arose from a segmental duplication -S000031272 CDS YLR159C-A 12 485842 485711 C 2011-02-03 2003-07-29 -S000004150 ORF Verified YLR160C ASP3-4 asparaginase ASP3-4|ASP3 chromosome 12 12 487289 486201 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-4 has a paralog, ASP3-2, that arose from a segmental duplication -S000031490 CDS YLR160C 12 487289 486201 C 2011-02-03 1996-07-31 -S000004151 ORF Uncharacterized YLR161W chromosome 12 12 488997 489341 W 2011-02-03 1996-07-31 Putative protein of unknown function; YLR156W, YLR159W, and YLR161W are three identical open reading frames in S288C encoded near the ribosomal DNA region of chromosome 12; YLR161W has a paralog, YLR157W-D, that arose from a segmental duplication -S000031592 CDS YLR161W 12 488997 489341 W 2011-02-03 1996-07-31 -S000029711 rRNA_gene RDN5-6 RDN5-6 RDN5 chromosome 12 12 489349 489469 W 2011-02-03 2004-03-04 Variant 5S ribosomal rRNA (5S rRNA) gene; located at a site distal to the RDN1 locus -S000036835 noncoding_exon RDN5-6 12 489349 489469 W 2011-02-03 2004-03-04 -S000004152 ORF Verified YLR162W chromosome 12 12 489573 489929 W 2011-02-03 1996-07-31 Protein of unknown function; overexpression confers resistance to the antimicrobial peptide MiAMP1 and causes growth arrest, apoptosis, and increased sensitivity to cobalt chloride -S000032571 CDS YLR162W 12 489573 489929 W 2011-02-03 1996-07-31 -S000028567 ORF Uncharacterized YLR162W-A RRT15 chromosome 12 12 490406 490594 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; identified in a screen for mutants with decreased levels of rDNA transcription -S000031273 CDS YLR162W-A 12 490406 490594 W 2011-02-03 2003-07-29 -S000028844 ORF Dubious YLR163W-A chromosome 12 12 492812 492925 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034529 CDS YLR163W-A 12 492812 492925 W 2011-02-03 2003-07-29 -S000004153 ORF Verified YLR163C MAS1 MIF1 chromosome 12 L000001026|L000001108 12 493254 491866 C 2011-02-03 1996-07-31 Beta subunit of the mitochondrial processing protease (MPP); essential processing enzyme that cleaves the N-terminal targeting sequences from mitochondrially imported proteins -S000032649 CDS YLR163C 12 493254 491866 C 2011-02-03 1996-07-31 -S000004154 ORF Verified YLR164W SHH4 protein SHH4 chromosome 12 12 493883 494389 W 2011-02-03 1996-07-31 Putative alternate subunit of succinate dehydrogenase (SDH); mitochondrial inner membrane protein; genetic interaction with SDH4 suggests that Shh4p can function as a functional SDH subunit; a fraction copurifies with SDH subunit Sdh3p; expression induced by nitrogen limitation in a GLN3, GAT1-dependent manner; Shh4p has greater similarity to human SDHD (subunit D of SDH, implicated in paraganglioma) than does its paralog Sdh4p -S000032792 CDS YLR164W 12 493883 494389 W 2011-02-03 1996-07-31 -S000004155 ORF Verified YLR165C PUS5 pseudouridine synthase PUS5 chromosome 12 12 495258 494494 C 2011-02-03 1996-07-31 Pseudouridine synthase; catalyzes only the formation of pseudouridine (Psi)-2819 in mitochondrial 21S rRNA; not essential for viability -S000032861 CDS YLR165C 12 495258 494494 C 2011-02-03 1996-07-31 -S000004156 ORF Verified YLR166C SEC10 exocyst subunit SEC10 chromosome 12 L000003428 12 498044 495429 C 2011-02-03 1996-07-31 Essential 100kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion -S000033562 CDS YLR166C 12 498044 495429 C 2011-02-03 1996-07-31 -S000004157 ORF Verified YLR167W RPS31 eS31|ubiquitin-ribosomal 40S subunit protein S31 fusion protein|S31e|UB13|YS24|S37|S31|UBI3|RPS37 chromosome 12 L000001768|L000002413 12 498947 499405 W 2011-02-03 1996-07-31 Fusion protein cleaved to yield ribosomal protein S31 and ubiquitin; ubiquitin may facilitate assembly of the ribosomal protein into ribosomes; interacts genetically with translation factor eIF2B; homologous to mammalian ribosomal protein S27A, no bacterial homolog -S000033714 CDS YLR167W 12 498947 499405 W 2011-02-03 1996-07-31 -S000004158 ORF Verified YLR168C UPS2 GEP1|AIM30|MSF1|MSF1' chromosome 12 12 500270 499578 C 2011-02-03 1996-07-31 Mitochondrial intermembrane space protein; involved in phospholipid metabolism; forms complex with Mdm35p that transfers phosphatidylserine from outer membrane to inner membrane for phosphatidylethanolamine synthesis; null mutant has defects in mitochondrial morphology; similar to Ups1p, Ups3p and to human PRELI; UPS2 has a paralog, UPS3, that arose from the whole genome duplication -S000033771 CDS YLR168C 12 500270 499578 C 2011-02-03 1996-07-31 -S000004159 ORF Dubious YLR169W chromosome 12 12 500335 500688 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034750 CDS YLR169W 12 500335 500688 W 2011-02-03 1996-07-31 -S000004161 ORF Dubious YLR171W chromosome 12 12 500733 501122 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035908 CDS YLR171W 12 500733 501122 W 2011-02-03 1996-07-31 -S000004160 ORF Verified YLR170C APS1 YAP19 chromosome 12 L000002493 12 501049 500579 C 2011-02-03 1996-07-31 Small subunit of the clathrin-associated adaptor complex AP-1; AP-1 is involved in protein sorting at the trans-Golgi network; homolog of the sigma subunit of the mammalian clathrin AP-1 complex -S000035745 CDS YLR170C 12 501049 500579 C 2011-02-03 1996-07-31 -S000004162 ORF Verified YLR172C DPH5 diphthine synthase chromosome 12 L000000523 12 502162 501260 C 2011-02-03 1996-07-31 Methyltransferase required for synthesis of diphthamide; diphthamide is a modified histidine residue of translation elongation factor 2 (Eft1p or Eft2p); not essential for viability; GFP-Dph5p fusion protein localizes to the cytoplasm -S000035977 CDS YLR172C 12 502162 501260 C 2011-02-03 1996-07-31 -S000004163 ORF Uncharacterized YLR173W chromosome 12 12 502421 504247 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000036883 CDS YLR173W 12 502421 504247 W 2011-02-03 1996-07-31 -S000004164 ORF Verified YLR174W IDP2 isocitrate dehydrogenase (NADP(+)) IDP2 chromosome 12 L000002737 12 504591 505829 W 2011-02-03 1996-07-31 Cytosolic NADP-specific isocitrate dehydrogenase; catalyzes oxidation of isocitrate to alpha-ketoglutarate; levels are elevated during growth on non-fermentable carbon sources and reduced during growth on glucose; IDP2 has a paralog, IDP3, that arose from the whole genome duplication -S000036934 CDS YLR174W 12 504591 505829 W 2011-02-03 1996-07-31 -S000004165 ORF Verified YLR175W CBF5 pseudouridine synthase CBF5 chromosome 12 L000000223 12 506134 507585 W 2011-02-03 1996-07-31 Pseudouridine synthase catalytic subunit of box H/ACA snoRNPs; acts on large and small rRNAs, on snRNA U2, and on some mRNAs; mutations in human ortholog dyskerin cause the disorder dyskeratosis congenita; small nucleolar ribonucleoprotein particles are also known as snoRNPs -S000037702 CDS YLR175W 12 506134 507585 W 2011-02-03 1996-07-31 -S000004166 ORF Verified YLR176C RFX1 CRT1 chromosome 12 L000004129 12 510232 507797 C 2011-02-03 1996-07-31 Major transcriptional repressor of DNA-damage-regulated genes; recruits repressors Tup1p and Cyc8p to their promoters; involved in DNA damage and replication checkpoint pathway; similar to a family of mammalian DNA binding RFX1-4 proteins -S000037720 CDS YLR176C 12 510232 507797 C 2011-02-03 1996-07-31 -S000004167 ORF Uncharacterized YLR177W chromosome 12 12 511054 512940 W 2011-02-03 1996-07-31 Putative protein of unknown function; phosphorylated by Dbf2p-Mob1p in vitro; some strains contain microsatellite polymophisms at this locus; not an essential gene; YLR177W has a paralog, PSP1, that arose from the whole genome duplication -S000037859 CDS YLR177W 12 511054 512940 W 2011-02-03 1996-07-31 -S000118476 ARS ARS1217 ARSXII-513 chromosome 12 12 512867 513115 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178138 ARS_consensus_sequence ARS1217 12 513086 513070 C 2014-11-18 2014-11-18 -S000004168 ORF Verified YLR178C TFS1 DKA1 chromosome 12 L000002291 12 513821 513162 C 124 2011-02-03 1996-07-31 Inhibitor of carboxypeptidase Y (Prc1p), and Ras GAP (Ira2p); phosphatidylethanolamine-binding protein (PEBP) family member and ortholog of hPEBP1/RKIP, a natural metastasis suppressor; targets to vacuolar membranes during stationary phase; acetylated by NatB N-terminal acetyltransferase; protein abundance increases in response to DNA replication stress -S000037879 CDS YLR178C 12 513821 513162 C 2011-02-03 1996-07-31 -S000004169 ORF Verified YLR179C chromosome 12 12 514713 514108 C 2011-02-03 1996-07-31 Protein of unknown function with similarity to Tfs1p; transcription is activated by paralogous proteins Yrm1p and Yrr1p along with proteins involved in multidrug resistance; GFP-tagged protein localizes to the cytoplasm and nucleus -S000030817 CDS YLR179C 12 514713 514108 C 2011-02-03 1996-07-31 -S000004170 ORF Verified YLR180W SAM1 methionine adenosyltransferase SAM1|ETH10 chromosome 12 L000001798 12 515262 516410 W 2011-02-03 1996-07-31 S-adenosylmethionine synthetase; catalyzes transfer of the adenosyl group of ATP to the sulfur atom of methionine; SAM1 has a paralog, SAM2, that arose from the whole genome duplication -S000031889 CDS YLR180W 12 515262 516410 W 2011-02-03 1996-07-31 -S000004171 ORF Verified YLR181C VTA1 chromosome 12 12 517670 516678 C 2011-02-03 1996-07-31 Multivesicular body (MVB) protein; involved in endosomal protein sorting; regulates Vps4p activity by promoting its oligomerization; has an N-terminal Vps60- and Did2- binding domain, a linker region, and a C-terminal Vps4p binding domain -S000031945 CDS YLR181C 12 517670 516678 C 2011-02-03 1996-07-31 -S000004172 ORF Verified YLR182W SWI6 transcriptional regulator SWI6|SDS11|PSL8 chromosome 12 L000002254 12 517940 520351 W 2011-02-03 1996-07-31 Transcription cofactor; forms complexes with Swi4p and Mbp1p to regulate transcription at the G1/S transition; involved in meiotic gene expression; also binds Stb1p to regulate transcription at START; cell wall stress induces phosphorylation by Mpk1p, which regulates Swi6p localization; required for the unfolded protein response, independently of its known transcriptional coactivators -S000032961 CDS YLR182W 12 517940 520351 W 2011-02-03 1996-07-31 -S000004173 ORF Verified YLR183C TOS4 chromosome 12 12 522012 520543 C 2011-02-03 1996-07-31 Putative transcription factor, contains Forkhead Associated domain; binds chromatin; involved in expression homeostasis, buffering of mRNA synthesis rate against gene dosage changes during S phase; target of SBF transcription factor; expression is periodic and peaks in G1; involved in DNA replication checkpoint response; interacts with Rpd3 and Set3 histone deacetylase complexes; APCC(Cdh1) substrate; relative distribution to nucleus increases upon DNA replication stress -S000032995 CDS YLR183C 12 522012 520543 C 2011-02-03 1996-07-31 -S000004174 ORF Dubious YLR184W chromosome 12 12 522106 522453 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033139 CDS YLR184W 12 522106 522453 W 2011-02-03 1996-07-31 -S000004175 ORF Verified YLR185W RPL37A eL37|ribosomal 60S subunit protein L37A|L37e|YL35|L43|L37A chromosome 12 L000002884 12 522663 523288 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L37A; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; homologous to mammalian ribosomal protein L37, no bacterial homolog; RPL37A has a paralog, RPL37B, that arose from the whole genome duplication -S000033905 CDS YLR185W 12 522663 522669 W 2011-02-03 1996-07-31 -S000033906 CDS YLR185W 12 523029 523288 W 2011-02-03 1996-07-31 -S000033907 intron YLR185W 12 522670 523028 W 2011-02-03 1996-07-31 -S000004176 ORF Verified YLR186W EMG1 18S rRNA pseudouridine methyltransferase|NEP1 chromosome 12 12 523632 524390 W 2011-02-03 1996-07-31 Methyltransferase for rRNA; methylates pseudouridine 18S rRNA residue 1191; member of the SPOUT methyltransferase family; required for maturation of 18S rRNA and for 40S ribosomal subunit production independent of methyltransferase activity; forms homodimers; human ortholog is mutated in Bowen-Conradi syndrome, and equivalent yeast mutation affects Emg1p dimerization and localization but not methyltransferase activity; human EMG1 complements lethality of null and ts mutant -S000034031 CDS YLR186W 12 523632 524390 W 2011-02-03 1996-07-31 -S000004177 ORF Verified YLR187W SKG3 chromosome 12 12 524865 527945 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery, cytoplasm, bud, and bud neck; potential Cdc28p substrate; similar to Skg4p; relocalizes from bud neck to cytoplasm upon DNA replication stress; SKG3 has a paralog, CAF120, that arose from the whole genome duplication -S000034134 CDS YLR187W 12 524865 527945 W 2011-02-03 1996-07-31 -S000004178 ORF Verified YLR188W MDL1 ATP-binding cassette permease MDL1 chromosome 12 L000001049 12 528300 530387 W 2011-02-03 1996-07-31 Mitochondrial inner membrane half-type ABC transporter; mediates export of peptides generated upon proteolysis of mitochondrial proteins; plays a role in the regulation of cellular resistance to oxidative stress -S000034239 CDS YLR188W 12 528300 530387 W 2011-02-03 1996-07-31 -S000004179 ORF Verified YLR189C ATG26 UGT51 chromosome 12 L000004808 12 534393 530797 C 2011-02-03 1996-07-31 UDP-glucose:sterol glucosyltransferase; conserved enzyme involved in synthesis of sterol glucoside membrane lipids; in contrast to ATG26 from P. pastoris, S. cerevisiae ATG26 is not involved in autophagy -S000035108 CDS YLR189C 12 534393 530797 C 2011-02-03 1996-07-31 -S000004180 ORF Verified YLR190W MMR1 chromosome 12 12 535214 536689 W 2011-02-03 1996-07-31 Phosphorylated protein of the mitochondrial outer membrane; localizes only to mitochondria of the bud; interacts with Myo2p to mediate mitochondrial distribution to buds; mRNA is targeted to the bud via the transport system involving She2p -S000036058 CDS YLR190W 12 535214 536689 W 2011-02-03 1996-07-31 -S000004181 ORF Verified YLR191W PEX13 peroxin PEX13|PAS20 chromosome 12 L000003024 12 537272 538432 W 2011-02-03 1996-07-31 Peroxisomal importomer complex component; integral peroxisomal membrane protein required for docking and translocation of peroxisomal matrix proteins; interacts with the PTS1 signal recognition factor Pex5p and the PTS2 signal recognition factor Pex7p; forms a complex with Pex14p and Pex17p; human homolog PEX13 complements yeast null mutant -S000036199 CDS YLR191W 12 537272 538432 W 2011-02-03 1996-07-31 -S000004182 ORF Verified YLR192C HCR1 translation initiation factor eIF3 core subunit j chromosome 12 S000007439 12 539589 538792 C 2011-02-03 1996-07-31 eIF3j component of translation initiation factor 3 (eIF3); dual function protein involved in translation initiation as a substoichiometric component (eIF3j) of eIF3; required for 20S pre-rRNA processing; required at post-transcriptional step for efficient retrotransposition; absence decreases Ty1 Gag:GFP protein levels; binds eIF3 subunits Rpg1p, Prt1p and 18S rRNA; eIF3 also involved in programmed stop codon read through; human homolog EIF3J can complement yeast hcr1 mutant -S000036241 CDS YLR192C 12 539589 538792 C 2011-02-03 1996-07-31 -S000004183 ORF Verified YLR193C UPS1 chromosome 12 12 540536 540009 C 2011-02-03 1996-07-31 Phosphatidic acid transfer protein; plays a role in phospholipid metabolism by transporting phosphatidic acid from the outer to the inner mitochondrial membrane; localizes to the mitochondrial intermembrane space; null mutant has altered cardiolipin and phosphatidic acid levels; ortholog of human PRELI -S000031730 CDS YLR193C 12 540536 540009 C 2011-02-03 1996-07-31 -S000004184 ORF Verified YLR194C NCW2 chromosome 12 12 541573 540809 C 2011-02-03 1996-07-31 Structural constituent of the cell wall; attached to the plasma membrane by a GPI-anchor; expression is upregulated in response to cell wall stress; null mutant is sensitive to the antifungal agent polyhexamethylene biguanide, resistant to zymolyase treatment and has increased chitin deposition -S000031877 CDS YLR194C 12 541573 540809 C 2011-02-03 1996-07-31 -S000004185 ORF Verified YLR195C NMT1 glycylpeptide N-tetradecanoyltransferase NMT1|CDC72 chromosome 12 L000001259 12 543304 541937 C 142 2011-02-03 1996-07-31 N-myristoyl transferase; catalyzes the cotranslational, covalent attachment of myristic acid to the N-terminal glycine residue of several proteins involved in cellular growth and signal transduction -S000031996 CDS YLR195C 12 543304 541937 C 2011-02-03 1996-07-31 -S000004186 ORF Verified YLR196W PWP1 rRNA-processing protein PWP1 chromosome 12 L000001539 12 543968 545698 W 2011-02-03 1996-07-31 Protein with WD-40 repeats involved in rRNA processing; associates with trans-acting ribosome biogenesis factors; similar to beta-transducin superfamily -S000037527 CDS YLR196W 12 543968 545698 W 2011-02-03 1996-07-31 -S000004187 ORF Verified YLR197W NOP56 snoRNP complex protein NOP56|SIK1 chromosome 12 L000002982 12 546097 547611 W 2011-02-03 1996-07-31 Essential evolutionarily-conserved nucleolar protein; component of the box C/D snoRNP complexes that direct 2'-O-methylation of pre-rRNA during its maturation; overexpression causes spindle orientation defects -S000037605 CDS YLR197W 12 546097 547611 W 2011-02-03 1996-07-31 -S000004188 ORF Dubious YLR198C chromosome 12 12 547645 547286 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SIK1/YLR197W -S000037636 CDS YLR198C 12 547645 547286 C 2011-02-03 1996-07-31 -S000004189 ORF Verified YLR199C PBA1 POC1 chromosome 12 12 548769 547853 C 2011-02-03 2003-09-27|1996-07-31 Protein involved in 20S proteasome assembly; forms a heterodimer with Add66p that binds to proteasome precursors; interaction with Pba1p-Add66p may affect function of the mature proteasome and its role in maintaining respiratory metabolism; similar to human PAC1 constituent of the PAC1-PAC2 complex involved in proteasome assembly -S000030462 CDS YLR199C 12 548677 547853 C 2011-02-03 2003-09-27|1996-07-31 -S000030461 CDS YLR199C 12 548769 548764 C 2011-02-03 2003-09-27 -S000030463 intron YLR199C 12 548763 548678 C 2011-02-03 2003-09-27 -S000004190 ORF Verified YLR200W YKE2 tubulin-binding prefolding complex subunit YKE2|PFD6|GIM1 chromosome 12 L000002791 12 549012 549356 W 2011-02-03 1996-07-31 Subunit of the heterohexameric Gim/prefoldin protein complex; involved in the folding of alpha-tubulin, beta-tubulin, and actin; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation -S000036300 CDS YLR200W 12 549012 549356 W 2011-02-03 1996-07-31 -S000004191 ORF Verified YLR201C COQ9 ubiquinone biosynthesis protein COQ9|FMP53 chromosome 12 12 550293 549511 C 2011-02-03 1996-07-31 Protein required for ubiquinone biosynthesis and respiratory growth; localizes to matrix face of mitochondrial inner membrane in a large complex with ubiquinone biosynthetic enzymes; ubiquinone is also known as coenzyme Q; human homolog COQ9 can complement yeast coq9 null mutant -S000036362 CDS YLR201C 12 550293 549511 C 2011-02-03 1996-07-31 -S000004192 ORF Dubious YLR202C chromosome 12 12 550636 550194 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YLR201C; ORF contains a putative intron -S000037015 CDS YLR202C 12 550458 550194 C 2011-02-03 1996-07-31 -S000037014 CDS YLR202C 12 550636 550575 C 2011-02-03 1996-07-31 -S000037016 intron YLR202C 12 550574 550459 C 2011-02-03 1996-07-31 -S000004193 ORF Verified YLR203C MSS51 chromosome 12 L000001205 12 551960 550650 C 149 2011-02-03 1996-07-31 Specific translational activator for the mitochondrial COX1 mRNA; loosely associated with the matrix face of the mitochondrial inner membrane; localizes to vacuole membrane in response to H2O2; influences both COX1 mRNA translation and Cox1p assembly into cytochrome c oxidase; binds to heme B, which may be a mechanism for sensing oxygen levels in order to regulate cytochrome c oxidase biogenesis -S000037086 CDS YLR203C 12 551960 550650 C 2011-02-03 1996-07-31 -S000004194 ORF Verified YLR204W QRI5 COX24 chromosome 12 L000001551 12 552270 552605 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; required for accumulation of spliced COX1 mRNA; may have an additional role in translation of COX1 mRNA -S000037241 CDS YLR204W 12 552270 552605 W 2011-02-03 1996-07-31 -S000004195 ORF Verified YLR205C HMX1 chromosome 12 12 553677 552724 C 2011-02-03 2004-02-05|1996-07-31 ER localized heme oxygenase; involved in heme degradation during iron starvation and in the oxidative stress response; expression is regulated by AFT1 and oxidative stress; relocates to the perinuclear region in the presence of oxidants -S000037310 CDS YLR205C 12 553677 552724 C 2011-02-03 2004-02-05|1996-07-31 -S000004196 ORF Verified YLR206W ENT2 epsin chromosome 12 12 554578 556419 W 2011-02-03 1996-07-31 Epsin-like protein required for endocytosis and actin patch assembly; functionally redundant with Ent1p; contains clathrin-binding motif at C-terminus; ENT2 has a paralog, ENT1, that arose from the whole genome duplication -S000030027 CDS YLR206W 12 554578 556419 W 2011-02-03 1996-07-31 -S000004197 ORF Verified YLR207W HRD3 ubiquitin ligase complex subunit HRD3 chromosome 12 L000003040 12 556788 559289 W 2011-02-03 1996-07-31 ER membrane protein that plays a central role in ERAD; forms HRD complex with Hrd1p and ER-associated protein degradation (ERAD) determinants that engages in lumen to cytosol communication and coordination of ERAD events -S000030185 CDS YLR207W 12 556788 559289 W 2011-02-03 1996-07-31 -S000004198 ORF Verified YLR208W SEC13 GTPase-activating protein SEC13|ANU3 chromosome 12 L000001838 12 559551 560444 W 2011-02-03 1996-07-31 Structural component of 3 complexes; subunit of the Nup84p nuclear pore subcomplex that contributes to nucleocytoplasmic transport and NPC biogenesis; subunit of the COPII vesicle coat required for ER-to-Golgi transport; subunit of SEACAT, a subcomplex of the coatomer-related, vacuolar-associated SEA complex, that inhibits the TORC1 inhibitory role of SEACIT (Iml1p-Npr2p-Npr3p), a GAP for Gtr1p, thereby resulting in activation of TORC1 signaling; human SEC13 homolog -S000031129 CDS YLR208W 12 559551 560444 W 2011-02-03 1996-07-31 -S000004199 ORF Verified YLR209C PNP1 purine-nucleoside phosphorylase chromosome 12 12 561732 560797 C 2011-02-03 1996-07-31 Purine nucleoside phosphorylase; specifically metabolizes inosine and guanosine nucleosides; involved in the nicotinamide riboside salvage pathway -S000031185 CDS YLR209C 12 561732 560797 C 2011-02-03 1996-07-31 -S000004200 ORF Verified YLR210W CLB4 B-type cyclin CLB4 chromosome 12 L000000352 12 562008 563390 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the G2/M transition; may be involved in DNA replication and spindle assembly; accumulates during S phase and G2, then targeted for ubiquitin-mediated degradation; CLB4 has a paralog, CLB3, that arose from the whole genome duplication -S000032220 CDS YLR210W 12 562008 563390 W 2011-02-03 1996-07-31 -S000004201 ORF Verified YLR211C ATG38 chromosome 12 12 564531 563792 C 2011-02-03 2000-07-14|1996-07-31 Homodimeric subunit of autophagy-specific PtdIns-3-kinase complex I; required for the integrity of the active PtdIns-3-kinase complex I by maintaining an association between Vps15p-Vps34p and Atg14p-Vps30p subcomplexes; localizes to the pre-autophagosomal structure (PAS) in an Atg14p-dependent manner; ATG38 is non-essential but is required for macroautophagy -S000032247 CDS YLR211C 12 564454 563792 C 2011-02-03 2000-07-14|1996-07-31 -S000032246 CDS YLR211C 12 564531 564514 C 2011-02-03 2000-07-14 -S000032248 intron YLR211C 12 564513 564455 C 2011-02-03 2000-07-14 -S000004202 ORF Verified YLR212C TUB4 gamma-tubulin chromosome 12 L000002751 12 566281 564860 C 2011-02-03 1996-07-31 Gamma-tubulin; involved in nucleating microtubules from both the cytoplasmic and nuclear faces of the spindle pole body; protein abundance increases in response to DNA replication stress -S000032353 CDS YLR212C 12 566281 564860 C 2011-02-03 1996-07-31 -S000004203 ORF Verified YLR213C CRR1 putative glycosylase chromosome 12 S000007422 12 567922 566654 C 2011-02-03 1996-07-31 Putative glycoside hydrolase of the spore wall envelope; required for normal spore wall assembly, possibly for cross-linking between the glucan and chitosan layers; expressed during sporulation -S000033218 CDS YLR213C 12 567922 566654 C 2011-02-03 1996-07-31 -S000004204 ORF Verified YLR214W FRE1 ferric/cupric-chelate reductase chromosome 12 L000000626 12 568567 570627 W 2011-02-03 1996-07-31 Ferric reductase and cupric reductase; reduces siderophore-bound iron and oxidized copper prior to uptake by transporters; expression induced by low copper and iron levels -S000033306 CDS YLR214W 12 568567 570627 W 2011-02-03 1996-07-31 -S000004205 ORF Verified YLR215C CDC123 cell proliferation protein CDC123 chromosome 12 12 571858 570776 C 2011-02-03 1996-07-31 Assembly factor for the eIF2 translation initiation factor complex; regulates translational initiation; conserved residues of this ATP-Grasp protein that bind to ATP-Mg2+ in the pombe ortholog are required for complex assembly in budding yeast; interaction with eIF2 subunit Gcd11p facilitates complex assembly and activity; required for the START transition and timely progression through G2; regulated by nutrient availability; human ortholog complements the yeast mutant -S000033348 CDS YLR215C 12 571858 570776 C 2011-02-03 1996-07-31 -S000004207 ORF Dubious YLR217W chromosome 12 12 572909 573232 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CPR6 -S000034392 CDS YLR217W 12 572909 573232 W 2011-02-03 1996-07-31 -S000004206 ORF Verified YLR216C CPR6 peptidylprolyl isomerase CPR6|CYP40 chromosome 12 L000003229 12 573211 572096 C 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; plays a role in determining prion variants; binds to Hsp82p and contributes to chaperone activity; protein abundance increases in response to DNA replication stress -S000033434 CDS YLR216C 12 573211 572096 C 2011-02-03 1996-07-31 -S000004208 ORF Verified YLR218C COA4 CMC3 chromosome 12 12 573918 573466 C 2011-02-03 1996-07-31 Twin Cx(9)C protein involved in cytochrome c oxidase organization; organization includes assembly or stability; localizes to the mitochondrial intermembrane space via the Mia40p-Erv1p system; interacts genetically with CYC1 and with cytochrome c oxidase assembly factors -S000034416 CDS YLR218C 12 573918 573466 C 2011-02-03 1996-07-31 -S000004209 ORF Verified YLR219W MSC3 chromosome 12 12 574151 576337 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery; msc3 mutants are defective in directing meiotic recombination events to homologous chromatids; potential Cdc28p substrate; protein abundance increases in response to DNA replication stress -S000035498 CDS YLR219W 12 574151 576337 W 2011-02-03 1996-07-31 -S000004210 ORF Verified YLR220W CCC1 chromosome 12 L000000234 12 576825 577793 W 2011-02-03 1996-07-31 Vacuolar Fe2+/Mn2+ transporter; suppresses respiratory deficit of yfh1 mutants, which lack the ortholog of mammalian frataxin, by preventing mitochondrial iron accumulation; relative distribution to the vacuole decreases upon DNA replication stress -S000035447 CDS YLR220W 12 576825 577793 W 2011-02-03 1996-07-31 -S000004211 ORF Verified YLR221C RSA3 chromosome 12 12 579024 578362 C 2011-02-03 1996-07-31 Protein with a likely role in ribosomal maturation; required for accumulation of wild-type levels of large (60S) ribosomal subunits; binds to the helicase Dbp6p in pre-60S ribosomal particles in the nucleolus -S000035470 CDS YLR221C 12 579024 578362 C 2011-02-03 1996-07-31 -S000004212 ORF Verified YLR222C UTP13 chromosome 12 12 581771 579318 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA -S000035533 CDS YLR222C 12 581771 579318 C 2011-02-03 1996-07-31 -S000028568 ORF Dubious YLR222C-A chromosome 12 12 582236 582006 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene IFH1 -S000031274 CDS YLR222C-A 12 582236 582006 C 2011-02-03 2003-07-29 -S000004213 ORF Verified YLR223C IFH1 chromosome 12 L000001775 12 585490 582233 C 2011-02-03 1996-07-31 Coactivator, regulates transcription of ribosomal protein (RP) genes; recruited to RP gene promoters during optimal growth conditions via Fhl1p; subunit of CURI, a complex that coordinates RP production and pre-rRNA processing; regulated by acetylation and phosphorylation at different growth states via TORC1 signaling; IFH1 has a paralog, CRF1, that arose from the whole genome duplication -S000036449 CDS YLR223C 12 585490 582233 C 2011-02-03 1996-07-31 -S000004214 ORF Verified YLR224W UCC1 chromosome 12 12 586464 587573 W 2011-02-03 1996-07-31 F-box protein and component of SCF ubiquitin ligase complexes; involved in ubiquitin-dependent protein catabolism; readily monoubiquitinated in vitro by SCF-Ubc4 complexes; SCF-Ucc1 regulates level of Cit2 citrate synthase protein to maintain citrate homeostasis, acts as metabolic switch for glyoxylate cycle; UCC1 transcription is downregulated in cells grown on C2-compounds -S000036572 CDS YLR224W 12 586464 587573 W 2011-02-03 1996-07-31 -S000004215 ORF Uncharacterized YLR225C chromosome 12 12 588918 587695 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; not an essential gene; YLR225C has a paralog, YDR222W, that arose from the whole genome duplication -S000036615 CDS YLR225C 12 588918 587695 C 2011-02-03 1996-07-31 -S000004216 ORF Verified YLR226W BUR2 CST4 chromosome 12 L000002994|L000000205 12 589354 590541 W 2011-02-03 1996-07-31 Cyclin for the Sgv1p (Bur1p) protein kinase; Sgv1p and Bur2p comprise the CDK-cyclin BUR kinase complex which is involved in transcriptional regulation through its phosphorylation of the carboxy-terminal domain (CTD) of the largest subunit of RNA polymerase II (Rpo21p); BUR kinase is also involved in the recruitment of Spt6p to the CTD at the onset of transcription -S000037389 CDS YLR226W 12 589354 590541 W 2011-02-03 1996-07-31 -S000004217 ORF Verified YLR227C ADY4 chromosome 12 S000007652 12 592043 590562 C 2011-02-03 1996-07-31 Structural component of the meiotic outer plaque; outer plaque is a membrane-organizing center that assembles on the cytoplasmic face of the spindle pole body during meiosis II and triggers the formation of the prospore membrane -S000037438 CDS YLR227C 12 592043 590562 C 2011-02-03 1996-07-31 -S000006655 tRNA_gene tL(UAG)L1 chromosome 12 L000003662 12 592619 592519 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000035002 intron tL(UAG)L1 12 592581 592563 C 2011-02-03 2000-05-19 -S000035001 noncoding_exon tL(UAG)L1 12 592562 592519 C 2011-02-03 2000-05-19 -S000035000 noncoding_exon tL(UAG)L1 12 592619 592582 C 2011-02-03 2000-05-19 -S000007070 long_terminal_repeat YLRCdelta9 chromosome 12 12 593035 592706 C 2011-02-03 2000-05-19 Ty1 LTR -S000007085 long_terminal_repeat YLRWdelta10 chromosome 12 12 593145 593478 W 2011-02-03 2000-05-19 Ty1 LTR -S000007098 LTR_retrotransposon YLRWTy1-2 Ty1 chromosome 12 12 593145 599062 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007375 transposable_element_gene YLR227W-A gag protein chromosome 12 12 593438 594760 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035724 CDS YLR227W-A 12 593438 594760 W 2011-02-03 1996-07-31 -S000007376 transposable_element_gene YLR227W-B gag-pol fusion protein chromosome 12 12 593438 598706 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000035730 CDS YLR227W-B 12 593438 594742 W 2011-02-03 1999-07-17 -S000035731 CDS YLR227W-B 12 594744 598706 W 2011-02-03 1999-07-17 -S000035732 plus_1_translational_frameshift YLR227W-B 12 594743 594743 W 2011-02-03 1999-07-17 -S000007086 long_terminal_repeat YLRWdelta11 chromosome 12 12 598729 599062 W 2011-02-03 2000-05-19 Ty1 LTR -S000007087 long_terminal_repeat YLRWdelta12 chromosome 12 12 599268 599544 W 2011-02-03 2000-05-19 Ty1 LTR -S000007080 long_terminal_repeat YLRCtau1 chromosome 12 12 599844 599570 C 2011-02-03 2000-05-19 Ty4 LTR -S000004218 ORF Verified YLR228C ECM22 chromosome 12 L000004375 12 602463 600019 C 2011-02-03 1996-07-31 Sterol regulatory element binding protein; regulates transcription of sterol biosynthetic genes upon sterol depletion, after relocating from intracellular membranes to perinuclear foci; redundant activator of filamentation with UPC2, up-regulating the expression of genes involved in filamentous growth; contains Zn[2]-Cys[6] binuclear cluster; ECM22 has a paralog, UPC2, that arose from the whole genome duplication -S000037567 CDS YLR228C 12 602463 600019 C 2011-02-03 1996-07-31 -S000118477 ARS ARS1218 ARSXII-603 chromosome 12 12 603024 603132 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178139 ARS_consensus_sequence ARS1218 12 603110 603094 C 2014-11-18 2014-11-18 -S000004220 ORF Dubious YLR230W chromosome 12 12 604574 604879 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 5' end of essential CDC42/YLR229C gene which encodes a small Rho-like GTPase essential for establishment and maintenance of cell polarity -S000030492 CDS YLR230W 12 604574 604879 W 2011-02-03 1996-07-31 -S000004219 ORF Verified YLR229C CDC42 Rho family GTPase CDC42 chromosome 12 L000000276 12 604787 604212 C 165 2011-02-03 1996-07-31 Small rho-like GTPase; essential for establishment and maintenance of cell polarity; plays a role late in cell fusion via activation of key cell fusion regulator Fus2p; mutants have defects in the organization of actin and septins; human homolog CDC42 can complement yeast cdc42 mutant -S000030359 CDS YLR229C 12 604787 604212 C 2011-02-03 1996-07-31 -S000006614 tRNA_gene tI(UAU)L chromosome 12 L000003661 12 605432 605300 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000035162 intron tI(UAU)L 12 605395 605336 C 2011-02-03 2000-05-19 -S000035161 noncoding_exon tI(UAU)L 12 605335 605300 C 2011-02-03 2000-05-19 -S000035160 noncoding_exon tI(UAU)L 12 605432 605396 C 2011-02-03 2000-05-19 -S000004222 ORF Dubious YLR232W chromosome 12 12 606830 607177 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene BNA5 -S000031460 CDS YLR232W 12 606830 607177 W 2011-02-03 1996-07-31 -S000004221 ORF Verified YLR231C BNA5 kynureninase chromosome 12 12 607119 605758 C 2011-02-03 1996-07-31 Kynureninase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p -S000031316 CDS YLR231C 12 607119 605758 C 2011-02-03 1996-07-31 -S000004223 ORF Verified YLR233C EST1 chromosome 12 L000000588 12 609524 607425 C 2011-02-03 1996-07-31 TLC1 RNA-associated factor involved in telomere length regulation; recruitment subunit of telomerase; has G-quadruplex promoting activity required for telomere elongation; role in activating telomere-bound Est2p-TLC1-RNA; EST1 has a paralog, EBS1, that arose from the whole genome duplication -S000031492 CDS YLR233C 12 609524 607425 C 2011-02-03 1996-07-31 -S000004224 ORF Verified YLR234W TOP3 DNA topoisomerase 3|EDR1 chromosome 12 L000002321 12 609783 611753 W 163 2011-02-03 1996-07-31 DNA Topoisomerase III; conserved protein that functions in a complex with Sgs1p and Rmi1p to relax single-stranded negatively-supercoiled DNA preferentially; DNA catenation/decatenation activity is stimulated by RPA and Sgs1p-Top3p-Rmi1p; involved in telomere stability and regulation of mitotic recombination -S000031598 CDS YLR234W 12 609783 611753 W 2011-02-03 1996-07-31 -S000004225 ORF Dubious YLR235C chromosome 12 12 611930 611532 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORFs TOP3/YLR234W and YLR236C -S000031634 CDS YLR235C 12 611930 611532 C 2011-02-03 1996-07-31 -S000004226 ORF Dubious YLR236C chromosome 12 12 612117 611794 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YLR235C -S000032651 CDS YLR236C 12 612117 611794 C 2011-02-03 1996-07-31 -S000004227 ORF Verified YLR237W THI7 thiamine transporter THI7|THI10 chromosome 12 L000003514 12 612367 614163 W 2011-02-03 1996-07-31 Plasma membrane transporter responsible for the uptake of thiamine; contributes to uptake of 5-aminoimidazole-4-carboxamide-1-beta-D-ribofuranoside (acadesine); member of the major facilitator superfamily of transporters; mutation of human ortholog causes thiamine-responsive megaloblastic anemia -S000032815 CDS YLR237W 12 612367 614163 W 2011-02-03 1996-07-31 -S000004228 ORF Verified YLR238W FAR10 chromosome 12 12 614755 616191 W 2011-02-03 1996-07-31 Protein involved in recovery from arrest in response to pheromone; acts in a cell cycle arrest recovery pathway independent from Far1p; interacts with Far3p, Far7p, Far8p, Far9p, and Far11p; potential Cdc28p substrate; FAR10 has a paralog, VPS64, that arose from the whole genome duplication -S000033527 CDS YLR238W 12 614755 616191 W 2011-02-03 1996-07-31 -S000004229 ORF Verified YLR239C LIP2 lipoyl(octanoyl) transferase LIP2 chromosome 12 12 617318 616332 C 2011-02-03 1996-07-31 Lipoyl ligase; involved in the modification of mitochondrial enzymes by the attachment of lipoic acid groups -S000033564 CDS YLR239C 12 617318 616332 C 2011-02-03 1996-07-31 -S000004230 ORF Verified YLR240W VPS34 phosphatidylinositol 3-kinase VPS34|VPS7|STT8|VPT29|VPL7|PEP15|END12 chromosome 12 L000002476 12 617533 620160 W 2011-02-03 1996-07-31 Phosphatidylinositol (PI) 3-kinase that synthesizes PI-3-phosphate; forms membrane-associated signal transduction complex with Vps15p to regulate protein sorting; activated by the GTP-bound form of Gpa1p; a fraction is localized, with Vps15p, to nuclear pores at nucleus-vacuole junctions and may facilitate transcription elongation for genes positioned at the nuclear periphery -S000034710 CDS YLR240W 12 617533 620160 W 2011-02-03 1996-07-31 -S000004231 ORF Verified YLR241W CSC1 chromosome 12 12 620473 622821 W 2011-02-03 1996-07-31 Calcium permeable gated cation channel; may be involved in detoxification; similar to Arabidopsis CSC1 -S000035645 CDS YLR241W 12 620473 622821 W 2011-02-03 1996-07-31 -S000130183 ARS ARS1219 chromosome 12 12 623198 623861 2011-02-03 2009-05-08 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000004232 ORF Verified YLR242C ARV1 sterol homeostasis protein ARV1 chromosome 12 L000003505 12 623883 622918 C 2011-02-03 1996-07-31 Cortical ER protein; implicated in the membrane insertion of tail-anchored C-terminal single transmembrane domain proteins; may function in transport of glycosylphosphatidylinositol intermediates into the ER lumen; required for normal intracellular sterol distribution; human ARV1, required for normal cholesterol and bile acid homeostasis, can complement yeast arv1 null mutant; human variant causing early onset epileptic encephalopathy is unable to rescue the yeast null -S000035677 CDS YLR242C 12 623883 622918 C 2011-02-03 1996-07-31 -S000004233 ORF Verified YLR243W GPN3 putative signal sequence-binding GTPase GPN3 chromosome 12 12 624203 625021 W 2011-02-03 1996-07-31 Putative GTPase with a role in biogenesis of RNA pol II and polIII; may be involved in assembly of RNA polymerases II and III and in their transport into the nucleus; may have a role in sister chromatid cohesion; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; contains a Gly-Pro-Asn motif in the G domain; similar to Npa3p and Gpn2p -S000035796 CDS YLR243W 12 624203 625021 W 2011-02-03 1996-07-31 -S000004234 ORF Verified YLR244C MAP1 methionine aminopeptidase MAP1 chromosome 12 L000001025 12 626331 625168 C 2011-02-03 1996-07-31 Methionine aminopeptidase; catalyzes the cotranslational removal of N-terminal methionine from nascent polypeptides; function is partially redundant with that of Map2p -S000035829 CDS YLR244C 12 626331 625168 C 2011-02-03 1996-07-31 -S000004235 ORF Verified YLR245C CDD1 cytidine deaminase chromosome 12 L000004644 12 626930 626502 C 2011-02-03 1996-07-31 Cytidine deaminase; catalyzes the modification of cytidine to uridine in vitro but native RNA substrates have not been identified, localizes to both the nucleus and cytoplasm -S000035981 CDS YLR245C 12 626930 626502 C 2011-02-03 1996-07-31 -S000004236 ORF Verified YLR246W ERF2 palmitoyltransferase ERF2 chromosome 12 12 627118 628197 W 2011-02-03 1996-07-31 Subunit of a palmitoyltransferase; this complex adds a palmitoyl lipid moiety to heterolipidated substrates such as Ras1p and Ras2p through a thioester linkage; mutants partially mislocalize Ras2p to the vacuole; palmitoyltransferase is composed of Erf2p and Shr5p -S000036884 CDS YLR246W 12 627118 628197 W 2011-02-03 1996-07-31 -S000006643 tRNA_gene tL(CAA)L chromosome 12 L000003648 12 628383 628497 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000033796 intron tL(CAA)L 12 628421 628453 W 2011-02-03 2000-05-19 -S000033794 noncoding_exon tL(CAA)L 12 628383 628420 W 2011-02-03 2000-05-19 -S000033795 noncoding_exon tL(CAA)L 12 628454 628497 W 2011-02-03 2000-05-19 -S000004237 ORF Verified YLR247C IRC20 E3 ubiquitin-protein ligase IRC20 chromosome 12 12 633354 628684 C 2011-02-03 1996-07-31 E3 ubiquitin ligase and putative helicase; involved in synthesis-dependent strand annealing-mediated homologous recombination; ensures precise end-joining along with Srs2p in the Yku70p/Yku80p/Lig4p-dependent nonhomologous end joining (NHEJ) pathway; localizes to both the mitochondrion and the nucleus; contains a Snf2/Swi2 family ATPase/helicase and a RING finger domain; interacts with Cdc48p and Smt3p; null mutant displays increased levels of spontaneous Rad52p foci -S000036895 CDS YLR247C 12 633354 628684 C 2011-02-03 1996-07-31 -S000004238 ORF Verified YLR248W RCK2 serine/threonine protein kinase RCK2|CMK3|CLK1 chromosome 12 L000001593 12 634252 636084 W 2011-02-03 1996-07-31 Protein kinase involved in response to oxidative and osmotic stress; identified as suppressor of S. pombe cell cycle checkpoint mutations; similar to CaM (calmodulin) kinases; RCK2 has a paralog, RCK1, that arose from the whole genome duplication -S000037704 CDS YLR248W 12 634252 636084 W 2011-02-03 1996-07-31 -S000004239 ORF Verified YLR249W YEF3 translation elongation factor EF-3|EF-3|eEF3|TEF3 chromosome 12 L000002505 12 636780 639914 W 2011-02-03 1996-07-31 Translation elongation factor 3; contains two ABC cassettes; binds and hydrolyzes ATP; YEF3 has a paralog, HEF3, that arose from the whole genome duplication -S000037766 CDS YLR249W 12 636780 639914 W 2011-02-03 1996-07-31 -S000004240 ORF Verified YLR250W SSP120 chromosome 12 L000002091 12 640317 641021 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000030689 CDS YLR250W 12 640317 641021 W 2011-02-03 1996-07-31 -S000004241 ORF Verified YLR251W SYM1 ethanol metabolism protein chromosome 12 12 641464 642057 W 2011-02-03 1996-07-31 Protein required for ethanol metabolism; induced by heat shock and localized to the inner mitochondrial membrane; homologous to mammalian peroxisomal membrane protein Mpv17; human homolog MPV17 is implicated in hepatocerebral mtDNA depletion syndromes (MDDS), and complements yeast null mutant -S000030794 CDS YLR251W 12 641464 642057 W 2011-02-03 1996-07-31 -S000004242 ORF Dubious YLR252W chromosome 12 12 641957 642262 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SYM1, a mitochondrial protein involved in ethanol metabolism -S000030890 CDS YLR252W 12 641957 642262 W 2011-02-03 1996-07-31 -S000004243 ORF Verified YLR253W MCP2 MRX13 chromosome 12 12 642627 644336 W 2011-02-03 1996-07-31 Mitochondrial protein of unknown function involved in lipid homeostasis; associates with mitochondrial ribosome; integral membrane protein that localizes to the mitochondrial inner membrane; involved in mitochondrial morphology; non-essential gene which interacts genetically with MDM10, and other members of the ERMES complex; transcription is periodic during the metabolic cycle; homologous to human aarF domain containing kinase, ADCK1 -S000031890 CDS YLR253W 12 642627 644336 W 2011-02-03 1996-07-31 -S000004244 ORF Verified YLR254C NDL1 chromosome 12 12 644973 644404 C 2011-02-03 1996-07-31 Homolog of nuclear distribution factor NudE; NUDEL; interacts with Pac1p and regulates dynein targeting to microtubule plus ends -S000031972 CDS YLR254C 12 644973 644404 C 2011-02-03 1996-07-31 -S000004245 ORF Dubious YLR255C chromosome 12 12 645953 645600 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032077 CDS YLR255C 12 645953 645600 C 2011-02-03 1996-07-31 -S000004246 ORF Verified YLR256W HAP1 CYP1 chromosome 12 L000002665 12 646415 650923 W 2011-02-03 1996-07-31 Zinc finger transcription factor; involved in the complex regulation of gene expression in response to levels of heme and oxygen; localizes to the mitochondrion as well as to the nucleus; the S288C sequence differs from other strain backgrounds due to a Ty1 insertion in the carboxy terminus -S000033058 CDS YLR256W 12 646415 650923 W 2011-02-03 1996-07-31 -S000007088 long_terminal_repeat YLRWdelta13 chromosome 12 12 650824 651157 W 2011-02-03 2000-05-19 Ty1 LTR -S000007099 LTR_retrotransposon YLRWTy1-3 Ty1 chromosome 12 12 650824 656743 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007377 transposable_element_gene YLR256W-A gag protein chromosome 12 12 651117 652439 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035661 CDS YLR256W-A 12 651117 652439 W 2011-02-03 1999-07-17 -S000007089 long_terminal_repeat YLRWdelta14 chromosome 12 12 656410 656743 W 2011-02-03 2000-05-19 Ty1 LTR -S000006517 tRNA_gene tA(AGC)L chromosome 12 L000003660 12 657006 656934 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032303 noncoding_exon tA(AGC)L 12 657006 656934 C 2011-02-03 2000-05-19 -S000007096 long_terminal_repeat YLRWsigma3 chromosome 12 12 657022 657365 W 2011-02-03 2000-05-19 Ty3 LTR -S000007090 long_terminal_repeat YLRWdelta15 chromosome 12 12 657449 657767 W 2011-02-03 2000-05-19 Ty1 LTR -S000004247 ORF Verified YLR257W chromosome 12 12 658826 659791 W 2011-02-03 1996-07-31 Protein of unknown function; protein abundance increases in response to DNA replication stress -S000033141 CDS YLR257W 12 658826 659791 W 2011-02-03 1996-07-31 -S000118478 ARS ARS1220 ARSXII-660 chromosome 12 12 659884 659935 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178140 ARS_consensus_sequence ARS1220 12 659892 659908 W 2014-11-18 2014-11-18 -S000004248 ORF Verified YLR258W GSY2 glycogen (starch) synthase GSY2 chromosome 12 L000000740 12 660716 662833 W 2011-02-03 1996-07-31 Glycogen synthase; expression induced by glucose limitation, nitrogen starvation, heat shock, and stationary phase; activity regulated by cAMP-dependent, Snf1p and Pho85p kinases as well as by the Gac1p-Glc7p phosphatase; GSY2 has a paralog, GSY1, that arose from the whole genome duplication; relocalizes from cytoplasm to plasma membrane upon DNA replication stress -S000033909 CDS YLR258W 12 660716 662833 W 2011-02-03 1996-07-31 -S000004249 ORF Verified YLR259C HSP60 chaperone ATPase HSP60|MNA2|MIF4|CPN60 chromosome 12 L000000819 12 665002 663284 C 2011-02-03 1996-07-31 Tetradecameric mitochondrial chaperonin; required for ATP-dependent folding of precursor polypeptides and complex assembly; prevents aggregation and mediates protein refolding after heat shock; role in mtDNA transmission; phosphorylated -S000033960 CDS YLR259C 12 665002 663284 C 2011-02-03 1996-07-31 -S000004250 ORF Verified YLR260W LCB5 sphinganine kinase LCB5 chromosome 12 L000004329 12 665844 667907 W 2011-02-03 1996-07-31 Minor sphingoid long-chain base kinase; possibly involved in synthesis of long-chain base phosphates, which function as signaling molecules; LCB5 has a paralog, LCB4, that arose from the whole genome duplication -S000035015 CDS YLR260W 12 665844 667907 W 2011-02-03 1996-07-31 -S000004251 ORF Uncharacterized YLR261C VPS63 chromosome 12 12 668563 668237 C 2011-02-03 1996-07-31 Putative protein of unknown function; not conserved in closely related Saccharomyces species; 98% of ORF overlaps the verified gene YPT6; deletion causes a vacuolar protein sorting defect; decreased levels of protein in enolase deficient mutant -S000035062 CDS YLR261C 12 668563 668237 C 2011-02-03 1996-07-31 -S000004252 ORF Verified YLR262C YPT6 Rab family GTPase YPT6 chromosome 12 L000002896|L000002948 12 668891 668244 C 2011-02-03 1996-07-31 Rab family GTPase; required for endosome-to-Golgii, intra-Golgi retrograde, and retrograde Golgi-to-ER transport; temporarily at the Golgi, dissociating into the cytosol on arrival of the late Golgi GTPase Ypt32p; Golgi-localized form is GTP bound, while cytosolic form is GDP-bound; required for delivery of Atg9p to the phagophore assembly site during autophagy under heat stress, with Ypt6p for starvation induced autophagy and for the CVT pathway; homolog of mammalian Rab6 -S000035164 CDS YLR262C 12 668891 668244 C 2011-02-03 1996-07-31 -S000007246 ORF Verified YLR262C-A TMA7 RBF7 chromosome 12 12 669662 669468 C 2011-02-03 1999-07-17 Protein of unknown that associates with ribosomes; null mutant exhibits translation defects, altered polyribosome profiles, and resistance to the translation inhibitor anisomcyin; protein abundance increases in response to DNA replication stress -S000036510 CDS YLR262C-A 12 669662 669468 C 2011-02-03 1999-07-17 -S000004253 ORF Verified YLR263W RED1 chromosome 12 L000001608 12 670340 672823 W 2011-02-03 1996-07-31 Protein component of the synaptonemal complex axial elements; involved in chromosome segregation during the first meiotic division; critical for coupling checkpoint signaling to SC formation; promotes interhomolog recombination by phosphorylating Hop1p; also interacts with Mec3p and Ddc1p -S000036094 CDS YLR263W 12 670340 672823 W 2011-02-03 1996-07-31 -S000004254 ORF Verified YLR264W RPS28B eS28|ribosomal 40S subunit protein S28B|S28e|YS27|S33B|S28B|RPS33B chromosome 12 L000002744 12 673131 673334 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S28, no bacterial homolog; has an extraribosomal function in autoregulation, in which Rps28Bp binds to a decapping complex via Edc3p, which then binds to RPS28B mRNA leading to its decapping and degradation; RPS28B has a paralog, RPS28A, that arose from the whole genome duplication -S000036202 CDS YLR264W 12 673131 673334 W 2011-02-03 1996-07-31 -S000028808 ORF Uncharacterized YLR264C-A chromosome 12 12 673944 673828 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000033593 CDS YLR264C-A 12 673944 673828 C 2011-02-03 2003-07-29 -S000004255 ORF Verified YLR265C NEJ1 LIF2 chromosome 12 12 675455 674427 C 2011-02-03 1996-07-31 Protein involved in regulation of nonhomologous end joining; interacts with DNA ligase IV components Dnl4p and Lif1p; repressed by MAT heterozygosity; regulates cellular distribution of Lif1p -S000036242 CDS YLR265C 12 675455 674427 C 2011-02-03 1996-07-31 -S000004256 ORF Verified YLR266C PDR8 chromosome 12 12 677724 675619 C 2011-02-03 1996-07-31 Transcription factor; targets include ATP-binding cassette (ABC) transporters, major facilitator superfamily transporters, and other genes involved in the pleiotropic drug resistance (PDR) phenomenon; PDR8 has a paralog, YRR1, that arose from the whole genome duplication -S000031731 CDS YLR266C 12 677724 675619 C 2011-02-03 1996-07-31 -S000004257 ORF Uncharacterized YLR267W BOP2 chromosome 12 L000004722 12 678212 679924 W 2011-02-03 1996-07-31 Protein of unknown function -S000031962 CDS YLR267W 12 678212 679924 W 2011-02-03 1996-07-31 -S000004258 ORF Verified YLR268W SEC22 SNAP receptor SEC22|TS26|TSL26|SLY2 chromosome 12 L000001845|S000029606|L000002362 12 680200 680844 W 2011-02-03 1996-07-31 R-SNARE protein; assembles into SNARE complex with Bet1p, Bos1p and Sed5p; cycles between the ER and Golgi complex; involved in anterograde and retrograde transport between the ER and Golgi; synaptobrevin homolog -S000037429 CDS YLR268W 12 680200 680844 W 2011-02-03 1996-07-31 -S000004260 ORF Verified YLR270W DCS1 5'-(N(7)-methyl 5'-triphosphoguanosine)-(mRNA) diphosphatase|DcpS chromosome 12 12 681186 682238 W 2011-02-03 1996-07-31 Non-essential hydrolase involved in mRNA decapping; activates Xrn1p; may function in a feedback mechanism to regulate deadenylation, contains pyrophosphatase activity and a HIT (histidine triad) motif; acts as inhibitor of neutral trehalase Nth1p; required for growth on glycerol medium; protein abundance increases in response to DNA replication stress; DCS1 has a paralog, DCS2, that arose from the whole genome duplication -S000037138 CDS YLR270W 12 681186 682238 W 2011-02-03 1996-07-31 -S000004259 ORF Dubious YLR269C chromosome 12 12 681216 680866 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037460 CDS YLR269C 12 681216 680866 C 2011-02-03 1996-07-31 -S000004261 ORF Uncharacterized YLR271W CMG1 chromosome 12 12 682737 683561 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus and is induced in response to the DNA-damaging agent MMS -S000037234 CDS YLR271W 12 682737 683561 W 2011-02-03 1996-07-31 -S000004262 ORF Verified YLR272C YCS4 condensin subunit YCS4|LOC7 chromosome 12 12 687202 683672 C 2011-02-03 1996-07-31 Subunit of the condensin complex; required for establishment and maintenance of chromosome condensation, chromosome segregation, chromatin binding of condensin, tRNA gene clustering at the nucleolus, and silencing at the mating type locus; required for replication slow zone (RSZ) breakage following Mec1p inactivation -S000037272 CDS YLR272C 12 687202 683672 C 2011-02-03 1996-07-31 -S000006762 tRNA_gene tV(AAC)L chromosome 12 L000003659 12 687932 687859 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000032966 noncoding_exon tV(AAC)L 12 687932 687859 C 2011-02-03 2000-05-19 -S000007071 long_terminal_repeat YLRCdelta16 chromosome 12 12 688368 688119 C 2011-02-03 2000-05-19 Ty1 LTR -S000007091 long_terminal_repeat YLRWdelta17 chromosome 12 12 688369 688664 W 2011-02-03 2000-05-19 Ty1 LTR -S000004263 ORF Verified YLR273C PIG1 protein phosphatase regulator PIG1 chromosome 12 L000001436 12 691029 689083 C 2011-02-03 1996-07-31 Putative targeting subunit for type-1 protein phosphatase Glc7p; tethers Glc7p to Gsy2p glycogen synthase; PIG1 has a paralog, GAC1, that arose from the whole genome duplication -S000037347 CDS YLR273C 12 691029 689083 C 2011-02-03 1996-07-31 -S000004264 ORF Verified YLR274W MCM5 MCM DNA helicase complex subunit MCM5|CDC46|BOB1 chromosome 12 L000000279 12 691555 693882 W 2011-02-03 1996-07-31 Component of the Mcm2-7 hexameric helicase complex; MCM complex is important for priming origins of DNA replication in G1 and becomes an active ATP-dependent helicase that promotes DNA melting and elongation when activated by Cdc7p-Dbf4p in S-phase -S000030019 CDS YLR274W 12 691555 693882 W 2011-02-03 1996-07-31 -S000004265 ORF Verified YLR275W SMD2 mRNA splicing protein SMD2|Sm D2 chromosome 12 L000004145 12 694378 694800 W 2011-02-03 1996-07-31 Core Sm protein Sm D2; part of heteroheptameric complex (with Smb1p, Smd1p, Smd3p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm D2 -S000030096 CDS YLR275W 12 694378 694382 W 2011-02-03 1996-07-31 -S000030097 CDS YLR275W 12 694473 694800 W 2011-02-03 1996-07-31 -S000030098 intron YLR275W 12 694383 694472 W 2011-02-03 1996-07-31 -S000004266 ORF Verified YLR276C DBP9 ATP-dependent DNA/RNA helicase chromosome 12 L000004249 12 696830 695046 C 2011-02-03 1996-07-31 DEAD-box protein required for 27S rRNA processing; exhibits DNA, RNA and DNA/RNA helicase activities; ATPase activity shows preference for DNA over RNA; DNA helicase activity abolished by mutation in RNA-binding domain -S000030144 CDS YLR276C 12 696830 695046 C 2011-02-03 1996-07-31 -S000004267 ORF Verified YLR277C YSH1 cleavage polyadenylation factor subunit YSH1|BRR5 chromosome 12 L000003344 12 699495 697156 C 2011-02-03 1996-07-31 Endoribonuclease; subunit of the mRNA cleavage and polyadenylation specificity complex; required for 3' processing, splicing, and transcriptional termination of mRNAs and snoRNAs; protein abundance increases in response to DNA replication stress; YSH1 has a paralog, SYC1, that arose from the whole genome duplication -S000030344 CDS YLR277C 12 699495 697156 C 2011-02-03 1996-07-31 -S000004268 ORF Uncharacterized YLR278C chromosome 12 12 704024 699999 C 2011-02-03 1996-07-31 Zinc-cluster protein; GFP-fusion protein localizes to the nucleus; mutant shows moderate growth defect on caffeine; has a prion-domain like fragment that increases frequency of [URE3]; YLR278C is not an essential gene -S000033636 CDS YLR278C 12 704024 699999 C 2011-02-03 1996-07-31 -S000004269 ORF Dubious YLR279W chromosome 12 12 704309 704698 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033857 CDS YLR279W 12 704309 704698 W 2011-02-03 1996-07-31 -S000004270 ORF Dubious YLR280C chromosome 12 12 704833 704483 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033385 CDS YLR280C 12 704833 704483 C 2011-02-03 1996-07-31 -S000004271 ORF Uncharacterized YLR281C chromosome 12 12 704960 704493 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YLR281C is not an essential gene -S000033456 CDS YLR281C 12 704960 704493 C 2011-02-03 1996-07-31 -S000004273 ORF Uncharacterized YLR283W chromosome 12 12 705186 706130 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YLR283W is not an essential gene -S000034433 CDS YLR283W 12 705186 706130 W 2011-02-03 1996-07-31 -S000004272 ORF Dubious YLR282C chromosome 12 12 705412 705071 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion mutation confers an increase in Ty1 transposition -S000033516 CDS YLR282C 12 705412 705071 C 2011-02-03 1996-07-31 -S000004274 ORF Verified YLR284C ECI1 dodecenoyl-CoA isomerase chromosome 12 L000004206 12 707040 706198 C 2011-02-03 1996-07-31 Peroxisomal delta3,delta2-enoyl-CoA isomerase; hexameric protein that converts 3-hexenoyl-CoA to trans-2-hexenoyl-CoA, essential for the beta-oxidation of unsaturated fatty acids, oleate-induced; ECI1 has a paralog, DCI1, that arose from the whole genome duplication -S000034471 CDS YLR284C 12 707040 706198 C 2011-02-03 1996-07-31 -S000004275 ORF Verified YLR285W NNT1 EFM7|S-adenosylmethionine-dependent methyltransferase chromosome 12 12 707360 708145 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent methyltransferase; novel N-terminal protein methyltransferase that trimethylates the N-terminal glycine residue (G2) and also dimethylates lysine (K3) on elongation factor eEF1A (Tef1p/Tef2p); has a role in rDNA silencing and in lifespan determination -S000034643 CDS YLR285W 12 707360 708145 W 2011-02-03 1996-07-31 -S000028569 ORF Uncharacterized YLR285C-A chromosome 12 12 708338 708168 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031275 CDS YLR285C-A 12 708338 708168 C 2011-02-03 2003-07-29 -S000028679 ORF Dubious YLR286W-A chromosome 12 12 708562 708696 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene CTS1 -S000032537 CDS YLR286W-A 12 708562 708696 W 2011-02-03 2003-07-29 -S000004276 ORF Verified YLR286C CTS1 SCW2 chromosome 12 L000000434|S000029435|L000004563 12 710136 708448 C 2011-02-03 1996-07-31 Endochitinase; required for cell separation after mitosis; transcriptional activation during the G1 phase of the cell cycle is mediated by transcription factor Ace2p -S000034680 CDS YLR286C 12 710136 708448 C 2011-02-03 1996-07-31 -S000004277 ORF Uncharacterized YLR287C chromosome 12 12 712058 710991 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YLR287C is not an essential gene -S000035680 CDS YLR287C 12 712058 710991 C 2011-02-03 1996-07-31 -S000004278 ORF Verified YLR287C-A RPS30A eS30|ribosomal 40S subunit protein S30A|S30e|S30A chromosome 12 L000003183 12 713158 712537 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S30, no bacterial homolog; RPS30A has a paralog, RPS30B, that arose from the whole genome duplication -S000030932 CDS YLR287C-A 12 712725 712537 C 2011-02-03 1996-07-31 -S000030931 CDS YLR287C-A 12 713158 713156 C 2011-02-03 1996-07-31 -S000030933 intron YLR287C-A 12 713155 712726 C 2011-02-03 1996-07-31 -S000004279 ORF Verified YLR288C MEC3 PSO9|PIP3 chromosome 12 L000002907 12 714904 713480 C 2011-02-03 1996-07-31 DNA damage and meiotic pachytene checkpoint protein; subunit of a heterotrimeric complex (Rad17p-Mec3p-Ddc1p) that forms a sliding clamp, loaded onto partial duplex DNA by a clamp loader complex; homolog of human and S. pombe Hus1 -S000035804 CDS YLR288C 12 714904 713480 C 2011-02-03 1996-07-31 -S000004280 ORF Verified YLR289W GUF1 GTPase GUF1 chromosome 12 L000002749 12 715089 717026 W 2011-02-03 1996-07-31 Mitochondrial matrix GTPase; associates with mitochondrial ribosomes; important for translation under temperature and nutrient stress; may have a role in translational fidelity; similar to bacterial LepA elongation factor -S000037787 CDS YLR289W 12 715089 717026 W 2011-02-03 1996-07-31 -S000004281 ORF Verified YLR290C COQ11 ubiquinone biosynthesis protein COQ11|MRX2 chromosome 12 12 717978 717145 C 2011-02-03 1996-07-31 Putative oxidoreductase, subunit of Coenzyme Q biosynthetic complexes; required for synthesis of wild-type levels of Coenzyme Q (ubiquinone); member of the short-chain dehydrogenase/reductase (SDR) superfamily; orthologous gene in some other fungi is fused to the COQ10 ortholog -S000036802 CDS YLR290C 12 717978 717145 C 2011-02-03 1996-07-31 -S000004282 ORF Verified YLR291C GCD7 translation initiation factor eIF2B subunit beta chromosome 12 L000000675 12 719462 718317 C 2011-02-03 1996-07-31 Beta subunit of the translation initiation factor eIF2B; the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression; human homolog EIF2B2 can complement yeast mutant, allows growth down-regulation of yeast gene -S000036871 CDS YLR291C 12 719462 718317 C 2011-02-03 1996-07-31 -S000004283 ORF Verified YLR292C SEC72 Sec63 complex subunit SEC72|SIM2|SEC67 chromosome 12 L000001857 12 720370 719789 C 2011-02-03 1996-07-31 Non-essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; other members are Sec63p, Sec62p, and Sec66p -S000037611 CDS YLR292C 12 720370 719789 C 2011-02-03 1996-07-31 -S000130184 ARS ARS1221 chromosome 12 12 720784 721418 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004284 ORF Verified YLR293C GSP1 Ran GTPase GSP1|CST17|CNR1 chromosome 12 L000000736 12 721430 720771 C 2011-02-03 1996-07-31 Ran GTPase; GTP binding protein (mammalian Ranp homolog) involved in the maintenance of nuclear organization, RNA processing and transport; regulated by Srm1p, Rna1p, Yrb1p, Yrb2p, Yrp4p, Yrb30p, Cse1p and Kap95p; GSP1 has a paralog, GSP2, that arose from the whole genome duplication -S000037671 CDS YLR293C 12 721430 720771 C 2011-02-03 1996-07-31 -S000004285 ORF Dubious YLR294C chromosome 12 12 722030 721701 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene ATP14 -S000037718 CDS YLR294C 12 722030 721701 C 2011-02-03 1996-07-31 -S000004286 ORF Verified YLR295C ATP14 F1F0 ATP synthase subunit h chromosome 12 L000003379 12 722373 721999 C 2011-02-03 1996-07-31 Subunit h of the F0 sector of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; protein abundance increases in response to DNA replication stress -S000037778 CDS YLR295C 12 722373 721999 C 2011-02-03 1996-07-31 -S000004287 ORF Dubious YLR296W chromosome 12 12 722978 723304 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030715 CDS YLR296W 12 722978 723304 W 2011-02-03 1996-07-31 -S000004288 ORF Verified YLR297W chromosome 12 12 724044 724433 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; not an essential gene; induced by treatment with 8-methoxypsoralen and UVA irradiation; relocalizes from nucleus to vacuole upon DNA replication stress; YLR297W has a paralog, YOR186W, that arose from the whole genome duplication -S000030831 CDS YLR297W 12 724044 724433 W 2011-02-03 1996-07-31 -S000004289 ORF Verified YLR298C YHC1 U1C|U1-C chromosome 12 L000004161 12 725416 724721 C 2011-02-03 1996-07-31 Component of the U1 snRNP complex required for pre-mRNA splicing; putative ortholog of human U1C protein, which is involved in formation of a complex between U1 snRNP and the pre-mRNA 5' splice site -S000030863 CDS YLR298C 12 725416 724721 C 2011-02-03 1996-07-31 -S000004290 ORF Verified YLR299W ECM38 gamma-glutamyltransferase|CIS2 chromosome 12 L000003905 12 726069 728051 W 2011-02-03 1996-07-31 Gamma-glutamyltranspeptidase; major glutathione-degrading enzyme; involved in detoxification of electrophilic xenobiotics; expression induced mainly by nitrogen starvation -S000031951 CDS YLR299W 12 726069 728051 W 2011-02-03 1996-07-31 -S000028680 ORF Dubious YLR299C-A chromosome 12 12 728003 727911 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene ECM38 -S000032551 CDS YLR299C-A 12 728003 727911 C 2011-02-03 2003-07-29 -S000004291 ORF Verified YLR300W EXG1 glucan 1,3-beta-glucosidase|SCW6|BGL1 chromosome 12 L000000592|S000029437|L000004567 12 728955 730301 W 206 2011-02-03 1996-07-31 Major exo-1,3-beta-glucanase of the cell wall; involved in cell wall beta-glucan assembly; exists as three differentially glycosylated isoenzymes; EXG1 has a paralog, SPR1, that arose from the whole genome duplication -S000030080 CDS YLR300W 12 728955 730301 W 2011-02-03 1996-07-31 -S000004292 ORF Verified YLR301W HRI1 chromosome 12 12 730825 731559 W 2011-02-03 1996-07-31 Protein of unknown function that interacts with Sec72p and Hrr25p -S000030226 CDS YLR301W 12 730825 731559 W 2011-02-03 1996-07-31 -S000007072 long_terminal_repeat YLRCdelta18 chromosome 12 12 732000 731668 C 2011-02-03 2000-05-19 Ty2 LTR -S000006656 tRNA_gene tL(UAG)L2 chromosome 12 L000003649 12 732090 732190 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000035006 intron tL(UAG)L2 12 732128 732146 W 2011-02-03 2000-05-19 -S000035004 noncoding_exon tL(UAG)L2 12 732090 732127 W 2011-02-03 2000-05-19 -S000035005 noncoding_exon tL(UAG)L2 12 732147 732190 W 2011-02-03 2000-05-19 -S000004294 ORF Verified YLR303W MET17 bifunctional cysteine synthase/O-acetylhomoserine aminocarboxypropyltransferase MET17|MET25|MET15 chromosome 12 L000001091|L000001088 12 732542 733876 W 2011-02-03 1996-07-31 O-acetyl homoserine-O-acetyl serine sulfhydrylase; required for Methionine and cysteine biosynthesis -S000030497 CDS YLR303W 12 732542 733876 W 2011-02-03 1996-07-31 -S000004293 ORF Dubious YLR302C chromosome 12 12 732553 732191 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030295 CDS YLR302C 12 732553 732191 C 2011-02-03 1996-07-31 -S000007073 long_terminal_repeat YLRCdelta19 chromosome 12 12 734671 734501 C 2011-02-03 2000-05-19 Ty1 LTR -S000006607 tRNA_gene tI(AAU)L1 chromosome 12 L000003650 12 734802 734875 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000033931 noncoding_exon tI(AAU)L1 12 734802 734875 W 2011-02-03 2000-05-19 -S000004295 ORF Verified YLR304C ACO1 aconitate hydratase ACO1|GLU1 chromosome 12 L000000022 12 737548 735212 C 2011-02-03 1996-07-31 Aconitase; required for the tricarboxylic acid (TCA) cycle and also independently required for mitochondrial genome maintenance; component of the mitochondrial nucleoid; mutation leads to glutamate auxotrophy; human homolog ACO2 can complement yeast null mutant -S000031331 CDS YLR304C 12 737548 735212 C 2011-02-03 1996-07-31 -S000004296 ORF Verified YLR305C STT4 1-phosphatidylinositol 4-kinase STT4 chromosome 12 L000002137 12 743863 738161 C 2011-02-03 1996-07-31 Phosphatidylinositol-4-kinase; functions in the Pkc1p protein kinase pathway; required for normal vacuole morphology, cell wall integrity, and actin cytoskeleton organization -S000031384 CDS YLR305C 12 743863 738161 C 2011-02-03 1996-07-31 -S000004297 ORF Verified YLR306W UBC12 NEDD8-conjugating protein UBC12 chromosome 12 L000003386 12 744151 744851 W 2011-02-03 1996-07-31 Enzyme that mediates the conjugation of Rub1p; a ubiquitin-like protein, to other proteins; related to E2 ubiquitin-conjugating enzymes -S000031518 CDS YLR306W 12 744151 744153 W 2011-02-03 1996-07-31 -S000031519 CDS YLR306W 12 744288 744851 W 2011-02-03 1996-07-31 -S000031520 intron YLR306W 12 744154 744287 W 2011-02-03 1996-07-31 -S000118479 ARS ARS1223 ARSXII-745 chromosome 12 12 744943 745179 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication capacity dependent upon Sum1p -S000178141 ARS_consensus_sequence ARS1223 12 745116 745100 C 2014-11-18 2014-11-18 -S000004298 ORF Verified YLR307W CDA1 chitin deacetylase CDA1 chromosome 12 L000003112 12 745620 746525 W 2011-02-03 1996-07-31 Chitin deacetylase; together with Cda2p involved in the biosynthesis ascospore wall component, chitosan; required for proper rigidity of the ascospore wall -S000031600 CDS YLR307W 12 745620 746525 W 2011-02-03 1996-07-31 -S000028525 ORF Uncharacterized YLR307C-A chromosome 12 12 747111 746848 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000030327 CDS YLR307C-A 12 747111 746848 C 2011-02-03 2003-07-29 -S000004299 ORF Verified YLR308W CDA2 chitin deacetylase CDA2 chromosome 12 L000003113 12 747937 748875 W 2011-02-03 1996-07-31 Chitin deacetylase; together with Cda1p involved in the biosynthesis ascospore wall component, chitosan; required for proper rigidity of the ascospore wall -S000032597 CDS YLR308W 12 747937 748875 W 2011-02-03 1996-07-31 -S000004300 ORF Verified YLR309C IMH1 SYS3 chromosome 12 L000003981 12 751769 749034 C 2011-02-03 1996-07-31|2011-02-03 Protein involved in vesicular transport; mediates transport between an endosomal compartment and the Golgi, contains a Golgi-localization (GRIP) domain that interacts with activated Arl1p-GTP to localize Imh1p to the Golgi -S000032653 CDS YLR309C 12 751769 749034 C 2011-02-03 1996-07-31|2011-02-03 -S000004301 ORF Verified YLR310C CDC25 Ras family guanine nucleotide exchange factor CDC25|CDC25'|CTN1 chromosome 12 L000000264|L000000263 12 756993 752224 C 213 2011-02-03 1996-07-31 Membrane bound guanine nucleotide exchange factor; also known as a GEF or GDP-release factor; indirectly regulates adenylate cyclase through activation of Ras1p and Ras2p by stimulating the exchange of GDP for GTP; required for progression through G1; thermosensitivity of the cdc25-5 mutant is functionally complemented by human RASGRF1 or by a fragment of human SOS1 comprising the CDC25-related catalytic domain -S000032496 CDS YLR310C 12 756993 752224 C 2011-02-03 1996-07-31 -S000004302 ORF Dubious YLR311C chromosome 12 12 757612 757265 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034499 CDS YLR311C 12 757612 757265 C 2011-02-03 1996-07-31 -S000004303 ORF Verified YLR312C ATG39 QNQ1 chromosome 12 12 758833 757637 C 2011-02-03 1996-07-31 Autophagy receptor with a role in degradation of the ER and nucleus; involved specifically in autophagy of perinuclear endoplasmic reticulum in response to nitrogen starvation or rapamycin treatment; localizes to the perinuclear ER -S000034606 CDS YLR312C 12 758833 757637 C 2011-02-03 1996-07-31 -S000004304 ORF Verified YLR312W-A MRPL15 mitochondrial 54S ribosomal protein YmL15|YmL15 chromosome 12 L000002688 12 759480 760241 W 2011-02-03 2001-06-12|1997-07-01|2006-10-03 Mitochondrial ribosomal protein of the large subunit -S000037404 CDS YLR312W-A 12 759480 760241 W 2011-02-03 1997-07-01|2006-10-03 -S000004305 ORF Verified YLR313C SPH1 YLR312C-B chromosome 12 L000004149 12 762342 760750 C 2011-02-03 2004-02-05|1996-07-31|2011-02-03 Protein involved in shmoo formation and bipolar bud site selection; localizes to sites of polarized growth in a cell cycle dependent- and Spa2p-dependent manner, interacts with MAPKKs Mkk1p, Mkk2p, and Ste7p; SPH1 has a paralog, SPA2, that arose from the whole genome duplication -S000034673 CDS YLR313C 12 762342 760750 C 2011-02-03 2004-02-05|1996-07-31|2011-02-03 -S000004306 ORF Verified YLR314C CDC3 septin CDC3 chromosome 12 L000000243 12 764137 762575 C 215 2004-02-05 1996-07-31|2011-02-03 Component of the septin ring that is required for cytokinesis; septins are GTP-binding proteins that assemble with other septins into rod-like complexes that can associate with other rods to form filament polymers; septin rings at the mother-bud neck act as scaffolds for recruiting factors needed for cell division and as barriers to prevent diffusion of specific proteins between mother and daughter cells -S000034752 CDS YLR314C 12 764137 762575 C 2004-02-05 1996-07-31|2011-02-03 -S000004307 ORF Verified YLR315W NKP2 chromosome 12 12 764808 765269 W 2004-02-05 1996-07-31 Central kinetochore protein and subunit of the Ctf19 complex; mutants have elevated rates of chromosome loss; orthologous to fission yeast kinetochore protein cnl2 -S000035712 CDS YLR315W 12 764808 765269 W 2004-02-05 1996-07-31 -S000004309 ORF Dubious YLR317W chromosome 12 12 765655 766089 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; may be part of a bicistronic transcript with NKP2/YLR315W; overlaps the verified ORF TAD3/YLR316C -S000035934 CDS YLR317W 12 765655 766089 W 2004-02-05 1996-07-31 -S000004308 ORF Verified YLR316C TAD3 chromosome 12 S000007486 12 766358 765266 C 2004-02-05 2000-07-22|1996-07-31 Subunit of tRNA-specific adenosine-34 deaminase; forms a heterodimer with Tad2p that converts adenosine to inosine at the wobble position of several tRNAs -S000035749 CDS YLR316C 12 766073 765266 C 2004-02-05 2000-07-22|1996-07-31 -S000035748 CDS YLR316C 12 766181 766130 C 2004-02-05 2000-07-22 -S000035747 CDS YLR316C 12 766358 766250 C 2004-02-05 2000-07-22 -S000035751 intron YLR316C 12 766129 766074 C 2004-02-05 2000-07-22 -S000035750 intron YLR316C 12 766249 766182 C 2004-02-05 2000-07-22 -S000004310 ORF Verified YLR318W EST2 TERT chromosome 12 L000003504 12 766542 769196 W 2004-02-05 1996-07-31|2011-02-03 Reverse transcriptase subunit of the telomerase holoenzyme; essential for telomerase core catalytic activity, involved in other aspects of telomerase assembly and function; mutations in human homolog are associated with aplastic anemia -S000036808 CDS YLR318W 12 766542 769196 W 2004-02-05 1996-07-31|2011-02-03 -S000004311 ORF Verified YLR319C BUD6 AIP3 chromosome 12 L000000071|L000002602 12 771684 769318 C 221 2004-02-05 1996-07-31 Actin- and formin-interacting protein; participates in actin cable assembly and organization as a nucleation-promoting factor (NPF) for formins Bni1p and Bnr1p; a triple helical coiled-coil domain in the C-terminal region interacts with Bni1p; involved in polarized cell growth; isolated as bipolar budding mutant; potential Cdc28p substrate -S000036838 CDS YLR319C 12 771684 769318 C 2004-02-05 1996-07-31 -S000004312 ORF Verified YLR320W MMS22 SLM2 chromosome 12 12 771940 776304 W 2004-02-05 1996-07-31 Subunit of E3 ubiquitin ligase complex involved in replication repair; stabilizes protein components of the replication fork, such as the fork-pausing complex and leading strand polymerase, preventing fork collapse and promoting efficient recovery during replication stress; required for accurate meiotic chromosome segregation -S000036604 CDS YLR320W 12 771940 776304 W 2004-02-05 1996-07-31 -S000004314 ORF Dubious YLR322W VPS65 chromosome 12 12 777628 777942 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 75% of ORF overlaps the verified gene SFH1; deletion causes a vacuolar protein sorting defect and blocks anaerobic growth -S000036774 CDS YLR322W 12 777628 777942 W 2004-02-05 1996-07-31 -S000004313 ORF Verified YLR321C SFH1 chromosome 12 L000003282 12 777864 776584 C 2004-02-05 1996-07-31 Component of the RSC chromatin remodeling complex; essential gene required for cell cycle progression and maintenance of proper ploidy; phosphorylated in the G1 phase of the cell cycle; Snf5p paralog; hSNF5 tumor suppressor ortholog -S000036636 CDS YLR321C 12 777864 776584 C 2004-02-05 1996-07-31 -S000004315 ORF Verified YLR323C CWC24 U2-type spliceosomal complex subunit CWC24 chromosome 12 12 778952 778173 C 2004-02-05 1996-07-31 General splicing factor; required for stable U2 snRNP binding to primary transcripts; essential for the first step of splicing; component of the pre-catalytic spliceosome complex containing Cef1p; similar to S. pombe Cwf24p -S000030574 CDS YLR323C 12 778952 778173 C 2004-02-05 1996-07-31 -S000004316 ORF Verified YLR324W PEX30 peroxisome biogenesis protein chromosome 12 12 779215 780786 W 2004-02-05 1996-07-31 ER-resident protein involved in peroxisomal biogenesis; ER-localized protein that associates with peroxisomes; interacts with Pex29p and reticulons Rtn1p and Yop1p to regulate peroxisome biogenesis from the ER; role in peroxisomal-destined vesicular flow from the ER; partially redundant with Pex31p; may function at a step downstream of steps mediated by Pex28p and Pex29p; PEX30 has a paralog, PEX31, that arose from the whole genome duplication -S000030797 CDS YLR324W 12 779215 780786 W 2004-02-05 1996-07-31 -S000004317 ORF Verified YLR325C RPL38 eL38|ribosomal 60S subunit protein L38|L38e|L38 chromosome 12 L000004468 12 781379 781143 C 2004-02-05 1996-07-31 Ribosomal 60S subunit protein L38; homologous to mammalian ribosomal protein L38, no bacterial homolog -S000030800 CDS YLR325C 12 781379 781143 C 2004-02-05 1996-07-31 -S000004318 ORF Uncharacterized YLR326W chromosome 12 12 782174 782896 W 2004-02-05 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cell periphery; predicted to be palmitoylated -S000031891 CDS YLR326W 12 782174 782896 W 2004-02-05 1996-07-31 -S000004319 ORF Verified YLR327C TMA10 RBF9|SFL2 chromosome 12 12 783387 783127 C 2004-02-05 1996-07-31 Protein of unknown function that associates with ribosomes; protein abundance increases in response to DNA replication stress; TMA10 has a paralog, STF2, that arose from the whole genome duplication -S000031973 CDS YLR327C 12 783387 783127 C 2004-02-05 1996-07-31 -S000006732 tRNA_gene tX(XXX)L tS(GCU)L chromosome 12 L000003651 12 784354 784453 W 2004-02-05 2000-05-19 tRNA of undetermined specificity, predicted by tRNAscan-SE analysis; very similar to serine tRNAs -S000037471 intron tX(XXX)L 12 784390 784409 W 2004-02-05 2000-05-19 -S000037469 noncoding_exon tX(XXX)L 12 784354 784389 W 2004-02-05 2000-05-19 -S000037470 noncoding_exon tX(XXX)L 12 784410 784453 W 2004-02-05 2000-05-19 -S000004320 ORF Verified YLR328W NMA1 nicotinamide-nucleotide adenylyltransferase NMA1 chromosome 12 12 784913 786118 W 2004-02-05 1996-07-31 Nicotinic acid mononucleotide adenylyltransferase; catalyzes the transfer of the adenylyl moiety of ATP to nicotinamide mononucleotide to form NAD; involved in pathways of NAD biosynthesis, including the de novo, NAD(+) salvage, and nicotinamide riboside salvage pathways; homolog of human NMNAT; NMA1 has a paralog, NMA2, that arose from the whole genome duplication -S000032965 CDS YLR328W 12 784913 786118 W 2004-02-05 1996-07-31 -S000004321 ORF Verified YLR329W REC102 chromosome 12 L000001604 12 786442 787333 W 235 2006-01-09 1996-07-31|2006-01-09 Protein involved in early stages of meiotic recombination; required for chromosome synapsis; forms a complex with Rec104p and Spo11p necessary during the initiation of recombination -S000113993 CDS YLR329W 12 786442 786615 W 2006-01-09 2006-01-09 -S000033059 CDS YLR329W 12 786713 787333 W 2006-01-09 1996-07-31|2006-01-09 -S000113994 intron YLR329W 12 786616 786712 W 2006-01-09 2006-01-09 -S000004322 ORF Verified YLR330W CHS5 CAL3 chromosome 12 L000000333 12 787664 789679 W 2004-02-05 1996-07-31 Component of the exomer complex; the exomer which also contains Csh6p, Bch1p, Bch2p, and Bud7, is involved in the export of select proteins, such as chitin synthase Chs3p, from the Golgi to the plasma membrane; interacts selectively with the activated, GTP-bound form of Arf1p; Chs5p is the only protein with a BRCT domain that is not localized to the nucleus -S000032805 CDS YLR330W 12 787664 789679 W 2004-02-05 1996-07-31 -S000004324 ORF Verified YLR332W MID2 KAI1 chromosome 12 L000001107|L000000885 12 790676 791806 W 2004-02-05 1996-07-31 O-glycosylated plasma membrane protein; acts as a sensor for cell wall integrity signaling and activates the pathway; interacts with Rom2p, a guanine nucleotide exchange factor for Rho1p, and with cell integrity pathway protein Zeo1p; MID2 has a paralog, MTL1, that arose from the whole genome duplication -S000034864 CDS YLR332W 12 790676 791806 W 2004-02-05 1996-07-31 -S000004323 ORF Dubious YLR331C JIP3 chromosome 12 12 791046 790669 C 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 98% of ORF overlaps the verified gene MID2 -S000032848 CDS YLR331C 12 791046 790669 C 2004-02-05 1996-07-31 -S000007097 long_terminal_repeat YLRWsigma4 chromosome 12 12 793552 793870 W 2004-02-05 2000-05-19 Ty3 LTR -S000006542 tRNA_gene tD(GUC)L2 chromosome 12 L000003652 12 793918 793989 W 2004-02-05 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000031888 noncoding_exon tD(GUC)L2 12 793918 793989 W 2004-02-05 2000-05-19 -S000118480 ARS ARS1226 ARSXII-794 chromosome 12 12 794100 794231 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178142 ARS_consensus_sequence ARS1226 12 794208 794192 C 2014-11-18 2014-11-18 -S000006452 snoRNA_gene snR61 SNR61 chromosome 12 L000004530 12 794575 794486 C 2004-02-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A1133 -S000030825 noncoding_exon snR61 12 794575 794486 C 2004-02-05 2000-05-19 -S000006446 snoRNA_gene snR55 SNR55 chromosome 12 L000004524 12 794794 794697 C 2004-02-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); predicted to guide 2'-O-methylation of small subunit (SSU) rRNA at position U1269 -S000030741 noncoding_exon snR55 12 794794 794697 C 2004-02-05 2000-05-19 -S000006448 snoRNA_gene snR57 SNR57 chromosome 12 L000004526 12 795024 794937 C 2004-02-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position G1572 -S000030763 noncoding_exon snR57 12 795024 794937 C 2004-02-05 2000-05-19 -S000004325 ORF Verified YLR333C RPS25B eS25|ribosomal 40S subunit protein S25B|S25e|rp45|YS23|S31B|S25B chromosome 12 L000001766 12 795899 795573 C 2004-02-05 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S25, no bacterial homolog; RPS25B has a paralog, RPS25A, that arose from the whole genome duplication -S000034910 CDS YLR333C 12 795899 795573 C 2004-02-05 1996-07-31 -S000122107 five_prime_UTR_intron YLR333C 12 796335 795913 C 2007-04-04 2007-04-04 -S000007092 long_terminal_repeat YLRWdelta20 chromosome 12 12 796899 797088 W 2004-02-05 2000-05-19 Ty1 LTR -S000004326 ORF Dubious YLR334C chromosome 12 12 797078 796698 C 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps a stand-alone long terminal repeat sequence whose presence indicates a retrotransposition event occurred here -S000035063 CDS YLR334C 12 797078 796698 C 2004-02-05 1996-07-31 -S000006559 tRNA_gene tE(UUC)L chromosome 12 L000003653 12 797178 797249 W 2004-02-05 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin -S000036008 noncoding_exon tE(UUC)L 12 797178 797249 W 2004-02-05 2000-05-19 -S000004327 ORF Verified YLR335W NUP2 nucleoporin NUP2 chromosome 12 L000001289 12 797430 799592 W 2004-02-05 1996-07-31 Nucleoporin involved in nucleocytoplasmic transport; binds to either the nucleoplasmic or cytoplasmic faces of the nuclear pore complex depending on Ran-GTP levels; also has a role in chromatin organization -S000035216 CDS YLR335W 12 797430 799592 W 2004-02-05 1996-07-31 -S000004328 ORF Verified YLR336C SGD1 chromosome 12 L000003498 12 802396 799697 C 2004-02-05 1996-07-31 Essential nuclear protein; required for biogenesis of the small ribosomal subunit; has a possible role in the osmoregulatory glycerol response; putative homolog of human NOM1 which is implicated in acute myeloid leukemia -S000035257 CDS YLR336C 12 802396 799697 C 2004-02-05 1996-07-31 -S000004330 ORF Dubious YLR338W OPI9 chromosome 12 12 804346 805203 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF VRP1/YLR337C -S000031689 CDS YLR338W 12 804346 805203 W 2004-02-05 1996-07-31 -S000004329 ORF Verified YLR337C VRP1 YLR337W|MDP2|END5 chromosome 12 L000001055|L000002481 12 805106 802653 C 2004-02-05 1996-07-31 Verprolin, proline-rich actin-associated protein; involved in cytoskeletal organization and cytokinesis; promotes actin nucleation and endocytosis; related to mammalian Wiskott-Aldrich syndrome protein (WASP)-interacting protein (WIP) -S000036142 CDS YLR337C 12 805106 802653 C 2004-02-05 1996-07-31 -S000004332 ORF Verified YLR340W RPP0 uL10|ribosomal protein P0|P0|L10E|A0|RPL10E chromosome 12 L000002669 12 805887 806825 W 2004-02-05 1996-07-31 Conserved ribosomal protein P0 of the ribosomal stalk; involved in interaction between translational elongation factors and the ribosome; phosphorylated on serine 302; homologous to mammalian ribosomal protein LP0 and bacterial L10 -S000036299 CDS YLR340W 12 805887 806825 W 2004-02-05 1996-07-31 -S000004331 ORF Dubious YLR339C chromosome 12 12 806335 805784 C 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential gene RPP0 -S000031733 CDS YLR339C 12 806335 805784 C 2004-02-05 1996-07-31 -S000004333 ORF Verified YLR341W SPO77 chromosome 12 12 807385 808818 W 2004-02-05 1996-07-31 Meiosis-specific protein of unknown function; required for spore wall formation during sporulation and for timely prospore membrane closure along with SPS1; required with Sps1p for phosphorylation and turnover of Ssp1p; dispensable for both nuclear divisions during meiosis -S000036414 CDS YLR341W 12 807385 808818 W 2004-02-05 1996-07-31 -S000004334 ORF Verified YLR342W FKS1 1,3-beta-D-glucan synthase|PBR1|GSC1|ETG1|CWH53|CND1 chromosome 12 L000000445|L000000732 12 809997 815627 W 2004-02-05 1996-07-31 Catalytic subunit of 1,3-beta-D-glucan synthase; functionally redundant with alternate catalytic subunit Gsc2p; binds to regulatory subunit Rho1p; involved in cell wall synthesis and maintenance; localizes to sites of cell wall remodeling; FKS1 has a paralog, GSC2, that arose from the whole genome duplication -S000036475 CDS YLR342W 12 809997 815627 W 2004-02-05 1996-07-31 -S000028571 ORF Uncharacterized YLR342W-A chromosome 12 12 815810 815983 W 2003-07-29 2003-07-29 Putative protein of unknown function -S000031299 CDS YLR342W-A 12 815810 815983 W 2003-07-29 2003-07-29 -S000004335 ORF Verified YLR343W GAS2 1,3-beta-glucanosyltransferase chromosome 12 12 816094 817761 W 2004-02-05 1996-07-31 1,3-beta-glucanosyltransferase; involved with Gas4p in spore wall assembly; has similarity to Gas1p -S000037140 CDS YLR343W 12 816094 817761 W 2004-02-05 1996-07-31 -S000007074 long_terminal_repeat YLRCdelta21 chromosome 12 12 818403 818073 C 2004-02-05 2000-05-19 Ty1 LTR -S000006706 tRNA_gene tR(CCG)L TRR4 chromosome 12 L000003654 12 818609 818680 W 2004-02-05 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; single essential nuclear tRNA gene containing the tDNA-anticodon CCG (presumably CCG in the mature tRNA), decodes CGG codons into arginine, one of 19 nuclear tRNAs for arginine; correct folding and efficient aminoacylation require Lhp1p -S000037079 noncoding_exon tR(CCG)L 12 818609 818680 W 2004-02-05 2000-05-19 -S000004336 ORF Verified YLR344W RPL26A uL24|ribosomal 60S subunit protein L26A|L24|YL33|L33A|L26A chromosome 12 L000004461 12 819312 820142 W 2004-02-05 1996-07-31 Ribosomal 60S subunit protein L26A; binds to 5.8S rRNA; non-essential even when paralog is also deleted; deletion has minimal affections on ribosome biosynthesis; homologous to mammalian ribosomal protein L26 and bacterial L24; RPL26A has a paralog, RPL26B, that arose from the whole genome duplication -S000037238 CDS YLR344W 12 819312 819330 W 2004-02-05 1996-07-31 -S000037239 CDS YLR344W 12 819778 820142 W 2004-02-05 1996-07-31 -S000037240 intron YLR344W 12 819331 819777 W 2004-02-05 1996-07-31 -S000004337 ORF Uncharacterized YLR345W bifunctional fructose-2,6-bisphosphate 2-phosphatase/6-phosphofructo-2-kinase chromosome 12 12 820511 822040 W 2004-02-05 1996-07-31 Similar to 6-phosphofructo-2-kinase enzymes; mRNA expression is repressed by the Rfx1p-Tup1p-Ssn6p repressor complex; YLR345W is not an essential gene -S000037321 CDS YLR345W 12 820511 822040 W 2004-02-05 1996-07-31 -S000004338 ORF Verified YLR346C CIS1 chromosome 12 12 822592 822287 C 2004-02-05 1996-07-31 Protein of unknown function found in mitochondria; expression is regulated by transcription factors involved in pleiotropic drug resistance, Pdr1p and Yrr1p; not an essential gene; YLR346C has a paralog, YGR035C, that arose from the whole genome duplication -S000037348 CDS YLR346C 12 822592 822287 C 2004-02-05 1996-07-31 -S000028681 ORF Dubious YLR347W-A chromosome 12 12 824789 824929 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified ORF KAP95/YLR347C -S000032552 CDS YLR347W-A 12 824789 824929 W 2011-02-03 2003-07-29 -S000004339 ORF Verified YLR347C KAP95 karyopherin beta|RSL1 chromosome 12 L000002781|L000002885 12 826413 823828 C 2011-02-03 1996-07-31 Karyopherin beta; forms a complex with Srp1p/Kap60p; interacts with nucleoporins to mediate nuclear import of NLS-containing cargo proteins via the nuclear pore complex; regulates PC biosynthesis; GDP-to-GTP exchange factor for Gsp1p -S000029972 CDS YLR347C 12 826413 823828 C 2011-02-03 1996-07-31 -S000004341 ORF Dubious YLR349W chromosome 12 12 827521 828027 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified ORF DIC1/YLR348C -S000030302 CDS YLR349W 12 827521 828027 W 2011-02-03 1996-07-31 -S000004340 ORF Verified YLR348C DIC1 chromosome 12 L000004327 12 827873 826977 C 2011-02-03 1996-07-31 Mitochondrial dicarboxylate carrier; integral membrane protein, catalyzes a dicarboxylate-phosphate exchange across the inner mitochondrial membrane, transports cytoplasmic dicarboxylates into the mitochondrial matrix -S000030051 CDS YLR348C 12 827873 826977 C 2011-02-03 1996-07-31 -S000004342 ORF Verified YLR350W ORM2 sphingolipid homeostasis protein ORM2 chromosome 12 12 828730 829380 W 2011-02-03 1996-07-31 Protein that mediates sphingolipid homeostasis; evolutionarily conserved, required for resistance to agents that induce unfolded protein response; Orm1p and Orm2p together control membrane biogenesis by coordinating lipid homeostasis with protein quality control; protein abundance increases in response to DNA replication stress; ORM2 has a paralog, ORM1, that arose from the whole genome duplication -S000032574 CDS YLR350W 12 828730 829380 W 2011-02-03 1996-07-31 -S000004343 ORF Verified YLR351C NIT3 putative hydrolase chromosome 12 L000004213 12 830364 829489 C 2011-02-03 1996-07-31 Nit protein; one of two proteins in S. cerevisiae with similarity to the Nit domain of NitFhit from fly and worm and to the mouse and human Nit protein which interacts with the Fhit tumor suppressor; nitrilase superfamily member -S000032619 CDS YLR351C 12 830364 829489 C 2011-02-03 1996-07-31 -S000004344 ORF Uncharacterized YLR352W chromosome 12 12 831116 833539 W 2011-02-03 1996-07-31 Putative protein of unknown function with similarity to F-box proteins; interacts with Skp1p and Cdc53p; YLR352W is not an essential gene -S000033355 CDS YLR352W 12 831116 833539 W 2011-02-03 1996-07-31 -S000004345 ORF Verified YLR353W BUD8 chromosome 12 L000002759 12 834352 836163 W 2011-02-03 1996-07-31 Protein involved in bud-site selection; diploid mutants display a unipolar budding pattern instead of the wild-type bipolar pattern, and bud at the proximal pole; BUD8 has a paralog, BUD9, that arose from the whole genome duplication -S000033422 CDS YLR353W 12 834352 836163 W 2011-02-03 1996-07-31 -S000004346 ORF Verified YLR354C TAL1 sedoheptulose-7-phosphate:D-glyceraldehyde-3-phosphate transaldolase TAL1 chromosome 12 L000002261 12 837357 836350 C 2011-02-03 1996-07-31 Transaldolase, enzyme in the non-oxidative pentose phosphate pathway; converts sedoheptulose 7-phosphate and glyceraldehyde 3-phosphate to erythrose 4-phosphate and fructose 6-phosphate; TAL1 has a paralog, NQM1, that arose from the whole genome duplication -S000033457 CDS YLR354C 12 837357 836350 C 2011-02-03 1996-07-31 -S000004347 ORF Verified YLR355C ILV5 ketol-acid reductoisomerase chromosome 12 L000000860 12 839253 838066 C 252 2011-02-03 1996-07-31 Acetohydroxyacid reductoisomerase and mtDNA binding protein; involved in branched-chain amino acid biosynthesis and maintenance of wild-type mitochondrial DNA; found in mitochondrial nucleoids -S000033517 CDS YLR355C 12 839253 838066 C 2011-02-03 1996-07-31 -S000004348 ORF Verified YLR356W ATG33 chromosome 12 12 840321 840914 W 2011-02-03 1996-07-31 Mitochondrial mitophagy-specific protein; required primarily for mitophagy induced at post-log phase; not required for other types of selective autophagy or macroautophagy; conserved within fungi, but not in higher eukaryotes; ATG33 has a paralog, SCM4, that arose from the whole genome duplication -S000034434 CDS YLR356W 12 840321 840914 W 2011-02-03 1996-07-31 -S000004349 ORF Verified YLR357W RSC2 chromosome 12 L000004025 12 841331 844000 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; required for expression of mid-late sporulation-specific genes; involved in telomere maintenance; RSC2 has a paralog, RSC1, that arose from the whole genome duplication -S000034579 CDS YLR357W 12 841331 844000 W 2011-02-03 1996-07-31 -S000004350 ORF Uncharacterized YLR358C chromosome 12 12 844050 843487 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; partially overlaps ORF RSC2/YLR357W -S000034588 CDS YLR358C 12 844050 843487 C 2011-02-03 1996-07-31 -S000004351 ORF Verified YLR359W ADE13 adenylosuccinase ADE13|BRA8|BRA1 chromosome 12 L000003938 12 844282 845730 W 2011-02-03 1996-07-31 Adenylosuccinate lyase; catalyzes two steps in the 'de novo' purine nucleotide biosynthetic pathway; expression is repressed by adenine and activated by Bas1p and Pho2p; mutations in human ortholog ADSL cause adenylosuccinase deficiency; human ADSL can complement yeast ADE13 null mutant -S000035650 CDS YLR359W 12 844282 845730 W 2011-02-03 1996-07-31 -S000004352 ORF Verified YLR360W VPS38 VPL17 chromosome 12 L000003511 12 846103 847422 W 2011-02-03 1996-07-31 Part of a Vps34p phosphatidylinositol 3-kinase complex; functions in carboxypeptidase Y (CPY) sorting; binds Vps30p and Vps34p to promote production of phosphatidylinositol 3-phosphate (PtdIns3P) which stimulates kinase activity; required for overflow degradation of misfolded proteins when ERAD is saturated -S000036679 CDS YLR360W 12 846103 847422 W 2011-02-03 1996-07-31 -S000004353 ORF Verified YLR361C DCR2 phosphoprotein phosphatase chromosome 12 12 849124 847388 C 2011-02-03 1996-07-31 Protein phosphatase; involved in downregulation of the unfolded protein response (UPR), at least in part through dephosphorylation of Ire1p; dosage-dependent positive regulator of the G1/S phase transition through control of the timing of START; physically interacts with, dephosphorylates and destabilizes Sic1p; SWAT-GFP and mCherry fusion proteins localize to the vacuole -S000036700 CDS YLR361C 12 849124 847388 C 2011-02-03 1996-07-31 -S000028845 ORF Uncharacterized YLR361C-A chromosome 12 12 849679 849383 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000034530 CDS YLR361C-A 12 849679 849383 C 2011-02-03 2003-07-29 -S000004354 ORF Verified YLR362W STE11 mitogen-activated protein kinase kinase kinase STE11 chromosome 12 L000002118 12 849866 852019 W 244 2011-02-03 1999-07-17|1996-07-31 Signal transducing MEK kinase; involved in pheromone response and pseudohyphal/invasive growth pathways where it phosphorylates Ste7p, and the high osmolarity response pathway, via phosphorylation of Pbs2p; regulated by Ste20p and Ste50p; protein abundance increases in response to DNA replication stress -S000036796 CDS YLR362W 12 849866 852019 W 2011-02-03 1999-07-17|1996-07-31 -S000004355 ORF Verified YLR363C NMD4 chromosome 12 L000002938 12 853151 852495 C 2011-02-03 1996-07-31 Protein that may be involved in nonsense-mediated mRNA decay; interacts with Nam7p, relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000036803 CDS YLR363C 12 853151 852495 C 2011-02-03 1996-07-31 -S000007620 ORF Verified YLR363W-A chromosome 12 12 853461 853718 W 2011-02-03 2001-02-26 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; relocalizes from nucleus to nucleolus upon DNA replication stress -S000037218 CDS YLR363W-A 12 853461 853718 W 2011-02-03 2001-02-26 -S000004356 ORF Verified YLR364W GRX8 glutathione-disulfide reductase GRX8 chromosome 12 12 854062 854391 W 2011-02-03 1996-07-31 Glutaredoxin that employs a dithiol mechanism of catalysis; monomeric; activity is low and null mutation does not affect sensitivity to oxidative stress; GFP-fusion protein localizes to the cytoplasm; expression strongly induced by arsenic -S000037591 CDS YLR364W 12 854062 854391 W 2011-02-03 1996-07-31 -S000004357 ORF Dubious YLR365W chromosome 12 12 855199 855531 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious gene YLR364C-A; YLR365W is not an essential gene -S000037651 CDS YLR365W 12 855199 855531 W 2011-02-03 1996-07-31 -S000004358 ORF Dubious YLR366W chromosome 12 12 855538 855843 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR364C-A -S000037710 CDS YLR366W 12 855538 855843 W 2011-02-03 1996-07-31 -S000028846 ORF Dubious YLR364C-A chromosome 12 12 855645 855523 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR366W -S000034531 CDS YLR364C-A 12 855645 855523 C 2011-02-03 2003-07-29 -S000004359 ORF Verified YLR367W RPS22B uS8|ribosomal 40S subunit protein S22B|S8|rp50|YS22|S24B|S22B chromosome 12 L000003030 12 856442 857317 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S15A and bacterial S8; RPS22B has a paralog, RPS22A, that arose from the whole genome duplication -S000037773 CDS YLR367W 12 856442 856574 W 2011-02-03 1996-07-31 -S000037774 CDS YLR367W 12 857058 857317 W 2011-02-03 1996-07-31 -S000122108 five_prime_UTR_intron YLR367W 12 855878 856434 W 2011-02-03 2007-04-04 -S000037775 intron YLR367W 12 856575 857057 W 2011-02-03 1996-07-31 -S000006504 snoRNA_gene snR44 SNR44 chromosome 12 L000003411 12 856710 856920 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U1056 and small subunit (SSU) rRNA at position U106 -S000030616 noncoding_exon snR44 12 856710 856920 W 2011-02-03 2000-05-19 -S000004360 ORF Verified YLR368W MDM30 SCF ubiquitin ligase complex subunit MDM30|DSG1 chromosome 12 12 857540 859336 W 2011-02-03 1996-07-31 F-box component of an SCF ubiquitin protein ligase complex; associates with and is required for Fzo1p ubiquitination and for mitochondria fusion; stimulates nuclear export of specific mRNAs; promotes ubiquitin-mediated degradation of Gal4p in some strains -S000030625 CDS YLR368W 12 857540 859336 W 2011-02-03 1996-07-31 -S000004361 ORF Verified YLR369W SSQ1 Hsp70 family ATPase SSQ1|SSH1|SSC2 chromosome 12 L000004573 12 859552 861525 W 2011-02-03 1996-07-31 Mitochondrial hsp70-type molecular chaperone; required for assembly of iron/sulfur clusters into proteins at a step after cluster synthesis, and for maturation of Yfh1p, which is a homolog of human frataxin implicated in Friedreich's ataxia -S000030742 CDS YLR369W 12 859552 861525 W 2011-02-03 1996-07-31 -S000004362 ORF Verified YLR370C ARC18 chromosome 12 L000004033 12 862254 861718 C 2011-02-03 1996-07-31 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches -S000031542 CDS YLR370C 12 862254 861718 C 2011-02-03 1996-07-31 -S000004363 ORF Verified YLR371W ROM2 Rho family guanine nucleotide exchange factor ROM2 chromosome 12 L000003182 12 862714 866784 W 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Rho1p and Rho2p; mutations are synthetically lethal with mutations in rom1, which also encodes a GEF; Rom2p localization to the bud surface is dependent on Ack1p; ROM2 has a paralog, ROM1, that arose from the whole genome duplication -S000031699 CDS YLR371W 12 862714 866784 W 2011-02-03 1996-07-31 -S000004364 ORF Verified YLR372W ELO3 SUR4|fatty acid elongase ELO3|APA1|VBM1|SRE1 chromosome 12 L000002245 12 867354 868391 W 2011-02-03 1996-07-31 Elongase; involved in fatty acid and sphingolipid biosynthesis; synthesizes very long chain 20-26-carbon fatty acids from C18-CoA primers; involved in regulation of sphingolipid biosynthesis; lethality of the elo2 elo3 double null mutation is functionally complemented by human ELOVL1 and weakly complemented by human ELOVL3 or ELOV7 -S000031801 CDS YLR372W 12 867354 868391 W 2011-02-03 1996-07-31 -S000004365 ORF Verified YLR373C VID22 chromosome 12 12 871367 868662 C 2011-02-03 1996-07-31 Glycosylated integral membrane protein localized to plasma membrane; plays a role in fructose-1,6-bisphosphatase (FBPase) degradation; involved in FBPase transport from the cytosol to Vid (vacuole import and degradation) vesicles; VID22 has a paralog, ENV11, that arose from the whole genome duplication -S000031859 CDS YLR373C 12 871367 868662 C 2011-02-03 1996-07-31 -S000004367 ORF Verified YLR375W STP3 chromosome 12 L000003371 12 871697 872728 W 2011-02-03 1996-07-31 Zinc-finger protein of unknown function; possibly involved in pre-tRNA splicing and in uptake of branched-chain amino acids; STP3 has a paralog, STP4, that arose from the whole genome duplication -S000032922 CDS YLR375W 12 871697 872728 W 2011-02-03 1996-07-31 -S000004366 ORF Dubious YLR374C chromosome 12 12 871842 871453 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF STP3/YLR375W -S000032763 CDS YLR374C 12 871842 871453 C 2011-02-03 1996-07-31 -S000004368 ORF Verified YLR376C PSY3 chromosome 12 12 873554 872826 C 2011-02-03 1996-07-31 Component of Shu complex (aka PCSS complex); Shu complex also includes Shu1, Csm2, Shu2, and promotes error-free DNA repair; promotes Rad51p filament assembly; Shu complex mediates inhibition of Srs2p function; Psy3p and Csm2p contain similar DNA-binding regions which work together to form a single DNA binding site; deletion of PSY3 results in a mutator phenotype; deletion increases sensitivity to anticancer drugs oxaliplatin and cisplatin but not mitomycin C -S000032974 CDS YLR376C 12 873554 872826 C 2011-02-03 1996-07-31 -S000004369 ORF Verified YLR377C FBP1 fructose 1,6-bisphosphate 1-phosphatase|ACN8 chromosome 12 L000000605 12 874792 873746 C 2011-02-03 1996-07-31 Fructose-1,6-bisphosphatase; key regulatory enzyme in the gluconeogenesis pathway, required for glucose metabolism; undergoes either proteasome-mediated or autophagy-mediated degradation depending on growth conditions; glucose starvation results in redistribution to the periplasm; interacts with Vid30p -S000033041 CDS YLR377C 12 874792 873746 C 2011-02-03 1996-07-31 -S000006633 tRNA_gene tK(UUU)L chromosome 12 L000003655 12 875376 875471 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034214 intron tK(UUU)L 12 875413 875435 W 2011-02-03 2000-05-19 -S000034212 noncoding_exon tK(UUU)L 12 875376 875412 W 2011-02-03 2000-05-19 -S000034213 noncoding_exon tK(UUU)L 12 875436 875471 W 2011-02-03 2000-05-19 -S000004371 ORF Dubious YLR379W chromosome 12 12 876922 877296 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential ORF SEC61/YLR378C -S000033877 CDS YLR379W 12 876922 877296 W 2011-02-03 1996-07-31 -S000004370 ORF Verified YLR378C SEC61 translocon subunit SEC61 chromosome 12 L000001852 12 877178 875736 C 2011-02-03 1996-07-31 Conserved ER protein translocation channel; essential subunit of Sec61 complex (Sec61p, Sbh1p, and Sss1p); forms channel for SRP-dependent protein import; with Sec63 complex allows SRP-independent protein import into ER; involved in posttranslational soluble protein import into the ER, ERAD of soluble substrates, and misfolded soluble protein export from the ER -S000033713 CDS YLR378C 12 877178 875736 C 2011-02-03 1996-07-31 -S000004372 ORF Verified YLR380W CSR1 SFH2 chromosome 12 S000007449 12 878282 879508 W 2004-02-05 1996-07-31 Phosphatidylinositol transfer protein; has a potential role in regulating lipid and fatty acid metabolism under heme-depleted conditions; interacts specifically with thioredoxin peroxidase; may have a role in oxidative stress resistance; protein abundance increases in response to DNA replication stress -S000034850 CDS YLR380W 12 878282 879508 W 2004-02-05 1996-07-31 -S000004373 ORF Verified YLR381W CTF3 CHL3 chromosome 12 L000000320 12 879723 881924 W 2004-02-05 1996-07-31 Outer kinetochore protein that forms a complex with Mcm16p and Mcm22p; may bind the kinetochore to spindle microtubules; required for the spindle assembly checkpoint; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-I and fission yeast mis6 -S000034982 CDS YLR381W 12 879723 881924 W 2004-02-05 1996-07-31 -S000004374 ORF Verified YLR382C NAM2 leucine--tRNA ligase NAM2|LeuRS|MSL1 chromosome 12 L000001229 12 884751 882067 C 325 2004-02-05 1996-07-31 Mitochondrial leucyl-tRNA synthetase; also has direct role in splicing of several mitochondrial group I introns; indirectly required for mitochondrial genome maintenance; human homolog LARS2 can complement yeast null mutant, and is implicated in Perrault syndrome -S000035844 CDS YLR382C 12 884751 882067 C 2004-02-05 1996-07-31 -S000004375 ORF Verified YLR383W SMC6 DNA repair protein SMC6|RHC18 chromosome 12 L000004130 12 885288 888632 W 2004-02-05 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; homologous to S. pombe rad18 -S000036068 CDS YLR383W 12 885288 888632 W 2004-02-05 1996-07-31 -S000118987 ARS ARS1238 ARSXII-889|ARS1227.5 chromosome 12 12 888570 888810 2006-10-02 2006-10-02 Autonomously Replicating Sequence -S000178143 ARS_consensus_sequence ARS1238 12 888741 888725 C 2014-11-18 2014-11-18 -S000004376 ORF Verified YLR384C IKI3 Elongator subunit IKI3|KTI7|TOT1|ELP1 chromosome 12 L000003563 12 892900 888851 C 2004-02-05 1996-07-31 Subunit of Elongator complex; Elongator is required for modification of wobble nucleosides in tRNA; maintains structural integrity of Elongator; homolog of human IKAP, mutations in which cause familial dysautonomia (FD) -S000036126 CDS YLR384C 12 892900 888851 C 2004-02-05 1996-07-31 -S000004377 ORF Verified YLR385C SWC7 AWS1 chromosome 12 12 893390 892992 C 2004-02-05 1996-07-31 Protein of unknown function; component of the Swr1p complex that incorporates Htz1p into chromatin -S000036905 CDS YLR385C 12 893390 892992 C 2004-02-05 1996-07-31 -S000004378 ORF Verified YLR386W VAC14 chromosome 12 12 893628 896270 W 2004-02-05 1996-07-31 Enzyme regulator; involved in synthesis of phosphatidylinositol 3,5-bisphosphate, in control of trafficking of some proteins to the vacuole lumen via the MVB, and in maintenance of vacuole size and acidity; binds negative (Fig4p) and positive (Fab1p) regulators of PtdIns(3,5)P(2) to control endolysosome function; similar to mammalian Vac14p -S000037006 CDS YLR386W 12 893628 896270 W 2004-02-05 1996-07-31 -S000004379 ORF Verified YLR387C REH1 chromosome 12 12 897672 896374 C 2004-02-05 1996-07-31 Cytoplasmic 60S subunit biogenesis factor; associates with pre-60S particles; similar to Rei1p and shares partially redundant function in cytoplasmic 60S subunit maturation; contains dispersed C2H2 zinc finger domains -S000037044 CDS YLR387C 12 897672 896374 C 2004-02-05 1996-07-31 -S000004380 ORF Verified YLR388W RPS29A uS14|ribosomal 40S subunit protein S29A|S14|YS29|S36A|S29A|YS29A chromosome 12 L000004482|S000029649|L000002549 12 898651 898821 W 2004-02-05 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S29 and bacterial S14; RPS29A has a paralog, RPS29B, that arose from the whole genome duplication -S000037830 CDS YLR388W 12 898651 898821 W 2004-02-05 1996-07-31 -S000122109 five_prime_UTR_intron YLR388W 12 898158 898645 W 2007-04-04 2007-04-04 -S000006500 snoRNA_gene snR34 SNR34 chromosome 12 L000001972 12 899180 899382 W 2007-05-10 2000-05-19|2007-05-10 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U2826 and U2880 -S000036763 noncoding_exon snR34 12 899180 899382 W 2007-05-10 2000-05-19|2007-05-10 -S000004381 ORF Verified YLR389C STE23 metalloendopeptidase chromosome 12 L000003081 12 902660 899577 C 2004-02-05 2004-02-05|1996-07-31 Metalloprotease; involved in N-terminal processing of pro-a-factor to mature form; expressed in both haploids and diploids; one of two yeast homologs of human insulin-degrading enzyme (hIDE); homolog Axl1p is also involved in processing of pro-a-factor -S000037885 CDS YLR389C 12 902660 899577 C 2004-02-05 2004-02-05|1996-07-31 -S000004382 ORF Verified YLR390W ECM19 chromosome 12 L000003894 12 903066 903404 W 2004-02-05 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000030926 CDS YLR390W 12 903066 903404 W 2004-02-05 1996-07-31 -S000006429 ORF Verified YLR390W-A CCW14 ICWP|YLR391W|SSR1|YLR391W-A chromosome 12 L000004428 12 903724 904440 W 2004-02-05 1997-07-30 Covalently linked cell wall glycoprotein; present in the inner layer of the cell wall -S000037801 CDS YLR390W-A 12 903724 904440 W 2004-02-05 1997-07-30 -S000004384 ORF Verified YLR392C ART10 chromosome 12 12 906305 904749 C 2004-02-05 1996-07-31 Protein of unknown function that contains 2 PY motifs; ubiquinated by Rsp5p; overexpression confers resistance to arsenite; green fluorescent protein (GFP)-fusion protein localizes it to the cytoplasm; non-essential gene -S000031038 CDS YLR392C 12 906305 904749 C 2004-02-05 1996-07-31 -S000004385 ORF Verified YLR393W ATP10 chromosome 12 L000000147 12 907079 907918 W 2004-02-05 1996-07-31 Assembly factor for the F0 sector of mitochondrial F1F0 ATP synthase; mitochondrial inner membrane protein; interacts genetically with ATP6 -S000032047 CDS YLR393W 12 907079 907918 W 2004-02-05 1996-07-31 -S000004386 ORF Verified YLR394W CST9 SUMO ligase CST9|ZIP3 chromosome 12 L000002996 12 907950 909398 W 2004-02-05 1996-07-31 SUMO E3 ligase; required for synaptonemal complex formation; localizes to synapsis initiation sites on meiotic chromosomes; associates with centromeres early in meiosis, then with chromosome axes and finally with double-strand break sites that are engaged in repair by crossovers; potential Cdc28p substrate -S000032126 CDS YLR394W 12 907950 909398 W 2004-02-05 1996-07-31 -S000004387 ORF Verified YLR395C COX8 cytochrome c oxidase subunit VIII chromosome 12 L000000392 12 909965 909729 C 2004-02-05 1996-07-31 Subunit VIII of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain -S000032155 CDS YLR395C 12 909965 909729 C 2004-02-05 1996-07-31 -S000004388 ORF Verified YLR396C VPS33 tethering complex ATP-binding subunit VPS33|VPT33|VPL25|VAM5|SLP1|PEP14|MET27|CLS14 chromosome 12 L000002475 12 912310 910235 C 2004-02-05 1996-07-31 ATP-binding protein that is a subunit of the HOPS and CORVET complexes; essential for protein sorting, vesicle docking, and fusion at the vacuole; binds to SNARE domains -S000032235 CDS YLR396C 12 912310 910235 C 2004-02-05 1996-07-31 -S000004389 ORF Verified YLR397C AFG2 AAA family ATPase AFG2|DRG1 chromosome 12 L000000056 12 914892 912550 C 2004-02-05 1996-07-31 ATPase of the CDC48/PAS1/SEC18 (AAA) family, forms a hexameric complex; is essential for pre-60S maturation and release of several preribosome maturation factors; releases Rlp24p from purified pre-60S particles in vitro; target of the ribosomal biosynthesis inhibitor diazaborine; may be involved in degradation of aberrant mRNAs -S000032306 CDS YLR397C 12 914892 912550 C 2004-02-05 1996-07-31 -S000004390 ORF Verified YLR398C SKI2 SKI complex RNA helicase subunit SKI2 chromosome 12 L000001903 12 919019 915156 C 2004-02-05 1996-07-31 Ski complex component and putative RNA helicase; mediates 3'-5' RNA degradation by the cytoplasmic exosome; null mutants have superkiller phenotype of increased viral dsRNAs and are synthetic lethal with mutations in 5'-3' mRNA decay; mutations in the human ortholog, SKIV2L, causes Syndromic diarrhea/Trichohepatoenteric (SD/THE) syndrome -S000033167 CDS YLR398C 12 919019 915156 C 2004-02-05 1996-07-31 -S000130185 ARS ARS1228 chromosome 12 12 919800 920994 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028682 ORF Dubious YLR399W-A chromosome 12 12 920869 920973 W 2004-02-05 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the characterized ORF BDF1/YLR399C -S000032553 CDS YLR399W-A 12 920869 920973 W 2004-02-05 2003-07-29 -S000004391 ORF Verified YLR399C BDF1 chromatin-binding protein BDF1 chromosome 12 L000000165 12 921596 919536 C 2004-02-05 1996-07-31 Protein involved in transcription initiation; functions at TATA-containing promoters; associates with the basal transcription factor TFIID; contains two bromodomains; corresponds to the C-terminal region of mammalian TAF1; redundant with Bdf2p; BDF1 has a paralog, BDF2, that arose from the whole genome duplication -S000033234 CDS YLR399C 12 921596 919536 C 2004-02-05 1996-07-31 -S000004392 ORF Dubious YLR400W chromosome 12 12 922063 922536 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031650 CDS YLR400W 12 922063 922536 W 2004-02-05 1996-07-31 -S000004393 ORF Verified YLR401C DUS3 tRNA dihydrouridine synthase DUS3 chromosome 12 12 924448 922442 C 2006-01-09 1996-07-31|2006-01-09 Dihydrouridine synthase; member of a widespread family of conserved proteins including Smm1p, Dus1p, and Dus4p; contains a consensus oleate response element (ORE) in its promoter region; forms nuclear foci upon DNA replication stress -S000031698 CDS YLR401C 12 924448 922442 C 2006-01-09 1996-07-31|2006-01-09 -S000004394 ORF Dubious YLR402W chromosome 12 12 924889 925080 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032705 CDS YLR402W 12 924889 925080 W 2011-02-03 1996-07-31|2011-02-03 -S000004395 ORF Verified YLR403W SFP1 zinc-coordinating transcription factor SFP1|[ISP+]|[ISP(+)] chromosome 12 L000001872 12 925568 927619 W 2011-02-03 1996-07-31 Regulates transcription of ribosomal protein and biogenesis genes; regulates response to nutrients and stress, G2/M transitions during mitotic cell cycle and DNA-damage response, and modulates cell size; regulated by TORC1 and Mrs6p; sequence of zinc finger, ChIP localization data, and protein-binding microarray (PBM) data, and computational analyses suggest it binds DNA directly at highly active RP genes and indirectly through Rap1p at others; can form the [ISP+] prion -S000032808 CDS YLR403W 12 925568 927619 W 2011-02-03 1996-07-31 -S000004396 ORF Verified YLR404W SEI1 seipin|FLD1 chromosome 12 12 928743 929600 W 2011-02-03 1996-07-31 Seipin involved in lipid droplet (LD) assembly; controls lipid particle morphology, number, and size; promotes initiation of LD formation on the ER; ensures that LDs bud from the ER towards the cytosolic side of the membrane; forms a complex with Ldb16p at ER-LD contact sites, stabilizing these sites; null mutants have localized accumulation of phosphatidic acid (PA) marker proteins; BSCL2, human homolog implicated in congenital lipodystrophy, complements yeast null mutant -S000032908 CDS YLR404W 12 928743 929600 W 2011-02-03 1996-07-31 -S000004397 ORF Verified YLR405W DUS4 tRNA dihydrouridine synthase chromosome 12 12 929789 930892 W 2011-02-03 1996-07-31 Dihydrouridine synthase; member of a widespread family of conserved proteins including Smm1p, Dus1p, and Dus3p -S000034865 CDS YLR405W 12 929789 930892 W 2011-02-03 1996-07-31 -S000130186 ARS ARS1230 chromosome 12 12 930891 931064 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004398 ORF Verified YLR406C RPL31B eL31|ribosomal 60S subunit protein L31B|L31e|YL28|L34B|L31B chromosome 12 L000004463 12 931755 931065 C 2011-02-03 1999-07-17|1996-07-31 Ribosomal 60S subunit protein L31B; associates with karyopherin Sxm1p; loss of both Rpl31p and Rpl39p confers lethality; homologous to mammalian ribosomal protein L31, no bacterial homolog; RPL31B has a paralog, RPL31A, that arose from the whole genome duplication -S000034912 CDS YLR406C 12 931349 931065 C 2011-02-03 1999-07-17|1996-07-31 -S000034911 CDS YLR406C 12 931755 931699 C 2011-02-03 1999-07-17|1996-07-31 -S000034913 intron YLR406C 12 931698 931350 C 2011-02-03 1999-07-17|1996-07-31 -S000028683 ORF Uncharacterized YLR406C-A chromosome 12 12 932355 932206 C 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole -S000032554 CDS YLR406C-A 12 932355 932206 C 2011-02-03 2003-07-29 -S000004399 ORF Uncharacterized YLR407W chromosome 12 12 932967 933653 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; null mutant displays elongated buds and a large fraction of budded cells have only one nucleus -S000035114 CDS YLR407W 12 932967 933653 W 2011-02-03 1996-07-31|2011-02-03 -S000004400 ORF Verified YLR408C BLS1 BLB1 chromosome 12 12 934253 933885 C 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; green fluorescent protein (GFP)-fusion protein localizes to the endosome; YLR408C is not an essential gene -S000035167 CDS YLR408C 12 934253 933885 C 2011-02-03 1996-07-31 -S000004401 ORF Verified YLR409C UTP21 rRNA-processing protein UTP21 chromosome 12 12 937233 934414 C 2011-02-03 1996-07-31 Subunit of U3-containing 90S preribosome and SSU processome complexes; involved in production of 18S rRNA and assembly of small ribosomal subunit; synthetic defect with STI1 Hsp90 cochaperone; human homolog linked to glaucoma; Small Subunit processome is also known as SSU processome -S000035261 CDS YLR409C 12 937233 934414 C 2011-02-03 1996-07-31 -S000004402 ORF Verified YLR410W VIP1 inositol polyphosphate kinase VIP1 chromosome 12 L000004547 12 937541 940981 W 2011-02-03 1996-07-31 Inositol hexakisphosphate and inositol heptakisphosphate kinase; inositol heptakisphosphate (IP7) production is important for phosphate signaling; involved in cortical actin cytoskeleton function, and invasive pseudohyphal growth analogous to S. pombe asp1; inositol hexakisphosphate is also known as IP6 -S000035093 CDS YLR410W 12 937541 940981 W 2011-02-03 1996-07-31 -S000007093 long_terminal_repeat YLRWdelta22 chromosome 12 12 941192 941523 W 2011-02-03 2000-05-19 Ty2 LTR -S000007100 LTR_retrotransposon YLRWTy2-1 Ty2 chromosome 12 12 941192 947150 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007379 transposable_element_gene YLR410W-A gag protein chromosome 12 12 941483 942799 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034166 CDS YLR410W-A 12 941483 942799 W 2011-02-03 1999-07-17 -S000007380 transposable_element_gene YLR410W-B gag-pol fusion protein chromosome 12 12 941483 946796 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034173 CDS YLR410W-B 12 941483 942775 W 2011-02-03 1999-07-17 -S000034174 CDS YLR410W-B 12 942777 946796 W 2011-02-03 1999-07-17 -S000034175 plus_1_translational_frameshift YLR410W-B 12 942776 942776 W 2011-02-03 1999-07-17 -S000007094 long_terminal_repeat YLRWdelta23 chromosome 12 12 946819 947150 W 2011-02-03 2000-05-19 Ty2 LTR -S000004403 ORF Verified YLR411W CTR3 high-affinity Cu transporter CTR3 chromosome 12 L000003441 12 947253 947978 W 2011-02-03 1996-07-31 High-affinity copper transporter of the plasma membrane; acts as a trimer; gene is disrupted by a Ty2 transposon insertion in many laboratory strains of S. cerevisiae -S000035281 CDS YLR411W 12 947253 947978 W 2011-02-03 1996-07-31 -S000004404 ORF Verified YLR412W BER1 chromosome 12 S000116954 12 948368 949192 W 2011-02-03 1996-07-31 Protein involved in microtubule-related processes; GFP-fusion protein localizes to the cytoplasm and is induced in response to the DNA-damaging agent MMS; YLR412W is not an essential gene; similar to Arabidopsis SRR1 gene -S000036189 CDS YLR412W 12 948368 949192 W 2011-02-03 1996-07-31 -S000028572 ORF Uncharacterized YLR412C-A chromosome 12 12 950473 950267 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000031300 CDS YLR412C-A 12 950473 950267 C 2011-02-03 2003-07-29 -S000004405 ORF Verified YLR413W INA1 chromosome 12 12 951156 953183 W 2011-02-03 1996-07-31 Protein of unknown function; not an essential gene; YLR413W has a paralog, FAT3, that arose from the whole genome duplication -S000036302 CDS YLR413W 12 951156 953183 W 2011-02-03 1996-07-31 -S000004406 ORF Verified YLR414C PUN1 chromosome 12 12 954144 953353 C 2011-02-03 1996-07-31 Plasma membrane protein with a role in cell wall integrity; co-localizes with Sur7p in punctate membrane patches; null mutant displays decreased thermotolerance; transcription induced upon cell wall damage and metal ion stress -S000036366 CDS YLR414C 12 954144 953353 C 2011-02-03 1996-07-31 -S000004407 ORF Uncharacterized YLR415C chromosome 12 12 954597 954259 C 2011-02-03 1996-07-31 Putative protein of unknown function; YLR415C is not an essential gene -S000036440 CDS YLR415C 12 954597 954259 C 2011-02-03 1996-07-31 -S000004408 ORF Dubious YLR416C chromosome 12 12 954889 954491 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037090 CDS YLR416C 12 954889 954491 C 2011-02-03 1996-07-31 -S000004409 ORF Verified YLR417W VPS36 ESCRT-II subunit protein VPS36|VPL11|VAC3|GRD12 chromosome 12 L000002958 12 955010 956710 W 2011-02-03 1996-07-31 Component of the ESCRT-II complex; contains the GLUE (GRAM Like Ubiquitin binding in EAP45) domain which is involved in interactions with ESCRT-I and ubiquitin-dependent sorting of proteins into the endosome; plays a role in the formation of mutant huntingtin (Htt) aggregates in yeast -S000037244 CDS YLR417W 12 955010 956710 W 2011-02-03 1996-07-31 -S000004410 ORF Verified YLR418C CDC73 chromosome 12 L000002792 12 958095 956914 C 2011-02-03 1996-07-31 Component of the Paf1p complex; binds to and modulates the activity of RNA polymerases I and II; required for expression of certain genes, modification of some histones, and telomere maintenance; involved in transcription elongation as demonstrated by the G-less-based run-on (GLRO) assay; protein abundance increases in response to DNA replication stress; human homolog, parafibromin, is a tumour suppressor linked to breast, renal and gastric cancers -S000037277 CDS YLR418C 12 958095 956914 C 2011-02-03 1996-07-31 -S000004411 ORF Uncharacterized YLR419W putative helicase chromosome 12 12 958428 962735 W 2011-02-03 1996-07-31 Putative helicase with limited sequence similarity to human Rb protein; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YLR419W is not an essential gene -S000037392 CDS YLR419W 12 958428 962735 W 2011-02-03 1996-07-31 -S000006652 tRNA_gene tL(UAA)L chromosome 12 L000003658 12 963055 962972 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000037412 noncoding_exon tL(UAA)L 12 963055 962972 C 2011-02-03 2000-05-19 -S000007075 long_terminal_repeat YLRWdelta24 YLRCdelta24 chromosome 12 12 963230 963545 W 2011-02-03 2000-05-19|2007-04-03 Ty1 LTR -S000004412 ORF Verified YLR420W URA4 dihydroorotase chromosome 12 L000002433 12 963785 964879 W 304 2011-02-03 1996-07-31 Dihydroorotase; catalyzes the third enzymatic step in the de novo biosynthesis of pyrimidines, converting carbamoyl-L-aspartate into dihydroorotate -S000031350 CDS YLR420W 12 963785 964879 W 2011-02-03 1996-07-31 -S000004413 ORF Verified YLR421C RPN13 proteasome regulatory particle lid subunit RPN13 chromosome 12 12 965560 965090 C 2011-02-03 1996-07-31 Subunit of the 19S regulatory particle of the 26S proteasome lid; acts as a ubiquitin receptor for the proteasome; null mutants accumulate ubiquitinated Gcn4p and display decreased 26S proteasome stability; protein abundance increases in response to DNA replication stress -S000031396 CDS YLR421C 12 965560 965090 C 2011-02-03 1996-07-31 -S000004414 ORF Verified YLR422W DCK1 chromosome 12 12 965897 971695 W 2011-02-03 1996-07-31 Dock family protein (Dedicator Of CytoKinesis), homolog of human DOCK1; upstream component for regulation through the small GTPase Rho5p; may form a complex with Lmo1p that acts as a GEF for Rho5p; interacts with Ino4p; cytoplasmic protein that relocates to mitochondria under oxidative stress; implicated in mitophagy; not an essential protein; DOCK proteins act as guanine nucleotide exchange factors -S000032478 CDS YLR422W 12 965897 971695 W 2011-02-03 1996-07-31 -S000004415 ORF Verified YLR423C ATG17 protein kinase regulatory subunit ATG17|APG17 chromosome 12 12 973170 971917 C 2011-02-03 1996-07-31 Scaffold protein responsible for phagophore assembly site organization; regulatory subunit of an autophagy-specific complex that includes Atg1p and Atg13p; stimulates Atg1p kinase activity; human ortholog RB1CC1/FIP200 interacts with p53, which inhibits autophagy in human cells -S000032513 CDS YLR423C 12 973170 971917 C 2011-02-03 1996-07-31 -S000004416 ORF Verified YLR424W SPP382 mRNA splicing protein SPP382|NTR1|CCF8 chromosome 12 12 973395 975521 W 2011-02-03 1996-07-31 Essential protein that forms a dimer with Ntr2p; also forms a trimer, with Ntr2p and Prp43p, that is involved in spliceosome disassembly; found also in a multisubunit complex with the splicing factor Clf1p; suppressor of prp38-1 mutation -S000032667 CDS YLR424W 12 973395 975521 W 2011-02-03 1996-07-31 -S000006672 tRNA_gene tN(GUU)L chromosome 12 L000003657 12 976056 975983 C 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000030743 noncoding_exon tN(GUU)L 12 976056 975983 C 2011-02-03 2000-05-19 -S000007076 long_terminal_repeat YLRCdelta25 chromosome 12 12 976589 976258 C 2011-02-03 2000-05-19 Ty2 LTR -S000007082 LTR_retrotransposon YLRCTy2-2 Ty2 chromosome 12 12 981700 976258 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C -S000007077 long_terminal_repeat YLRCdelta26 chromosome 12 12 981700 981369 C 2011-02-03 2000-05-19 Ty2 LTR -S000004417 ORF Verified YLR425W TUS1 Rho family guanine nucleotide exchange factor TUS1|SOP10 chromosome 12 L000004619|L000004622 12 982894 986817 W 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) that modulates Rho1p activity; involved in the cell integrity signaling pathway; interacts with Rgl1p; localization of Tus1p to the bed neck is regulated by Rgl1p; multicopy suppressor of tor2 mutation and ypk1 ypk2 double mutation; potential Cdc28p substrate -S000033357 CDS YLR425W 12 982894 986817 W 2011-02-03 1996-07-31 -S000004418 ORF Uncharacterized YLR426W TDA5 chromosome 12 12 987062 988113 W 2011-02-03 1996-07-31 Putative protein of unknown function; detected in highly purified mitochondria in high-throughput studies; proposed to be involved in resistance to mechlorethamine and streptozotocin; null mutant sensitive to expression of top1-T722A allele -S000033424 CDS YLR426W 12 987062 987141 W 2011-02-03 1996-07-31 -S000033425 CDS YLR426W 12 987213 988113 W 2011-02-03 1996-07-31 -S000033426 intron YLR426W 12 987142 987212 W 2011-02-03 1996-07-31 -S000004419 ORF Verified YLR427W MAG2 chromosome 12 12 988428 990440 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; induced in response to mycotoxin patulin; ubiquitinated protein similar to the human ring finger motif protein RNF10; predicted to be involved in repair of alkylated DNA due to interaction with MAG1 -S000033509 CDS YLR427W 12 988428 990440 W 2011-02-03 1996-07-31 -S000004421 ORF Verified YLR429W CRN1 chromosome 12 L000004279 12 990777 992732 W 2011-02-03 1996-07-31 Coronin; cortical actin cytoskeletal component that associates with the Arp2p/Arp3p complex to regulate its activity; plays a role in regulation of actin patch assembly -S000034435 CDS YLR429W 12 990777 992732 W 2011-02-03 1996-07-31 -S000004420 ORF Dubious YLR428C chromosome 12 12 990961 990617 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CRN1 -S000033519 CDS YLR428C 12 990961 990617 C 2011-02-03 1996-07-31 -S000004422 ORF Verified YLR430W SEN1 putative DNA/RNA helicase SEN1|NRD2|CIK3 chromosome 12 L000001862 12 993434 1000129 W 2011-02-03 1996-07-31 ATP-dependent 5' to 3' RNA/DNA and DNA helicase; subunit of the exosome-associated Nrd1p complex that mediates 3' end formation of snRNAs, snoRNAs, CUTs and some mRNAs; helicase-independent role in transcription-coupled repair; coordinates replication with transcription, associating with moving forks and preventing errors that occur when forks encounter transcribed regions; homolog of Senataxin, implicated in Ataxia-Oculomotor Apraxia 2 and a dominant form of juvenile ALS -S000035580 CDS YLR430W 12 993434 1000129 W 2011-02-03 1996-07-31 -S000004423 ORF Verified YLR431C ATG23 CVT23 chromosome 12 12 1001703 1000342 C 2011-02-03 1996-07-31 Peripheral membrane protein required for autophagy and CVT; required for cytoplasm-to-vacuole targeting (Cvt) pathway and efficient macroautophagy; cycles between the phagophore assembly site (PAS) and non-PAS locations; forms a complex with Atg9p and Atg27p -S000035614 CDS YLR431C 12 1001703 1000342 C 2011-02-03 1996-07-31 -S000004424 ORF Verified YLR432W IMD3 IMP dehydrogenase IMD3 chromosome 12 12 1002557 1004128 W 2011-02-03 1996-07-31 Inosine monophosphate dehydrogenase; catalyzes the rate-limiting step in the de novo synthesis of GTP; member of a four-gene family in S. cerevisiae, constitutively expressed; IMD3 has a paralog, IMD4, that arose from the whole genome duplication -S000035774 CDS YLR432W 12 1002557 1004128 W 2011-02-03 1996-07-31 -S000004425 ORF Verified YLR433C CNA1 calcineurin catalytic subunit A|CMP1 chromosome 12 L000000370 12 1006008 1004347 C 2011-02-03 1996-07-31 Calcineurin A; one isoform (the other is Cmp2p) of the catalytic subunit of calcineurin, a Ca++/calmodulin-regulated protein phosphatase which regulates Crz1p (a stress-response transcription factor), the other calcineurin subunit is CNB1; regulates the function of Aly1p alpha-arrestin; CNA1 has a paralog, CMP2, that arose from the whole genome duplication -S000036640 CDS YLR433C 12 1006008 1004347 C 2011-02-03 1996-07-31 -S000004427 ORF Verified YLR435W TSR2 chromosome 12 12 1006378 1006995 W 2011-02-03 2003-09-22|1996-07-31 Protein with a potential role in pre-rRNA processing -S000036797 CDS YLR435W 12 1006378 1006995 W 2011-02-03 2003-09-22|1996-07-31 -S000004426 ORF Dubious YLR434C chromosome 12 12 1006408 1006025 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF TSR2/YLR435W -S000036704 CDS YLR434C 12 1006408 1006025 C 2011-02-03 1996-07-31 -S000118481 ARS ARS1232 ARSXII-1007 chromosome 12 12 1007186 1007475 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178144 ARS_consensus_sequence ARS1232 12 1007235 1007251 W 2014-11-18 2014-11-18 -S000004428 ORF Verified YLR436C ECM30 chromosome 12 L000003900 12 1011245 1007421 C 2011-02-03 1996-07-31 Protein of unknown function; may play a role in cell wall biosynthesis, mutants have abormal relative levels of mannose and glucose and have Gap1p sorting and transport defects; (GFP)-fusion protein localizes to the cytoplasm -S000036822 CDS YLR436C 12 1011245 1007421 C 2011-02-03 1996-07-31 -S000004429 ORF Verified YLR437C DIF1 chromosome 12 12 1012023 1011622 C 2011-02-03 1996-07-31 Protein that regulates nuclear localization of Rnr2p and Rnr4p; phosphorylated by Dun1p in response to DNA damage and degraded; N-terminal half shows similarity to S. pombe Spd1 protein; DIF1 has a paralog, SML1, that arose from the whole genome duplication -S000036873 CDS YLR437C 12 1012023 1011622 C 2011-02-03 1996-07-31 -S000004430 ORF Verified YLR438W CAR2 ornithine-oxo-acid transaminase|cargB chromosome 12 L000000217 12 1012501 1013775 W 330 2011-02-03 1996-07-31 L-ornithine transaminase (OTAse); catalyzes the second step of arginine degradation, expression is dually-regulated by allophanate induction and a specific arginine induction process; not nitrogen catabolite repression sensitive; protein abundance increases in response to DNA replication stress; human homolog OAT complements yeast null mutant -S000037652 CDS YLR438W 12 1012501 1013775 W 2011-02-03 1996-07-31 -S000028684 ORF Dubious YLR437C-A chromosome 12 12 1012686 1012459 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CAR2/YLR438W -S000032558 CDS YLR437C-A 12 1012686 1012459 C 2011-02-03 2003-07-29 -S000118482 ARS ARS1233 ARSXII-1014 chromosome 12 12 1013795 1014022 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178145 ARS_consensus_sequence ARS1233 12 1013861 1013845 C 2014-11-18 2014-11-18 -S000006434 ORF Verified YLR438C-A LSM3 U4/U6-U5 snRNP complex subunit LSM3|USS2|SMX4 chromosome 12 L000004507 12 1014178 1013909 C 2011-02-03 1999-07-17 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; protein increases in abundance and relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000037756 CDS YLR438C-A 12 1014178 1013909 C 2011-02-03 1999-07-17 -S000004431 ORF Verified YLR439W MRPL4 mitochondrial 54S ribosomal protein YmL4|YmL4 chromosome 12 L000002523|L000001160 12 1014491 1015450 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; homolog of prokaryotic L29 ribosomal protein; located at the ribosomal tunnel exit -S000037711 CDS YLR439W 12 1014491 1015450 W 2011-02-03 1996-07-31 -S000004432 ORF Verified YLR440C SEC39 DSL3 chromosome 12 12 1017697 1015568 C 2011-02-03 1996-07-31 Component of the Dsl1p tethering complex; this complex interacts with ER SNAREs Sec20p and Use1p; mediates Sey1p-independent homotypic ER fusion; proposed to be involved in protein secretion; localizes to the ER and nuclear envelope -S000030454 CDS YLR440C 12 1017697 1015568 C 2011-02-03 1996-07-31 -S000004433 ORF Verified YLR441C RPS1A eS1|ribosomal 40S subunit protein S1A|S1e|rp10A|S1A|RP10A chromosome 12 L000001664 12 1018908 1018141 C 2011-02-03 1996-07-31 Ribosomal protein 10 (rp10) of the small (40S) subunit; homologous to mammalian ribosomal protein S3A, no bacterial homolog; RPS1A has a paralog, RPS1B, that arose from the whole genome duplication -S000030594 CDS YLR441C 12 1018908 1018141 C 2011-02-03 1996-07-31 -S000004434 ORF Verified YLR442C SIR3 chromatin-silencing protein SIR3|STE8|MAR2|CMT1 chromosome 12 L000001896 12 1022251 1019315 C 337 2011-02-03 1996-07-31 Silencing protein; interacts with Sir2p, Sir4p, and histone H3/H4 tails to establish transcriptionally silent chromatin; required for spreading of silenced chromatin; recruited to chromatin through interaction with Rap1p; C-terminus assumes variant winged helix-turn-helix (wH) fold that mediates homodimerization, which is critical for holo-SIR complex loading; required for telomere hypercluster formation in quiescent yeast cells; has paralog ORC1 from whole genome duplication -S000030676 CDS YLR442C 12 1022251 1019315 C 2011-02-03 1996-07-31 -S000004435 ORF Verified YLR443W ECM7 ZRG15 chromosome 12 L000003882 12 1022625 1023971 W 2011-02-03 1996-07-31 Putative integral membrane protein with a role in calcium uptake; non-essential protein; mutant has cell wall defects and Ca+ uptake deficiencies; transcription is induced under conditions of zinc deficiency -S000031587 CDS YLR443W 12 1022625 1023971 W 2011-02-03 1996-07-31 -S000004436 ORF Dubious YLR444C chromosome 12 12 1023988 1023686 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031628 CDS YLR444C 12 1023988 1023686 C 2011-02-03 1996-07-31 -S000118483 ARS ARS1234 ARSXII-1024 chromosome 12 12 1024026 1024186 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000004437 ORF Verified YLR445W GMC2 chromosome 12 12 1024189 1024837 W 2011-02-03 2004-02-03|1996-07-31 Protein involved in meiotic crossing over; component of the Synaptonemal Complex (SC) along with Ecm11p; required for the efficient loading of the SC transverse filament protein, Zip1p; promotes SUMOylation of Ecm11p; mutants are delayed in meiotic nuclear division and are defective in synaptonemal complex assembly; transcription is regulated by Ume6p and induced in response to alpha factor -S000031804 CDS YLR445W 12 1024189 1024572 W 2011-02-03 2004-02-03|1996-07-31 -S000031805 CDS YLR445W 12 1024655 1024837 W 2011-02-03 2004-02-03 -S000031806 intron YLR445W 12 1024573 1024654 W 2011-02-03 2004-02-03 -S000004438 ORF Uncharacterized YLR446W hexokinase chromosome 12 12 1025214 1026515 W 2011-02-03 1996-07-31 Putative hexokinase; transcript is upregulated during sporulation and the unfolded protein response; YLR446W is not an essential gene -S000031911 CDS YLR446W 12 1025214 1026515 W 2011-02-03 1996-07-31 -S000004439 ORF Verified YLR447C VMA6 H(+)-transporting V0 sector ATPase subunit d chromosome 12 L000002461 12 1027893 1026856 C 2011-02-03 1996-07-31 Subunit d of the V0 integral membrane domain of V-ATPase; part of the electrogenic proton pump found in the endomembrane system; required for V1 domain assembly on the vacuolar membrane; the V0 integral membrane domain of vacuolar H+-ATPase (V-ATPase) has five subunits -S000032768 CDS YLR447C 12 1027893 1026856 C 2011-02-03 1996-07-31 -S000004440 ORF Verified YLR448W RPL6B eL6|ribosomal 60S subunit protein L6B|L6e|rp18|YL16|L6B|L17B chromosome 12 L000001714 12 1028854 1029768 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L6B; binds 5.8S rRNA; homologous to mammalian ribosomal protein L6, no bacterial homolog; RPL6B has a paralog, RPL6A, that arose from the whole genome duplication -S000032930 CDS YLR448W 12 1028854 1028868 W 2011-02-03 1996-07-31 -S000032931 CDS YLR448W 12 1029253 1029768 W 2011-02-03 1996-07-31 -S000032932 intron YLR448W 12 1028869 1029252 W 2011-02-03 1996-07-31 -S000004441 ORF Verified YLR449W FPR4 peptidylprolyl isomerase FPR4 chromosome 12 L000004352 12 1030834 1032012 W 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (PPIase); nuclear proline isomerase; affects expression of multiple genes via its role in nucleosome assembly; catalyzes isomerization of proline residues in histones H3 and H4, which affects lysine methylation of those histones; PPIase domain acts as a transcriptional repressor when tethered to DNA by lexA, and repressor activity is dependent on PPIase activity; contains a nucleoplasmin-like fold and can form pentamers -S000033009 CDS YLR449W 12 1030834 1032012 W 2011-02-03 1996-07-31 -S000004442 ORF Verified YLR450W HMG2 hydroxymethylglutaryl-CoA reductase (NADPH) HMG2 chromosome 12 L000000790 12 1032627 1035764 W 343 2011-02-03 1996-07-31 HMG-CoA reductase; converts HMG-CoA to mevalonate, a rate-limiting step in sterol biosynthesis; one of two isozymes; overproduction induces assembly of peripheral ER membrane arrays and short nuclear-associated membrane stacks; forms foci at nuclear periphery upon DNA replication stress; HMG2 has a paralog, HMG1, that arose from the whole genome duplication; human homolog HMGCR can complement yeast hmg2 mutant -S000033695 CDS YLR450W 12 1032627 1035764 W 2011-02-03 1996-07-31 -S000004443 ORF Verified YLR451W LEU3 leucine-responsive transcriptional regulator LEU3 chromosome 12 L000000944 12 1036093 1038753 W 346 2011-02-03 1996-07-31 Zinc-knuckle transcription factor, repressor and activator; regulates genes involved in branched chain amino acid biosynthesis and ammonia assimilation; acts as a repressor in leucine-replete conditions and as an activator in the presence of alpha-isopropylmalate, an intermediate in leucine biosynthesis that accumulates during leucine starvation -S000033823 CDS YLR451W 12 1036093 1038753 W 2011-02-03 1996-07-31 -S000004444 ORF Verified YLR452C SST2 GTPase-activating protein SST2 chromosome 12 L000002093 12 1041366 1039270 C 344 2011-02-03 1996-07-31 GTPase-activating protein for Gpa1p; regulates desensitization to alpha factor pheromone; also required to prevent receptor-independent signaling of the mating pathway; member of the RGS (regulator of G-protein signaling) family -S000034630 CDS YLR452C 12 1041366 1039270 C 2011-02-03 1996-07-31 -S000004445 ORF Verified YLR453C RIF2 chromosome 12 L000003513 12 1042986 1041799 C 2011-02-03 1996-07-31 Protein that binds to the Rap1p C-terminus; acts synergistically with Rif1p to help control telomere length and establish telomeric silencing; deletion results in telomere elongation; RIF2 has a paralog, ORC4, that arose from the whole genome duplication -S000034787 CDS YLR453C 12 1042986 1041799 C 2011-02-03 1996-07-31 -S000004446 ORF Uncharacterized YLR454W FMP27 chromosome 12 12 1043998 1051884 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000034985 CDS YLR454W 12 1043998 1051884 W 2011-02-03 1996-07-31 -S000006608 tRNA_gene tI(AAU)L2 chromosome 12 L000003656 12 1052144 1052071 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000033933 noncoding_exon tI(AAU)L2 12 1052144 1052071 C 2011-02-03 2000-05-19 -S000007078 long_terminal_repeat YLRCdelta27 chromosome 12 12 1052632 1052303 C 2011-02-03 2000-05-19 Ty1 LTR -S000004447 ORF Verified YLR455W PDP3 chromosome 12 12 1053629 1054543 W 2011-02-03 1996-07-31 Component of the NuA3b histone acetyltransferase complex; regulates interaction between NuA3b and H3K36me3 at the transcribed regions of genes; contains PWWP domain; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO); protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia -S000035931 CDS YLR455W 12 1053629 1054543 W 2011-02-03 1996-07-31 -S000004448 ORF Uncharacterized YLR456W pyridoxal 5'-phosphate synthase chromosome 12 12 1055070 1055684 W 2011-02-03 1996-07-31 Protein of unknown function; predicted to encode a pyridoxal 5'-phosphate synthase based on sequence similarity but purified protein does not possess this activity, nor does it bind flavin mononucleotide (FMN); null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2; YLR456W has a paralog, YPR172W, that arose from the whole genome duplication -S000036078 CDS YLR456W 12 1055070 1055684 W 2011-02-03 1996-07-31 -S000004450 ORF Dubious YLR458W chromosome 12 12 1056455 1056835 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of essential NBP1/YLR457C gene required for mitosis -S000036948 CDS YLR458W 12 1056455 1056835 W 2011-02-03 1996-07-31 -S000004449 ORF Verified YLR457C NBP1 chromosome 12 L000001234 12 1056771 1055812 C 2011-02-03 1996-07-31 Spindle pole body (SPB) component; required for the insertion of the duplication plaque into the nuclear membrane during SPB duplication; essential for bipolar spindle formation; component of the Mps2p-Bbp1p complex; NBP1 has a paralog, YPR174C, that arose from the whole genome duplication -S000036128 CDS YLR457C 12 1056771 1055812 C 2011-02-03 1996-07-31 -S000004451 ORF Verified YLR459W GAB1 GPI-anchor transamidase subunit GAB1|CDC91 chromosome 12 L000000290 12 1057334 1058518 W 2011-02-03 1996-07-31 GPI transamidase subunit; involved in attachment of glycosylphosphatidylinositol (GPI) anchors to proteins; may have a role in recognition of the attachment signal or of the lipid portion of GPI -S000037010 CDS YLR459W 12 1057334 1058518 W 2011-02-03 1996-07-31 -S000178146 ARS ARS1235 chromosome 12 12 1059439 1059923 2014-11-18 2014-11-18 Autonomously replicating sequence -S000178147 ARS_consensus_sequence ARS1235 12 1059718 1059702 C 2014-11-18 2014-11-18 -S000004452 ORF Uncharacterized YLR460C chromosome 12 12 1060887 1059757 C 2011-02-03 1996-07-31 Member of the quinone oxidoreductase family; up-regulated in response to the fungicide mancozeb; possibly up-regulated by iodine -S000037785 CDS YLR460C 12 1060887 1059757 C 2011-02-03 1996-07-31 -S000004453 ORF Verified YLR461W PAU4 seripauperin PAU4 chromosome 12 L000002731 12 1062919 1063281 W 2011-02-03 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme -S000029848 CDS YLR461W 12 1062919 1063281 W 2011-02-03 1996-07-31 -S000028982 telomere TEL12R chromosome 12 12 1064281 1078177 W 350 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XII; composed of an X element core sequence, X element combinatorial repeats, two distinct regions of telomeric repeats, and two long Y' elements -S000028984 telomeric_repeat TEL12R 12 1065031 1065155 W 2011-02-03 2003-09-09 Internal telomeric repeats on the right arm of Chromosome XII -S000028983 telomeric_repeat TEL12R 12 1071646 1071653 W 2011-02-03 2003-09-09 Internal telomeric repeats on the right arm of Chromosome XII -S000028985 X_element TEL12R 12 1064281 1064747 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028986 X_element_combinatorial_repeat TEL12R 12 1064748 1065030 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000028988 Y_prime_element TEL12R 12 1065156 1071645 W 2011-02-03 2003-09-09 Long telomeric Y' element on the right arm of Chromosome XII; more centromere-proximal of two long telomeric Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, 5 ORFs (YLR466W, YLR462W, YLR464W, YLR463C, YLR465C), and part of ORF YLR466C-B -S000028987 Y_prime_element TEL12R 12 1071654 1078177 W 2011-02-03 2003-09-09 Long telomeric Y' element on the right arm of Chromosome XII; more end-proximal of two long telomeric Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, ORFs YRF1-5/YLR467W and YLR467C-A, and part of ORF YLR466C-B -S000004454 ORF Uncharacterized YLR462W chromosome 12 12 1065956 1066564 W 2011-02-03 1996-07-31 Putative protein of unknown function with similarity to helicases; YLR462W is within the telomere on the right arm of chromosome XII -S000030870 CDS YLR462W 12 1065956 1066564 W 2011-02-03 1996-07-31 -S000004456 ORF Uncharacterized YLR464W chromosome 12 12 1066572 1067501 W 2011-02-03 1996-07-31 Putative protein of unknown function; intron is predicted but not detected experimentally; YLR464W overlaps the verified gene YRF1-4/YLR466W and two dubious ORFs YLR463C and YLR465C -S000031004 CDS YLR464W 12 1066572 1067084 W 2011-02-03 1996-07-31 -S000031005 CDS YLR464W 12 1067364 1067501 W 2011-02-03 1996-07-31 -S000031006 intron YLR464W 12 1067085 1067363 W 2011-02-03 1996-07-31 -S000004455 ORF Dubious YLR463C chromosome 12 12 1066816 1066265 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized ORFs YLR462W and YLR464W -S000030903 CDS YLR463C 12 1066816 1066265 C 2011-02-03 1996-07-31 -S000004458 ORF Verified YLR466W YRF1-4 Y' element ATP-dependent helicase protein 1 copy 4|YRF1 chromosome 12 12 1067087 1071235 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p -S000032053 CDS YLR466W 12 1067087 1071235 W 2011-02-03 1996-07-31 -S000004457 ORF Dubious YLR465C BSC3 chromosome 12 12 1067353 1067045 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 100% of YLR465C overlaps the uncharacterized ORF YLR464W and 86% of YLR465C overlaps the verified gene YRF1-4 -S000031044 CDS YLR465C 12 1067353 1067045 C 2011-02-03 1996-07-31 -S000028685 ORF Dubious YLR466C-A chromosome 12 12 1070869 1070387 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YRF1-4/YLR466W -S000032560 CDS YLR466C-A 12 1070869 1070387 C 2011-02-03 2003-07-29 -S000028686 ORF Dubious YLR466C-B chromosome 12 12 1071710 1071594 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032562 CDS YLR466C-B 12 1071710 1071594 C 2011-02-03 2003-07-29 -S000004459 ORF Verified YLR467W YRF1-5 Y' element ATP-dependent helicase protein 1 copy 5|YRF1 chromosome 12 12 1072508 1077898 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p -S000032127 CDS YLR467W 12 1072508 1077898 W 2011-02-03 1996-07-31 -S000028687 ORF Dubious YLR467C-A chromosome 12 12 1077532 1077050 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YRF1-4/YLR466W -S000032565 CDS YLR467C-A 12 1077532 1077050 C 2011-02-03 2003-07-29 -S000028690 ORF Dubious YML133W-B chromosome 13 13 827 1309 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized ORF YML133C -S000032587 CDS YML133W-B 13 827 1309 W 2003-07-29 2003-07-29 -S000028689 ORF Dubious YML133W-A chromosome 13 13 1610 2185 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized ORF YML133C -S000032568 CDS YML133W-A 13 1610 2185 W 2003-07-29 2003-07-29 -S000004602 ORF Uncharacterized YML133C Y' element ATP-dependent helicase chromosome 13 13 4684 461 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YML133C contains an intron -S000033211 CDS YML133C 13 3791 461 C 1996-07-31 1996-07-31 -S000033210 CDS YML133C 13 4684 3891 C 1996-07-31 1996-07-31 -S000033212 intron YML133C 13 3890 3792 C 1996-07-31 1996-07-31 -S000028918 telomere TEL13L chromosome 13 13 6344 1 C -102 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XIII; composed of an X element core sequence, X element combinatorial repeats, a short region of telomeric repeats, a short Y' element, and a short terminal region of telomeric repeats -S000028919 telomeric_repeat TEL13L 13 51 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XIII -S000028920 telomeric_repeat TEL13L 13 5585 5538 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome XIII -S000028921 X_element TEL13L 13 6344 5875 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XIII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028922 X_element_combinatorial_repeat TEL13L 13 5874 5586 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XIII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000028923 Y_prime_element TEL13L 13 5537 52 C 2003-09-09 2003-09-09 Telomeric short Y' element on the left arm of Chromosome XIII; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YML133C, YML133W-A, YML133W-B) -S000004601 ORF Verified YML132W COS3 chromosome 13 L000004061 13 7244 8383 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000033185 CDS YML132W 13 7244 8383 W 1996-07-31 1996-07-31 -S000004600 ORF Verified YML131W chromosome 13 13 10198 11295 W 2011-02-03 1996-07-31 Protein of unknown function; similar to medium chain dehydrogenase/reductases; expression induced by stresses including osmotic shock, DNA damaging agents, and other chemicals; GFP-fusion protein localizes to the cytoplasm; protein abundance increases in response to DNA replication stress -S000033094 CDS YML131W 13 10198 11295 W 2011-02-03 1996-07-31 -S000004599 ORF Verified YML130C ERO1 ER oxidoreductin chromosome 13 L000004013 13 13174 11483 C 2011-02-03 1996-07-31 Thiol oxidase required for oxidative protein folding in the ER; essential for maintaining ER redox balance; feedback regulated via reduction and oxidation of regulatory bonds; reduced Pdi1p activates Ero1p by direct reduction of Ero1p regulatory bonds; depletion of thiol substrates and accumulation of oxidized Pdi1p results in inactivation of Ero1p by both Pdi1p-mediated oxidation and autonomous oxidation of Ero1p regulatory bonds; ero1-1 mutation complemented by human ERO1L -S000032133 CDS YML130C 13 13174 11483 C 2011-02-03 1996-07-31 -S000004598 ORF Verified YML129C COX14 chromosome 13 L000000398 13 14753 14541 C 2011-02-03 1996-07-31 Mitochondrial cytochrome c oxidase (complex IV) assembly factor; also involved in translational regulation of Cox1p and prevention of Cox1p aggregation before assembly; associates with complex IV assembly intermediates and complex III/complex IV supercomplexes; located in the mitochondrial membrane -S000031027 CDS YML129C 13 14753 14541 C 2011-02-03 1996-07-31 -S000004597 ORF Verified YML128C MSC1 chromosome 13 13 16676 15135 C 2011-02-03 1996-07-31 Protein of unknown function; mutant is defective in directing meiotic recombination events to homologous chromatids; the authentic, non-tagged protein is detected in highly purified mitochondria and is phosphorylated -S000030934 CDS YML128C 13 16676 15135 C 2011-02-03 1996-07-31 -S000004596 ORF Verified YML127W RSC9 chromosome 13 13 17064 18809 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; DNA-binding protein involved in the synthesis of rRNA and in transcriptional repression and activation of genes regulated by the Target of Rapamycin (TOR) pathway -S000030913 CDS YML127W 13 17064 18809 W 2011-02-03 1996-07-31 -S000004595 ORF Verified YML126C ERG13 hydroxymethylglutaryl-CoA synthase|HMGS chromosome 13 L000004090 13 20535 19060 C 2011-02-03 1996-07-31 3-hydroxy-3-methylglutaryl-CoA (HMG-CoA) synthase; catalyzes the formation of HMG-CoA from acetyl-CoA and acetoacetyl-CoA; involved in the second step in mevalonate biosynthesis -S000030789 CDS YML126C 13 20535 19060 C 2011-02-03 1996-07-31 -S000004594 ORF Verified YML125C PGA3 cytochrome-b5 reductase|NQR1 chromosome 13 13 21699 20761 C 2011-02-03 1996-07-31 Putative cytochrome b5 reductase, localized to the plasma membrane; may be involved in regulation of lifespan; required for maturation of Gas1p and Pho8p, proposed to be involved in protein trafficking; PGA3 has a paralog, AIM33, that arose from the whole genome duplication -S000037858 CDS YML125C 13 21699 20761 C 2011-02-03 1996-07-31 -S000004593 ORF Verified YML124C TUB3 alpha-tubulin TUB3 chromosome 13 L000002389 13 23683 22048 C -101 2011-02-03 1996-07-31 Alpha-tubulin; associates with beta-tubulin (Tub2p) to form tubulin dimer, which polymerizes to form microtubules; expressed at lower level than Tub1p; TUB3 has a paralog, TUB1, that arose from the whole genome duplication -S000037763 CDS YML124C 13 23360 22048 C 2011-02-03 1996-07-31 -S000037762 CDS YML124C 13 23683 23659 C 2011-02-03 1996-07-31 -S000037764 intron YML124C 13 23658 23361 C 2011-02-03 1996-07-31 -S000004592 ORF Verified YML123C PHO84 phosphate transporter PHO84|phoT chromosome 13 L000001430 13 25800 24037 C -100.5 2011-02-03 1996-07-31 High-affinity inorganic phosphate (Pi) transporter; also low-affinity manganese transporter; regulated by Pho4p and Spt7p; mutation confers resistance to arsenate; exit from the ER during maturation requires Pho86p; cells overexpressing Pho84p accumulate heavy metals but do not develop symptoms of metal toxicity -S000037701 CDS YML123C 13 25800 24037 C 2011-02-03 1996-07-31 -S000004591 ORF Uncharacterized YML122C chromosome 13 13 26418 26038 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YML122C is not an essential gene -S000036933 CDS YML122C 13 26418 26038 C 2011-02-03 1996-07-31 -S000004590 ORF Verified YML121W GTR1 Rag GTPase GTR1 chromosome 13 L000000742 13 26930 27862 W -99.6 1996-07-31 1996-07-31 Subunit of a TORC1-stimulating GTPase complex; subunit of the heterodimeric Gtr1-Gtr2 GTPase complex that stimulates TORC1 in response to amino acid stimulation; tethered to the vacuolar membrane as part of the EGOC, a complex required for sorting of Gap1p and microautophagy; involved in phosphate transport and telomeric chromatin silencing; activated by the the Iml1p (GAP) subunit of the SEACIT complex; similar to human RagA and RagB -S000036898 CDS YML121W 13 26930 27862 W 1996-07-31 1996-07-31 -S000004589 ORF Verified YML120C NDI1 NADH-ubiquinone reductase (H(+)-translocating) NDI1 chromosome 13 L000001239 13 29807 28266 C 1996-07-31 1996-07-31 NADH:ubiquinone oxidoreductase; transfers electrons from NADH to ubiquinone in respiratory chain but does not pump protons, in contrast to higher eukaryotic multisubunit respiratory complex I; upon apoptotic stress, is activated in mitochondria by N-terminal cleavage, then translocates to cytoplasm to induce apoptosis; homolog of human AIFM2; yeast NDI1 complements several phenotypes of human cell line with mutated MT-ND4, implicated in Leber hereditary optic neuropathy -S000036805 CDS YML120C 13 29807 28266 C 1996-07-31 1996-07-31 -S000004588 ORF Uncharacterized YML119W chromosome 13 13 30611 31684 W 1996-07-31 1996-07-31 Putative protein of unknown function; YML119W is not an essential gene; potential Cdc28p substrate -S000035884 CDS YML119W 13 30611 31684 W 1996-07-31 1996-07-31 -S000118365 ARS ARS1303 ARSXIII-32 chromosome 13 13 31766 31835 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000004587 ORF Verified YML118W NGL3 3'-5' poly(A) RNA exonuclease chromosome 13 13 32334 33851 W 1996-07-31 1996-07-31 3'-5' exonuclease specific for poly-A RNAs; has a domain similar to a magnesium-dependent endonuclease motif in mRNA deadenylase Ccr4p; similar to Ngl1p; NGL3 has a paralog, NGL2, that arose from the whole genome duplication -S000034970 CDS YML118W 13 32334 33851 W 1996-07-31 1996-07-31 -S000004585 ORF Verified YML117W NAB6 chromosome 13 13 34243 37647 W 1996-07-31 1996-07-31 Putative RNA-binding protein; associates with mRNAs encoding cell wall proteins in high-throughput studies; deletion mutants display increased sensitivity to some cell wall disrupting agents; expression negatively regulated by cAMP -S000034816 CDS YML117W 13 34243 37647 W 1996-07-31 1996-07-31 -S000004586 ORF Dubious YML116W-A YML117W-A chromosome 13 13 37472 37774 W 1996-07-31 1996-07-31 Putative protein of unknown function -S000031380 CDS YML116W-A 13 37472 37774 W 1996-07-31 1996-07-31 -S000004584 ORF Verified YML116W ATR1 borate transporter|SNQ1 chromosome 13 L000001956|L000002831 13 38196 39824 W 1996-07-31 1996-07-31 Multidrug efflux pump of the major facilitator superfamily; required for resistance to aminotriazole and 4-nitroquinoline-N-oxide; ATR1 has a paralog, YMR279C, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000034666 CDS YML116W 13 38196 39824 W 1996-07-31 1996-07-31 -S000130187 ARS ARS1304 chromosome 13 13 39824 40187 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000178150 ARS_consensus_sequence ARS1304 13 40149 40133 C 2014-11-18 2014-11-18 -S000004583 ORF Verified YML115C VAN1 LDB13|VRG8|VRG7 chromosome 13 L000002453 13 41794 40187 C 38 1996-07-31 1996-07-31 Component of the mannan polymerase I; complex contains Van1p and Mnn9p and is involved in the first steps of mannan synthesis; mutants are vanadate-resistant -S000033712 CDS YML115C 13 41794 40187 C 1996-07-31 1996-07-31 -S000004582 ORF Verified YML114C TAF8 TafII65|TAF65 chromosome 13 13 43575 42043 C 1996-07-31 1996-07-31 TFIID subunit (65 kDa); involved in RNA polymerase II transcription initiation -S000033619 CDS YML114C 13 43575 42043 C 1996-07-31 1996-07-31 -S000004581 ORF Verified YML113W DAT1 chromosome 13 L000000485 13 44045 44791 W 1996-07-31 1996-07-31 DNA binding protein that recognizes oligo(dA).oligo(dT) tracts; Arg side chain in its N-terminal pentad Gly-Arg-Lys-Pro-Gly repeat is required for DNA-binding; relocalizes to the cytosol in response to hypoxia; not essential for viability -S000033570 CDS YML113W 13 44045 44791 W 1996-07-31 1996-07-31 -S000004580 ORF Verified YML112W CTK3 chromosome 13 L000003012 13 45063 45953 W 1996-07-31 1996-07-31 Gamma subunit of C-terminal domain kinase I; CTDK-I phosphorylates RNA polymerase II subunit Rpo21p to affect transcription and pre-mRNA 3' end processing, and also phosphorylates ribosomal protein Rps2p to increase translational fidelity; protein abundance increases in response to DNA replication stress -S000032868 CDS YML112W 13 45063 45953 W 1996-07-31 1996-07-31 -S000004579 ORF Verified YML111W BUL2 ubiquitin-ubiquitin ligase BUL2 chromosome 13 L000004755 13 46942 49704 W 1996-07-31 1996-07-31 Component of the Rsp5p E3-ubiquitin ligase complex; involved in intracellular amino acid permease sorting, functions in heat shock element mediated gene expression, essential for growth in stress conditions; BUL2 has a paralog, BUL1, that arose from the whole genome duplication -S000032740 CDS YML111W 13 46942 49704 W 1996-07-31 1996-07-31 -S000004578 ORF Verified YML110C COQ5 2-hexaprenyl-6-methoxy-1,4-benzoquinone methyltransferase|DBI56 chromosome 13 L000003398 13 50954 50031 C 1996-07-31 1996-07-31 2-hexaprenyl-6-methoxy-1,4-benzoquinone methyltransferase; involved in ubiquinone (Coenzyme Q) biosynthesis; localizes to the matrix face of the mitochondrial inner membrane in a large complex with other ubiquinone biosynthetic enzymes; respiratory defect of the null mutant is partially complemented by human COQ5 -S000032570 CDS YML110C 13 50954 50031 C 1996-07-31 1996-07-31 -S000004577 ORF Verified YML109W ZDS2 CES4 chromosome 13 L000003287 13 51640 54468 W 1996-07-31 1996-07-31 Protein with a role in regulating Swe1p-dependent polarized growth; involved in maintenance of Cdc55p in the cytoplasm where it promotes mitotic entry; interacts with silencing proteins at the telomere; implicated in the mitotic exit network through regulation of Cdc14p localization; ZDS2 has a paralog, ZDS1, that arose from the whole genome duplication -S000031758 CDS YML109W 13 51640 54468 W 1996-07-31 1996-07-31 -S000004576 ORF Verified YML108W chromosome 13 13 54793 55110 W 1996-07-31 1996-07-31 Protein of unknown function; structure defines a new subfamily of the split beta-alpha-beta sandwiches; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YML108W is not an essential gene; relative distribution to the nucleus increases upon DNA replication stress -S000031668 CDS YML108W 13 54793 55110 W 1996-07-31 1996-07-31 -S000004575 ORF Verified YML107C PML39 chromosome 13 13 56269 55265 C 2003-09-22 2003-09-22|1996-07-31 Protein required for nuclear retention of unspliced pre-mRNAs; required along with Mlp1p and Pml1p; anchored to nuclear pore complex via Mlp1p and Mlp2p; found with the subset of nuclear pores farthest from the nucleolus; may interact with ribosomes -S000031517 CDS YML107C 13 56269 55265 C 2003-09-22 2003-09-22|1996-07-31 -S000004574 ORF Verified YML106W URA5 orotate phosphoribosyltransferase URA5|PYR5 chromosome 13 L000002434 13 56773 57453 W 1996-07-31 1996-07-31 Major orotate phosphoribosyltransferase (OPRTase) isozyme; catalyzes the fifth enzymatic step in de novo biosynthesis of pyrimidines, converting orotate into orotidine-5'-phosphate; URA5 has a paralog, URA10, that arose from the whole genome duplication -S000030709 CDS YML106W 13 56773 57453 W 1996-07-31 1996-07-31 -S000004573 ORF Verified YML105C SEC65 RNA-binding signal recognition particle subunit SEC65 chromosome 13 L000001855 13 58687 57866 C 1996-07-31 1996-07-31 Subunit of the signal recognition particle (SRP); involved in protein targeting to the ER; interacts with Srp54p; homolog of mammalian SRP19 -S000030552 CDS YML105C 13 58687 57866 C 1996-07-31 1996-07-31 -S000004572 ORF Verified YML104C MDM1 chromosome 13 L000001051 13 62322 58939 C 1996-07-31 1996-07-31 PtdIns-3-P binding protein that tethers the ER to vacuoles at NVJs; anchored in the ER membrane at nucleus-vacuole junctions and binds phosphatidylinositol 3-phosphate (PtdIns-3-P) in the vacuolar membrane via its Phox homology (PX) domain; expressed predominantly in late G1 to early S phase of the cell cycle; mutation affects nuclear and mitochondrial transmission to daughter buds; similar to 4 human genes, one of which (SNX14) is associated with neurological disease -S000030408 CDS YML104C 13 62322 58939 C 1996-07-31 1996-07-31 -S000004571 ORF Verified YML103C NUP188 chromosome 13 L000003099 13 67549 62582 C 1996-07-31 1996-07-31 Subunit of the inner ring of the nuclear pore complex (NPC); contributes to NPC organization and nucleocytoplasmic transport; homologous to human NUP188 -S000037631 CDS YML103C 13 67549 62582 C 1996-07-31 1996-07-31 -S000081376 snoRNA_gene snR85 SNR85 chromosome 13 13 67938 67768 C 2006-01-24 2006-01-24 H/ACA box small nucleolar RNA (snoRNA); predicted to guide pseudouridylation of small subunit (SSU) rRNA at position U1181 -S000114174 noncoding_exon snR85 13 67938 67768 C 2006-01-24 2006-01-24 -S000004570 ORF Verified YML102W CAC2 chromosome 13 L000003389 13 68294 69700 W 1996-07-31 1996-07-31 Subunit of chromatin assembly factor I (CAF-1), with Rlf2p and Msi1p; chromatin assembly by CAF-1 is important for multiple processes including silencing at telomeres, mating type loci, and rDNA; maintenance of kinetochore structure, deactivation of the DNA damage checkpoint after DNA repair, chromatin dynamics during transcription; and repression of divergent transcription; relocalizes to the cytosol in response to hypoxia -S000037576 CDS YML102W 13 68294 69700 W 1996-07-31 1996-07-31 -S000004569 ORF Dubious YML101C-A YML102C-A chromosome 13 13 69726 69409 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032439 CDS YML101C-A 13 69726 69409 C 1996-07-31 1996-07-31 -S000004568 ORF Verified YML101C CUE4 chromosome 13 13 70088 69735 C 1996-07-31 1996-07-31 Protein of unknown function; has a CUE domain that binds ubiquitin, which may facilitate intramolecular monoubiquitination; CUE4 has a paralog, CUE1, that arose from the whole genome duplication -S000037386 CDS YML101C 13 70088 69735 C 1996-07-31 1996-07-31 -S000028688 ORF Uncharacterized YML100W-A chromosome 13 13 70138 70311 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032567 CDS YML100W-A 13 70138 70311 W 2003-07-29 2003-07-29 -S000004566 ORF Verified YML100W TSL1 trehalose 6-phosphate synthase/phosphatase complex subunit chromosome 13 L000002361 13 70624 73920 W 1996-07-31 1996-07-31 Large subunit of trehalose 6-phosphate synthase/phosphatase complex; Tps1p-Tps2p complex converts uridine-5'-diphosphoglucose and glucose 6-phosphate to trehalose; contributes to survival to acute lethal heat stress; mutant has aneuploidy tolerance; protein abundance increases in response to DNA replication stress; TSL1 has a paralog, TPS3, that arose from the whole genome duplication -S000036726 CDS YML100W 13 70624 73920 W 1996-07-31 1996-07-31 -S000004567 ORF Dubious YML099W-A YML100W-A chromosome 13 13 74229 74558 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF ARG81/YML099C -S000037139 CDS YML099W-A 13 74229 74558 W 1996-07-31 1996-07-31 -S000004565 ORF Verified YML099C ARG81 ARGRII|ARGR2 chromosome 13 L000000114|L000000113 13 77040 74398 C -63 1996-07-31 1996-07-31 Zinc finger transcription factor involved in arginine-responsive genes; Zn(2)-Cys(6) binuclear cluster domain type; involved in the regulation of arginine-responsive genes; acts with Arg80p and Arg82p -S000032192 CDS YML099C 13 77040 74398 C 1996-07-31 1996-07-31 -S000004564 ORF Verified YML098W TAF13 TafII19|TAF19|FUN81 chromosome 13 L000000650 13 77267 77770 W -63 1996-07-31 1996-07-31 TFIID subunit (19 kDa); involved in RNA polymerase II transcription initiation, similar to histone H4 with atypical histone fold motif of Spt3-like transcription factors -S000032162 CDS YML098W 13 77267 77770 W 1996-07-31 1996-07-31 -S000004563 ORF Verified YML097C VPS9 guanine nucleotide exchange factor VPS9|VPT9|VPL31 chromosome 13 L000002659 13 79690 78335 C 1996-07-31 1996-07-31 Guanine nucleotide exchange factor (GEF) and ubiquitin receptor; involved in vesicle-mediated vacuolar transport, including Golgi-endosome trafficking and sorting through the multivesicular body (MVB); stimulates the intrinsic guanine nucleotide exchange activity of Rab family members (Vps21p/Ypt52p/Ypt53p); partially redundant with GEF MUK1; required for localization of the CORVET complex to endosomes; similar to mammalian ras inhibitors; contains a Ub-interacting CUE domain -S000031138 CDS YML097C 13 79690 78335 C 1996-07-31 1996-07-31 -S000004562 ORF Uncharacterized YML096W putative asparagine synthase chromosome 13 13 79909 81486 W 1996-07-31 1996-07-31 Putative protein with similarity to asparagine synthetases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YML096W is not an essential gene and partially overlaps the verified gene RAD10 -S000031103 CDS YML096W 13 79909 81486 W 1996-07-31 1996-07-31 -S000004560 ORF Verified YML095C RAD10 chromosome 13 L000001563 13 82113 81481 C 48 1996-07-31 1996-07-31 Single-stranded DNA endonuclease (with Rad1p); cleaves single-stranded DNA during nucleotide excision repair and double-strand break repair; subunit of Nucleotide Excision Repair Factor 1 (NEF1); homolog of human ERCC1 protein -S000030965 CDS YML095C 13 82113 81481 C 1996-07-31 1996-07-31 -S000004559 ORF Verified YML094W GIM5 PFD5 chromosome 13 L000004370 13 82275 82849 W 1996-07-31 1996-07-31 Subunit of the heterohexameric cochaperone prefoldin complex; prefoldin binds specifically to cytosolic chaperonin and transfers target proteins to it; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation -S000030920 CDS YML094W 13 82275 82290 W 1996-07-31 1996-07-31 -S000030921 CDS YML094W 13 82374 82849 W 1996-07-31 1996-07-31 -S000030922 intron YML094W 13 82291 82373 W 1996-07-31 1996-07-31 -S000004561 ORF Dubious YML094C-A YML095C-A chromosome 13 13 82620 82219 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene GIM5/YML094W; deletion confers sensitivity to GSAO -S000032030 CDS YML094C-A 13 82620 82219 C 1996-07-31 1996-07-31 -S000004558 ORF Verified YML093W UTP14 chromosome 13 13 83090 85789 W 1996-07-31 1996-07-31 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit -S000029918 CDS YML093W 13 83090 85789 W 1996-07-31 1996-07-31 -S000004557 ORF Verified YML092C PRE8 proteasome core particle subunit alpha 2 chromosome 13 L000002700 13 86739 85987 C 1996-07-31 1996-07-31 Alpha 2 subunit of the 20S proteasome -S000037849 CDS YML092C 13 86739 85987 C 1996-07-31 1996-07-31 -S000004556 ORF Verified YML091C RPM2 ribonuclease P chromosome 13 L000001743 13 90731 87123 C 1996-07-31 1996-07-31 Protein subunit of mitochondrial RNase P; has roles in nuclear transcription, cytoplasmic and mitochondrial RNA processing, and mitochondrial translation; distributed to mitochondria, cytoplasmic processing bodies, and the nucleus -S000036004 CDS YML091C 13 90731 87123 C 1996-07-31 1996-07-31 -S000004555 ORF Dubious YML090W chromosome 13 13 90744 91130 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YML089C; exhibits growth defect on a non-fermentable (respiratory) carbon source -S000035949 CDS YML090W 13 90744 91130 W 1996-07-31 1996-07-31 -S000004554 ORF Dubious YML089C chromosome 13 13 91409 91041 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; expression induced by calcium shortage -S000036274 CDS YML089C 13 91409 91041 C 1996-07-31 1996-07-31 -S000077071 ncRNA_gene ZOD1 ZOD1 chromosome 13 13 91970 92027 W 2014-11-18 2014-11-18 tDNA relic, ancient tDNA for tRNA-Ile; weakly transcribed by RNA polymerase III; located upstream of UFO1; associated with components of the Pol III machinery: Tfc4p, Brf1p, Bdp1, and Rpc34p -S000178148 noncoding_exon ZOD1 13 91970 92027 W 2014-11-18 2014-11-18 -S000004553 ORF Verified YML088W UFO1 SCF ubiquitin ligase complex subunit UFO1 chromosome 13 13 92235 94241 W 1996-07-31 1996-07-31 F-box receptor protein; subunit of the Skp1-Cdc53-F-box receptor (SCF) E3 ubiquitin ligase complex; binds to phosphorylated Ho endonuclease, allowing its ubiquitination by SCF and subsequent degradation -S000036233 CDS YML088W 13 92235 94241 W 1996-07-31 1996-07-31 -S000118366 ARS ARS1305 ARSXIII-94 chromosome 13 13 94217 94463 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000004552 ORF Verified YML087C AIM33 cytochrome-b5 reductase chromosome 13 13 95369 94431 C 1996-07-31 1996-07-31 Protein of unknown function, highly conserved across species; homolog of human CYB5R4; null mutant displays reduced frequency of mitochondrial genome loss; AIM33 has a paralog, PGA3, that arose from the whole genome duplication -S000036086 CDS YML087C 13 95369 94431 C 1996-07-31 1996-07-31 -S000004551 ORF Verified YML086C ALO1 D-arabinono-1,4-lactone oxidase chromosome 13 L000004264 13 97371 95791 C 1996-07-31 1996-07-31 D-Arabinono-1,4-lactone oxidase; catalyzes the final step in biosynthesis of dehydro-D-arabinono-1,4-lactone, which is protective against oxidative stress -S000036007 CDS YML086C 13 97371 95791 C 1996-07-31 1996-07-31 -S000004550 ORF Verified YML085C TUB1 alpha-tubulin TUB1 chromosome 13 L000002387 13 99400 97941 C -62 1996-07-31 1996-07-31 Alpha-tubulin; associates with beta-tubulin (Tub2p) to form tubulin dimer, which polymerizes to form microtubules; relative distribution to nuclear foci increases upon DNA replication stress; TUB1 has a paralog, TUB3, that arose from the whole genome duplication -S000035128 CDS YML085C 13 99259 97941 C 1996-07-31 1996-07-31 -S000035127 CDS YML085C 13 99400 99376 C 1996-07-31 1996-07-31 -S000035129 intron YML085C 13 99375 99260 C 1996-07-31 1996-07-31 -S000004549 ORF Dubious YML084W chromosome 13 13 99489 99797 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035047 CDS YML084W 13 99489 99797 W 1996-07-31 1996-07-31 -S000004548 ORF Verified YML083C chromosome 13 13 101050 99794 C 1996-07-31 1996-07-31 Protein of unknown function; transcriptionally regulated by Upc2p via an upstream sterol response element; strong increase in transcript abundance during anaerobic growth compared to aerobic growth; cells deleted for YML083C do not exhibit growth defects in anerobic or anaerobic conditions -S000034849 CDS YML083C 13 101050 99794 C 1996-07-31 1996-07-31 -S000004547 ORF Uncharacterized YML082W putative cystathionine gamma-synthase chromosome 13 13 101862 103811 W 1996-07-31 1996-07-31 Putative protein predicted to have carbon-sulfur lyase activity; transcriptionally regulated by Upc2p via an upstream sterol response element; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and the cytoplasm; not an essential gene; YML082W has a paralog, STR2, that arose from the whole genome duplication -S000034791 CDS YML082W 13 101862 103811 W 1996-07-31 1996-07-31 -S000007247 ORF Verified YML081C-A ATP18 F1F0 ATP synthase subunit i chromosome 13 L000004548 13 104162 103983 C 1997-07-17 1997-07-17 Subunit of the mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; termed subunit I or subunit j; does not correspond to known ATP synthase subunits in other organisms -S000032427 CDS YML081C-A 13 104162 103983 C 1997-07-17 1997-07-17 -S000004546 ORF Verified YML081W TDA9 AAF1 chromosome 13 13 104777 108532 W 1996-07-31 1996-07-31 Transcription factor that regulates acetate production; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; null mutant is sensitive to expression of the top1-T722A allele; not an essential gene; TDA9 has a paralog, RSF2, that arose from the whole genome duplication -S000033928 CDS YML081W 13 104777 108532 W 1996-07-31 1996-07-31 -S000004545 ORF Verified YML080W DUS1 tRNA dihydrouridine synthase chromosome 13 13 108806 110077 W 1996-07-31 1996-07-31 Dihydrouridine synthase; member of a widespread family of conserved proteins including Smm1p, Dus3p, and Dus4p; modifies pre-tRNA(Phe) at U17 -S000033787 CDS YML080W 13 108806 110077 W 1996-07-31 1996-07-31 -S000004544 ORF Uncharacterized YML079W chromosome 13 13 110247 110852 W 1996-07-31 1996-07-31 Non-essential protein of unknown function; has structural resemblance to plant storage and ligand binding proteins (canavalin, glycinin, auxin binding protein) and to some enzymes (epimerase, germin); localizes to the nucleus and cytoplasm -S000031763 CDS YML079W 13 110247 110852 W 1996-07-31 1996-07-31 -S000004543 ORF Verified YML078W CPR3 peptidylprolyl isomerase CPR3|CYP3 chromosome 13 L000000464|L000000402 13 111002 111550 W 1996-07-31 1996-07-31 Mitochondrial peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; involved in protein refolding after import into mitochondria -S000031645 CDS YML078W 13 111002 111550 W 1996-07-31 1996-07-31 -S000004542 ORF Verified YML077W BET5 TRAPP subunit BET5 chromosome 13 L000004608 13 111865 112344 W 1996-07-31 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factors for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); human homology TRAPPC1 complements yeast null mutant -S000031560 CDS YML077W 13 111865 112344 W 1996-07-31 1996-07-31 -S000004541 ORF Verified YML076C WAR1 chromosome 13 13 115347 112513 C 1996-07-31 1996-07-31 Homodimeric Zn2Cys6 zinc finger transcription factor; binds to a weak acid response element to induce transcription of PDR12 and FUN34, encoding an acid transporter and a putative ammonia transporter, respectively -S000030680 CDS YML076C 13 115347 112513 C 1996-07-31 1996-07-31 -S000004540 ORF Verified YML075C HMG1 hydroxymethylglutaryl-CoA reductase (NADPH) HMG1 chromosome 13 L000000789 13 118898 115734 C -50 1996-07-31 1996-07-31 HMG-CoA reductase; catalyzes conversion of HMG-CoA to mevalonate, which is a rate-limiting step in sterol biosynthesis; one of two isozymes; localizes to nuclear envelope; overproduction induces formation of karmellae; forms foci at nuclear periphery upon DNA replication stress; HMG1 has a paralog, HMG2, that arose from the whole genome duplication; human homolog HMGCR can complement yeast hmg1 mutant -S000030566 CDS YML075C 13 118898 115734 C 1996-07-31 1996-07-31 -S000004539 ORF Verified YML074C FPR3 peptidylprolyl isomerase FPR3|NPI46 chromosome 13 L000001268 13 121324 120089 C 1996-07-31 1996-07-31 Nucleolar peptidyl-prolyl cis-trans isomerase (PPIase); FK506 binding protein; affects expression of multiple genes via its role in nucleosome assembly; phosphorylated by casein kinase II (Cka1p-Cka2p-Ckb1p-Ckb2p) and dephosphorylated by Ptp1p; PPIase domain acts as a transcriptional repressor when tethered to DNA by lexA, and repressor activity is dependent on PPIase activity; FPR3 has a paralog, FPR4, that arose from the whole genome duplication -S000030502 CDS YML074C 13 121324 120089 C 1996-07-31 1996-07-31 -S000004538 ORF Verified YML073C RPL6A eL6|ribosomal 60S subunit protein L6A|L6e|rp18|YL16|L6A|L17A|YL16A chromosome 13 L000004165 13 124172 123227 C 1996-07-31 1996-07-31 Ribosomal 60S subunit protein L6A; N-terminally acetylated; binds 5.8S rRNA; homologous to mammalian ribosomal protein L6, no bacterial homolog; RPL6A has a paralog, RPL6B, that arose from the whole genome duplication -S000037684 CDS YML073C 13 123742 123227 C 1996-07-31 1996-07-31 -S000037683 CDS YML073C 13 124172 124158 C 1996-07-31 1996-07-31 -S000037685 intron YML073C 13 124157 123743 C 1996-07-31 1996-07-31 -S000004537 ORF Verified YML072C TCB3 chromosome 13 13 129367 124730 C 1996-07-31 1996-07-31 Cortical ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to the plasma membrane (PM) and regulate PM phosphatidylinositol-4-phosphate (PI4P) levels by controlling access of Sac1p phosphatase to its substrate PI4P in the PM; localized to the bud via specific mRNA transport; non-tagged protein detected in a phosphorylated state in mitochondria; C-termini of Tcb1p, Tcb2p and Tcb3p interact -S000037588 CDS YML072C 13 129367 124730 C 1996-07-31 1996-07-31 -S000004536 ORF Verified YML071C COG8 Golgi transport complex subunit COG8|DOR1 chromosome 13 13 131572 129749 C 1996-07-31 1996-07-31 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000037526 CDS YML071C 13 131572 129749 C 1996-07-31 1996-07-31 -S000006718 tRNA_gene tR(UCU)M2 chromosome 13 L000003686 13 131896 131825 C 2000-05-19 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000031505 noncoding_exon tR(UCU)M2 13 131896 131825 C 2000-05-19 2000-05-19 -S000007101 long_terminal_repeat YMLCdelta1 chromosome 13 13 132321 131989 C 2000-05-19 2000-05-19 Ty1 LTR -S000004535 ORF Verified YML070W DAK1 dihydroxyacetone kinase chromosome 13 L000004203 13 133475 135229 W 1996-07-31 1996-07-31 Dihydroxyacetone kinase; required for detoxification of dihydroxyacetone (DHA); involved in stress adaptation -S000037490 CDS YML070W 13 133475 135229 W 1996-07-31 1996-07-31 -S000004534 ORF Verified YML069W POB3 FACT complex subunit POB3 chromosome 13 L000003326 13 135500 137158 W 1996-07-31 1996-07-31 Subunit of the heterodimeric FACT complex (Spt16p-Pob3p); FACT associates with chromatin via interaction with Nhp6Ap and Nhp6Bp, and reorganizes nucleosomes to facilitate access to DNA by RNA and DNA polymerases; protein abundance increases in response to DNA replication stress -S000036481 CDS YML069W 13 135500 137158 W 1996-07-31 1996-07-31 -S000118367 ARS ARS1307 ARSXIII-137 chromosome 13 13 137300 137548 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178151 ARS_consensus_sequence ARS1307 13 137321 137337 W 2014-11-18 2014-11-18 -S000004533 ORF Verified YML068W ITT1 chromosome 13 13 137550 138944 W 1996-07-31 1996-07-31 Protein that modulates the efficiency of translation termination; interacts with translation release factors eRF1 (Sup45p) and eRF3 (Sup35p) in vitro, contains a zinc finger domain characteristic of the TRIAD class of proteins -S000036418 CDS YML068W 13 137550 138944 W 1996-07-31 1996-07-31 -S000004532 ORF Verified YML067C ERV41 chromosome 13 13 140214 139063 C 1996-07-31 1996-07-31 Protein localized to COPII-coated vesicles; forms a complex with Erv46p; involved in the membrane fusion stage of transport; has homology to human ERGIC2 (PTX1) protein -S000035439 CDS YML067C 13 140090 139063 C 1996-07-31 1996-07-31 -S000035438 CDS YML067C 13 140214 140184 C 1996-07-31 1996-07-31 -S000035440 intron YML067C 13 140183 140091 C 1996-07-31 1996-07-31 -S000004531 ORF Verified YML066C SMA2 chromosome 13 13 141533 140424 C 1996-07-31 1996-07-31 Meiosis-specific prospore membrane protein; required to produce bending force necessary for proper assembly of the prospore membrane during sporulation -S000035365 CDS YML066C 13 141533 140424 C 1996-07-31 1996-07-31 -S000004530 ORF Verified YML065W ORC1 origin recognition complex subunit 1 chromosome 13 L000003162 13 142210 144954 W 1996-07-31 1996-07-31 Largest subunit of the origin recognition complex; involved in directing DNA replication by binding to replication origins; also involved in transcriptional silencing; exhibits ATPase activity; ORC1 has a paralog, SIR3, that arose from the whole genome duplication -S000035334 CDS YML065W 13 142210 144954 W 1996-07-31 1996-07-31 -S000004529 ORF Verified YML064C TEM1 Ras family GTPase TEM1 chromosome 13 L000002282 13 145876 145139 C 1996-07-31 1996-07-31 GTP-binding protein of the Ras superfamily; involved in termination of M-phase; controls actomyosin and septin dynamics during cytokinesis -S000035202 CDS YML064C 13 145876 145139 C 1996-07-31 1996-07-31 -S000004528 ORF Verified YML063W RPS1B eS1|ribosomal 40S subunit protein S1B|S1e|rp10B|S1B|RP10B|PLC2 chromosome 13 L000001665 13 146482 147249 W 1996-07-31 1996-07-31 Ribosomal protein 10 (rp10) of the small (40S) subunit; homologous to mammalian ribosomal protein S3A, no bacterial homolog; RPS1B has a paralog, RPS1A, that arose from the whole genome duplication -S000035158 CDS YML063W 13 146482 147249 W 1996-07-31 1996-07-31 -S000004527 ORF Verified YML062C MFT1 MFT52 chromosome 13 L000001099 13 148683 147505 C 1996-07-31 1996-07-31 Subunit of the THO complex; THO is a nuclear complex comprised of Hpr1p, Mft1p, Rlr1p, and Thp2p, that is involved in transcription elongation and mitotic recombination; involved in telomere maintenance -S000034129 CDS YML062C 13 148683 147505 C 1996-07-31 1996-07-31 -S000004526 ORF Verified YML061C PIF1 DNA helicase PIF1|TST1 chromosome 13 L000001435 13 151532 148953 C 1996-07-31 1996-07-31 DNA helicase, potent G-quadruplex DNA binder/unwinder; possesses strand annealing activity; promotes DNA synthesis during break-induced replication; important for crossover recombination; translation from different start sites produces mitochondrial and nuclear forms; nuclear form is a catalytic inhibitor of telomerase; mitochondrial form involved in DNA repair and recombination; mutations affect Zn, Fe homeostasis; regulated by Rad53p-dependent phosphorylation in rho0 cells -S000034029 CDS YML061C 13 151532 148953 C 1996-07-31 1996-07-31 -S000004525 ORF Verified YML060W OGG1 8-oxoguanine glycosylase OGG1 chromosome 13 L000003339 13 151871 153001 W 1996-07-31 1996-07-31 Nuclear and mitochondrial glycosylase/lyase; specifically excises 7,8-dihydro-8-oxoguanine residues located opposite cytosine or thymine residues in DNA, repairs oxidative damage to mitochondrial DNA, contributes to UVA resistance -S000033997 CDS YML060W 13 151871 153001 W 1996-07-31 1996-07-31 -S000004524 ORF Verified YML059C NTE1 lysophospholipase chromosome 13 13 158258 153219 C 1996-07-31 1996-07-31 Serine esterase; homolog of human neuropathy target esterase (NTE); Nte1p-mediated phosphatidylcholine turnover influences transcription factor Opi1p localization, affecting transcriptional regulation of phospholipid biosynthesis genes -S000032143 CDS YML059C 13 158258 153219 C 1996-07-31 1996-07-31 -S000007472 ORF Verified YML058W-A HUG1 chromosome 13 L000004561 13 158760 158966 W 1998-11-10 1998-11-10 Ribonucleotide reductase inhibitor; intrinsically disordered protein that binds to and inhibits Rnr2p; involved in the Mec1p-mediated checkpoint pathway; transcription is induced by genotoxic stress and by activation of the Rad53p pathway; protein abundance increases in response to DNA replication stress -S000030950 CDS YML058W-A 13 158760 158966 W 1998-11-10 1998-11-10 -S000178152 ARS ARS1307.5 chromosome 13 13 158887 159277 2014-11-18 2014-11-18 Autonomously replicating sequence -S000178153 ARS_consensus_sequence ARS1307.5 13 159046 159062 W 2014-11-18 2014-11-18 -S000004523 ORF Verified YML058W SML1 ribonucleotide reductase inhibiting protein SML1 chromosome 13 L000004580 13 159383 159697 W 1996-07-31 1996-07-31 Ribonucleotide reductase inhibitor; involved in regulating dNTP production; regulated by Mec1p and Rad53p during DNA damage and S phase; SML1 has a paralog, DIF1, that arose from the whole genome duplication -S000032114 CDS YML058W 13 159383 159697 W 1996-07-31 1996-07-31 -S000004521 ORF Verified YML057W CMP2 calcineurin catalytic subunit A|CNA2 chromosome 13 L000000368 13 160180 161994 W 1996-07-31 1996-07-31 Calcineurin A; one isoform (the other is Cna1p) of the catalytic subunit of calcineurin, a Ca++/calmodulin-regulated protein phosphatase which regulates Crz1p (a stress-response transcription factor), the other calcineurin subunit is CNB1; regulates the function of Aly1p alpha-arrestin; CMP2 has a paralog, CNA1, that arose from the whole genome duplication -S000032034 CDS YML057W 13 160180 161994 W 1996-07-31 1996-07-31 -S000004522 ORF Dubious YML057C-A YML058C-A chromosome 13 13 160412 160023 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene CMP2/YML057W -S000036471 CDS YML057C-A 13 160412 160023 C 1996-07-31 1996-07-31 -S000006445 snoRNA_gene snR54 SNR54 chromosome 13 L000004523 13 163620 163535 C 2000-05-19 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A974 -S000030738 noncoding_exon snR54 13 163620 163535 C 2000-05-19 2000-05-19 -S000004520 ORF Verified YML056C IMD4 IMP dehydrogenase IMD4 chromosome 13 13 164176 162194 C 1996-07-31 1996-07-31 Inosine monophosphate dehydrogenase; catalyzes the rate-limiting step in the de novo synthesis of GTP; member of a four-gene family in S. cerevisiae, constitutively expressed; IMD4 has a paralog, IMD3, that arose from the whole genome duplication -S000031022 CDS YML056C 13 163308 162194 C 1996-07-31 1996-07-31 -S000031021 CDS YML056C 13 164176 163717 C 1996-07-31 1996-07-31 -S000031023 intron YML056C 13 163716 163309 C 1996-07-31 1996-07-31 -S000004519 ORF Verified YML055W SPC2 signal peptidase complex subunit SPC2|SPY1 chromosome 13 L000002874 13 164790 165326 W 1996-07-31 1996-07-31 Subunit of signal peptidase complex; complex catalyzes cleavage of N-terminal signal sequences of proteins targeted to the secretory pathway; homologous to mammalian SPC25; other members of the complex are Spc1p, Spc1p, and Sec11p -S000030975 CDS YML055W 13 164790 165326 W 1996-07-31 1996-07-31 -S000004518 ORF Verified YML054C CYB2 FCB2 chromosome 13 L000000447 13 167308 165533 C -30 1996-07-31 1996-07-31 Cytochrome b2 (L-lactate cytochrome-c oxidoreductase); component of the mitochondrial intermembrane space, required for lactate utilization; expression is repressed by glucose and anaerobic conditions -S000030874 CDS YML054C 13 167308 165533 C 1996-07-31 1996-07-31 -S000028573 ORF Uncharacterized YML054C-A chromosome 13 13 167781 167623 C 2003-07-29 2003-07-29 Putative protein of unknown function -S000031301 CDS YML054C-A 13 167781 167623 C 2003-07-29 2003-07-29 -S000007102 long_terminal_repeat YMLCdelta2 chromosome 13 13 168681 168349 C 2000-05-19 2000-05-19 Ty2 LTR -S000006783 tRNA_gene tY(GUA)M1 SUP5 chromosome 13 L000003666|L000002184 13 168795 168883 W -34 2000-05-19 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000032294 intron tY(GUA)M1 13 168834 168847 W 2000-05-19 2000-05-19 -S000032292 noncoding_exon tY(GUA)M1 13 168795 168833 W 2000-05-19 2000-05-19 -S000032293 noncoding_exon tY(GUA)M1 13 168848 168883 W 2000-05-19 2000-05-19 -S000004517 ORF Uncharacterized YML053C chromosome 13 13 169754 169116 C 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; overexpression causes a cell cycle delay or arrest; YML053C is not an essential gene -S000030788 CDS YML053C 13 169754 169116 C 1996-07-31 1996-07-31 -S000004516 ORF Verified YML052W SUR7 chromosome 13 L000004152 13 170402 171310 W 1996-07-31 1996-07-31 Plasma membrane protein, component of eisosomes; long-lived protein that remains stable in eisosomes of mother cells while other eisosome proteins, Pil1p and Lsp1p, turn over; may function to anchor the eisosome in place; sporulation and plasma membrane sphingolipid content are altered in mutants; localizes to furrow-like invaginations (MCC patches) -S000037898 CDS YML052W 13 170402 171310 W 1996-07-31 1996-07-31 -S000004515 ORF Verified YML051W GAL80 transcription regulator GAL80 chromosome 13 L000000665 13 171594 172901 W -33 1996-07-31 1996-07-31 Transcriptional regulator involved in the repression of GAL genes; involved in the repression of GAL genes in the absence of galactose; inhibits transcriptional activation by Gal4p; inhibition relieved by Gal3p or Gal1p binding -S000037805 CDS YML051W 13 171594 172901 W 1996-07-31 1996-07-31 -S000004514 ORF Verified YML050W AIM32 chromosome 13 13 173139 174074 W 1996-07-31 1996-07-31 Protein of unknown function; null mutant is viable and displays elevated frequency of mitochondrial genome loss -S000037724 CDS YML050W 13 173139 174074 W 1996-07-31 1996-07-31 -S000004513 ORF Verified YML049C RSE1 U2 snRNP complex subunit RSE1 chromosome 13 L000004030 13 178305 174220 C 1996-07-31 1996-07-31 Protein involved in pre-mRNA splicing; component of the pre-spliceosome; associates with U2 snRNA; involved in ER to Golgi transport -S000036229 CDS YML049C 13 178305 174220 C 1996-07-31 1996-07-31 -S000004511 ORF Verified YML048W GSF2 ECM6 chromosome 13 L000003209 13 178426 179637 W 1996-07-31 1996-07-31 Endoplasmic reticulum (ER) localized integral membrane protein; may promote secretion of certain hexose transporters, including Gal2p; involved in glucose-dependent repression -S000036176 CDS YML048W 13 178426 179637 W 1996-07-31 1996-07-31 -S000004512 ORF Dubious YML047W-A YML048W-A chromosome 13 13 179893 180258 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF PRM6/YML047C -S000031724 CDS YML047W-A 13 179893 180258 W 1996-07-31 1996-07-31 -S000004510 ORF Verified YML047C PRM6 pheromone-regulated K(+) transporter PRM6|KCH2 chromosome 13 13 181075 180017 C 1996-07-31 1996-07-31 Potassium transporter that mediates K+ influx; activates high-affinity Ca2+ influx system (HACS) during mating pheromone response; expression up-regulated in response to alpha factor; regulated by Ste12p during mating; localized to sites of polarized growth; member of a fungal-specific gene family; PRM6 has a paralog, KCH1, that arose from the whole genome duplication -S000035933 CDS YML047C 13 181075 180017 C 1996-07-31 1996-07-31 -S000004509 ORF Verified YML046W PRP39 chromosome 13 L000001511 13 181474 183363 W 1996-07-31 1996-07-31 U1 snRNP protein involved in splicing; contains multiple tetriatricopeptide repeats -S000035883 CDS YML046W 13 181474 183363 W 1996-07-31 1996-07-31 -S000118368 ARS ARS1308 ARSXIII-184 chromosome 13 13 183797 183887 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178154 ARS_consensus_sequence ARS1308 13 183874 183858 C 2014-11-18 2014-11-18 -S000006585 tRNA_gene tG(GCC)M chromosome 13 L000003685 13 183968 183898 C 2000-05-19 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000029832 noncoding_exon tG(GCC)M 13 183968 183898 C 2000-05-19 2000-05-19 -S000007103 long_terminal_repeat YMLWdelta3 chromosome 13 13 184170 184501 W 2000-05-19 2000-05-19 Ty1 LTR -S000007107 LTR_retrotransposon YMLWTy1-1 Ty1 chromosome 13 13 184170 190083 W 2000-05-19 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007381 transposable_element_gene YML045W-A gag protein chromosome 13 13 184461 185783 W 1996-07-31 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000036727 CDS YML045W-A 13 184461 185783 W 1996-07-31 1996-07-31 -S000004508 transposable_element_gene YML045W gag-pol fusion protein chromosome 13 13 184461 189729 W 1996-07-31 1999-07-17|1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034966 CDS YML045W 13 184461 185765 W 1999-07-17 1999-07-17|1996-07-31 -S000034967 CDS YML045W 13 185767 189729 W 1999-07-17 1999-07-17|1996-07-31 -S000034968 plus_1_translational_frameshift YML045W 13 185766 185766 W 1999-07-17 1999-07-17|1996-07-31 -S000007104 long_terminal_repeat YMLWdelta4 chromosome 13 13 189752 190083 W 2000-05-19 2000-05-19 Ty1 LTR -S000004507 ORF Verified YML043C RRN11 chromosome 13 L000004133 13 191767 190244 C 1996-07-31 1996-07-31 Component of the core factor (CF) rDNA transcription factor complex; CF is required for transcription of 35S rRNA genes by RNA polymerase I and is composed of Rrn6p, Rrn7p, and Rrn11p -S000033836 CDS YML043C 13 191767 190244 C 1996-07-31 1996-07-31 -S000004506 ORF Verified YML042W CAT2 carnitine O-acetyltransferase CAT2|YCAT chromosome 13 L000000218 13 192788 194800 W 1996-07-31 1996-07-31 Carnitine acetyl-CoA transferase; present in both mitochondria and peroxisomes; transfers activated acetyl groups to carnitine to form acetylcarnitine which can be shuttled across membranes -S000033788 CDS YML042W 13 192788 194800 W 1996-07-31 1996-07-31 -S000004505 ORF Verified YML041C VPS71 SWC6 chromosome 13 13 195755 194913 C 1996-07-31 1996-07-31 Nucleosome-binding component of the SWR1 complex; SWR1 exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; required for vacuolar protein sorting -S000033617 CDS YML041C 13 195755 194913 C 1996-07-31 1996-07-31 -S000006684 tRNA_gene tP(UGG)M SUF7 chromosome 13 L000002155|L000003684 13 196170 196068 C -32 2000-05-19 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons -S000036019 intron tP(UGG)M 13 196134 196104 C 2000-05-19 2000-05-19 -S000036018 noncoding_exon tP(UGG)M 13 196103 196068 C 2000-05-19 2000-05-19 -S000036017 noncoding_exon tP(UGG)M 13 196170 196135 C 2000-05-19 2000-05-19 -S000007105 long_terminal_repeat YMLWdelta5 chromosome 13 13 196332 196668 W 2000-05-19 2000-05-19 Ty1 LTR -S000007108 LTR_retrotransposon YMLWTy1-2 Ty1 chromosome 13 13 196332 202234 W 2000-05-19 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000004504 transposable_element_gene YML040W gag protein chromosome 13 13 196628 197950 W 1996-07-31 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000033569 CDS YML040W 13 196628 197950 W 1996-07-31 1996-07-31 -S000004503 transposable_element_gene YML039W gag-pol fusion protein chromosome 13 S000029016 13 196628 201896 W 1996-07-31 1999-07-17|1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032892 CDS YML039W 13 196628 197932 W 1999-07-17 1999-07-17|1996-07-31 -S000032893 CDS YML039W 13 197934 201896 W 1999-07-17 1999-07-17|1996-07-31 -S000032894 plus_1_translational_frameshift YML039W 13 197933 197933 W 1999-07-17 1999-07-17|1996-07-31 -S000007106 long_terminal_repeat YMLWdelta6 chromosome 13 13 201919 202234 W 2000-05-19 2000-05-19 Ty1 LTR -S000004502 ORF Verified YML038C YMD8 chromosome 13 13 204103 202775 C 1996-07-31 1996-07-31 Putative nucleotide sugar transporter; has similarity to Vrg4p -S000032731 CDS YML038C 13 204103 202775 C 1996-07-31 1996-07-31 -S000004501 ORF Uncharacterized YML037C chromosome 13 13 205408 204386 C 1996-07-31 1996-07-31 Putative protein of unknown function; has some characteristics of a transcriptional activator; may be a target of Dbf2p-Mob1p kinase; GFP-fusion protein co-localizes with clathrin-coated vesicles; YML037C is not an essential gene -S000031852 CDS YML037C 13 205408 204386 C 1996-07-31 1996-07-31 -S000004500 ORF Verified YML036W CGI121 chromosome 13 13 205642 206293 W 2007-07-10 1996-07-31|2007-07-10 Component of the EKC/KEOPS complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; Cgi121p is dispensable for tRNA modification; other complex members are Bud32p, Kae1p, Pcc1p, and Gon7p -S000031755 CDS YML036W 13 205642 206097 W 2007-07-10 1996-07-31|2007-07-10 -S000123281 CDS YML036W 13 206204 206293 W 2007-07-10 2007-07-10 -S000123280 intron YML036W 13 206098 206203 W 2007-07-10 2007-07-10 -S000004498 ORF Verified YML035C AMD1 AMP deaminase|AMD3 chromosome 13 L000000082|L000002678 13 208860 206428 C 1996-07-31 1996-07-31 AMP deaminase; tetrameric enzyme that catalyzes the deamination of AMP to form IMP and ammonia; thought to be involved in regulation of intracellular purine (adenine, guanine, and inosine) nucleotide pools -S000031615 CDS YML035C 13 208860 206428 C 1996-07-31 1996-07-31 -S000004497 ORF Verified YML034W SRC1 HEH1|YML033W chromosome 13 S000004496 13 209525 212155 W 1998-11-10 1998-11-10|1996-07-31 Inner nuclear membrane protein; highly enriched at telomeres and subtelomeric regions; functions in regulation of subtelomeric genes and is linked to TREX (transcription export) factors; SRC1 produces 2 splice variant proteins with different functions; alternative splicing of SRC1 pre-mRNA is promoted by Hub1p; mutant has aneuploidy tolerance; SEC1 has a paralog, HEH2, that arose from the whole genome duplication -S000031569 CDS YML034W 13 209525 211444 W 1998-11-10 1998-11-10|1996-07-31 -S000031570 CDS YML034W 13 211571 212155 W 1998-11-10 1998-11-10 -S000031571 intron YML034W 13 211445 211570 W 1998-11-10 1998-11-10 -S000004499 ORF Dubious YML034C-A YML035C-A chromosome 13 13 209826 209428 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SRC1/YML034W -S000031984 CDS YML034C-A 13 209826 209428 C 1996-07-31 1996-07-31 -S000004494 ORF Verified YML032C RAD52 recombinase RAD52 chromosome 13 L000001572 13 213930 212515 C -18 2003-01-07 2003-01-07|1996-07-31 Protein that stimulates strand exchange; stimulates strand exchange by facilitating Rad51p binding to single-stranded DNA; anneals complementary single-stranded DNA; involved in the repair of double-strand breaks in DNA during vegetative growth and meiosis and UV induced sister chromatid recombination -S000030550 CDS YML032C 13 213930 212515 C 2003-01-07 2003-01-07|1996-07-31 -S000004493 ORF Verified YML031W NDC1 chromosome 13 L000001237 13 214189 216156 W -18 1996-07-31 1996-07-31 Subunit of the transmembrane ring of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport, NPC biogenesis and spindle pole body duplication; homologous to human NDC1 -S000030507 CDS YML031W 13 214189 216156 W 1996-07-31 1996-07-31 -S000028809 ORF Dubious YML031C-A YML032C-A chromosome 13 S000004495 13 214421 214086 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF NDC1/YML031W -S000033595 CDS YML031C-A 13 214421 214086 C 2003-07-29 2003-07-29 -S000004492 ORF Verified YML030W RCF1 AIM31 chromosome 13 13 216435 216914 W 1996-07-31 1996-07-31 Cytochrome c oxidase subunit; required for assembly of the Complex III-Complex IV supercomplex, and for assembly of Cox13p and Rcf2p into cytochrome c oxidase; similar to Rcf2p, and either Rcf1p or Rcf2p is required for late-stage assembly of the Cox12p and Cox13p subunits and for cytochrome c oxidase activity; required for growth under hypoxic conditions; member of the hypoxia induced gene family; C. elegans and human orthologs are functional in yeast -S000030362 CDS YML030W 13 216435 216914 W 1996-07-31 1996-07-31 -S000004491 ORF Verified YML029W USA1 chromosome 13 L000003225 13 217362 219878 W 1996-07-31 1996-07-31 Scaffold subunit of the Hrd1p ubiquitin ligase; also promotes ligase oligomerization; involved in ER-associated protein degradation (ERAD); interacts with the U1 snRNP-specific protein, Snp1p -S000037625 CDS YML029W 13 217362 219878 W 1996-07-31 1996-07-31 -S000004490 ORF Verified YML028W TSA1 thioredoxin peroxidase TSA1|cTPxI|TPX1|ZRG14 chromosome 13 L000002365 13 220138 220728 W 1996-07-31 1996-07-31 Thioredoxin peroxidase; acts as both ribosome-associated and free cytoplasmic antioxidant; self-associates to form high-molecular weight chaperone complex under oxidative stress; chaperone activity essential for growth in zinc deficiency; required for telomere length maintenance; binds and modulates Cdc19p activity; protein abundance increases, forms cytoplasmic foci during DNA replication stress; TSA1 has a paralog, TSA2, that arose from the whole genome duplication -S000037561 CDS YML028W 13 220138 220728 W 1996-07-31 1996-07-31 -S000004489 ORF Verified YML027W YOX1 chromosome 13 L000002540 13 221406 222563 W 1996-07-31 1996-07-31 Homeobox transcriptional repressor; binds to Mcm1p and to early cell cycle boxes (ECBs) in the promoters of cell cycle-regulated genes expressed in M/G1 phase; expression is cell cycle-regulated; phosphorylated by Cdc28p; relocalizes from nucleus to cytoplasm upon DNA replication stress; YOX1 has a paralog, YHP1, that arose from the whole genome duplication -S000036828 CDS YML027W 13 221406 222563 W 1996-07-31 1996-07-31 -S000004488 ORF Verified YML026C RPS18B uS13|ribosomal 40S subunit protein S18B|S18B|S13 chromosome 13 L000004481 13 223828 222987 C 1996-07-31 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S18 and bacterial S13; RPS18B has a paralog, RPS18A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000036754 CDS YML026C 13 223380 222987 C 1996-07-31 1996-07-31 -S000036753 CDS YML026C 13 223828 223782 C 1996-07-31 1996-07-31 -S000036755 intron YML026C 13 223781 223381 C 1996-07-31 1996-07-31 -S000004487 ORF Verified YML025C YML6 mitochondrial 54S ribosomal protein YmL6 chromosome 13 13 225365 224406 C 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the large subunit; has similarity to E. coli L4 ribosomal protein and human mitoribosomal MRP-L4 protein; essential for viability, unlike most other mitoribosomal proteins -S000036690 CDS YML025C 13 225239 224406 C 1996-07-31 1996-07-31 -S000036689 CDS YML025C 13 225365 225339 C 1996-07-31 1996-07-31 -S000036691 intron YML025C 13 225338 225240 C 1996-07-31 1996-07-31 -S000004486 ORF Verified YML024W RPS17A eS17|ribosomal 40S subunit protein S17A|S17e|rp51A|S17A|RPL51A|RP51A chromosome 13 L000001740|L000004479|L000001669 13 225889 226697 W 1996-07-31 1996-07-31 Ribosomal protein 51 (rp51) of the small (40s) subunit; homologous to mammalian ribosomal protein S17, no bacterial homolog; RPS17A has a paralog, RPS17B, that arose from the whole genome duplication -S000036659 CDS YML024W 13 225889 225891 W 1996-07-31 1996-07-31 -S000036660 CDS YML024W 13 226290 226697 W 1996-07-31 1996-07-31 -S000036661 intron YML024W 13 225892 226289 W 1996-07-31 1996-07-31 -S000004485 ORF Verified YML023C NSE5 Smc5-Smc6 complex subunit NSE5 chromosome 13 13 228664 226994 C 1996-07-31 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair -S000035667 CDS YML023C 13 228664 226994 C 1996-07-31 1996-07-31 -S000004484 ORF Verified YML022W APT1 adenine phosphoribosyltransferase APT1 chromosome 13 L000002641 13 228937 229500 W 1996-07-31 1996-07-31 Adenine phosphoribosyltransferase; catalyzes the formation of AMP from adenine and 5-phosphoribosylpyrophosphate; involved in the salvage pathway of purine nucleotide biosynthesis; APT1 has a paralog, APT2, that arose from the whole genome duplication -S000035625 CDS YML022W 13 228937 229500 W 1996-07-31 1996-07-31 -S000004483 ORF Verified YML021C UNG1 uracil-DNA glycosylase chromosome 13 L000002428 13 230813 229734 C -16 1996-07-31 1996-07-31 Uracil-DNA glycosylase; required for repair of uracil in DNA formed by spontaneous cytosine deamination; efficiently excises uracil from single-stranded DNA in vivo; not required for strand-specific mismatch repair; cell-cycle regulated, expressed in late G1; localizes to mitochondria and nucleus -S000035496 CDS YML021C 13 230813 229734 C 1996-07-31 1996-07-31 -S000004482 ORF Uncharacterized YML020W chromosome 13 13 231149 233143 W 1996-07-31 1996-07-31 Putative protein of unknown function -S000034551 CDS YML020W 13 231149 233143 W 1996-07-31 1996-07-31 -S000004481 ORF Verified YML019W OST6 dolichyl-diphosphooligosaccharide--protein glycotransferase chromosome 13 L000004224 13 233457 234455 W 1996-07-31 1996-07-31 Subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins; similar to and partially functionally redundant with Ost3p -S000033544 CDS YML019W 13 233457 234455 W 1996-07-31 1996-07-31 -S000004480 ORF Verified YML018C chromosome 13 13 235952 234771 C 1996-07-31 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the membrane of the vacuole; physical interaction with Atg27p suggests a possible role in autophagy; YML018C is not an essential gene; relative distribution to the vacuolar membrane decreases upon DNA replication stress; YML018C has a paralog, THI74, that arose from the whole genome duplication -S000033433 CDS YML018C 13 235952 234771 C 1996-07-31 1996-07-31 -S000004479 ORF Verified YML017W PSP2 MRS15 chromosome 13 L000002882 13 236588 238731 W 2004-01-30 2004-01-30|1996-07-31|1999-07-17 Asn rich cytoplasmic protein that contains RGG motifs; high-copy suppressor of group II intron-splicing defects of a mutation in MRS2 and of a conditional mutation in POL1 (DNA polymerase alpha); possible role in mitochondrial mRNA splicing -S000033400 CDS YML017W 13 236588 236591 W 2004-01-30 2004-01-30|1999-07-17|1996-07-31 -S000033401 CDS YML017W 13 236954 238731 W 2004-01-30 2004-01-30 -S000033402 intron YML017W 13 236592 236953 W 2004-01-30 2004-01-30 -S000004478 ORF Verified YML016C PPZ1 salt homeostasis regulator chromosome 13 L000001478 13 241536 239458 C 1996-07-31 1996-07-31 Serine/threonine protein phosphatase Z, isoform of Ppz2p; involved in regulation of potassium transport, which affects osmotic stability, cell cycle progression, and halotolerance -S000032668 CDS YML016C 13 241536 239458 C 1996-07-31 1996-07-31 -S000004477 ORF Verified YML015C TAF11 TafII40|TAF40 chromosome 13 L000003461 13 243029 241989 C 1996-07-31 1996-07-31 TFIID subunit (40 kDa); involved in RNA polymerase II transcription initiation, similar to histone H3 with atypical histone fold motif of Spt3-like transcription factors -S000032578 CDS YML015C 13 243029 241989 C 1996-07-31 1996-07-31 -S000004476 ORF Verified YML014W TRM9 tRNA (carboxymethyluridine(34)-5-O)-methyltransferase|KTI1 chromosome 13 S000028426 13 243225 244064 W 1996-07-31 1996-07-31 tRNA methyltransferase; catalyzes modification of wobble bases in tRNA anticodons to 2, 5-methoxycarbonylmethyluridine and 5-methoxycarbonylmethyl-2-thiouridine; may act as part of a complex with Trm112p; deletion mutation increases translational infidelity, including amino acid misincorporation and -1 frameshifting, and also confers resistance to zymocin; null mutant displays activation of stress responses -S000032547 CDS YML014W 13 243225 244064 W 1996-07-31 1996-07-31 -S000004475 ORF Verified YML013W UBX2 SEL1 chromosome 13 13 244149 245903 W 1996-07-31 1996-07-31 Bridging factor involved in ER-associated protein degradation (ERAD); bridges the cytosolic Cdc48p-Npl1p-Ufd1p ATPase complex and the membrane associated Ssm4p and Hrd1p ubiquitin ligase complexes; contains a UBX (ubiquitin regulatory X) domain and a ubiquitin-associated (UBA) domain; redistributes from the ER to lipid droplets during the diauxic shift and stationary phase; required for the maintenance of lipid homeostasis -S000032448 CDS YML013W 13 244149 245903 W 1996-07-31 1996-07-31 -S000004474 ORF Dubious YML012C-A YML013C-A chromosome 13 13 245914 245537 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SEL1 -S000037094 CDS YML012C-A 13 245914 245537 C 1996-07-31 1996-07-31 -S000004473 ORF Verified YML012W ERV25 chromosome 13 L000004076 13 246116 246751 W 1996-07-31 1996-07-31 Member of the p24 family involved in ER to Golgi transport; role in misfolded protein quality control; forms a heterotrimeric complex with Erp1, Erp2p, and Emp24, -S000031434 CDS YML012W 13 246116 246751 W 1996-07-31 1996-07-31 -S000004472 ORF Verified YML011C RAD33 chromosome 13 13 247428 246895 C 1996-07-31 1996-07-31 Protein involved in nucleotide excision repair; green fluorescent protein (GFP)-fusion protein localizes to the nucleus -S000031265 CDS YML011C 13 247428 246895 C 1996-07-31 1996-07-31 -S000004470 ORF Verified YML010W SPT5 transcription elongation factor SPT5 chromosome 13 L000002031 13 247677 250868 W -5 1996-07-31 1996-07-31 Spt4p/5p (DSIF) transcription elongation factor complex subunit; the Spt4/5 complex binds to ssRNA in a sequence-specific manner, and in concert with RNAP I and II has multiple roles regulating transcriptional elongation, RNA processing, quality control, and transcription-coupled repair; interacts with DNA upstream of RNAPII and the non-template strand of the transcription bubble; Spt5p is the only transcription elongation factor conserved in all domains of life -S000031213 CDS YML010W 13 247677 250868 W 1996-07-31 1996-07-31 -S000004471 ORF Dubious YML009W-B YML010W-A chromosome 13 13 250435 250911 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion mutation confers an increase in Ty1 transposition -S000032788 CDS YML009W-B 13 250435 250911 W 1996-07-31 1996-07-31 -S000004469 ORF Dubious YML009C-A YML010W-B|YML010C-B chromosome 13 13 251001 250675 C 1997-07-01 1997-07-01 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORFs SPT5/YML010W and YML009W-B -S000031473 CDS YML009C-A 13 251001 250675 C 1997-07-01 1997-07-01 -S000004468 ORF Verified YML009C MRPL39 mitochondrial 54S ribosomal protein YmL39|YmL39 chromosome 13 L000002695 13 251516 251304 C 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000037268 CDS YML009C 13 251516 251304 C 1996-07-31 1996-07-31 -S000004467 ORF Verified YML008C ERG6 sterol 24-C-methyltransferase|VID1|SED6|LIS1|ISE1 chromosome 13 L000000572|S000029637|L000003110 13 252990 251839 C 2 1996-07-31 1996-07-31 Delta(24)-sterol C-methyltransferase; converts zymosterol to fecosterol in the ergosterol biosynthetic pathway by methylating position C-24; localized to lipid particles, the plasma membrane-associated endoplasmic reticulum, and the mitochondrial outer membrane -S000037178 CDS YML008C 13 252990 251839 C 1996-07-31 1996-07-31 -S000007621 ORF Uncharacterized YML007C-A chromosome 13 13 253272 253162 C 2001-02-26 2001-02-26 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria -S000037219 CDS YML007C-A 13 253272 253162 C 2001-02-26 2001-02-26 -S000004466 ORF Verified YML007W YAP1 PDR4|DNA-binding transcription factor YAP1|SNQ3|PAR1 chromosome 13 L000001364 13 253848 255800 W -8 1996-07-31 1996-07-31 Basic leucine zipper (bZIP) transcription factor; required for oxidative stress tolerance; activated by H2O2 through the multistep formation of disulfide bonds and transit from the cytoplasm to the nucleus; Yap1p is degraded in the nucleus after the oxidative stress has passed; mediates resistance to cadmium; relative distribution to the nucleus increases upon DNA replication stress; YAP1 has a paralog, CAD1, that arose from the whole genome duplication -S000037132 CDS YML007W 13 253848 255800 W 1996-07-31 1996-07-31 -S000004465 ORF Verified YML006C GIS4 chromosome 13 L000004864 13 258416 256092 C 1996-07-31 1996-07-31 CAAX box containing protein of unknown function; proposed to be involved in the RAS/cAMP signaling pathway -S000036417 CDS YML006C 13 258416 256092 C 1996-07-31 1996-07-31 -S000006729 tRNA_gene tS(AGA)M chromosome 13 L000003683 13 259239 259158 C 2000-05-19 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032411 noncoding_exon tS(AGA)M 13 259239 259158 C 2000-05-19 2000-05-19 -S000004464 ORF Verified YML005W TRM12 TYW2 chromosome 13 13 260221 261609 W 1996-07-31 1996-07-31 S-adenosylmethionine-dependent methyltransferase; required for wybutosine formation in phenylalanine-accepting tRNA; member of the seven beta-strand family -S000036385 CDS YML005W 13 260221 261609 W 1996-07-31 1996-07-31 -S000004463 ORF Verified YML004C GLO1 lactoylglutathione lyase GLO1 chromosome 13 L000000712 13 262685 261705 C 1996-07-31 1996-07-31 Monomeric glyoxalase I; catalyzes the detoxification of methylglyoxal (a by-product of glycolysis) via condensation with glutathione to produce S-D-lactoylglutathione; expression regulated by methylglyoxal levels and osmotic stress -S000036221 CDS YML004C 13 262685 261705 C 1996-07-31 1996-07-31 -S000118369 ARS ARS1309 ARSXIII-263 chromosome 13 13 263063 263296 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178155 ARS_consensus_sequence ARS1309 13 263126 263142 W 2014-11-18 2014-11-18 -S000004462 ORF Uncharacterized YML003W chromosome 13 13 263483 264355 W 1996-07-31 1996-07-31 Putative protein of unknown function -S000036178 CDS YML003W 13 263483 264355 W 1996-07-31 1996-07-31 -S000004461 ORF Uncharacterized YML002W chromosome 13 13 264541 266754 W 1996-07-31 1996-07-31 Putative protein of unknown function; expression induced by heat and by calcium shortage -S000035235 CDS YML002W 13 264541 266754 W 1996-07-31 1996-07-31 -S000004460 ORF Verified YML001W YPT7 Rab family GTPase YPT7|VAM4|AST4 chromosome 13 L000002544 13 267174 267800 W 1996-07-31 1996-07-31 Rab family GTPase; GTP-binding protein of the rab family; required for homotypic fusion event in vacuole inheritance, for endosome-endosome fusion; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs); interacts with the cargo selection/retromer complex for retrograde sorting; similar to mammalian Rab7 -S000035058 CDS YML001W 13 267174 267800 W 1996-07-31 1996-07-31 -S000006474 centromere CEN13 CEN13 chromosome 13 L000000306 13 268031 268149 W 0 2004-10-08 2000-05-19|2004-10-08 Chromosome XIII centromere -S000077278 centromere_DNA_Element_I CEN13 13 268031 268040 W 2004-10-05 2004-10-05 -S000077279 centromere_DNA_Element_II CEN13 13 268041 268124 W 2004-10-05 2004-10-05 -S000077280 centromere_DNA_Element_III CEN13 13 268125 268149 W 2004-10-05 2004-10-05 -S000004603 ORF Verified YMR001C CDC5 polo kinase CDC5|PKX2|MSD2 chromosome 13 L000000245 13 271136 269019 C -14 1996-07-31 1996-07-31 Polo-like kinase; controls targeting and activation of Rho1p at cell division site via Rho1p guanine nucleotide exchange factors; regulates Spc72p; also functions in adaptation to DNA damage during meiosis; regulates the shape of the nucleus and expansion of the nuclear envelope during mitosis; similar to Xenopus Plx1 and S. pombe Plo1p; human homologs PLK1, PLK3 can each complement yeast cdc5 thermosensitive mutants -S000031052 CDS YMR001C 13 271136 269019 C 1996-07-31 1996-07-31 -S000028691 ORF Uncharacterized YMR001C-A chromosome 13 13 271577 271347 C 2003-07-29 2003-07-29 Putative protein of unknown function -S000032590 CDS YMR001C-A 13 271577 271347 C 2003-07-29 2003-07-29 -S000004604 ORF Verified YMR002W MIX17 MIC17 chromosome 13 13 272193 272663 W 1996-07-31 1996-07-31 Mitochondrial intermembrane space protein; required for normal oxygen consumption; contains twin cysteine-x9-cysteine motifs; protein abundance increases in response to DNA replication stress -S000031255 CDS YMR002W 13 272193 272663 W 1996-07-31 1996-07-31 -S000004605 ORF Verified YMR003W AIM34 chromosome 13 13 273118 273714 W 1996-07-31 1996-07-31 Protein of unknown function; GFP-fusion protein localizes to the mitochondria; null mutant is viable and displays reduced frequency of mitochondrial genome loss -S000032255 CDS YMR003W 13 273118 273714 W 1996-07-31 1996-07-31 -S000004606 ORF Verified YMR004W MVP1 chromosome 13 L000001221 13 274017 275552 W 1996-07-31 1996-07-31 Protein required for sorting proteins to the vacuole; Mvp1p and Vps1p act in concert to promote membrane traffic to the vacuole; participates in transcription initiation and/or early elongation of specific genes; interacts with "foot domain" of RNA polymerase II; deletion results in abnormal CTD-Ser5 phosphorylation of RNA polymerase II at specific promoter regions; protein abundance increases in response to DNA replication stress -S000032360 CDS YMR004W 13 274017 275552 W 1996-07-31 1996-07-31 -S000004607 ORF Verified YMR005W TAF4 TafII48|MPT1|TSG2|TAF48 chromosome 13 L000001144 13 276045 277211 W 1996-07-31 1996-07-31 TFIID subunit (48 kDa); involved in RNA polymerase II transcription initiation; potential Cdc28p substrate -S000032443 CDS YMR005W 13 276045 277211 W 1996-07-31 1996-07-31 -S000004608 ORF Verified YMR006C PLB2 lysophospholipase chromosome 13 L000004866 13 279681 277561 C 1996-07-31 1996-07-31 Phospholipase B (lysophospholipase) involved in lipid metabolism; displays transacylase activity in vitro; overproduction confers resistance to lysophosphatidylcholine -S000032499 CDS YMR006C 13 279681 277561 C 1996-07-31 1996-07-31 -S000004609 ORF Uncharacterized YMR007W chromosome 13 13 279960 280340 W 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR007W is not an essential gene -S000034599 CDS YMR007W 13 279960 280340 W 1996-07-31 1996-07-31 -S000004610 ORF Verified YMR008C PLB1 lysophospholipase chromosome 13 L000001447 13 282584 280590 C 1996-07-31 1996-07-31 Phospholipase B (lysophospholipase) involved in lipid metabolism; required for efficient acyl chain remodeling of newly synthesized phosphatidylethanolamine-derived phosphatidylcholine; required for deacylation of phosphatidylcholine and phosphatidylethanolamine but not phosphatidylinositol; PLB1 has a paralog, PLB3, that arose from the whole genome duplication -S000034626 CDS YMR008C 13 282584 280590 C 1996-07-31 1996-07-31 -S000004611 ORF Verified YMR009W ADI1 acireductone dioxygenase (Ni2+-requiring) chromosome 13 13 284102 284641 W 2011-02-03 1996-07-31 Acireductone dioxygenease involved in methionine salvage pathway; transcribed as polycistronic mRNA with YMR010W and regulated post-transcriptionally by RNase III (Rnt1p) cleavage; ADI1 mRNA is induced in heat shock conditions; human ortholog ADI1 can complement yeast adi1 mutant -S000034714 CDS YMR009W 13 284102 284641 W 2011-02-03 1996-07-31 -S000004612 ORF Verified YMR010W ANY1 chromosome 13 13 285100 286317 W 2011-02-03 1996-07-31 Putative protein of unknown function; null allele suppresses the lethality of neo1 and dop1 null alleles, as well as the growth defect of a mon2 null allele, and the cold sensitivity of a drs2 null; proposed function as a phospholipid scramblase that reduces membrane asymmetry; PQ loop family member; localizes to the cytoplasm and endoplasmic reticulum in HTP studies; non-essential gene -S000034268 CDS YMR010W 13 285100 286317 W 2011-02-03 1996-07-31 -S000118370 ARS ARS1310 ARSXIII-287 chromosome 13 13 286835 286951 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000004613 ORF Verified YMR011W HXT2 hexose transporter HXT2 chromosome 13 L000000836 13 288079 289704 W 2011-02-03 1996-07-31 High-affinity glucose transporter of the major facilitator superfamily; expression is induced by low levels of glucose and repressed by high levels of glucose -S000034391 CDS YMR011W 13 288079 289704 W 2011-02-03 1996-07-31 -S000007117 long_terminal_repeat YMRCtau1 chromosome 13 13 290224 290049 C 2011-02-03 2000-05-19 Ty4 LTR -S000006560 tRNA_gene tE(UUC)M chromosome 13 L000003667 13 290801 290872 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000036015 noncoding_exon tE(UUC)M 13 290801 290872 W 2011-02-03 2000-05-19 -S000004614 ORF Verified YMR012W CLU1 translation initiation factor 3 subunit CLU1|TIF31 chromosome 13 L000003531 13 291134 294967 W 2011-02-03 1996-07-31 Subunit of the eukaryotic translation initiation factor 3 (eIF3); component of unknown function; deletion causes defects in mitochondrial organization but not in growth or translation initiation; can rescue cytokinesis and mitochondrial organization defects of the Dictyostelium cluA- mutant; eIF3 is also involved in programmed stop codon readthrough -S000035421 CDS YMR012W 13 291134 294967 W 2011-02-03 1996-07-31 -S000028847 ORF Dubious YMR013C-A chromosome 13 13 296620 296471 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF SEC59/YML013C -S000034532 CDS YMR013C-A 13 296620 296471 C 2011-02-03 2003-07-29 -S000004615 ORF Verified YMR013C SEC59 dolichol kinase chromosome 13 L000001851 13 296738 295179 C 3 2011-02-03 1996-07-31 Dolichol kinase; catalyzes the terminal step in dolichyl monophosphate (Dol-P) biosynthesis; required for viability and for normal rates of lipid intermediate synthesis and protein N-glycosylation -S000035477 CDS YMR013C 13 296738 295179 C 2011-02-03 1996-07-31 -S000007312 snoRNA_gene snR78 SNR78 Z8 chromosome 13 L000004806 13 297278 297364 W 2011-02-03 2000-05-19|2007-05-08 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2421 -S000031835 noncoding_exon snR78 13 297278 297364 W 2011-02-03 2000-05-19|2007-05-08 -S000007311 snoRNA_gene snR77 SNR77 Z7 chromosome 13 L000004805 13 297506 297593 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position U578 -S000031791 noncoding_exon snR77 13 297506 297593 W 2011-02-03 2000-05-19 -S000007310 snoRNA_gene snR76 SNR76 Z6 chromosome 13 L000004804 13 297725 297833 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2197 -S000031789 noncoding_exon snR76 13 297725 297833 W 2011-02-03 2000-05-19 -S000007309 snoRNA_gene snR75 SNR75 Z5 chromosome 13 L000004803 13 297918 298006 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G2288 -S000031787 noncoding_exon snR75 13 297918 298006 W 2011-02-03 2000-05-19 -S000007308 snoRNA_gene snR74 SNR74 Z4 chromosome 13 L000004802 13 298138 298225 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A28 -S000031786 noncoding_exon snR74 13 298138 298225 W 2011-02-03 2000-05-19 -S000007307 snoRNA_gene snR73 SNR73 Z3 chromosome 13 L000004801 13 298307 298412 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2959 -S000031785 noncoding_exon snR73 13 298307 298412 W 2011-02-03 2000-05-19 -S000007622 ORF Dubious YMR013W-A chromosome 13 13 298311 298391 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the characterized snoRNA gene snR73 -S000037220 CDS YMR013W-A 13 298311 298391 W 2011-02-03 2001-02-26 -S000007306 snoRNA_gene snR72 SNR72 Z2 chromosome 13 L000004800 13 298554 298651 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A876 -S000031784 noncoding_exon snR72 13 298554 298651 W 2011-02-03 2000-05-19 -S000004616 ORF Verified YMR014W BUD22 chromosome 13 13 298868 300427 W 2011-02-03 1996-07-31 Protein required for rRNA maturation and ribosomal subunit biogenesis; required for 18S rRNA maturation; also required for small ribosomal subunit biogenesis; cosediments with pre-ribosomal particles; mutation decreases efficiency of +1 Ty1 frameshifting and transposition, and affects budding pattern -S000035607 CDS YMR014W 13 298868 300427 W 2011-02-03 1996-07-31 -S000004617 ORF Verified YMR015C ERG5 C-22 sterol desaturase|CYP61 chromosome 13 L000003978 13 302485 300869 C 2011-02-03 1996-07-31 C-22 sterol desaturase; a cytochrome P450 enzyme that catalyzes the formation of the C-22(23) double bond in the sterol side chain in ergosterol biosynthesis; may be a target of azole antifungal drugs -S000035627 CDS YMR015C 13 302485 300869 C 2011-02-03 1996-07-31 -S000004618 ORF Verified YMR016C SOK2 chromosome 13 L000004147 13 305593 303236 C 2011-02-03 1996-07-31 Nuclear protein that negatively regulates pseudohyphal differentiation; plays a regulatory role in the cyclic AMP (cAMP)-dependent protein kinase (PKA) signal transduction pathway; relocalizes to the cytosol in response to hypoxia; SOK2 has a paralog, PHD1, that arose from the whole genome duplication -S000036571 CDS YMR016C 13 305593 303236 C 2011-02-03 1996-07-31 -S000004619 ORF Verified YMR017W SPO20 DBI9 chromosome 13 L000003397 13 307489 308682 W 2011-02-03 1996-07-31 Meiosis-specific subunit of the t-SNARE complex; required for prospore membrane formation during sporulation; similar to but not functionally redundant with Sec9p; binds to phosphatidic acid; SNAP-25 homolog -S000036703 CDS YMR017W 13 307489 308682 W 2011-02-03 1996-07-31 -S000004620 ORF Uncharacterized YMR018W PEX9 chromosome 13 13 310208 311752 W 2011-02-03 1996-07-31 Putative protein of unknown function with similarity to human PEX5Rp; transcription increases during colony development similar to genes involved in peroxisome biogenesis; YMR018W is not an essential gene; PEX5Rp is also known as peroxin protein 5 related protein -S000030567 CDS YMR018W 13 310208 311752 W 2011-02-03 1996-07-31 -S000004621 ORF Verified YMR019W STB4 chromosome 13 L000003367 13 312156 315005 W 2011-02-03 1996-07-31 Putative transcription factor; contains a Zn(II)2Cys6 zinc finger domain characteristic of DNA-binding proteins; computational analysis suggests a role in regulation of expression of genes encoding transporters; binds Sin3p in a two-hybrid assay; -S000030693 CDS YMR019W 13 312156 315005 W 2011-02-03 1996-07-31 -S000004622 ORF Verified YMR020W FMS1 polyamine oxidase chromosome 13 L000003091 13 315377 316903 W 2011-02-03 1996-07-31 Polyamine oxidase; converts spermine to spermidine, which is required for the essential hypusination modification of translation factor eIF-5A; also involved in pantothenic acid biosynthesis -S000030473 CDS YMR020W 13 315377 316903 W 2011-02-03 1996-07-31 -S000004623 ORF Verified YMR021C MAC1 CUA1 chromosome 13 L000000973|L000001035 13 318418 317165 C 2011-02-03 1996-07-31 Copper-sensing transcription factor; involved in regulation of genes required for high affinity copper transport; required for regulation of yeast copper genes in response to DNA-damaging agents; undergoes changes in redox state in response to changing levels of copper or MMS -S000030536 CDS YMR021C 13 318418 317165 C 2011-02-03 1996-07-31 -S000004624 ORF Verified YMR022W UBC7 E2 ubiquitin-conjugating protein UBC7|DER2|QRI8 chromosome 13 L000001552 13 318680 319177 W 2011-02-03 1996-07-31 Ubiquitin conjugating enzyme; involved in the ER-associated protein degradation (ERAD) pathway and in the inner nuclear membrane-associated degradation (INMAD) pathway; requires Cue1p for recruitment to the ER membrane; proposed to be involved in chromatin assembly -S000031503 CDS YMR022W 13 318680 319177 W 2011-02-03 1996-07-31 -S000004625 ORF Verified YMR023C MSS1 PET53 chromosome 13 L000001201 13 321017 319437 C 2011-02-03 1996-07-31 Mitochondrial protein; forms a heterodimer complex with Mto1p that performs the 5-carboxymethylaminomethyl modification of the wobble uridine base in mitochondrial tRNAs; similar to human GTPBP3 -S000031572 CDS YMR023C 13 321017 319437 C 2011-02-03 1996-07-31 -S000006518 tRNA_gene tA(AGC)M1 chromosome 13 L000003682 13 321219 321147 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000036429 noncoding_exon tA(AGC)M1 13 321219 321147 C 2011-02-03 2000-05-19 -S000004626 ORF Verified YMR024W MRPL3 mitochondrial 54S ribosomal protein YmL3|YmL3 chromosome 13 L000002683 13 321875 323047 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; located in close proximity to the polypeptide exit channel of the ribosome; mutations in human homolog MRPL44 cause childhood cardiomyopathy; human MRPL44 deficiency results in inefficient assembly of the mitochondrial ribosome, and in tissue-specific respiratory chain deficiency, manifesting as either Complex I+Complex IV or Complex IV deficiency, depending on a cell type -S000032636 CDS YMR024W 13 321875 323047 W 2011-02-03 1996-07-31 -S000004627 ORF Verified YMR025W CSI1 chromosome 13 S000028416 13 323300 324187 W 2011-02-03 1996-07-31 Subunit of the Cop9 signalosome; which is required for deneddylation, or removal of the ubiquitin-like protein Rub1p from Cdc53p (cullin); involved in adaptation to pheromone signaling; functional equivalent of canonical Csn6 subunit of the COP9 signalosome -S000032707 CDS YMR025W 13 323300 324187 W 2011-02-03 1996-07-31 -S000004628 ORF Verified YMR026C PEX12 ubiquitin-protein ligase peroxin 12|PAS11 chromosome 13 L000004223|L000003964 13 325435 324236 C 2011-02-03 1996-07-31 C3HC4-type RING-finger peroxin and E3 ubiquitin ligase; required for peroxisome biogenesis and peroxisomal matrix protein import; forms translocation subcomplex with Pex2p and Pex10p; mutations in human homolog cause peroxisomal disorder -S000032743 CDS YMR026C 13 325435 324236 C 2011-02-03 1996-07-31 -S000004629 ORF Verified YMR027W putative methyltransferase chromosome 13 L000004444 13 325877 327289 W 2011-02-03 1996-07-31 A metal-dependent phosphatase, part of the DUF89 protein family; dephosphorylates fructose-1-phosphate; human ortholog, C6orf211 is involved in response to DNA damage; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and cytoplasm; YMR027W is not an essential gene -S000032910 CDS YMR027W 13 325877 327289 W 2011-02-03 1996-07-31 -S000004630 ORF Verified YMR028W TAP42 chromosome 13 L000002599 13 327482 328582 W 2011-02-03 1996-07-31 Essential protein involved in the TOR signaling pathway; physically associates with the protein phosphatase 2A and the SIT4 protein phosphatase catalytic subunits -S000034867 CDS YMR028W 13 327482 328582 W 2011-02-03 1996-07-31 -S000004631 ORF Verified YMR029C FAR8 chromosome 13 13 330231 328660 C 2011-02-03 1996-07-31 Protein involved in recovery from arrest in response to pheromone; acts in a cell cycle arrest recovery pathway independent from Far1p; interacts with Far3p, Far7p, Far9p, Far10p, and Far11p -S000034915 CDS YMR029C 13 330231 328660 C 2011-02-03 1996-07-31 -S000004632 ORF Verified YMR030W RSF1 chromosome 13 13 330793 331923 W 2011-02-03 1996-07-31 Protein required for respiratory growth; localized to both the nucleus and mitochondrion; may interact with transcription factors to mediate the transition to respiratory growth and activate transcription of nuclear and mitochondrial genes -S000033894 CDS YMR030W 13 330793 331923 W 2011-02-03 1996-07-31 -S000004634 ORF Dubious YMR031W-A chromosome 13 13 334709 335035 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant displays shortened telomeres; partially overlaps the uncharacterized ORF YMR031C -S000036523 CDS YMR031W-A 13 334709 335035 W 2011-02-03 1996-07-31 -S000004633 ORF Verified YMR031C EIS1 chromosome 13 13 334743 332212 C 2011-02-03 1996-07-31 Component of the eisosome required for proper eisosome assembly; similar to Uso1p; authentic, non-tagged protein is detected in a phosphorylated state in highly purified mitochondria in high-throughput studies; protein increases in abundance and relocalizes from plasma membrane to cytoplasm upon DNA replication stress; EIS1 has a paralog, YKL050C, that arose from the whole genome duplication -S000033984 CDS YMR031C 13 334743 332212 C 2011-02-03 1996-07-31 -S000004635 ORF Verified YMR032W HOF1 formin-binding protein HOF1|CYK2 chromosome 13 L000004406 13 335298 337307 W 2011-02-03 1996-07-31 Protein that regulates actin cytoskeleton organization; required for cytokinesis, actin cable organization, and secretory vesicle trafficking; localized to bud neck; phosphorylated by Dbf2p; regulates actomyosin ring dynamics and septin localization; contains an SH3 domain; N terminus controls cell size and levels of actin cables, while C terminus controls actin cable organization via direct regulation of the formin Bnr1p -S000034951 CDS YMR032W 13 335298 337307 W 2011-02-03 1996-07-31 -S000028574 ORF Uncharacterized YMR030W-A chromosome 13 13 337313 337603 W 2011-02-03 2003-07-29 Putative protein of unknown function; mCherry fusion protein localizes to the cytosol -S000031303 CDS YMR030W-A 13 337313 337603 W 2011-02-03 2003-07-29 -S000004636 ORF Verified YMR033W ARP9 RSC12|SWP59 chromosome 13 L000003438 13 337788 339277 W 2011-02-03 1996-07-31 Component of both the SWI/SNF and RSC chromatin remodeling complexes; actin-related protein involved in transcriptional regulation -S000035135 CDS YMR033W 13 337788 337817 W 2011-02-03 1996-07-31 -S000035136 CDS YMR033W 13 337904 339277 W 2011-02-03 1996-07-31 -S000035137 intron YMR033W 13 337818 337903 W 2011-02-03 1996-07-31 -S000004637 ORF Verified YMR034C RCH1 chromosome 13 13 340722 339418 C 2011-02-03 1996-07-31 Putative transporter; localizes to the plasma membrane in response to high levels of extracellular calcium; member of the SLC10 carrier family; identified in a transposon mutagenesis screen as a gene involved in azole resistance; YMR034C is not an essential gene -S000035192 CDS YMR034C 13 340722 339418 C 2011-02-03 1996-07-31 -S000004638 ORF Verified YMR035W IMP2 endopeptidase catalytic subunit chromosome 13 L000002836 13 341142 341675 W 2011-02-03 1996-07-31 Catalytic subunit of mitochondrial inner membrane peptidase complex; required for maturation of mitochondrial proteins of the intermembrane space; complex contains two catalytic subunits (Imp1p and Imp2p that differ in substrate specificity), and Som1p -S000036191 CDS YMR035W 13 341142 341675 W 2011-02-03 1996-07-31 -S000004639 ORF Verified YMR036C MIH1 putative tyrosine protein phosphatase MIH1 chromosome 13 L000001111 13 343520 341856 C 2011-02-03 1996-07-31 Protein tyrosine phosphatase involved in cell cycle control; regulates the phosphorylation state of Cdc28p; homolog of S. pombe cdc25 -S000036273 CDS YMR036C 13 343520 341856 C 2011-02-03 1996-07-31 -S000004640 ORF Verified YMR037C MSN2 stress-responsive transcriptional activator MSN2 chromosome 13 L000001198 13 346517 344403 C 2011-02-03 1996-07-31 Stress-responsive transcriptional activator; activated in stochastic pulses of nuclear localization in response to various stress conditions; binds DNA at stress response elements of responsive genes; relative distribution to nucleus increases upon DNA replication stress -S000036377 CDS YMR037C 13 346517 344403 C 2011-02-03 1996-07-31 -S000004641 ORF Verified YMR038C CCS1 copper chaperone CCS1|LYS7|CCS chromosome 13 L000000968 13 348260 347511 C 30 2011-02-03 1996-07-31 Copper chaperone for superoxide dismutase Sod1p; involved in oxidative stress protection; Met-X-Cys-X2-Cys motif within N-terminus is involved in insertion of copper into Sod1p under conditions of copper deprivation; required for regulation of yeast copper genes in response to DNA-damaging agents; protein abundance increases in response to DNA replication stress; human homolog CCS can complement yeast ccs1 null mutant -S000036442 CDS YMR038C 13 348260 347511 C 2011-02-03 1996-07-31 -S000004642 ORF Verified YMR039C SUB1 chromatin-binding transcription coactivator SUB1|TSP1 chromosome 13 L000003936 13 349522 348644 C 2011-02-03 1996-07-31 Transcriptional regulator; facilitates elongation through factors that modify RNAP II; role in peroxide resistance involving Rad2p; role in nonhomologous end-joining (NHEJ) of ds breaks in plasmid DNA, but not chromosomal DNA; role in the hyperosmotic stress response through polymerase recruitment at RNAP II and RNAP III genes; negatively regulates sporulation; protein abundance increases in response to DNA replication stress; functionally complemented by human SUB1 (PC4) -S000037092 CDS YMR039C 13 349522 348644 C 2011-02-03 1996-07-31 -S000004643 ORF Verified YMR040W YET2 chromosome 13 13 350381 350863 W 2011-02-03 1996-07-31 Protein of unknown function that may interact with ribosomes; based on co-purification experiments; homolog of human BAP31 protein; YET2 has a paralog, YET1, that arose from the whole genome duplication -S000030127 CDS YMR040W 13 350381 350863 W 2011-02-03 1996-07-31 -S000004644 ORF Verified YMR041C ARA2 D-arabinose 1-dehydrogenase (NAD(P)(+)) ARA2 chromosome 13 13 351973 350966 C 2011-02-03 1996-07-31 NAD-dependent arabinose dehydrogenase; involved in biosynthesis of dehydro-D-arabinono-1,4-lactone; similar to plant L-galactose dehydrogenase -S000030237 CDS YMR041C 13 351973 350966 C 2011-02-03 1996-07-31 -S000006568 tRNA_gene tF(GAA)M chromosome 13 L000003668 13 352280 352370 W 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035417 intron tF(GAA)M 13 352317 352334 W 2011-02-03 2000-05-19 -S000035415 noncoding_exon tF(GAA)M 13 352280 352316 W 2011-02-03 2000-05-19 -S000035416 noncoding_exon tF(GAA)M 13 352335 352370 W 2011-02-03 2000-05-19 -S000004645 ORF Verified YMR042W ARG80 ARGRI|ARGR1 chromosome 13 L000000112 13 352603 353136 W 36 2011-02-03 1996-07-31 Transcription factor involved in regulating arginine-responsive genes; acts with Arg81p and Arg82p -S000031259 CDS YMR042W 13 352603 353136 W 2011-02-03 1996-07-31 -S000004646 ORF Verified YMR043W MCM1 transcription factor MCM1|FUN80 chromosome 13 L000001037 13 353871 354731 W 35 2011-02-03 1996-07-31 Transcription factor; involved in cell-type-specific transcription and pheromone response; plays a central role in the formation of both repressor and activator complexes; relocalizes to the cytosol in response to hypoxia -S000031354 CDS YMR043W 13 353871 354731 W 2011-02-03 1996-07-31 -S000004647 ORF Verified YMR044W IOC4 chromosome 13 13 355384 356811 W 2011-02-03 1996-07-31 Member of a complex (Isw1b) with Isw1p and Ioc2p; interacts directly with H3K36me3 nucleosomes through its PWWP domain to recruit the Isw1b complex to open reading frames in a Set2p-dependent manner; Isw1b exhibits nucleosome-stimulated ATPase activity and acts within coding regions to coordinate transcription elongation with termination and processing -S000032363 CDS YMR044W 13 355384 356811 W 2011-02-03 1996-07-31 -S000007109 long_terminal_repeat YMRCdelta7 chromosome 13 13 357336 357005 C 2011-02-03 2000-05-19 Ty1 LTR -S000004648 transposable_element_gene YMR045C gag-pol fusion protein chromosome 13 13 362627 357359 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032431 CDS YMR045C 13 361321 357359 C 2011-02-03 1999-07-17|1996-07-31 -S000032430 CDS YMR045C 13 362627 361323 C 2011-02-03 1999-07-17|1996-07-31 -S000032432 plus_1_translational_frameshift YMR045C 13 361322 361322 C 2011-02-03 1999-07-17|1996-07-31 -S000004649 transposable_element_gene YMR046C gag protein chromosome 13 13 362627 361305 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000032514 CDS YMR046C 13 362627 361305 C 2011-02-03 1996-07-31 -S000007248 ORF Dubious YMR046W-A chromosome 13 13 362702 362830 W 2011-02-03 1997-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033646 CDS YMR046W-A 13 362702 362830 W 2011-02-03 1997-07-17 -S000007119 LTR_retrotransposon YMRCTy1-3 Ty1 chromosome 13 13 362918 357005 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007110 long_terminal_repeat YMRCdelta8 chromosome 13 13 362918 362587 C 2011-02-03 2000-05-19 Ty1 LTR -S000006599 tRNA_gene tH(GUG)M chromosome 13 L000003669 13 363064 363135 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000033895 noncoding_exon tH(GUG)M 13 363064 363135 W 2011-02-03 2000-05-19 -S000004650 ORF Verified YMR047C NUP116 FG-nucleoporin NUP116|NSP116 chromosome 13 L000001293 13 366705 363364 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier; forms a stable association with Nup82p, Gle2p and two other FG-nucleoporins (Nsp1p and Nup159p); NUP116 has a paralog, NUP100, that arose from the whole genome duplication -S000032621 CDS YMR047C 13 366705 363364 C 2011-02-03 1996-07-31 -S000004651 ORF Verified YMR048W CSM3 chromosome 13 13 366981 367934 W 2011-02-03 1996-07-31 Replication fork associated factor; required for stable replication fork pausing; component of the DNA replication checkpoint pathway; required for accurate chromosome segregation during meiosis; forms nuclear foci upon DNA replication stress -S000033358 CDS YMR048W 13 366981 367934 W 2011-02-03 1996-07-31 -S000004652 ORF Verified YMR049C ERB1 chromosome 13 13 370517 368094 C 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; forms a complex with Nop7p and Ytm1p that is required for maturation of the large ribosomal subunit; required for maturation of the 25S and 5.8S ribosomal RNAs; homologous to mammalian Bop1 -S000033387 CDS YMR049C 13 370517 368094 C 2011-02-03 1996-07-31 -S000118371 ARS ARS1312 ARSXIII-371 chromosome 13 13 371001 371105 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178156 ARS_consensus_sequence ARS1312 13 371019 371035 W 2014-11-18 2014-11-18 -S000006763 tRNA_gene tV(AAC)M1 chromosome 13 L000003681 13 372518 372445 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000030017 noncoding_exon tV(AAC)M1 13 372518 372445 C 2011-02-03 2000-05-19 -S000007111 long_terminal_repeat YMRCdelta9 chromosome 13 13 373034 372697 C 2011-02-03 2000-05-19 Ty1 LTR -S000004653 transposable_element_gene YMR050C gag-pol fusion protein chromosome 13 13 378325 373057 C 2011-02-03 1999-07-17|1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034328 CDS YMR050C 13 377019 373057 C 2011-02-03 1999-07-17|1996-07-31 -S000034327 CDS YMR050C 13 378325 377021 C 2011-02-03 1999-07-17|1996-07-31 -S000034329 plus_1_translational_frameshift YMR050C 13 377020 377020 C 2011-02-03 1999-07-17|1996-07-31 -S000004654 transposable_element_gene YMR051C gag protein chromosome 13 13 378325 377003 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034409 CDS YMR051C 13 378325 377003 C 2011-02-03 1996-07-31 -S000007120 LTR_retrotransposon YMRCTy1-4 Ty1 chromosome 13 13 378622 372697 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007112 long_terminal_repeat YMRCdelta10 chromosome 13 13 378622 378285 C 2011-02-03 2000-05-19 Ty1 LTR -S000007113 long_terminal_repeat YMRCdelta11 chromosome 13 13 379061 378727 C 2011-02-03 2000-05-19 Ty1 LTR -S000007121 long_terminal_repeat YMRWdelta12 chromosome 13 13 379072 379198 W 2011-02-03 2000-05-19 Ty1 LTR -S000006775 tRNA_gene tW(CCA)M chromosome 13 L000003680 13 379408 379303 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis -S000034112 intron tW(CCA)M 13 379372 379339 C 2011-02-03 2000-05-19 -S000034111 noncoding_exon tW(CCA)M 13 379338 379303 C 2011-02-03 2000-05-19 -S000034110 noncoding_exon tW(CCA)M 13 379408 379373 C 2011-02-03 2000-05-19 -S000004656 ORF Verified YMR052W FAR3 chromosome 13 L000002919 13 379586 380200 W 2011-02-03 1996-07-31 Protein of unknown function; involved in recovery from cell cycle arrest in response to pheromone, in a Far1p-independent pathway; interacts with Far7p, Far8p, Far9p, Far10p, and Far11p; localizes to the endoplasmic reticulum; protein abundance increases in response to DNA replication stress -S000035481 CDS YMR052W 13 379586 380200 W 2011-02-03 1996-07-31 -S000004655 ORF Dubious YMR052C-A chromosome 13 13 380434 380069 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036215 CDS YMR052C-A 13 380434 380069 C 2011-02-03 1996-07-31 -S000004657 ORF Verified YMR053C STB2 chromosome 13 L000002108 13 382898 380346 C 2011-02-03 1996-07-31 Protein that interacts with Sin3p in a two-hybrid assay; part of a large protein complex with Sin3p and Stb1p; STB2 has a paralog, STB6, that arose from the whole genome duplication -S000035527 CDS YMR053C 13 382898 380346 C 2011-02-03 1996-07-31 -S000004658 ORF Verified YMR054W STV1 H(+)-transporting V0 sector ATPase subunit a chromosome 13 L000002139 13 383303 385975 W 2011-02-03 1996-07-31 Subunit a of the vacuolar-ATPase V0 domain; one of two isoforms (Stv1p and Vph1p); Stv1p is located in V-ATPase complexes of the Golgi and endosomes while Vph1p is located in V-ATPase complexes of the vacuole -S000035660 CDS YMR054W 13 383303 385975 W 2011-02-03 1996-07-31 -S000004659 ORF Verified YMR055C BUB2 PAC7 chromosome 13 L000000197 13 387021 386101 C 2011-02-03 1996-07-31 Mitotic exit network regulator; forms GTPase-activating Bfa1p-Bub2p complex that binds Tem1p and spindle pole bodies, blocks cell cycle progression before anaphase in response to spindle and kinetochore damage -S000035699 CDS YMR055C 13 387021 386101 C 2011-02-03 1996-07-31 -S000004660 ORF Verified YMR056C AAC1 ADP/ATP carrier protein AAC1 chromosome 13 L000000003 13 388244 387315 C 2011-02-03 1996-07-31 Mitochondrial inner membrane ADP/ATP translocator; exchanges cytosolic ADP for mitochondrially synthesized ATP; phosphorylated; Aac1p is a minor isoform while Pet9p is the major ADP/ATP translocator; relocalizes from mitochondrion to cytoplasm upon DNA replication stress -S000036642 CDS YMR056C 13 388244 387315 C 2011-02-03 1996-07-31 -S000004661 ORF Dubious YMR057C chromosome 13 13 388730 388359 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF AAC1 -S000036707 CDS YMR057C 13 388730 388359 C 2011-02-03 1996-07-31 -S000004662 ORF Verified YMR058W FET3 ferroxidase FET3 chromosome 13 L000000610 13 388822 390732 W 2011-02-03 1996-07-31 Ferro-O2-oxidoreductase; multicopper oxidase that oxidizes ferrous (Fe2+) to ferric iron (Fe3+) for subsequent cellular uptake by transmembrane permease Ftr1p; required for high-affinity iron uptake and involved in mediating resistance to copper ion toxicity, belongs to class of integral membrane multicopper oxidases; protein abundance increases in response to DNA replication stress -S000036798 CDS YMR058W 13 388822 390732 W 2011-02-03 1996-07-31 -S000004663 ORF Verified YMR059W SEN15 chromosome 13 L000003972 13 391099 391485 W 2011-02-03 1996-07-31|2006-05-10 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface -S000036866 CDS YMR059W 13 391099 391485 W 2011-02-03 1996-07-31|2006-05-10 -S000004664 ORF Verified YMR060C SAM37 SAM complex subunit SAM37|TOM37|PET3027|MAS37 chromosome 13 L000002841|L000003251 13 392515 391532 C 2011-02-03 1996-07-31 Component of the Sorting and Assembly Machinery (SAM) complex; the SAM (or TOB) complex is located in the mitochondrial outer membrane; binds precursors of beta-barrel proteins and facilitates their outer membrane insertion; contributes to SAM complex stability -S000037417 CDS YMR060C 13 392515 391532 C 2011-02-03 1996-07-31 -S000004665 ORF Verified YMR061W RNA14 cleavage polyadenylation factor subunit RNA14 chromosome 13 L000001650 13 392755 394788 W 2011-02-03 1996-07-31 Component of the cleavage and polyadenylation factor I (CF I); CF 1, composed of the CF 1A complex (Rna14p, Rna15p, Clp1p, Pcf11p) and Hrp1, is involved in cleavage and polyadenylation of mRNA 3' ends; bridges interaction between Rna15p and Hrp1p in the CF I complex; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay; required for gene looping and maintenance of genome stability; relocalizes to the cytosol in response to hypoxia -S000037628 CDS YMR061W 13 392755 394788 W 2011-02-03 1996-07-31 -S000004666 ORF Verified YMR062C ARG7 glutamate N-acetyltransferase|ECM40 chromosome 13 L000003528 13 396379 395054 C 2011-02-03 1996-07-31 Mitochondrial ornithine acetyltransferase; catalyzes the fifth step in arginine biosynthesis; also possesses acetylglutamate synthase activity, regenerates acetylglutamate while forming ornithine -S000037657 CDS YMR062C 13 396379 395054 C 2011-02-03 1996-07-31 -S000004667 ORF Verified YMR063W RIM9 chromosome 13 L000003427 13 397077 397796 W 2011-02-03 1996-07-31 Plasma membrane protein of unknown function; involved in the proteolytic activation of Rim101p in response to alkaline pH; interacts with Rim21p and Dfg16p to form a pH-sensing complex in the Rim101 pathway and is required to maintain Rim21p levels; has similarity to A. nidulans PalI; -S000030541 CDS YMR063W 13 397077 397796 W 2011-02-03 1996-07-31 -S000004668 ORF Verified YMR064W AEP1 NCA1 chromosome 13 L000000053 13 397903 399459 W 2011-02-03 1996-07-31 Protein required for expression of the mitochondrial OLI1 gene; mitochondrial OLI1 gene encodes subunit 9 of F1-F0 ATP synthase -S000030637 CDS YMR064W 13 397903 399459 W 2011-02-03 1996-07-31 -S000004669 ORF Verified YMR065W KAR5 FIG3 chromosome 13 L000003315 13 399702 401216 W 2011-02-03 1996-07-31 Protein required for nuclear membrane fusion during karyogamy; localizes to the membrane with a soluble portion in the endoplasmic reticulum lumen, may form a complex with Jem1p and Kar2p; similar to zebrafish Brambleberry protein; expression of the gene is regulated by pheromone -S000031502 CDS YMR065W 13 399702 401216 W 2011-02-03 1996-07-31 -S000004670 ORF Verified YMR066W SOV1 chromosome 13 L000004620 13 401541 404237 W 2011-02-03 1996-07-31 Mitochondrial protein of unknown function -S000031589 CDS YMR066W 13 401541 404237 W 2011-02-03 1996-07-31 -S000004671 ORF Verified YMR067C UBX4 CUI1 chromosome 13 13 405573 404323 C 2011-02-03 1996-07-31 UBX domain-containing protein that interacts with Cdc48p; involved in degradation of polyubiquitinated proteins via the ERAD (ER-associated degradation) pathway; modulates the Cdc48p-Nplp-Ufd1p AAA ATPase complex during its role in delivery of misfolded proteins to the proteasome; protein abundance increases in response to DNA replication stress -S000031655 CDS YMR067C 13 405573 404323 C 2011-02-03 1996-07-31 -S000004672 ORF Verified YMR068W AVO2 chromosome 13 13 406304 407584 W 2011-02-03 1996-07-31 Component of a complex containing the Tor2p kinase and other proteins; complex may have a role in regulation of cell growth -S000031807 CDS YMR068W 13 406304 407584 W 2011-02-03 1996-07-31 -S000004673 ORF Verified YMR069W NAT4 NAA40 chromosome 13 13 407709 408566 W 2011-02-03 1996-07-31 N alpha-acetyl-transferase; involved in acetylation of the N-terminal residues of histones H4 and H2A -S000032728 CDS YMR069W 13 407709 408566 W 2011-02-03 1996-07-31 -S000004674 ORF Verified YMR070W MOT3 [MOT3]|[MOT3+]|ROX7 chromosome 13 L000002675 13 409154 410626 W 43 2011-02-03 1996-07-31 Transcriptional repressor, activator; role in cellular adjustment to osmotic stress including modulation of mating efficiency; involved in repression of subset of hypoxic genes by Rox1p, repression of several DAN/TIR genes during aerobic growth, ergosterol biosynthetic genes in response to hyperosmotic stress; contributes to recruitment of Tup1p-Cyc8p general repressor to promoters; relocalizes to cytosol under hypoxia; forms [MOT3+] prion under anaerobic conditions -S000032777 CDS YMR070W 13 409154 410626 W 2011-02-03 1996-07-31 -S000004675 ORF Verified YMR071C TVP18 chromosome 13 13 411265 410762 C 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p; may interact with ribosomes, based on co-purification experiments; may have a role in intracellular sterol transport -S000032836 CDS YMR071C 13 411265 410762 C 2011-02-03 1996-07-31 -S000004676 ORF Verified YMR072W ABF2 DNA-binding protein ABF2|mtTFA|HM|p19 chromosome 13 L000000012 13 411569 412120 W 2011-02-03 1996-07-31 Mitochondrial DNA-binding protein; involved in mitochondrial DNA replication and recombination, member of HMG1 DNA-binding protein family; activity may be regulated by protein kinase A phosphorylation; ABF2 has a paralog, IXR1, that arose from the whole genome duplication; human homolog TFAM can complement yeast abf2 mutant, rescuing the loss-of-mitochondrial DNA phenotype in a yeast abf2 strain -S000033599 CDS YMR072W 13 411569 412120 W 2011-02-03 1996-07-31 -S000004677 ORF Verified YMR073C IRC21 chromosome 13 13 412873 412268 C 2011-02-03 1996-07-31 Protein of unknown function; may be involved in resistance to carboplatin and cisplatin; null mutant displays increase in spontaneous Rad52p foci; contains a lipid-binding domain and binds cardiolipin in a large-scale study -S000033642 CDS YMR073C 13 412873 412268 C 2011-02-03 1996-07-31 -S000004678 ORF Verified YMR074C SDD2 chromosome 13 13 413473 413036 C 2011-02-03 1996-07-31 Protein with homology to human PDCD5; PDCD5 is involved in programmed cell death; N-terminal region forms a conserved triple-helix bundle structure; overproduction suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P; overexpression promotes H2O2-induced apoptosis; YMR074C is not an essential gene; protein abundance increases in response to DNA replication stress -S000033760 CDS YMR074C 13 413473 413036 C 2011-02-03 1996-07-31 -S000004680 ORF Verified YMR075W RCO1 chromosome 13 13 413982 416036 W 2011-02-03 1996-07-31 Essential component of the Rpd3S histone deacetylase complex; interacts with Eaf3p -S000034738 CDS YMR075W 13 413982 416036 W 2011-02-03 1996-07-31 -S000004679 ORF Dubious YMR075C-A chromosome 13 13 416053 415688 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF RCO1/YMR075W -S000033031 CDS YMR075C-A 13 416053 415688 C 2011-02-03 1996-07-31 -S000004681 ORF Verified YMR076C PDS5 chromosome 13 L000003047 13 420029 416196 C 2011-02-03 1996-07-31 Cohesion maintenance factor; involved in sister chromatid condensation and cohesion; colocalizes with cohesin on chromosomes; performs its cohesin maintenance function in pre-anaphase cells by protecting the integrity of the cohesion complex; also required during meiosis; relocalizes to the cytosol in response to hypoxia -S000034790 CDS YMR076C 13 420029 416196 C 2011-02-03 1996-07-31 -S000006764 tRNA_gene tV(AAC)M2 chromosome 13 L000003679 13 420661 420588 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000030020 noncoding_exon tV(AAC)M2 13 420661 420588 C 2011-02-03 2000-05-19 -S000004682 ORF Verified YMR077C VPS20 ESCRT-III subunit protein VPS20|VPL10|VPT20|CHM6 chromosome 13 13 422149 421484 C 2011-02-03 1996-07-31 Myristoylated subunit of the ESCRT-III complex; the endosomal sorting complex required for transport of transmembrane proteins into the multivesicular body pathway to the lysosomal/vacuolar lumen; cytoplasmic protein recruited to endosomal membranes -S000034931 CDS YMR077C 13 422149 421484 C 2011-02-03 1996-07-31 -S000004683 ORF Verified YMR078C CTF18 CHL12 chromosome 13 L000000431|L000000325 13 424728 422503 C 2011-02-03 1996-07-31 Subunit of a complex with Ctf8p; shares some subunits with Replication Factor C and is required for sister chromatid cohesion; may have overlapping functions with Rad24p in the DNA damage replication checkpoint -S000035849 CDS YMR078C 13 424728 422503 C 2011-02-03 1996-07-31 -S000004684 ORF Verified YMR079W SEC14 phosphatidylinositol/phosphatidylcholine transfer protein SEC14|PIT1 chromosome 13 L000001839 13 424989 426059 W 2011-02-03 1996-07-31 Phosphatidylinositol/phosphatidylcholine transfer protein; involved in regulating PtdIns, PtdCho, and ceramide metabolism, products of which regulate intracellular transport and UPR; has a role in localization of lipid raft proteins; functionally homologous to mammalian PITPs; SEC14 has a paralog, YKL091C, that arose from the whole genome duplication -S000036083 CDS YMR079W 13 424989 424997 W 2011-02-03 1996-07-31 -S000036084 CDS YMR079W 13 425154 426059 W 2011-02-03 1996-07-31 -S000036085 intron YMR079W 13 424998 425153 W 2011-02-03 1996-07-31 -S000004685 ORF Verified YMR080C NAM7 SUT2|ATP-dependent RNA helicase NAM7|SUP113|UPF1|MOF4|IFS2 chromosome 13 L000002429|S000029550|L000002232 13 429627 426712 C 60 2011-02-03 1996-07-31 ATP-dependent RNA helicase of the SFI superfamily; involved in nonsense mediated mRNA decay; required for efficient translation termination at nonsense codons and targeting of NMD substrates to P-bodies; binds to the small ribosomal subunit via an interaction with Rps26; forms cytoplasmic foci upon DNA replication stress -S000036887 CDS YMR080C 13 429627 426712 C 2011-02-03 1996-07-31 -S000004686 ORF Verified YMR081C ISF1 MBR3 chromosome 13 L000001034 13 431095 430079 C 2011-02-03 1996-07-31 Serine-rich, hydrophilic protein; overexpression suppresses growth defects of hap2, hap3, and hap4 mutants; expression is under glucose control; cotranscribed with NAM7 in a cyp1 mutant; ISF1 has a paralog, MBR1, that arose from the whole genome duplication -S000036954 CDS YMR081C 13 431095 430079 C 2011-02-03 1996-07-31 -S000004687 ORF Uncharacterized YMR082C chromosome 13 13 432125 431769 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR082C is not an essential gene -S000037719 CDS YMR082C 13 432125 431769 C 2011-02-03 1996-07-31 -S000004688 ORF Verified YMR083W ADH3 alcohol dehydrogenase ADH3 chromosome 13 L000000043 13 434788 435915 W 45 2011-02-03 1996-07-31 Mitochondrial alcohol dehydrogenase isozyme III; involved in the shuttling of mitochondrial NADH to the cytosol under anaerobic conditions and ethanol production -S000037845 CDS YMR083W 13 434788 435915 W 2011-02-03 1996-07-31 -S000004689 ORF Uncharacterized YMR084W putative glutamine--fructose-6-phosphate transaminase chromosome 13 13 436628 437416 W 2011-02-03 1996-07-31 Putative protein of unknown function; YMR084W and adjacent ORF YMR085W are merged in related strains, and together are paralogous to glutamine-fructose-6-phosphate amidotransferase GFA1 -S000030786 CDS YMR084W 13 436628 437416 W 2011-02-03 1996-07-31 -S000004690 ORF Uncharacterized YMR085W chromosome 13 13 437491 438789 W 2011-02-03 1996-07-31 Putative protein of unknown function; YMR085W and adjacent ORF YMR084W are merged in related strains, and together are paralogous to glutamine-fructose-6-phosphate amidotransferase GFA1 -S000030871 CDS YMR085W 13 437491 438789 W 2011-02-03 1996-07-31 -S000004692 ORF Verified YMR086W SEG1 chromosome 13 13 439208 442090 W 2011-02-03 1996-07-31 Component of eisosome required for proper eisosome assembly; precedes Pil1p/Lsp1p during eisosome formation, controls eisosome length and shape; diffusely distributed, forms heterogeneous patches at plasma membrane in small buds, also found in medium and large buds; expression repressed by cAMP; similar to A. gossypii SEG gene and to S. pombe Sle1p, important for generating eisosomes; SEG1 has a paralog, SEG2, that arose from the whole genome duplication -S000030930 CDS YMR086W 13 439208 442090 W 2011-02-03 1996-07-31 -S000004691 ORF Dubious YMR086C-A chromosome 13 13 442364 442026 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037663 CDS YMR086C-A 13 442364 442026 C 2011-02-03 1996-07-31 -S000004693 ORF Verified YMR087W putative ADP-ribose 1''-phosphate phosphatase chromosome 13 S000154613 13 442527 443381 W 2011-02-03 1996-07-31 Putative ADP-ribose-1''-monophosphatase; converts ADP-ribose-1''-monophosphate to ADP-ribose; may have a role in tRNA splicing; contains an A1pp domain -S000031010 CDS YMR087W 13 442527 443381 W 2011-02-03 1996-07-31 -S000004694 ORF Verified YMR088C VBA1 chromosome 13 13 445102 443414 C 2011-02-03 1996-07-31 Permease of basic amino acids in the vacuolar membrane -S000031056 CDS YMR088C 13 445102 443414 C 2011-02-03 1996-07-31 -S000004695 ORF Verified YMR089C YTA12 m-AAA protease subunit YTA12|RCA1 chromosome 13 L000001591|L000002564 13 448086 445609 C 2011-02-03 1996-07-31 Mitochondrial inner membrane m-AAA protease component; mediates degradation of misfolded or unassembled proteins; also required for correct assembly of mitochondrial enzyme complexes; overexpression of human AFG3L2 complements respiratory defect of yeast afg3 yta12 double null mutation, but overexpression of disease-associated AFG3L2 variants does not; expression of both human SPG7 (paraplegin) and AFG3L2 complements yeast yta12 afg3 double mutation -S000032008 CDS YMR089C 13 448086 445609 C 2011-02-03 1996-07-31 -S000004696 ORF Uncharacterized YMR090W chromosome 13 13 449245 449928 W 2011-02-03 1996-07-31 Putative protein of unknown function; similar to DTDP-glucose 4,6-dehydratases; GFP-fusion protein localizes to the cytoplasm; up-regulated in response to the fungicide mancozeb; not essential for viability -S000033126 CDS YMR090W 13 449245 449928 W 2011-02-03 1996-07-31 -S000004697 ORF Verified YMR091C NPL6 RSC7 chromosome 13 L000001272 13 451365 450058 C 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; interacts with Rsc3p, Rsc30p, Ldb7p, and Htl1p to form a module important for a broad range of RSC functions -S000033161 CDS YMR091C 13 451365 450058 C 2011-02-03 1996-07-31 -S000004698 ORF Verified YMR092C AIP1 chromosome 13 L000000069 13 453479 451632 C 2011-02-03 1996-07-31 Actin cortical patch component; interacts with the actin depolymerizing factor cofilin; inhibits elongation of aged ADP-actin filaments decorated with cofilin to maintain a high level of assembly-competent actin species; required to restrict cofilin localization to cortical patches; putative regulator of cytokinesis; contains WD repeats; protein increases in abundance and relocalizes from cytoplasm to plasma membrane upon DNA replication stress -S000033958 CDS YMR092C 13 453479 451632 C 2011-02-03 1996-07-31 -S000004699 ORF Verified YMR093W UTP15 snoRNA-binding rRNA-processing protein UTP15 chromosome 13 13 454015 455556 W 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA -S000034125 CDS YMR093W 13 454015 455556 W 2011-02-03 1996-07-31 -S000004700 ORF Verified YMR094W CTF13 CBF3C chromosome 13 L000000429 13 455825 457261 W 2011-02-03 1996-07-31 Subunit of the CBF3 complex; CBF3 binds to the CDE III element of centromeres, bending the DNA upon binding, and may be involved in sister chromatid cohesion during mitosis -S000034211 CDS YMR094W 13 455825 457261 W 2011-02-03 1996-07-31 -S000004701 ORF Verified YMR095C SNO1 putative pyridoxal 5'-phosphate synthase chromosome 13 L000003451 13 457959 457285 C 2011-02-03 1996-07-31 Protein of unconfirmed function; involved in pyridoxine metabolism; expression is induced during stationary phase; forms a putative glutamine amidotransferase complex with Snz1p, with Sno1p serving as the glutaminase -S000035105 CDS YMR095C 13 457959 457285 C 2011-02-03 1996-07-31 -S000004702 ORF Verified YMR096W SNZ1 pyridoxine biosynthesis protein SNZ1 chromosome 13 L000002575 13 458408 459301 W 2011-02-03 1996-07-31 Protein involved in vitamin B6 biosynthesis; member of a stationary phase-induced gene family; coregulated with SNO1; interacts with Sno1p and with Yhr198p, perhaps as a multiprotein complex containing other Snz and Sno proteins -S000035303 CDS YMR096W 13 458408 459301 W 2011-02-03 1996-07-31 -S000004703 ORF Verified YMR097C MTG1 putative GTPase MTG1 chromosome 13 13 460527 459424 C 2011-02-03 1996-07-31 Putative GTPase peripheral to the mitochondrial inner membrane; essential for respiratory competence, likely functions in assembly of the large ribosomal subunit, has homologs in plants and animals -S000035321 CDS YMR097C 13 460527 459424 C 2011-02-03 1996-07-31 -S000004704 ORF Verified YMR098C ATP25 LRC4 chromosome 13 13 462609 460771 C 2011-02-03 1996-07-31 Mitochondrial protein required for the stability of Oli1p (Atp9p) mRNA; also required for the Oli1p ring formation; YMR098C is not an essential gene -S000035398 CDS YMR098C 13 462609 460771 C 2011-02-03 1996-07-31 -S000007114 long_terminal_repeat YMRCdelta13 chromosome 13 13 463461 463128 C 2011-02-03 2000-05-19 Ty1 LTR -S000006543 tRNA_gene tD(GUC)M chromosome 13 L000003670 13 463554 463625 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030421 noncoding_exon tD(GUC)M 13 463554 463625 W 2011-02-03 2000-05-19 -S000004705 ORF Verified YMR099C glucose-6-phosphate 1-epimerase chromosome 13 13 464827 463934 C 2011-02-03 1996-07-31 Glucose-6-phosphate 1-epimerase (hexose-6-phosphate mutarotase); likely involved in carbohydrate metabolism; GFP-fusion protein localizes to both the nucleus and cytoplasm and is induced in response to the DNA-damaging agent MMS -S000035458 CDS YMR099C 13 464827 463934 C 2011-02-03 1996-07-31 -S000004706 ORF Verified YMR100W MUB1 chromosome 13 L000004359 13 466300 468162 W 2011-02-03 1996-07-31 MYND domain-containing protein; component of the Mub1p-Ubr2p-Rad6p ubiquitin ligase complex, required for ubiquitination and degradation of Rpn4p; interacts with Ubr2p (E3) and indirectly with Rad6p (E2); short-lived protein degraded in a Ubr2p/Rad6p dependent manner; proposed to function as both a partner and substrate of the Ubr2p/Rad6p ubiquitin ligase; similar to the A. nidulans samB gene -S000032955 CDS YMR100W 13 466300 468162 W 2011-02-03 1996-07-31 -S000118372 ARS ARS1316 ARSXIII-468 chromosome 13 13 468179 468469 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178157 ARS_consensus_sequence ARS1316 13 468236 468252 W 2014-11-18 2014-11-18 -S000004707 ORF Verified YMR101C SRT1 ditrans,polycis-polyprenyl diphosphate synthase chromosome 13 L000004878 13 469476 468445 C 2011-02-03 1996-07-31 Forms the dehydrodolichyl diphosphate syntase (DDS) complex with NUS1; involved in synthesis of long-chain dolichols (19-22 isoprene units; as opposed to Rer2p which synthesizes shorter-chain dolichols); localizes to lipid bodies; transcription is induced during stationary phase -S000032988 CDS YMR101C 13 469476 468445 C 2011-02-03 1996-07-31 -S000004708 ORF Uncharacterized YMR102C chromosome 13 13 472352 469848 C 2011-02-03 1996-07-31 Protein of unknown function; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance; mutant shows increased resistance to azoles; not an essential gene; YMR102C has a paralog, DGR2, that arose from the whole genome duplication -S000033083 CDS YMR102C 13 472352 469848 C 2011-02-03 1996-07-31 -S000004709 ORF Uncharacterized YMR103C chromosome 13 13 473264 472902 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR103C is not an essential gene -S000033841 CDS YMR103C 13 473264 472902 C 2011-02-03 1996-07-31 -S000004710 ORF Verified YMR104C YPK2 putative protein kinase YPK2|YKR2 chromosome 13 L000002542 13 475453 473420 C 2011-02-03 1996-07-31 Protein kinase similar to S/T protein kinase Ypk1p; functionally redundant with YPK1 at the genetic level; participates in a signaling pathway required for optimal cell wall integrity; involved in the TORC-dependent phosphorylation of ribosomal proteins Rps6a/b (S6); human homolog SGK2 can complement a ypk1 ypk2 double mutant -S000033988 CDS YMR104C 13 475453 473420 C 2011-02-03 1996-07-31 -S000004711 ORF Verified YMR105C PGM2 phosphoglucomutase PGM2|GAL5 chromosome 13 L000001413 13 477606 475897 C 2011-02-03 1996-07-31 Phosphoglucomutase; catalyzes the conversion from glucose-1-phosphate to glucose-6-phosphate, which is a key step in hexose metabolism; functions as the acceptor for a Glc-phosphotransferase; protein abundance increases in response to DNA replication stress; PGM2 has a paralog, PGM1, that arose from the whole genome duplication -S000034889 CDS YMR105C 13 477606 475897 C 2011-02-03 1996-07-31 -S000130188 ARS ARS1317 chromosome 13 13 477606 478301 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028692 ORF Uncharacterized YMR105W-A chromosome 13 13 478064 478258 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000032592 CDS YMR105W-A 13 478064 478258 W 2011-02-03 2003-07-29 -S000004712 ORF Verified YMR106C YKU80 ATP-dependent DNA helicase YKU80|HDF2 chromosome 13 L000004089 13 480190 478301 C 2011-02-03 1996-07-31 Subunit of telomeric Ku complex (Yku70p-Yku80p); involved in telomere length maintenance, structure and telomere position effect; required for localization of telomerase ribonucleoprotein via interaction with TLC1 guide RNA; relocates to sites of double-strand cleavage to promote nonhomologous end joining during DSB repair; colocalizes with quiescent cell telomere hyperclusters -S000035040 CDS YMR106C 13 480190 478301 C 2011-02-03 1996-07-31 -S000006627 tRNA_gene tK(CUU)M chromosome 13 L000003678 13 480693 480621 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000036046 noncoding_exon tK(CUU)M 13 480693 480621 C 2011-02-03 2000-05-19 -S000007115 long_terminal_repeat YMRCdelta14 chromosome 13 13 481547 481214 C 2011-02-03 2000-05-19 Ty1 LTR -S000007122 long_terminal_repeat YMRWdelta15 chromosome 13 13 481571 481808 W 2011-02-03 2000-05-19 Ty1 LTR -S000004713 ORF Verified YMR107W SPG4 chromosome 13 13 483014 483361 W 2011-02-03 1996-07-31 Protein required for high temperature survival during stationary phase; not required for growth on nonfermentable carbon sources -S000035284 CDS YMR107W 13 483014 483361 W 2011-02-03 1996-07-31 -S000004714 ORF Verified YMR108W ILV2 acetolactate synthase catalytic subunit|THI1|SMR1 chromosome 13 L000002296|L000002515|L000000858 13 484084 486147 W 66 2011-02-03 1996-07-31 Acetolactate synthase; catalyses the first common step in isoleucine and valine biosynthesis and is the target of several classes of inhibitors, localizes to the mitochondria; expression of the gene is under general amino acid control -S000036218 CDS YMR108W 13 484084 486147 W 2011-02-03 1996-07-31 -S000004715 ORF Verified YMR109W MYO5 myosin 5 chromosome 13 L000002935 13 486587 490246 W 2011-02-03 1996-07-31 One of two type I myosin motors; contains proline-rich tail homology 2 (TH2) and SH3 domains; MYO5 deletion has little effect on growth, but myo3 myo5 double deletion causes severe defects in growth and actin cytoskeleton organization; MYO5 has a paralog, MYO3, that arose from the whole genome duplication -S000036305 CDS YMR109W 13 486587 490246 W 2011-02-03 1996-07-31 -S000004716 ORF Verified YMR110C HFD1 hexadecenal dehydrogenase chromosome 13 13 491992 490394 C 2011-02-03 1996-07-31 Dehydrogenase involved in ubiquinone and sphingolipid metabolism; oxidizes 4-hydroxybenzaldehyde into 4-hydroxybenzoic acid in ubiquinone biosynthesis; converts hexadecenal to hexadecenoic acid in sphingosine 1-phosphate breakdown pathway; located in the mitochondrial outer membrane and also in lipid particles; human homolog ALDH3A2, a fatty aldehyde dehydrogenase (FALDH) mutated in neurocutaneous disorder Sjogren-Larsson syndrome, can complement yeast hfd1 mutant -S000037194 CDS YMR110C 13 491992 490394 C 2011-02-03 1996-07-31 -S000004717 ORF Verified YMR111C chromosome 13 13 493792 492404 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; YMR111C is not an essential gene; forms nuclear foci upon DNA replication stress -S000037278 CDS YMR111C 13 493792 492404 C 2011-02-03 1996-07-31 -S000004718 ORF Verified YMR112C MED11 chromosome 13 L000004634 13 494495 494100 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential protein -S000029941 CDS YMR112C 13 494495 494100 C 2011-02-03 1996-07-31 -S000004719 ORF Verified YMR113W FOL3 dihydrofolate synthase chromosome 13 13 494999 496282 W 2011-02-03 1996-07-31 Dihydrofolate synthetase, involved in folic acid biosynthesis; catalyzes conversion of dihydropteroate to dihydrofolate in folate coenzyme biosynthesis; FOL3 has a paralog, RMA1, that arose from the whole genome duplication -S000030131 CDS YMR113W 13 494999 496282 W 2011-02-03 1996-07-31 -S000004720 ORF Verified YMR114C putative peptide hydrolase chromosome 13 13 497449 496343 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and cytoplasm; YMR114C is not an essential gene -S000030240 CDS YMR114C 13 497449 496343 C 2011-02-03 1996-07-31 -S000004721 ORF Verified YMR115W MGR3 FMP24 chromosome 13 13 497704 499209 W 2011-02-03 1996-07-31 Subunit of the mitochondrial (mt) i-AAA protease supercomplex; i-AAA degrades misfolded mitochondrial proteins; forms a subcomplex with Mgr1p that binds to substrates to facilitate proteolysis; required for growth of cells lacking mtDNA -S000031261 CDS YMR115W 13 497704 499209 W 2011-02-03 1996-07-31 -S000007501 snoRNA_gene snR24 SNR24 U24 chromosome 13 L000002911 13 500072 499984 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); commonly referred to as U24; guides 2'-O-methylation of large subunit (LSU) rRNA at positions C1437, C1449, and C1450 -S000036664 noncoding_exon snR24 13 500072 499984 C 2011-02-03 2000-05-19 -S000004722 ORF Verified YMR116C ASC1 RACK1|guanine nucleotide-binding protein subunit beta|ASU9|NAD1|CPC2 chromosome 13 L000003529|L000000135|S000029045 13 500688 499456 C 2011-02-03 1996-07-31 G-protein beta subunit and guanine dissociation inhibitor for Gpa2p; ortholog of RACK1 that inhibits translation; core component of the small (40S) ribosomal subunit; required to prevent frameshifting at ribosomes stalled at repeated CGA codons; regulates P-body formation induced by replication stress; represses Gcn4p in the absence of amino acid starvation -S000031294 CDS YMR116C 13 499878 499456 C 2011-02-03 1996-07-31 -S000031293 CDS YMR116C 13 500688 500152 C 2011-02-03 1996-07-31 -S000031295 intron YMR116C 13 500151 499879 C 2011-02-03 1996-07-31 -S000004723 ORF Verified YMR117C SPC24 kinetochore-associated Ndc80 complex subunit SPC24 chromosome 13 L000004694 13 501891 501250 C 2011-02-03 1996-07-31 Component of the kinetochore-associated Ndc80 complex; involved in chromosome segregation, spindle checkpoint activity, and kinetochore clustering; evolutionarily conserved; other members include Ndc80p, Nuf2p, Spc24p, and Spc25p -S000031427 CDS YMR117C 13 501891 501250 C 2011-02-03 1996-07-31 -S000004724 ORF Uncharacterized YMR118C SHH3 protein SHH3 chromosome 13 13 502734 502144 C 2011-02-03 1996-07-31 Putative mitochondrial inner membrane protein of unknown function; although similar to paralogous Sdh3p, Shh3p is not a stoichiometric subunit of either succinate dehydrogenase or of the TIM22 translocase; SHH3 has a paralog, SDH3, that arose from the whole genome duplication -S000032434 CDS YMR118C 13 502734 502144 C 2011-02-03 1996-07-31 -S000007123 long_terminal_repeat YMRWdelta16 chromosome 13 13 503192 503389 W 2011-02-03 2000-05-19 Ty1 LTR -S000130189 ARS ARS1319 chromosome 13 13 503389 503771 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000007128 long_terminal_repeat YMRWtau2 chromosome 13 13 503771 504141 W 2011-02-03 2000-05-19 Ty4 LTR -S000007124 long_terminal_repeat YMRWdelta17 chromosome 13 13 504346 504677 W 2011-02-03 2000-05-19 Ty1 LTR -S000006644 tRNA_gene tL(CAA)M chromosome 13 L000003671 13 504895 505008 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000033800 intron tL(CAA)M 13 504933 504964 W 2011-02-03 2000-05-19 -S000033798 noncoding_exon tL(CAA)M 13 504895 504932 W 2011-02-03 2000-05-19 -S000033799 noncoding_exon tL(CAA)M 13 504965 505008 W 2011-02-03 2000-05-19 -S000004725 ORF Verified YMR119W ASI1 putative ubiquitin-protein ligase ASI1 chromosome 13 13 505333 507207 W 2011-02-03 1996-07-31 Subunit of the inner nuclear membrane Asi ubiquitin ligase complex; the Asi complex targets both misfolded proteins of the inner nuclear membrane-associated degradation (INMAD) pathway and regulators of sterol biosynthesis for ubiquitin-mediated degradation; acts with Asi2p and Asi3p to ensure the fidelity of SPS-sensor signaling by targeting latent unprocessed forms of Stp1p and Stp2p, maintaining the repressed state of gene expression in the absence of inducing amino acids -S000032577 CDS YMR119W 13 505333 507207 W 2011-02-03 1996-07-31 -S000004726 ORF Dubious YMR119W-A chromosome 13 13 506996 507370 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 3' end of ORF ASI1/YMR119W -S000037793 CDS YMR119W-A 13 506996 507370 W 2011-02-03 1996-07-31 -S000004727 ORF Verified YMR120C ADE17 bifunctional phosphoribosylaminoimidazolecarboxamide formyltransferase/IMP cyclohydrolase ADE17 chromosome 13 L000003306 13 509280 507502 C 2011-02-03 1996-07-31 Enzyme of 'de novo' purine biosynthesis; contains both 5-aminoimidazole-4-carboxamide ribonucleotide transformylase and inosine monophosphate cyclohydrolase activities; ADE17 has a paralog, ADE16, that arose from the whole genome duplication; ade16 ade17 mutants require adenine and histidine -S000033275 CDS YMR120C 13 509280 507502 C 2011-02-03 1996-07-31 -S000004728 ORF Verified YMR121C RPL15B eL15|ribosomal 60S subunit protein L15B|L15e|rp15R|YL10|L15B|L13B chromosome 13 L000004456 13 510348 509734 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L15B; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L15, no bacterial homolog; RPL15B has a paralog, RPL15A, that arose from the whole genome duplication; relocalizes from nucleus to nucleolus upon DNA replication stress -S000033342 CDS YMR121C 13 510348 509734 C 2011-02-03 1996-07-31 -S000004729 ORF Uncharacterized YMR122C chromosome 13 13 511075 510701 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR122C is not an essential gene -S000033409 CDS YMR122C 13 511075 510701 C 2011-02-03 1996-07-31 -S000007524 ORF Uncharacterized YMR122W-A chromosome 13 13 511315 511569 W 2011-02-03 2000-07-14 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and endoplasmic reticulum -S000037063 CDS YMR122W-A 13 511315 511569 W 2011-02-03 2000-07-14 -S000004730 ORF Verified YMR123W PKR1 chromosome 13 13 513593 513961 W 2011-02-03 1996-07-31 V-ATPase assembly factor; functions with other V-ATPase assembly factors in the ER to efficiently assemble the V-ATPase membrane sector (V0); protein abundance increases in response to DNA replication stress -S000034386 CDS YMR123W 13 513593 513961 W 2011-02-03 1996-07-31 -S000004731 ORF Verified YMR124W EPO1 chromosome 13 13 514456 517287 W 2011-02-03 1996-07-31 Protein involved in septin-ER tethering; interacts with ER membrane protein, Scs2p, and Shs1p, a septin ring component, at bud neck to create ER diffusion barrier; GFP-fusion protein localizes to the cell periphery, cytoplasm, bud, and bud neck; interacts with Crm1p in two-hybrid assay; YMR124W has a paralog, YLR031W, that arose from the whole genome duplication -S000034454 CDS YMR124W 13 514456 517287 W 2011-02-03 1996-07-31 -S000004732 ORF Verified YMR125W STO1 SUT1|CBP80|GCR3|CBC1 chromosome 13 L000002131 13 517539 520446 W 87 2011-02-03 1999-11-17|1996-07-31 Large subunit of the nuclear mRNA cap-binding protein complex; interacts with Npl3p to carry nuclear poly(A)+ mRNA to cytoplasm; also involved in nuclear mRNA degradation and telomere maintenance; orthologous to mammalian CBP80 -S000035482 CDS YMR125W 13 517539 517563 W 2011-02-03 1999-11-17|1996-07-31 -S000035483 CDS YMR125W 13 517886 520446 W 2011-02-03 1999-11-17 -S000035484 intron YMR125W 13 517564 517885 W 2011-02-03 1999-11-17 -S000004733 ORF Uncharacterized YMR126C DLT1 chromosome 13 13 521789 520761 C 2011-02-03 1996-07-31 Protein of unknown function; mutant sensitive to 6-azauracil (6AU) and mycophenolic acid (MPA) -S000035540 CDS YMR126C 13 521789 520761 C 2011-02-03 1996-07-31 -S000004734 ORF Verified YMR127C SAS2 KAT8 chromosome 13 L000001802 13 523345 522329 C 2011-02-03 1996-07-31 Histone acetyltransferase (HAT) catalytic subunit of the SAS complex; acetylates free histones and nucleosomes and regulates transcriptional silencing; member of the MYSTacetyltransferase family; other members are Sas4p and Sas5p -S000035616 CDS YMR127C 13 523345 522329 C 2011-02-03 1996-07-31 -S000004735 ORF Verified YMR128W ECM16 ATP-dependent RNA helicase ECM16|DHR1 chromosome 13 L000003891 13 523696 527499 W 2011-02-03 1996-07-31 Essential DEAH-box ATP-dependent RNA helicase specific to U3 snoRNP; predominantly nucleolar in distribution; required for 18S rRNA synthesis -S000035779 CDS YMR128W 13 523696 527499 W 2011-02-03 1996-07-31 -S000004736 ORF Verified YMR129W POM152 chromosome 13 L000001464 13 527804 531817 W 2011-02-03 1996-07-31 Glycoprotein subunit of transmembrane ring of nuclear pore complex; contributes to nucleocytoplasmic transport, nuclear pore complex (NPC) biogenesis and spindle pole body duplication; homologous to human NUP210 -S000036687 CDS YMR129W 13 527804 531817 W 2011-02-03 1996-07-31 -S000004737 ORF Uncharacterized YMR130W chromosome 13 13 532119 533027 W 2011-02-03 1996-07-31 Putative protein of unknown function; YMR130W is not an essential gene -S000036551 CDS YMR130W 13 532119 533027 W 2011-02-03 1996-07-31 -S000004738 ORF Verified YMR131C RRB1 ribosome biosynthesis protein RRB1 chromosome 13 13 534698 533163 C 2011-02-03 1996-07-31 Specific chaperone for ribosomal protein Rpl3p; binds to nascent Rpl3p during translation; essential gene -S000036599 CDS YMR131C 13 534698 533163 C 2011-02-03 1996-07-31 -S000004739 ORF Uncharacterized YMR132C JLP2 chromosome 13 13 535570 534944 C 2011-02-03 1996-07-31 Protein of unknown function; contains sequence that closely resembles a J domain (typified by the E. coli DnaJ protein) -S000036706 CDS YMR132C 13 535570 534944 C 2011-02-03 1996-07-31 -S000118373 ARS ARS1320 ARSXIII-536 chromosome 13 13 535597 535844 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178158 ARS_consensus_sequence ARS1320 13 535770 535754 C 2014-11-18 2014-11-18 -S000004740 ORF Verified YMR133W REC114 chromosome 13 L000001607 13 536207 537609 W 91 2011-02-03 1999-07-17|1996-07-31 Protein involved in early stages of meiotic recombination; possibly involved in the coordination of recombination and meiotic division; mutations lead to premature initiation of the first meiotic division -S000037485 CDS YMR133W 13 536207 537448 W 2011-02-03 1999-07-17|1996-07-31 -S000037486 CDS YMR133W 13 537565 537609 W 2011-02-03 1999-07-17 -S000037487 intron YMR133W 13 537449 537564 W 2011-02-03 1999-07-17 -S000004741 ORF Verified YMR134W ERG29 chromosome 13 13 537838 538551 W 2011-02-03 1996-07-31 Protein of unknown function involved in ergosterol biosynthesis; conditional mutants produce less ergosterol, display impaired oxygen consumption, respiratory growth, mitochondrial iron utilization, and are more sensitive to oxidative stress; mutant bm-8 has a growth defect on iron-limited medium that is complemented by overexpression of Yfh1p; protein localizes to the cytoplasm, ER and nuclear envelope; highly conserved in ascomycetes -S000037629 CDS YMR134W 13 537838 538551 W 2011-02-03 1996-07-31 -S000004743 ORF Dubious YMR135W-A chromosome 13 13 539911 540444 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036832 CDS YMR135W-A 13 539911 540444 W 2011-02-03 1996-07-31 -S000004742 ORF Verified YMR135C GID8 glucose-induced degradation complex subunit GID8|DCR1 chromosome 13 13 540056 538689 C 2011-02-03 1996-07-31 Subunit of GID Complex, binds strongly to central component Vid30p; GID Complex is involved in proteasome-dependent catabolite inactivation of fructose-1,6-bisphosphatase; recruits Rmd5p, Fyv10 and Vid28p to GID Complex; contains LisH, CTLH, and CRA domains that mediate binding to Vid30p (LisH) and Rmd5p and Vid28p (CTLH and CRA); dosage-dependent regulator of START -S000030355 CDS YMR135C 13 540056 538689 C 2011-02-03 1996-07-31 -S000004744 ORF Verified YMR136W GAT2 chromosome 13 S000007443 13 541199 542881 W 2011-02-03 1996-07-31 Protein containing GATA family zinc finger motifs; similar to Gln3p and Dal80p; expression repressed by leucine -S000030544 CDS YMR136W 13 541199 542881 W 2011-02-03 1996-07-31 -S000130190 ARS ARS1321 chromosome 13 13 542881 542978 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004745 ORF Verified YMR137C PSO2 SNM1 chromosome 13 L000001953 13 544963 542978 C 2011-02-03 1996-07-31 Nuclease required for DNA single- and double-strand break repair; acts at a post-incision step in repair of breaks that result from interstrand cross-links produced by a variety of mono- and bi-functional psoralen derivatives; induced by UV-irradiation; forms nuclear foci upon DNA replication stress -S000030595 CDS YMR137C 13 544963 542978 C 2011-02-03 1996-07-31 -S000004746 ORF Verified YMR138W CIN4 Arf family GTPase CIN4|UGX1|GTP1 chromosome 13 L000000338 13 545155 545730 W 86 2011-02-03 1996-07-31 GTP-binding protein involved in beta-tubulin (Tub2p) folding; isolated as mutant with increased chromosome loss and sensitivity to benomyl; regulated by the GTPase-activating protein, Cin2p, the human retinitis pigmentosa 2 (RP2) homolog -S000031508 CDS YMR138W 13 545155 545730 W 2011-02-03 1996-07-31 -S000004747 ORF Verified YMR139W RIM11 serine/threonine protein kinase RIM11|MDS1|GSK3 chromosome 13 L000001056 13 546125 547237 W 2011-02-03 1996-07-31 Protein kinase; required for signal transduction during entry into meiosis; promotes the formation of the Ime1p-Ume6p complex by phosphorylating Ime1p and Ume6p; shares similarity with mammalian glycogen synthase kinase 3-beta; protein abundance increases in response to DNA replication stress; RIM11 has a paralog, MRK1, that arose from the whole genome duplication -S000031611 CDS YMR139W 13 546125 547237 W 2011-02-03 1996-07-31 -S000004748 ORF Verified YMR140W SIP5 chromosome 13 13 547714 549183 W 2011-02-03 1996-07-31 Protein of unknown function; interacts with both the Reg1p/Glc7p phosphatase and the Snf1p kinase; forms cytoplasmic foci upon DNA replication stress -S000031580 CDS YMR140W 13 547714 549183 W 2011-02-03 1996-07-31 -S000004749 ORF Uncharacterized YMR141C chromosome 13 13 550044 549736 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR141C is not an essential gene -S000031632 CDS YMR141C 13 550044 549736 C 2011-02-03 1996-07-31 -S000028575 ORF Dubious YMR141W-A chromosome 13 13 550911 551135 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene RPL13B/YMR142C -S000031304 CDS YMR141W-A 13 550911 551135 W 2011-02-03 2003-07-29 -S000004750 ORF Verified YMR142C RPL13B eL13|ribosomal 60S subunit protein L13B|L13e|L13B chromosome 13 L000004455 13 551207 550206 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L13B; not essential for viability; homologous to mammalian ribosomal protein L13, no bacterial homolog; RPL13B has a paralog, RPL13A, that arose from the whole genome duplication -S000032639 CDS YMR142C 13 550801 550206 C 2011-02-03 1996-07-31 -S000032638 CDS YMR142C 13 551207 551204 C 2011-02-03 1996-07-31 -S000032640 intron YMR142C 13 551203 550802 C 2011-02-03 1996-07-31 -S000004751 ORF Verified YMR143W RPS16A uS9|ribosomal 40S subunit protein S16A|S9|rp61R|S16A chromosome 13 L000004477 13 551928 552903 W 2011-02-03 2000-07-22|1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S16 and bacterial S9; RPS16A has a paralog, RPS16B, that arose from the whole genome duplication -S000032779 CDS YMR143W 13 551928 551951 W 2011-02-03 2000-07-22|1996-07-31 -S000032780 CDS YMR143W 13 552496 552903 W 2011-02-03 1996-07-31 -S000032781 intron YMR143W 13 551952 552495 W 2011-02-03 2000-07-22|1996-07-31 -S000004752 ORF Uncharacterized YMR144W FDO1 chromosome 13 13 553362 554390 W 2011-02-03 1996-07-31 Protein involved in directionality of mating type switching; acts with Fkh1p to control which donor mating-type locus is inserted into MAT locus during mating type switching; localized to the nucleus; not an essential gene -S000033505 CDS YMR144W 13 553362 554390 W 2011-02-03 1996-07-31 -S000130191 ARS ARS1322 chromosome 13 13 553422 554331 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004753 ORF Verified YMR145C NDE1 NADH-ubiquinone reductase (H(+)-translocating) NDE1|NDH1 chromosome 13 13 556475 554793 C 2011-02-03 1996-07-31 Mitochondrial external NADH dehydrogenase; type II NAD(P)H:quinone oxidoreductase that catalyzes the oxidation of cytosolic NADH; Nde1p and Nde2p provide cytosolic NADH to the mitochondrial respiratory chain; NDE1 has a paralog, NDE2, that arose from the whole genome duplication -S000033554 CDS YMR145C 13 556475 554793 C 2011-02-03 1996-07-31 -S000004754 ORF Verified YMR146C TIF34 translation initiation factor eIF3 subunit i chromosome 13 L000003329 13 558524 557481 C 2011-02-03 1996-07-31 eIF3i subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; essential for translation; stimulates rate of ribosomal scanning during translation reinitiation; eIF3 is also involved in programmed stop codon readthrough -S000033644 CDS YMR146C 13 558524 557481 C 2011-02-03 1996-07-31 -S000004755 ORF Uncharacterized YMR147W chromosome 13 13 559199 559870 W 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cell periphery -S000033833 CDS YMR147W 13 559199 559870 W 2011-02-03 1996-07-31 -S000004756 ORF Verified YMR148W OSW5 chromosome 13 13 560366 560812 W 2011-02-03 1996-07-31 Protein of unknown function with possible role in spore wall assembly; predicted to contain an N-terminal transmembrane domain; osw5 null mutant spores exhibit increased spore wall permeability and sensitivity to beta-glucanase digestion -S000034741 CDS YMR148W 13 560366 560812 W 2011-02-03 1996-07-31 -S000004757 ORF Verified YMR149W SWP1 dolichyl-diphosphooligosaccharide-protein glycotransferase chromosome 13 L000002255 13 560996 561856 W 2011-02-03 1996-07-31 Delta subunit of the oligosaccharyl transferase glycoprotein complex; complex is required for N-linked glycosylation of proteins in the endoplasmic reticulum -S000034875 CDS YMR149W 13 560996 561856 W 2011-02-03 1996-07-31 -S000004759 ORF Dubious YMR151W YIM2 chromosome 13 L000002672 13 562506 562943 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 5% of ORF overlaps the verified gene IMP1 -S000036792 CDS YMR151W 13 562506 562943 W 2011-02-03 1996-07-31 -S000004758 ORF Verified YMR150C IMP1 endopeptidase catalytic subunit IMP1|PET-TS2858 chromosome 13 L000000864 13 562528 561956 C 92 2011-02-03 1996-07-31 Catalytic subunit of mitochondrial inner membrane peptidase complex; required for maturation of mitochondrial proteins of the intermembrane space; complex contains two catalytic subunits (Imp1p and Imp2p that differ in substrate specificty) and Som1p -S000035827 CDS YMR150C 13 562528 561956 C 2011-02-03 1996-07-31 -S000004760 ORF Verified YMR152W YIM1 chromosome 13 L000002671 13 563096 564193 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays sensitivity to DNA damaging agents; may have a role in lipid metabolism, based on localization to lipid droplets; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress -S000036879 CDS YMR152W 13 563096 564193 W 2011-02-03 1996-07-31 -S000004762 ORF Verified YMR153W NUP53 FG-nucleoporin NUP53 chromosome 13 13 564435 565862 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of nuclear pore complex (NPC); also part of the NPC nuclear basket; contributes directly to nucleocytoplasmic transport; involved in regulation of transcription and mitosis; induces membrane tubulation, which may contribute to nuclear pore assembly; NUP53 has a paralog, ASM4, that arose from the whole genome duplication -S000036930 CDS YMR153W 13 564435 565862 W 2011-02-03 1996-07-31 -S000004761 ORF Dubious YMR153C-A chromosome 13 13 565909 565574 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 3' end of verified gene NUP53/YMR153W -S000036598 CDS YMR153C-A 13 565909 565574 C 2011-02-03 1996-07-31 -S000004763 ORF Verified YMR154C RIM13 CPL1 chromosome 13 L000004172 13 568182 565999 C 2011-02-03 1996-07-31 Calpain-like cysteine protease; involved in proteolytic activation of Rim101p in response to alkaline pH; localizes to punctate structures in alkaline conditions and in vps4 mutant; has similarity to A. nidulans palB -S000036955 CDS YMR154C 13 568182 565999 C 2011-02-03 1996-07-31 -S000004764 ORF Uncharacterized YMR155W chromosome 13 13 568551 570194 W 2011-02-03 1996-07-31 Putative protein of unknown function; identified as interacting with Hsp82p in a high-throughput two-hybrid screen -S000037749 CDS YMR155W 13 568551 570194 W 2011-02-03 1996-07-31 -S000004765 ORF Verified YMR156C TPP1 polynucleotide 3'-phosphatase chromosome 13 13 571016 570300 C 2011-02-03 1996-07-31 DNA 3'-phosphatase; functions in repair of endogenous damage of double-stranded DNA, activity is specific for removal of 3' phosphates at strand breaks; similar to the l-2-haloacid dehalogenase superfamily; homolog of human polynucleotide kinase/3'-phosphatase -S000037789 CDS YMR156C 13 571016 570300 C 2011-02-03 1996-07-31 -S000004766 ORF Verified YMR157C AIM36 FMP39 chromosome 13 13 572044 571277 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays reduced respiratory growth and elevated frequency of mitochondrial genome loss; the authentic, non-tagged protein is detected in purified mitochondria in high-throughput studies -S000037876 CDS YMR157C 13 572044 571277 C 2011-02-03 1996-07-31 -S000004767 ORF Verified YMR158W MRPS8 mitochondrial 37S ribosomal protein MRPS8 chromosome 13 13 572248 572715 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000030873 CDS YMR158W 13 572248 572715 W 2011-02-03 1996-07-31 -S000006664 tRNA_gene tM(CAU)M EMT4 chromosome 13 L000003677|L000000554 13 572955 572883 C 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis -S000034574 noncoding_exon tM(CAU)M 13 572955 572883 C 2011-02-03 2000-05-19 -S000007249 ORF Uncharacterized YMR158C-A YMR158C-B chromosome 13 13 573331 573194 C 2011-02-03 1997-07-17 Putative protein of unknown function; may contain a lipid attachment site; YMR158C-A is not an essential gene -S000030986 CDS YMR158C-A 13 573331 573194 C 2011-02-03 1997-07-17 -S000007116 long_terminal_repeat YMRCdelta18 chromosome 13 13 573338 573112 C 2011-02-03 2000-05-19 Ty1 LTR -S000004768 ORF Dubious YMR158W-B YMR158W-A chromosome 13 13 574471 574791 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene ATG16/YMR159C -S000034209 CDS YMR158W-B 13 574471 574791 W 2011-02-03 1996-07-31 -S000004769 ORF Verified YMR159C ATG16 APG15|APG16|CVT11|SAP18 chromosome 13 L000004135|L000004762|S000029036|L000004787 13 574928 574476 C 2011-02-03 1996-07-31 Conserved protein involved in autophagy; interacts with Atg12p-Atg5p conjugates to form Atg12p-Atg5p-Atg16p multimers, which binds to membranes and localizes to the pre-autophagosomal structure and are required for autophagy; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000030904 CDS YMR159C 13 574928 574476 C 2011-02-03 1996-07-31 -S000004770 ORF Verified YMR160W chromosome 13 13 575066 577516 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the membrane of the vacuole; mutant has enhanced sensitivity to overexpression of mutant huntingtin; YMR160W is not an essential gene; relative distribution within the vacuolar membrane changes upon DNA replication stress -S000032016 CDS YMR160W 13 575066 577516 W 2011-02-03 1996-07-31 -S000004771 ORF Verified YMR161W HLJ1 type I HSP40 co-chaperone HLJ1 chromosome 13 L000002962 13 577718 578392 W 2011-02-03 1996-07-31 Co-chaperone for Hsp40p; anchored in the ER membrane; with its homolog Ydj1p promotes ER-associated protein degradation (ERAD) of integral membrane substrates; similar to E. coli DnaJ -S000032125 CDS YMR161W 13 577718 578392 W 2011-02-03 1996-07-31 -S000004772 ORF Verified YMR162C DNF3 aminophospholipid-translocating P4-type ATPase DNF3 chromosome 13 13 583921 578951 C 2011-02-03 1996-07-31 Trans-golgi network aminophospholipid translocase (flippase); type 4 P-type ATPase; involved in phospholipid translocation, contributing to the maintenance of membrane lipid asymmetry in post-Golgi secretory vesicles; role in protein trafficking between the Golgi and endosomal system; localizes to the trans-Golgi network; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone -S000032992 CDS YMR162C 13 583921 578951 C 2011-02-03 1996-07-31 -S000004773 ORF Verified YMR163C INP2 chromosome 13 13 586388 584271 C 2011-02-03 1996-07-31 Peroxisome-specific receptor important for peroxisome inheritance; co-fractionates with peroxisome membranes and co-localizes with peroxisomes in vivo; physically interacts with the myosin V motor Myo2p; INP2 is not an essential gene -S000033087 CDS YMR163C 13 586388 584271 C 2011-02-03 1996-07-31 -S000006765 tRNA_gene tV(AAC)M3 chromosome 13 L000003676 13 586709 586636 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000030039 noncoding_exon tV(AAC)M3 13 586709 586636 C 2011-02-03 2000-05-19 -S000004774 ORF Verified YMR164C MSS11 chromosome 13 L000003920 13 589550 587274 C 2011-02-03 1996-07-31 Transcription factor; involved in regulation of invasive growth and starch degradation; controls the activation of FLO11 and STA2 in response to nutritional signals; forms a heterodimer with Flo8p that interacts with the Swi/Snf complex during transcriptional activation of FLO1, FLO11, and STA1 -S000033162 CDS YMR164C 13 589550 587274 C 2011-02-03 1996-07-31 -S000004775 ORF Verified YMR165C PAH1 phosphatidate phosphatase PAH1|SMP2 chromosome 13 L000001934 13 592628 590040 C 2011-02-03 1996-07-31 Mg2+-dependent phosphatidate (PA) phosphatase; dephosphorylates PA to yield diacylglycerol; regulates phospholipid synthesis, nuclear/ER membrane growth, lipid droplet formation, triacylglycerol synthesis, vacuolar homeostasis and cell wall integrity; phosphorylated by Pho85p/Pho80p, Cdc28p/Cyclin B, PKA, PKC, and CKII, regulating activity, localization, and proteosomal degradation; homolog of mammalian lipins 1 and 2; human homologs LPIN1, LPIN2, LPIN3 complement the null -S000033959 CDS YMR165C 13 592628 590040 C 2011-02-03 1996-07-31 -S000004776 ORF Verified YMR166C MME1 chromosome 13 13 594473 593367 C 2011-02-03 1996-07-31 Transporter of the mitochondrial inner membrane that exports magnesium; involved in mitochondrial Mg2+ homeostasis; has similarity to human mitochondrial ATP-Mg/Pi carriers -S000034071 CDS YMR166C 13 594473 593367 C 2011-02-03 1996-07-31 -S000004777 ORF Verified YMR167W MLH1 mismatch repair ATPase MLH1|PMS2 chromosome 13 L000001121 13 594886 597195 W 2011-02-03 1996-07-31 Protein required for mismatch repair in mitosis and meiosis; also required for crossing over during meiosis; forms a complex with Pms1p and Msh2p-Msh3p during mismatch repair; human homolog is associated with hereditary non-polyposis colon cancer -S000034230 CDS YMR167W 13 594886 597195 W 2011-02-03 1996-07-31 -S000004778 ORF Verified YMR168C CEP3 CSL1|CBF3B|CBF3 chromosome 13 L000000312|L000000222 13 599158 597332 C 2011-02-03 1996-07-31 Essential kinetochore protein; component of the CBF3 complex that binds the CDEIII region of the centromere; contains an N-terminal Zn2Cys6 type zinc finger domain, a C-terminal acidic domain, and a putative coiled coil dimerization domain -S000035106 CDS YMR168C 13 599158 597332 C 2011-02-03 1996-07-31 -S000004779 ORF Verified YMR169C ALD3 aldehyde dehydrogenase (NAD(+)) ALD3 chromosome 13 L000002992 13 600872 599352 C 2011-02-03 1996-07-31 Cytoplasmic aldehyde dehydrogenase; involved in beta-alanine synthesis; uses NAD+ as the preferred coenzyme; very similar to Ald2p; expression is induced by stress and repressed by glucose -S000035214 CDS YMR169C 13 600872 599352 C 2011-02-03 1996-07-31 -S000004780 ORF Verified YMR170C ALD2 aldehyde dehydrogenase (NAD(+)) ALD2 chromosome 13 L000003120|L000002991 13 603082 601562 C 2011-02-03 1996-07-31 Cytoplasmic aldehyde dehydrogenase; involved in ethanol oxidation and beta-alanine biosynthesis; uses NAD+ as the preferred coenzyme; expression is stress induced and glucose repressed; very similar to Ald3p -S000036140 CDS YMR170C 13 603082 601562 C 2011-02-03 1996-07-31 -S000004781 ORF Verified YMR171C EAR1 chromosome 13 13 605520 603868 C 2011-02-03 1996-07-31 Specificity factor required for Rsp5p-dependent ubiquitination; also required for sorting of specific cargo proteins at the multivesicular body; mRNA is targeted to the bud via the mRNA transport system involving She2p -S000036240 CDS YMR171C 13 605520 603868 C 2011-02-03 1996-07-31 -S000004783 ORF Verified YMR172W HOT1 chromosome 13 L000004957 13 605981 608140 W 2011-02-03 1996-07-31 Transcription factor for glycerol biosynthetic genes; required for the transient induction of glycerol biosynthetic genes GPD1 and GPP2 in response to high osmolarity; targets Hog1p to osmostress responsive promoters; has similarity to Msn1p and Gcr1p -S000031822 CDS YMR172W 13 605981 608140 W 2011-02-03 1996-07-31 -S000004782 ORF Dubious YMR172C-A chromosome 13 13 608211 607828 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 3' end of ORF HOT1/YMR172W -S000034962 CDS YMR172C-A 13 608211 607828 C 2011-02-03 1996-07-31 -S000004784 ORF Verified YMR173W DDR48 DNA damage-responsive protein 48|FSP chromosome 13 L000000498 13 608689 609981 W 2011-02-03 1996-07-31 DNA damage-responsive protein; expression is increased in response to heat-shock stress or treatments that produce DNA lesions; contains multiple repeats of the amino acid sequence NNNDSYGS; protein abundance increases in response to DNA replication stress -S000031955 CDS YMR173W 13 608689 609981 W 2011-02-03 1996-07-31 -S000004785 ORF Dubious YMR173W-A chromosome 13 13 608897 610081 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene DDR48/YML173W -S000030427 CDS YMR173W-A 13 608897 610081 W 2011-02-03 1996-07-31 -S000004786 ORF Verified YMR174C PAI3 IA3 chromosome 13 L000001332 13 610365 610159 C 2011-02-03 1996-07-31 Cytoplasmic proteinase A (Pep4p) inhibitor; dependent on Pbs2p and Hog1p protein kinases for osmotic induction; intrinsically unstructured, N-terminal half becomes ordered in the active site of proteinase A upon contact -S000031994 CDS YMR174C 13 610365 610159 C 2011-02-03 1996-07-31 -S000004787 ORF Verified YMR175W SIP18 chromosome 13 L000002670 13 611016 611255 W 2011-02-03 1996-07-31 Phospholipid-binding hydrophilin; essential to overcome desiccation-rehydration process; expression is induced by osmotic stress; SIP18 has a paralog, GRE1, that arose from the whole genome duplication -S000037525 CDS YMR175W 13 611016 611255 W 2011-02-03 1996-07-31 -S000118374 ARS ARS1323 ARSXIII-611 chromosome 13 13 611275 611489 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178159 ARS_consensus_sequence ARS1323 13 611317 611333 W 2014-11-18 2014-11-18 -S000028848 ORF Uncharacterized YMR175W-A chromosome 13 13 611314 611508 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000034535 CDS YMR175W-A 13 611314 611508 W 2011-02-03 2003-07-29 -S000004788 ORF Verified YMR176W ECM5 chromosome 13 L000003881 13 611740 615975 W 2011-02-03 1996-07-31 Subunit of the Snt2C complex; physically associates with Snt2p and Rpd3p; along with Snt2p, recruits Rpd3p to a small number of promoters; also colocalizes with Snt2p, independently of Rpd3p, to promoters of stress response genes in response to oxidative stress; contains ATP/GTP-binding site motif A; null mutant exhibits increased cellular volume, large drooping buds with elongated necks; relative distribution to the nucleus increases upon DNA replication stress -S000037587 CDS YMR176W 13 611740 615975 W 2011-02-03 1996-07-31 -S000004789 ORF Verified YMR177W MMT1 MFT1 chromosome 13 L000004107 13 616566 618098 W 2011-02-03 1996-07-31 Putative metal transporter involved in mitochondrial iron accumulation; MMT1 has a paralog, MMT2, that arose from the whole genome duplication -S000037682 CDS YMR177W 13 616566 618098 W 2011-02-03 1996-07-31 -S000004790 ORF Verified YMR178W chromosome 13 13 618479 619303 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and nucleus; YMR178W is not an essential gene; protein abundance increases in response to DNA replication stress -S000030501 CDS YMR178W 13 618479 619303 W 2011-02-03 1996-07-31 -S000004791 ORF Verified YMR179W SPT21 chromosome 13 L000002040 13 619858 622134 W 2011-02-03 1996-07-31 Protein with a role in transcriptional silencing; required for normal transcription at several loci including HTA2-HTB2 and HHF2-HHT2, but not required at the other histone loci; functionally related to Spt10p; localizes to nuclear foci that become diffuse upon DNA replication stress -S000030565 CDS YMR179W 13 619858 622134 W 2011-02-03 1996-07-31 -S000004792 ORF Verified YMR180C CTL1 polynucleotide 5'-phosphatase|CTH1 chromosome 13 S000007412 13 623213 622251 C 2011-02-03 1996-07-31 RNA 5'-triphosphatase, localizes to both the nucleus and cytoplasm; CTL1 has a paralog, CET1, that arose from the whole genome duplication -S000037398 CDS YMR180C 13 623213 622251 C 2011-02-03 1996-07-31 -S000004793 ORF Uncharacterized YMR181C chromosome 13 13 624080 623616 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA transcribed as part of a bicistronic transcript with a predicted transcriptional repressor RGM1/YMR182C; mRNA is destroyed by nonsense-mediated decay (NMD); not an essential gene; YMR181C has a paralog, YPL229W, that arose from the whole genome duplication -S000030034 CDS YMR181C 13 624080 623616 C 2011-02-03 1996-07-31 -S000004794 ORF Verified YMR182C RGM1 chromosome 13 L000001627 13 625167 624532 C 2011-02-03 1996-07-31 Putative zinc finger DNA binding transcription factor; contains two N-terminal C2H2 zinc fingers and C-terminal proline rich domain; overproduction impairs cell growth and induces expression of genes involved in monosaccharide catabolism and aldehyde metabolism; regulates expression of of Y' telomeric elements and subtelomeric COS genes; relocalizes to the cytosol in response to hypoxia; RGM1 has a paralog, USV1, that arose from the whole genome duplication -S000030142 CDS YMR182C 13 625167 624532 C 2011-02-03 1996-07-31 -S000028693 ORF Uncharacterized YMR182W-A chromosome 13 13 625811 625897 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000032593 CDS YMR182W-A 13 625811 625897 W 2011-02-03 2003-07-29 -S000028468 snoRNA_gene snR83 SNR83 RUF3 chromosome 13 13 626349 626654 W 2011-02-03 2004-04-01 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at positions U1290 and U1415 -S000030105 noncoding_exon snR83 13 626349 626654 W 2011-02-03 2004-04-01 -S000004795 ORF Verified YMR183C SSO2 syntaxin chromosome 13 L000002090 13 627808 626921 C 2011-02-03 1996-07-31 Plasma membrane t-SNARE; involved in fusion of secretory vesicles at the plasma membrane; syntaxin homolog that is functionally redundant with Sso1p; SSO2 has a paralog, SSO1, that arose from the whole genome duplication -S000030342 CDS YMR183C 13 627808 626921 C 2011-02-03 1996-07-31 -S000004796 ORF Verified YMR184W ADD37 chromosome 13 13 628189 628785 W 2011-02-03 1996-07-31 Protein of unknown function; involved in ER-associated protein degradation; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and is induced in response to the DNA-damaging agent MMS; YMR184W is not an essential gene; protein abundance increases in response to DNA replication stress -S000033702 CDS YMR184W 13 628189 628785 W 2011-02-03 1996-07-31 -S000004797 ORF Verified YMR185W RTP1 chromosome 13 13 629025 631970 W 2011-02-03 1996-07-31 Protein required for the nuclear import and biogenesis of RNA pol II; conflicting evidence on whether null mutant is viable with elongated buds, or inviable; interacts with Rpb2, Rpb3, Nup116p, Nup100p and components of the R2TP complex (Rvb1p, Rvb2p, Pih1p); similar to human TMCO7 gene -S000033842 CDS YMR185W 13 629025 631970 W 2011-02-03 1996-07-31 -S000004798 ORF Verified YMR186W HSC82 Hsp90 family chaperone HSC82|HSP90 chromosome 13 L000000813 13 632355 634472 W 2011-02-03 1996-07-31 Cytoplasmic chaperone of the Hsp90 family; plays a role in determining prion variants; redundant in function and nearly identical with Hsp82p, and together they are essential; expressed constitutively at 10-fold higher basal levels than HSP82 and induced 2-3 fold by heat shock; contains two acid-rich unstructured regions that promote the solubility of chaperone-substrate complexes; HSC82 has a paralog, HSP82, that arose from the whole genome duplication -S000033979 CDS YMR186W 13 632355 634472 W 2011-02-03 1996-07-31 -S000118375 ARS ARS1324 ARSXIII-635 chromosome 13 13 634501 634588 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000004799 ORF Uncharacterized YMR187C chromosome 13 13 635984 634689 C 2011-02-03 1996-07-31 Putative protein of unknown function; YMR187C is not an essential gene -S000033992 CDS YMR187C 13 635984 634689 C 2011-02-03 1996-07-31 -S000004800 ORF Verified YMR188C MRPS17 mitochondrial 37S ribosomal protein MRPS17 chromosome 13 13 637004 636291 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000034878 CDS YMR188C 13 637004 636291 C 2011-02-03 1996-07-31 -S000004801 ORF Verified YMR189W GCV2 glycine decarboxylase subunit P|GSD2 chromosome 13 L000000734 13 637500 640604 W 2011-02-03 1996-07-31 P subunit of the mitochondrial glycine decarboxylase complex; glycine decarboxylase is required for the catabolism of glycine to 5,10-methylene-THF; expression is regulated by levels of 5,10-methylene-THF in the cytoplasm -S000035091 CDS YMR189W 13 637500 640604 W 2011-02-03 1996-07-31 -S000004802 ORF Verified YMR190C SGS1 ATP-dependent DNA helicase SGS1 chromosome 13 L000001877 13 645258 640915 C 115.6 2011-02-03 1996-07-31 RecQ family nucleolar DNA helicase; role in genome integrity maintenance, chromosome synapsis, meiotic joint molecule/crossover formation; stimulates activity of Top3p; rapidly lost in response to rapamycin in Rrd1p-dependent manner; forms nuclear foci upon DNA replication stress; yeast SGS1 complements mutations in human homolog BLM implicated in Bloom syndrome; also similar to human WRN implicated in Werner syndrome; human BLM and WRN can each complement yeast null mutant -S000034467 CDS YMR190C 13 645258 640915 C 2011-02-03 1996-07-31 -S000004803 ORF Verified YMR191W SPG5 chromosome 13 13 645656 646777 W 2011-02-03 2003-09-22|1996-07-31 Protein required for proteasome assembly during quiescence; binds to base of the proteasome regulartory particle; required for survival at high temperature during stationary phase; not required for growth on nonfermentable carbon sources -S000034638 CDS YMR191W 13 645656 646777 W 2011-02-03 2003-09-22|1996-07-31 -S000004804 ORF Verified YMR192W GYL1 APP2 chromosome 13 13 647118 649280 W 2011-02-03 1996-07-31 Putative GTPase activating protein (GAP) with a role in exocytosis; stimulates Gyp5p GAP activity on Ypt1p, colocalizes with Gyp5p at sites of polarized growth; interacts with Gyp5p, Rvs161p, and Rvs167p; involved in recruiting Rvs167p to the bud tip during polarized growth; increases in abundance and relocalizes from bud neck to cytoplasm upon DNA replication stress; GYL1 has a paralog, GYP5, that arose from the whole genome duplication -S000034769 CDS YMR192W 13 647118 649280 W 2011-02-03 1996-07-31 -S000118376 ARS ARS1325 ARSXIII-649 chromosome 13 13 649309 649552 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178160 ARS_consensus_sequence ARS1325 13 649361 649377 W 2014-11-18 2014-11-18 -S000004806 ORF Verified YMR193W MRPL24 mitochondrial 54S ribosomal protein YmL24/YmL14|YmL14|YmL24|MRPL14 chromosome 13 L000002690 13 650036 650812 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; two mitochondrial ribosomal proteins, YmL14 and YmL24, have been assigned to the same gene -S000035736 CDS YMR193W 13 650036 650812 W 2011-02-03 1996-07-31 -S000004807 ORF Verified YMR194W RPL36A eL36|ribosomal 60S subunit protein L36A|L36e|YL39|L39|L36A|RPL39B chromosome 13 L000004467|L000003236 13 651145 651910 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L36A; N-terminally acetylated; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L36, no bacterial homolog; RPL36A has a paralog, RPL36B, that arose from the whole genome duplication -S000035869 CDS YMR194W 13 651145 651160 W 2011-02-03 1996-07-31 -S000035870 CDS YMR194W 13 651624 651910 W 2011-02-03 1996-07-31 -S000035871 intron YMR194W 13 651161 651623 W 2011-02-03 1996-07-31 -S000004805 ORF Dubious YMR193C-A chromosome 13 13 651458 651072 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035259 CDS YMR193C-A 13 651458 651072 C 2011-02-03 1996-07-31 -S000007293 snoRNA_gene snR11 SNR11 chromosome 13 L000004943|L000002848 13 652275 652532 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2416 -S000036590 noncoding_exon snR11 13 652275 652532 W 2011-02-03 2000-05-19 -S000028514 ORF Verified YMR194C-B CMC4 chromosome 13 13 652887 652594 C 2011-02-03 2003-07-29 Protein that localizes to the mitochondrial intermembrane space; localizes via the Mia40p-Erv1p system; contains twin cysteine-x(9)-cysteine motifs -S000030281 CDS YMR194C-B 13 652775 652594 C 2011-02-03 2003-07-29 -S000030280 CDS YMR194C-B 13 652887 652848 C 2011-02-03 2003-07-29 -S000030282 intron YMR194C-B 13 652847 652776 C 2011-02-03 2003-07-29 -S000007250 ORF Dubious YMR194C-A chromosome 13 13 653136 652912 C 2011-02-03 1997-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037816 CDS YMR194C-A 13 653136 652912 C 2011-02-03 1997-07-17 -S000004808 ORF Verified YMR195W ICY1 chromosome 13 S000007527 13 654034 654417 W 2011-02-03 1996-07-31 Protein of unknown function; required for viability in rich media of cells lacking mitochondrial DNA; mutants have an invasive growth defect with elongated morphology; induced by amino acid starvation; ICY1 has a paralog, ICY2, that arose from the whole genome duplication -S000036003 CDS YMR195W 13 654034 654417 W 2011-02-03 1996-07-31 -S000004809 ORF Uncharacterized YMR196W chromosome 13 13 655076 658342 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YMR196W is not an essential gene -S000037847 CDS YMR196W 13 655076 658342 W 2011-02-03 1996-07-31 -S000004810 ORF Verified YMR197C VTI1 v-SNARE protein VTI1 chromosome 13 L000003598 13 659198 658545 C 2011-02-03 1996-07-31 Protein involved in cis-Golgi membrane traffic; v-SNARE that interacts with two t-SNARES, Sed5p and Pep12p; required for multiple vacuolar sorting pathways; human homolog VTI1A can complement yeast null mutant -S000037881 CDS YMR197C 13 659198 658545 C 2011-02-03 1996-07-31 -S000004811 ORF Verified YMR198W CIK1 chromosome 13 L000000335 13 659745 661529 W 2011-02-03 1996-07-31 Kinesin-associated protein; required for both karyogamy and mitotic spindle organization, interacts stably and specifically with Kar3p and may function to target this kinesin to a specific cellular role; locus encodes a long and short transcript with differing functions; CIK1 has a paralog, VIK1, that arose from the whole genome duplication -S000029971 CDS YMR198W 13 659745 661529 W 2011-02-03 1996-07-31 -S000004812 ORF Verified YMR199W CLN1 cyclin CLN1 chromosome 13 L000000357 13 662644 664284 W 2011-02-03 1996-07-31 G1 cyclin involved in regulation of the cell cycle; activates Cdc28p kinase to promote the G1 to S phase transition; late G1 specific expression depends on transcription factor complexes, MBF (Swi6p-Mbp1p) and SBF (Swi6p-Swi4p); CLN1 has a paralog, CLN2, that arose from the whole genome duplication; cell cycle arrest phenotype of the cln1 cln2 cln3 triple null mutant is complemented by any of human cyclins CCNA2, CCNB1, CCNC, CCND1, or CCNE1 -S000030961 CDS YMR199W 13 662644 664284 W 2011-02-03 1996-07-31 -S000004813 ORF Verified YMR200W ROT1 chromosome 13 L000003404 13 664752 665522 W 2011-02-03 1996-07-31 Molecular chaperone involved in protein folding in ER; mutation causes defects in cell wall synthesis and lysis of autophagic bodies, suppresses tor2 mutations, and is synthetically lethal with kar2-1 and with rot2 mutations; involved in N-linked glycosylation and O-mannosylation; transmembrane helix Ser250 is essential for Rot1p to interact with other membrane components and exert its functional role, avoiding exposure of Ser H-bonding group at lipid-exposed surface -S000035501 CDS YMR200W 13 664752 665522 W 2011-02-03 1996-07-31 -S000004814 ORF Verified YMR201C RAD14 chromosome 13 L000001564 13 667044 665845 C 2011-02-03 1996-07-31 Protein that recognizes and binds damaged DNA during NER; subunit of Nucleotide Excision Repair Factor 1 (NEF1); contains zinc finger motif; homolog of human XPA protein; NER stands for nucleotide excision repair -S000035530 CDS YMR201C 13 666933 665845 C 2011-02-03 1996-07-31 -S000035529 CDS YMR201C 13 667044 667018 C 2011-02-03 1996-07-31 -S000035531 intron YMR201C 13 667017 666934 C 2011-02-03 1996-07-31 -S000178149 matrix_attachment_site ETC5 ETC5 chromosome 13 13 667324 667346 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; located within ncRNA RNA170 which lies between divergently transcribed genes RAD14 and ERG2 -S000114171 ncRNA_gene RNA170 RNA170 chromosome 13 S000077076 13 667456 667288 C 2011-02-03 2006-01-23 RNA polymerase III transcribed RNA of unknown function; conserved in other yeast species -S000114172 noncoding_exon RNA170 13 667456 667288 C 2011-02-03 2006-01-23 -S000004815 ORF Verified YMR202W ERG2 C-8 sterol isomerase ERG2|END11 chromosome 13 L000000569|L000004560 13 667537 668205 W 2011-02-03 1996-07-31 C-8 sterol isomerase; catalyzes isomerization of delta-8 double bond to delta-7 position at an intermediate step in ergosterol biosynthesis; transcriptionally down-regulated when ergosterol is in excess; mutation is functionally complemented by human EBP -S000036484 CDS YMR202W 13 667537 668205 W 2011-02-03 1996-07-31 -S000004816 ORF Verified YMR203W TOM40 MOM38|ISP42 chromosome 13 L000000878 13 668492 669655 W 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; constitutes the core element of the protein conducting pore; pre-Tom40p is phosphorylated by PKA, which impairs its import into mitochondria under non-respiratory conditions -S000036557 CDS YMR203W 13 668492 669655 W 2011-02-03 1996-07-31 -S000004817 ORF Verified YMR204C INP1 chromosome 13 13 671325 670063 C 2011-02-03 1996-07-31 Peripheral membrane protein of peroxisomes; involved in peroxisomal inheritance; recruitment to peroxisomes is mediated by interaction with Pex3p at the peroxisomal membrane -S000036611 CDS YMR204C 13 671325 670063 C 2011-02-03 1996-07-31 -S000004818 ORF Verified YMR205C PFK2 6-phosphofructokinase subunit beta chromosome 13 L000001405 13 674766 671887 C 132 2011-02-03 1996-07-31 Beta subunit of heterooctameric phosphofructokinase; involved in glycolysis; indispensable for anaerobic growth; activated by fructose-2,6-bisphosphate and AMP; mutation inhibits glucose induction of cell cycle-related genes -S000036708 CDS YMR205C 13 674766 671887 C 2011-02-03 1996-07-31 -S000004819 ORF Uncharacterized YMR206W chromosome 13 13 675896 676837 W 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential gene; YMR206W has a paralog, YNR014W, that arose from the whole genome duplication -S000037504 CDS YMR206W 13 675896 676837 W 2011-02-03 1996-07-31 -S000004820 ORF Verified YMR207C HFA1 acetyl-CoA carboxylase HFA1 chromosome 13 L000000769 13 683564 677193 C 2011-02-03 1996-07-31 Mitochondrial acetyl-coenzyme A carboxylase; catalyzes production of malonyl-CoA in mitochondrial fatty acid biosynthesis; relocalizes from mitochondrion to cytoplasm upon DNA replication stress; genetic and comparative analysis suggests that translation begins at a non-canonical (Ile) start codon at -372 relative to the annotated start codon -S000037547 CDS YMR207C 13 683564 677193 C 2011-02-03 1996-07-31 -S000004821 ORF Verified YMR208W ERG12 mevalonate kinase|RAR1 chromosome 13 L000000578 13 684467 685798 W 176 2011-02-03 1996-07-31 Mevalonate kinase; acts in the biosynthesis of isoprenoids and sterols, including ergosterol, from mevalonate; human MVK functionally complements the lethality of the erg12 null mutation -S000030406 CDS YMR208W 13 684467 685798 W 2011-02-03 1996-07-31 -S000004822 ORF Uncharacterized YMR209C chromosome 13 13 687284 685911 C 2011-02-03 1996-07-31 Putative S-adenosylmethionine-dependent methyltransferase; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; YMR209C is not an essential gene -S000030480 CDS YMR209C 13 687284 685911 C 2011-02-03 1996-07-31 -S000004823 ORF Verified YMR210W MGL2 putative carboxylic ester hydrolase chromosome 13 13 687516 688865 W 2011-02-03 1996-07-31 Monoacylglycerol lipase; palmitoyl monoacylglycerol is the preferred substrate; role in triacylglycerol catabolism; minor role in medium-chain fatty acid ethyl ester biosynthesis; contains an alpha/beta hydrolase domain and a typical lipase motif; has similarity to acyltransferases, Eeb1p and Eht1p, and human ABHD1 -S000031343 CDS YMR210W 13 687516 688865 W 2011-02-03 1996-07-31 -S000004824 ORF Verified YMR211W DML1 chromosome 13 13 689083 690510 W 2011-02-03 1996-07-31 Essential protein involved in mtDNA inheritance; may also function in the partitioning of the mitochondrial organelle or in the segregation of chromosomes, exhibits regions similar to members of a GTPase family -S000031451 CDS YMR211W 13 689083 690510 W 2011-02-03 1996-07-31 -S000004825 ORF Verified YMR212C EFR3 chromosome 13 13 693043 690695 C 2011-02-03 1996-07-31 Protein required for Stt4-containing PI kinase complex localization; required for Stt4-containing phosphoinositide (PI) kinase patch assembly at the plasma membrane; recruited to the plasma membrane via a conserved basic patch near its N-terminus; exhibits synthetic lethal genetic interactions with PHO85; has sequence similarity to the Drosophila rolling blackout (RBO) gene -S000031486 CDS YMR212C 13 693043 690695 C 2011-02-03 1996-07-31 -S000004826 ORF Verified YMR213W CEF1 NTC85 chromosome 13 L000004270 13 693381 695153 W 2011-02-03 1996-07-31 Essential splicing factor; associated with Prp19p and the spliceosome, contains an N-terminal c-Myb DNA binding motif necessary for cell viability but not for Prp19p association, evolutionarily conserved and homologous to S. pombe Cdc5p -S000031586 CDS YMR213W 13 693381 695153 W 2011-02-03 1996-07-31 -S000004827 ORF Verified YMR214W SCJ1 chromosome 13 L000001811 13 695350 696483 W 2011-02-03 2003-09-22|1996-07-31 One of several homologs of bacterial chaperone DnaJ; located in the ER lumen where it cooperates with Kar2p to mediate maturation of proteins -S000032566 CDS YMR214W 13 695350 696483 W 2011-02-03 2003-09-22|1996-07-31 -S000004828 ORF Verified YMR215W GAS3 putative 1,3-beta-glucanosyltransferase chromosome 13 13 696796 698370 W 2011-02-03 1996-07-31 Putative 1,3-beta-glucanosyltransferase; has similarity go other GAS family members; low abundance, possibly inactive member of the GAS family of GPI-containing proteins; localizes to the cell wall; mRNA induced during sporulation -S000032695 CDS YMR215W 13 696796 698370 W 2011-02-03 1996-07-31 -S000004829 ORF Verified YMR216C SKY1 serine/threonine protein kinase SKY1 chromosome 13 L000003941 13 701039 698811 C 2011-02-03 1996-07-31 SR protein kinase (SRPK); involved in regulating proteins involved in mRNA metabolism and cation homeostasis; similar to human SRPK1 -S000032724 CDS YMR216C 13 701039 698811 C 2011-02-03 1996-07-31 -S000004830 ORF Verified YMR217W GUA1 GMP synthase (glutamine-hydrolyzing) chromosome 13 L000000744 13 701790 703367 W 2011-02-03 1996-07-31 GMP synthase; highly conserved enzyme that catalyzes the second step in the biosynthesis of GMP from inosine 5'-phosphate (IMP); transcription is not subject to regulation by guanine but is negatively regulated by nutrient starvation; reduction-of-function mutation gua1-G388D causes changes in cellular guanine nucleotide pools, defects in general protein synthesis, and impaired translation of GCN4 mRNA -S000033507 CDS YMR217W 13 701790 703367 W 2011-02-03 1996-07-31 -S000004831 ORF Verified YMR218C TRS130 transport protein particle complex II subunit TRS130 chromosome 13 S000007468 13 706887 703579 C 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic -S000033556 CDS YMR218C 13 706887 703579 C 2011-02-03 1996-07-31 -S000004832 ORF Verified YMR219W ESC1 chromosome 13 L000004422 13 707133 712109 W 2011-02-03 1996-07-31 Protein involved in telomeric silencing; required for quiescent cell telomere hypercluster localization at nuclear membrane vicinity; interacts with PAD4-domain of Sir4p -S000033701 CDS YMR219W 13 707133 712109 W 2011-02-03 1996-07-31 -S000004833 ORF Verified YMR220W ERG8 phosphomevalonate kinase chromosome 13 L000000574 13 712316 713671 W 2011-02-03 1996-07-31 Phosphomevalonate kinase; an essential cytosolic enzyme that acts in the biosynthesis of isoprenoids and sterols, including ergosterol, from mevalonate -S000035642 CDS YMR220W 13 712316 713671 W 2011-02-03 1996-07-31 -S000004834 ORF Uncharacterized YMR221C FMP42 chromosome 13 13 715445 713931 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; physical interaction with Atg27p suggests a possible role in autophagy -S000035674 CDS YMR221C 13 715445 713931 C 2011-02-03 1996-07-31 -S000004835 ORF Verified YMR222C FSH2 putative serine hydrolase chromosome 13 13 716309 715638 C 2011-02-03 1996-07-31 Putative serine hydrolase that localizes to the cytoplasm; sequence is similar to S. cerevisiae Fsh1p and Fsh3p and the human candidate tumor suppressor OVCA2 -S000035719 CDS YMR222C 13 716309 715638 C 2011-02-03 1996-07-31 -S000004836 ORF Verified YMR223W UBP8 ubiquitin-specific protease UBP8 chromosome 13 L000004587 13 716715 718130 W 2011-02-03 1996-07-31 Ubiquitin-specific protease component of the SAGA acetylation complex; required for SAGA (Spt-Ada-Gcn5-Acetyltransferase)-mediated deubiquitination of histone H2B -S000035903 CDS YMR223W 13 716715 718130 W 2011-02-03 1996-07-31 -S000004837 ORF Verified YMR224C MRE11 MRX complex nuclease subunit|NGS1|XRS4|RAD58 chromosome 13 L000004732|L000001149|L000004275 13 720653 718575 C 2011-02-03 1996-07-31 Nuclease subunit of the MRX complex with Rad50p and Xrs2p; complex functions in repair of DNA double-strand breaks and in telomere stability; Mre11p associates with Ser/Thr-rich ORFs in premeiotic phase; nuclease activity required for MRX function; widely conserved; forms nuclear foci upon DNA replication stress -S000035950 CDS YMR224C 13 720653 718575 C 2011-02-03 1996-07-31 -S000004838 ORF Verified YMR225C MRPL44 mitochondrial 54S ribosomal protein YmL44|YmL44|YMR44 chromosome 13 L000002534 13 721403 720960 C 158 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; protein abundance increases in response to DNA replication stress -S000036820 CDS YMR225C 13 721198 720960 C 2011-02-03 1996-07-31 -S000036819 CDS YMR225C 13 721403 721346 C 2011-02-03 1996-07-31 -S000036821 intron YMR225C 13 721345 721199 C 2011-02-03 1996-07-31 -S000004839 ORF Verified YMR226C oxidoreductase|TMA29 chromosome 13 13 722396 721593 C 2011-02-03 1996-07-31 NADP(+)-dependent serine dehydrogenase and carbonyl reductase; acts on serine, L-allo-threonine, and other 3-hydroxy acids; green fluorescent protein fusion protein localizes to the cytoplasm and nucleus; may interact with ribosomes, based on co-purification experiments -S000036891 CDS YMR226C 13 722396 721593 C 2011-02-03 1996-07-31 -S000004840 ORF Verified YMR227C TAF7 TafII67|TAF67 chromosome 13 L000003463 13 724385 722613 C 2011-02-03 1996-07-31 TFIID subunit (67 kDa); involved in RNA polymerase II transcription initiation -S000036956 CDS YMR227C 13 724385 722613 C 2011-02-03 1996-07-31 -S000004841 ORF Verified YMR228W MTF1 RNA polymerase specificity factor chromosome 13 L000001211 13 724626 725651 W 157.9 2011-02-03 1996-07-31 Mitochondrial RNA polymerase specificity factor; has structural similarity to S-adenosylmethionine-dependent methyltransferases and functional similarity to bacterial sigma-factors; Mtf1p interacts with and stabilizes the Rpo41p-promoter complex, enhancing DNA bending and melting to facilitate pre-initiation open complex formation -S000037761 CDS YMR228W 13 724626 725651 W 2011-02-03 1996-07-31 -S000004842 ORF Verified YMR229C RRP5 chromosome 13 L000003232 13 731123 725934 C 2011-02-03 1996-07-31 RNA binding protein involved in synthesis of 18S and 5.8S rRNAs; component of ribosomal small subunit (SSU) processome and 90S preribosome; required for pre-rRNA packaging and compaction of processome into dense terminal balls; part of Mak21p-Noc2p-Rrp5p module that associates with nascent pre-rRNA during transcription with role in biogenesis of large ribosomal subunit; binds single stranded tracts of U's; relocalizes from nucleolus to nucleus upon DNA replication stress -S000037792 CDS YMR229C 13 731123 725934 C 2011-02-03 1996-07-31 -S000004843 ORF Verified YMR230W RPS10B eS10|ribosomal 40S subunit protein S10B|S10e|S10B chromosome 13 L000004476 13 732414 733141 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S10, no bacterial homolog; RPS10B has a paralog, RPS10A, that arose from the whole genome duplication; mutations in the human homolog associated with Diamond-Blackfan anemia -S000030773 CDS YMR230W 13 732414 732465 W 2011-02-03 1996-07-31 -S000030774 CDS YMR230W 13 732876 733141 W 2011-02-03 1996-07-31 -S000030775 intron YMR230W 13 732466 732875 W 2011-02-03 1996-07-31 -S000028576 ORF Uncharacterized YMR230W-A chromosome 13 13 733268 733456 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000031309 CDS YMR230W-A 13 733268 733456 W 2011-02-03 2003-07-29 -S000004844 ORF Verified YMR231W PEP5 tethering complex subunit PEP5|VPT11|VPS11|VPL9|VAM1|END1 chromosome 13 L000001376|L000002957 13 733545 736634 W 152 2011-02-03 1996-07-31 Histone E3 ligase, component of CORVET membrane tethering complex; peripheral vacuolar membrane protein required for protein trafficking and vacuole biogenesis; interacts with Pep7p; involved in ubiquitination and degradation of excess histones -S000030876 CDS YMR231W 13 733545 736634 W 2011-02-03 1996-07-31 -S000004845 ORF Verified YMR232W FUS2 chromosome 13 L000000654 13 736926 738959 W 160 2011-02-03 1996-07-31 Cell fusion regulator; cytoplasmic protein localized to shmoo tip; required for alignment of parental nuclei before nuclear fusion during mating; contains a Dbl-homology domain; binds specifically with activated Cdc42p -S000031887 CDS YMR232W 13 736926 738959 W 2011-02-03 1996-07-31 -S000004846 ORF Verified YMR233W TRI1 chromosome 13 13 739185 739865 W 2011-02-03 1996-07-31 Non-essential sumoylated protein of unknown function; similar to components of human SWI/SNF complex including SMRD3; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm, nucleus and nucleolus; TRI1 has a paralog, UAF30, that arose from the whole genome duplication -S000032018 CDS YMR233W 13 739185 739865 W 2011-02-03 1996-07-31 -S000004847 ORF Verified YMR234W RNH1 RNA-DNA hybrid ribonuclease chromosome 13 L000001653 13 740266 741312 W 160 2011-02-03 1996-07-31 Ribonuclease H1; able to bind double-stranded RNAs and RNA-DNA hybrids; associates with RNAse polymerase I. -S000032129 CDS YMR234W 13 740266 741312 W 2011-02-03 1996-07-31 -S000004848 ORF Verified YMR235C RNA1 GTPase-activating protein RNA1 chromosome 13 L000001649 13 742735 741512 C 159 2011-02-03 1996-07-31 GTPase activating protein (GAP) for Gsp1p; involved in nuclear transport -S000032993 CDS YMR235C 13 742735 741512 C 2011-02-03 1996-07-31 -S000004849 ORF Verified YMR236W TAF9 chromatin modification protein|TafII17|TAF17 chromosome 13 L000003459 13 742971 743444 W 2011-02-03 1996-07-31 Subunit (17 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification, similar to histone H3 -S000033137 CDS YMR236W 13 742971 743444 W 2011-02-03 1996-07-31 -S000004850 ORF Verified YMR237W BCH1 exomer complex subunit chromosome 13 13 743749 745923 W 2011-02-03 1996-07-31 Member of the ChAPs family (Chs5p-Arf1p-binding proteins); members include Bch1p, Bch2p, Bud7p, and Chs6p; ChAPs family proteins form the exomer complex with Chs5p to mediate export of specific cargo proteins from the Golgi to the plasma membrane; interacts selectively with the activated, GTP-bound form of Arf1p; may interact with ribosomes; protein abundance increases and forms cytoplasmic foci in response to DNA replication stress -S000033208 CDS YMR237W 13 743749 745923 W 2011-02-03 1996-07-31 -S000004851 ORF Verified YMR238W DFG5 putative mannan endo-1,6-alpha-mannosidase chromosome 13 L000004072 13 746353 747729 W 2011-02-03 1996-07-31 Putative mannosidase; essential glycosylphosphatidylinositol (GPI)-anchored membrane protein required for cell wall biogenesis in bud formation, involved in filamentous growth, homologous to Dcw1p -S000034028 CDS YMR238W 13 746353 747729 W 2011-02-03 1996-07-31 -S000006717 tRNA_gene tR(UCU)M1 chromosome 13 L000003675 13 747963 747892 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000031501 noncoding_exon tR(UCU)M1 13 747963 747892 C 2011-02-03 2000-05-19 -S000004852 ORF Verified YMR239C RNT1 ribonuclease III chromosome 13 L000002844 13 749677 748262 C 2011-02-03 1996-07-31 Nuclear dsRNA-specific ribonuclease (RNase III); involved in rDNA transcription, rRNA processing and U2 snRNA 3' end formation by cleavage of a stem-loop structure at the 3' end of U2 snRNA; involved in polyadenylation-independent transcription termination; involved in the cell wall stress response, regulating the degradation of cell wall integrity and morphogenesis checkpoint genes -S000034074 CDS YMR239C 13 749677 748262 C 2011-02-03 1996-07-31 -S000004853 ORF Verified YMR240C CUS1 U2 snRNP complex subunit CUS1 chromosome 13 L000002833 13 751240 749930 C 2011-02-03 1996-07-31 Protein required for assembly of U2 snRNP into the spliceosome; forms a complex with Hsh49p and Hsh155p -S000035059 CDS YMR240C 13 751240 749930 C 2011-02-03 1996-07-31 -S000004854 ORF Verified YMR241W YHM2 chromosome 13 L000004516 13 751961 752905 W 2011-02-03 1996-07-31 Citrate and oxoglutarate carrier protein; exports citrate from and imports oxoglutarate into the mitochondrion, causing net export of NADPH reducing equivalents; also associates with mt nucleoids and has a role in replication and segregation of the mt genome -S000035206 CDS YMR241W 13 751961 752905 W 2011-02-03 1996-07-31 -S000004855 ORF Verified YMR242C RPL20A eL20|ribosomal 60S subunit protein L20A|L20e|L20A|L18A|RPL18A2 chromosome 13 L000004458|L000003149 13 754220 753225 C 2011-02-03 2003-09-27|1996-07-31|2007-07-10 Ribosomal 60S subunit protein L20A; homologous to mammalian ribosomal protein L18A, no bacterial homolog; RPL20A has a paralog, RPL20B, that arose from the whole genome duplication -S000035252 CDS YMR242C 13 753742 753225 C 2011-02-03 2003-09-27 -S000035251 CDS YMR242C 13 754220 754220 C 2011-02-03 2003-09-27|1996-07-31|2007-07-10 -S000035253 intron YMR242C 13 754219 753743 C 2011-02-03 2003-09-27|2007-07-10 -S000028694 ORF Uncharacterized YMR242W-A chromosome 13 13 754297 754386 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000032596 CDS YMR242W-A 13 754297 754386 W 2011-02-03 2003-07-29 -S000004856 ORF Verified YMR243C ZRC1 Zn(2+) transporter ZRC1|OSR1 chromosome 13 L000002570 13 756166 754838 C 2011-02-03 1996-07-31 Vacuolar membrane zinc transporter; transports zinc from cytosol to vacuole for storage; also has role in resistance to zinc shock resulting from sudden influx of zinc into cytoplasm; human ortholog SLC30A10 functions as a Mn transporter and mutations in SLC30A10 cause neurotoxic accumulation of Mn in liver and brain; ZRC1 has a paralog, COT1, that arose from the whole genome duplication -S000036141 CDS YMR243C 13 756166 754838 C 2011-02-03 1996-07-31 -S000004858 ORF Uncharacterized YMR244W chromosome 13 13 757250 758317 W 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole -S000031680 CDS YMR244W 13 757250 758317 W 2011-02-03 1996-07-31 -S000118377 ARS ARS1327 ARSXIII-758 chromosome 13 13 758224 758471 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178161 ARS_consensus_sequence ARS1327 13 758417 758401 C 2014-11-18 2014-11-18 -S000004859 ORF Dubious YMR245W chromosome 13 13 758563 759183 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031825 CDS YMR245W 13 758563 759183 W 2011-02-03 1996-07-31 -S000004857 ORF Verified YMR244C-A COA6 chromosome 13 13 758831 758517 C 2011-02-03 1996-07-31 Protein involved in cytochrome c oxidase (Complex IV) assembly; involved in delivery of copper to Complex IV; also required for efficient formation of respiratory supercomplexes comprised of Complexes III and IV; localizes to the mitochondrial intermembrane space; ortholog implicated in cardiac defects in zebrafish and human; transcription is induced in response to the DNA-damaging agent MMS; protein abundance increases in response to DNA replication stress -S000035790 CDS YMR244C-A 13 758831 758517 C 2011-02-03 1996-07-31 -S000004860 ORF Verified YMR246W FAA4 long-chain fatty acid-CoA ligase FAA4 chromosome 13 L000002647 13 759807 761891 W 2011-02-03 1996-07-31 Long chain fatty acyl-CoA synthetase; activates fatty acids with a preference for C12:0-C16:0 chain lengths; role in the competitive import of long-chain fatty acids and sphingoid long-chain bases; role in stationary phase survival; localizes to lipid particles and the plasma membrane; role in sphingolipid-to-glycerolipid metabolism; forms cytoplasmic foci upon replication stress; faa1 faa4 double null complemented by any of human ACSBG1, ACSL1, 3, 4, 5, 6, SLC27A2, or 4 -S000031958 CDS YMR246W 13 759807 761891 W 2011-02-03 1996-07-31 -S000119075 snoRNA_gene snR86 SNR86 chromosome 13 13 763113 762110 C 2011-02-03 2006-10-05 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2314 -S000119077 noncoding_exon snR86 13 763113 762110 C 2011-02-03 2006-10-05 -S000004861 ORF Verified YMR247C RKR1 ubiquitin-protein ligase RKR1|LTN1 chromosome 13 13 768039 763351 C 2011-02-03 1996-07-31 RING domain E3 ubiquitin ligase; involved in ubiquitin-mediated degradation of non-stop proteins and translationally stalled ER membrane proteins; component of ribosome-bound RQC (ribosome quality control) complex; degrades products of mRNAs lacking a termination codon regardless of a poly(A) tail; functional connections to chromatin modification; homolog of mouse Listerin, mutations in which reported to cause neurodegeneration -S000031995 CDS YMR247C 13 768039 763351 C 2011-02-03 1996-07-31 -S000006519 tRNA_gene tA(AGC)M2 chromosome 13 L000003674 13 768441 768369 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000036431 noncoding_exon tA(AGC)M2 13 768441 768369 C 2011-02-03 2000-05-19 -S000007125 long_terminal_repeat YMRWdelta19 chromosome 13 13 768548 768879 W 2011-02-03 2000-05-19 Ty2 LTR -S000028849 ORF Uncharacterized YMR247W-A chromosome 13 13 769283 769426 W 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole -S000034536 CDS YMR247W-A 13 769283 769426 W 2011-02-03 2003-07-29 -S000004862 ORF Verified YMR250W GAD1 glutamate decarboxylase GAD1 chromosome 13 S000007509 13 770801 772558 W 2011-02-03 1996-07-31 Glutamate decarboxylase; converts glutamate into gamma-aminobutyric acid (GABA) during glutamate catabolism; involved in response to oxidative stress -S000037211 CDS YMR250W 13 770801 772558 W 2011-02-03 1996-07-31 -S000118378 ARS ARS1328 ARSXIII-773 chromosome 13 13 772631 772879 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000004863 ORF Verified YMR251W GTO3 omega-class glutathione transferase chromosome 13 13 772915 774015 W 2011-02-03 1996-07-31 Omega class glutathione transferase; putative cytosolic localization -S000037313 CDS YMR251W 13 772915 774015 W 2011-02-03 1996-07-31 -S000004864 ORF Verified YMR251W-A HOR7 chromosome 13 L000003980 13 774752 774931 W 2011-02-03 1996-07-31 Protein of unknown function; overexpression suppresses Ca2+ sensitivity of mutants lacking inositol phosphorylceramide mannosyltransferases Csg1p and Csh1p; transcription is induced under hyperosmotic stress and repressed by alpha factor; HOR7 has a paralog, DDR2, that arose from the whole genome duplication -S000035256 CDS YMR251W-A 13 774752 774931 W 2011-02-03 1996-07-31 -S000004865 ORF Uncharacterized YMR252C chromosome 13 13 775719 775315 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YMR252C is not an essential gene -S000037324 CDS YMR252C 13 775719 775315 C 2011-02-03 1996-07-31 -S000004866 ORF Uncharacterized YMR253C chromosome 13 13 777190 775946 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; YMR253C is not an essential gene -S000037399 CDS YMR253C 13 777190 775946 C 2011-02-03 1996-07-31 -S000004867 ORF Dubious YMR254C chromosome 13 13 777923 777615 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030036 CDS YMR254C 13 777923 777615 C 2011-02-03 1996-07-31 -S000004868 ORF Verified YMR255W GFD1 chromosome 13 L000004632 13 778001 778567 W 2011-02-03 1996-07-31 Coiled-coiled protein of unknown function; identified as a high-copy suppressor of a dbp5 mutation; protein abundance increases in response to DNA replication stress -S000030249 CDS YMR255W 13 778001 778567 W 2011-02-03 1996-07-31 -S000004869 ORF Verified YMR256C COX7 cytochrome c oxidase subunit VII chromosome 13 L000000391 13 779127 778945 C 2011-02-03 1996-07-31 Subunit VII of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain -S000030343 CDS YMR256C 13 779127 778945 C 2011-02-03 1996-07-31 -S000004870 ORF Verified YMR257C PET111 chromosome 13 L000001393 13 782031 779629 C 177 2011-02-03 1996-07-31 Mitochondrial translational activator specific for the COX2 mRNA; located in the mitochondrial inner membrane -S000033634 CDS YMR257C 13 782031 779629 C 2011-02-03 1996-07-31 -S000004871 ORF Verified YMR258C ROY1 chromosome 13 13 784281 782620 C 2011-02-03 1996-07-31 GTPase inhibitor with similarity to F-box proteins; inhibits Ypt52p GTPase activity by preventing Ypt52p from binding GTP; involved in regulating intracellular trafficking; physically interacts with Skp1p -S000033770 CDS YMR258C 13 784281 782620 C 2011-02-03 1996-07-31 -S000004872 ORF Verified YMR259C TRM732 tRNA methylation protein TRM732 chromosome 13 13 788883 784621 C 2011-02-03 1996-07-31 Protein involved in 2'-O-methylation of C32 of substrate tRNAs; interacts with 2'-O-ribose methyltransferase Trm7p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; non-essential gene; yeast null mutant can be functionally complemented by human THADA, mutations in which have been implicated in epithelial thyroid adenomas, type 2 diabetes, and polycystic ovary syndrome (PCOS) -S000033886 CDS YMR259C 13 788883 784621 C 2011-02-03 1996-07-31 -S000004873 ORF Verified YMR260C TIF11 chromosome 13 L000002306 13 789839 789378 C 2011-02-03 1996-07-31 Translation initiation factor eIF1A; essential protein that forms a complex with Sui1p (eIF1) and the 40S ribosomal subunit and scans for the start codon; C-terminus associates with Fun12p (eIF5B); N terminus interacts with eIF2 and eIF3 -S000033454 CDS YMR260C 13 789839 789378 C 2011-02-03 1996-07-31 -S000004874 ORF Verified YMR261C TPS3 trehalose 6-phosphate synthase/phosphatase complex subunit chromosome 13 L000002718 13 793369 790205 C 2011-02-03 1996-07-31 Regulatory subunit of trehalose-6-phosphate synthase/phosphatase; involved in synthesis of storage carbohydrate trehalose; expression is induced by stress conditions and repressed by the Ras-cAMP pathway; TPS3 has a paralog, TSL1, that arose from the whole genome duplication -S000033514 CDS YMR261C 13 793369 790205 C 2011-02-03 1996-07-31 -S000004875 ORF Uncharacterized YMR262W putative endodeoxyribonuclease chromosome 13 13 793726 794667 W 2011-02-03 1996-07-31|2011-02-03 Protein of unknown function; interacts weakly with Knr4p; YMR262W is not an essential gene -S000033607 CDS YMR262W 13 793726 794667 W 2011-02-03 1996-07-31|2011-02-03 -S000004876 ORF Verified YMR263W SAP30 chromosome 13 13 794919 795524 W 2011-02-03 1996-07-31 Component of Rpd3L histone deacetylase complex; involved in silencing at telomeres, rDNA, and silent mating-type loci; involved in telomere maintenance -S000034555 CDS YMR263W 13 794919 795524 W 2011-02-03 1996-07-31 -S000004877 ORF Verified YMR264W CUE1 KIS4 chromosome 13 L000003518 13 795805 796416 W 2011-02-03 1996-07-31 Ubiquitin-binding protein; ER membrane protein that recruits and integrates the ubiquitin-conjugating enzyme Ubc7p into ER membrane-bound ubiquitin ligase complexes that function in the ER-associated degradation (ERAD) pathway for misfolded proteins; contains a CUE domain that binds ubiquitin to facilitate intramolecular monoubiquitination and to promote diubiquitin elongation, facilitating polyubiquitin chain formation -S000034641 CDS YMR264W 13 795805 796416 W 2011-02-03 1996-07-31 -S000004878 ORF Uncharacterized YMR265C chromosome 13 13 797925 796540 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000034679 CDS YMR265C 13 797925 796540 C 2011-02-03 1996-07-31 -S000004879 ORF Verified YMR266W RSN1 chromosome 13 13 798518 801379 W 2011-02-03 1996-07-31 Membrane protein of unknown function; overexpression suppresses NaCl sensitivity of sro7 mutant cells by restoring sodium pump (Ena1p) localization to the plasma membrane -S000035756 CDS YMR266W 13 798518 801379 W 2011-02-03 1996-07-31 -S000004880 ORF Verified YMR267W PPA2 inorganic diphosphatase PPA2|IPP2 chromosome 13 L000001469 13 801772 802704 W 2011-02-03 1996-07-31 Mitochondrial inorganic pyrophosphatase; required for mitochondrial function and possibly involved in energy generation from inorganic pyrophosphate; human ortholog, PPA2, functionally complements the null mutant; mutations in human PPA2 cause a mitochondrial disease resulting in sudden unexpected cardiac arrest in infants -S000035874 CDS YMR267W 13 801772 802704 W 2011-02-03 1996-07-31 -S000004881 ORF Verified YMR268C PRP24 U6 snRNP complex subunit PRP24 chromosome 13 L000002842 13 804222 802888 C 2011-02-03 1996-07-31 Splicing factor that reanneals snRNPs during spliceosome recycling; reanneals U4 and U6 snRNPs -S000035917 CDS YMR268C 13 804222 802888 C 2011-02-03 1996-07-31 -S000004882 ORF Verified YMR269W TMA23 YMR268W-A chromosome 13 13 804456 805091 W 2011-02-03 2004-02-27|1996-07-31 Nucleolar protein implicated in ribosome biogenesis; deletion extends chronological lifespan -S000037848 CDS YMR269W 13 804456 805091 W 2011-02-03 2004-02-27|1996-07-31 -S000118379 ARS ARS1329 ARSXIII-805 chromosome 13 13 805152 805282 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178162 ARS_consensus_sequence ARS1329 13 805162 805178 W 2014-11-18 2014-11-18 -S000004883 ORF Verified YMR270C RRN9 chromosome 13 L000003278 13 806423 805326 C 2011-02-03 1996-07-31 Protein involved in promoting high level transcription of rDNA; subunit of UAF (upstream activation factor) for RNA polymerase I -S000036870 CDS YMR270C 13 806423 805326 C 2011-02-03 1996-07-31 -S000004884 ORF Verified YMR271C URA10 orotate phosphoribosyltransferase URA10 chromosome 13 L000002438 13 807548 806865 C 2011-02-03 1996-07-31 Minor orotate phosphoribosyltransferase (OPRTase) isozyme; catalyzes the fifth enzymatic step in the de novo biosynthesis of pyrimidines, converting orotate into orotidine-5'-phosphate; URA10 has a paralog, URA5, that arose from the whole genome duplication -S000037601 CDS YMR271C 13 807548 806865 C 2011-02-03 1996-07-31 -S000006690 tRNA_gene tQ(CUG)M CDC65 SUP60|SUP70|DNA33 chromosome 13 L000000287|L000003673 13 808317 808246 C 187 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; can mutate to cause constitutive pseudohyphal growth in homozygous diploids; required for localization of transcription factor Gln3p to the nucleus in response to nitrogen starvation or rapamycin treatment -S000036125 noncoding_exon tQ(CUG)M 13 808317 808246 C 2011-02-03 2000-05-19 -S000007118 long_terminal_repeat YMRCtau3 chromosome 13 13 808906 808537 C 2011-02-03 2000-05-19 Ty4 LTR -S000007126 long_terminal_repeat YMRWdelta20 chromosome 13 13 809000 809233 W 2011-02-03 2000-05-19 Ty1 LTR -S000028695 ORF Dubious YMR272W-A chromosome 13 13 810466 810579 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SCS7/YMR272C -S000032602 CDS YMR272W-A 13 810466 810579 W 2011-02-03 2003-07-29 -S000004885 ORF Verified YMR272C SCS7 fatty acid alpha-hydroxylase|FAH1 chromosome 13 L000004408 13 810777 809623 C 2011-02-03 1996-07-31 Sphingolipid alpha-hydroxylase; functions in the alpha-hydroxylation of sphingolipid-associated very long chain fatty acids, has both cytochrome b5-like and hydroxylase/desaturase domains, not essential for growth -S000037670 CDS YMR272C 13 810777 809623 C 2011-02-03 1996-07-31 -S000028696 ORF Uncharacterized YMR272W-B chromosome 13 13 811089 811196 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole -S000032604 CDS YMR272W-B 13 811089 811196 W 2011-02-03 2003-07-29 -S000004886 ORF Verified YMR273C ZDS1 OSS1|NRC1|CKM1|CES1 chromosome 13 L000002813 13 813980 811233 C 2011-02-03 1996-07-31 Protein with a role in regulating Swe1p-dependent polarized growth; involved in maintaining Cdc55p in the cytoplasm where it promotes mitotic entry; involved in mitotic exit through Cdc14p regulation; interacts with silencing proteins at telomeres; has a role in Bcy1p localization; implicated in mRNA nuclear export; ZDS1 has a paralog, ZDS2, that arose from the whole genome duplication -S000037717 CDS YMR273C 13 813980 811233 C 2011-02-03 1996-07-31 -S000004887 ORF Verified YMR274C RCE1 CAAX prenyl protease chromosome 13 L000004125 13 815311 814364 C 2011-02-03 1996-07-31 Type II CAAX prenyl protease; involved in the proteolysis and maturation of Ras and the a-factor mating pheromone -S000037777 CDS YMR274C 13 815311 814364 C 2011-02-03 1996-07-31 -S000118380 ARS ARS1330 ARSXIII-815 chromosome 13 13 815342 815567 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178163 ARS_consensus_sequence ARS1330 13 815391 815407 W 2014-11-18 2014-11-18 -S000004888 ORF Verified YMR275C BUL1 ubiquitin-ubiquitin ligase BUL1|SMM2|RDS1|DAG1 chromosome 13 L000002733 13 818581 815651 C 2011-02-03 1996-07-31 Ubiquitin-binding component of the Rsp5p E3-ubiquitin ligase complex; disruption causes temperature-sensitive growth, overexpression causes missorting of amino acid permeases; BUL1 has a paralog, BUL2, that arose from the whole genome duplication -S000030633 CDS YMR275C 13 818581 815651 C 2011-02-03 1996-07-31 -S000004889 ORF Verified YMR276W DSK2 chromosome 13 L000002646 13 818827 819948 W 2011-02-03 1996-07-31 Nuclear-enriched ubiquitin-like polyubiquitin-binding protein; required for spindle pole body (SPB) duplication and for transit through the G2/M phase of the cell cycle; involved in proteolysis; interacts with the proteasome; protein abundance increases in response to DNA replication stress -S000030830 CDS YMR276W 13 818827 819948 W 2011-02-03 1996-07-31 -S000004890 ORF Verified YMR277W FCP1 protein serine/threonine phosphatase chromosome 13 L000003350 13 820256 822454 W 2011-02-03 1996-07-31 Carboxy-terminal domain (CTD) phosphatase; essential for dephosphorylation of the repeated C-terminal domain of the RNA polymerase II large subunit (Rpo21p); relocalizes to the cytosol in response to hypoxia -S000031799 CDS YMR277W 13 820256 822454 W 2011-02-03 1996-07-31 -S000004891 ORF Verified YMR278W PRM15 PGM3|phosphoribomutase PRM15 chromosome 13 13 822763 824631 W 2011-02-03 1996-07-31 Phosphoribomutase; catalyzes interconversion of ribose-1-phosphate and ribose-5-phosphate; has some phosphoglucomutase activity but primary activity in vivo is phosphoribomutase; contributes to ribose recycling in the pentose phosphate pathway; transcription induced in response to stress; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; non-essential -S000031949 CDS YMR278W 13 822763 824631 W 2011-02-03 1996-07-31 -S000004892 ORF Verified YMR279C chromosome 13 13 826351 824729 C 2011-02-03 1996-07-31 Putative boron transporter involved in boron efflux and resistance; overexpression mutant but not null mutant displays boron tolerance phenotype; identified as a heat-induced gene in a high-throughout screen; YMR279C is not an essential gene; YMR279C has a paralog, ATR1, that arose from the whole genome duplication -S000031988 CDS YMR279C 13 826351 824729 C 2011-02-03 1996-07-31 -S000004893 ORF Verified YMR280C CAT8 DNA-binding transcription factor CAT8|MSP8|DIL1 chromosome 13 L000000220 13 831329 827028 C 2011-02-03 1996-07-31 Zinc cluster transcriptional activator; necessary for derepression of a variety of genes under non-fermentative growth conditions, active after diauxic shift, binds carbon source responsive elements; relative distribution to the nucleus increases upon DNA replication stress -S000032751 CDS YMR280C 13 831329 827028 C 2011-02-03 1996-07-31 -S000004894 ORF Verified YMR281W GPI12 N-acetylglucosaminylphosphatidylinositol deacetylase chromosome 13 L000004952 13 832339 833253 W 2011-02-03 1996-07-31 ER membrane protein involved in the second step of GPI anchor assembly; the second step is the de-N-acetylation of the N-acetylglucosaminylphosphatidylinositol intermediate; functional homolog of human PIG-Lp; GPI stands for glycosylphosphatidylinositol -S000032913 CDS YMR281W 13 832339 833253 W 2011-02-03 1996-07-31 -S000004895 ORF Verified YMR282C AEP2 ATP13 chromosome 13 L000000054 13 835098 833356 C 2011-02-03 1996-07-31 Mitochondrial protein; likely involved in translation of the mitochondrial OLI1 mRNA; exhibits genetic interaction with the OLI1 mRNA 5'-untranslated leader -S000032972 CDS YMR282C 13 835098 833356 C 2011-02-03 1996-07-31 -S000004896 ORF Verified YMR283C RIT1 tRNA A64-2'-O-ribosylphosphate transferase chromosome 13 L000001645 13 836867 835326 C 2011-02-03 1996-07-31 Initiator methionine 2'-O-ribosyl phosphate transferase; modifies the initiator methionine tRNA at position 64 to distinguish it from elongator methionine tRNA -S000033039 CDS YMR283C 13 836867 835326 C 2011-02-03 1996-07-31 -S000007127 long_terminal_repeat YMRWdelta21 chromosome 13 13 837450 837764 W 2011-02-03 2000-05-19 Ty1 LTR -S000130192 ARS ARS1331 chromosome 13 13 837764 837928 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006784 tRNA_gene tY(GUA)M2 SUP8 chromosome 13 L000003672|L000002187 13 837928 838016 W 193 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000032300 intron tY(GUA)M2 13 837967 837980 W 2011-02-03 2000-05-19 -S000032298 noncoding_exon tY(GUA)M2 13 837928 837966 W 2011-02-03 2000-05-19 -S000032299 noncoding_exon tY(GUA)M2 13 837981 838016 W 2011-02-03 2000-05-19 -S000004897 ORF Verified YMR284W YKU70 ATP-dependent DNA helicase YKU70|KU70|NES24|HDF1 chromosome 13 L000000759 13 838187 839995 W 2011-02-03 1996-07-31 Subunit of the telomeric Ku complex (Yku70p-Yku80p); involved in telomere length maintenance, structure and telomere position effect; required for localization of telomerase ribonucleoprotein to nucleus via interaction with the TLC1 guide RNA; relocates to sites of double-strand cleavage to promote nonhomologous end joining during DSB repair -S000033764 CDS YMR284W 13 838187 839995 W 2011-02-03 1996-07-31 -S000004898 ORF Verified YMR285C NGL2 RNA exonuclease chromosome 13 13 841691 840144 C 2011-02-03 1996-07-31 Protein involved in 5.8S rRNA processing; Ccr4p-like RNase required for correct 3'-end formation of 5.8S rRNA at site E; similar to Ngl1p; NGL2 has a paralog, NGL3, that arose from the whole genome duplication -S000033818 CDS YMR285C 13 841691 840144 C 2011-02-03 1996-07-31 -S000004899 ORF Verified YMR286W MRPL33 mitochondrial 54S ribosomal protein YmL33|YmL33 chromosome 13 L000002530|L000001170 13 841942 842202 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000034015 CDS YMR286W 13 841942 842202 W 2011-02-03 1996-07-31 -S000004900 ORF Verified YMR287C DSS1 MSU1 chromosome 13 L000001208 13 845345 842436 C 2011-02-03 1996-07-31 3'-5' exoribonuclease; component of the mitochondrial degradosome along with the ATP-dependent RNA helicase Suv3p; the degradosome associates with the ribosome and mediates turnover of aberrant or unprocessed RNAs -S000034048 CDS YMR287C 13 845345 842436 C 2011-02-03 1996-07-31 -S000004901 ORF Verified YMR288W HSH155 U2 snRNP complex subunit HSH155 chromosome 13 13 845571 848486 W 2011-02-03 1996-07-31 U2-snRNP associated splicing factor; forms extensive associations with the branch site-3' splice site-3' exon region upon prespliceosome formation; similarity to the mammalian U2 snRNP-associated splicing factor SAP155 -S000035070 CDS YMR288W 13 845571 848486 W 2011-02-03 1996-07-31 -S000004902 ORF Verified YMR289W ABZ2 aminodeoxychorismate lyase ABZ2 chromosome 13 13 848685 849809 W 2011-02-03 1996-07-31 Aminodeoxychorismate lyase (4-amino-4-deoxychorismate lyase); catalyzes the third step in para-aminobenzoic acid biosynthesis; involved in folic acid biosynthesis -S000035264 CDS YMR289W 13 848685 849809 W 2011-02-03 1996-07-31 -S000004904 ORF Dubious YMR290W-A chromosome 13 13 851422 851769 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of essential HAS1/YMR290C gene which encodes an ATP-dependent RNA helicase -S000037856 CDS YMR290W-A 13 851422 851769 W 2011-02-03 1996-07-31|2011-02-03 -S000004903 ORF Verified YMR290C HAS1 ATP-dependent RNA helicase HAS1 chromosome 13 L000004179 13 851591 850074 C 2011-02-03 1996-07-31 ATP-dependent RNA helicase; involved in the biogenesis of 40S and 60S ribosome subunits; localizes to both the nuclear periphery and nucleolus; highly enriched in nuclear pore complex fractions; constituent of 66S pre-ribosomal particles -S000036112 CDS YMR290C 13 851591 850074 C 2011-02-03 1996-07-31 -S000004905 ORF Verified YMR291W TDA1 protein kinase TDA1 chromosome 13 13 852630 854390 W 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; null mutant is sensitive to expression of the top1-T722A allele; not an essential gene; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000036939 CDS YMR291W 13 852630 854390 W 2011-02-03 1996-07-31 -S000004906 ORF Verified YMR292W GOT1 chromosome 13 L000004951 13 854795 855293 W 2011-02-03 1996-07-31 Homodimeric protein that is packaged into COPII vesicles; cycles between the ER and Golgi; involved in secretory transport but not directly required for aspects of transport assayed in vitro; may influence membrane composition -S000037002 CDS YMR292W 13 854795 854816 W 2011-02-03 1996-07-31 -S000037003 CDS YMR292W 13 854899 855293 W 2011-02-03 1996-07-31 -S000037004 intron YMR292W 13 854817 854898 W 2011-02-03 1996-07-31 -S000004907 ORF Verified YMR293C HER2 QRS1|glutamyl-tRNA(Gln) amidotransferase subunit HER2|RRG6|GEP6|LRC6 chromosome 13 S000124020 13 856793 855399 C 2011-02-03 1996-07-31 Subunit of the trimeric GatFAB AmidoTransferase(AdT) complex; involved in the formation of Q-tRNAQ; required for remodeling of ER caused by Hmg2p overexpression; similar to bacterial GatA glutamyl-tRNA amidotransferase -S000037041 CDS YMR293C 13 856793 855399 C 2011-02-03 1996-07-31 -S000004908 ORF Verified YMR294W JNM1 PAC3|INS1 chromosome 13 L000000884 13 856966 858087 W 2011-02-03 1996-07-31 Component of the yeast dynactin complex; consisting of Nip100p, Jnm1p, and Arp1p; required for proper nuclear migration and spindle partitioning during mitotic anaphase B -S000037827 CDS YMR294W 13 856966 858087 W 2011-02-03 1996-07-31 -S000004909 ORF Dubious YMR294W-A chromosome 13 13 858209 858568 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; substantially overlaps YMR295C; deletion causes sensitivity to unfolded protein response-inducing agents -S000031101 CDS YMR294W-A 13 858209 858568 W 2011-02-03 1996-07-31 -S000004910 ORF Verified YMR295C IBI2 chromosome 13 13 858890 858297 C 2011-02-03 1996-07-31 Protein of unknown function that associates with ribosomes; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and bud; not an essential gene; protein abundance increases in response to DNA replication stress; YMR295C has a paralog, YGR273C, that arose from the whole genome duplication -S000037861 CDS YMR295C 13 858890 858297 C 2011-02-03 1996-07-31 -S000004911 ORF Verified YMR296C LCB1 serine C-palmitoyltransferase LCB1|TSC2|END8 chromosome 13 L000000934 13 860891 859215 C 2011-02-03 1996-07-31 Component of serine palmitoyltransferase; responsible along with Lcb2p for the first committed step in sphingolipid synthesis, which is the condensation of serine with palmitoyl-CoA to form 3-ketosphinganine -S000029901 CDS YMR296C 13 860891 859215 C 2011-02-03 1996-07-31 -S000004912 ORF Verified YMR297W PRC1 CPY1|carboxypeptidase C PRC1|CPY|LBC1 chromosome 13 L000001481 13 861922 863520 W 210 2011-02-03 1996-07-31 Vacuolar carboxypeptidase Y (proteinase C, CPY); broad-specificity C-terminal exopeptidase involved in non-specific protein degradation in the vacuole; member of the serine carboxypeptidase family -S000030979 CDS YMR297W 13 861922 863520 W 2011-02-03 1996-07-31 -S000004913 ORF Verified YMR298W LIP1 sphingosine N-acyltransferase subunit LIP1 chromosome 13 13 863819 864271 W 2011-02-03 1996-07-31 Ceramide synthase subunit; single-span ER membrane protein associated with Lag1p and Lac1p and required for ceramide synthase activity, null mutant grows extremely slowly and is defective in ceramide synthesis -S000031080 CDS YMR298W 13 863819 864271 W 2011-02-03 1996-07-31 -S000004914 ORF Verified YMR299C DYN3 dynein light intermediate chain chromosome 13 13 865350 864412 C 2011-02-03 1996-07-31|2011-02-03 Dynein light intermediate chain (LIC); localizes with dynein, null mutant is defective in nuclear migration -S000031115 CDS YMR299C 13 865350 864412 C 2011-02-03 1996-07-31|2011-02-03 -S000004915 ORF Verified YMR300C ADE4 amidophosphoribosyltransferase chromosome 13 L000000034 13 867091 865559 C 213 2011-02-03 1996-07-31 Phosphoribosylpyrophosphate amidotransferase (PRPPAT); catalyzes first step of the 'de novo' purine nucleotide biosynthetic pathway; also known as amidophosphoribosyltransferase -S000036627 CDS YMR300C 13 867091 865559 C 2011-02-03 1996-07-31 -S000004916 ORF Verified YMR301C ATM1 ATP-binding cassette Fe/S cluster precursor transporter ATM1 chromosome 13 L000000140 13 869627 867555 C 2011-02-03 1996-07-31 Mitochondrial inner membrane ATP-binding cassette (ABC) transporter; exports mitochondrially synthesized precursors of iron-sulfur (Fe/S) clusters to the cytosol; human homolog ABCB7 can complement yeast null mutant -S000036724 CDS YMR301C 13 869627 867555 C 2011-02-03 1996-07-31 -S000004917 ORF Verified YMR302C YME2 PRP12|RNA12 chromosome 13 L000001503 13 872625 870073 C 2011-02-03 1996-07-31 Integral inner mitochondrial membrane protein; role in maintaining mitochondrial nucleoid structure and number; mutants exhibit an increased rate of mitochondrial DNA escape; shows some sequence similarity to exonucleases -S000030571 CDS YMR302C 13 872625 870073 C 2011-02-03 1996-07-31 -S000004918 ORF Verified YMR303C ADH2 alcohol dehydrogenase ADH2|ADR2 chromosome 13 L000000042|L000000051 13 874337 873291 C 216 2011-02-03 1996-07-31 Glucose-repressible alcohol dehydrogenase II; catalyzes the conversion of ethanol to acetaldehyde; involved in the production of certain carboxylate esters; regulated by ADR1 -S000030697 CDS YMR303C 13 874337 873291 C 2011-02-03 1996-07-31 -S000004920 ORF Verified YMR304W UBP15 ubiquitin-specific protease UBP15 chromosome 13 L000004589 13 874987 878679 W 2011-02-03 1996-07-31 Ubiquitin-specific protease involved in protein deubiquitination; forms a complex with AAA peroxins Pex1p and Pex6p; deubiquitinates mono- and polyubiquitinated forms of Pex5p; deubiquitinates Clb5p, counteracting APC activity, and facilitating both Clb5p accumulation and S phase entry; physically interacts with anaphase-promoting complex/cyclosome (APC/C) activator, Cdh1p; catalytic activity regulated by an N-terminal TRAF-like domain and and C-terminal sequences -S000030883 CDS YMR304W 13 874987 878679 W 2011-02-03 1996-07-31 -S000004919 ORF Dubious YMR304C-A chromosome 13 13 879130 878780 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps 3' end of verified ORF SCW10/YMR305C -S000037462 CDS YMR304C-A 13 879130 878780 C 2011-02-03 1996-07-31 -S000004921 ORF Verified YMR305C SCW10 putative family 17 glucosidase chromosome 13 13 880232 879063 C 2011-02-03 1996-07-31 Cell wall protein with similarity to glucanases; may play a role in conjugation during mating based on mutant phenotype and its regulation by Ste12p; SWC10 has a paralog, SCW4, that arose from the whole genome duplication -S000031740 CDS YMR305C 13 880232 879063 C 2011-02-03 1996-07-31 -S000004923 ORF Verified YMR306W FKS3 putative 1,3-beta-D-glucan synthase chromosome 13 L000004080 13 881159 886516 W 2011-02-03 1996-07-31 Protein involved in spore wall assembly; has similarity to 1,3-beta-D-glucan synthase catalytic subunits Fks1p and Gsc2p; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032042 CDS YMR306W 13 881159 886516 W 2011-02-03 1996-07-31 -S000004922 ORF Dubious YMR306C-A chromosome 13 13 886572 886183 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 3' end of ORF FKS3/YMR306W -S000034582 CDS YMR306C-A 13 886572 886183 C 2011-02-03 1996-07-31 -S000004924 ORF Verified YMR307W GAS1 1,3-beta-glucanosyltransferase GAS1|GGP1|CWH52 chromosome 13 L000000669 13 887003 888682 W 2011-02-03 1997-07-17 Beta-1,3-glucanosyltransferase; required for cell wall assembly and also has a role in transcriptional silencing; localizes to cell surface via a glycosylphosphatidylinositol (GPI) anchor; also found at nuclear periphery; genetic interactions with histone H3 lysine acetyltransferases GCN5 and SAS3 indicate previously unsuspected functions for Gas1 in DNA damage response and cell cycle regulation -S000032131 CDS YMR307W 13 887003 888682 W 2011-02-03 1997-07-17 -S000028578 ORF Dubious YMR307C-A chromosome 13 13 887925 887731 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene GAS1/YMR307W -S000031312 CDS YMR307C-A 13 887925 887731 C 2011-02-03 2003-07-29 -S000004925 ORF Verified YMR308C PSE1 KAP121 chromosome 13 L000001519 13 892221 888952 C 2011-02-03 1996-07-31 Karyopherin/importin that interacts with the nuclear pore complex; acts as the nuclear import receptor for specific proteins, including Pdr1p, Yap1p, Ste12p, and Aft1p -S000032994 CDS YMR308C 13 892221 888952 C 2011-02-03 1996-07-31 -S000004926 ORF Verified YMR309C NIP1 translation initiation factor eIF3 core subunit c chromosome 13 L000001252 13 895426 892988 C 2011-02-03 1996-07-31 eIF3c subunit of the eukaryotic translation initiation factor 3 (eIF3); involved in the assembly of preinitiation complex and start codon selection; eIF3 is also involved in programmed stop codon readthrough -S000033088 CDS YMR309C 13 895426 892988 C 2011-02-03 1996-07-31 -S000004927 ORF Uncharacterized YMR310C putative methyltransferase chromosome 13 13 896669 895716 C 2011-02-03 1996-07-31 Putative methyltransferase; predicted to be involved in ribosome biogenesis; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; not an essential gene; YMR310C has a paralog, YGR283C, that arose from the whole genome duplication -S000032818 CDS YMR310C 13 896669 895716 C 2011-02-03 1996-07-31 -S000004928 ORF Verified YMR311C GLC8 chromosome 13 L000000707 13 897603 896914 C 2011-02-03 1996-07-31 Regulatory subunit of protein phosphatase 1 (Glc7p); involved in glycogen metabolism and chromosome segregation; proposed to regulate Glc7p activity via conformational alteration; ortholog of the mammalian protein phosphatase inhibitor 2; protein abundance increases in response to DNA replication stress -S000034823 CDS YMR311C 13 897603 896914 C 2011-02-03 1996-07-31 -S000118381 ARS ARS1332 ARSXIII-898 chromosome 13 13 897935 897985 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178164 ARS_consensus_sequence ARS1332 13 897977 897961 C 2014-11-18 2014-11-18 -S000004929 ORF Verified YMR312W ELP6 Elongator subunit ELP6|KTI4|TOT6|HAP3 chromosome 13 13 898405 899226 W 2011-02-03 1996-07-31 Subunit of hexameric RecA-like ATPase Elp456 Elongator subcomplex; which is required for modification of wobble nucleosides in tRNA; required for Elongator structural integrity -S000035014 CDS YMR312W 13 898405 899226 W 2011-02-03 1996-07-31 -S000004930 ORF Verified YMR313C TGL3 bifunctional triglyceride lipase/lysophosphatidylethanolamine acyltransferase chromosome 13 13 901307 899379 C 2011-02-03 1996-07-31 Bifunctional triacylglycerol lipase and LPE acyltransferase; major lipid particle-localized triacylglycerol (TAG) lipase; catalyzes acylation of lysophosphatidylethanolamine (LPE), a function which is essential for sporulation; protein level and stability of Tgl3p are markedly reduced in the absence of lipid droplets; required with Tgl4p for timely bud formation -S000035060 CDS YMR313C 13 901307 899379 C 2011-02-03 1996-07-31 -S000004931 ORF Verified YMR314W PRE5 proteasome core particle subunit alpha 6 chromosome 13 L000001487 13 901709 902413 W 2011-02-03 1996-07-31 Alpha 6 subunit of the 20S proteasome; protein abundance increases in response to DNA replication stress -S000035211 CDS YMR314W 13 901709 902413 W 2011-02-03 1996-07-31 -S000004932 ORF Verified YMR315W chromosome 13 13 902800 903849 W 2011-02-03 1996-07-31 Protein with NADP(H) oxidoreductase activity; transcription is regulated by Stb5p in response to NADPH depletion induced by diamide; promoter contains a putative Stb5p binding site; protein abundance increases in response to DNA replication stress -S000036057 CDS YMR315W 13 902800 903849 W 2011-02-03 1996-07-31 -S000028697 ORF Uncharacterized YMR315W-A chromosome 13 13 904286 904393 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000032606 CDS YMR315W-A 13 904286 904393 W 2011-02-03 2003-07-29 -S000004935 ORF Verified YMR316W DIA1 chromosome 13 13 904825 905835 W 2011-02-03 1996-07-31 Protein of unknown function; involved in invasive and pseudohyphal growth; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000036198 CDS YMR316W 13 904825 905835 W 2011-02-03 1996-07-31 -S000004933 ORF Uncharacterized YMR316C-A chromosome 13 13 905973 905662 C 2011-02-03 1996-07-31 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; mRNA identified as translated by ribosome profiling data; overlaps the verified gene DIA1/YMR316W -S000036747 CDS YMR316C-A 13 905973 905662 C 2011-02-03 1996-07-31 -S000004936 ORF Uncharacterized YMR317W chromosome 13 13 907364 910786 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; has some similarity to sialidase from Trypanosoma; YMR317W is not an essential gene -S000031682 CDS YMR317W 13 907364 910786 W 2011-02-03 1996-07-31|2011-02-03 -S000004934 ORF Dubious YMR316C-B chromosome 13 13 907629 907321 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 5' end of ORF YMR317W -S000036748 CDS YMR316C-B 13 907629 907321 C 2011-02-03 1996-07-31 -S000004937 ORF Verified YMR318C ADH6 NADP-dependent alcohol dehydrogenase|ADHVI chromosome 13 13 912143 911061 C 2011-02-03 1996-07-31 NADPH-dependent medium chain alcohol dehydrogenase; has broad substrate specificity; member of the cinnamyl family of alcohol dehydrogenases; may be involved in fusel alcohol synthesis or in aldehyde tolerance; protein abundance increases in response to DNA replication stress -S000031726 CDS YMR318C 13 912143 911061 C 2011-02-03 1996-07-31 -S000004938 ORF Verified YMR319C FET4 chromosome 13 L000000611 13 914538 912880 C 2011-02-03 1996-07-31 Low-affinity Fe(II) transporter of the plasma membrane -S000031875 CDS YMR319C 13 914538 912880 C 2011-02-03 1996-07-31 -S000004939 ORF Uncharacterized YMR320W chromosome 13 13 916746 917051 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR320W is not an essential gene -S000036413 CDS YMR320W 13 916746 917051 W 2011-02-03 1996-07-31 -S000004940 ORF Uncharacterized YMR321C chromosome 13 13 917896 917579 C 2011-02-03 1996-07-31 Putative protein of unknown function; proposed to be a palmitoylated membrane protein; YMR321C has a paralog, SAM4, that arose from a single-locus duplication -S000036437 CDS YMR321C 13 917896 917579 C 2011-02-03 1996-07-31 -S000130193 ARS ARS1333 chromosome 13 13 917896 918366 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004941 ORF Verified YMR322C SNO4 glutathione-independent methylglyoxalase family protein|HSP34 chromosome 13 13 919079 918366 C 2011-02-03 1996-07-31 Possible chaperone and cysteine protease; required for transcriptional reprogramming during the diauxic shift and for survival in stationary phase; similar to bacterial Hsp31 and yeast Hsp31p, Hsp32p, and Hsp33p; DJ-1/ThiJ/PfpI superfamily member; predicted involvement in pyridoxine metabolism; induced by mild heat stress and copper deprivation -S000037082 CDS YMR322C 13 919079 918366 C 2011-02-03 1996-07-31 -S000004942 ORF Verified YMR323W ERR3 phosphopyruvate hydratase ERR3 chromosome 13 13 920088 921401 W 2011-02-03 1996-07-31 Enolase, a phosphopyruvate hydratase; catalyzes the conversion of 2-phosphoglycerate to phosphoenolpyruvate; complements the growth defect of an ENO1 ENO2 double mutant in glucose -S000037230 CDS YMR323W 13 920088 921401 W 2011-02-03 1996-07-31 -S000004943 ORF Dubious YMR324C chromosome 13 13 922444 922202 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription is AZF1 dependent in glycerol-lactate medium and SLT2 dependent in response to the lipid hydroperoxides -S000037270 CDS YMR324C 13 922444 922202 C 2011-02-03 1996-07-31 -S000004944 ORF Verified YMR325W PAU19 seripauperin PAU19 chromosome 13 13 922641 923015 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions -S000037375 CDS YMR325W 13 922641 923015 W 2011-02-03 1996-07-31 -S000130194 ARS ARS1335 chromosome 13 13 923015 923494 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028989 telomere TEL13R chromosome 13 13 923541 924431 W 219 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XIII; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats -S000028990 telomeric_repeat TEL13R 13 924307 924431 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XIII -S000028991 X_element TEL13R 13 923541 924005 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XIII; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YMR326C -S000028992 X_element_combinatorial_repeat TEL13R 13 924006 924306 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XIII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000004945 ORF Dubious YMR326C chromosome 13 13 923802 923494 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the telomere on the right arm of chromosome 13 -S000037400 CDS YMR326C 13 923802 923494 C 2011-02-03 1996-07-31 -S000028704 ORF Dubious YNL339W-B chromosome 14 14 734 1216 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032643 CDS YNL339W-B 14 734 1216 W 2003-07-29 2003-07-29 -S000028703 ORF Dubious YNL339W-A chromosome 14 14 1517 2092 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032637 CDS YNL339W-A 14 1517 2092 W 2003-07-29 2003-07-29 -S000005283 ORF Verified YNL339C YRF1-6 Y' element ATP-dependent helicase protein 1 copy 6|YRF1 chromosome 14 14 6098 371 C 1996-07-31 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p -S000031358 CDS YNL339C 14 5931 371 C 1996-07-31 1996-07-31 -S000031357 CDS YNL339C 14 6098 6080 C 1996-07-31 1996-07-31 -S000031359 intron YNL339C 14 6079 5932 C 1996-07-31 1996-07-31 -S000005282 ORF Dubious YNL338W chromosome 14 14 6561 6719 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps TEL14L-XC, which is a telomeric X element core sequence on the left arm of chromosome XIV -S000030505 CDS YNL338W 14 6561 6719 W 1996-07-31 1996-07-31 -S000005281 ORF Dubious YNL337W chromosome 14 14 7165 7419 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030361 CDS YNL337W 14 7165 7419 W 1996-07-31 1996-07-31 -S000028924 telomere TEL14L chromosome 14 14 7428 1 C -238 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XIV; composed of an X element core sequence, X element combinatorial repeats, a short stretch of telomeric repeats, and a long Y' element -S000028925 telomeric_repeat TEL14L 14 6691 6618 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome XIV; spans ORF YNL338W -S000028926 X_element TEL14L 14 7428 6964 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XIV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YNL337W -S000028927 X_element_combinatorial_repeat TEL14L 14 6963 6692 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XIV; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000028928 Y_prime_element TEL14L 14 6617 1 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome XIV; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YRF1-6/YNL339C, YNL339W-A, YNL339W-B) -S000005280 ORF Verified YNL336W COS1 chromosome 14 L000004060 14 8330 9475 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000030202 CDS YNL336W 14 8330 9475 W 1996-07-31 1996-07-31 -S000005279 ORF Verified YNL335W DDI3 cyanamide hydratase chromosome 14 14 11452 12129 W 1996-07-31 1996-07-31 Cyanamide hydratase that detoxifies cyanamide; member of the HD domain metalloprotein superfamily; expression is induced over 100-fold by cyanamide and by SN2-type DNA alkylating agents such as MMS and DMA; induction decreased in rad6 and rad18 mutants; gene and protein are identical to DDI2 and Ddi2p -S000037479 CDS YNL335W 14 11452 12129 W 1996-07-31 1996-07-31 -S000005278 ORF Verified YNL334C SNO2 putative pyridoxal 5'-phosphate synthase chromosome 14 L000003452 14 12876 12208 C 1996-07-31 1996-07-31 Protein of unknown function; nearly identical to Sno3p; expression is induced before the diauxic shift and also in the absence of thiamin -S000037293 CDS YNL334C 14 12876 12208 C 1996-07-31 1996-07-31 -S000005277 ORF Verified YNL333W SNZ2 pyridoxine biosynthesis protein SNZ2 chromosome 14 L000002576 14 13267 14163 W 1996-07-31 1996-07-31 Member of a stationary phase-induced gene family; transcription of SNZ2 is induced prior to diauxic shift, and also in the absence of thiamin in a Thi2p-dependent manner; forms a coregulated gene pair with SNO2; interacts with Thi11p -S000037255 CDS YNL333W 14 13267 14163 W 1996-07-31 1996-07-31 -S000005276 ORF Verified YNL332W THI12 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 14 L000003223 14 14832 15854 W 1996-07-31 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP -S000036570 CDS YNL332W 14 14832 15854 W 1996-07-31 1996-07-31 -S000005275 ORF Verified YNL331C AAD14 putative aryl-alcohol dehydrogenase chromosome 14 L000004676 14 17248 16118 C 1996-07-31 1996-07-31 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family -S000036424 CDS YNL331C 14 17248 16118 C 1996-07-31 1996-07-31 -S000005274 ORF Verified YNL330C RPD3 histone deacetylase RPD3|MOF6|SDS6|SDI2|REC3 chromosome 14 L000001696|L000001603 14 19302 18001 C -237 1996-07-31 1996-07-31 Histone deacetylase, component of both the Rpd3S and Rpd3L complexes; regulates transcription, silencing, autophagy and other processes by influencing chromatin remodeling; forms at least two different complexes which have distinct functions and members; Rpd3(L) recruitment to the subtelomeric region is regulated by interaction with the arginine methyltransferase, Hmt1p -S000036315 CDS YNL330C 14 19302 18001 C 1996-07-31 1996-07-31 -S000005273 ORF Verified YNL329C PEX6 AAA family ATPase peroxin 6|PAS8 chromosome 14 L000001341 14 22633 19541 C 1996-07-31 1996-07-31 AAA-peroxin; heterodimerizes with AAA-peroxin Pex1p and participates in the recycling of peroxisomal signal receptor Pex5p from the peroxisomal membrane to the cystosol; mutations in human PEX6 can lead to severe peroxisomal disorders and early death -S000034361 CDS YNL329C 14 22633 19541 C 1996-07-31 1996-07-31 -S000005272 ORF Verified YNL328C MDJ2 chromosome 14 L000004357 14 23274 22834 C 1996-07-31 1996-07-31 Constituent of the mitochondrial import motor; associated with the presequence translocase; function overlaps with that of Pam18p; stimulates the ATPase activity of Ssc1p to drive mitochondrial import; contains a J domain -S000034238 CDS YNL328C 14 23274 22834 C 1996-07-31 1996-07-31 -S000005271 ORF Verified YNL327W EGT2 chromosome 14 L000004074 14 24048 27173 W 2011-02-03 1996-07-31|2011-02-03 Glycosylphosphatidylinositol (GPI)-anchored cell wall endoglucanase; required for proper cell separation after cytokinesis; expression is activated by Swi5p and tightly regulated in a cell cycle-dependent manner -S000034184 CDS YNL327W 14 24048 27173 W 2011-02-03 1996-07-31|2011-02-03 -S000005270 ORF Verified YNL326C PFA3 palmitoyltransferase PFA3 chromosome 14 14 28347 27337 C 2011-02-03 1996-07-31 Palmitoyltransferase for Vac8p; required for vacuolar membrane fusion; contains an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain; autoacylates; required for vacuolar integrity under stress conditions -S000033265 CDS YNL326C 14 28347 27337 C 2011-02-03 1996-07-31 -S000118382 ARS ARS1405 ARSXIV-29 chromosome 14 14 28469 28700 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178165 ARS_consensus_sequence ARS1405 14 28654 28638 C 2014-11-18 2014-11-18 -S000005268 ORF Dubious YNL324W chromosome 14 14 31050 31445 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033183 CDS YNL324W 14 31050 31445 W 2011-02-03 1996-07-31 -S000005269 ORF Verified YNL325C FIG4 phosphatidylinositol-3,5-bisphosphate 5-phosphatase chromosome 14 L000003583 14 31378 28739 C 2011-02-03 1996-07-31 Phosphatidylinositol 3,5-bisphosphate (PtdIns[3,5]P) phosphatase; required for efficient mating and response to osmotic shock; physically associates with and regulated by Vac14p; contains a SAC1-like domain; homologous to human FIG4, which is associated with CMT4J, a form of Charcot-Marie-Tooth disorder -S000033213 CDS YNL325C 14 31378 28739 C 2011-02-03 1996-07-31 -S000005267 ORF Verified YNL323W LEM3 ROS3|BRE3 chromosome 14 14 31944 33188 W 2011-02-03 1996-07-31 Membrane protein of the plasma membrane and ER; interacts specifically in vivo with the phospholipid translocase (flippase) Dnf1p; involved in translocation of phospholipids and alkylphosphocholine drugs across the plasma membrane; null mutant requires tryptophan due to mislocalization of tryptophan permease Tat2p -S000033125 CDS YNL323W 14 31944 33188 W 2011-02-03 1996-07-31 -S000005266 ORF Verified YNL322C KRE1 chromosome 14 L000000912 14 34235 33294 C -235 2011-02-03 1996-07-31 Cell wall glycoprotein involved in beta-glucan assembly; serves as a K1 killer toxin membrane receptor -S000032211 CDS YNL322C 14 34235 33294 C 2011-02-03 1996-07-31 -S000005265 ORF Verified YNL321W VNX1 chromosome 14 14 34696 37422 W 2011-02-03 1996-07-31 Calcium/H+ antiporter localized to the endoplasmic reticulum membrane; member of the calcium exchanger (CAX) family; potential Cdc28p substrate -S000032167 CDS YNL321W 14 34696 37422 W 2011-02-03 1996-07-31 -S000005264 ORF Uncharacterized YNL320W chromosome 14 14 37700 38554 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032112 CDS YNL320W 14 37700 38554 W 2011-02-03 1996-07-31 -S000005263 ORF Dubious YNL319W chromosome 14 14 38642 39082 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene HXT14 -S000031153 CDS YNL319W 14 38642 39082 W 2011-02-03 1996-07-31 -S000005262 ORF Verified YNL318C HXT14 chromosome 14 L000002762 14 40329 38707 C 2011-02-03 1996-07-31 Protein with similarity to hexose transporter family members; expression is induced in low glucose and repressed in high glucose; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000030981 CDS YNL318C 14 40329 38707 C 2011-02-03 1996-07-31 -S000005261 ORF Verified YNL317W PFS2 cleavage polyadenylation factor subunit PFS2 chromosome 14 14 40619 42016 W 2011-02-03 1996-07-31 Integral subunit of the pre-mRNA CPF complex; the cleavage and polyadenylation factor (CPF) complex plays an essential role in mRNA 3'-end formation by bridging different processing factors and thereby promoting the assembly of the processing complex -S000030052 CDS YNL317W 14 40619 42016 W 2011-02-03 1996-07-31 -S000005260 ORF Verified YNL316C PHA2 prephenate dehydratase PHA2 chromosome 14 L000001414 14 43075 42071 C -227 2011-02-03 2003-09-22|1996-07-31 Prephenate dehydratase; catalyzes the conversion of prephanate to phenylpyruvate, which is a step in the phenylalanine biosynthesis pathway -S000029856 CDS YNL316C 14 43075 42071 C 2011-02-03 2003-09-22|1996-07-31 -S000005259 ORF Verified YNL315C ATP11 chromosome 14 L000000148 14 44280 43324 C 2011-02-03 1996-07-31 Molecular chaperone; required for the assembly of alpha and beta subunits into the F1 sector of mitochondrial F1F0 ATP synthase; N-terminally propionylated in vivo -S000037828 CDS YNL315C 14 44280 43324 C 2011-02-03 1996-07-31 -S000005258 ORF Verified YNL314W DAL82 DURM chromosome 14 L000000482 14 44447 45214 W 2011-02-03 1996-07-31 Positive regulator of allophanate inducible genes; binds a dodecanucleotide sequence upstream of all genes that are induced by allophanate; contains an UISALL DNA-binding, a transcriptional activation, and a coiled-coil domain -S000037152 CDS YNL314W 14 44447 45214 W 2011-02-03 1996-07-31 -S000005257 ORF Verified YNL313C EMW1 tetratricopeptide repeat-containing protein EMW1 chromosome 14 14 48022 45308 C 2011-02-03 1996-07-31 Essential conserved protein with a role in cell wall integrity; contains six TPR (tetratricopeptide repeat) domains clustered in the C-terminal region; conditional mutant is suppressed by overexpression of GFA1; protein abundance increases in response to DNA replication stress -S000037005 CDS YNL313C 14 48022 45308 C 2011-02-03 1996-07-31 -S000005256 ORF Verified YNL312W RFA2 RPA32|RPA2|BUF1 chromosome 14 L000000203|L000001621 14 48287 49216 W 2011-02-03 1996-07-31 Subunit of heterotrimeric Replication Protein A (RPA); RPA is a highly conserved single-stranded DNA binding protein involved in DNA replication, repair, and recombination; RPA protects against inappropriate telomere recombination, and upon telomere uncapping, prevents cell proliferation by a checkpoint-independent pathway; in concert with Sgs1p-Top2p-Rmi1p, stimulates DNA catenation/decatenation activity of Top3p; protein abundance increases in response to DNA replication s -S000036978 CDS YNL312W 14 48287 48293 W 2011-02-03 1996-07-31 -S000036979 CDS YNL312W 14 48402 49216 W 2011-02-03 1996-07-31 -S000036980 intron YNL312W 14 48294 48401 W 2011-02-03 1996-07-31 -S000005255 ORF Verified YNL311C SKP2 putative SCF ubiquitin ligase complex subunit SKP2 chromosome 14 14 51688 49397 C 2011-02-03 1996-07-31 F-box protein of unknown function; predicted to be part of an SCF ubiquitin protease complex; involved in regulating protein levels of sulfur metabolism enzymes; may interact with ribosomes, based on co-purification experiments -S000036212 CDS YNL311C 14 51688 49397 C 2011-02-03 1996-07-31 -S000005254 ORF Verified YNL310C ZIM17 HEP1|TIM15|FMP28 chromosome 14 14 52431 51907 C 2011-02-03 1996-07-31|2006-05-10 Protein co-chaperone with a zinc finger motif; essential for protein import into mitochondria; may act with Pam18p to facilitate recognition and folding of imported proteins by Ssc1p (mtHSP70) in the mitochondrial matrix; required for the maintenance of Ssc1p solubility and assists in the functional interaction of Ssc1p with substrate proteins -S000036042 CDS YNL310C 14 52431 51907 C 2011-02-03 1996-07-31|2006-05-10 -S000005253 ORF Verified YNL309W STB1 chromosome 14 L000002107 14 52662 53924 W 2011-02-03 2003-09-22|1996-07-31 Protein with role in regulation of MBF-specific transcription at Start; phosphorylated by Cln-Cdc28p kinases in vitro; unphosphorylated form binds Swi6p, which is required for Stb1p function; expression is cell-cycle regulated; STB1 has a paralog, YOL131W, that arose from the whole genome duplication -S000035181 CDS YNL309W 14 52662 53924 W 2011-02-03 2003-09-22|1996-07-31 -S000005252 ORF Verified YNL308C KRI1 chromosome 14 S000007481 14 55897 54122 C 2011-02-03 1996-07-31 Essential nucleolar protein required for 40S ribosome biogenesis; associate with snR30; physically and functionally interacts with Krr1p -S000034918 CDS YNL308C 14 55897 54122 C 2011-02-03 1996-07-31 -S000005251 ORF Verified YNL307C MCK1 serine/threonine/tyrosine protein kinase MCK1|CMS1|YPK1 chromosome 14 L000001036|S000029094|L000000369 14 57573 56446 C 1996-07-31 1996-07-31 Dual-specificity ser/thr and tyrosine protein kinase; roles in chromosome segregation, meiotic entry, genome stability, phosphorylation-dependent protein degradation (Rcn1p and Cdc6p), inhibition of protein kinase A, transcriptional regulation, inhibition of RNA pol III, calcium stress and inhibition of Clb2p-Cdc28p after nuclear division; MCK1 has a paralog, YGK3, that arose from the whole genome duplication -S000034016 CDS YNL307C 14 57573 56446 C 1996-07-31 1996-07-31 -S000005250 ORF Verified YNL306W MRPS18 mitochondrial 37S ribosomal protein YmS18|YmS18 chromosome 14 14 58155 58808 W 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the small subunit; essential for viability, unlike most other mitoribosomal proteins -S000033967 CDS YNL306W 14 58155 58808 W 1996-07-31 1996-07-31 -S000005249 ORF Verified YNL305C BXI1 YBH3 chromosome 14 14 59791 58898 C 1996-07-31 1996-07-31 Protein involved in apoptosis; variously described as containing a BCL-2 homology (BH3) domain or as a member of the BAX inhibitor family; reported to promote apoptosis under some conditions and to inhibit it in others; localizes to ER and vacuole; may link the unfolded protein response to apoptosis via regulation of calcium-mediated signaling; translocates to mitochondria under apoptosis-inducing conditions in a process involving Mir1p and Cor1p -S000033769 CDS YNL305C 14 59791 58898 C 1996-07-31 1996-07-31 -S000005248 ORF Verified YNL304W YPT11 Rab family GTPase YPT11 chromosome 14 14 60297 61550 W 2005-11-07 1996-07-31|2005-11-07 Rab GTPase; Myo2p-binding protein implicated in mother-to-bud transport of cortical endoplasmic reticulum (ER), late Golgi, and mitochondria during cell division; function is regulated at multiple levels; abundance of active Ypt11p forms is controlled by phosphorylation status and degradation; normally a low-abundance protein whose ER localization is only detected when protein is highly over expressed -S000033723 CDS YNL304W 14 60297 61550 W 2005-11-07 1996-07-31|2005-11-07 -S000005247 ORF Dubious YNL303W chromosome 14 14 61510 61857 W 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033069 CDS YNL303W 14 61510 61857 W 2005-11-07 1996-07-31 -S000118383 ARS ARS1406 ARSXIV-62 chromosome 14 14 61599 61895 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178166 ARS_consensus_sequence ARS1406 14 61694 61710 W 2014-11-18 2014-11-18 -S000005246 ORF Verified YNL302C RPS19B eS19|ribosomal 40S subunit protein S19B|S19e|rp55B|YS16B|S19B|S16aB|RP55B chromosome 14 L000002703|L000002725 14 62943 61958 C 2005-11-07 1996-07-31 Protein component of the small (40S) ribosomal subunit; required for assembly and maturation of pre-40 S particles; homologous to mammalian ribosomal protein S19, no bacterial homolog; mutations in human RPS19 are associated with Diamond Blackfan anemia; RPS19B has a paralog, RPS19A, that arose from the whole genome duplication -S000032915 CDS YNL302C 14 62372 61958 C 2005-11-07 1996-07-31 -S000032914 CDS YNL302C 14 62943 62924 C 2005-11-07 1996-07-31 -S000032916 intron YNL302C 14 62923 62373 C 2005-11-07 1996-07-31 -S000005245 ORF Verified YNL301C RPL18B eL18|ribosomal 60S subunit protein L18B|L18e|rp28B|L18B|RP28B chromosome 14 L000002702 14 64562 63570 C 2005-11-07 1996-07-31 Ribosomal 60S subunit protein L18B; homologous to mammalian ribosomal protein L18, no bacterial homolog; RPL18B has a paralog, RPL18A, that arose from the whole genome duplication -S000032846 CDS YNL301C 14 64018 63570 C 2005-11-07 1996-07-31 -S000032845 CDS YNL301C 14 64562 64451 C 2005-11-07 1996-07-31 -S000032847 intron YNL301C 14 64450 64019 C 2005-11-07 1996-07-31 -S000005244 ORF Uncharacterized YNL300W TOS6 chromosome 14 14 65744 66052 W 2005-11-07 1996-07-31 Glycosylphosphatidylinositol-dependent cell wall protein; expression is periodic and decreases in respone to ergosterol perturbation or upon entry into stationary phase; depletion increases resistance to lactic acid -S000032776 CDS YNL300W 14 65744 66052 W 2005-11-07 1996-07-31 -S000005243 ORF Verified YNL299W TRF5 non-canonical poly(A) polymerase TRF5 chromosome 14 L000003385 14 66517 68445 W 2005-11-07 1996-07-31|2005-11-03 Non-canonical poly(A) polymerase; involved in nuclear RNA degradation as a component of the TRAMP complex; catalyzes polyadenylation of hypomodified tRNAs, and snoRNA and rRNA precursors; overlapping but non-redundant functions with Pap2p -S000035690 CDS YNL299W 14 66517 68445 W 2005-11-07 1996-07-31|2005-11-03 -S000005242 ORF Verified YNL298W CLA4 serine/threonine protein kinase CLA4|ERC10 chromosome 14 L000000564|L000002643 14 68915 71443 W 2005-11-07 1996-07-31 Cdc42p-activated signal transducing kinase; member of the PAK (p21-activated kinase) family, along with Ste20p and Skm1p; involved in septin ring assembly, vacuole inheritance, cytokinesis, sterol uptake regulation; phosphorylates Cdc3p and Cdc10p; CLA4 has a paralog, SKM1, that arose from the whole genome duplication -S000035601 CDS YNL298W 14 68915 71443 W 2005-11-07 1996-07-31 -S000005240 ORF Dubious YNL296W chromosome 14 14 76273 76587 W 2005-11-07 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; deletion adversely affects sporulation; deletion mutant exhibits synthetic phenotype under expression of mutant huntingtin fragment, but gene does not have human ortholog -S000034476 CDS YNL296W 14 76273 76587 W 2005-11-07 1996-07-31 -S000005241 ORF Verified YNL297C MON2 YSL2 chromosome 14 14 76583 71673 C 2005-11-07 1996-07-31 Protein with a role in endocytosis and vacuole integrity; peripheral membrane protein; interacts with and negatively regulates Arl1p; localizes to the endosome; member of the Sec7p family of proteins -S000034548 CDS YNL297C 14 76583 71673 C 2005-11-07 1996-07-31 -S000005239 ORF Uncharacterized YNL295W MRX6 chromosome 14 14 76946 78520 W 2005-11-07 1996-07-31 Protein that associates with mitochondrial ribosome -S000034395 CDS YNL295W 14 76946 78520 W 2005-11-07 1996-07-31 -S000005238 ORF Verified YNL294C RIM21 PAL2 chromosome 14 14 80260 78659 C 2005-11-07 1996-07-31 pH sensor molecule, component of the RIM101 pathway; has a role in cell wall construction and alkaline pH response; is glycosylated and phosphorylated; interacts with Dfg16p and Rim9p to form a pH-sensing complex; localization to the plasma membrane is dependent on Dfg16p and Rim9p; has similarity to A. nidulans PalH -S000033436 CDS YNL294C 14 80260 78659 C 2005-11-07 1996-07-31 -S000005237 ORF Verified YNL293W MSB3 Rab GTPase-activating protein MSB3|GYP3 chromosome 14 L000003918 14 80640 82541 W 2005-11-07 1996-07-31 Rab GTPase-activating protein; regulates endocytosis via inactivation of Vps21p at endosomes and vacuole fusion via inactivation of Ypt7p at vacuoles; also acts on Ypt52p and Sec4p; localizes to plasma membrane, sites of polarized growth; relocalizes from bud neck to cytoplasm upon DNA replication stress; similar to TBC-domain Tre2 oncogene; MSB3 has a paralog, MSB4, that arose from the whole genome duplication; human homolog USP6NL can complement yeast msb3 msb4 double null -S000033388 CDS YNL293W 14 80640 82541 W 2005-11-07 1996-07-31 -S000005236 ORF Verified YNL292W PUS4 pseudouridine synthase PUS4 chromosome 14 L000003347 14 82806 84017 W 2005-11-07 1996-07-31 Pseudouridine synthase; catalyzes only the formation of pseudouridine-55 (Psi55), a highly conserved tRNA modification, in mitochondrial and cytoplasmic tRNAs; also responsible for pseudouracil modification of some mRNAs; PUS4 overexpression leads to translational derepression of GCN4 (Gcd- phenotype) -S000033311 CDS YNL292W 14 82806 84017 W 2005-11-07 1996-07-31 -S000005235 ORF Verified YNL291C MID1 chromosome 14 L000002584 14 85815 84169 C 2005-11-07 1996-07-31 N-glycosylated integral membrane protein of the ER and plasma membrane; functions as a stretch-activated Ca2+-permeable cation channel required for Ca2+ influx stimulated by pheromone; interacts with Cch1p; forms an oligomer -S000033221 CDS YNL291C 14 85815 84169 C 2005-11-07 1996-07-31 -S000005234 ORF Verified YNL290W RFC3 replication factor C subunit 3 chromosome 14 L000001624 14 86218 87240 W 2005-11-07 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); which is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon; relocalizes to the cytosol in response to hypoxia -S000032410 CDS YNL290W 14 86218 87240 W 2005-11-07 1996-07-31 -S000005233 ORF Verified YNL289W PCL1 HCS26 chromosome 14 L000002783 14 87897 88736 W 2005-11-07 1996-07-31 Cyclin, interacts with cyclin-dependent kinase Pho85p; member of the Pcl1,2-like subfamily, involved in the regulation of polarized growth and morphogenesis and progression through the cell cycle; is ubiquitinated by Dma1p; phosphorylation by Pho85p targets it for degradation; localizes to sites of polarized cell growth -S000032399 CDS YNL289W 14 87897 88736 W 2005-11-07 1996-07-31 -S000007304 snoRNA_gene snR40 SNR40 chromosome 14 L000003055 14 89210 89306 W 2005-11-07 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U898 and small subunit (SSU) rRNA at position G1271 -S000030610 noncoding_exon snR40 14 89210 89306 W 2005-11-07 2000-05-19 -S000118384 ARS ARS1407 ARSXIV-90 chromosome 14 14 89531 89804 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178167 ARS_consensus_sequence ARS1407 14 89755 89739 C 2014-11-18 2014-11-18 -S000005232 ORF Verified YNL288W CAF40 CCR4-NOT core subunit CAF40 chromosome 14 14 90303 91424 W 2005-11-07 1996-07-31 Component of the CCR4-NOT transcriptional complex; evolutionarily conserved; involved in controlling mRNA initiation, elongation, and degradation; binds Cdc39p -S000031389 CDS YNL288W 14 90303 91424 W 2005-11-07 1996-07-31 -S000005231 ORF Verified YNL287W SEC21 coatomer subunit gamma chromosome 14 L000001844 14 91994 94801 W 2005-11-07 1996-07-31 Gamma subunit of coatomer; coatomer is a heptameric protein complex that together with Arf1p forms the COPI coat; involved in ER to Golgi transport of selective cargo -S000031285 CDS YNL287W 14 91994 94801 W 2005-11-07 1996-07-31 -S000005230 ORF Verified YNL286W CUS2 U2 snRNP complex subunit CUS2 chromosome 14 L000003273 14 95223 96080 W 2005-11-07 1996-07-31 Putative checkpoint factor in transcription; binds to U2 snRNA and Prp11p; regulates toggling of the U2 snRNA stem II region between different structures; contains two RNA recognition motifs (RRMs) -S000031155 CDS YNL286W 14 95223 96080 W 2005-11-07 1996-07-31 -S000005229 ORF Dubious YNL285W chromosome 14 14 96173 96544 W 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030192 CDS YNL285W 14 96173 96544 W 2005-11-07 1996-07-31 -S000130140 ARS ARS1409 chromosome 14 14 96247 96463 2009-05-06 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006591 tRNA_gene tG(UCC)N SUF6 chromosome 14 L000003700|L000002154 14 96312 96241 C -192 2005-11-07 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000037566 noncoding_exon tG(UCC)N 14 96312 96241 C 2005-11-07 2000-05-19 -S000007140 long_terminal_repeat YNLWtau1 chromosome 14 14 96451 96609 W 2005-11-07 2000-05-19 Ty4 LTR -S000007129 long_terminal_repeat YNLCdelta1 chromosome 14 14 96941 96610 C 2005-11-07 2000-05-19 Ty1 LTR -S000007387 transposable_element_gene YNL284C-B gag-pol fusion protein chromosome 14 S000029017 14 102232 96964 C 2005-11-07 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000031728 CDS YNL284C-B 14 100926 96964 C 2005-11-07 1999-07-17 -S000031727 CDS YNL284C-B 14 102232 100928 C 2005-11-07 1999-07-17 -S000031729 plus_1_translational_frameshift YNL284C-B 14 100927 100927 C 2005-11-07 1999-07-17 -S000007386 transposable_element_gene YNL284C-A gag protein chromosome 14 14 102232 100910 C 2005-11-07 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000031717 CDS YNL284C-A 14 102232 100910 C 2005-11-07 1999-07-17 -S000007134 LTR_retrotransposon YNLCTy1-1 Ty1 chromosome 14 14 102523 96610 C 2005-11-07 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007130 long_terminal_repeat YNLCdelta2 chromosome 14 14 102523 102192 C 2005-11-07 2000-05-19 Ty1 LTR -S000007133 long_terminal_repeat YNLCsigma1 chromosome 14 14 102700 102632 C 2005-11-07 2000-05-19 Ty3 LTR -S000006673 tRNA_gene tN(GUU)N1 chromosome 14 L000003687 14 102716 102789 W 2005-11-07 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000035559 noncoding_exon tN(GUU)N1 14 102716 102789 W 2005-11-07 2000-05-19 -S000005228 ORF Verified YNL284C MRPL10 mitochondrial 54S ribosomal protein YmL10/YmL18|YmL10|YmL18|MRPL18 chromosome 14 L000002689|S000029308|L000002685 14 104102 103134 C 2005-11-07 1996-07-31 Mitochondrial ribosomal protein of the large subunit; appears as two protein spots (YmL10 and YmL18) on two-dimensional SDS gels -S000029964 CDS YNL284C 14 104102 103134 C 2005-11-07 1996-07-31 -S000006744 tRNA_gene tT(AGU)N1 chromosome 14 L000003688 14 104805 104877 W 2005-11-07 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000037414 noncoding_exon tT(AGU)N1 14 104805 104877 W 2005-11-07 2000-05-19 -S000005227 ORF Verified YNL283C WSC2 STA3 chromosome 14 L000004217 14 106695 105184 C 2005-11-07 1996-07-31 Sensor-transducer of the stress-activated PKC1-MPK1 signaling pathway; involved in maintenance of cell wall integrity and recovery from heat shock; required for the arrest of secretion response; WSC2 has a paralog, WSC3, that arose from the whole genome duplication -S000037312 CDS YNL283C 14 106695 105184 C 2005-11-07 1996-07-31 -S000005226 ORF Verified YNL282W POP3 chromosome 14 L000004338 14 107687 108274 W 2005-11-07 1996-07-31 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; relocalizes to the cytosol in response to hypoxia -S000037263 CDS YNL282W 14 107687 108274 W 2005-11-07 1996-07-31 -S000005225 ORF Verified YNL281W HCH1 chromosome 14 L000004817 14 108467 108928 W 2005-11-07 1996-07-31 Heat shock protein regulator; binds to Hsp90p and may stimulate ATPase activity; originally identified as a high-copy number suppressor of a HSP90 loss-of-function mutation; role in regulating Hsp90 inhibitor drug sensitivity; GFP-fusion protein localizes to the cytoplasm and nucleus; protein abundance increases in response to DNA replication stress -S000037163 CDS YNL281W 14 108467 108928 W 2005-11-07 1996-07-31 -S000005224 ORF Verified YNL280C ERG24 delta(14)-sterol reductase chromosome 14 L000000580 14 110411 109095 C 2005-11-07 1996-07-31 C-14 sterol reductase; acts in ergosterol biosynthesis; mutants accumulate the abnormal sterol ignosterol (ergosta-8,14 dienol), and are viable under anaerobic growth conditions but inviable on rich medium under aerobic conditions -S000037018 CDS YNL280C 14 110411 109095 C 2005-11-07 1996-07-31 -S000005223 ORF Verified YNL279W PRM1 pheromone-regulated protein PRM1 chromosome 14 14 110917 112902 W 2005-11-07 1996-07-31 Pheromone-regulated multispanning membrane protein; involved in membrane fusion during mating; predicted to have 5 transmembrane segments and a coiled coil domain; localizes to the shmoo tip; regulated by Ste12p -S000035312 CDS YNL279W 14 110917 112902 W 2005-11-07 1996-07-31 -S000005222 ORF Verified YNL278W CAF120 chromosome 14 14 113271 116453 W 2005-11-07 1996-07-31 Part of the CCR4-NOT transcriptional regulatory complex; involved in controlling mRNA initiation, elongation, and degradation; contains a PH-like domain; CAF120 has a paralog, SKG3, that arose from the whole genome duplication -S000035145 CDS YNL278W 14 113271 116453 W 2005-11-07 1996-07-31 -S000028852 ORF Uncharacterized YNL277W-A chromosome 14 14 116679 116867 W 2005-11-07 2003-07-29 Putative protein of unknown function -S000034565 CDS YNL277W-A 14 116679 116867 W 2005-11-07 2003-07-29 -S000005221 ORF Verified YNL277W MET2 homoserine O-acetyltransferase chromosome 14 L000001077 14 117349 118809 W -187 2005-11-07 1996-07-31 L-homoserine-O-acetyltransferase; catalyzes the conversion of homoserine to O-acetyl homoserine which is the first step of the methionine biosynthetic pathway -S000034987 CDS YNL277W 14 117349 118809 W 2005-11-07 1996-07-31 -S000005220 ORF Dubious YNL276C chromosome 14 14 118826 118431 C 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene MET2/YNL277W -S000033996 CDS YNL276C 14 118826 118431 C 2005-11-07 1996-07-31 -S000005219 ORF Verified YNL275W BOR1 chromosome 14 14 119268 120998 W 2005-11-07 1996-07-31 Boron efflux transporter of the plasma membrane; binds HCO3-, I-, Br-, NO3- and Cl-; has similarity to the characterized boron efflux transporter A. thaliana BOR1 -S000033936 CDS YNL275W 14 119268 120998 W 2005-11-07 1996-07-31 -S000005218 ORF Verified YNL274C GOR1 glyoxylate reductase chromosome 14 14 122170 121118 C 2005-11-07 1996-07-31 Glyoxylate reductase; null mutation results in increased biomass after diauxic shift; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress -S000033106 CDS YNL274C 14 122170 121118 C 2005-11-07 1996-07-31 -S000005217 ORF Verified YNL273W TOF1 chromosome 14 L000004244 14 122883 126599 W 2005-11-07 1996-07-31 Subunit of a replication-pausing checkpoint complex; Tof1p-Mrc1p-Csm3p acts at the stalled replication fork to promote sister chromatid cohesion after DNA damage, facilitating gap repair of damaged DNA; interacts with the MCM helicase; relocalizes to the cytosol in response to hypoxia -S000033053 CDS YNL273W 14 122883 126599 W 2005-11-07 1996-07-31 -S000130141 ARS ARS1410 chromosome 14 14 126599 126805 2009-05-06 2009-05-06 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000005216 ORF Verified YNL272C SEC2 guanine nucleotide exchange factor SEC2 chromosome 14 L000001828 14 129084 126805 C -176 2005-11-07 1996-07-31 Guanyl-nucleotide exchange factor for the small G-protein Sec4p; essential for post-Golgi vesicle transport and for autophagy; associates with the exocyst, via exocyst subunit Sec15p, on secretory vesicles -S000032904 CDS YNL272C 14 129084 126805 C 2005-11-07 1996-07-31 -S000005215 ORF Verified YNL271C BNI1 formin BNI1|SHE5|PPF3 chromosome 14 L000000190 14 135383 129522 C 2011-02-03 1996-07-31|2011-02-03 Formin; polarisome component; nucleates the formation of linear actin filaments, involved in cell processes such as budding and mitotic spindle orientation which require the formation of polarized actin cables; recruited to the division site in a Glc7p/Ref2p dependent manner following release of Bnr1p; functionally redundant with BNR1 -S000032829 CDS YNL271C 14 135383 129522 C 2011-02-03 1996-07-31|2011-02-03 -S000005214 ORF Verified YNL270C ALP1 arginine permease ALP1|APL1 chromosome 14 L000000080 14 137661 135940 C 2011-02-03 1996-07-31 Arginine transporter; expression is normally very low and it is unclear what conditions would induce significant expression; ALP1 has a paralog, CAN1, that arose from the whole genome duplication -S000031915 CDS YNL270C 14 137661 135940 C 2011-02-03 1996-07-31 -S000005213 ORF Verified YNL269W BSC4 chromosome 14 14 137699 138094 W 2011-02-03 1996-07-31 Protein of unknown function; protein-coding gene that evolved de novo via a series of point mutations in noncoding sequence; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; readthrough is increased upon depletion of Sup35p; may be involved in DNA repair pathway during stationary phase and contribute to robustness of cells when shifted to a nutrient-poor environment -S000032644 CDS YNL269W 14 137699 138094 W 2011-02-03 1996-07-31 -S000005212 ORF Verified YNL268W LYP1 lysine permease chromosome 14 L000000963 14 138550 140385 W 2011-02-03 1996-07-31 Lysine permease; one of three amino acid permeases (Alp1p, Can1p, Lyp1p) responsible for uptake of cationic amino acids -S000031660 CDS YNL268W 14 138550 140385 W 2011-02-03 1996-07-31 -S000005211 ORF Verified YNL267W PIK1 1-phosphatidylinositol 4-kinase|PIK120|PIK41 chromosome 14 L000001439|L000001438 14 140878 144078 W 2011-02-03 1996-07-31 Phosphatidylinositol 4-kinase; catalyzes first step in the biosynthesis of phosphatidylinositol-4,5-biphosphate; may control cytokinesis through the actin cytoskeleton; may control nonselective autophagy and mitophagy through trafficking of Atg9p -S000031530 CDS YNL267W 14 140878 144078 W 2011-02-03 1996-07-31 -S000005210 ORF Dubious YNL266W chromosome 14 14 144245 144664 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF IST1/YNL265C -S000031404 CDS YNL266W 14 144245 144664 W 2011-02-03 1996-07-31 -S000005209 ORF Verified YNL265C IST1 chromosome 14 14 145281 144280 C 2011-02-03 1996-07-31 Protein with positive role in the multivesicular body sorting pathway; functions and forms a complex with Did2p; recruitment to endosomes is mediated by the Vps2p-Vps24p subcomplex of ESCRT-III; also interacts with Vps4p -S000030432 CDS YNL265C 14 145149 144280 C 2011-02-03 1996-07-31 -S000030431 CDS YNL265C 14 145281 145255 C 2011-02-03 1996-07-31 -S000030433 intron YNL265C 14 145254 145150 C 2011-02-03 1996-07-31 -S000005208 ORF Verified YNL264C PDR17 phosphatidylinositol transporter|SFH4|ISS1 chromosome 14 L000004780 14 146615 145563 C 2011-02-03 1996-07-31 Phosphatidylinositol transfer protein (PITP); downregulates Plb1p-mediated turnover of phosphatidylcholine; forms a complex with Psd2p which appears essential for maintenance of vacuolar PE levels; found in the cytosol and microsomes; homologous to Pdr16p; deletion affects phospholipid composition -S000030276 CDS YNL264C 14 146615 145563 C 2011-02-03 1996-07-31 -S000005207 ORF Verified YNL263C YIF1 chromosome 14 L000004141|L000003364 14 147840 146896 C 2011-02-03 1996-07-31 Integral membrane protein; required for the fusion of ER-derived COPII transport vesicles with the Golgi; interacts with Yip1p and Yos1p; localizes to the Golgi, the ER, and COPII vesicles; homolog of human YIPF3 -S000037532 CDS YNL263C 14 147840 146896 C 2011-02-03 1996-07-31 -S000005206 ORF Verified YNL262W POL2 DNA polymerase epsilon catalytic subunit|DUN2 chromosome 14 L000001461 14 148212 154880 W -170 2011-02-03 1996-07-31 Catalytic subunit of DNA polymerase (II) epsilon; a chromosomal DNA replication polymerase that exhibits processivity and proofreading exonuclease activity; participates in leading-strand synthesis during DNA replication; also involved in DNA synthesis during DNA repair; interacts extensively with Mrc1p -S000037477 CDS YNL262W 14 148212 154880 W 2011-02-03 1996-07-31 -S000005205 ORF Verified YNL261W ORC5 origin recognition complex subunit 5 chromosome 14 L000002814 14 155100 156539 W 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing -S000037358 CDS YNL261W 14 155100 156539 W 2011-02-03 1996-07-31 -S000005204 ORF Verified YNL260C LTO1 ribosome biosynthesis protein LTO1 chromosome 14 14 157455 156859 C 2011-02-03 1996-07-31 Essential protein that forms a complex with Rli1p and Yae1p; ortholog of human ORAOV1, which is overexpressed in solid tumors; inviability of null mutant under standard conditions is complemented by overexpression of ORAOV1; essential for growth under standard (aerobic) conditions but not under anaerobic conditions; may have a role in protection of ribosomal assembly and function from damage due to reactive oxygen species -S000036594 CDS YNL260C 14 157455 156859 C 2011-02-03 1996-07-31 -S000005203 ORF Verified YNL259C ATX1 copper metallochaperone ATX1 chromosome 14 L000000155 14 157865 157644 C 2011-02-03 1996-07-31 Cytosolic copper metallochaperone; transports copper to the secretory vesicle copper transporter Ccc2p for eventual insertion into Fet3p, which is a multicopper oxidase required for high-affinity iron uptake; human homolog ATOX1 can complement yeast atx1 mutant; overexpression of human ATOX1 suppresses lysine auxotrophy of the yeast sod1 null mutant, as does overexpression of yeast ATX1 -S000035583 CDS YNL259C 14 157865 157644 C 2011-02-03 1996-07-31 -S000005202 ORF Verified YNL258C DSL1 RNS1 chromosome 14 L000004950 14 160373 158109 C 2011-02-03 1996-07-31 Peripheral membrane protein needed for Golgi-to-ER retrograde traffic; mediates Sey1p-independent homotypic ER fusion; forms Dsl1 tethering complex with Sec39p and Tip20p that forms a stable complex with ER SNAREs Sec20p, Ufe1p and Use1p and is functionally conserved from yeast to mammalian cells; component of the ER target site that interacts with coatomer; interacts with different subunits of COPI vesicle coat; interacts with Cin5p; homolog of fly and human ZW10 gene -S000035489 CDS YNL258C 14 160373 158109 C 2011-02-03 1996-07-31 -S000005201 ORF Verified YNL257C SIP3 LAM3 chromosome 14 L000001892 14 164320 160631 C 2011-02-03 1996-07-31 Putative sterol transfer protein; has a probable role in retrograde transport of sterols from the plasma membrane to the ER; co-localizes to puncta in the cortical ER with Ysp2p; contains GRAM, StART-like (VASt) and two PH-like domains; one of 6 StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes; previously identified as a transcription cofactor that interacts with DNA-bound Snf1p -S000035355 CDS YNL257C 14 164320 160631 C 2011-02-03 1996-07-31 -S000005200 ORF Verified YNL256W FOL1 trifunctional dihydropteroate synthetase/dihydrohydroxymethylpterin pyrophosphokinase/dihydroneopterin aldolase FOL1 chromosome 14 L000000620 14 164623 167097 W -170 2011-02-03 2003-09-22|1996-07-31 Multifunctional enzyme of the folic acid biosynthesis pathway; has dihydropteroate synthetase, dihydro-6-hydroxymethylpterin pyrophosphokinase, and dihydroneopterin aldolase activities -S000034407 CDS YNL256W 14 164623 167097 W 2011-02-03 2003-09-22|1996-07-31 -S000005199 ORF Verified YNL255C GIS2 mRNA-binding translational activator GIS2 chromosome 14 L000004862 14 167790 167329 C 2011-02-03 1996-07-31 Translational activator for mRNAs with internal ribosome entry sites; associates with polysomes and binds to a specific subset of mRNAs; localizes to RNA processing bodies (P bodies) and to stress granules; may have a role in translation regulation under stress conditions; ortholog of human ZNF9/CNBP, a gene involved in myotonic dystrophy type 2 -S000034231 CDS YNL255C 14 167790 167329 C 2011-02-03 1996-07-31 -S000005198 ORF Verified YNL254C RTC4 chromosome 14 14 169248 168043 C 2011-02-03 1996-07-31 Protein of unknown function; null mutation suppresses cdc13-1 temperature sensitivity; (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000034113 CDS YNL254C 14 169248 168043 C 2011-02-03 1996-07-31 -S000077373 ARS ARS1411 ARSXIV-170 chromosome 14 14 169675 169753 2014-11-18 2014-11-18|2004-10-18|2006-09-07 ARS activated in late S phase -S000178168 ARS_consensus_sequence ARS1411 14 169748 169732 C 2014-11-18 2014-11-18 -S000005197 ORF Verified YNL253W TEX1 chromosome 14 14 170018 171286 W 2011-02-03 1996-07-31 Protein involved in mRNA export; component of the transcription export (TREX) complex -S000033293 CDS YNL253W 14 170018 171286 W 2011-02-03 1996-07-31 -S000005196 ORF Verified YNL252C MRPL17 mitochondrial 54S ribosomal protein YmL17/YmL30|YmL17|YmL30|MRPL30 chromosome 14 L000001703|L000002266|L000002692 14 172286 171441 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000033203 CDS YNL252C 14 172286 171441 C 2011-02-03 1996-07-31 -S000005195 ORF Verified YNL251C NRD1 Nrd1 complex RNA-binding subunit chromosome 14 L000002862 14 174315 172588 C 2011-02-03 1996-07-31 RNA-binding subunit of Nrd1 complex; complex interacts with exosome to mediate 3'-end formation of some mRNAs, snRNAs, snoRNAs, and CUTs; interacts with CTD of RNA pol II large subunit Rpo21p at phosphorylated Ser5 to direct transcription termination of non-polyadenylated transcripts; H3K4 trimethylation of transcribed regions by Set1p enhances recruitment of Nrd1p to those sites; role in regulation of mitochondrial abundance and cell size -S000033151 CDS YNL251C 14 174315 172588 C 2011-02-03 1996-07-31 -S000005194 ORF Verified YNL250W RAD50 MRX complex DNA-binding subunit chromosome 14 L000001570 14 175410 179348 W -170 2011-02-03 1996-07-31 Subunit of MRX complex with Mre11p and Xrs2p; complex is involved in processing double-strand DNA breaks in vegetative cells, initiation of meiotic DSBs, telomere maintenance, and nonhomologous end joining; forms nuclear foci upon DNA replication stress -S000033124 CDS YNL250W 14 175410 179348 W 2011-02-03 1996-07-31 -S000005193 ORF Verified YNL249C MPA43 chromosome 14 L000003096 14 181022 179394 C 2011-02-03 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032322 CDS YNL249C 14 181022 179394 C 2011-02-03 1996-07-31 -S000005192 ORF Verified YNL248C RPA49 DNA-directed RNA polymerase I subunit RPA49|A49 chromosome 14 L000001673 14 182608 181361 C 2011-02-03 1996-07-31 RNA polymerase I subunit A49; essential for nucleolar assembly and for high polymerase loading rate; required for nucleolar localization of Rpa34p -S000032212 CDS YNL248C 14 182608 181361 C 2011-02-03 1996-07-31 -S000005191 ORF Verified YNL247W cysteine--tRNA ligase chromosome 14 14 182875 185178 W 2011-02-03 1996-07-31 Cysteinyl-tRNA synthetase; may interact with ribosomes, based on co-purification experiments; human gene CARS allows growth of the yeast haploid null mutant after sporulation of a heterozygous diploid -S000031279 CDS YNL247W 14 182875 185178 W 2011-02-03 1996-07-31 -S000005190 ORF Verified YNL246W VPS75 chromosome 14 14 185460 186349 W 2011-02-03 1996-07-31 NAP family histone chaperone; binds to histones and Rtt109p, stimulating histone acetyltransferase activity; possesses nucleosome assembly activity in vitro; proposed role in vacuolar protein sorting and in double-strand break repair; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia -S000031149 CDS YNL246W 14 185460 185491 W 2011-02-03 1996-07-31 -S000031150 CDS YNL246W 14 185587 186349 W 2011-02-03 1996-07-31 -S000031151 intron YNL246W 14 185492 185586 W 2011-02-03 1996-07-31 -S000005189 ORF Verified YNL245C CWC25 U2-type spliceosomal complex subunit CWC25 chromosome 14 14 186885 186346 C 2011-02-03 1996-07-31 Splicing factor required for the first step of pre-mRNA splicing; binding to the spliceosome requires Prp2p and Yju2p; heat-stable protein; has similarity to S. pombe Cwf25p -S000030978 CDS YNL245C 14 186885 186346 C 2011-02-03 1996-07-31 -S000005188 ORF Verified YNL244C SUI1 translation initiation factor eIF1|RFR1|MOF2 chromosome 14 L000002177 14 187496 187170 C -171 2011-02-03 1996-07-31 Translation initiation factor eIF1; component of a complex involved in recognition of the initiator codon; modulates translation accuracy at the initiation phase -S000029973 CDS YNL244C 14 187496 187170 C 2011-02-03 1996-07-31 -S000005187 ORF Verified YNL243W SLA2 MOP2|END4 chromosome 14 L000001913|L000002421 14 188051 190957 W 2011-02-03 1996-07-31|2011-02-03 Adaptor protein that links actin to clathrin and endocytosis; involved in membrane cytoskeleton assembly and cell polarization; present in the actin cortical patch of the emerging bud tip; dimer in vivo -S000029929 CDS YNL243W 14 188051 190957 W 2011-02-03 1996-07-31|2011-02-03 -S000005186 ORF Verified YNL242W ATG2 APG2|AUT8|SPO72 chromosome 14 L000004782 14 191324 196102 W 2011-02-03 1996-07-31 Peripheral membrane protein required for autophagic vesicle formation; also required for vesicle formation during pexophagy and the cytoplasm-to-vaucole targeting (Cvt) pathway; involved in Atg9p cycling between the phagophore assembly site and mitochondria; contains an APT1 domain that binds phosphatidylinositol-3-phosphate; essential for cell cycle progression from G2/M to G1 under nitrogen starvation; forms cytoplasmic foci upon DNA replication stress -S000037889 CDS YNL242W 14 191324 196102 W 2011-02-03 1996-07-31 -S000077374 ARS ARS1412 ARSXIV-196 chromosome 14 14 196134 196232 2014-11-18 2014-11-18|2004-10-18|2006-09-07 ARS activated in late S phase -S000005185 ORF Verified YNL241C ZWF1 glucose-6-phosphate dehydrogenase|POS10|MET19 chromosome 14 L000002572 14 197943 196426 C -153 2011-02-03 1996-07-31 Glucose-6-phosphate dehydrogenase (G6PD); catalyzes the first step of the pentose phosphate pathway; involved in adapting to oxidative stress; protein abundance increases in response to DNA replication stress; homolog of human G6PD which is deficient in patients with hemolytic anemia; human G6PD can complement yeast zwf1 null mutant -S000037074 CDS YNL241C 14 197943 196426 C 2011-02-03 1996-07-31 -S000005184 ORF Verified YNL240C NAR1 chromosome 14 14 199977 198502 C 2011-02-03 1996-07-31 Subunit of the cytosolic iron-sulfur (FeS) protein assembly machinery; required for maturation of cytosolic and nuclear FeS proteins and for normal resistance to oxidative stress; deficiency results in shortened lifespan and sensitivity to paraquat; homologous to human Narf -S000037001 CDS YNL240C 14 199977 198502 C 2011-02-03 1996-07-31 -S000005183 ORF Verified YNL239W LAP3 bleomycin hydrolase|YCP1|GAL6|BLH1 chromosome 14 L000002502|L000000929 14 200569 201933 W -152 2011-02-03 2003-01-07|1996-07-31 Cysteine aminopeptidase with homocysteine-thiolactonase activity; protects cells against homocysteine toxicity; has bleomycin hydrolase activity in vitro; transcription is regulated by galactose via Gal4p; orthologous to human BLMH -S000036318 CDS YNL239W 14 200569 201933 W 2011-02-03 2003-01-07|1996-07-31 -S000005182 ORF Verified YNL238W KEX2 kexin KEX2|yscF|SRB1|VMA45|QDS1 chromosome 14 L000000896 14 202428 204872 W -147 2011-02-03 1996-07-31 Kexin, a subtilisin-like protease (proprotein convertase); a calcium-dependent serine protease involved in the activation of proproteins of the secretory pathway -S000036210 CDS YNL238W 14 202428 204872 W 2011-02-03 1996-07-31 -S000005181 ORF Verified YNL237W YTP1 chromosome 14 L000003036 14 205188 206567 W 2011-02-03 1996-07-31 Probable type-III integral membrane protein of unknown function; has regions of similarity to mitochondrial electron transport proteins -S000036063 CDS YNL237W 14 205188 206567 W 2011-02-03 1996-07-31 -S000005180 ORF Verified YNL236W SIN4 SSX3|MED16|RYE1|TSF3|SSN4|SSF5|SDI3|GAL22|BEL2 chromosome 14 L000001888|S000029516|L000002099 14 206930 209854 W -145 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; contributes to both postive and negative transcriptional regulation; dispensible for basal transcription -S000035179 CDS YNL236W 14 206930 209854 W 2011-02-03 1996-07-31 -S000005179 ORF Dubious YNL235C chromosome 14 14 209979 209548 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SIN4/YNL236W, a subunit of the mediator complex -S000034886 CDS YNL235C 14 209979 209548 C 2011-02-03 1996-07-31 -S000005178 ORF Verified YNL234W chromosome 14 14 210233 211513 W 2011-02-03 1996-07-31 Protein of unknown function with similarity to globins; has a functional heme-binding domain; mutant has aneuploidy tolerance; transcription induced by stress conditions; may be involved in glucose signaling or metabolism; regulated by Rgt1 -S000034841 CDS YNL234W 14 210233 211513 W 2011-02-03 1996-07-31 -S000005177 ORF Verified YNL233W BNI4 chromosome 14 L000003517 14 211922 214600 W 2011-02-03 1996-07-31 Targeting subunit for Glc7p protein phosphatase; localized to the bud neck, required for localization of chitin synthase III to the bud neck via interaction with the chitin synthase III regulatory subunit Skt5p; phosphorylation by Slt2p and Kss1p involved in regulating Bni4p in septum assembly -S000033930 CDS YNL233W 14 211922 214600 W 2011-02-03 1996-07-31 -S000005176 ORF Verified YNL232W CSL4 exosome non-catalytic core subunit CSL4|SKI4 chromosome 14 L000001905|L000004677 14 214923 215801 W 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; predicted to contain an S1 RNA binding domain; human homolog EXOSC1 partially complements yeast csl4 null mutant, and can complement inviability of strain in which expression of CSL4 is repressed -S000033848 CDS YNL232W 14 214923 215801 W 2011-02-03 1996-07-31 -S000005175 ORF Verified YNL231C PDR16 phosphatidylinositol transporter|SFH3 chromosome 14 L000004779 14 217042 215987 C 2011-02-03 1996-07-31 Phosphatidylinositol transfer protein (PITP); controlled by the multiple drug resistance regulator Pdr1p; localizes to lipid particles and microsomes; controls levels of various lipids, may regulate lipid synthesis; homologous to Pdr17p; protein abundance increases in response to DNA replication stress -S000033675 CDS YNL231C 14 217042 215987 C 2011-02-03 1996-07-31 -S000005174 ORF Verified YNL230C ELA1 elongin A chromosome 14 L000004956 14 218662 217523 C 2011-02-03 1996-07-31 Elongin A; F-box protein that forms a heterodimer with Elc1p and is required for ubiquitin-dependent degradation of the RNA Polymerase II subunit Rpo21p; subunit of the Elongin-Cullin-Socs (ECS) ligase complex -S000033008 CDS YNL230C 14 218662 217523 C 2011-02-03 1996-07-31 -S000005173 ORF Verified YNL229C URE2 [URE3] chromosome 14 L000002439 14 220201 219137 C -142 2011-02-03 1996-07-31 Nitrogen catabolite repression transcriptional regulator; inhibits GLN3 transcription in good nitrogen source; role in sequestering Gln3p and Gat1p to the cytoplasm; has glutathione peroxidase activity and can mutate to acquire GST activity; self-assembly under limited nitrogen conditions creates [URE3] prion and releases catabolite repression -S000034177 CDS YNL229C 14 220201 219137 C 2011-02-03 1996-07-31 -S000005172 ORF Dubious YNL228W chromosome 14 14 220645 221421 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF YNL227C/JJJ1 -S000034107 CDS YNL228W 14 220645 221421 W 2011-02-03 1996-07-31 -S000005170 ORF Dubious YNL226W chromosome 14 14 222239 222649 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene JJJ1/YNL227C -S000032023 CDS YNL226W 14 222239 222649 W 2011-02-03 1996-07-31 -S000005171 ORF Verified YNL227C JJJ1 chromosome 14 14 222431 220659 C 2011-02-03 1996-07-31 Co-chaperone that stimulates the ATPase activity of Ssa1p; required for a late step of ribosome biogenesis; associated with the cytosolic large ribosomal subunit; contains a J-domain; mutation causes defects in fluid-phase endocytosis -S000032103 CDS YNL227C 14 222431 220659 C 2011-02-03 1996-07-31 -S000005169 ORF Verified YNL225C CNM67 chromosome 14 L000004012 14 224469 222724 C 2011-02-03 1996-07-31 Component of the spindle pole body outer plaque; required for spindle orientation and mitotic nuclear migration; CNM67 has a paralog, ADY3, that arose from the whole genome duplication -S000031798 CDS YNL225C 14 224469 222724 C 2011-02-03 1996-07-31 -S000005168 ORF Verified YNL224C SQS1 PFA1 chromosome 14 14 227099 224796 C 2011-02-03 1996-07-31 Protein that stimulates the ATPase and helicase activities of Prp43p; acts with Prp43p to stimulate 18s rRNA maturation by Nob1p; overexpression antagonizes the suppression of splicing defects by spp382 mutants; component of pre-ribosomal particles; relocalizes from nucleus to nucleolus upon DNA replication stress -S000030829 CDS YNL224C 14 227099 224796 C 2011-02-03 1996-07-31 -S000005167 ORF Verified YNL223W ATG4 cysteine protease ATG4|AUT2|APG4 chromosome 14 L000004606|L000004784 14 227370 228854 W 2011-02-03 2003-09-22|1996-07-31 Conserved cysteine protease required for autophagy; cleaves Atg8p to a form required for autophagosome and Cvt vesicle generation -S000030783 CDS YNL223W 14 227370 228854 W 2011-02-03 2003-09-22|1996-07-31 -S000005166 ORF Verified YNL222W SSU72 RNA polymerase II subunit A C-terminal domain phosphatase chromosome 14 L000003154 14 229094 229714 W 2011-02-03 1996-07-31 Phosphatase and transcription/RNA-processing factor; associates with TFIIB and cleavage/polyadenylation factor Pta1p; exhibits phosphatase activity on serine-5 and serine-7 of the RNA polymerase II C-terminal domain; affects start site selection and transcriptional read through in vivo -S000030662 CDS YNL222W 14 229094 229714 W 2011-02-03 1996-07-31 -S000007295 snRNA_gene snR19 SNR19 U1 chromosome 14 L000001967 14 230672 230105 C 2011-02-03 2004-04-02 U1 spliceosomal RNA (U1 snRNA); snRNA U1 homolog -S000036596 noncoding_exon snR19 14 230672 230105 C 2011-02-03 2004-04-02 -S000005165 ORF Verified YNL221C POP1 ribonuclease P/MRP protein subunit POP1 chromosome 14 L000002587 14 233695 231068 C 2011-02-03 1996-07-31 Subunit of RNase MRP, nuclear RNase P and telomerase complexes; RNase MRP cleaves pre-rRNA, nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs, while telomerase replenishes telomeric DNA; binds to the RPR1 RNA subunit in RNase P -S000037760 CDS YNL221C 14 233695 231068 C 2011-02-03 1996-07-31 -S000005164 ORF Verified YNL220W ADE12 adenylosuccinate synthase|BRA9 chromosome 14 L000000039 14 234413 235714 W -151 2011-02-03 1996-07-31 Adenylosuccinate synthase; catalyzes the first step in synthesis of adenosine monophosphate from inosine 5'monophosphate during purine nucleotide biosynthesis; exhibits binding to single-stranded autonomously replicating (ARS) core sequence -S000037738 CDS YNL220W 14 234413 235714 W 2011-02-03 1996-07-31 -S000005163 ORF Verified YNL219C ALG9 dolichyl-P-Man:Man(6)GlcNAc(2)-PP-dolichol alpha-1,2-mannosyltransferase chromosome 14 L000003394 14 237663 235996 C 2011-02-03 1996-07-31 Mannosyltransferase, involved in N-linked glycosylation; catalyzes the transfer of both the seventh mannose residue on B-arm and ninth mannose residue on the C-arm from Dol-P-Man to lipid-linked oligosaccharides; human homolog ALG9 can complement yeast null mutant; mutation of human homolog causes type 1 congenital disorders of glycosylation -S000029975 CDS YNL219C 14 237663 235996 C 2011-02-03 1996-07-31 -S000005162 ORF Verified YNL218W MGS1 ssDNA-dependent ATPase MGS1 chromosome 14 14 238238 240001 W 2011-02-03 1996-07-31 Protein with DNA-dependent ATPase and ssDNA annealing activities; involved in maintenance of genome; interacts functionally with DNA polymerase delta; homolog of human Werner helicase interacting protein (WHIP); forms nuclear foci upon DNA replication stress -S000029915 CDS YNL218W 14 238238 240001 W 2011-02-03 1996-07-31 -S000005161 ORF Uncharacterized YNL217W putative serine/threonine-protein phosphatase chromosome 14 14 240331 241311 W 2011-02-03 1996-07-31 Putative protein of unknown function; weak sequence similarity to bis (5'-nucleotidyl)-tetraphosphatases; (GFP)-fusion protein localizes to the vacuole; null mutant is highly sensitive to azaserine and resistant to sodium-O-vandate -S000037905 CDS YNL217W 14 240331 241311 W 2011-02-03 1996-07-31 -S000005160 ORF Verified YNL216W RAP1 DNA-binding transcription factor RAP1|TUF1|TBA1|GRF1 chromosome 14 L000001581 14 241689 244172 W -148 2011-02-03 1996-07-31 Essential DNA-binding transcription regulator that binds many loci; involved in transcription activation, repression, chromatin silencing, telomere length maintenance; relocalizes to cytosol under hypoxia; conserved protein with N-terminal BRCT domain, central region with homology to Myb DNA binding domain, and C-terminal Rap1-specific protein-interaction domain (RCT domain); recruits Sir complex to telomeric DNA; present in quiescent cell telomere hyperclusters -S000037812 CDS YNL216W 14 241689 244172 W 2011-02-03 1996-07-31 -S000005159 ORF Verified YNL215W IES2 chromosome 14 14 244468 245430 W 2011-02-03 1996-07-31 Protein that associates with the INO80 chromatin remodeling complex; associates with the INO80 complex under low-salt conditions; essential for growth under anaerobic conditions; protein abundance increases in response to DNA replication stress -S000035947 CDS YNL215W 14 244468 245430 W 2011-02-03 1996-07-31 -S000005158 ORF Verified YNL214W PEX17 PAS9 chromosome 14 L000003963 14 245617 246216 W 2011-02-03 1996-07-31 Membrane peroxin of the peroxisomal importomer complex; complex facilitates the import of peroxisomal matrix proteins; required for peroxisome biogenesis -S000035811 CDS YNL214W 14 245617 246216 W 2011-02-03 1996-07-31 -S000005157 ORF Verified YNL213C RRG9 chromosome 14 14 247104 246460 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant lacks mitochondrial DNA and cannot grow on glycerol; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000034770 CDS YNL213C 14 247104 246460 C 2011-02-03 1996-07-31 -S000005156 ORF Verified YNL212W VID27 chromosome 14 14 247461 249809 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; possibly involved in vacuolar protein degradation; not essential for proteasome-dependent degradation of fructose-1,6-bisphosphatase (FBPase); null mutants exhibit normal growth; contains two PH-like domains -S000034713 CDS YNL212W 14 247461 249809 W 2011-02-03 1996-07-31 -S000005155 ORF Uncharacterized YNL211C MRX7 chromosome 14 14 250315 250055 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YNL211C is not an essential gene -S000034553 CDS YNL211C 14 250315 250055 C 2011-02-03 1996-07-31 -S000077375 ARS ARS1413 chromosome 14 14 250315 250931 2011-02-03 2004-10-18 Strong origin of replication activated in late S phase -S000005154 ORF Verified YNL210W MER1 chromosome 14 L000001074 14 250931 251743 W -138 2011-02-03 1996-07-31 mRNA-binding protein required for meiosis-specific mRNA splicing; required for chromosome pairing and meiotic recombination; Mer1p regulon embraces four essential meiotic pre-mRNAs: REC107, HFM1, AMA1 and SPO22 -S000034504 CDS YNL210W 14 250931 251743 W 2011-02-03 1996-07-31 -S000005153 ORF Verified YNL209W SSB2 Hsp70 family ATPase SSB2|YG103 chromosome 14 L000002715 14 252059 253900 W 2011-02-03 1996-07-31 Cytoplasmic ATPase that is a ribosome-associated molecular chaperone; functions with J-protein partner Zuo1p; may be involved in the folding of newly-synthesized polypeptide chains; member of the HSP70 family; SSB2 has a paralog, SSB1, that arose from the whole genome duplication -S000035043 CDS YNL209W 14 252059 253900 W 2011-02-03 1996-07-31 -S000005152 ORF Verified YNL208W chromosome 14 14 254418 255017 W 2011-02-03 2004-02-19|1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; authentic, non-tagged protein is detected in purified mitochondria in high-throughput studies; potential orthologs found in other fungi -S000034895 CDS YNL208W 14 254418 255017 W 2011-02-03 2004-02-19|1996-07-31 -S000005151 ORF Verified YNL207W RIO2 protein kinase RIO2 chromosome 14 14 255353 256630 W 2011-02-03 1996-07-31 Essential serine kinase involved in the processing of 20S pre-rRNA; involved in the processing of the 20S pre-rRNA into mature 18S rRNA; has similarity to Rio1p -S000034789 CDS YNL207W 14 255353 256630 W 2011-02-03 1996-07-31 -S000005150 ORF Verified YNL206C RTT106 chromosome 14 14 258155 256788 C 2011-02-03 1996-07-31 Histone chaperone; involved in regulation of chromatin structure in both transcribed and silenced chromosomal regions; affects transcriptional elongation; has a role in regulation of Ty1 transposition; interacts physically and functionally with Chromatin Assembly Factor-1 (CAF-1) -S000033853 CDS YNL206C 14 258155 256788 C 2011-02-03 1996-07-31 -S000005149 ORF Dubious YNL205C chromosome 14 14 258577 258155 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033703 CDS YNL205C 14 258577 258155 C 2011-02-03 1996-07-31 -S000005148 ORF Verified YNL204C SPS18 SPX18 chromosome 14 L000002042 14 259277 258375 C 2011-02-03 1996-07-31 Protein of unknown function, contains a putative zinc-binding domain; expressed during sporulation; SPS18 has a paralog, GCS1, that arose from the whole genome duplication -S000030383 CDS YNL204C 14 259277 258375 C 2011-02-03 1996-07-31 -S000005146 ORF Verified YNL202W SPS19 SPX19 chromosome 14 L000002043 14 259578 260456 W 2011-02-03 1996-07-31|2006-05-10 Peroxisomal 2,4-dienoyl-CoA reductase; auxiliary enzyme of fatty acid beta-oxidation; homodimeric enzyme required for growth and sporulation on petroselineate medium; expression induced during late sporulation and in the presence of oleate -S000030188 CDS YNL202W 14 259578 260456 W 2011-02-03 1996-07-31|2006-05-10 -S000005147 ORF Dubious YNL203C chromosome 14 14 260050 259439 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030248 CDS YNL203C 14 260050 259439 C 2011-02-03 1996-07-31 -S000005145 ORF Verified YNL201C PSY2 chromosome 14 14 263203 260627 C 2011-02-03 1996-07-31 Subunit of protein phosphatase PP4 complex; Pph3p and Psy2p form the active complex, Psy4p may provide additional substrate specificity; regulates recovery from the DNA damage checkpoint, the gene conversion- and single-strand annealing-mediated pathways of meiotic double-strand break repair and efficient Non-Homologous End-Joining (NHEJ) pathway; Pph3p and Psy2p localize to foci on meiotic chromosomes; putative homolog of mammalian R3 -S000030016 CDS YNL201C 14 263203 260627 C 2011-02-03 1996-07-31 -S000005144 ORF Verified YNL200C NNR1 NADHX epimerase chromosome 14 14 264453 263713 C 2011-02-03 1996-07-31 NADHX epimerase; catalyzes isomerization of (R)- and (S)-NADHX; homologous to AIBP in mammals and the N- terminal domain of YjeF in E.coli; enzyme is widespread in eukaryotes, prokaryotes and archaea; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000037373 CDS YNL200C 14 264453 263713 C 2011-02-03 1996-07-31 -S000005143 ORF Verified YNL199C GCR2 chromosome 14 L000000691 14 266530 264926 C 2011-02-03 1996-07-31 Transcriptional activator of genes involved in glycolysis; interacts and functions with the DNA-binding protein Gcr1p -S000032854 CDS YNL199C 14 266530 264926 C 2011-02-03 1996-07-31 -S000005142 ORF Dubious YNL198C chromosome 14 14 266816 266514 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032762 CDS YNL198C 14 266816 266514 C 2011-02-03 1996-07-31 -S000005141 ORF Verified YNL197C WHI3 mRNA-binding protein WHI3 chromosome 14 L000002486 14 269593 267608 C 2011-02-03 1996-07-31 RNA binding protein that sequesters CLN3 mRNA in cytoplasmic foci; regulates genes involved in the cell cycle, sister chromatid cohesion, and stress response; acts as a cytoplasmic retention factor for Cdc28p and associated cyclins; regulates cell fate and dose-dependently regulates the critical cell size required for passage through Start; Tpk1p (PKA) mediated phosphorylation (S568) inhibits Whi3p function, decreasing its interaction with CLN3 mRNA; regulates ploidy -S000032683 CDS YNL197C 14 269593 267608 C 2011-02-03 1996-07-31 -S000005140 ORF Verified YNL196C SLZ1 chromosome 14 L000004192 14 271171 270275 C 2011-02-03 1996-07-31 Sporulation-specific protein with a leucine zipper motif; subunit of the MIS complex which controls mRNA methylation during during the induction of sporulation -S000032589 CDS YNL196C 14 271171 270275 C 2011-02-03 1996-07-31 -S000005139 ORF Uncharacterized YNL195C chromosome 14 14 272308 271523 C 2011-02-03 2004-02-18|1996-07-31 Protein of unknown function; shares a promoter with YNL194C; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YNL195C has a paralog, HBT1, that arose from the whole genome duplication -S000031608 CDS YNL195C 14 272308 271523 C 2011-02-03 2004-02-18|1996-07-31 -S000005138 ORF Verified YNL194C chromosome 14 14 273615 272710 C 2011-02-03 1996-07-31 Integral membrane protein; required for sporulation and plasma membrane sphingolipid content; similar to SUR7; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; GFP-fusion protein is more abundant at MCCs (membrane compartment occupied by Can1) in the presence of glycerol and oleate; YNL194C has a paralog, FMP45, that arose from the whole genome duplication -S000031471 CDS YNL194C 14 273615 272710 C 2011-02-03 1996-07-31 -S000005137 ORF Uncharacterized YNL193W chromosome 14 14 274368 276044 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; exhibits a two-hybrid interaction with Yhr151cp in a large-scale analysis -S000031402 CDS YNL193W 14 274368 276044 W 2011-02-03 1996-07-31|2011-02-03 -S000005136 ORF Verified YNL192W CHS1 chitin synthase CHS1|USA4 chromosome 14 L000000329 14 276502 279897 W 2011-02-03 1996-07-31|2011-02-03 Chitin synthase I; requires activation from zymogenic form in order to catalyze the transfer of N-acetylglucosamine (GlcNAc) to chitin; required for repairing the chitin septum during cytokinesis; transcription activated by mating factor -S000030484 CDS YNL192W 14 276502 279897 W 2011-02-03 1996-07-31|2011-02-03 -S000077376 ARS ARS1414 ARSXIV-280 chromosome 14 14 279982 280071 2014-11-18 2014-11-18|2004-10-18|2006-09-07 ARS activated in mid-S phase -S000178169 ARS_consensus_sequence ARS1414 14 280063 280047 C 2014-11-18 2014-11-18 -S000005135 ORF Verified YNL191W DUG3 glutamine amidotransferase subunit DUG3 chromosome 14 14 280432 281505 W 2011-02-03 1996-07-31 Component of glutamine amidotransferase (GATase II); forms a complex with Dug2p to degrade glutathione (GSH) and other peptides containing a gamma-glu-X bond in an alternative pathway to GSH degradation by gamma-glutamyl transpeptidase (Ecm38p) -S000030357 CDS YNL191W 14 280432 281505 W 2011-02-03 1996-07-31 -S000005134 ORF Verified YNL190W chromosome 14 14 282395 283009 W 2011-02-03 1996-07-31 Hydrophilin essential in desiccation-rehydration process; cell wall protein; contains a putative GPI-attachment site -S000030164 CDS YNL190W 14 282395 283009 W 2011-02-03 1996-07-31 -S000005133 ORF Verified YNL189W SRP1 karyopherin alpha|SCM1|KAP60 chromosome 14 L000002755|L000002780 14 284260 285888 W 2011-02-03 1996-07-31 Karyopherin alpha homolog; forms a dimer with karyopherin beta Kap95p to mediate import of nuclear proteins, binds the nuclear localization signal of the substrate during import; involved in cotranslational protein degradation; binds ribosome-bound nascent polypeptides; Srp1p and Sts1p couple proteasomes to nascent polypeptides emerging from the ribosome for cotranslational degradation -S000036720 CDS YNL189W 14 284260 285888 W 2011-02-03 1996-07-31 -S000005132 ORF Verified YNL188W KAR1 chromosome 14 L000000886 14 286308 287609 W -208 2011-02-03 1996-07-31 Protein involved in karyogamy and spindle pole body duplication; involved in karyogamy during mating; involved in spindle pole body duplication during mitosis; localizes to the half-bridge of the spindle pole body; interacts with Spc72p during karyogamy; also interacts with Cdc31p; essential gene -S000036621 CDS YNL188W 14 286308 287609 W 2011-02-03 1996-07-31 -S000005131 ORF Verified YNL187W SWT21 chromosome 14 14 287994 289067 W 2011-02-03 1996-07-31 Protein involved in mRNA splicing; contains a consensus nuclear export signal (NES) sequence similar to the consensus sequence recognized by Crm1p; interacts genetically with Prp40p and Tgs1p; contains WD40 repeats -S000036547 CDS YNL187W 14 287994 289067 W 2011-02-03 1996-07-31 -S000005130 ORF Verified YNL186W UBP10 ubiquitin-specific protease UBP10|DOT4 chromosome 14 L000004391|L000004588 14 289498 291876 W 2011-02-03 1996-07-31|2011-02-03 Ubiquitin-specific protease, deubiquitinates Ub-protein moieties; interacts with proteins that function in rRNA production and ribosome biogenesis via its intrinsically disordered regions; stabilizes Rpa190p by deubiquitination; controls PCNA deubiquitylation; may regulate silencing by acting on Sir4p; involved in posttranscriptionally regulating Gap1p, possibly other transporters; localized to the nucleolus; null mutant phenotypes are functionally complemented by human USP36 -S000035619 CDS YNL186W 14 289498 291876 W 2011-02-03 1996-07-31|2011-02-03 -S000005129 ORF Verified YNL185C MRPL19 mitochondrial 54S ribosomal protein YmL19|YmL19 chromosome 14 14 292669 292193 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000035486 CDS YNL185C 14 292669 292193 C 2011-02-03 1996-07-31 -S000005128 ORF Uncharacterized YNL184C chromosome 14 14 292883 292557 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels -S000035350 CDS YNL184C 14 292883 292557 C 2011-02-03 1996-07-31 -S000005127 ORF Verified YNL183C NPR1 serine/threonine protein kinase NPR1 chromosome 14 L000001273 14 295509 293137 C 2011-02-03 1996-07-31 Protein kinase; stabilizes several plasma membrane amino acid transporters by antagonizing their ubiquitin-mediated degradation; phosphorylates Aly2p; negatively regulates Ldb19p-mediated endocytosis through phosphorylation of Ldb19p, which prevents its association with the plasma membrane; Npr1p activity is negatively regulated via phosphorylation by the TOR complex; NPR1 has a paralog, PRR2, that arose from the whole genome duplication -S000034359 CDS YNL183C 14 295509 293137 C 2011-02-03 1996-07-31 -S000005126 ORF Verified YNL182C IPI3 chromatin-binding/pre-rRNA-processing protein IPI3 chromosome 14 14 297627 295960 C 2011-02-03 1996-07-31 Component of the Rix1 complex and pre-replicative complexes (pre-RCs); required for processing of ITS2 sequences from 35S pre-rRNA; component of the pre-60S ribosomal particle with the dynein-related AAA-type ATPase Mdn1p; required for pre-RC formation and maintenance during DNA replication licensing; highly conserved protein which contains several WD40 motifs; IPI3 is an essential gene; other members include Rix1p, Ipi1p, and Ipi3p -S000034229 CDS YNL182C 14 297627 295960 C 2011-02-03 1996-07-31 -S000005125 ORF Uncharacterized YNL181W PBR1 putative oxidoreductase chromosome 14 14 298335 299558 W 2011-02-03 1996-07-31|2011-02-03 Putative oxidoreductase; required for cell viability -S000034164 CDS YNL181W 14 298335 299558 W 2011-02-03 1996-07-31|2011-02-03 -S000005124 ORF Verified YNL180C RHO5 Rho family GTPase RHO5|YNS0 chromosome 14 L000004798 14 300649 299654 C 2011-02-03 1998-11-10|1996-07-31 Non-essential small GTPase of the Rho/Rac family of Ras-like proteins; RAC1 ortholog; regulated by phosphorylation and ubiquitination; likely involved in protein kinase C (Pkc1p)-dependent signal transduction pathway that controls cell integrity -S000033264 CDS YNL180C 14 300649 299654 C 2011-02-03 1998-11-10|1996-07-31 -S000005123 ORF Dubious YNL179C SRF6 chromosome 14 14 301103 300666 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion in cyr1 mutant results in loss of stress resistance -S000034571 CDS YNL179C 14 301103 300666 C 2011-02-03 1996-07-31 -S000005122 ORF Verified YNL178W RPS3 uS3|ribosomal 40S subunit protein S3|rp13|YS3|S3|SUF14 chromosome 14 L000002161|L000001749 14 302680 303402 W -125 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; has apurinic/apyrimidinic (AP) endonuclease activity; essential for viability; nascent Rps3p is bound by specific chaperone Yar1p during translation; homologous to mammalian ribosomal protein S3 and bacterial S3 -S000034489 CDS YNL178W 14 302680 303402 W 2011-02-03 1996-07-31 -S000005121 ORF Verified YNL177C MRPL22 mitochondrial 54S ribosomal protein YmL22|YmL22 chromosome 14 14 304615 303686 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial ribosomal protein of the large subunit -S000032401 CDS YNL177C 14 304615 303686 C 2011-02-03 1996-07-31|2011-02-03 -S000005120 ORF Verified YNL176C TDA7 chromosome 14 14 306980 305070 C 2011-02-03 1996-07-31|2011-02-03 Cell cycle-regulated gene of unknown function; promoter bound by Fkh2p; null mutant is sensitive to expression of the top1-T722A allele; TDA7 has a paralog, YDL211C, that arose from the whole genome duplication -S000032321 CDS YNL176C 14 306980 305070 C 2011-02-03 1996-07-31|2011-02-03 -S000005118 ORF Dubious YNL174W chromosome 14 14 308074 308646 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene NOP13/YNL175C -S000031277 CDS YNL174W 14 308074 308646 W 2011-02-03 1996-07-31 -S000005119 ORF Verified YNL175C NOP13 chromosome 14 14 308612 307401 C 2011-02-03 1996-07-31|2011-02-03 Nucleolar protein found in preribosomal complexes; contains an RNA recognition motif (RRM); relative distribution to the nucleolus increases upon DNA replication stress -S000032207 CDS YNL175C 14 308612 307401 C 2011-02-03 1996-07-31|2011-02-03 -S000005117 ORF Verified YNL173C MDG1 chromosome 14 L000001044 14 310057 308957 C 2011-02-03 1996-07-31 Plasma membrane protein; involved in G-protein mediated pheromone signaling pathway; overproduction suppresses bem1 mutations; MDG1 has a paralog, CRP1, that arose from the whole genome duplication -S000031079 CDS YNL173C 14 310057 308957 C 2011-02-03 1996-07-31 -S000005116 ORF Verified YNL172W APC1 anaphase promoting complex subunit 1 chromosome 14 L000004053 14 310636 315882 W 2011-02-03 1996-07-31|2011-02-03 Largest subunit of the Anaphase-Promoting Complex/Cyclosome; APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the platform domain of the APC/C, based on structural analysis; localizes to nuclear foci that become diffuse upon DNA replication stress -S000031033 CDS YNL172W 14 310636 315882 W 2011-02-03 1996-07-31|2011-02-03 -S000005114 ORF Dubious YNL170W chromosome 14 14 315978 316373 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029916 CDS YNL170W 14 315978 316373 W 2011-02-03 1996-07-31 -S000005115 ORF Dubious YNL171C chromosome 14 14 315997 315629 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029970 CDS YNL171C 14 315997 315629 C 2011-02-03 1996-07-31 -S000005113 ORF Verified YNL169C PSD1 phosphatidylserine decarboxylase 1 chromosome 14 L000001518 14 317671 316169 C 2011-02-03 1996-07-31 Phosphatidylserine decarboxylase of the mitochondrial inner membrane; converts phosphatidylserine to phosphatidylethanolamine; regulates mitochondrial fusion and morphology by affecting lipid mixing in the mitochondrial membrane and by influencing the ratio of long to short forms of Mgm1p; partly exposed to the mitochondrial intermembrane space; autocatalytically processed -S000030171 CDS YNL169C 14 317671 316169 C 2011-02-03 1996-07-31 -S000005112 ORF Uncharacterized YNL168C FMP41 chromosome 14 14 318809 318030 C 2011-02-03 1996-07-31 Putative protein of unknown function; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000036435 CDS YNL168C 14 318809 318030 C 2011-02-03 1996-07-31 -S000005111 ORF Verified YNL167C SKO1 ACR1 chromosome 14 L000001909 14 321359 319416 C -110 2011-02-03 1996-07-31 Basic leucine zipper transcription factor of the ATF/CREB family; forms a complex with Tup1p and Cyc8p to both activate and repress transcription; cytosolic and nuclear protein involved in osmotic and oxidative stress responses -S000036358 CDS YNL167C 14 321359 319416 C 2011-02-03 1996-07-31 -S000118385 ARS ARS1415 ARSXIV-322 chromosome 14 14 321921 322213 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178170 ARS_consensus_sequence ARS1415 14 322000 322016 W 2014-11-18 2014-11-18 -S000005110 ORF Verified YNL166C BNI5 chromosome 14 14 323565 322219 C 2011-02-03 1996-07-31 Linker protein responsible for recruitment of myosin to the bud neck; interacts with the C-terminal extensions of septins Cdc11p and Shs1p and binds Myo1p to promote cytokinesis -S000036259 CDS YNL166C 14 323565 322219 C 2011-02-03 1996-07-31 -S000005109 ORF Uncharacterized YNL165W chromosome 14 14 323832 325052 W 2011-02-03 1996-07-31 Putative protein of unknown function; YNL165W is not an essential gene -S000036209 CDS YNL165W 14 323832 325052 W 2011-02-03 1996-07-31 -S000130142 ARS ARS1416 chromosome 14 14 325054 325267 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000005108 ORF Verified YNL164C IBD2 chromosome 14 14 326320 325265 C 2011-02-03 1996-07-31 Component of the BUB2-dependent spindle checkpoint pathway; interacts with Bfa1p and functions upstream of Bub2p and Bfa1p -S000035227 CDS YNL164C 14 326320 325265 C 2011-02-03 1996-07-31 -S000005107 ORF Verified YNL163C RIA1 GTPase RIA1|EFL1 chromosome 14 14 330073 326741 C 2011-02-03 1996-07-31 Cytoplasmic GTPase/eEF2-like factor involved in ribosomal biogenesis; with Sdo1p, a guanine nucleotide exchange factor (GEF), promotes release of Tif6p from 60S ribosomal subunits in the cytoplasm so that they can assemble with 40S subunits to generate mature ribosomes; required for quality control check of newly made large ribosomal subunits before they are released into the pool of translating ribosomes -S000035069 CDS YNL163C 14 330073 326741 C 2011-02-03 1996-07-31 -S000007624 ORF Uncharacterized YNL162W-A chromosome 14 14 330329 330547 W 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology -S000037222 CDS YNL162W-A 14 330329 330547 W 2011-02-03 2001-02-26 -S000005106 ORF Verified YNL162W RPL42A eL42|ribosomal 60S subunit protein L42A|L44e|YL27|L42A|L41A chromosome 14 L000001731 14 331322 332154 W 2011-02-03 1999-11-17|1996-07-31 Ribosomal 60S subunit protein L42A; homologous to mammalian ribosomal protein L36A, no bacterial homolog; RPL42A has a paralog, RPL42B, that arose from the whole genome duplication -S000034972 CDS YNL162W 14 331322 331325 W 2011-02-03 1996-07-31 -S000034973 CDS YNL162W 14 331838 332154 W 2011-02-03 1999-11-17|1996-07-31 -S000034974 intron YNL162W 14 331326 331837 W 2011-02-03 1999-11-17|1996-07-31 -S000005105 ORF Verified YNL161W CBK1 serine/threonine protein kinase CBK1 chromosome 14 L000004609 14 332597 334867 W 2011-02-03 1996-07-31 Serine/threonine protein kinase of the the RAM signaling network; Ndr/LATS family member; binds regulatory subunit Mob2p; involved in regulation of cellular morphogenesis, polarized growth, and septum destruction; phosphorylation by Cbk1p regulates localization and activity of Ace2p transcription factor and Ssd1p translational repressor; Cbk1p activity is regulated by both phosphorylation and specific localization; relocalizes to cytoplasm upon DNA replication stress -S000034836 CDS YNL161W 14 332597 334867 W 2011-02-03 1996-07-31 -S000005104 ORF Verified YNL160W YGP1 chromosome 14 L000002509 14 336545 337609 W 2011-02-03 1996-07-31 Cell wall-related secretory glycoprotein; induced by nutrient deprivation-associated growth arrest and upon entry into stationary phase; may be involved in adaptation prior to stationary phase entry; YGP1 has a paralog, SPS100, that arose from the whole genome duplication -S000033927 CDS YNL160W 14 336545 337609 W 2011-02-03 1996-07-31 -S000005103 ORF Verified YNL159C ASI2 chromosome 14 14 339347 338478 C 2011-02-03 1996-07-31 Subunit of the inner nuclear membrane Asi ubiquitin ligase complex; the Asi complex targets both misfolded proteins of the inner nuclear membrane-associated degradation (INMAD) pathway and inner for ubiquitin-mediated degradation; acts with Asi1p and Asi3p to ensure the fidelity of SPS-sensor signaling by targeting latent unprocessed forms of Stp1p and Stp2p, maintaining the repressed state of gene expression in the absence of inducing amino acids -S000035302 CDS YNL159C 14 339347 338478 C 2011-02-03 1996-07-31 -S000005102 ORF Verified YNL158W PGA1 chromosome 14 14 339612 340208 W 2011-02-03 1996-07-31 Essential component of GPI-mannosyltransferase II; complex is responsible for second mannose addition to GPI precursors as a partner of Gpi18p; required for maturation of Gas1p and Pho8p; has synthetic genetic interactions with secretory pathway genes -S000034371 CDS YNL158W 14 339612 340208 W 2011-02-03 1996-07-31 -S000005101 ORF Verified YNL157W IGO1 phosphatase regulator chromosome 14 14 340352 340858 W 2011-02-03 1996-07-31 Protein required for initiation of G0 program; prevents degradation of nutrient-regulated mRNAs via the 5'-3' mRNA decay pathway; phosphorylated by Rim15p; GFP protein localizes to the cytoplasm and nucleus; IGO1 has a paralog, IGO2, that arose from the whole genome duplication -S000034306 CDS YNL157W 14 340352 340858 W 2011-02-03 1996-07-31 -S000005100 ORF Verified YNL156C NSG2 chromosome 14 14 341968 341069 C 2011-02-03 1996-07-31 Protein involved in regulation of sterol biosynthesis; specifically stabilizes Hmg2p, one of two HMG-CoA isoenzymes that catalyze the rate-limiting step in sterol biosynthesis; homolog of mammalian INSIG proteins; NSG2 has a paralog, NSG1, that arose from the whole genome duplication -S000034171 CDS YNL156C 14 341968 341069 C 2011-02-03 1996-07-31 -S000005099 ORF Verified YNL155W CUZ1 chromosome 14 14 342516 343340 W 2011-02-03 1996-07-31 Protein with a role in the ubiquitin-proteasome pathway; interacts with ubiquitinated protein, Cdc48p and the proteasomal regulatory particle; may protect cells from trivalent metalloid induced proteotoxicity; contains a PACE promoter element and is co-regulated with proteasome subunit genes; AN1-type zinc finger protein, with DHHC and ubiquitin-like domains (UBL); ortholog of ZFAND1, a human gene linked to cancer; protein abundance increases under DNA replication stress -S000034106 CDS YNL155W 14 342516 343340 W 2011-02-03 1996-07-31 -S000005098 ORF Verified YNL154C YCK2 serine/threonine protein kinase YCK2 chromosome 14 L000002501 14 345276 343636 C 2011-02-03 1996-07-31 Palmitoylated plasma membrane-bound casein kinase I (CK1) isoform; shares redundant functions with Yck1p in morphogenesis, proper septin assembly, endocytic trafficking, and glucose sensing; stabilized by Sod1p binding in the presence of glucose and oxygen, causing glucose repression of respiratory metabolism; involved in the phosphorylation and regulation of glucose sensor Rgt2p; YCK2 has a paralog, YCK1, that arose from the whole genome duplication -S000032102 CDS YNL154C 14 345276 343636 C 2011-02-03 1996-07-31 -S000005097 ORF Verified YNL153C GIM3 tubulin-binding prefolding complex subunit GIM3|PFD4 chromosome 14 L000004369 14 346058 345669 C 2011-02-03 1996-07-31 Subunit of the heterohexameric cochaperone prefoldin complex; prefoldin binds specifically to cytosolic chaperonin and transfers target proteins to it; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation -S000031948 CDS YNL153C 14 346058 345669 C 2011-02-03 1996-07-31 -S000005096 ORF Verified YNL152W INN1 chromosome 14 14 346313 347542 W 2011-02-03 1996-07-31 Essential protein that associates with contractile actomyosin ring; required for ingression of the plasma membrane into the bud neck during cytokinesis; C2 domain, a membrane targeting module, is required for function; activates chitin synthase activity of Chs2p during cytokinesis -S000031853 CDS YNL152W 14 346313 347542 W 2011-02-03 1996-07-31 -S000005095 ORF Verified YNL151C RPC31 DNA-directed RNA polymerase III subunit C31|C31|RPC8|ACP2 chromosome 14 L000001688 14 348521 347766 C -237 2011-02-03 1996-07-31 RNA polymerase III subunit C31 -S000030811 CDS YNL151C 14 348521 347766 C 2011-02-03 1996-07-31 -S000005094 ORF Dubious YNL150W chromosome 14 14 349251 349658 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; extensive overlap with PGA2/YNL149C, an uncharacterized gene with a proposed role in protein trafficking -S000030782 CDS YNL150W 14 349251 349658 W 2011-02-03 1996-07-31 -S000005093 ORF Verified YNL149C PGA2 chromosome 14 14 349756 349367 C 2011-02-03 1996-07-31 Essential protein required for maturation of Gas1p and Pho8p; involved in protein trafficking; GFP-fusion protein localizes to the ER and YFP-fusion protein to the nuclear envelope-ER network; null mutants have a cell separation defect -S000031137 CDS YNL149C 14 349756 349367 C 2011-02-03 1996-07-31 -S000005092 ORF Verified YNL148C ALF1 chromosome 14 L000003527 14 350671 349907 C 2011-02-03 1996-07-31 Alpha-tubulin folding protein; similar to mammalian cofactor B; Alf1p-GFP localizes to cytoplasmic microtubules; required for the folding of alpha-tubulin and may play an additional role in microtubule maintenance -S000031037 CDS YNL148C 14 350671 349907 C 2011-02-03 1996-07-31 -S000005091 ORF Verified YNL147W LSM7 Sm-like protein LSM7 chromosome 14 L000004686 14 350940 351383 W 2011-02-03 1996-07-31|2007-09-06 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; protein abundance increases and forms cytoplasmic foci in response to DNA replication stress -S000031001 CDS YNL147W 14 350940 350957 W 2011-02-03 1996-07-31 -S000031002 CDS YNL147W 14 351054 351383 W 2011-02-03 1996-07-31|2007-09-06 -S000031003 intron YNL147W 14 350958 351053 W 2011-02-03 1996-07-31|2007-09-06 -S000028851 ORF Uncharacterized YNL146C-A chromosome 14 14 351580 351386 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000034564 CDS YNL146C-A 14 351580 351386 C 2011-02-03 2003-07-29 -S000005090 ORF Uncharacterized YNL146W chromosome 14 14 351715 352017 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YNL146W is not an essential gene -S000030919 CDS YNL146W 14 351715 352017 W 2011-02-03 1996-07-31 -S000005089 ORF Verified YNL145W MFA2 mating pheromone a chromosome 14 L000001097 14 352414 352530 W -107.4 2011-02-03 1996-07-31 Mating pheromone a-factor; made by a cells; interacts with alpha cells to induce cell cycle arrest and other responses leading to mating; biogenesis involves C-terminal modification, N-terminal proteolysis, and export; also encoded by MFA1 -S000029912 CDS YNL145W 14 352414 352530 W 2011-02-03 1996-07-31 -S000028702 ORF Dubious YNL144W-A chromosome 14 14 353061 353144 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YNL144C -S000032635 CDS YNL144W-A 14 353061 353144 W 2011-02-03 2003-07-29 -S000005088 ORF Uncharacterized YNL144C chromosome 14 14 355042 352820 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-tagged protein is detected in highly purified mitochondria in high-throughput studies; contains a PH domain and binds phosphatidylinositols and phosphatidylethanolamine in a large-scale study; YNL144C has a paralog, YHR131C, that arose from the whole genome duplication -S000037844 CDS YNL144C 14 355042 352820 C 2011-02-03 1996-07-31 -S000005087 ORF Uncharacterized YNL143C chromosome 14 14 357186 356794 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels -S000036002 CDS YNL143C 14 357186 356794 C 2011-02-03 1996-07-31 -S000005086 ORF Verified YNL142W MEP2 ammonium permease MEP2 chromosome 14 L000002583 14 357453 358952 W 2011-02-03 1996-07-31 Ammonium permease involved in regulation of pseudohyphal growth; belongs to a ubiquitous family of cytoplasmic membrane proteins that transport only ammonium (NH4+); expression is under the nitrogen catabolite repression regulation -S000035924 CDS YNL142W 14 357453 358952 W 2011-02-03 1996-07-31 -S000005085 ORF Verified YNL141W AAH1 adenine deaminase chromosome 14 L000004289 14 359596 360639 W 2011-02-03 1996-07-31 Adenine deaminase (adenine aminohydrolase); converts adenine to hypoxanthine; involved in purine salvage; transcriptionally regulated by nutrient levels and growth phase; Aah1p degraded upon entry into quiescence via SCF and the proteasome -S000035807 CDS YNL141W 14 359596 360639 W 2011-02-03 1996-07-31 -S000005084 ORF Uncharacterized YNL140C chromosome 14 14 361486 360917 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; partially overlaps THO2/YNL139C -S000034768 CDS YNL140C 14 361486 360917 C 2011-02-03 1996-07-31 -S000005083 ORF Verified YNL139C THO2 RLR1|LDB5|ZRG13 chromosome 14 L000002589 14 365717 360924 C 2011-02-03 1996-07-31 Subunit of the THO complex; THO is required for efficient transcription elongation and involved in transcriptional elongation-associated recombination; required for LacZ RNA expression from certain plasmids -S000036082 CDS YNL139C 14 365717 360924 C 2011-02-03 1996-07-31 -S000028509 ORF Verified YNL138W-A YSF3 U2 snRNP complex subunit YSF3|RCP10 chromosome 14 14 366033 366412 W 2011-02-03 2003-07-29 Component of the SF3b subcomplex of the U2 snRNP; essential protein required for splicing and for assembly of SF3b -S000030223 CDS YNL138W-A 14 366033 366035 W 2011-02-03 2003-07-29 -S000030224 CDS YNL138W-A 14 366158 366412 W 2011-02-03 2003-07-29 -S000030225 intron YNL138W-A 14 366036 366157 W 2011-02-03 2003-07-29 -S000005082 ORF Verified YNL138W SRV2 adenylate cyclase-binding protein|CAP chromosome 14 L000002068 14 366741 368321 W -101 2011-02-03 1996-07-31 CAP (cyclase-associated protein); N-terminus binds adenylate cyclase and facilitates activation by RAS; N-terminus forms novel hexameric star-shaped shuriken structures that directly catalyze cofilin-mediated severing of actin filaments; C-terminus binds and recycles cofilin bound, ADP-actin monomers, facilitating regulation of actin dynamics and cell morphogenesis; N- and C-termini can function as physically separate proteins; mCAP1 is the mouse homolog -S000036041 CDS YNL138W 14 366741 368321 W 2011-02-03 1996-07-31 -S000005081 ORF Verified YNL137C NAM9 mitochondrial 37S ribosomal protein NAM9|MNA6 chromosome 14 L000001231 14 370055 368595 C 2011-02-03 1996-07-31 Mitochondrial ribosomal component of the small subunit -S000035090 CDS YNL137C 14 370055 368595 C 2011-02-03 1996-07-31 -S000005080 ORF Verified YNL136W EAF7 chromosome 14 14 370368 371645 W 2011-02-03 1996-07-31 Subunit of the NuA4 histone acetyltransferase complex; NuA4 acetylates the N-terminal tails of histones H4 and H2A -S000035041 CDS YNL136W 14 370368 371645 W 2011-02-03 1996-07-31 -S000005079 ORF Verified YNL135C FPR1 peptidylprolyl isomerase FPR1|RBP1|FKB1 chromosome 14 L000000623 14 372226 371882 C -105 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (PPIase); binds to the drugs FK506 and rapamycin; also binds to the nonhistone chromatin binding protein Hmo1p and may regulate its assembly or function; N-terminally propionylated in vivo; mutation is functionally complemented by human FKBP1A -S000034848 CDS YNL135C 14 372226 371882 C 2011-02-03 1996-07-31 -S000005078 ORF Verified YNL134C chromosome 14 14 373581 372451 C 2011-02-03 1996-07-31 NADH-dependent aldehyde reductase, involved in detoxification of furfural; expression is up-regulated in the presence of furfural and 5-hydroxymethylfurfural, which are compounds generated during lignocellulosic biomass pre-treatment; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and nucleus; protein abundance increases in response to DNA replication stress -S000033976 CDS YNL134C 14 373581 372451 C 2011-02-03 1996-07-31 -S000005077 ORF Verified YNL133C FYV6 chromosome 14 14 374692 374171 C 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin; proposed to regulate double-strand break repair via non-homologous end-joining -S000033840 CDS YNL133C 14 374692 374171 C 2011-02-03 1996-07-31 -S000006569 tRNA_gene tF(GAA)N chromosome 14 L000003689 14 374869 374959 W 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035429 intron tF(GAA)N 14 374906 374923 W 2011-02-03 2000-05-19 -S000035427 noncoding_exon tF(GAA)N 14 374869 374905 W 2011-02-03 2000-05-19 -S000035428 noncoding_exon tF(GAA)N 14 374924 374959 W 2011-02-03 2000-05-19 -S000005076 ORF Verified YNL132W KRE33 ribosome biosynthesis protein KRE33|RRA1 chromosome 14 14 375321 378491 W 2011-02-03 1996-07-31 Protein required for biogenesis of the small ribosomal subunit; heterozygous mutant shows haploinsufficiency in K1 killer toxin resistance; essential gene; NAT10, the human homolog, implicated in several types of cancer and premature aging. -S000033781 CDS YNL132W 14 375321 378491 W 2011-02-03 1996-07-31 -S000005075 ORF Verified YNL131W TOM22 MOM22|MAS22|MAS17 chromosome 14 L000002582 14 378767 379225 W 2011-02-03 1996-07-31 Component of the TOM (Translocase of Outer Membrane) complex; responsible for initial import of mitochondrially directed proteins; mediates interaction between TOM and TIM complexes and acts as a receptor for precursor proteins -S000033651 CDS YNL131W 14 378767 379225 W 2011-02-03 1996-07-31 -S000005074 ORF Verified YNL130C CPT1 diacylglycerol cholinephosphotransferase chromosome 14 L000000404 14 380831 379558 C 2011-02-03 2004-02-03|1996-07-31 Cholinephosphotransferase; required for phosphatidylcholine biosynthesis and for inositol-dependent regulation of EPT1 transcription; CPT1 has a paralog, EPT1, that arose from the whole genome duplication -S000030245 CDS YNL130C 14 380689 379558 C 2011-02-03 1996-07-31 -S000030243 CDS YNL130C 14 380831 380782 C 2011-02-03 2004-02-03|1996-07-31 -S000030246 intron YNL130C 14 380781 380690 C 2011-02-03 2004-02-03|1996-07-31 -S000028579 ORF Uncharacterized YNL130C-A DGR1 chromosome 14 14 381391 381245 C 2011-02-03 2003-07-29 Protein of unknown function; dgr1 null mutant is resistant to 2-deoxy-D-glucose -S000031313 CDS YNL130C-A 14 381391 381245 C 2011-02-03 2003-07-29 -S000005073 ORF Verified YNL129W NRK1 ribosylnicotinamide kinase chromosome 14 S000029011|S000029327 14 381480 382202 W 2011-02-03 1996-07-31 Nicotinamide riboside kinase; catalyzes the phosphorylation of nicotinamide riboside and nicotinic acid riboside in salvage pathways for NAD+ biosynthesis -S000031557 CDS YNL129W 14 381480 382202 W 2011-02-03 1996-07-31 -S000005072 ORF Verified YNL128W TEP1 putative phosphatidylinositol-3,4,5-trisphosphate 3-phosphatase chromosome 14 L000003922 14 382359 383663 W 2011-02-03 1996-07-31|2011-02-03 PTEN homolog with no demonstrated inositol lipid phosphatase activity; plays a role in normal sporulation; homolog of human tumor suppressor gene PTEN/MMAC1/TEP1 and fission yeast ptn1 -S000030721 CDS YNL128W 14 382359 383663 W 2011-02-03 1996-07-31|2011-02-03 -S000005071 ORF Verified YNL127W FAR11 chromosome 14 14 383987 386848 W 2011-02-03 1996-07-31 Protein involved in recovery from cell cycle arrest; acts in response to pheromone; also involved in regulation of intra-S DNA damage checkpoint and autophagy; is essential for dephosphorylation of Atg13p; interacts with Far3p, Far7p, Far8p, Far9p, Far10p and with the phosphatases Pph21p, Pph22p and Pph3p; has similarity to the N- and C-termini of N. crassa HAM-2; similar to human Fam40A and Fam40B -S000030640 CDS YNL127W 14 383987 386848 W 2011-02-03 1996-07-31 -S000005070 ORF Verified YNL126W SPC98 chromosome 14 L000003430 14 387227 389767 W 2011-02-03 1996-07-31 Component of the microtubule-nucleating Tub4p (gamma-tubulin) complex; interacts with Spc110p at the spindle pole body (SPB) inner plaque and with Spc72p at the SPB outer plaque -S000030533 CDS YNL126W 14 387227 389767 W 2011-02-03 1996-07-31 -S000005069 ORF Verified YNL125C ESBP6 MCH3 chromosome 14 L000004077 14 392167 390146 C 2011-02-03 1996-07-31 Protein with similarity to monocarboxylate permeases; appears not to be involved in transport of monocarboxylates such as lactate, pyruvate or acetate across the plasma membrane -S000037681 CDS YNL125C 14 392167 390146 C 2011-02-03 1996-07-31 -S000005068 ORF Verified YNL124W NAF1 RNA-binding snoRNP assembly protein chromosome 14 14 392892 394370 W 2011-02-03 1996-07-31 RNA-binding protein required for the assembly of box H/ACA snoRNPs; thus required for pre-rRNA processing; forms a complex with Shq1p and interacts with H/ACA snoRNP components Nhp2p and Cbf5p; similar to Gar1p -S000037659 CDS YNL124W 14 392892 394370 W 2011-02-03 1996-07-31 -S000005067 ORF Verified YNL123W NMA111 YNM3 chromosome 14 14 394685 397678 W 2011-02-03 1996-07-31 Serine protease and general molecular chaperone; involved in response to heat stress and promotion of apoptosis; may contribute to lipid homeostasis; sequence similarity to the mammalian Omi/HtrA2 family of serine proteases -S000037577 CDS YNL123W 14 394685 397678 W 2011-02-03 1996-07-31 -S000005066 ORF Verified YNL122C chromosome 14 14 398370 398023 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; homologous to bacterial L35 and human MRPL35 ribosomal proteins -S000037427 CDS YNL122C 14 398370 398023 C 2011-02-03 1996-07-31 -S000005065 ORF Verified YNL121C TOM70 protein channel TOM70|OMP1|MOM72|MAS70 chromosome 14 L000001030|L000003141 14 400537 398684 C 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; involved in the recognition and initial import steps for all mitochondrially directed proteins; acts as a receptor for incoming precursor proteins; TOM70 has a paralog, TOM71, that arose from the whole genome duplication -S000031934 CDS YNL121C 14 400537 398684 C 2011-02-03 1996-07-31 -S000005063 ORF Verified YNL119W NCS2 TUC2 chromosome 14 14 401040 402521 W 2011-02-03 1996-07-31 Protein required for uridine thiolation of Lys(UUU) and Glu(UUC) tRNAs; required for the thiolation of uridine at the wobble position of Lys(UUU) and Glu(UUC) tRNAs; has a role in urmylation and in invasive and pseudohyphal growth; inhibits replication of Brome mosaic virus in S. cerevisiae -S000036308 CDS YNL119W 14 401040 402521 W 2011-02-03 1996-07-31 -S000005064 ORF Dubious YNL120C chromosome 14 14 401518 401033 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion enhances replication of Brome mosaic virus in S. cerevisiae, but likely due to effects on the overlapping gene -S000031820 CDS YNL120C 14 401518 401033 C 2011-02-03 1996-07-31 -S000005062 ORF Verified YNL118C DCP2 decapping enzyme complex catalytic subunit|PSU1 chromosome 14 L000002866 14 405564 402652 C 2011-02-03 1996-07-31 Catalytic subunit of Dcp1p-Dcp2p decapping enzyme complex; removes 5' cap structure from mRNAs prior to their degradation; also enters nucleus and positively regulates transcription initiation; nudix hydrolase family member; forms cytoplasmic foci upon DNA replication stress; human homolog DCP2 complements yeast dcp2 thermosensitive mutant -S000035360 CDS YNL118C 14 405564 402652 C 2011-02-03 1996-07-31 -S000005061 ORF Verified YNL117W MLS1 malate synthase MLS1 chromosome 14 L000001123 14 406358 408022 W 2011-02-03 1996-07-31 Malate synthase, enzyme of the glyoxylate cycle; involved in utilization of non-fermentable carbon sources; expression is subject to carbon catabolite repression; localizes in peroxisomes during growth on oleic acid, otherwise cytosolic; can accept butyryl-CoA as acyl-CoA donor in addition to traditional substrate acetyl-CoA -S000035332 CDS YNL117W 14 406358 408022 W 2011-02-03 1996-07-31 -S000005060 ORF Verified YNL116W DMA2 ubiquitin-conjugating protein DMA2|CHF2 chromosome 14 S000029720 14 408341 409909 W 2011-02-03 1996-07-31 Ubiquitin-protein ligase (E3); controls septin dynamics and spindle position checkpoint (SPOC) with ligase Dma1p by regulating recruitment of Elm1p to bud neck; regulates levels of eIF2 subunit Gcd11p, as well as abundance, localization, and ubiquitination of Cdk inhibitory kinase Swe1p; ortholog of human RNF8, similar to human Chfr; contains FHA and RING finger domains; DMA2 has a paralog, DMA1, that arose from the whole genome duplication -S000035249 CDS YNL116W 14 408341 409909 W 2011-02-03 1996-07-31 -S000005059 ORF Uncharacterized YNL115C chromosome 14 14 412053 410119 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YNL115C is not an essential gene -S000034227 CDS YNL115C 14 412053 410119 C 2011-02-03 1996-07-31 -S000118386 ARS ARS1417 ARSXIV-412 chromosome 14 14 412267 412496 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000005057 ORF Verified YNL113W RPC19 DNA-directed RNA polymerase core subunit RPC19|AC19 chromosome 14 L000001687 14 412771 413199 W 2011-02-03 1996-07-31 RNA polymerase subunit AC19; common to RNA polymerases I and III -S000034093 CDS YNL113W 14 412771 413199 W 2011-02-03 1996-07-31 -S000005058 ORF Dubious YNL114C chromosome 14 14 413055 412684 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF RPC19/YNL113W, an RNA polymerase subunit -S000034126 CDS YNL114C 14 413055 412684 C 2011-02-03 1996-07-31 -S000005056 ORF Verified YNL112W DBP2 DEAD-box ATP-dependent RNA helicase DBP2 chromosome 14 L000000493 14 413639 416281 W 2011-02-03 1996-07-31 ATP-dependent RNA helicase of the DEAD-box protein family; has strong preference for dsRNA; interacts with YRA1; required for assembly of Yra1p, Nab2p and Mex67p onto mRNA and formation of nuclear mRNP; involved in mRNA decay and rRNA processing; may be involved in suppression of transcription from cryptic initiation sites -S000033962 CDS YNL112W 14 413639 414911 W 2011-02-03 1996-07-31 -S000033963 CDS YNL112W 14 415914 416281 W 2011-02-03 1996-07-31 -S000033964 intron YNL112W 14 414912 415913 W 2011-02-03 1996-07-31 -S000005055 ORF Verified YNL111C CYB5 chromosome 14 L000002498 14 417302 416940 C 2011-02-03 1996-07-31 Cytochrome b5; involved in the sterol and lipid biosynthesis pathways; acts as an electron donor to support sterol C5-6 desaturation -S000033131 CDS YNL111C 14 417302 416940 C 2011-02-03 1996-07-31 -S000005054 ORF Verified YNL110C NOP15 rRNA-binding ribosome biosynthesis protein NOP15 chromosome 14 14 418488 417826 C 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; involved in 60S ribosomal subunit biogenesis; localizes to both nucleolus and cytoplasm -S000033055 CDS YNL110C 14 418488 417826 C 2011-02-03 1996-07-31 -S000005053 ORF Dubious YNL109W chromosome 14 14 418964 419509 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YNL108C -S000032014 CDS YNL109W 14 418964 419509 W 2011-02-03 1996-07-31 -S000005052 ORF Verified YNL108C HUF chromosome 14 14 419826 419014 C 2011-02-03 1996-07-31 Protein phosphatase; similar to prokaryotic phosphotransfer enzymes; null mutant shows alterations in glucose metabolism; GFP-fusion protein localizes to the cytoplasm and nucleus; YNL108C has a paralog, TFC7, that arose from the whole genome duplication -S000031012 CDS YNL108C 14 419826 419014 C 2011-02-03 1996-07-31 -S000005051 ORF Verified YNL107W YAF9 chromosome 14 S000007495 14 420098 420778 W 2011-02-03 1996-07-31 Subunit of NuA4 histone H4 acetyltransferase and SWR1 complexes; may function to antagonize silencing near telomeres; interacts directly with Swc4p; has homology to human leukemogenic protein AF9; contains a YEATS domain -S000030966 CDS YNL107W 14 420098 420778 W 2011-02-03 1996-07-31 -S000005049 ORF Dubious YNL105W RRT16 chromosome 14 14 424155 424583 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene INP52; identified in a screen for mutants with decreased levels of rDNA transcription -S000030822 CDS YNL105W 14 424155 424583 W 2011-02-03 1996-07-31 -S000005050 ORF Verified YNL106C INP52 phosphatidylinositol-3-/phosphoinositide 5-phosphatase INP52|SJL2 chromosome 14 L000003985 14 424495 420944 C 2011-02-03 1996-07-31 Polyphosphatidylinositol phosphatase; dephosphorylates a number of phosphatidylinositol phosphates (PtdInsPs, PIPs) to PI; involved in endocytosis; hyperosmotic stress causes translocation to actin patches; synaptojanin-like protein with a Sac1 domain; INP52 has a paralog, INP53, that arose from the whole genome duplication -S000030872 CDS YNL106C 14 424495 420944 C 2011-02-03 1996-07-31 -S000028701 ORF Dubious YNL103W-A chromosome 14 14 426719 426808 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene MET4/YNL104C -S000032634 CDS YNL103W-A 14 426719 426808 W 2011-02-03 2003-07-29 -S000005048 ORF Verified YNL104C LEU4 2-isopropylmalate synthase LEU4 chromosome 14 L000000945 14 426754 424895 C -76 2011-02-03 1996-07-31 Alpha-isopropylmalate synthase (2-isopropylmalate synthase); the main isozyme responsible for the first step in the leucine biosynthesis pathway; LEU4 has a paralog, LEU9, that arose from the whole genome duplication -S000037846 CDS YNL104C 14 426754 424895 C 2011-02-03 1996-07-31 -S000005047 ORF Verified YNL103W MET4 chromosome 14 L000001079 14 427735 429753 W -76 2011-02-03 1996-07-31|2006-11-09 Leucine-zipper transcriptional activator; responsible for regulation of sulfur amino acid pathway; requires different combinations of auxiliary factors Cbf1p, Met28p, Met31p and Met32p; feedforward loop exists in the regulation of genes controlled by Met4p and Met32p; can be ubiquitinated by ubiquitin ligase SCF-Met30p, is either degraded or maintained in an inactive state; regulates degradation of its own DNA-binding cofactors by targeting them to SCF-Met30p -S000037804 CDS YNL103W 14 427735 429753 W 2011-02-03 1996-07-31|2006-11-09 -S000005046 ORF Verified YNL102W POL1 DNA-directed DNA polymerase alpha catalytic subunit POL1|HPR3|CRT5|CDC17 chromosome 14 L000000257 14 430087 434493 W -74 2011-02-03 1996-07-31 Catalytic subunit of the DNA polymerase I alpha-primase complex; required for the initiation of DNA replication during mitotic DNA synthesis and premeiotic DNA synthesis -S000037722 CDS YNL102W 14 430087 434493 W 2011-02-03 1996-07-31 -S000005045 ORF Verified YNL101W AVT4 chromosome 14 14 434999 437140 W 2011-02-03 1996-07-31 Vacuolar transporter; exports large neutral amino acids from the vacuole; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs) -S000036962 CDS YNL101W 14 434999 437140 W 2011-02-03 1996-07-31 -S000005044 ORF Verified YNL100W MIC27 AIM37|MCS27 chromosome 14 14 437613 438317 W 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; forms a subcomplex with Mic10p and Mic12p whose assembly and stability requires cardiolipin -S000036897 CDS YNL100W 14 437613 438317 W 2011-02-03 1996-07-31 -S000005043 ORF Verified YNL099C OCA1 putative tyrosine protein phosphatase OCA1 chromosome 14 14 439283 438567 C 2011-02-03 1996-07-31 Putative protein tyrosine phosphatase; required for cell cycle arrest in response to oxidative damage of DNA -S000031337 CDS YNL099C 14 439283 438567 C 2011-02-03 1996-07-31 -S000005042 ORF Verified YNL098C RAS2 Ras family GTPase RAS2|TSL7|GLC5|CYR3|CTN5 chromosome 14 L000001583 14 440570 439602 C -71.5 2011-02-03 1996-07-31 GTP-binding protein; regulates nitrogen starvation response, sporulation, and filamentous growth; farnesylation and palmitoylation required for activity and localization to plasma membrane; homolog of mammalian Ras proto-oncogenes; RAS2 has a paralog, RAS1, that arose from the whole genome duplication -S000030460 CDS YNL098C 14 440570 439602 C 2011-02-03 1996-07-31 -S000028699 ORF Uncharacterized YNL097C-B YNL097C-A chromosome 14 14 440919 440797 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000032611 CDS YNL097C-B 14 440919 440797 C 2011-02-03 2003-07-29 -S000028700 ORF Dubious YNL097W-A chromosome 14 14 441431 441586 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene PHO23/YNL097C -S000032629 CDS YNL097W-A 14 441431 441586 W 2011-02-03 2003-07-29 -S000005041 ORF Verified YNL097C PHO23 chromosome 14 L000004300 14 442358 441366 C 2011-02-03 1996-07-31 Component of the Rpd3L histone deacetylase complex; involved in transcriptional regulation of PHO5; affects termination of snoRNAs and cryptic unstable transcripts (CUTs); C-terminus shares significant sequence identity with the human candidate tumor suppressor p33-ING1 and its isoform ING3 -S000030326 CDS YNL097C 14 442358 441366 C 2011-02-03 1996-07-31 -S000006645 tRNA_gene tL(CAA)N chromosome 14 L000003690 14 443006 443119 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000033817 intron tL(CAA)N 14 443044 443075 W 2011-02-03 2000-05-19 -S000033815 noncoding_exon tL(CAA)N 14 443006 443043 W 2011-02-03 2000-05-19 -S000033816 noncoding_exon tL(CAA)N 14 443076 443119 W 2011-02-03 2000-05-19 -S000005040 ORF Verified YNL096C RPS7B eS7|ribosomal 40S subunit protein S7B|S7e|rp30|S7B chromosome 14 L000004473 14 444315 443398 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; interacts with Kti11p; deletion causes hypersensitivity to zymocin; homologous to mammalian ribosomal protein S7, no bacterial homolog; RPS7B has a paralog, RPS7A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000030167 CDS YNL096C 14 443826 443398 C 2011-02-03 1996-07-31 -S000030166 CDS YNL096C 14 444315 444172 C 2011-02-03 1996-07-31 -S000030168 intron YNL096C 14 444171 443827 C 2011-02-03 1996-07-31 -S000005039 ORF Uncharacterized YNL095C chromosome 14 14 446840 444912 C 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to contain a transmembrane domain; not an essential gene; YNL095C has a paralog, ECM3, that arose from the whole genome duplication -S000036433 CDS YNL095C 14 446840 444912 C 2011-02-03 1996-07-31 -S000005038 ORF Verified YNL094W APP1 phosphatidate phosphatase APP1 chromosome 14 14 447611 449374 W 2011-02-03 1996-07-31 Phosphatidate phosphatase, converts phosphatidate to diacylglycerol; App1p, Pah1p, Dpp1p, and Lpp1p are responsible for all the phosphatidate phosphatase activity; component of cortical actin patches; interacts with components of endocytic pathway -S000036404 CDS YNL094W 14 447611 449374 W 2011-02-03 1996-07-31 -S000118387 ARS ARS1419 ARSXIV-450 chromosome 14 14 449429 449588 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178171 ARS_consensus_sequence ARS1419 14 449534 449518 C 2014-11-18 2014-11-18 -S000005037 ORF Verified YNL093W YPT53 Rab family GTPase YPT53 chromosome 14 L000002547 14 449868 450530 W 2011-02-03 1996-07-31 Stress-induced Rab family GTPase; required for vacuolar protein sorting and endocytosis; involved in ionic stress tolerance; similar to Vps21p and Ypt52p; functional homolog of Vps21p; mammalian Rab5 homolog; YPT53 has a paralog, VPS21, that arose from the whole genome duplication -S000036317 CDS YNL093W 14 449868 450530 W 2011-02-03 1996-07-31 -S000005036 ORF Verified YNL092W S-adenosylmethionine-dependent methyltransferase chromosome 14 14 450871 452073 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent protein methyltransferase; capable of automethylation; member of the seven beta-strand family; YNL092W is not an essential gene -S000036208 CDS YNL092W 14 450871 452073 W 2011-02-03 1996-07-31 -S000005035 ORF Verified YNL091W NST1 chromosome 14 14 452408 456130 W 2011-02-03 1996-07-31 Protein of unknown function; mediates sensitivity to salt stress; interacts physically with the splicing factor Msl1p and also displays genetic interaction with MSL1 -S000036061 CDS YNL091W 14 452408 456130 W 2011-02-03 1996-07-31 -S000005034 ORF Verified YNL090W RHO2 Rho family GTPase RHO2 chromosome 14 L000001631 14 456565 457143 W 2011-02-03 1996-07-31 Non-essential small GTPase of the Rho/Rac family of Ras-like proteins; involved in the establishment of cell polarity and in microtubule assembly -S000035133 CDS YNL090W 14 456565 457143 W 2011-02-03 1996-07-31 -S000005033 ORF Dubious YNL089C chromosome 14 14 457169 456693 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; almost completely overlaps YNL090W/RHO2 which encodes a small GTPase of the Rho/Rac subfamily of Ras-like proteins -S000035490 CDS YNL089C 14 457169 456693 C 2011-02-03 1996-07-31 -S000005032 ORF Verified YNL088W TOP2 DNA topoisomerase 2|TRF3|TOR3 chromosome 14 L000002320 14 457704 461990 W -70 2011-02-03 1996-07-31 Topoisomerase II; relieves torsional strain in DNA by cleaving and re-sealing phosphodiester backbone of both positively and negatively supercoiled DNA; cleaves complementary strands; localizes to axial cores in meiosis; required for replication slow zone (RSZ) breakage following Mec1p inactivation; human homolog TOP2A implicated in cancers, and can complement yeast null mutant -S000035464 CDS YNL088W 14 457704 461990 W 2011-02-03 1996-07-31 -S000005031 ORF Verified YNL087W TCB2 tricalbin chromosome 14 14 462411 465947 W 2011-02-03 1996-07-31 ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to plasma membrane (PM) and regulate PM phosphatidylinositol-4-phosphate (PI4P) levels by controlling access of Sac1p phosphatase to its substrate PI4P in the PM; contains 3 calcium and lipid binding domains; mRNA is targeted to bud; TCB2 has a paralog, TCB1, that arose from the whole genome duplication -S000035400 CDS YNL087W 14 462411 465947 W 2011-02-03 1996-07-31 -S000005030 ORF Verified YNL086W SNN1 BLS1 chromosome 14 14 466334 466642 W 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Msb3p; green fluorescent protein (GFP)-fusion protein localizes to endosomes -S000035333 CDS YNL086W 14 466334 466642 W 2011-02-03 1996-07-31 -S000005029 ORF Verified YNL085W MKT1 chromosome 14 L000001120 14 467131 469623 W -69 2011-02-03 1996-07-31 Protein similar to nucleases that forms a complex with Pbp1p; complex may mediate posttranscriptional regulation of HO; involved in propagation of M2 dsRNA satellite of L-A virus; allelic variation affects mitochondrial genome stability, drug resistance, and more; forms cytoplasmic foci upon DNA replication stress; localization to P-bodies under ethanol stress differs between strains -S000034367 CDS YNL085W 14 467131 469623 W 2011-02-03 1996-07-31 -S000005028 ORF Verified YNL084C END3 chromosome 14 L000000558 14 471102 470053 C 2011-02-03 1996-07-31 EH domain-containing protein involved in endocytosis; actin cytoskeletal organization and cell wall morphogenesis; forms a complex with Sla1p and Pan1p -S000034279 CDS YNL084C 14 471102 470053 C 2011-02-03 1996-07-31 -S000005027 ORF Verified YNL083W SAL1 Ca(2+)-binding ATP:ADP antiporter SAL1 chromosome 14 14 471377 472861 W 2011-02-03 2004-02-18|2010-01-05|1996-07-31 ADP/ATP transporter; member of the Ca2+-binding subfamily of mitochondrial carriers, with two EF-hand motifs; transport activity of either Sal1p or Pet9p is critical for viability; polymorphic in different S. cerevisiae strains -S000034242 CDS YNL083W 14 471377 472861 W 2011-02-03 2004-02-18|2010-01-05|1996-07-31 -S000005026 ORF Verified YNL082W PMS1 ATP-binding mismatch repair protein chromosome 14 L000001457 14 473391 476012 W -66 2011-02-03 2004-04-21|1996-07-31 ATP-binding protein required for mismatch repair; required for both mitosis and meiosis; functions as a heterodimer with Mlh1p; binds double- and single-stranded DNA via its N-terminal domain, similar to E. coli MutL -S000034101 CDS YNL082W 14 473391 476012 W 2011-02-03 2004-04-21|1996-07-31 -S000005025 ORF Verified YNL081C SWS2 putative mitochondrial 37S ribosomal protein SWS2 chromosome 14 14 476619 476188 C 2011-02-03 1996-07-31 Putative mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S13 ribosomal protein; participates in controlling sporulation efficiency; localizes to vacuole in response to H2O2 -S000032072 CDS YNL081C 14 476619 476188 C 2011-02-03 1996-07-31 -S000005024 ORF Verified YNL080C EOS1 chromosome 14 14 478032 476932 C 2011-02-03 1996-07-31 Protein involved in N-glycosylation; deletion mutation confers sensitivity to exidative stress and shows synthetic lethality with mutations in the spindle checkpoint genes BUB3 and MAD1; YNL080C is not an essential gene -S000031947 CDS YNL080C 14 478032 476932 C 2011-02-03 1996-07-31 -S000005023 ORF Verified YNL079C TPM1 tropomyosin TPM1 chromosome 14 L000002328 14 479165 478566 C 2011-02-03 1996-07-31 Major isoform of tropomyosin; binds to and stabilizes actin cables and filaments, which direct polarized cell growth and the distribution of several organelles; acetylated by the NatB complex and acetylated form binds actin most efficiently; TPM1 has a paralog, TPM2, that arose from the whole genome duplication -S000032271 CDS YNL079C 14 479165 478566 C 2011-02-03 1996-07-31 -S000005022 ORF Verified YNL078W NIS1 JIP1 chromosome 14 14 479768 480991 W 2011-02-03 1996-07-31 Protein localized in the bud neck at G2/M phase; physically interacts with septins; possibly involved in a mitotic signaling network -S000032241 CDS YNL078W 14 479768 480991 W 2011-02-03 1996-07-31 -S000005021 ORF Verified YNL077W APJ1 chromosome 14 14 481391 482977 W 2011-02-03 1996-07-31 Chaperone with a role in SUMO-mediated protein degradation; member of the DnaJ-like family; conserved across eukaryotes; overexpression interferes with propagation of the [Psi+] prion; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; forms nuclear foci upon DNA replication stress -S000032158 CDS YNL077W 14 481391 482977 W 2011-02-03 1996-07-31 -S000005020 ORF Verified YNL076W MKS1 LYS80 chromosome 14 L000001119 14 483556 485310 W 2011-02-03 1996-07-31 Pleiotropic negative transcriptional regulator; involved in Ras-CAMP and lysine biosynthetic pathways and nitrogen regulation; involved in retrograde (RTG) mitochondria-to-nucleus signaling -S000031187 CDS YNL076W 14 483556 485310 W 2011-02-03 1996-07-31 -S000005019 ORF Verified YNL075W IMP4 snoRNA-binding rRNA-processing protein IMP4 chromosome 14 S000007424 14 485607 486479 W 2011-02-03 1996-07-31 Component of the SSU processome; SSU processome is required for pre-18S rRNA processing; interacts with Mpp10p; member of a superfamily of proteins that contain a sigma(70)-like motif and associate with RNAs -S000031099 CDS YNL075W 14 485607 486479 W 2011-02-03 1996-07-31 -S000005018 ORF Verified YNL074C MLF3 YMK1 chromosome 14 L000004166 14 488124 486766 C 2011-02-03 1996-07-31 Serine-rich protein of unknown function; predicted to be palmitoylated; overproduction suppresses growth inhibition caused by exposure to immunosuppressant leflunomide; MLF3 has a paralog, VHS2, that arose from the whole genome duplication -S000030955 CDS YNL074C 14 488124 486766 C 2011-02-03 1996-07-31 -S000005017 ORF Verified YNL073W MSK1 lysine--tRNA ligase MSK1 chromosome 14 L000001195 14 488386 490116 W 2011-02-03 1996-07-31 Mitochondrial lysine-tRNA synthetase; required for import of both aminoacylated and deacylated forms of tRNA(Lys) into mitochondria and for aminoacylation of mitochondrially encoded tRNA(Lys) -S000030916 CDS YNL073W 14 488386 490116 W 2011-02-03 1996-07-31 -S000005016 ORF Verified YNL072W RNH201 ribonuclease H2 catalytic subunit RNH201|Rnh2A|RNH35 chromosome 14 L000004047 14 490317 491240 W 2011-02-03 1996-07-31 Ribonuclease H2 catalytic subunit; removes RNA primers during Okazaki fragment synthesis and errant ribonucleotides misincorporated during DNA replication; role in ribonucleotide excision repair; homolog of RNAse HI; related to human AGS4 which causes Aicardi-Goutieres syndrome -S000029909 CDS YNL072W 14 490317 491240 W 2011-02-03 1996-07-31 -S000005015 ORF Verified YNL071W LAT1 dihydrolipoyllysine-residue acetyltransferase|PDA2|ODP2 chromosome 14 L000000932|L000003242 14 491523 492971 W 2011-02-03 1996-07-31 Dihydrolipoamide acetyltransferase component (E2) of the PDC; the pyruvate dehydrogenase complex (PDC) catalyzes the oxidative decarboxylation of pyruvate to acetyl-CoA -S000037903 CDS YNL071W 14 491523 492971 W 2011-02-03 1996-07-31 -S000005014 ORF Verified YNL070W TOM7 YOK22|MOM7 chromosome 14 L000003250 14 493366 493548 W 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; promotes assembly and stability of the TOM complex -S000037807 CDS YNL070W 14 493366 493548 W 2011-02-03 1996-07-31 -S000005013 ORF Verified YNL069C RPL16B uL13|ribosomal 60S subunit protein L16B|L13|rp23|YL15|L21B|L16B|RP23 chromosome 14 L000003244 14 495001 493956 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L16B; N-terminally acetylated, binds 5.8 S rRNA; transcriptionally regulated by Rap1p; homologous to mammalian ribosomal protein L13A and bacterial L13; RPL16B has a paralog, RPL16A, that arose from the whole genome duplication -S000036374 CDS YNL069C 14 494524 493956 C 2011-02-03 1996-07-31 -S000036373 CDS YNL069C 14 495001 494974 C 2011-02-03 1996-07-31 -S000036375 intron YNL069C 14 494973 494525 C 2011-02-03 1996-07-31 -S000005012 ORF Verified YNL068C FKH2 forkhead family transcription factor FKH2 chromosome 14 L000002608 14 498289 495701 C 2011-02-03 1996-07-31 Forkhead family transcription factor; rate-limiting activator of replication origins; evolutionarily conserved regulator of lifespan; binds multiple chromosomal elements with distinct specificities, cell cycle dynamics; positively regulates transcriptional elongation; facilitates clustering, activation of early-firing replication origins; negative role in chromatin silencing at HML and HMR; major role in expression of G2/M phase genes; relocalizes to cytosol under hypoxia -S000036272 CDS YNL068C 14 498289 495701 C 2011-02-03 1996-07-31 -S000007623 ORF Dubious YNL067W-A YNL067W-B chromosome 14 14 498538 498684 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037221 CDS YNL067W-A 14 498538 498684 W 2011-02-03 2001-02-26 -S000118388 ARS ARS1420 ARSXIV-499 chromosome 14 14 498970 499154 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178172 ARS_consensus_sequence ARS1420 14 499037 499053 W 2014-11-18 2014-11-18 -S000028810 ORF Uncharacterized YNL067W-B YNL067W-A chromosome 14 14 499417 499557 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000033610 CDS YNL067W-B 14 499417 499557 W 2011-02-03 2003-07-29 -S000005011 ORF Verified YNL067W RPL9B uS4|uL6|ribosomal 60S subunit protein L9B|L6|rp24|YL11|L9B|L8B chromosome 14 L000003165 14 499681 500256 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L9B; homologous to mammalian ribosomal protein L9 and bacterial L6; RPL9B has a paralog, RPL9A, that arose from a single-locus duplication -S000036228 CDS YNL067W 14 499681 500256 W 2011-02-03 1996-07-31 -S000005010 ORF Verified YNL066W SUN4 putative glucosidase SUN4|SCW3 chromosome 14 L000004564|L000004151 14 501515 502777 W 2011-02-03 1996-07-31 Cell wall protein related to glucanases; possibly involved in cell wall septation; member of the SUN family; SUN4 has a paralog, SIM1, that arose from the whole genome duplication -S000036134 CDS YNL066W 14 501515 502777 W 2011-02-03 1996-07-31 -S000122110 five_prime_UTR_intron YNL066W 14 501157 501502 W 2011-02-03 2007-04-04 -S000005009 ORF Verified YNL065W AQR1 chromosome 14 14 503724 505484 W 2011-02-03 1996-07-31 Plasma membrane transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; confers resistance to short-chain monocarboxylic acids and quinidine; involved in the excretion of excess amino acids; AQR1 has a paralog, QDR1, that arose from the whole genome duplication; relocalizes from plasma membrane to cytoplasm upon DNA replication stress -S000036037 CDS YNL065W 14 503724 505484 W 2011-02-03 1996-07-31 -S000005008 ORF Verified YNL064C YDJ1 MAB3|type I HSP40 co-chaperone YDJ1|HSP40|MAS5 chromosome 14 L000002503|L000003567|S000029274 14 507097 505868 C 2011-02-03 1996-07-31 Type I HSP40 co-chaperone; involved in regulation of HSP90 and HSP70 functions; acts as an adaptor that helps Rsp5p recognize cytosolic misfolded proteins for ubiquitination after heat shock; critical for determining cell size at Start as a function of growth rate; involved in protein translocation across membranes; member of the DnaJ family; chimeric protein in which human p58IPK J domain replaces yeast Ydj1p J domain can complement yeast ydj1 mutant -S000035088 CDS YNL064C 14 507097 505868 C 2011-02-03 1996-07-31 -S000005007 ORF Verified YNL063W MTQ1 S-adenosylmethionine-dependent methyltransferase chromosome 14 14 507758 508702 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent methyltransferase; methylates translational release factor Mrf1p; similar to E.coli PrmC; is not an essential gene -S000035039 CDS YNL063W 14 507758 508702 W 2011-02-03 1996-07-31 -S000005006 ORF Verified YNL062C GCD10 tRNA 1-methyladenosine methyltransferase subunit GCD10|TRM6 chromosome 14 L000000676 14 510212 508776 C 2011-02-03 1996-07-31 Subunit of tRNA (1-methyladenosine) methyltransferase with Gcd14p; required for the modification of the adenine at position 58 in tRNAs, especially tRNAi-Met; first identified as a negative regulator of GCN4 expression -S000034822 CDS YNL062C 14 510212 508776 C 2011-02-03 1996-07-31 -S000005005 ORF Verified YNL061W NOP2 rRNA (cytosine-C5-)-methyltransferase NOP2|YNA1 chromosome 14 L000002535 14 510540 512396 W 2011-02-03 1996-07-31 rRNA m5C methyltransferase; methylates cytosine at position 2870 of 25S rRNA; has an essential function independent of rRNA methylation; contains seven beta-strand methyltransferase motif; essential for processing and maturation of 27S pre-rRNA and large ribosomal subunit biogenesis; localized to the nucleolus; constituent of 66S pre-ribosomal particles; rRNA methylation defect and lethality are functionally complemented by human NOP2, a gene upregulated in cancer -S000034786 CDS YNL061W 14 510540 512396 W 2011-02-03 1996-07-31 -S000005004 ORF Verified YNL059C ARP5 chromosome 14 L000003434 14 514935 512668 C 2011-02-03 1997-01-28 Nuclear actin-related protein involved in chromatin remodeling; component of chromatin-remodeling enzyme complexes; promotes nucleosome shifts in the 3 prime direction -S000031814 CDS YNL059C 14 514935 512668 C 2011-02-03 1997-01-28 -S000005002 ORF Dubious YNL057W chromosome 14 14 516403 516735 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031644 CDS YNL057W 14 516403 516735 W 2011-02-03 1997-01-28 -S000005003 ORF Uncharacterized YNL058C chromosome 14 14 516713 515763 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to vacuole; not an essential gene; YNL058C has a paralog, PRM5, that arose from the whole genome duplication -S000031675 CDS YNL058C 14 516713 515763 C 2011-02-03 1997-01-28 -S000005001 ORF Verified YNL056W OCA2 chromosome 14 14 517249 517842 W 2011-02-03 1997-01-28 Protein of unknown function; similar to predicted tyrosine phosphatases Oca1p and Siw14p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YNL056W is not an essential gene -S000031555 CDS YNL056W 14 517249 517842 W 2011-02-03 1997-01-28 -S000005000 ORF Verified YNL055C POR1 porin POR1|VDAC|YVDAC1|OMP2 chromosome 14 L000001302 14 518845 517994 C 2011-02-03 1997-01-28 Mitochondrial porin (voltage-dependent anion channel); outer membrane protein required for maintenance of mitochondrial osmotic stability and mitochondrial membrane permeability; couples the glutathione pools of the intermembrane space (IMS) and the cytosol; interacts with Om45 and Om14 in the outer membrane; phosphorylated; protein abundance increases in response to DNA replication stress -S000030679 CDS YNL055C 14 518845 517994 C 2011-02-03 1997-01-28 -S000007136 long_terminal_repeat YNLWdelta3 chromosome 14 14 519163 519496 W 2011-02-03 2000-05-19 Ty1 LTR -S000007142 LTR_retrotransposon YNLWTy1-2 Ty1 chromosome 14 14 519163 525062 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006544 tRNA_gene tD(GUC)N chromosome 14 L000003699 14 519169 519099 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030423 noncoding_exon tD(GUC)N 14 519169 519099 C 2011-02-03 2000-05-19 -S000007384 transposable_element_gene YNL054W-A gag protein chromosome 14 14 519456 520778 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000033062 CDS YNL054W-A 14 519456 520778 W 2011-02-03 1999-07-17 -S000007385 transposable_element_gene YNL054W-B gag-pol fusion protein chromosome 14 14 519456 524706 W 2011-02-03 1999-07-17 TyB Gag-Pol protein; proteolytically processed to make the Gag, reverse transcriptase (RT), protease (PR), and integrase (IN) proteins that are required for retrotransposition -S000033063 CDS YNL054W-B 14 519456 520760 W 2011-02-03 1999-07-17 -S000033064 CDS YNL054W-B 14 520762 524706 W 2011-02-03 1999-07-17 -S000033065 plus_1_translational_frameshift YNL054W-B 14 520761 520761 W 2011-02-03 1999-07-17 -S000007137 long_terminal_repeat YNLWdelta4 chromosome 14 14 524729 525062 W 2011-02-03 2000-05-19 Ty1 LTR -S000004999 ORF Verified YNL054W VAC7 chromosome 14 L000004051 14 526086 529583 W 2011-02-03 1997-01-28 Integral vacuolar membrane protein; involved in vacuole inheritance and morphology; activates Fab1p kinase activity under basal conditions and also after hyperosmotic shock -S000030639 CDS YNL054W 14 526086 529583 W 2011-02-03 1997-01-28 -S000004998 ORF Verified YNL053W MSG5 tyrosine/serine/threonine protein phosphatase MSG5 chromosome 14 L000001188 14 529942 531411 W 2011-02-03 1997-01-28 Dual-specificity protein phosphatase; exists in 2 isoforms; required for maintenance of a low level of signaling through the cell integrity pathway, adaptive response to pheromone; regulates and is regulated by Slt2p; dephosphorylates Fus3p; MSG5 has a paralog, SDP1, that arose from the whole genome duplication -S000030532 CDS YNL053W 14 529942 531411 W 2011-02-03 1997-01-28 -S000004997 ORF Verified YNL052W COX5A cytochrome c oxidase subunit Va chromosome 14 L000000388|L000000387 14 531725 532186 W 2011-02-03 1997-01-28 Subunit Va of cytochrome c oxidase; cytochrome c oxidase is the terminal member of the mitochondrial inner membrane electron transport chain; Cox5Ap is predominantly expressed during aerobic growth while its isoform Vb (Cox5Bp) is expressed during anaerobic growth; COX5A has a paralog, COX5B, that arose from the whole genome duplication -S000030467 CDS YNL052W 14 531725 532186 W 2011-02-03 1997-01-28 -S000004996 ORF Verified YNL051W COG5 Golgi transport complex subunit COG5|COD4|API4 chromosome 14 14 532659 533870 W 2011-02-03 1997-01-28 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000037658 CDS YNL051W 14 532659 533870 W 2011-02-03 1997-01-28 -S000004995 ORF Uncharacterized YNL050C chromosome 14 14 534982 534079 C 2011-02-03 1997-01-28 Putative protein of unknown function; YNL050c is not an essential gene -S000037523 CDS YNL050C 14 534874 534079 C 2011-02-03 1997-01-28 -S000037522 CDS YNL050C 14 534982 534966 C 2011-02-03 1997-01-28 -S000037524 intron YNL050C 14 534965 534875 C 2011-02-03 1997-01-28 -S000004994 ORF Verified YNL049C SFB2 COPII subunit SFB2|ISS1 chromosome 14 L000004658 14 537911 535281 C 2011-02-03 1997-01-28 Component of the Sec23p-Sfb2p heterodimer of the COPII vesicle coat; required for cargo selection during vesicle formation in ER to Golgi transport; homologous to Sfb3p; SFB2 has a paralog, SEC24, that arose from the whole genome duplication -S000036531 CDS YNL049C 14 537911 535281 C 2011-02-03 1997-01-28 -S000004993 ORF Verified YNL048W ALG11 alpha-1,2-mannosyltransferase ALG11 chromosome 14 L000003378 14 538173 539819 W 2011-02-03 1997-01-28 Alpha-1,2-mannosyltransferase; catalyzes sequential addition of the two terminal alpha 1,2-mannose residues to the Man5GlcNAc2-PP-dolichol intermediate during asparagine-linked glycosylation in the ER -S000036480 CDS YNL048W 14 538173 539819 W 2011-02-03 1997-01-28 -S000004992 ORF Verified YNL047C SLM2 phosphatidylinositol 4,5-bisphosphate-binding protein|LIT1 chromosome 14 14 541881 539911 C 2011-02-03 1997-01-28 Phosphoinositide PI4,5P(2) binding protein, forms a complex with Slm1p; acts downstream of Mss4p in a pathway regulating actin cytoskeleton organization in response to stress; TORC2 complex substrate and effector; SLM2 has a paralog, SLM1, that arose from the whole genome duplication -S000036346 CDS YNL047C 14 541881 539911 C 2011-02-03 1997-01-28 -S000004991 ORF Uncharacterized YNL046W chromosome 14 14 542304 542822 W 2011-02-03 1997-01-28 Putative protein of unknown function; expression depends on Swi5p; GFP-fusion protein localizes to the endoplasmic reticulum; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) -S000036307 CDS YNL046W 14 542304 542822 W 2011-02-03 1997-01-28 -S000004990 ORF Verified YNL045W LAP2 bifunctional aminopeptidase/epoxide hydrolase chromosome 14 14 542963 544978 W 2011-02-03 1997-01-28 Leucyl aminopeptidase yscIV with epoxide hydrolase activity; metalloenzyme containing one zinc atom; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; also known as leukotriene A4 hydrolase -S000035413 CDS YNL045W 14 542963 544978 W 2011-02-03 1997-01-28 -S000004989 ORF Verified YNL044W YIP3 chromosome 14 L000003269 14 545268 545877 W 2011-02-03 1999-11-17|1997-01-28 Protein localized to COPII vesicles; proposed to be involved in ER to Golgi transport; interacts with members of the Rab GTPase family and Yip1p; also interacts with Rtn1p -S000035328 CDS YNL044W 14 545268 545291 W 2011-02-03 1999-11-17 -S000035329 CDS YNL044W 14 545371 545877 W 2011-02-03 1999-11-17|1997-01-28 -S000035330 intron YNL044W 14 545292 545370 W 2011-02-03 1999-11-17 -S000004988 ORF Dubious YNL043C chromosome 14 14 545909 545589 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YIP3/YNL044W -S000035201 CDS YNL043C 14 545909 545589 C 2011-02-03 1997-01-28 -S000118389 ARS ARS1421 ARSXIV-546 chromosome 14 14 546072 546170 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178173 ARS_consensus_sequence ARS1421 14 546146 546130 C 2014-11-18 2014-11-18 -S000007138 long_terminal_repeat YNLWsigma2 chromosome 14 14 546423 546714 W 2011-02-03 2000-05-19 Ty3 LTR -S000007139 long_terminal_repeat YNLWsigma3 chromosome 14 14 546738 547077 W 2011-02-03 2000-05-19 Ty3 LTR -S000006685 tRNA_gene tP(UGG)N1 chromosome 14 L000003691 14 547094 547196 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin -S000030970 intron tP(UGG)N1 14 547130 547160 W 2011-02-03 2000-05-19 -S000030968 noncoding_exon tP(UGG)N1 14 547094 547129 W 2011-02-03 2000-05-19 -S000030969 noncoding_exon tP(UGG)N1 14 547161 547196 W 2011-02-03 2000-05-19 -S000028850 ORF Uncharacterized YNL042W-B chromosome 14 14 547113 547370 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000034563 CDS YNL042W-B 14 547113 547370 W 2011-02-03 2003-07-29 -S000004987 ORF Verified YNL042W BOP3 chromosome 14 L000004723 14 548100 549290 W 2011-02-03 1997-01-28 Protein of unknown function; potential Cdc28p substrate; overproduction confers resistance to methylmercury -S000035157 CDS YNL042W 14 548100 549290 W 2011-02-03 1997-01-28 -S000004986 ORF Verified YNL041C COG6 Golgi transport complex subunit COG6|SEC37|COD2 chromosome 14 14 551987 549468 C 2011-02-03 1997-01-28 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000034122 CDS YNL041C 14 551987 549468 C 2011-02-03 1997-01-28 -S000004985 ORF Verified YNL040W putative alanine--tRNA ligase chromosome 14 14 553380 554750 W 2011-02-03 1997-01-28 Protein of unknown function; has strong similarity to alanyl-tRNA synthases from Eubacteria; null mutant displays decreased translation rate and increased readthrough of premature stop codons; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YNL040W is not an essential gene -S000034091 CDS YNL040W 14 553380 554750 W 2011-02-03 1997-01-28 -S000004984 ORF Verified YNL039W BDP1 transcription factor TFIIIB subunit BDP1|TFC7|TFIIIB90|TFC5 chromosome 14 L000003032 14 555048 556832 W 2011-02-03 1997-01-28 Essential subunit of RNA polymerase III transcription factor (TFIIIB); TFIIIB is involved in transcription of genes encoding tRNAs, 5S rRNA, U6 snRNA, and other small RNAs -S000032264 CDS YNL039W 14 555048 556832 W 2011-02-03 1997-01-28 -S000004983 ORF Verified YNL038W GPI15 phosphatidylinositol N-acetylglucosaminyltransferase GPI15 chromosome 14 14 557020 557783 W 2011-02-03 2003-09-27|1997-01-28 Protein involved in the synthesis of GlcNAc-PI; GlcNAc-PI is the first intermediate in the synthesis of glycosylphosphatidylinositol (GPI) anchors; homologous to the human PIG-H protein; GlcNAc-PI stands for N-acetylglucosaminyl phosphatidylinositol -S000032181 CDS YNL038W 14 557020 557610 W 2011-02-03 2003-09-27|1997-01-28 -S000032182 CDS YNL038W 14 557685 557783 W 2011-02-03 2003-09-27 -S000032183 intron YNL038W 14 557611 557684 W 2011-02-03 2003-09-27 -S000004982 ORF Verified YNL037C IDH1 isocitrate dehydrogenase (NAD(+)) IDH1 chromosome 14 L000000849 14 559002 557920 C 2011-02-03 1997-01-28 Subunit of mitochondrial NAD(+)-dependent isocitrate dehydrogenase; complex catalyzes the oxidation of isocitrate to alpha-ketoglutarate in the TCA cycle -S000032073 CDS YNL037C 14 559002 557920 C 2011-02-03 1997-01-28 -S000004981 ORF Verified YNL036W NCE103 carbonate dehydratase NCE103|NCE3 chromosome 14 L000003213 14 559814 560479 W 2011-02-03 1997-01-28 Carbonic anhydrase; metalloenzyme that catalyzes CO2 hydration to bicarbonate, which is an important metabolic substrate, and protons; not expressed under conditions of high CO2, such as inside a growing colony, but transcription is induced in response to low CO2 levels, such as on the colony surface in ambient air; poorly transcribed under aerobic conditions and at an undetectable level under anaerobic conditions; abundance increases in response to DNA replication stress -S000032012 CDS YNL036W 14 559814 560479 W 2011-02-03 1997-01-28 -S000006745 tRNA_gene tT(AGU)N2 chromosome 14 L000003698 14 560765 560693 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000037431 noncoding_exon tT(AGU)N2 14 560765 560693 C 2011-02-03 2000-05-19 -S000118390 ARS ARS1422 ARSXIV-561 chromosome 14 14 561111 561388 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178174 ARS_consensus_sequence ARS1422 14 561327 561311 C 2014-11-18 2014-11-18 -S000007141 long_terminal_repeat YNLWtau2 chromosome 14 14 561607 561977 W 2011-02-03 2000-05-19 Ty4 LTR -S000007131 long_terminal_repeat YNLCdelta5 chromosome 14 14 562364 562033 C 2011-02-03 2000-05-19 Ty2 LTR -S000007135 LTR_retrotransposon YNLCTy2-1 Ty2 chromosome 14 14 567660 562364 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C -S000007132 long_terminal_repeat YNLCdelta6 chromosome 14 14 567992 567660 C 2011-02-03 2000-05-19 Ty2 LTR -S000006686 tRNA_gene tP(UGG)N2 chromosome 14 L000003692 14 568115 568217 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin -S000030974 intron tP(UGG)N2 14 568151 568181 W 2011-02-03 2000-05-19 -S000030972 noncoding_exon tP(UGG)N2 14 568115 568150 W 2011-02-03 2000-05-19 -S000030973 noncoding_exon tP(UGG)N2 14 568182 568217 W 2011-02-03 2000-05-19 -S000130143 ARS ARS1423 chromosome 14 14 568219 568524 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004980 ORF Verified YNL035C chromosome 14 14 569691 568522 C 2011-02-03 1997-01-28 Nuclear protein of unknown function; relocalizes to the cytosol in response to hypoxia; contains WD-40 domains; not an essential gene; protein abundance increases in response to DNA replication stress -S000031007 CDS YNL035C 14 569691 568522 C 2011-02-03 1997-01-28 -S000006609 tRNA_gene tI(AAU)N1 chromosome 14 L000003697 14 569940 569867 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000034901 noncoding_exon tI(AAU)N1 14 569940 569867 C 2011-02-03 2000-05-19 -S000004979 ORF Uncharacterized YNL034W chromosome 14 14 570477 572315 W 2011-02-03 1997-01-28 Putative protein of unknown function; not an essential gene; YNL034W has a paralog, YNL018C, that arose from a segmental duplication -S000030964 CDS YNL034W 14 570477 572315 W 2011-02-03 1997-01-28 -S000004978 ORF Uncharacterized YNL033W chromosome 14 14 572999 573853 W 2011-02-03 1997-01-28 Putative protein of unknown function; YNL033W has a paralog, YNL019C, that arose from a segmental duplication -S000030908 CDS YNL033W 14 572999 573853 W 2011-02-03 1997-01-28 -S000004977 ORF Verified YNL032W SIW14 putative tyrosine protein phosphatase SIW14|OCA3 chromosome 14 L000004216 14 574506 575351 W 2011-02-03 1997-01-28 Tyrosine phosphatase involved in actin organization and endocytosis; localized to the cytoplasm -S000030820 CDS YNL032W 14 574506 575351 W 2011-02-03 1997-01-28 -S000004976 ORF Verified YNL031C HHT2 histone H3 chromosome 14 L000000773 14 576050 575640 C 2011-02-03 1997-01-28 Histone H3; core histone protein required for chromatin assembly, part of heterochromatin-mediated telomeric and HM silencing; one of two identical histone H3 proteins (see HHT1); regulated by acetylation, methylation, and phosphorylation; H3K14 acetylation plays an important role in the unfolding of strongly positioned nucleosomes during repair of UV damage -S000037842 CDS YNL031C 14 576050 575640 C 2011-02-03 1997-01-28 -S000004975 ORF Verified YNL030W HHF2 histone H4 chromosome 14 L000000771 14 576727 577038 W 2011-02-03 1997-01-28 Histone H4; core histone protein required for chromatin assembly and chromosome function; one of two identical histone proteins (see also HHF1); contributes to telomeric silencing; N-terminal domain involved in maintaining genomic integrity -S000037800 CDS YNL030W 14 576727 577038 W 2011-02-03 1997-01-28 -S000004973 ORF Dubious YNL028W chromosome 14 14 578679 578996 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036923 CDS YNL028W 14 578679 578996 W 2011-02-03 1997-01-28 -S000004974 ORF Verified YNL029C KTR5 putative mannosyltransferase chromosome 14 L000004099 14 578773 577205 C 2011-02-03 1997-01-28 Putative mannosyltransferase involved in protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; KTR5 has a paralog, KTR7, that arose from the whole genome duplication -S000036950 CDS YNL029C 14 578773 577205 C 2011-02-03 1997-01-28 -S000004972 ORF Verified YNL027W CRZ1 DNA-binding transcription factor CRZ1|TCN1|HAL8 chromosome 14 L000004202 14 579580 581616 W 2011-02-03 1997-01-28 Transcription factor, activates transcription of stress response genes; nuclear localization is positively regulated by calcineurin-mediated dephosphorylation; rapidly localizes to the nucleus under blue light stress; can be activated in stochastic pulses of nuclear localization in response to calcium -S000036172 CDS YNL027W 14 579580 581616 W 2011-02-03 1997-01-28 -S000004971 ORF Verified YNL026W SAM50 SAM complex subunit SAM50|TOB55|OMP85 chromosome 14 14 581920 583374 W 2011-02-03 1997-01-28 Component of the Sorting and Assembly Machinery (SAM) complex; the SAM (or TOB) complex is located in the mitochondrial outer membrane; the complex binds precursors of beta-barrel proteins and facilitates their outer membrane insertion; homologous to bacterial Omp85 -S000035990 CDS YNL026W 14 581920 583374 W 2011-02-03 1997-01-28 -S000004970 ORF Verified YNL025C SSN8 cyclin-dependent protein serine/threonine kinase regulator SSN8|CNC1|CycC|RYE2|UME3|SRB11|NUT9|GIG3 chromosome 14 L000002796 14 585291 584320 C 2011-02-03 1997-01-28 Cyclin-like component of the RNA polymerase II holoenzyme; involved in phosphorylation of the RNA polymerase II C-terminal domain; forms a kinase-cyclin pair in the RNAPII holoenzyme with Ssn3p; required for both entry into and execution of the meiotic program; involved in glucose repression and telomere maintenance; cyclin homolog 35% identical to human cyclin C -S000034989 CDS YNL025C 14 585291 584320 C 2011-02-03 1997-01-28 -S000007436 snoRNA_gene NME1 NME1 RRP2 chromosome 14 L000001258 14 585587 585926 W 2011-02-03 2000-05-19 RNA component of RNase MRP; RNase MRP cleaves pre-rRNA and has a role in cell cycle-regulated degradation of daughter cell-specific mRNAs; human ortholog is implicated in cartilage-hair hypoplasia (CHH) -S000032302 noncoding_exon NME1 14 585587 585926 W 2011-02-03 2000-05-19 -S000006457 snoRNA_gene snR66 SNR66 chromosome 14 L000004535 14 586090 586175 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2417 -S000030852 noncoding_exon snR66 14 586090 586175 W 2011-02-03 2000-05-19 -S000028698 ORF Verified YNL024C-A KSH1 chromosome 14 14 586820 586602 C 2011-02-03 2003-07-29 Essential protein suggested to function early in the secretory pathway; inviability is suppressed by overexpression of Golgi protein Tvp23p; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and cytosol respectively; ortholog of human Kish -S000032608 CDS YNL024C-A 14 586820 586602 C 2011-02-03 2003-07-29 -S000004969 ORF Uncharacterized YNL024C EFM6 putative protein-lysine N-methyltransferase chromosome 14 14 587847 587107 C 2011-02-03 1997-01-28 Putative S-adenosylmethionine-dependent lysine methyltransferase; responsible for modifying Lys-390 in translational elongation factor EF-1 alpha (eEF1A); has seven beta-strand methyltransferase motif; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000034856 CDS YNL024C 14 587847 587107 C 2011-02-03 1997-01-28 -S000004968 ORF Verified YNL023C FAP1 chromosome 14 L000004577 14 591160 588263 C 2011-02-03 1997-01-28 Protein that binds to Fpr1p; confers rapamycin resistance by competing with rapamycin for Fpr1p binding; accumulates in the nucleus upon treatment of cells with rapamycin; has similarity to D. melanogaster shuttle craft and human NFX1 -S000034736 CDS YNL023C 14 591160 588263 C 2011-02-03 1997-01-28 -S000004967 ORF Verified YNL022C RCM1 rRNA (cytosine-C5-)-methyltransferase RCM1 chromosome 14 14 592899 591427 C 2011-02-03 1997-01-28 rRNA m5C methyltransferase; methylates cytosine at position 2278 of 25S rRNA while Nop2p methylates cytosine at position 2870; contains seven beta-strand methyltransferase motif; localized to the nucleolus; interacts with Trm112p; homolog of NSUN5A, a human gene which is deleted in Williams-Beuren Syndrome -S000033831 CDS YNL022C 14 592899 591427 C 2011-02-03 1997-01-28 -S000004966 ORF Verified YNL021W HDA1 histone deacetylase HDA1 chromosome 14 L000004088 14 593227 595347 W 2011-02-03 1997-01-28 Putative catalytic subunit of a class II histone deacetylase complex; role in azole resistance via Hsp90p, and in the heat shock response; Hda1p interacts with the Hda2p-Hda3p subcomplex to form an active tetramer; deletion increases histone H2B, H3 and H4 acetylation; other members of the HDA1 histone deacetylase complex are Hda2p and Hda3p -S000033782 CDS YNL021W 14 593227 595347 W 2011-02-03 1997-01-28 -S000004965 ORF Verified YNL020C ARK1 serine/threonine protein kinase ARK1 chromosome 14 L000004430 14 597539 595623 C 2011-02-03 1997-01-28 Serine/threonine protein kinase; involved in regulation of the cortical actin cytoskeleton; involved in control of endocytosis; ARK1 has a paralog, PRK1, that arose from the whole genome duplication -S000033598 CDS YNL020C 14 597539 595623 C 2011-02-03 1997-01-28 -S000004964 ORF Uncharacterized YNL019C chromosome 14 14 599230 598376 C 2011-02-03 1997-01-28 Putative protein of unknown function; expression induced during heat stress; YNL019C has a paralog, YNL033W, that arose from a segmental duplication -S000032941 CDS YNL019C 14 599230 598376 C 2011-02-03 1997-01-28 -S000004963 ORF Uncharacterized YNL018C chromosome 14 14 601774 599936 C 2011-02-03 1997-01-28 Putative protein of unknown function; YNL018C has a paralog, YNL034W, that arose from a segmental duplication -S000032852 CDS YNL018C 14 601774 599936 C 2011-02-03 1997-01-28 -S000006610 tRNA_gene tI(AAU)N2 chromosome 14 L000003693 14 602312 602385 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000034903 noncoding_exon tI(AAU)N2 14 602312 602385 W 2011-02-03 2000-05-19 -S000004962 ORF Dubious YNL017C chromosome 14 14 602476 602138 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the tRNA ORF tI(AAU)N2 -S000031913 CDS YNL017C 14 602476 602138 C 2011-02-03 1997-01-28 -S000004961 ORF Verified YNL016W PUB1 RNP1 chromosome 14 L000001529 14 602907 604268 W 2011-02-03 1997-01-28 Poly (A)+ RNA-binding protein; abundant mRNP-component protein that binds mRNA and is required for stability of many mRNAs; component of glucose deprivation induced stress granules, involved in P-body-dependent granule assembly; implicated in regulation of translation; carries Q/N-rich domain at C- terminus, identified as candidate prion; human homolog Tia1 is critical for normal synaptic plasticity; protein abundance increases in response to DNA replication stress -S000031862 CDS YNL016W 14 602907 604268 W 2011-02-03 1997-01-28 -S000004960 ORF Verified YNL015W PBI2 IB2|I2B|LMA1 chromosome 14 L000001344 14 605384 605611 W 2011-02-03 1997-01-28 Cytosolic inhibitor of vacuolar proteinase B (PRB1); required for efficient vacuole inheritance; with thioredoxin forms protein complex LMA1, which assists in priming SNARE molecules and promotes vacuole fusion; protein abundance increases in response to DNA replication stress -S000031753 CDS YNL015W 14 605384 605611 W 2011-02-03 1997-01-28 -S000004959 ORF Verified YNL014W HEF3 translation elongation factor EF-3|ZRG7 chromosome 14 14 606319 609453 W 2011-02-03 1997-01-28 Translational elongation factor EF-3; member of the ABC superfamily; stimulates EF-1 alpha-dependent binding of aminoacyl-tRNA by the ribosome; normally expressed in zinc deficient cells; HEF3 has a paralog, YEF3, that arose from the whole genome duplication -S000031664 CDS YNL014W 14 606319 609453 W 2011-02-03 1997-01-28 -S000004958 ORF Dubious YNL013C chromosome 14 14 609510 609133 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF HEF3/YNL014W -S000031500 CDS YNL013C 14 609510 609133 C 2011-02-03 1997-01-28 -S000118391 ARS ARS1424 ARSXIV-610 chromosome 14 14 609520 609607 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178175 ARS_consensus_sequence ARS1424 14 609532 609548 W 2014-11-18 2014-11-18 -S000004957 ORF Verified YNL012W SPO1 putative carboxylic ester hydrolase chromosome 14 L000001999 14 609686 611665 W -1 2011-02-03 2000-07-14|1997-01-28 Meiosis-specific prospore protein; required for meiotic spindle pole body duplication and separation; required to produce bending force necessary for proper prospore membrane assembly during sporulation; has similarity to phospholipase B -S000030704 CDS YNL012W 14 609686 609790 W 2011-02-03 2000-07-14 -S000030705 CDS YNL012W 14 609875 611665 W 2011-02-03 2000-07-14|1997-01-28 -S000030706 intron YNL012W 14 609791 609874 W 2011-02-03 2000-07-14 -S000004956 ORF Uncharacterized YNL011C chromosome 14 14 613170 611836 C 2011-02-03 1997-01-28 Putative protein of unknown function; YNL011C is not an essential gene -S000030538 CDS YNL011C 14 613170 611836 C 2011-02-03 1997-01-28 -S000004955 ORF Uncharacterized YNL010W putative phosphoric monoester hydrolase chromosome 14 14 613635 614360 W 2011-02-03 1997-01-28 Putative protein of unknown function; similar to phosphoserine phosphatases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; homozygous diploid mutant shows an increase in glycogen accumulation -S000030490 CDS YNL010W 14 613635 614360 W 2011-02-03 1997-01-28 -S000004954 ORF Verified YNL009W IDP3 isocitrate dehydrogenase (NADP(+)) IDP3 chromosome 14 L000003946 14 614821 616083 W 2011-02-03 1997-01-28 Peroxisomal NADP-dependent isocitrate dehydrogenase; catalyzes oxidation of isocitrate to alpha-ketoglutarate with the formation of NADP(H+), required for growth on unsaturated fatty acids; IDP3 has a paralog, IDP2, that arose from the whole genome duplication -S000037693 CDS YNL009W 14 614821 616083 W 2011-02-03 1997-01-28 -S000130144 ARS ARS1425 chromosome 14 14 616311 617125 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000004953 ORF Verified YNL008C ASI3 putative ubiquitin-protein ligase ASI3 chromosome 14 14 618241 616211 C 2011-02-03 1997-01-28|2011-02-03 Subunit of the inner nuclear membrane Asi ubiquitin ligase complex; Asi complex targets both misfolded proteins of the inner nuclear membrane-associated degradation (INMAD) pathway and regulators of sterol biosynthesis for ubiquitin-mediated degradation; acts with Asi1p and Asi2p to ensure the fidelity of SPS-sensor signaling by targeting latent unprocessed forms of Stp1p and Stp2p, maintaining the repressed state of gene expression in the absence of inducing amino acids -S000037593 CDS YNL008C 14 618241 616211 C 2011-02-03 1997-01-28|2011-02-03 -S000004952 ORF Verified YNL007C SIS1 type II HSP40 co-chaperone SIS1 chromosome 14 L000001898 14 619565 618507 C 3 2011-02-03 1997-01-28 Type II HSP40 co-chaperone that interacts with the HSP70 protein Ssa1p; shuttles between cytosol and nucleus; mediates delivery of misfolded proteins into the nucleus for degradation; involved in proteasomal degradation of misfolded cytosolic proteins; protein abundance increases in response to DNA replication stress; polyQ aggregates sequester Sis1p and interfere with clearance of misfolded proteins; similar to bacterial DnaJ proteins and mammalian DnaJB1 -S000036851 CDS YNL007C 14 619565 618507 C 2011-02-03 1997-01-28 -S000004951 ORF Verified YNL006W LST8 TOR complex subunit LST8 chromosome 14 L000004356 14 620067 620978 W 2011-02-03 1997-01-28 Protein required for the transport of Gap1p; required for the transport of amino acid permease Gap1p from the Golgi to the cell surface; component of the TOR signaling pathway; associates with both Tor1p and Tor2p; contains a WD-repeat -S000036826 CDS YNL006W 14 620067 620978 W 2011-02-03 1997-01-28 -S000004950 ORF Verified YNL005C MRP7 mitochondrial 54S ribosomal protein YmL2|YmL2|MRPL2 chromosome 14 L000002682|S000029309|L000001155|L000003239 14 622428 621313 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit -S000036741 CDS YNL005C 14 622428 621313 C 2011-02-03 1997-01-28 -S000004949 ORF Verified YNL004W HRB1 mRNA-binding protein|TOM34 chromosome 14 L000002318 14 622915 624621 W 2011-02-03 1997-01-28|2007-07-09 Poly(A+) RNA-binding protein; key surveillance factor for the selective export of spliced mRNAs from the nucleus to the cytoplasm; preference for intron-containing genes; similar to Npl3p; HRB1 has a paralog, GBP2, that arose from the whole genome duplication -S000036718 CDS YNL004W 14 622915 622944 W 2011-02-03 1997-01-28|2007-07-09 -S000123273 CDS YNL004W 14 623287 624621 W 2011-02-03 2007-07-09 -S000123272 intron YNL004W 14 622945 623286 W 2011-02-03 2007-07-09 -S000004948 ORF Verified YNL003C PET8 SAM5 chromosome 14 L000001385 14 625829 624975 C 3 2011-02-03 1997-01-28 S-adenosylmethionine transporter of the mitochondrial inner membrane; member of the mitochondrial carrier family; required for biotin biosynthesis and respiratory growth -S000035777 CDS YNL003C 14 625829 624975 C 2011-02-03 1997-01-28 -S000004947 ORF Verified YNL002C RLP7 RPL7 chromosome 14 L000001647 14 627142 626174 C 2011-02-03 1997-01-28 Nucleolar protein similar to large ribosomal subunit L7 proteins; constituent of 66S pre-ribosomal particles; plays an essential role in processing of precursors to the large ribosomal subunit RNAs; binds junction of ITS2 and ITS2-proximal stem between the 3' end of 5.8S rRNA and the 5' end of 25S rRNA -S000035659 CDS YNL002C 14 627142 626174 C 2011-02-03 1997-01-28 -S000004946 ORF Verified YNL001W DOM34 ribosome dissociation factor DOM34 chromosome 14 L000000517 14 627456 628616 W 2011-02-03 1997-01-28 Protein that facilitates ribosomal subunit dissociation; Dom34-Hbs1 complex and Rli1p have roles in dissociating inactive ribosomes to facilitate translation restart, particularly ribosomes stalled in 3' UTRs; required for RNA cleavage in no-go decay, but reports conflict on endonuclease activity; Pelota ortholog; protein abundance increases in response to DNA replication stress; DOM34 has a paralog, YCL001W-B, that arose from the whole genome duplication -S000035621 CDS YNL001W 14 627456 628616 W 2011-02-03 1997-01-28 -S000006475 centromere CEN14 CEN14 chromosome 14 L000000307 14 628758 628875 W 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XIV centromere -S000077302 centromere_DNA_Element_I CEN14 14 628758 628767 W 2011-02-03 2004-10-08 -S000077303 centromere_DNA_Element_II CEN14 14 628768 628850 W 2011-02-03 2004-10-08 -S000077304 centromere_DNA_Element_III CEN14 14 628851 628875 W 2011-02-03 2004-10-08 -S000005284 ORF Verified YNR001C CIT1 citrate (Si)-synthase CIT1|LYS6|CS1 chromosome 14 L000000341 14 631061 629622 C 2011-02-03 1997-01-28 Citrate synthase; catalyzes the condensation of acetyl coenzyme A and oxaloacetate to form citrate; the rate-limiting enzyme of the TCA cycle; nuclear encoded mitochondrial protein; CIT1 has a paralog, CIT2, that arose from the whole genome duplication -S000031441 CDS YNR001C 14 631061 629622 C 2011-02-03 1997-01-28 -S000007625 ORF Dubious YNR001W-A chromosome 14 14 631263 631481 W 2011-02-03 2001-02-26 Dubious open reading frame unlikely to encode a functional protein; identified by homology -S000037252 CDS YNR001W-A 14 631263 631481 W 2011-02-03 2001-02-26 -S000006679 tRNA_gene tP(AGG)N SUF10 chromosome 14 L000002158|L000003696 14 631917 631846 C -3 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in proline codons -S000033281 noncoding_exon tP(AGG)N 14 631917 631846 C 2011-02-03 2000-05-19 -S000007143 long_terminal_repeat YNRCdelta7 chromosome 14 14 632114 631998 C 2011-02-03 2000-05-19 Ty1 LTR -S000007146 long_terminal_repeat YNRCtau3 chromosome 14 14 632489 632119 C 2011-02-03 2000-05-19 Ty4 LTR -S000006674 tRNA_gene tN(GUU)N2 chromosome 14 L000003694 14 632599 632672 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000035574 noncoding_exon tN(GUU)N2 14 632599 632672 W 2011-02-03 2000-05-19 -S000005285 ORF Verified YNR002C ATO2 putative ammonium permease ATO2|FUN34 chromosome 14 L000000647 14 633856 633008 C 2011-02-03 1997-01-28 Putative transmembrane protein involved in export of ammonia; ammonia is a starvation signal that promotes cell death in aging colonies; phosphorylated in mitochondria; member of the TC 9.B.33 YaaH family; homolog of Y. lipolytica Gpr1p; ATO2 has a paralog, ADY2, that arose from the whole genome duplication -S000031565 CDS YNR002C 14 633856 633008 C 2011-02-03 1997-01-28 -S000028705 ORF Dubious YNR003W-A chromosome 14 14 634420 634518 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene RPC34/YNR003C -S000032645 CDS YNR003W-A 14 634420 634518 W 2011-02-03 2003-07-29 -S000005286 ORF Verified YNR003C RPC34 DNA-directed RNA polymerase III subunit C34|C34 chromosome 14 L000001689 14 635297 634344 C 3 2011-02-03 1997-01-28 RNA polymerase III subunit C34; interacts with TFIIIB70 and is a key determinant in pol III recruitment by the preinitiation complex -S000031697 CDS YNR003C 14 635297 634344 C 2011-02-03 1997-01-28 -S000118392 ARS ARS1426 ARSXIV-636 chromosome 14 14 635664 635904 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178176 ARS_consensus_sequence ARS1426 14 635831 635815 C 2014-11-18 2014-11-18 -S000005287 ORF Verified YNR004W SWM2 chromosome 14 14 635943 636383 W 2011-02-03 1997-01-28 Protein with a role in snRNA and snoRNA cap trimethylation; interacts with Tgs1p and shows similar phenotypes; required for trimethylation of the caps of spliceosomal snRNAs and the U3 snoRNA, and for efficient 3' end processing of U3 snoRNA; may act as a specificity factor for Tgs1p -S000032703 CDS YNR004W 14 635943 636383 W 2011-02-03 1997-01-28 -S000005289 ORF Verified YNR006W VPS27 ESCRT-0 subunit protein VPS27|DID7|VPT27|VPL23|SSV17|GRD11 chromosome 14 L000002790 14 636986 638854 W 2011-02-03 1997-01-28 Endosomal protein that forms a complex with Hse1p; required for recycling Golgi proteins, forming lumenal membranes and sorting ubiquitinated proteins destined for degradation; has Ubiquitin Interaction Motifs which bind ubiquitin (Ubi4p) -S000032897 CDS YNR006W 14 636986 638854 W 2011-02-03 1997-01-28 -S000005288 ORF Dubious YNR005C chromosome 14 14 637335 636931 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032733 CDS YNR005C 14 637335 636931 C 2011-02-03 1997-01-28 -S000005290 ORF Verified YNR007C ATG3 AUT1|APG3 chromosome 14 L000004056|L000004783 14 640114 639182 C 2011-02-03 1997-01-28 E2-like enzyme; involved in autophagy and cytoplasm-to-vacuole targeting (Cvt) pathway; plays a role in formation of Atg8p-phosphatidylethanolamine conjugates, which are involved in membrane dynamics during autophagy and Cvt; interaction with Atg8p regulated by acetylation by NuA4 histone acetyltransferase Esa1p while attenuation of Atg3 acetylation is mediated by histone deacetylase Rpd3p; Atg12p-Atg5p conjugate enhances E2 activity of Atg3p by rearranging its catalytic site -S000034825 CDS YNR007C 14 640114 639182 C 2011-02-03 1997-01-28 -S000005291 ORF Verified YNR008W LRO1 phospholipid:diacylglycerol acyltransferase chromosome 14 S000007453 14 640396 642381 W 2011-02-03 1997-01-28 Acyltransferase that catalyzes diacylglycerol esterification; one of several acyltransferases that contribute to triglyceride synthesis; Lro1p and Dga1p can O-acylate ceramides; putative homolog of human lecithin cholesterol acyltransferase -S000035018 CDS YNR008W 14 640396 642381 W 2011-02-03 1997-01-28 -S000005292 ORF Verified YNR009W NRM1 chromosome 14 S000080164 14 642690 643439 W 2011-02-03 1997-01-28 Transcriptional co-repressor of MBF-regulated gene expression; Nrm1p associates stably with promoters via MCB binding factor (MBF) to repress transcription upon exit from G1 phase -S000035110 CDS YNR009W 14 642690 643439 W 2011-02-03 1997-01-28 -S000005293 ORF Verified YNR010W CSE2 MED9 chromosome 14 L000000426 14 643744 644193 W 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; component of the Middle domain of mediator; required for regulation of RNA polymerase II activity; relocalizes to the cytosol in response to hypoxia -S000034052 CDS YNR010W 14 643744 644193 W 2011-02-03 1997-01-28 -S000005294 ORF Verified YNR011C PRP2 DEAH-box RNA-dependent ATPase PRP2|RNA2 chromosome 14 L000001495 14 646950 644320 C 8 2011-02-03 1997-01-28 RNA-dependent DExD/H-box ATPase; required for activation of spliceosome before first transesterification step in RNA splicing; implicated in rearranging and proofreading snRNA structure in catalytic activation of spliceosome; ortholog of human protein DHX16 -S000034087 CDS YNR011C 14 646950 644320 C 2011-02-03 1997-01-28 -S000005295 ORF Verified YNR012W URK1 uridine kinase URK1 chromosome 14 L000002440 14 647432 648937 W 2011-02-03 1997-01-28 Uridine/cytidine kinase; component of the pyrimidine ribonucleotide salvage pathway that converts uridine into UMP and cytidine into CMP; involved in the pyrimidine deoxyribonucleotide salvage pathway, converting deoxycytidine into dCMP -S000035092 CDS YNR012W 14 647432 648937 W 2011-02-03 1997-01-28 -S000005296 ORF Verified YNR013C PHO91 chromosome 14 14 651712 649028 C 2011-02-03 1997-01-28 Low-affinity vacuolar phosphate transporter; exports phosphate from the vacuolar lumen to the cytosol; regulates phosphate and polyphosphate metabolism; acts upstream of Pho81p in regulation of the PHO pathway; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs); deletion of pho84, pho87, pho89, pho90, and pho91 causes synthetic lethality; transcription independent of Pi and Pho4p activity; overexpression results in vigorous growth -S000035190 CDS YNR013C 14 651712 649028 C 2011-02-03 1997-01-28 -S000005297 ORF Uncharacterized YNR014W chromosome 14 14 652465 653103 W 2011-02-03 1997-01-28 Putative protein of unknown function; expression is cell-cycle regulated, Azf1p-dependent, and heat-inducible; YNR014W has a paralog, YMR206W, that arose from the whole genome duplication -S000036187 CDS YNR014W 14 652465 653103 W 2011-02-03 1997-01-28 -S000005298 ORF Verified YNR015W SMM1 DUS2 chromosome 14 L000003407 14 653387 654541 W 2011-02-03 1997-01-28 Dihydrouridine synthase; member of a family of dihydrouridine synthases including Dus1p, Smm1p, Dus3p, and Dus4p; modifies uridine residues at position 20 of cytoplasmic tRNAs -S000036301 CDS YNR015W 14 653387 654541 W 2011-02-03 1997-01-28 -S000005299 ORF Verified YNR016C ACC1 acetyl-CoA carboxylase ACC1|MTR7|FAS3|ABP2 chromosome 14 L000000017|L000000014|L000000603 14 661374 654673 C 2011-02-03 1997-01-28 Acetyl-CoA carboxylase, biotin containing enzyme; catalyzes carboxylation of cytosolic acetyl-CoA to form malonyl-CoA and regulates histone acetylation by regulating the availablity of acetyl-CoA; required for de novo biosynthesis of long-chain fatty acids; ACC1 has a paralog, HFA1, that arose from the whole genome duplication -S000036342 CDS YNR016C 14 661374 654673 C 2011-02-03 1997-01-28 -S000005300 ORF Verified YNR017W TIM23 protein transporter TIM23|MAS6|MPI3|MIM23 chromosome 14 L000001140|L000001028 14 662913 663581 W 2011-02-03 1997-01-28 Essential component of the TIM23 complex; involved in protein import into mitochondrial matrix and inner membrane; with Tim17p, contributes to architecture and function of the import channel; TIM23 complex is short for the translocase of the inner mitochondrial membrane -S000036476 CDS YNR017W 14 662913 663581 W 2011-02-03 1997-01-28 -S000005301 ORF Verified YNR018W RCF2 AIM38 chromosome 14 14 664270 664944 W 2011-02-03 1997-01-28 Cytochrome c oxidase subunit; has a role in assembly of respiratory supercomplexes; similar to Rcf1p, and either Rcf1p or Rcf2p is required for late-stage assembly of the Cox12p and Cox13p subunits and for cytochrome c oxidase activity; associates with the cytochrome c oxidase - cytochrome bc1 supercomplex; null mutant accumulates reactive oxygen species; member of the conserved hypoxia induced gene family; C. elegans homolog is functional in yeast -S000037162 CDS YNR018W 14 664270 664944 W 2011-02-03 1997-01-28 -S000005302 ORF Verified YNR019W ARE2 sterol acyltransferase|SAT1 chromosome 14 L000003220|L000002769 14 665339 667267 W 2011-02-03 1997-01-28 Acyl-CoA:sterol acyltransferase; endoplasmic reticulum enzyme that contributes the major sterol esterification activity in the presence of oxygen; ARE2 has a paralog, ARE1, that arose from the whole genome duplication -S000037242 CDS YNR019W 14 665339 667267 W 2011-02-03 1997-01-28 -S000005303 ORF Verified YNR020C ATP23 putative metalloprotease chromosome 14 14 668222 667410 C 2011-02-03 1997-01-28 Putative metalloprotease of the mitochondrial inner membrane; required for processing of Atp6p; has an additional role in assembly of the F0 sector of the F1F0 ATP synthase complex; substrate of the Mia40p-Erv1p disulfide relay system, and folding is assisted by Mia40p -S000030232 CDS YNR020C 14 668222 667410 C 2011-02-03 1997-01-28 -S000005304 ORF Uncharacterized YNR021W chromosome 14 14 668377 669591 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YNR021W is not an essential gene -S000031253 CDS YNR021W 14 668377 669591 W 2011-02-03 1997-01-28 -S000005305 ORF Verified YNR022C MRPL50 mitochondrial 54S ribosomal protein MRPL50 chromosome 14 14 670193 669774 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; not essential for mitochondrial translation -S000031291 CDS YNR022C 14 670193 669774 C 2011-02-03 1997-01-28 -S000005306 ORF Verified YNR023W SNF12 SWP73 chromosome 14 L000003408 14 670418 672118 W 2011-02-03 1997-01-28 73 kDa subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; relocates to the cytosol under hypoxic conditions; deletion mutants are temperature-sensitive; SNF12 has a paralog, RSC6, that arose from the whole genome duplication -S000032359 CDS YNR023W 14 670418 672118 W 2011-02-03 1997-01-28 -S000005307 ORF Verified YNR024W MPP6 chromosome 14 14 672409 672969 W 2011-02-03 1997-01-28 Nuclear exosome-associated RNA binding protein; involved in surveillance of pre-rRNAs and pre-mRNAs, and the degradation of cryptic non-coding RNAs (ncRNA); copurifies with ribosomes; relocalizes to the cytosol in response to hypoxia -S000032477 CDS YNR024W 14 672409 672969 W 2011-02-03 1997-01-28 -S000005308 ORF Dubious YNR025C chromosome 14 14 673061 672702 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion reduces expression of PIS1 gene encoding phosphatidylinositol synthase -S000032509 CDS YNR025C 14 673061 672702 C 2011-02-03 1997-01-28 -S000005309 ORF Verified YNR026C SEC12 Sar family guanine nucleotide exchange factor SEC12|SED2 chromosome 14 L000001837 14 674689 673274 C 2011-02-03 1997-01-28 Guanine nucleotide exchange factor (GEF); activates Sar1p by catalyzing the exchange of GDP for GTP; required for the initiation of COPII vesicle formation in ER to Golgi transport; glycosylated integral membrane protein of the ER; SEC12 has a paralog, SED4, that arose from the whole genome duplication -S000032620 CDS YNR026C 14 674689 673274 C 2011-02-03 1997-01-28 -S000005310 ORF Verified YNR027W BUD17 putative pyridoxal kinase BUD17 chromosome 14 14 674923 675876 W 2011-02-03 1997-01-28 Putative pyridoxal kinase; a key enzyme in vitamin B6 metabolism; involved in bud-site selection; diploid mutants display a random rather than a bipolar budding pattern; similarity to yeast BUD16 and human pyridoxal kinase (PDXK) -S000033356 CDS YNR027W 14 674923 675876 W 2011-02-03 1997-01-28 -S000005311 ORF Verified YNR028W CPR8 peptidylprolyl isomerase family protein CPR8 chromosome 14 L000004349 14 676177 677103 W 2011-02-03 1997-01-28 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; potential role in the secretory pathway; CPR8 has a paralog, CPR4, that arose from the whole genome duplication -S000033423 CDS YNR028W 14 676177 677103 W 2011-02-03 1997-01-28 -S000005312 ORF Uncharacterized YNR029C chromosome 14 14 678488 677199 C 2011-02-03 1997-01-28 Putative protein of unknown function; deletion confers reduced fitness in saline -S000033458 CDS YNR029C 14 678488 677199 C 2011-02-03 1997-01-28 -S000005313 ORF Verified YNR030W ALG12 dolichyl-P-Man:Man(7)GlcNAc(2)-PP-dolichol alpha-1,6-mannosyltransferase|ECM39 chromosome 14 L000003906 14 678799 680454 W 2011-02-03 1997-01-28 Alpha-1,6-mannosyltransferase localized to the ER; responsible for addition of alpha-1,6 mannose to dolichol-linked Man7GlcNAc2; acts in the dolichol pathway for N-glycosylation; human homolog ALG12 complements yeast null mutant -S000034448 CDS YNR030W 14 678799 680454 W 2011-02-03 1997-01-28 -S000005314 ORF Verified YNR031C SSK2 mitogen-activated protein kinase kinase kinase SSK2 chromosome 14 L000002826 14 685433 680694 C 2011-02-03 1997-01-28 MAP kinase kinase kinase of HOG1 mitogen-activated signaling pathway; interacts with Ssk1p, leading to autophosphorylation and activation of Ssk2p which phosphorylates Pbs2p; also mediates actin cytoskeleton recovery from osmotic stress; a HOG-independent function of Ssk2p mediates the calcium-sensitive phenotype of the ptp2 msg5 double disruptant; SSK2 has a paralog, SSK22, that arose from the whole genome duplication -S000034513 CDS YNR031C 14 685433 680694 C 2011-02-03 1997-01-28 -S000005315 ORF Verified YNR032W PPG1 putative serine/threonine-protein kinase PPG1 chromosome 14 L000001470 14 686010 687116 W 2011-02-03 1997-01-28 Putative serine/threonine protein phosphatase; putative phosphatase of the type 2A-like phosphatase family, required for glycogen accumulation; interacts with Tap42p, which binds to and regulates other protein phosphatases -S000035579 CDS YNR032W 14 686010 687116 W 2011-02-03 1997-01-28 -S000007251 ORF Verified YNR032C-A HUB1 ubiquitin-like protein HUB1 chromosome 14 14 687464 687243 C 2011-02-03 1999-07-17 Ubiquitin-like protein modifier; promotes alternative splicing of SRC1 pre-mRNA; binds non-covalently to the HIND domain of Snu66, may function in modification of Sph1p and Hbt1p, functionally complemented by the human or S. pombe ortholog; mechanism of Hub1p adduct formation not yet clear -S000030977 CDS YNR032C-A 14 687464 687243 C 2011-02-03 1999-07-17 -S000005316 ORF Verified YNR033W ABZ1 4-amino-4-deoxychorismate synthase chromosome 14 L000000015 14 687635 689998 W 2011-02-03 1997-01-28 Para-aminobenzoate (PABA) synthase; has similarity to Escherichia coli PABA synthase components PabA and PabB; required for the synthesis of para-aminobenzoic acid, an important intermediate for folate and ubiquinone Q biosynthesis; protein abundance increases in response to DNA replication stress -S000035655 CDS YNR033W 14 687635 689998 W 2011-02-03 1997-01-28 -S000005317 ORF Verified YNR034W SOL1 chromosome 14 L000003102 14 690321 691286 W 2011-02-03 1997-01-28 Protein with a possible role in tRNA export; shows similarity to 6-phosphogluconolactonase non-catalytic domains but does not exhibit this enzymatic activity; homologous to Sol3p and Sol4p; SOL1 has a paralog, SOL2, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000035772 CDS YNR034W 14 690321 691286 W 2011-02-03 1997-01-28 -S000118393 ARS ARS1427 ARSXIV-692 chromosome 14 14 691486 691730 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178177 ARS_consensus_sequence ARS1427 14 691678 691662 C 2014-11-18 2014-11-18 -S000007525 ORF Verified YNR034W-A EGO4 chromosome 14 14 692561 692857 W 2011-02-03 2000-07-14 Protein of unknown function; expression is regulated by Msn2p/Msn4p; YNR034W-A has a paralog, YCR075W-A, that arose from the whole genome duplication -S000037062 CDS YNR034W-A 14 692561 692857 W 2011-02-03 2000-07-14 -S000005318 ORF Verified YNR035C ARC35 END9 chromosome 14 L000004558|L000004035 14 694047 693019 C 2011-02-03 1997-01-28 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches; required for cortical localization of calmodulin -S000036635 CDS YNR035C 14 694047 693019 C 2011-02-03 1997-01-28 -S000005319 ORF Verified YNR036C MRPS12 putative mitochondrial 37S ribosomal protein MRPS12 chromosome 14 14 694822 694361 C 2011-02-03 1997-01-28 Mitochondrial protein; may interact with ribosomes based on co-purification experiments; similar to E. coli and human mitochondrial S12 ribosomal proteins -S000036702 CDS YNR036C 14 694822 694361 C 2011-02-03 1997-01-28 -S000005320 ORF Verified YNR037C RSM19 mitochondrial 37S ribosomal protein RSM19 chromosome 14 14 695327 695052 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S19 ribosomal protein -S000036762 CDS YNR037C 14 695327 695052 C 2011-02-03 1997-01-28 -S000005321 ORF Verified YNR038W DBP6 putative ATP-dependent RNA helicase DBP6 chromosome 14 L000003940 14 695595 697484 W 2011-02-03 1997-01-28 Essential protein involved in ribosome biogenesis; putative ATP-dependent RNA helicase of the DEAD-box protein family; human homolog DDX51 complements yeast dbp6 mutant -S000036850 CDS YNR038W 14 695595 697484 W 2011-02-03 1997-01-28 -S000005322 ORF Verified YNR039C ZRG17 Zn(2+) transporter ZRG17 chromosome 14 S000007519 14 699431 697614 C 2011-02-03 1997-01-28 Endoplasmic reticulum zinc transporter; part of a heterodimeric transporter with Msc2p that transfers zinc from the cytosol to the ER lumen; member of the cation diffusion facilitator family of efflux pumps; zinc-regulated directly through Zap1p; transcription induced under conditions of zinc deficiency -S000036872 CDS YNR039C 14 699431 697614 C 2011-02-03 1997-01-28 -S000005323 ORF Uncharacterized YNR040W chromosome 14 14 699690 700460 W 2011-02-03 1997-01-28 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000037624 CDS YNR040W 14 699690 700460 W 2011-02-03 1997-01-28 -S000005325 ORF Dubious YNR042W chromosome 14 14 701238 701666 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene COQ2 -S000030522 CDS YNR042W 14 701238 701666 W 2011-02-03 1997-01-28 -S000005324 ORF Verified YNR041C COQ2 4-hydroxybenzoate octaprenyltransferase chromosome 14 L000000379 14 701659 700541 C 2011-02-03 1997-01-28 Para hydroxybenzoate polyprenyl transferase; catalyzes the second step in ubiquinone (coenzyme Q) biosynthesis; human COQ2, mutations in which are implicated in an increased risk of mutiple-system atrophy, can complement a yeast coq2 null mutant -S000037655 CDS YNR041C 14 701659 700541 C 2011-02-03 1997-01-28 -S000005326 ORF Verified YNR043W MVD1 diphosphomevalonate decarboxylase MVD1|ERG19 chromosome 14 L000003136 14 701895 703085 W 2011-02-03 1997-01-28 Mevalonate pyrophosphate decarboxylase; essential enzyme involved in the biosynthesis of isoprenoids and sterols, including ergosterol; acts as a homodimer -S000030635 CDS YNR043W 14 701895 703085 W 2011-02-03 1997-01-28 -S000005327 ORF Verified YNR044W AGA1 chromosome 14 L000000061 14 703699 705876 W 42 2011-02-03 1997-01-28 Anchorage subunit of a-agglutinin of a-cells; highly O-glycosylated protein with N-terminal secretion signal and C-terminal signal for addition of GPI anchor to cell wall, linked to adhesion subunit Aga2p via two disulfide bonds; AGA1 has a paralog, FIG2, that arose from the whole genome duplication -S000031496 CDS YNR044W 14 703699 705876 W 2011-02-03 1997-01-28 -S000005328 ORF Verified YNR045W PET494 chromosome 14 L000001402 14 706139 707608 W 42 2011-02-03 1997-01-28 Mitochondrial translational activator specific for the COX3 mRNA; acts together with Pet54p and Pet122p; located in the mitochondrial inner membrane -S000031585 CDS YNR045W 14 706139 707608 W 2011-02-03 1997-01-28 -S000005329 ORF Verified YNR046W TRM112 RNA methylation protein TRM112 chromosome 14 S000079653 14 707788 708195 W 2011-02-03 1997-01-28 Protein involved in methylation of tRNA, rRNA, and translation factors; also involved in ribosome biogenesis; subunit of tRNA methyltransferase (MTase) complexes in combination with Trm9p and Trm11p; N7-methylates G1575 of 18S rRNA as complex with Bud23p; subunit of complex with Mtq2p that methylates Sup45p (eRF1) in the ternary complex eRF1-eRF3-GTP; relative distribution to the nucleus increases upon DNA replication stress; functional homolog of human TRMT112 -S000031700 CDS YNR046W 14 707788 708195 W 2011-02-03 1997-01-28 -S000005330 ORF Verified YNR047W FPK1 serine/threonine protein kinase FPK1 chromosome 14 14 708523 711204 W 2011-02-03 1997-01-28 Ser/Thr protein kinase; phosphorylates several aminophospholipid translocase family members, regulating phospholipid translocation and membrane asymmetry; phosphorylates and inhibits upstream inhibitory kinase, Ypk1p; localizes to the cytoplasm, early endosome/TGN compartments and thplasma membrane; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone; FPK1 has a paralog, KIN82, that arose from the whole genome duplication -S000031803 CDS YNR047W 14 708523 711204 W 2011-02-03 1997-01-28 -S000005331 ORF Verified YNR048W putative aminophospholipid translocase regulatory protein|CRF1 chromosome 14 14 711630 712811 W 2011-02-03 1997-01-28 Potential noncatalytic subunit for phospholipid translocase Dnf3p; YNR048W has a paralog, CDC50, that arose from the whole genome duplication -S000031910 CDS YNR048W 14 711630 712811 W 2011-02-03 1997-01-28 -S000005332 ORF Verified YNR049C MSO1 chromosome 14 L000003070 14 713655 713023 C 2011-02-03 1997-01-28 Lipid-interacting protein in SNARE complex assembly machinery; acts at late step in secretion; interacts with membranes through two distinct binding sites; shows genetic and physical interactions with Sec1p; required for prospore membrane formation during sporulation; N-terminus closely associates with plasma membrane, C-terminus colocalizes with Sec4p on intracellular membranes; relocalizes from bud neck to nucleus upon DNA replication stress -S000032764 CDS YNR049C 14 713655 713023 C 2011-02-03 1997-01-28 -S000005333 ORF Verified YNR050C LYS9 saccharopine dehydrogenase (NADP+, L-glutamate-forming)|LYS13 chromosome 14 L000000969 14 715388 714048 C 44 2011-02-03 1997-01-28 Saccharopine dehydrogenase (NADP+, L-glutamate-forming); catalyzes the formation of saccharopine from alpha-aminoadipate 6-semialdehyde, the seventh step in lysine biosynthesis pathway; exhibits genetic and physical interactions with TRM112 -S000032832 CDS YNR050C 14 715388 714048 C 2011-02-03 1997-01-28 -S000007460 snoRNA_gene snR49 SNR49 chromosome 14 14 716120 716284 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U990 and small subunit (SSU) rRNA at positions U120, U211, and U302 -S000030653 noncoding_exon snR49 14 716120 716284 W 2011-02-03 2000-05-19 -S000005334 ORF Verified YNR051C BRE5 chromosome 14 14 718327 716780 C 2011-02-03 1997-01-28 Ubiquitin protease cofactor; forms deubiquitination complex with Ubp3p that coregulates anterograde and retrograde transport between the endoplasmic reticulum and Golgi compartments; null is sensitive to brefeldin A -S000033539 CDS YNR051C 14 718327 716780 C 2011-02-03 1997-01-28 -S000005335 ORF Verified YNR052C POP2 CCR4-NOT core DEDD family RNase subunit POP2|CAF1 chromosome 14 L000001465 14 720647 719346 C 2011-02-03 1997-01-28 RNase of the DEDD superfamily; subunit of the Ccr4-Not complex that mediates 3' to 5' mRNA deadenylation -S000033632 CDS YNR052C 14 720647 719346 C 2011-02-03 1997-01-28 -S000029463 snoRNA_gene snR191 SNR191 chromosome 14 S000028465 14 722211 721938 C 2011-02-03 2003-12-09 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U2258 and U2260; encoded within the intron of NOG2/YNR053C -S000034351 noncoding_exon snR191 14 722211 721938 C 2011-02-03 2003-12-09 -S000005336 ORF Verified YNR053C NOG2 putative GTPase NOG2|NUG2 chromosome 14 14 723112 721120 C 2011-02-03 1997-01-28|2011-02-03 Putative GTPase; associates with pre-60S ribosomal subunits in the nucleolus and is required for their nuclear export and maturation; recruited by ribosomal proteins L17, L35, and L37 to assembling ribosomes after 27SB pre-rRNA is generated, immediately preceding removal of ITS2 -S000033758 CDS YNR053C 14 721770 721120 C 2011-02-03 1997-01-28 -S000033757 CDS YNR053C 14 723112 722303 C 2011-02-03 1997-01-28 -S000033759 intron YNR053C 14 722302 721771 C 2011-02-03 1997-01-28|2011-02-03 -S000005337 ORF Verified YNR054C ESF2 RNA-binding ATPase activator ESF2|ABT1 chromosome 14 14 724306 723356 C 2011-02-03 1997-01-28 Essential nucleolar protein involved in pre-18S rRNA processing; binds to RNA and stimulates ATPase activity of Dbp8; involved in assembly of the small subunit (SSU) processome -S000034628 CDS YNR054C 14 724306 723356 C 2011-02-03 1997-01-28 -S000006653 tRNA_gene tL(UAA)N chromosome 14 L000003695 14 726217 726134 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000037416 noncoding_exon tL(UAA)N 14 726217 726134 C 2011-02-03 2000-05-19 -S000007147 long_terminal_repeat YNRWsigma4 chromosome 14 14 726234 726574 W 2011-02-03 2000-05-19 Ty3 LTR -S000007144 long_terminal_repeat YNRCdelta8 chromosome 14 14 726945 726614 C 2011-02-03 2000-05-19 Ty1 LTR -S000007145 long_terminal_repeat YNRCdelta9 chromosome 14 14 727661 727363 C 2011-02-03 2000-05-19 Ty1 LTR -S000005338 ORF Verified YNR055C HOL1 chromosome 14 L000000798 14 730186 728426 C 48 2011-02-03 1997-01-28 Putative transporter in the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; mutations in membrane-spanning domains permit cation and histidinol uptake -S000034785 CDS YNR055C 14 730186 728426 C 2011-02-03 1997-01-28 -S000005339 ORF Verified YNR056C BIO5 chromosome 14 L000003530 14 733303 731618 C 2011-02-03 1997-01-28 Putative transmembrane protein involved in the biotin biosynthesis; responsible for uptake of 7-keto 8-aminopelargonic acid; BIO5 is in a cluster of 3 genes (BIO3, BIO4, and BIO5) that mediate biotin synthesis -S000034927 CDS YNR056C 14 733303 731618 C 2011-02-03 1997-01-28 -S000005340 ORF Verified YNR057C BIO4 dethiobiotin synthase chromosome 14 L000003307 14 734069 733356 C 2011-02-03 1997-01-28 Dethiobiotin synthetase; catalyzes the third step in the biotin biosynthesis pathway; BIO4 is in a cluster of 3 genes (BIO3, BIO4, and BIO5) that mediate biotin synthesis; BIO3 and BIO4 were acquired by horizontal gene transfer (HGT) from bacteria; expression appears to be repressed at low iron levels -S000035846 CDS YNR057C 14 734069 733356 C 2011-02-03 1997-01-28 -S000005341 ORF Verified YNR058W BIO3 adenosylmethionine-8-amino-7-oxononanoate transaminase chromosome 14 L000003176 14 734291 735733 W 2011-02-03 1997-01-28 7,8-diamino-pelargonic acid aminotransferase (DAPA); catalyzes the second step in the biotin biosynthesis pathway; BIO3 is in a cluster of 3 genes (BIO3, BIO4, and BIO5) that mediate biotin synthesis; BIO3 and BIO4 were acquired by horizontal gene transfer (HGT) from bacteria -S000036073 CDS YNR058W 14 734291 735733 W 2011-02-03 1997-01-28 -S000005342 ORF Verified YNR059W MNT4 putative alpha-1,3-mannosyltransferase chromosome 14 14 736803 738545 W 2011-02-03 1997-01-28 Putative alpha-1,3-mannosyltransferase; not required for protein O-glycosylation; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000036222 CDS YNR059W 14 736803 738545 W 2011-02-03 1997-01-28 -S000005343 ORF Verified YNR060W FRE4 ferric-chelate reductase chromosome 14 L000003556 14 739951 742110 W 2011-02-03 1997-01-28 Ferric reductase; reduces a specific subset of siderophore-bound iron prior to uptake by transporters; expression induced by low iron levels -S000036976 CDS YNR060W 14 739951 742110 W 2011-02-03 1997-01-28 -S000005344 ORF Verified YNR061C chromosome 14 14 743540 742881 C 2011-02-03 1997-01-28 Protein of unknown function; relocalizes from vacuole to cytoplasm upon DNA replication stress -S000037708 CDS YNR061C 14 743540 742881 C 2011-02-03 1997-01-28 -S000005345 ORF Uncharacterized YNR062C chromosome 14 14 745343 744360 C 2011-02-03 1997-01-28 Putative membrane protein of unknown function -S000037784 CDS YNR062C 14 745343 744360 C 2011-02-03 1997-01-28 -S000005346 ORF Uncharacterized YNR063W chromosome 14 14 746943 748766 W 2011-02-03 1997-01-28 Putative zinc-cluster protein of unknown function -S000029847 CDS YNR063W 14 746943 748766 W 2011-02-03 1997-01-28 -S000005347 ORF Verified YNR064C epoxide hydrolase chromosome 14 14 750008 749136 C 2011-02-03 1997-01-28 Epoxide hydrolase; member of the alpha/beta hydrolase fold family; may have a role in detoxification of epoxides -S000030815 CDS YNR064C 14 750008 749136 C 2011-02-03 1997-01-28 -S000005348 ORF Uncharacterized YNR065C YSN1 chromosome 14 14 753700 750350 C 2011-02-03 1997-01-28 Protein of unknown function; protein-protein interactions suggest a possible role in actin patch formation; YNR065C is not an essential gene -S000030902 CDS YNR065C 14 753700 750350 C 2011-02-03 1997-01-28 -S000005349 ORF Uncharacterized YNR066C chromosome 14 14 755035 753725 C 2011-02-03 1997-01-28 Putative membrane-localized protein of unknown function -S000030952 CDS YNR066C 14 755035 753725 C 2011-02-03 1997-01-28 -S000005350 ORF Verified YNR067C DSE4 endo-1,3(4)-beta-glucanase|ENG1 chromosome 14 14 759099 755746 C 2011-02-03 1997-01-28 Daughter cell-specific secreted protein with similarity to glucanases; degrades cell wall from the daughter side causing daughter to separate from mother -S000031043 CDS YNR067C 14 759099 755746 C 2011-02-03 1997-01-28 -S000005351 ORF Uncharacterized YNR068C BUL3 chromosome 14 14 760885 760067 C 2011-02-03 1997-01-28 Putative protein of unknown function; exhibits homology to C-terminal end of Bul1p; expressed as a readthrough product of BSC5, the readthrough locus being termed BUL3; the BUL3 readthrough product is involved in ubiquitin-mediated sorting of plasma membrane proteins and interacts with WW domains of Rsp5p in vitro, but in a functionally different way than the non-readthrough form -S000032003 CDS YNR068C 14 760885 760067 C 2011-02-03 1997-01-28 -S000005352 ORF Verified YNR069C BSC5 BUL3 chromosome 14 14 762592 761123 C 2011-02-03 1997-01-28 Protein of unknown function; shows homology with N-terminal end of Bul1p; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; readthrough expression includes YNR068C and the locus for this readthrough is termed BUL3; Bul3p is involved in ubiquitin-mediated sorting of plasma membrane proteins; readthrough and shortened forms of Bul3p interact with Rsp5p differently in vitro -S000032095 CDS YNR069C 14 762592 761123 C 2011-02-03 1997-01-28 -S000005353 ORF Verified YNR070W PDR18 ATP-binding cassette multidrug transporter PDR18 chromosome 14 14 765375 769376 W 2011-02-03 1997-01-28|2011-02-03 Putative transporter of the ATP-binding cassette (ABC) family; role in plasma membrane sterol incorporation; implicated in pleiotropic drug resistance; provides resistance to ethanol stress and contributes to a decreased intracellular accumulation of ethanol; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033201 CDS YNR070W 14 765375 769376 W 2011-02-03 1997-01-28|2011-02-03 -S000005354 ORF Uncharacterized YNR071C aldose 1-epimerase superfamily protein chromosome 14 14 771468 770440 C 2011-02-03 1997-01-28 Putative aldose 1-epimerase -S000033956 CDS YNR071C 14 771468 770440 C 2011-02-03 1997-01-28 -S000005355 ORF Verified YNR072W HXT17 HLT4|hexose transporter HXT17 chromosome 14 L000003265 14 772657 774351 W 2011-02-03 1997-01-28 Putative transmembrane polyol transporter; supports growth on and uptake of mannitol and sorbitol with moderate affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; induced by raffinose and galactose at pH 7.7 versus pH 4.7, repressed by high levels of glucose; HXT17 has a paralog, HXT13, that arose from a segmental duplication -S000034105 CDS YNR072W 14 772657 774351 W 2011-02-03 1997-01-28 -S000005356 ORF Verified YNR073C MAN2 putative mannitol dehydrogenase chromosome 14 14 776300 774792 C 2011-02-03 1997-01-28 Mannitol dehydrogenase; MAN2 has a paralog, DSF1, that arose from a segmental duplication -S000034161 CDS YNR073C 14 776300 774792 C 2011-02-03 1997-01-28 -S000005357 ORF Verified YNR074C AIF1 CPD1 chromosome 14 14 778738 777602 C 2011-02-03 1997-01-28 Mitochondrial cell death effector; translocates to the nucleus in response to apoptotic stimuli, homolog of mammalian Apoptosis-Inducing Factor, putative reductase -S000035101 CDS YNR074C 14 778738 777602 C 2011-02-03 1997-01-28 -S000005358 ORF Verified YNR075W COS10 chromosome 14 L000004068 14 779916 781040 W 2011-02-03 1997-01-28 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000035300 CDS YNR075W 14 779916 781040 W 2011-02-03 1997-01-28 -S000028706 ORF Uncharacterized YNR075C-A chromosome 14 14 781603 781511 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032648 CDS YNR075C-A 14 781603 781511 C 2011-02-03 2003-07-29 -S000005359 ORF Verified YNR076W PAU6 seripauperin PAU6 chromosome 14 L000002880 14 781918 782280 W 2011-02-03 1997-01-28 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme; identical to Pau18p -S000035359 CDS YNR076W 14 781918 782280 W 2011-02-03 1997-01-28 -S000028993 telomere TEL14R chromosome 14 14 783278 784333 W 54 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XIV; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats -S000028994 telomeric_repeat TEL14R 14 784038 784333 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XIV -S000028995 X_element TEL14R 14 783278 783740 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XIV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YNR077C -S000028996 X_element_combinatorial_repeat TEL14R 14 783741 784037 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XIV; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000005360 ORF Uncharacterized YNR077C chromosome 14 14 783541 783287 C 2011-02-03 1997-01-28 Protein of unknown function, abundance changes with carbon source -S000035391 CDS YNR077C 14 783541 783287 C 2011-02-03 1997-01-28 -S000028709 ORF Uncharacterized YOL166W-A chromosome 15 15 585 740 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032654 CDS YOL166W-A 15 585 740 W 2003-07-29 2003-07-29 -S000028929 telomere TEL15L chromosome 15 15 847 1 C -132 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XV; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats -S000028930 telomeric_repeat TEL15L 15 117 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XV -S000028931 X_element TEL15L 15 847 389 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YOL166W-A -S000028932 X_element_combinatorial_repeat TEL15L 15 388 118 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XV; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000005526 ORF Dubious YOL166C chromosome 15 15 1338 1000 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036497 CDS YOL166C 15 1338 1000 C 1996-07-31 1996-07-31 -S000005525 ORF Verified YOL165C AAD15 putative aryl-alcohol dehydrogenase chromosome 15 L000004640 15 2078 1647 C 1996-07-31 1996-07-31 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; AAD15 has a paralog, AAD3, that arose from a segmental duplication; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family -S000035578 CDS YOL165C 15 2078 1647 C 1996-07-31 1996-07-31 -S000007148 long_terminal_repeat YOLCdelta1 chromosome 15 15 3223 2894 C 2000-05-19 2000-05-19 Ty1 LTR -S000007160 long_terminal_repeat YOLWtau1 chromosome 15 15 3809 3986 W 2000-05-19 2000-05-19 Ty4 LTR -S000028580 ORF Uncharacterized YOL164W-A chromosome 15 15 4130 4312 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031327 CDS YOL164W-A 15 4130 4312 W 2003-07-29 2003-07-29 -S000005524 ORF Verified YOL164W BDS1 sulfuric ester hydrolase chromosome 15 15 6175 8115 W 1996-07-31 1996-07-31 Bacterially-derived sulfatase; required for use of alkyl- and aryl-sulfates as sulfur sources -S000035536 CDS YOL164W 15 6175 8115 W 1996-07-31 1996-07-31 -S000005523 ORF Uncharacterized YOL163W chromosome 15 15 9597 10106 W 2011-02-03 1996-07-31 Putative protein of unknown function; member of the Dal5p subfamily of the major facilitator family -S000035451 CDS YOL163W 15 9597 10106 W 2011-02-03 1996-07-31 -S000005522 ORF Uncharacterized YOL162W chromosome 15 15 10119 10766 W 2011-02-03 1996-07-31 Putative protein of unknown function; member of the Dal5p subfamily of the major facilitator family -S000034399 CDS YOL162W 15 10119 10766 W 2011-02-03 1996-07-31 -S000005521 ORF Verified YOL161C PAU20 seripauperin PAU20 chromosome 15 15 11911 11549 C 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole; expression induced by low temperature and also by anaerobic conditions; induced during alcoholic fermentation -S000034226 CDS YOL161C 15 11911 11549 C 2011-02-03 1996-07-31 -S000005520 ORF Dubious YOL160W chromosome 15 15 14313 14654 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034155 CDS YOL160W 15 14313 14654 W 2011-02-03 1996-07-31 -S000007627 ORF Verified YOL159C-A chromosome 15 15 15505 15233 C 2011-02-03 2001-02-26 Protein of unknown function; overexpression affects endocytic protein trafficking; identified by sequence comparison with hemiascomycetous yeast species -S000037257 CDS YOL159C-A 15 15505 15233 C 2011-02-03 2001-02-26 -S000005519 ORF Verified YOL159C CSS3 chromosome 15 15 17796 17281 C 2011-02-03 1996-07-31 Protein of unknown function, secreted when constitutively expressed; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cell periphery, SWAT-GFP fusion also localizes to the extracellular region, and mCherry fusion also localizes to the vacuole; deletion mutants are viable and have elevated levels of Ty1 retrotransposition and Ty1 cDNA -S000034633 CDS YOL159C 15 17796 17281 C 2011-02-03 1996-07-31 -S000007149 long_terminal_repeat YOLCdelta2 chromosome 15 15 18561 18302 C 2011-02-03 2000-05-19 Ty1 LTR -S000005518 ORF Verified YOL158C ENB1 ARN4 chromosome 15 15 21311 19491 C 2011-02-03 1996-07-31 Endosomal ferric enterobactin transporter; expressed under conditions of iron deprivation; member of the major facilitator superfamily; expression is regulated by Rcs1p and affected by chloroquine treatment -S000034544 CDS YOL158C 15 21311 19491 C 2011-02-03 1996-07-31 -S000005517 ORF Verified YOL157C IMA2 oligo-1,6-glucosidase IMA2 chromosome 15 15 24294 22525 C 2011-02-03 1996-07-31 Isomaltase (alpha-1,6-glucosidase/alpha-methylglucosidase); preferred specificity for isomaltose, alpha-methylglucoside, and palatinose, but also exhibits alpha-1,2 glucosidase activity on sucrose and kojibiose, and can cleave the 1,3-alpha linkage of nigerose and turanose and the alpha-1,5 linkage of leucrose in vitro; not required for isomaltose utilization, but Ima2p overexpression allows the ima1 null mutant to grow on isomaltose -S000034426 CDS YOL157C 15 24294 22525 C 2011-02-03 1996-07-31 -S000005516 ORF Verified YOL156W HXT11 hexose transporter HXT11|LGT3 chromosome 15 L000000947 15 25273 26976 W 2011-02-03 1996-07-31 Hexose transporter; capable of transporting a broad range of substrates including: glucose, fructose, mannose and galactose; polyol transporter that supports the growth on and uptake of xylitol with low affinity when overexpressed in a strain deleted for hexose family members; nearly identical in sequence to Hxt9p; has similarity to major facilitator superfamily (MFS) transporters; involved in pleiotropic drug resistance -S000032470 CDS YOL156W 15 25273 26976 W 2011-02-03 1996-07-31 -S000028855 ORF Uncharacterized YOL155W-A chromosome 15 15 27084 27218 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034568 CDS YOL155W-A 15 27084 27218 W 2011-02-03 2003-07-29 -S000005515 ORF Verified YOL155C HPF1 mannoprotein chromosome 15 15 31606 28703 C 2011-02-03 1996-07-31 Haze-protective mannoprotein; reduces the particle size of aggregated proteins in white wines -S000032305 CDS YOL155C 15 31606 28703 C 2011-02-03 1996-07-31 -S000005514 ORF Verified YOL154W ZPS1 chromosome 15 15 34658 35407 W 2011-02-03 1996-07-31 Putative GPI-anchored protein; transcription is induced under low-zinc conditions, as mediated by the Zap1p transcription factor, and at alkaline pH -S000032261 CDS YOL154W 15 34658 35407 W 2011-02-03 1996-07-31 -S000118995 ARS ARS1531 ARSXV-36|ARS1506.5 chromosome 15 15 35669 35904 2011-02-03 2006-10-02|2011-02-03 Autonomously Replicating Sequence -S000178178 ARS_consensus_sequence ARS1531 15 35713 35729 W 2014-11-18 2014-11-18 -S000005513 blocked_reading_frame YOL153C chromosome 15 15 38567 36822 C 2011-02-03 1996-07-31 Blocked reading frame, contains two in-frame stops in translation; this ORF is conserved, without the stops, in Saccharomyces paradoxus, S. mikatae, and S. bayanus; RNA sequencing data indicate the presence of a transcription unit at this reading frame -S000031205 CDS YOL153C 15 38567 36822 C 2011-02-03 1996-07-31 -S000005512 ORF Verified YOL152W FRE7 putative ferric-chelate reductase chromosome 15 L000003559 15 40748 42610 W 2011-02-03 1996-07-31|2006-01-05 Putative ferric reductase with similarity to Fre2p; expression induced by low copper levels -S000031126 CDS YOL152W 15 40748 42610 W 2011-02-03 1996-07-31|2006-01-05 -S000005511 ORF Verified YOL151W GRE2 methylglyoxal reductase (NADPH-dependent) GRE2 chromosome 15 L000004177 15 43694 44722 W 2011-02-03 1996-07-31 3-methylbutanal reductase and NADPH-dependent methylglyoxal reductase; stress induced (osmotic, ionic, oxidative, heat shock and heavy metals); regulated by the HOG pathway; restores resistance to glycolaldehyde by coupling reduction of glycolaldehyde to ethylene glycol and oxidation of NADPH to NADP+; protein abundance increases in response to DNA replication stress; methylglyoxal reductase (NADPH-dependent) is also known as D-lactaldehyde dehydrogenase -S000031026 CDS YOL151W 15 43694 44722 W 2011-02-03 1996-07-31 -S000005510 ORF Dubious YOL150C chromosome 15 15 44784 44473 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029963 CDS YOL150C 15 44784 44473 C 2011-02-03 1996-07-31 -S000005509 ORF Verified YOL149W DCP1 MRT2 chromosome 15 L000002960|L000003045|S000029311 15 44938 45633 W 2011-02-03 1996-07-31 Subunit of the Dcp1p-Dcp2p decapping enzyme complex; decapping complex removes the 5' cap structure from mRNAs prior to their degradation; enhances the activity of catalytic subunit Dcp2p; regulated by DEAD box protein Dhh1p; forms cytoplasmic foci upon DNA replication stress -S000030376 CDS YOL149W 15 44938 45633 W 2011-02-03 1996-07-31 -S000005508 ORF Verified YOL148C SPT20 ADA5 chromosome 15 L000002593 15 47574 45760 C 2011-02-03 1996-07-31 Subunit of the SAGA transcriptional regulatory complex; involved in maintaining the integrity of the complex; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay -S000030163 CDS YOL148C 15 47574 45760 C 2011-02-03 1996-07-31 -S000005507 ORF Verified YOL147C PEX11 PMP27|PMP24 chromosome 15 L000002650|L000004117 15 48643 47933 C 2011-02-03 1996-07-31 Peroxisomal protein required for medium-chain fatty acid oxidation; also required for peroxisome proliferation, possibly by inducing membrane curvature; localization regulated by phosphorylation; transcription regulated by Adr1p and Pip2p-Oaf1p -S000036432 CDS YOL147C 15 48643 47933 C 2011-02-03 1996-07-31 -S000005506 ORF Verified YOL146W PSF3 DNA replication protein PSF3 chromosome 15 15 48864 49448 W 2011-02-03 2003-09-22|1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery -S000036403 CDS YOL146W 15 48864 49448 W 2011-02-03 2003-09-22|1996-07-31 -S000005505 ORF Verified YOL145C CTR9 CDP1 chromosome 15 L000003477 15 52788 49555 C 2011-02-03 1996-07-31|2011-02-03 Component of the Paf1p complex involved in transcription elongation; binds to and modulates the activity of RNA polymerases I and II; required for expression of a subset of genes, including cyclin genes; involved in SER3 repression by helping to maintain SRG1 transcription-dependent nucleosome occupancy; contains TPR repeats -S000036252 CDS YOL145C 15 52788 49555 C 2011-02-03 1996-07-31|2011-02-03 -S000005504 ORF Verified YOL144W NOP8 chromosome 15 L000004849 15 53098 54552 W 2011-02-03 1996-07-31 Nucleolar protein required for 60S ribosomal subunit biogenesis -S000036206 CDS YOL144W 15 53098 54552 W 2011-02-03 1996-07-31 -S000005503 ORF Verified YOL143C RIB4 lumazine synthase RIB4 chromosome 15 L000003027 15 55104 54595 C 2011-02-03 1996-07-31 Lumazine synthase (DMRL synthase); catalyzes synthesis of immediate precursor to riboflavin; DMRL synthase stands for 6,7-dimethyl-8-ribityllumazine synthase -S000035226 CDS YOL143C 15 55104 54595 C 2011-02-03 1996-07-31 -S000005502 ORF Verified YOL142W RRP40 exosome non-catalytic core subunit RRP40|MTR14 chromosome 15 L000004799 15 55558 56280 W 2011-02-03 1996-07-31|2011-02-03 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; predicted to contain both S1 and KH RNA binding domains; has similarity to human hRrp40p (EXOSC3) -S000035132 CDS YOL142W 15 55558 56280 W 2011-02-03 1996-07-31|2011-02-03 -S000005501 ORF Verified YOL141W PPM2 tRNA methyltransferase PPM2|TYW4 chromosome 15 15 56452 58539 W 2011-02-03 1996-07-31|2011-02-03 AdoMet-dependent tRNA methyltransferase; also involved in methoxycarbonylation; required for the synthesis of wybutosine (yW), a modified guanosine found at the 3'-position adjacent to the anticodon of phe-tRNA; similarity to Ppm1p -S000034965 CDS YOL141W 15 56452 58539 W 2011-02-03 1996-07-31|2011-02-03 -S000077073 matrix_attachment_site ETC2 ETC2 chromosome 15 15 58541 58563 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; remains predominantly localized to the nuclear periphery throughout cell cycle; located between PPM2 and ARG8 -S000005500 ORF Verified YOL140W ARG8 acetylornithine transaminase chromosome 15 L000000111 15 58759 60030 W -130 2006-01-05 1996-07-31 Acetylornithine aminotransferase; catalyzes the fourth step in the biosynthesis of the arginine precursor ornithine -S000034835 CDS YOL140W 15 58759 60030 W 2006-01-05 1996-07-31 -S000005499 ORF Verified YOL139C CDC33 translation initiation factor eIF4E|eIF4E|TIF45 chromosome 15 L000000270 15 61024 60383 C 2006-01-05 1996-07-31 mRNA cap binding protein and translation initiation factor eIF4E; the eIF4E-cap complex is responsible for mediating cap-dependent mRNA translation via interactions with translation initiation factor eIF4G (Tif4631p or Tif4632p); protein abundance increases in response to DNA replication stress; mutants are defective for adhesion and pseudohyphal growth; human homolog EIF4E can complement yeast cdc33 null mutant -S000035358 CDS YOL139C 15 61024 60383 C 2006-01-05 1996-07-31 -S000005498 ORF Verified YOL138C RTC1 SEA2 chromosome 15 15 65350 61325 C 2006-01-05 1996-07-31|2011-02-03 Subunit of SEACAT, a subcomplex of the SEA complex; Rtc1p, along with Mtc5p and Sea4p, redundantly inhibit the TORC1 inhibitory role of the Iml1p/SEACIT (Iml1p-Npr2p-Npr3p) subcomplex, a GAP for GTPase Gtr1p (EGOC subunit) in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; has N-terminal WD-40 repeats and a C-terminal RING motif; null suppresses cdc13-1 -S000035295 CDS YOL138C 15 65350 61325 C 2006-01-05 1996-07-31|2011-02-03 -S000005497 ORF Verified YOL137W BSC6 chromosome 15 15 65621 67114 W 2006-01-05 1996-07-31 Protein of unknown function with 8 putative transmembrane segments; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression -S000034363 CDS YOL137W 15 65621 67114 W 2006-01-05 1996-07-31 -S000005496 ORF Verified YOL136C PFK27 6-phosphofructo-2-kinase|PFK-2 chromosome 15 L000003077 15 68754 67561 C 2006-01-05 1996-07-31 6-phosphofructo-2-kinase; catalyzes synthesis of fructose-2,6-bisphosphate; inhibited by phosphoenolpyruvate and sn-glycerol 3-phosphate, expression induced by glucose and sucrose, transcriptional regulation involves protein kinase A -S000034276 CDS YOL136C 15 68754 67561 C 2006-01-05 1996-07-31 -S000005495 ORF Verified YOL135C MED7 mediator complex subunit MED7 chromosome 15 L000003916 15 70044 69376 C 2006-01-05 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation -S000034163 CDS YOL135C 15 70044 69376 C 2006-01-05 1996-07-31 -S000005493 ORF Verified YOL133W HRT1 SCF ubiquitin ligase complex subunit HRT1|HRT2|ROC1|RBX1 chromosome 15 L000004443 15 70325 70690 W 2006-01-05 1996-07-31 RING-H2 domain core subunit of multiple ubiquitin ligase complexes; subunit of Skp1-Cullin-F-box (SCF) that tethers the Cdc34p (E2) and Cdc53p (cullin) SCF subunits, and is required for degradation of Gic2p, Far1p, Sic1p and Cln2p; subunit of the Rtt101p-Mms1p-Mms22p ubiquitin ligase that stabilizes replication forks after DNA lesions; subunit of the Cul3p-Elc1p-Ela1p ubiquitin ligase involved in Rpb1p degradation as part of transcription-coupled repair -S000032132 CDS YOL133W 15 70325 70690 W 2006-01-05 1996-07-31 -S000005494 ORF Dubious YOL134C chromosome 15 15 70545 70156 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps HRT1, a verified gene that encodes an SCF ubiquitin ligase subunit -S000034069 CDS YOL134C 15 70545 70156 C 2006-01-05 1996-07-31 -S000005492 ORF Verified YOL132W GAS4 1,3-beta-glucanosyltransferase chromosome 15 15 71300 72715 W 2006-01-05 1996-07-31 1,3-beta-glucanosyltransferase; involved with Gas2p in spore wall assembly; has similarity to Gas1p; localizes to the cell wall -S000032019 CDS YOL132W 15 71300 72715 W 2006-01-05 1996-07-31 -S000118484 ARS ARS1507 ARSXV-73 chromosome 15 15 72683 72753 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178179 ARS_consensus_sequence ARS1507 15 72687 72703 W 2014-11-18 2014-11-18 -S000005491 ORF Uncharacterized YOL131W chromosome 15 15 73031 73357 W 2006-01-05 1996-07-31 Putative protein of unknown function; YOL131W has a paralog, STB1, that arose from the whole genome duplication -S000031851 CDS YOL131W 15 73031 73357 W 2006-01-05 1996-07-31 -S000005490 ORF Verified YOL130W ALR1 Mg(2+) transporter ALR1|SWC3 chromosome 15 L000002887 15 74400 76979 W 2006-01-05 1996-07-31 Plasma membrane Mg(2+) transporter; expression and turnover are regulated by Mg(2+) concentration; overexpression confers increased tolerance to Al(3+) and Ga(3+) ions; magnesium transport defect of the null mutant is functionally complemented by either of the human genes MAGT1 and TUSC3 that are not orthologous to ALR1 -S000030868 CDS YOL130W 15 74400 76979 W 2006-01-05 1996-07-31 -S000005489 ORF Verified YOL129W VPS68 chromosome 15 15 77560 78114 W 2006-01-05 1996-07-31 Vacuolar membrane protein of unknown function; involved in vacuolar protein sorting; also detected in the mitochondria -S000032156 CDS YOL129W 15 77560 78114 W 2006-01-05 1996-07-31 -S000005488 ORF Verified YOL128C YGK3 serine/threonine protein kinase YGK3 chromosome 15 15 79479 78352 C 2006-01-05 1996-07-31 Protein kinase related to mammalian GSK-3 glycogen synthase kinases; GSK-3 homologs (Mck1p, Rim11p, Mrk1p, Ygk3p) are involved in control of Msn2p-dependent transcription of stress responsive genes and in protein degradation; YGK3 has a paralog, MCK1, that arose from the whole genome duplication -S000031135 CDS YOL128C 15 79479 78352 C 2006-01-05 1996-07-31 -S000005487 ORF Verified YOL127W RPL25 uL23|ribosomal 60S subunit protein L25|L23|rpl6L|YL25|L25 chromosome 15 L000001722 15 80348 81190 W 2006-01-05 1996-07-31 Ribosomal 60S subunit protein L25; primary rRNA-binding ribosomal protein component of large ribosomal subunit; binds to 25S rRNA via a conserved C-terminal motif; homologous to mammalian ribosomal protein L23A and bacterial L23 -S000031095 CDS YOL127W 15 80348 80360 W 2006-01-05 1996-07-31 -S000031096 CDS YOL127W 15 80775 81190 W 2006-01-05 1996-07-31 -S000031097 intron YOL127W 15 80361 80774 W 2006-01-05 1996-07-31 -S000005486 ORF Verified YOL126C MDH2 malate dehydrogenase MDH2 chromosome 15 L000001046 15 82920 81787 C 2006-10-06 1996-07-31|2006-10-06 Cytoplasmic malate dehydrogenase; one of three isozymes that catalyze interconversion of malate and oxaloacetate; involved in the glyoxylate cycle and gluconeogenesis during growth on two-carbon compounds; interacts with Pck1p and Fbp1 -S000030943 CDS YOL126C 15 82920 81787 C 2006-10-06 1996-07-31|2006-10-06 -S000005485 ORF Verified YOL125W TRM13 tRNA:m4X modification enzyme chromosome 15 15 83834 85264 W 2006-01-05 1996-07-31|2011-02-03 2'-O-methyltransferase; responsible for modification of tRNA at position 4; C-terminal domain has similarity to Rossmann-fold (RFM) superfamily of RNA methyltransferases -S000030912 CDS YOL125W 15 83834 85264 W 2006-01-05 1996-07-31|2011-02-03 -S000118485 ARS ARS1508 ARSXV-85 chromosome 15 15 85270 85361 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178180 ARS_consensus_sequence ARS1508 15 85360 85344 C 2014-11-18 2014-11-18 -S000005484 ORF Verified YOL124C TRM11 tRNA (guanine-N2-)-methyltransferase chromosome 15 S000029604|S000028498 15 86757 85456 C 2006-01-05 1996-07-31 Catalytic subunit of adoMet-dependent tRNA methyltransferase complex; required for the methylation of the guanosine nucleotide at position 10 (m2G10) in tRNAs; contains a THUMP domain and a methyltransferase domain; another complex member is Trm112p -S000029846 CDS YOL124C 15 86757 85456 C 2006-01-05 1996-07-31 -S000005483 ORF Verified YOL123W HRP1 NAB5|NAB4 chromosome 15 L000003337|L000003022|L000003015 15 87844 89448 W 2006-01-05 1996-07-31 Subunit of cleavage factor I; cleavage factor I is a five-subunit complex required for the cleavage and polyadenylation of pre-mRNA 3' ends; RRM-containing heteronuclear RNA binding protein and hnRNPA/B family member that binds to poly (A) signal sequences; required for genome stability -S000037901 CDS YOL123W 15 87844 89448 W 2006-01-05 1996-07-31 -S000005482 ORF Verified YOL122C SMF1 divalent metal ion transporter SMF1|SBS1 chromosome 15 L000001931 15 91419 89692 C 2006-01-05 1996-07-31 Divalent metal ion transporter; broad specificity for di-valent and tri-valent metals; post-translationally regulated by levels of metal ions; member of the Nramp family of metal transport proteins -S000036001 CDS YOL122C 15 91419 89692 C 2006-01-05 1996-07-31 -S000005481 ORF Verified YOL121C RPS19A eS19|ribosomal 40S subunit protein S19A|S19e|rp55a|YS16A|S19A|S16aA chromosome 15 L000003299 15 92850 92026 C 2006-01-05 1996-07-31 Protein component of the small (40S) ribosomal subunit; required for assembly and maturation of pre-40 S particles; homologous to mammalian ribosomal protein S19, no bacterial homolog; mutations in human RPS19 are associated with Diamond Blackfan anemia; RPS19A has a paralog, RPS19B, that arose from the whole genome duplication -S000035838 CDS YOL121C 15 92440 92026 C 2006-01-05 1996-07-31 -S000035837 CDS YOL121C 15 92850 92831 C 2006-01-05 1996-07-31 -S000035839 intron YOL121C 15 92830 92441 C 2006-01-05 1996-07-31 -S000005480 ORF Verified YOL120C RPL18A eL18|ribosomal 60S subunit protein L18A|L18e|rp28A|L18A|RP28A chromosome 15 L000001668 15 94402 93395 C 2006-01-05 1996-07-31 Ribosomal 60S subunit protein L18A; intron of RPL18A pre-mRNA forms stem-loop structures that are a target for Rnt1p cleavage leading to degradation; homologous to mammalian ribosomal protein L18, no bacterial homolog; RPL18A has a paralog, RPL18B, that arose from the whole genome duplication -S000035727 CDS YOL120C 15 93843 93395 C 2006-01-05 1996-07-31 -S000035726 CDS YOL120C 15 94402 94291 C 2006-01-05 1996-07-31 -S000035728 intron YOL120C 15 94290 93844 C 2006-01-05 1996-07-31 -S000005479 ORF Verified YOL119C MCH4 chromosome 15 15 96361 94856 C 2006-01-05 1996-07-31 Protein with similarity to mammalian monocarboxylate permeases; monocarboxylate permeases are involved in transport of monocarboxylic acids across the plasma membrane but mutant is not deficient in monocarboxylate transport -S000036182 CDS YOL119C 15 96361 94856 C 2006-01-05 1996-07-31 -S000005478 ORF Dubious YOL118C chromosome 15 15 96916 96608 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036070 CDS YOL118C 15 96916 96608 C 2006-01-05 1996-07-31 -S000005477 ORF Verified YOL117W RRI2 CSN10 chromosome 15 S000007579 15 97551 99488 W 2006-01-05 1996-07-31 Subunit of the COP9 signalosome (CSN) complex; this complex cleaves the ubiquitin-like protein Nedd8 from SCF ubiquitin ligases; plays a role in the mating pheromone response -S000036034 CDS YOL117W 15 97551 99488 W 2006-01-05 1996-07-31 -S000005476 ORF Verified YOL116W MSN1 PHD2|MSS10|HRB382|FUP1 chromosome 15 L000001197 15 99809 100957 W 2006-01-05 1996-07-31 Transcriptional activator; involved in regulation of invertase and glucoamylase expression, invasive growth and pseudohyphal differentiation, iron uptake, chromium accumulation, and response to osmotic stress; localizes to the nucleus; relative distribution to the nucleus increases upon DNA replication stress -S000035148 CDS YOL116W 15 99809 100957 W 2006-01-05 1996-07-31 -S000005475 ORF Verified YOL115W PAP2 non-canonical poly(A) polymerase PAP2|TRF4 chromosome 15 L000002953 15 101475 103229 W 2006-01-05 1996-07-31 Non-canonical poly(A) polymerase; involved in nuclear RNA degradation as a component of TRAMP; catalyzes polyadenylation of hypomodified tRNAs, and snoRNA and rRNA precursors; required for mRNA surveillance and maintenance of genome integrity, serving as a link between RNA and DNA metabolism; overlapping but non-redundant functions with Trf5p; relocalizes to cytosol in response to hypoxia -S000035037 CDS YOL115W 15 101475 103229 W 2006-01-05 1996-07-31 -S000005474 ORF Verified YOL114C PTH4 chromosome 15 15 103925 103317 C 2006-01-05 1996-07-31 Protein similar to the human peptidyl-tRNA hydrolase gene ICT1; associates with mitochondrial large subunit; may function in translation termination; YOL114C is not an essential gene -S000034821 CDS YOL114C 15 103925 103317 C 2006-01-05 1996-07-31 -S000005473 ORF Verified YOL113W SKM1 putative serine/threonine protein kinase SKM1 chromosome 15 L000004142 15 104326 106293 W 2006-01-05 1996-07-31 Member of the PAK family of serine/threonine protein kinases; similar to Ste20p; involved in down-regulation of sterol uptake; proposed to be a downstream effector of Cdc42p during polarized growth; SKM1 has a paralog, CLA4, that arose from the whole genome duplication -S000034781 CDS YOL113W 15 104326 106293 W 2006-01-05 1996-07-31 -S000005472 ORF Verified YOL112W MSB4 Rab GTPase-activating protein MSB4 chromosome 15 L000003919 15 106710 108188 W 2006-01-05 1996-07-31 GTPase-activating protein of the Ras superfamily; acts primarily on Sec4p, localizes to the bud site and bud tip; msb3 msb4 double mutation causes defects in secretion and actin organization; similar to the TBC-domain Tre2 oncogene; MSB4 has a paralog, MSB3, that arose from the whole genome duplication; human homolog USP6NL can complement yeast msb3 msb4 double null mutant -S000033897 CDS YOL112W 15 106710 108188 W 2006-01-05 1996-07-31 -S000005471 ORF Verified YOL111C MDY2 GET5|TMA24 chromosome 15 15 108896 108258 C 2006-01-05 1996-07-31 Protein involved in inserting tail-anchored proteins into ER membranes; forms a complex with Get4p; required for efficient mating; involved in shmoo formation and nuclear migration in the pre-zygote; associates with ribosomes -S000033697 CDS YOL111C 15 108896 108258 C 2006-01-05 1996-07-31 -S000005470 ORF Verified YOL110W SHR5 ERF4 chromosome 15 L000002592 15 109176 109889 W 2006-01-05 1996-07-31 Palmitoyltransferase subunit; this complex adds a palmitoyl lipid moiety to heterolipidated substrates such as Ras1p and Ras2p through a thioester linkage; palmitoylation is required for Ras2p membrane localization; Palmitoyltransferase is composed of Shr5p and Erf2 -S000033648 CDS YOL110W 15 109176 109889 W 2006-01-05 1996-07-31 -S000005469 ORF Verified YOL109W ZEO1 chromosome 15 L000003927 15 110297 110638 W 2006-01-05 1996-07-31 Peripheral membrane protein of the plasma membrane; interacts with Mid2p; regulates the cell integrity pathway mediated by Pkc1p and Slt2p; the authentic protein is detected in a phosphorylated state in highly purified mitochondria -S000031643 CDS YOL109W 15 110297 110638 W 2006-01-05 1996-07-31 -S000006592 tRNA_gene tG(UCC)O SUF1 chromosome 15 L000002149|L000003720 15 111033 110962 C -110 2006-01-05 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000037569 noncoding_exon tG(UCC)O 15 111033 110962 C 2006-01-05 2000-05-19 -S000005468 ORF Verified YOL108C INO4 chromosome 15 L000000869 15 111886 111431 C 2006-01-05 1996-07-31 Transcription factor involved in phospholipid synthesis; required for derepression of inositol-choline-regulated genes involved in phospholipid synthesis; forms a complex, with Ino2p, that binds the inositol-choline-responsive element through a basic helix-loop-helix domain -S000030752 CDS YOL108C 15 111886 111431 C 2006-01-05 1996-07-31 -S000005467 ORF Uncharacterized YOL107W chromosome 15 15 112102 113130 W 2006-01-05 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and colocalizes in a punctate pattern with the early golgi/COPI vesicles; YOL107W is not an essential protein -S000030688 CDS YOL107W 15 112102 113130 W 2006-01-05 1996-07-31 -S000005466 ORF Dubious YOL106W chromosome 15 15 113226 113579 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030608 CDS YOL106W 15 113226 113579 W 2006-01-05 1996-07-31 -S000007150 long_terminal_repeat YOLCdelta3 chromosome 15 15 113626 113294 C 2006-01-05 2000-05-19 Ty1 LTR -S000006746 tRNA_gene tT(AGU)O1 chromosome 15 L000003701 15 113802 113874 W 2006-01-05 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000037533 noncoding_exon tT(AGU)O1 15 113802 113874 W 2006-01-05 2000-05-19 -S000118486 ARS ARS1509 ARSXV-114 chromosome 15 15 113885 113983 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178181 ARS_consensus_sequence ARS1509 15 113894 113910 W 2014-11-18 2014-11-18 -S000005465 ORF Verified YOL105C WSC3 chromosome 15 L000004218 15 115808 114138 C 2006-01-05 1996-07-31 Sensor-transducer of the stress-activated PKC1-MPK1 signaling pathway; involved in maintenance of cell wall integrity; involved in response to heat shock and other stressors; regulates 1,3-beta-glucan synthesis; WSC3 has a paralog, WSC2, that arose from the whole genome duplication -S000030500 CDS YOL105C 15 115808 114138 C 2006-01-05 1996-07-31 -S000005464 ORF Verified YOL104C NDJ1 TAM1 chromosome 15 L000003266|L000003597 15 117454 116396 C 2006-01-05 1996-07-31 Protein that regulates meiotic SPB cohesion and telomere clustering; localizes to both spindle pole bodies (SPBs) and telomeres; required for bouquet formation, effective homolog pairing, ordered cross-over distribution, sister chromatid cohesion at meiotic telomeres, chromosomal segregation and telomere-led rapid prophase movement -S000037679 CDS YOL104C 15 117454 116396 C 2006-01-05 1996-07-31 -S000007154 long_terminal_repeat YOLWdelta4 chromosome 15 15 117703 118040 W 2006-01-05 2000-05-19 Ty1 LTR -S000007161 LTR_retrotransposon YOLWTy1-1 Ty1 chromosome 15 15 117703 123628 W 2006-01-05 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007349 transposable_element_gene YOL103W-A gag protein chromosome 15 15 118000 119322 W 2006-01-05 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000030410 CDS YOL103W-A 15 118000 119322 W 2006-01-05 1999-07-17 -S000007350 transposable_element_gene YOL103W-B gag-pol fusion protein chromosome 15 S000029018 15 118000 123268 W 2006-01-05 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000030418 CDS YOL103W-B 15 118000 119304 W 2006-01-05 1999-07-17 -S000030419 CDS YOL103W-B 15 119306 123268 W 2006-01-05 1999-07-17 -S000030420 plus_1_translational_frameshift YOL103W-B 15 119305 119305 W 2006-01-05 1999-07-17 -S000007155 long_terminal_repeat YOLWdelta5 chromosome 15 15 123291 123628 W 2006-01-05 2000-05-19 Ty1 LTR -S000005463 ORF Verified YOL103W ITR2 myo-inositol transporter ITR2|HRB612 chromosome 15 L000000880 15 124001 125830 W 2006-01-05 2003-09-22|1996-07-31 Myo-inositol transporter; member of the sugar transporter superfamily; expressed constitutively; ITR2 has a paralog, ITR1, that arose from the whole genome duplication -S000037640 CDS YOL103W 15 124001 125830 W 2006-01-05 2003-09-22|1996-07-31 -S000005462 ORF Verified YOL102C TPT1 tRNA 2'-phosphotransferase chromosome 15 L000003433 15 126689 125997 C 2006-01-05 1996-07-31 tRNA 2'-phosphotransferase that catalyzes final step in tRNA splicing: the transfer of the 2'-PO(4) from the splice junction to NAD(+) to form ADP-ribose 1''-2''cyclic phosphate and nicotinamide -S000037519 CDS YOL102C 15 126689 125997 C 2006-01-05 1996-07-31 -S000005461 ORF Verified YOL101C IZH4 chromosome 15 15 127920 126982 C 2006-01-05 1996-07-31 Membrane protein involved in zinc ion homeostasis; member of the four-protein IZH family; expression induced by fatty acids and altered zinc levels; deletion reduces sensitivity to excess zinc; possible role in sterol metabolism; protein increases in abundance and relocalizes from nucleus to ER upon DNA replication stress; IZH4 has a paralog, IZH1, that arose from the whole genome duplication -S000037425 CDS YOL101C 15 127920 126982 C 2006-01-05 1996-07-31 -S000005460 ORF Verified YOL100W PKH2 serine/threonine protein kinase PKH2 chromosome 15 L000004617 15 129237 132482 W 2006-01-05 1996-07-31 Serine/threonine protein kinase; involved in sphingolipid-mediated signaling pathway that controls endocytosis; activates Ypk1p and Ykr2p, components of signaling cascade required for maintenance of cell wall integrity; contains a PH-like domain; redundant with Pkh1p; PKH2 has a paralog, PKH1, that arose from the whole genome duplication -S000032002 CDS YOL100W 15 129237 132482 W 2006-01-05 1996-07-31 -S000005459 ORF Dubious YOL099C chromosome 15 15 132508 132017 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene PKH2/YOL100W; may interact with ribosomes -S000030816 CDS YOL099C 15 132508 132017 C 2006-01-05 1996-07-31 -S000005458 ORF Verified YOL098C SDD3 chromosome 15 15 135838 132725 C 2006-01-05 1996-07-31 Putative metalloprotease; overproduction suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P -S000030730 CDS YOL098C 15 135838 132725 C 2006-01-05 1996-07-31 -S000006449 snoRNA_gene snR58 SNR58 chromosome 15 L000004527 15 136183 136088 C 2006-01-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C663 -S000030765 noncoding_exon snR58 15 136183 136088 C 2006-01-05 2000-05-19 -S000028854 ORF Uncharacterized YOL097W-A chromosome 15 15 136220 136405 W 2006-01-05 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034567 CDS YOL097W-A 15 136220 136405 W 2006-01-05 2003-07-29 -S000005457 ORF Verified YOL097C WRS1 tryptophan--tRNA ligase WRS1|HRE342 chromosome 15 L000003253 15 137825 136527 C 2006-01-05 1996-07-31 Cytoplasmic tryptophanyl-tRNA synthetase; aminoacylates tryptophanyl-tRNA; human homolog WARS can complement yeast null mutant -S000030577 CDS YOL097C 15 137825 136527 C 2006-01-05 1996-07-31 -S000005456 ORF Verified YOL096C COQ3 hexaprenyldihydroxybenzoate methyltransferase chromosome 15 L000000380 15 139045 138107 C 2006-01-05 2003-09-22|1996-07-31 O-methyltransferase; catalyzes two different O-methylation steps in ubiquinone (Coenzyme Q) biosynthesis; component of a mitochondrial ubiquinone-synthesizing complex; phosphoprotein -S000036749 CDS YOL096C 15 139045 138107 C 2006-01-05 2003-09-22|1996-07-31 -S000005455 ORF Verified YOL095C HMI1 ATP-dependent 3'-5' DNA helicase chromosome 15 L000004614 15 141347 139227 C 2006-01-05 1996-07-31 Mitochondrial inner membrane localized ATP-dependent DNA helicase; required for the maintenance of the mitochondrial genome; not required for mitochondrial transcription; has homology to E. coli helicase uvrD -S000036656 CDS YOL095C 15 141347 139227 C 2006-01-05 1996-07-31 -S000005454 ORF Verified YOL094C RFC4 replication factor C subunit 4 chromosome 15 L000001625 15 142555 141584 C 2006-01-05 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); which is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon; relocalizes to the cytosol in response to hypoxia -S000036576 CDS YOL094C 15 142555 141584 C 2006-01-05 1996-07-31 -S000005453 ORF Verified YOL093W TRM10 tRNA (guanine(9)-N(1))-methyltransferase chromosome 15 15 142815 143696 W 2006-01-05 1996-07-31 tRNA methyltransferase; methylates the N-1 position of guanine at position 9 in tRNAs; protein abundance increases in response to DNA replication stress; member of the SPOUT (SpoU-TrmD) methyltransferase family; human ortholog TRMT10A plays a role in the pathogenesis of microcephaly and early onset diabetes; an 18-mer originates from the TRM10 locus; genetic analysis shows the 18-mer is the translation regulator -S000036530 CDS YOL093W 15 142815 143696 W 2006-01-05 1996-07-31 -S000005452 ORF Verified YOL092W YPQ1 cationic amino acid transporter chromosome 15 15 144204 145130 W 2006-01-05 1996-07-31 Putative vacuolar membrane transporter for cationic amino acids; likely contributes to amino acid homeostasis by exporting cationic amino acids from the vacuole; member of the PQ-loop family, with seven transmembrane domains; similar to mammalian PQLC2 vacuolar transporter; YPQ1 has a paralog, RTC2, that arose from the whole genome duplication -S000035613 CDS YOL092W 15 144204 145130 W 2006-01-05 1996-07-31 -S000005451 ORF Verified YOL091W SPO21 MPC70 chromosome 15 L000004853 15 145334 147163 W 2006-01-05 1996-07-31 Component of the meiotic outer plaque of the spindle pole body; involved in modifying the meiotic outer plaque that is required prior to prospore membrane formation; SPO21 has a paralog, YSW1, that arose from the whole genome duplication -S000035535 CDS YOL091W 15 145334 147163 W 2006-01-05 1996-07-31 -S000005450 ORF Verified YOL090W MSH2 mismatch repair ATPase MSH2|PMS5 chromosome 15 L000001190 15 147382 150276 W -83.8 2006-01-05 1996-07-31 Protein that binds to DNA mismatches; forms heterodimers with Msh3p and Msh6p that bind to DNA mismatches to initiate the mismatch repair process; contains a Walker ATP-binding motif required for repair activity and involved in interstrand cross-link repair; Msh2p-Msh6p binds to and hydrolyzes ATP -S000035449 CDS YOL090W 15 147382 150276 W 2006-01-05 1996-07-31 -S000005449 ORF Verified YOL089C HAL9 chromosome 15 L000004704 15 153490 150398 C 2006-01-05 1996-07-31 Putative transcription factor containing a zinc finger; overexpression increases salt tolerance through increased expression of the ENA1 (Na+/Li+ extrusion pump) gene while gene disruption decreases both salt tolerance and ENA1 expression; HAL9 has a paralog, TBS1, that arose from the whole genome duplication -S000035681 CDS YOL089C 15 153490 150398 C 2006-01-05 1996-07-31 -S000005448 ORF Verified YOL088C MPD2 protein disulfide isomerase MPD2 chromosome 15 L000004182 15 154745 153912 C 2006-01-05 1996-07-31 Member of the protein disulfide isomerase (PDI) family; exhibits chaperone activity; overexpression suppresses the lethality of a pdi1 deletion but does not complement all Pdi1p functions; undergoes oxidation by Ero1p -S000034755 CDS YOL088C 15 154745 153912 C 2006-01-05 1996-07-31 -S000005447 ORF Verified YOL087C DUF1 chromosome 15 15 158637 155287 C 2006-01-05 1996-07-31 Ubiquitin-binding protein of unknown function; contains one WD40 repeat in a beta-propeller fold; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; homolog of human WDR48/UAF1, which is involved in regulating the Fanconi anemia pathway; deletion mutant is sensitive to various chemicals including phenanthroline, sanguinarine, and nordihydroguaiaretic acid -S000034693 CDS YOL087C 15 158637 155287 C 2006-01-05 1996-07-31 -S000007626 ORF Verified YOL086W-A MHF1 chromosome 15 15 159173 159445 W 2006-01-05 2001-02-26 Component of the heterotetrameric MHF histone-fold complex; in humans the MHF complex interacts with both DNA and Mph1p ortholog FANCM, a Fanconi anemia complementation group protein, to stabilize and remodel blocked replication forks and repair damaged DNA; mhf1 srs2 double mutants are MMS hypersensitive; ortholog of human centromere constitutive-associated network (CCAN) subunit CENP-S, also known as MHF1 -S000037254 CDS YOL086W-A 15 159173 159445 W 2006-01-05 2001-02-26 -S000005446 ORF Verified YOL086C ADH1 alcohol dehydrogenase ADH1|ADC1 chromosome 15 L000000041 15 160594 159548 C -86 2006-01-05 1996-07-31 Alcohol dehydrogenase; fermentative isozyme active as homo- or heterotetramers; required for the reduction of acetaldehyde to ethanol, the last step in the glycolytic pathway; ADH1 has a paralog, ADH5, that arose from the whole genome duplication -S000034629 CDS YOL086C 15 160594 159548 C 2006-01-05 1996-07-31 -S000028708 ORF Dubious YOL085W-A chromosome 15 15 161579 161791 W 2006-01-05 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YOL085C -S000032652 CDS YOL085W-A 15 161579 161791 W 2006-01-05 2003-07-29 -S000005445 ORF Uncharacterized YOL085C chromosome 15 15 162014 161673 C 2006-01-05 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOL085C is not an essential gene; partially overlaps dubious ORF YOL085W-A -S000034541 CDS YOL085C 15 162014 161673 C 2006-01-05 1996-07-31 -S000005444 ORF Verified YOL084W PHM7 chromosome 15 15 162356 165331 W 2006-01-05 1996-07-31 Protein of unknown function; expression is regulated by phosphate levels; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and vacuole; protein abundance increases in response to DNA replication stress -S000034487 CDS YOL084W 15 162356 165331 W 2006-01-05 1996-07-31 -S000005443 ORF Verified YOL083W ATG34 ATG19-B chromosome 15 15 165714 166952 W 2006-01-05 1996-07-31 Receptor protein involved in selective autophagy during starvation; specifically involved in the transport of cargo protein alpha-mannosidase (Ams1p); Atg19p paralog -S000032467 CDS YOL083W 15 165714 166952 W 2006-01-05 1996-07-31 -S000028853 ORF Dubious YOL083C-A chromosome 15 15 166601 166461 C 2006-01-05 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry -S000034566 CDS YOL083C-A 15 166601 166461 C 2006-01-05 2003-07-29 -S000118487 ARS ARS1510 ARSXV-167 chromosome 15 15 166976 167221 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178182 ARS_consensus_sequence ARS1510 15 167002 167018 W 2014-11-18 2014-11-18 -S000005442 ORF Verified YOL082W ATG19 CVT19 chromosome 15 15 168727 169974 W 2006-01-05 1996-07-31 Receptor protein for the cytoplasm-to-vacuole targeting (Cvt) pathway; delivers cargo proteins aminopeptidase I (Ape1p) and alpha-mannosidase (Ams1p) to the phagophore assembly site for packaging into Cvt vesicles; interaction with Atg19p during the Cvt pathway requires phosphorylation by Hrr25p -S000032367 CDS YOL082W 15 168727 169974 W 2006-01-05 1996-07-31 -S000005441 ORF Verified YOL081W IRA2 Ras GTPase activating protein IRA2|GLC4|CCS1 chromosome 15 L000000874 15 171070 180309 W -72 2006-01-05 1996-07-31 GTPase-activating protein; negatively regulates RAS by converting it from the GTP- to the GDP-bound inactive form, required for reducing cAMP levels under nutrient limiting conditions; IRA2 has a paralog, IRA1, that arose from the whole genome duplication; defects in human homolog NF1 are associated with neurofibromatosis -S000032260 CDS YOL081W 15 171070 180309 W 2006-01-05 1996-07-31 -S000005439 ORF Dubious YOL079W chromosome 15 15 181057 181455 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031476 CDS YOL079W 15 181057 181455 W 2006-01-05 1996-07-31 -S000005440 ORF Verified YOL080C REX4 putative 3'-5' exonuclease chromosome 15 15 181427 180558 C 2006-01-05 1996-07-31 Putative RNA exonuclease; possibly involved in pre-rRNA processing and ribosome assembly -S000031202 CDS YOL080C 15 181427 180558 C 2006-01-05 1996-07-31 -S000005438 ORF Verified YOL078W AVO1 chromosome 15 15 181682 185212 W 2006-01-05 1996-07-31 Component of a membrane-bound complex containing the Tor2p kinase; contains Tor2p kinase and other proteins; may have a role in regulation of cell growth -S000031371 CDS YOL078W 15 181682 185212 W 2006-01-05 1996-07-31 -S000007339 ORF Verified YOL077W-A ATP19 F1F0 ATP synthase subunit k chromosome 15 15 185438 185644 W 2006-01-05 1999-07-17 Subunit k of the mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; associated only with the dimeric form of ATP synthase -S000031206 CDS YOL077W-A 15 185438 185644 W 2006-01-05 1999-07-17 -S000005437 ORF Verified YOL077C BRX1 chromosome 15 15 186723 185848 C 2006-01-05 1996-07-31|2011-02-03 Nucleolar protein; constituent of 66S pre-ribosomal particles; depletion leads to defects in rRNA processing and a block in the assembly of large ribosomal subunits; possesses a sigma(70)-like RNA-binding motif -S000030456 CDS YOL077C 15 186723 185848 C 2006-01-05 1996-07-31|2011-02-03 -S000005436 ORF Verified YOL076W MDM20 NAA25|DEC1 chromosome 15 L000002975 15 187024 189414 W 2006-01-05 1996-07-31 Non-catalytic subunit of the NatB N-terminal acetyltransferase; NatB catalyzes N-acetylation of proteins with specific N-terminal sequences; involved in mitochondrial inheritance and actin assembly -S000030374 CDS YOL076W 15 187024 189414 W 2006-01-05 1996-07-31 -S000005435 ORF Verified YOL075C chromosome 15 15 193542 189658 C 2006-01-05 1999-07-17|1996-07-31|2011-02-03 Putative ABC transporter -S000030157 CDS YOL075C 15 193542 189658 C 2006-01-05 1999-07-17|1996-07-31|2011-02-03 -S000005434 ORF Verified YOL073C DSC2 chromosome 15 15 194800 193832 C 2006-01-05 1996-07-31 Multi-transmembrane subunit of the DSC ubiquitin ligase complex; similar in sequence to rhomboid pseudoproteases Der1p and UBAC2 that function in ERAD; ortholog of fission yeast dsc2 -S000036354 CDS YOL073C 15 194800 193832 C 2006-01-05 1996-07-31 -S000005433 ORF Verified YOL072W THP1 BUD29 chromosome 15 15 194970 196337 W 2006-01-05 1996-07-31 Nuclear pore-associated protein; component of TREX-2 complex (Sac3p-Thp1p-Sus1p-Cdc31p) involved in transcription elongation and mRNA export from the nucleus; involved in post-transcriptional tethering of active genes to the nuclear periphery and to non-nascent mRNP; contains a PAM domain implicated in protein-protein binding -S000036289 CDS YOL072W 15 194970 196337 W 2006-01-05 1996-07-31 -S000005432 ORF Verified YOL071W SDH5 EMI5|succinate dehydrogenase assembly factor SDH5 chromosome 15 15 196507 196995 W 2006-01-05 1996-07-31 Protein required for flavinylation of Sdh1p; binds to Sdh1p and promotes FAD cofactor attachment, which is necessary for succinate dehydrogenase (SDH) complex assembly and activity; mutations in human ortholog PGL2 are associated with neuroendocrine tumors (paraganglioma) -S000036205 CDS YOL071W 15 196507 196995 W 2006-01-05 1996-07-31 -S000005431 ORF Verified YOL070C NBA1 chromosome 15 15 198725 197220 C 2006-01-05 1996-07-31 Protein of unknown function; localizes to the bud neck and cytoplasm; interacts with Nap1p; may interact with ribosomes, based on co-purification experiments; potential Cdc28p substrate -S000035224 CDS YOL070C 15 198725 197220 C 2006-01-05 1996-07-31 -S000005430 ORF Verified YOL069W NUF2 kinetochore-associated Ndc80 complex subunit NUF2 chromosome 15 L000001286 15 198942 200297 W 2006-01-05 1996-07-31 Component of the kinetochore-associated Ndc80 complex; involved in chromosome segregation, spindle checkpoint activity, and kinetochore clustering; evolutionarily conserved; other members include Ndc80p, Nuf2p, Spc24p, and Spc25p -S000035586 CDS YOL069W 15 198942 200297 W 2006-01-05 1996-07-31 -S000005429 ORF Verified YOL068C HST1 histone deacetylase HST1 chromosome 15 L000000826 15 201879 200368 C 2006-01-05 1996-07-31 NAD(+)-dependent histone deacetylase; essential subunit of the Sum1p/Rfm1p/Hst1p complex required for ORC-dependent silencing and meiotic repression; non-essential subunit of the Set3C deacetylase complex; involved in telomere maintenance; HST1 has a paralog, SIR2, that arose from the whole genome duplication -S000035472 CDS YOL068C 15 201879 200368 C 2006-01-05 1996-07-31 -S000005428 ORF Verified YOL067C RTG1 chromosome 15 L000001783 15 202518 201985 C 2006-01-05 1996-07-31 Transcription factor (bHLH) involved in interorganelle communication; contributes to communication between mitochondria, peroxisomes, and nucleus; target of Hog1p; activated in stochastic pulses of nuclear localization -S000035434 CDS YOL067C 15 202518 201985 C 2006-01-05 1996-07-31 -S000005427 ORF Verified YOL066C RIB2 bifunctional DRAP deaminase/tRNA pseudouridine synthase RIB2|PUS8 chromosome 15 L000003026 15 204471 202696 C 2006-01-05 1996-07-31 Bifunctional DRAP deaminase tRNA:pseudouridine synthase; the deaminase catalyzes the third step in riboflavin biosynthesis and the synthase catalyzes formation of pseudouridine at position 32 in cytoplasmic tRNAs; RIB2 has a paralog, PUS9, that arose from the whole genome duplication -S000035357 CDS YOL066C 15 204471 202696 C 2006-01-05 1996-07-31 -S000005426 ORF Verified YOL065C INP54 phosphoinositide 5-phosphatase INP54 chromosome 15 L000004299 15 205885 204731 C 2006-01-05 1996-07-31 Phosphatidylinositol 4,5-bisphosphate 5-phosphatase; role in secretion; localizes to the endoplasmic reticulum via the C-terminal tail; lacks the Sac1 domain and proline-rich region found in the other 3 INP proteins -S000034381 CDS YOL065C 15 205885 204731 C 2006-01-05 1996-07-31 -S000005425 ORF Verified YOL064C MET22 3'(2'),5'-bisphosphate nucleotidase|HAL2 chromosome 15 L000001090 15 207176 206103 C 2006-01-05 1996-07-31 Bisphosphate-3'-nucleotidase; involved in salt tolerance and methionine biogenesis; dephosphorylates 3'-phosphoadenosine-5'-phosphate and 3'-phosphoadenosine-5'-phosphosulfate, intermediates of the sulfate assimilation pathway; human homolog BPNT1 complements yeast null mutant -S000034318 CDS YOL064C 15 207176 206103 C 2006-01-05 1996-07-31 -S000005424 ORF Verified YOL063C CRT10 HUS1 chromosome 15 15 210265 207392 C 2006-01-05 1996-07-31 Protein involved in transcriptional regulation of RNR2 and RNR3; expression of the gene is induced by DNA damage and null mutations confer increased resistance to hydroxyurea; N-terminal region has a leucine repeat and a WD40 repeat -S000034270 CDS YOL063C 15 210265 207392 C 2006-01-05 1996-07-31 -S000005423 ORF Verified YOL062C APM4 AMP1 chromosome 15 L000003288 15 211995 210520 C 2006-01-05 1996-07-31 Cargo-binding mu subunit of AP-2; AP-2 is a heterotetrameric endocytic cargo-binding adaptor that facilitates uptake of membrane proteins during clathrin-mediated endocytosis; Apm4p is required for AP-2 function and localization, and binds cell wall stress receptor Mid2p; AP-2 is required for cell polarity responses to pheromone, nutritional status and cell wall damage in S. cerevisiae, and for hyphal growth in C. albicans; AP-2 complex is conserved in mammals -S000034160 CDS YOL062C 15 211995 210520 C 2006-01-05 1996-07-31 -S000005422 ORF Verified YOL061W PRS5 ribose phosphate diphosphokinase subunit PRS5 chromosome 15 L000004120 15 212244 213734 W 2006-01-05 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase; synthesizes PRPP, which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes; forms cytoplasmic foci upon DNA replication stress -S000034100 CDS YOL061W 15 212244 213734 W 2006-01-05 1996-07-31 -S000005421 ORF Verified YOL060C MAM3 chromosome 15 15 216137 214017 C 2006-01-05 1996-07-31 Protein required for normal mitochondrial morphology; has similarity to hemolysins -S000032070 CDS YOL060C 15 216137 214017 C 2006-01-05 1996-07-31 -S000005420 ORF Verified YOL059W GPD2 glycerol-3-phosphate dehydrogenase (NAD(+)) GPD2|GPD3 chromosome 15 L000000723|L000003160 15 217126 218448 W 2006-01-05 1996-07-31 NAD-dependent glycerol 3-phosphate dehydrogenase; expression is controlled by an oxygen-independent signaling pathway required to regulate metabolism under anoxic conditions; located in cytosol and mitochondria; constitutively active but is inactivated via phosphorylation by energy-stress responsive kinase SNF1; GPD2 has a paralog, GPD1, that arose from the whole genome duplication -S000032438 CDS YOL059W 15 217126 218448 W 2006-01-05 1996-07-31 -S000005419 ORF Verified YOL058W ARG1 argininosuccinate synthase|ARG10 chromosome 15 L000000107 15 219211 220473 W -56 2011-02-03 1996-07-31|2011-02-03 Arginosuccinate synthetase; catalyzes the formation of L-argininosuccinate from citrulline and L-aspartate in the arginine biosynthesis pathway; potential Cdc28p substrate -S000032317 CDS YOL058W 15 219211 220473 W 2011-02-03 1996-07-31|2011-02-03 -S000005418 ORF Verified YOL057W dipeptidyl-peptidase III chromosome 15 15 220767 222902 W 2011-02-03 1996-07-31 Dipeptidyl-peptidase III; cleaves dipeptides from the amino terminus of target proteins; highly active on synthetic substrate Arg-Arg-2-naphthylamide; mammalian ortholog may be a biomarker for some cancers -S000032234 CDS YOL057W 15 220767 222902 W 2011-02-03 1996-07-31 -S000005417 ORF Verified YOL056W GPM3 phosphoglycerate mutase family protein GPM3 chromosome 15 L000002980 15 223268 224179 W 2011-02-03 1996-07-31 Homolog of Gpm1p phosphoglycerate mutase; converts 3-phosphoglycerate to 2-phosphoglycerate in glycolysis; may be non-functional; GPM3 has a paralog, GPM2, that arose from the whole genome duplication -S000032154 CDS YOL056W 15 223268 224179 W 2011-02-03 1996-07-31 -S000005416 ORF Verified YOL055C THI20 trifunctional hydroxymethylpyrimidine kinase/phosphomethylpyrimidine kinase/thiaminase chromosome 15 15 226075 224420 C 2011-02-03 1996-07-31 Trifunctional enzyme of thiamine biosynthesis, degradation and salvage; has hydroxymethylpyrimidine (HMP) kinase, HMP-phosphate (HMP-P) kinase and thiaminase activities; member of a gene family with THI21 and THI22; HMP and HMP-P kinase activity redundant with Thi21p -S000031133 CDS YOL055C 15 226075 224420 C 2011-02-03 1996-07-31 -S000006586 tRNA_gene tG(GCC)O1 chromosome 15 L000003719 15 226681 226611 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000031599 noncoding_exon tG(GCC)O1 15 226681 226611 C 2011-02-03 2000-05-19 -S000007158 long_terminal_repeat YOLWsigma1 chromosome 15 15 226696 227037 W 2011-02-03 2000-05-19 Ty3 LTR -S000007156 long_terminal_repeat YOLWdelta6 chromosome 15 15 227096 227293 W 2011-02-03 2000-05-19 Ty1 LTR -S000007151 long_terminal_repeat YOLCdelta7 chromosome 15 15 228178 227851 C 2011-02-03 2000-05-19 Ty1 LTR -S000006675 tRNA_gene tN(GUU)O1 chromosome 15 L000003702 15 228331 228404 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000035637 noncoding_exon tN(GUU)O1 15 228331 228404 W 2011-02-03 2000-05-19 -S000005415 ORF Verified YOL054W PSH1 ubiquitin-protein ligase PSH1 chromosome 15 15 228614 229834 W 2011-02-03 1996-07-31 E3 ubiquitin ligase targeting centromere-binding protein Cse4p; mediates polyubiquitination and degradation of histone H3 variant Cse4p, preventing its mislocalization to euchromatin independent of Slx5p; ubiquitination of Cse4p may be antagonized by Scm3p -S000031092 CDS YOL054W 15 228614 229834 W 2011-02-03 1996-07-31 -S000005414 ORF Verified YOL053W AIM39 chromosome 15 15 230085 231272 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays elevated frequency of mitochondrial genome loss -S000030999 CDS YOL053W 15 230085 231272 W 2011-02-03 1996-07-31 -S000005413 ORF Verified YOL052C-A DDR2 YOL053C-A|DDRA2 chromosome 15 L000003478 15 231755 231570 C 2011-02-03 1996-07-31 Multi-stress response protein; expression is activated by a variety of xenobiotic agents and environmental or physiological stresses; DDR2 has a paralog, HOR7, that arose from the whole genome duplication -S000035236 CDS YOL052C-A 15 231755 231570 C 2011-02-03 1996-07-31 -S000005412 ORF Verified YOL052C SPE2 adenosylmethionine decarboxylase SPE2 chromosome 15 L000001994 15 233636 232446 C -58 2011-02-03 1996-07-31 S-adenosylmethionine decarboxylase; required for the biosynthesis of spermidine and spermine; cells lacking Spe2p require spermine or spermidine for growth in the presence of oxygen but not when grown anaerobically -S000029956 CDS YOL052C 15 233636 232446 C 2011-02-03 1996-07-31 -S000081375 snoRNA_gene snR81 SNR81 chromosome 15 15 234346 234546 W 2011-02-03 2006-01-24 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U1052, constitutive pseudouridylation of U2 snRNA (LSR1) at position 42, and stress-induced U2 pseudouridylation at position 93 -S000114173 noncoding_exon snR81 15 234346 234546 W 2011-02-03 2006-01-24 -S000005411 ORF Verified YOL051W GAL11 MED15|ABE1|SPT13|SDS4|RAR3 chromosome 15 L000000664 15 234940 238185 W -53 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; affects transcription by acting as target of activators and repressors; forms part of the tail domain of mediator -S000029897 CDS YOL051W 15 234940 238185 W 2011-02-03 1996-07-31 -S000005410 ORF Dubious YOL050C chromosome 15 15 238202 237882 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps verified gene GAL11; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) -S000037840 CDS YOL050C 15 238202 237882 C 2011-02-03 1996-07-31 -S000005409 ORF Verified YOL049W GSH2 glutathione synthase chromosome 15 L000003548 15 238619 240094 W 2011-02-03 1996-07-31 Glutathione synthetase; catalyzes the ATP-dependent synthesis of glutathione (GSH) from gamma-glutamylcysteine and glycine; induced by oxidative stress and heat shock -S000037056 CDS YOL049W 15 238619 240094 W 2011-02-03 1996-07-31 -S000005408 ORF Verified YOL048C RRT8 chromosome 15 15 241310 240204 C 2011-02-03 2003-09-27|1996-07-31 Protein involved in spore wall assembly; shares similarity with Lds1p and Lds2p and a strain mutant for all 3 genes exhibits reduced dityrosine fluorescence relative to the single mutants; identified in a screen for mutants with increased levels of rDNA transcription; green fluorescent protein (GFP)-fusion protein localizes to lipid particles; protein abundance increases in response to DNA replication stress -S000036368 CDS YOL048C 15 240947 240204 C 2011-02-03 2003-09-27 -S000036367 CDS YOL048C 15 241310 241026 C 2011-02-03 2003-09-27|1996-07-31 -S000036369 intron YOL048C 15 241025 240948 C 2011-02-03 2003-09-27 -S000005407 ORF Verified YOL047C LDS2 chromosome 15 15 242747 241614 C 2011-02-03 2000-07-14|1996-07-31 Protein Involved in spore wall assembly; localizes to lipid droplets found on or outside of the prospore membrane; shares similarity with Lds1p and Rrt8p, and a strain mutant for all 3 genes exhibits reduced dityrosine fluorescence relative to the single mutants; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000036270 CDS YOL047C 15 242441 241614 C 2011-02-03 2000-07-14|1996-07-31 -S000036269 CDS YOL047C 15 242747 242505 C 2011-02-03 2000-07-14|1996-07-31 -S000036271 intron YOL047C 15 242504 242442 C 2011-02-03 2000-07-14|1996-07-31 -S000005405 ORF Verified YOL045W PSK2 serine/threonine protein kinase PSK2 chromosome 15 15 243497 246802 W 2011-02-03 1996-07-31 PAS-domain containing serine/threonine protein kinase; regulates sugar flux and translation in response to an unknown metabolite by phosphorylating Ugp1p and Gsy2p (sugar flux) and Caf20p, Tif11p and Sro9p (translation); PSK2 has a paralog, PSK1, that arose from the whole genome duplication -S000036127 CDS YOL045W 15 243497 246802 W 2011-02-03 1996-07-31 -S000005406 ORF Dubious YOL046C chromosome 15 15 244140 243466 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene PSK2/YOL045W -S000036179 CDS YOL046C 15 244140 243466 C 2011-02-03 1996-07-31 -S000005404 ORF Verified YOL044W PEX15 PAS21 chromosome 15 L000003971 15 247150 248301 W 2011-02-03 1996-07-31 Tail-anchored type II integral peroxisomal membrane protein; required for peroxisome biogenesis; cells lacking Pex15p mislocalize peroxisomal matrix proteins to cytosol; overexpression results in impaired peroxisome assembly -S000036032 CDS YOL044W 15 247150 248301 W 2011-02-03 1996-07-31 -S000005403 ORF Verified YOL043C NTG2 bifunctional N-glycosylase/AP lyase NTG2|SCR2 chromosome 15 L000004115 15 249534 248392 C 2011-02-03 1996-07-31 DNA N-glycosylase and apurinic/apyrimidinic (AP) lyase; involved in base excision repair, localizes to the nucleus; sumoylated; NTG2 has a paralog, NTG1, that arose from the whole genome duplication -S000035085 CDS YOL043C 15 249534 248392 C 2011-02-03 1996-07-31 -S000005402 ORF Verified YOL042W NGL1 RNA exonuclease chromosome 15 15 249825 250916 W 2011-02-03 1996-07-31 Putative endonuclease; has a domain similar to a magnesium-dependent endonuclease motif in mRNA deadenylase Ccr4p; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000035032 CDS YOL042W 15 249825 250916 W 2011-02-03 1996-07-31 -S000005401 ORF Verified YOL041C NOP12 chromosome 15 S000007491 15 252646 251267 C 2011-02-03 1996-07-31 Nucleolar protein involved in pre-25S rRNA processing; also involved in biogenesis of large 60S ribosomal subunit; contains an RNA recognition motif (RRM); binds to Ebp2; similar to Nop13p and Nsr1p -S000034818 CDS YOL041C 15 252646 251267 C 2011-02-03 1996-07-31 -S000005400 ORF Verified YOL040C RPS15 uS19|ribosomal 40S subunit protein S15|S19|rp52|S21|S15|RPS21 chromosome 15 L000002709|L000001759 15 253577 253149 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S15 and bacterial S19 -S000033943 CDS YOL040C 15 253577 253149 C 2011-02-03 1996-07-31 -S000005399 ORF Verified YOL039W RPP2A P2A|ribosomal protein P2A|RPLA2|RPL44 chromosome 15 L000001733|L000001735|L000002820 15 254297 254617 W 2011-02-03 1996-07-31 Ribosomal protein P2 alpha; a component of the ribosomal stalk, which is involved in the interaction between translational elongation factors and the ribosome; free (non-ribosomal) P2 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; regulates the accumulation of P1 (Rpp1Ap and Rpp1Bp) in the cytoplasm -S000032787 CDS YOL039W 15 254297 254617 W 2011-02-03 1996-07-31 -S000028812 ORF Uncharacterized YOL038C-A chromosome 15 15 255021 254926 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE analysis -S000033612 CDS YOL038C-A 15 255021 254926 C 2011-02-03 2003-07-29 -S000005398 ORF Verified YOL038W PRE6 proteasome core particle subunit alpha 4 chromosome 15 L000001488 15 255337 256101 W 2011-02-03 1996-07-31 Alpha 4 subunit of the 20S proteasome; may replace alpha 3 subunit (Pre9p) under stress conditions to create a more active proteasomal isoform; GFP-fusion protein relocates from cytosol to the mitochondrial surface upon oxidative stress -S000031873 CDS YOL038W 15 255337 256101 W 2011-02-03 1996-07-31 -S000005396 ORF Uncharacterized YOL036W chromosome 15 15 256745 259030 W 2011-02-03 1996-07-31 Protein of unknown function; potential Cdc28p substrate; YOL036W has a paralog, YIR016W, that arose from the whole genome duplication -S000031637 CDS YOL036W 15 256745 259030 W 2011-02-03 1996-07-31 -S000005397 ORF Dubious YOL037C chromosome 15 15 257019 256666 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOL036W -S000031673 CDS YOL037C 15 257019 256666 C 2011-02-03 1996-07-31 -S000005395 ORF Dubious YOL035C chromosome 15 15 259105 258803 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030751 CDS YOL035C 15 259105 258803 C 2011-02-03 1996-07-31 -S000006441 snoRNA_gene snR50 SNR50 chromosome 15 L000004519 15 259489 259578 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G867 -S000030731 noncoding_exon snR50 15 259489 259578 W 2011-02-03 2000-05-19 -S000005394 ORF Verified YOL034W SMC5 DNA repair ATPase SMC5 chromosome 15 15 259923 263204 W 2011-02-03 1996-07-31 Subunit of the SMC5-SMC6 complex; the SMC5-SMC6 complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; binds single-stranded DNA and has ATPase activity; supports nucleolar function; S. pombe homolog forms a heterodimer with S. pombe Rad18p that is involved in DNA repair -S000030687 CDS YOL034W 15 259923 263204 W 2011-02-03 1996-07-31 -S000005393 ORF Verified YOL033W MSE1 glutamate--tRNA ligase MSE1 chromosome 15 L000002617 15 263475 265085 W 2011-02-03 1996-07-31 Mitochondrial glutamyl-tRNA synthetase; predicted to be palmitoylated -S000030607 CDS YOL033W 15 263475 265085 W 2011-02-03 1996-07-31 -S000005392 ORF Verified YOL032W OPI10 chromosome 15 15 265429 266169 W 2011-02-03 1996-07-31 Protein with a possible role in phospholipid biosynthesis; null mutant displays an inositol-excreting phenotype that is suppressed by exogenous choline; protein abundance increases in response to DNA replication stress -S000030531 CDS YOL032W 15 265429 266169 W 2011-02-03 1996-07-31 -S000005391 ORF Verified YOL031C SIL1 SLS1 chromosome 15 15 267529 266264 C 2011-02-03 1996-07-31 Nucleotide exchange factor for the ER lumenal Hsp70 chaperone Kar2p; required for protein translocation into the endoplasmic reticulum (ER); homolog of Yarrowia lipolytica SLS1; GrpE-like protein -S000037678 CDS YOL031C 15 267529 266264 C 2011-02-03 1996-07-31 -S000005390 ORF Verified YOL030W GAS5 1,3-beta-glucanosyltransferase chromosome 15 15 268187 269641 W 2011-02-03 1996-07-31 1,3-beta-glucanosyltransferase; has similarity to Gas1p; localizes to the cell wall -S000037638 CDS YOL030W 15 268187 269641 W 2011-02-03 1996-07-31 -S000005389 ORF Uncharacterized YOL029C chromosome 15 15 270420 269815 C 2011-02-03 1996-07-31 Putative protein of unknown function; identified as interacting with Hsc82p and Hsp82p in high-throughput two-hybrid screens -S000036601 CDS YOL029C 15 270420 269815 C 2011-02-03 1996-07-31 -S000005388 ORF Verified YOL028C YAP7 chromosome 15 L000004347 15 271370 270633 C 2011-02-03 1996-07-31 Putative basic leucine zipper (bZIP) transcription factor; YAP7 has a paralog, YAP5, that arose from the whole genome duplication -S000036521 CDS YOL028C 15 271370 270633 C 2011-02-03 1996-07-31 -S000005387 ORF Verified YOL027C MDM38 ribosome-binding protein MDM38|MKH1 chromosome 15 15 273724 272003 C 2011-02-03 1996-07-31 Mitochondrial protein; forms a complex with Mba1p to facilitate recruitment of mRNA-specific translational activators to ribosomes; roles in protein export and K+/H+ exchange; human ortholog Letm1 implicated in Wolf-Hirschhorn syndrome -S000036426 CDS YOL027C 15 273724 272003 C 2011-02-03 1996-07-31 -S000005386 ORF Verified YOL026C MIM1 TOM13 chromosome 15 15 274353 274012 C 2011-02-03 1996-07-31 Mitochondrial protein required for outer membrane protein import; cooperates with Tom70p to import the subset of proteins with multiple alpha-helical transmembrane segments, including Ugo1p, Tom20p, and others; present in a complex with Mim2p in the outer membrane that may create a local environment to facilitate membrane insertion of substrate proteins; also has a role in assembly of Tom20p into the TOM complex -S000036344 CDS YOL026C 15 274353 274012 C 2011-02-03 1996-07-31 -S000006733 tRNA_gene tS(GCU)O chromosome 15 L000003703 15 274673 274773 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000037500 intron tS(GCU)O 15 274710 274728 W 2011-02-03 2000-05-19 -S000037498 noncoding_exon tS(GCU)O 15 274673 274709 W 2011-02-03 2000-05-19 -S000037499 noncoding_exon tS(GCU)O 15 274729 274773 W 2011-02-03 2000-05-19 -S000005385 ORF Verified YOL025W LAG2 ECM36 chromosome 15 L000003402 15 274957 276939 W 2011-02-03 1996-07-31|1997-07-27 Protein that negatively regulates the SCF E3-ubiquitin ligase; regulates by interacting with and preventing neddyation of the cullin subunit, Cdc53p; longevity determinant that is preferentially expressed in young cells; similar to mammalian Cand1 -S000035469 CDS YOL025W 15 274957 276939 W 2011-02-03 1997-07-27|1996-07-31 -S000005384 ORF Uncharacterized YOL024W chromosome 15 15 277086 277604 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to have thiol-disulfide oxidoreductase active site; YOL024W has a paralog, IGD1, that arose from the whole genome duplication -S000035404 CDS YOL024W 15 277086 277604 W 2011-02-03 1996-07-31 -S000118488 ARS ARS1511 ARSXV-278 chromosome 15 15 277530 277778 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication capacity dependent upon Sum1p -S000178183 ARS_consensus_sequence ARS1511 15 277733 277717 C 2014-11-18 2014-11-18 -S000005383 ORF Verified YOL023W IFM1 translation initiation factor 2 chromosome 15 L000000854 15 278056 280086 W 2011-02-03 1996-07-31 Mitochondrial translation initiation factor 2 -S000035326 CDS YOL023W 15 278056 280086 W 2011-02-03 1996-07-31 -S000005382 ORF Verified YOL022C TSR4 chromosome 15 15 281498 280272 C 2011-02-03 1996-07-31|2011-02-03 Cytoplasmic protein required for correct processing of 20S pre-rRNA; protein required for processing of the 20S pre-rRNA at site D to generate mature 18S rRNA; essential gene in S288C background but not in CEN.PK2 -S000035200 CDS YOL022C 15 281498 280272 C 2011-02-03 1996-07-31|2011-02-03 -S000006587 tRNA_gene tG(GCC)O2 SUF17 chromosome 15 L000002164|L000003704 15 282164 282234 W -53 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000031601 noncoding_exon tG(GCC)O2 15 282164 282234 W 2011-02-03 2000-05-19 -S000005381 ORF Verified YOL021C DIS3 exosome catalytic subunit DIS3|MTR17|RRP44 chromosome 15 L000003486 15 285426 282421 C 2011-02-03 1996-07-31 Exosome core complex catalytic subunit; has both endonuclease and 3'-5' exonuclease activity; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; role in degradation of tRNAs; similar to E. coli RNase R and to human DIS3, which partially complements dis3-81 heat sensitivity; mutations in Dis3p analogous to human mutations implicated in multiple myeloma impair exosome function; protein abundance increases under to DNA replication stress -S000034208 CDS YOL021C 15 285426 282421 C 2011-02-03 1996-07-31 -S000005380 ORF Verified YOL020W TAT2 aromatic amino acid transmembrane transporter TAT2|TAP2|SCM2|SAB2|LTG3 chromosome 15 L000002263|L000000956|L000001813 15 286172 287950 W 2011-02-03 1996-07-31 High affinity tryptophan and tyrosine permease; overexpression confers FK506 and FTY720 resistance -S000034169 CDS YOL020W 15 286172 287950 W 2011-02-03 1996-07-31 -S000006785 tRNA_gene tY(GUA)O SUP3 chromosome 15 L000003705|L000002182 15 288192 288280 W -16 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000034708 intron tY(GUA)O 15 288231 288244 W 2011-02-03 2000-05-19 -S000034706 noncoding_exon tY(GUA)O 15 288192 288230 W 2011-02-03 2000-05-19 -S000034707 noncoding_exon tY(GUA)O 15 288245 288280 W 2011-02-03 2000-05-19 -S000028707 ORF Uncharacterized YOL019W-A chromosome 15 15 288420 288572 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032650 CDS YOL019W-A 15 288420 288572 W 2011-02-03 2003-07-29 -S000005379 ORF Uncharacterized YOL019W TOS7 chromosome 15 15 288898 290553 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and vacuole; YOL019W has a paralog, DCV1, that arose from the whole genome duplication -S000033133 CDS YOL019W 15 288898 290553 W 2011-02-03 1996-07-31 -S000005378 ORF Verified YOL018C TLG2 chromosome 15 L000004228 15 292074 290881 C 2011-02-03 1996-07-31 Syntaxin-like t-SNARE; forms a complex with Tlg1p and Vti1p and mediates fusion of endosome-derived vesicles with the late Golgi; required along with VPS45 for an early step of the constitutive CVT pathway; interactions with Vps45 prevents Tlg2p degradation, and facilitates t-SNARE complex formation; homologous to mammalian SNARE protein syntaxin 16 (Sx16) -S000032218 CDS YOL018C 15 292074 290881 C 2011-02-03 1996-07-31 -S000005377 ORF Verified YOL017W ESC8 chromosome 15 15 292529 294673 W 2011-02-03 1996-07-31 Protein involved in telomeric and mating-type locus silencing; interacts with Sir2p and also interacts with Gal11p, which is a component of the RNA pol II mediator complex; ESC8 has a paralog, IOC3, that arose from the whole genome duplication -S000032174 CDS YOL017W 15 292529 294673 W 2011-02-03 1996-07-31 -S000005376 ORF Verified YOL016C CMK2 calmodulin-dependent protein kinase CMK2 chromosome 15 L000000367 15 296120 294777 C 2011-02-03 1996-07-31 Calmodulin-dependent protein kinase; may play a role in stress response, many CA++/calmodulan dependent phosphorylation substrates demonstrated in vitro, amino acid sequence similar to mammalian Cam Kinase II; CMK2 has a paralog, CMK1, that arose from the whole genome duplication -S000032049 CDS YOL016C 15 296120 294777 C 2011-02-03 1996-07-31 -S000005375 ORF Verified YOL015W IRC10 chromosome 15 15 297078 298838 W 2011-02-03 1996-07-31 Protein of unknown function; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane during meiosis II; null mutant displays increased levels of spontaneous Rad52p foci -S000032011 CDS YOL015W 15 297078 298838 W 2011-02-03 1996-07-31 -S000005374 ORF Uncharacterized YOL014W chromosome 15 15 299693 300067 W 2011-02-03 1996-07-31 Putative protein of unknown function; mCherry fusion protein localizes to the cytosol and nucleus -S000031065 CDS YOL014W 15 299693 300067 W 2011-02-03 1996-07-31 -S000007252 ORF Dubious YOL013W-B YOL013W-A chromosome 15 15 300690 300980 W 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the long terminal repeat (LTR) of a Ty1 element -S000033838 CDS YOL013W-B 15 300690 300980 W 2011-02-03 1999-07-17 -S000007152 long_terminal_repeat YOLCdelta8 chromosome 15 15 301021 300683 C 2011-02-03 2000-05-19 Ty1 LTR -S000028811 ORF Uncharacterized YOL013W-A YOL013W-B chromosome 15 15 301047 301238 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE -S000033611 CDS YOL013W-A 15 301047 301238 W 2011-02-03 2003-07-29 -S000006687 tRNA_gene tP(UGG)O1 chromosome 15 L000003706 15 301097 301198 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin -S000031042 intron tP(UGG)O1 15 301133 301162 W 2011-02-03 2000-05-19 -S000031040 noncoding_exon tP(UGG)O1 15 301097 301132 W 2011-02-03 2000-05-19 -S000031041 noncoding_exon tP(UGG)O1 15 301163 301198 W 2011-02-03 2000-05-19 -S000005373 ORF Verified YOL013C HRD1 E3 ubiquitin-protein ligase HRD1|DER3 chromosome 15 L000002963 15 303035 301380 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase involved in ER-associated degradation (ERAD) of misfolded proteins; upon autoubiquitination triggers retrotranslocation of misfolded proteins to cytosol for degradation; genetically linked to the unfolded protein response (UPR); regulated through association with Hrd3p; contains an H2 ring finger; likely plays a general role in targeting proteins that persistently associate with and potentially obstruct the ER-localized translocon -S000030928 CDS YOL013C 15 303035 301380 C 2011-02-03 1996-07-31 -S000005372 ORF Verified YOL012C HTZ1 histone H2AZ|H2AZ|H2A.F/Z|HTA3 chromosome 15 L000003930|L000004094 15 303983 303579 C 2011-02-03 1996-07-31 Histone variant H2AZ; exchanged for histone H2A in nucleosomes by the SWR1 complex; involved in transcriptional regulation through prevention of the spread of silent heterochromatin; Htz1p-containing nucleosomes facilitate RNA Pol II passage by affecting correct assembly and modification status of RNA Pol II elongation complexes and by favoring efficient nucleosome remodeling -S000030851 CDS YOL012C 15 303983 303579 C 2011-02-03 1996-07-31 -S000005371 ORF Verified YOL011W PLB3 lysophospholipase chromosome 15 S000007426 15 305349 307409 W 2011-02-03 1996-07-31 Phospholipase B (lysophospholipase) involved in lipid metabolism; hydrolyzes phosphatidylinositol and phosphatidylserine and displays transacylase activity in vitro; PLB3 has a paralog, PLB1, that arose from the whole genome duplication -S000030818 CDS YOL011W 15 305349 307409 W 2011-02-03 1996-07-31 -S000005370 ORF Verified YOL010W RCL1 rRNA-processing endoribonuclease chromosome 15 15 307938 309041 W 2011-02-03 1996-07-31 Endonuclease that cleaves pre-rRNA at site A2 for 18S rRNA biogenesis; subunit of U3-containing 90S preribosome processome complex involved in small ribosomal subunit assembly; stimulates Bms1p GTPase and U3 binding activity; similar to RNA cyclase-like proteins but no cyclase activity detected -S000037888 CDS YOL010W 15 307938 309041 W 2011-02-03 1996-07-31 -S000130135 ARS ARS1512 ARSXV-309 chromosome 15 15 309359 309925 2011-02-03 2009-05-05 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000005369 ORF Verified YOL009C MDM12 ERMES complex subunit MDM12 chromosome 15 L000002933 15 310139 309324 C 2011-02-03 1996-07-31 Mitochondrial outer membrane protein, ERMES complex subunit; required for transmission of mitochondria to daughter cells; required for mitophagy; may influence import and assembly of outer membrane beta-barrel proteins; ERMES complex is often co-localized with peroxisomes and with concentrated areas of pyruvate dehydrogenase -S000037008 CDS YOL009C 15 310139 309324 C 2011-02-03 1996-07-31 -S000005368 ORF Verified YOL008W COQ10 ubiquinone-binding protein COQ10 chromosome 15 15 310312 310935 W 2011-02-03 1996-07-31 Coenzyme Q (ubiquinone) binding protein; functions in the delivery of Q6 to its proper location for electron transport during respiration; START domain protein with homologs in bacteria and eukaryotes; respiratory growth defect of the null mutant is functionally complemented by human COQ10A -S000036984 CDS YOL008W 15 310312 310935 W 2011-02-03 1996-07-31 -S000005367 ORF Verified YOL007C CSI2 chromosome 15 L000004387 15 312367 311342 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)- fusion protein localizes to the mother side of the bud neck and the vacuole; YOL007C is not an essential gene -S000036219 CDS YOL007C 15 312367 311342 C 2011-02-03 1996-07-31 -S000005366 ORF Verified YOL006C TOP1 DNA topoisomerase 1|MAK17|MAK1 chromosome 15 L000002319 15 315387 313078 C 3 2011-02-03 1996-07-31 Topoisomerase I; nuclear enzyme that relieves torsional strain in DNA by cleaving and re-sealing the phosphodiester backbone; relaxes both positively and negatively supercoiled DNA; functions in replication, transcription, and recombination; role in processing ribonucleoside monophosphates in genomic DNA into irreversible single-strand breaks; enzymatic activity and interaction with Nsr1p are negatively regulated by polyphosphorylation -S000036071 CDS YOL006C 15 315387 313078 C 2011-02-03 1996-07-31 -S000005365 ORF Verified YOL005C RPB11 DNA-directed RNA polymerase II core subunit RPB11|B12.5 chromosome 15 L000001685 15 316175 315813 C 2011-02-03 1996-07-31 RNA polymerase II subunit B12.5; part of central core; similar to Rpc19p and bacterial alpha subunit -S000035928 CDS YOL005C 15 316175 315813 C 2011-02-03 1996-07-31 -S000005364 ORF Verified YOL004W SIN3 transcriptional regulator SIN3|UME4|SDS16|SDI1|RPD1|GAM2|CPE1 chromosome 15 L000001695 15 316938 321548 W 1 2011-02-03 1996-07-31 Component of both the Rpd3S and Rpd3L histone deacetylase complexes; involved in transcriptional repression and activation of diverse processes, including mating-type switching and meiosis; involved in the maintenance of chromosomal integrity -S000035863 CDS YOL004W 15 316938 321548 W 2011-02-03 1996-07-31 -S000005363 ORF Verified YOL003C PFA4 palmitoyltransferase PFA4 chromosome 15 15 322994 321858 C 2011-02-03 1996-07-31 Palmitoyltransferase with autoacylation activity; required for palmitoylation of amino acid permeases containing a C-terminal Phe-Trp-Cys site; required for modification of Chs3p; member of the DHHC family of putative palmitoyltransferases -S000034853 CDS YOL003C 15 322994 321858 C 2011-02-03 1996-07-31 -S000005362 ORF Verified YOL002C IZH2 PAQR-type receptor|PHO36 chromosome 15 15 324364 323411 C 2011-02-03 2003-01-09|1996-07-31 Plasma membrane receptor for plant antifungal osmotin; involved in zinc ion homeostasis, apoptosis; negatively regulates ZRT1 and other functionally divergent genes through CCCTC promoter motif (IzRE); modulates FET3 activity in iron-independent manner; affects gene expression by influencing balance of competition between Msn2p/Msn4p and Nrg1p/Nrg2p for binding to IzRE; transcription regulated by Zap1p, zinc, fatty acid levels; homolog of mammalian adiponectin receptor -S000034704 CDS YOL002C 15 324364 323411 C 2011-02-03 2003-01-09|1996-07-31 -S000005361 ORF Verified YOL001W PHO80 phoR|VAC5|TUP7|AGS3 chromosome 15 L000001426 15 325249 326130 W -1 2011-02-03 1996-07-31 Cyclin; interacts with cyclin-dependent kinase Pho85p; regulates the response to nutrient levels and environmental conditions, including the response to phosphate limitation and stress-dependent calcium signaling -S000034656 CDS YOL001W 15 325249 326130 W 2011-02-03 1996-07-31 -S000006476 centromere CEN15 CEN15 chromosome 15 L000000308 15 326702 326584 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XV centromere -S000077290 centromere_DNA_Element_I CEN15 15 326702 326693 C 2011-02-03 2004-10-08 -S000077291 centromere_DNA_Element_II CEN15 15 326692 326609 C 2011-02-03 2004-10-08 -S000077292 centromere_DNA_Element_III CEN15 15 326608 326584 C 2011-02-03 2004-10-08 -S000005527 ORF Verified YOR001W RRP6 exosome nuclease subunit RRP6 chromosome 15 L000003540 15 326832 329033 W 2011-02-03 1996-07-31 Nuclear exosome exonuclease component; has 3'-5' exonuclease activity that is regulated by Lrp1p; involved in RNA processing, maturation, surveillance, degradation, tethering, and export; role in sn/snoRNAs precursor degradation; forms a stable heterodimer with Lrp1p; has similarity to E. coli RNase D and to human PM-Sc1 100 (EXOSC10); mutant displays reduced transcription elongation in the G-less-based -S000031325 CDS YOR001W 15 326832 329033 W 2011-02-03 1996-07-31 -S000005528 ORF Verified YOR002W ALG6 dolichyl-P-Glc:Man(9)GlcNAc(2)-PP-dolichol alpha-1,3-glucosyltransferase chromosome 15 L000003977 15 329417 331051 W 2011-02-03 1996-07-31 Alpha 1,3 glucosyltransferase; involved in transfer of oligosaccharides from dolichyl pyrophosphate to asparagine residues of proteins during N-linked protein glycosylation; C998T transition in human ortholog ALG6 causes carbohydrate-deficient glycoprotein syndrome type-Ic; wild-type human ortholog ALG6 can partially complement yeast alg6 mutant -S000032338 CDS YOR002W 15 329417 331051 W 2011-02-03 1996-07-31 -S000005529 ORF Verified YOR003W YSP3 putative subtilisin-like protease YSP3 chromosome 15 L000002552 15 331455 332891 W 2011-02-03 1996-07-31 Putative precursor of the subtilisin-like protease III; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YSP3 has a paralog, PRB1, that arose from the whole genome duplication -S000032469 CDS YOR003W 15 331455 332891 W 2011-02-03 1996-07-31 -S000005530 ORF Verified YOR004W UTP23 rRNA-binding ribosome biosynthesis protein UTP23 chromosome 15 15 333592 334356 W 2011-02-03 1996-07-31 Component of the small subunit processome; involved in 40S ribosomal subunit biogenesis; interacts with snR30 and is required for dissociation of snR30 from large pre-ribosomal particles; has homology to PINc domain protein Fcf1p, although the PINc domain of Utp23p is not required for function; essential protein -S000032573 CDS YOR004W 15 333592 334356 W 2011-02-03 1996-07-31 -S000005531 ORF Verified YOR005C DNL4 DNA ligase (ATP) DNL4|LIG4 chromosome 15 L000003479 15 337343 334509 C 2011-02-03 1996-07-31 DNA ligase required for nonhomologous end-joining (NHEJ); forms stable heterodimer with required cofactor Lif1p, interacts with Nej1p; involved in meiosis, not essential for vegetative growth; mutations in human ortholog lead to ligase IV syndrome and Dubowitz syndrome -S000032618 CDS YOR005C 15 337343 334509 C 2011-02-03 1996-07-31 -S000118489 ARS ARS1513 ARSXV-337 chromosome 15 15 337424 337491 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000005532 ORF Verified YOR006C TSR3 chromosome 15 15 338621 337680 C 2011-02-03 1996-07-31 Protein required for 20S pre-rRNA processing; involved in processing of the 20S pre-rRNA at site D to generate mature 18S rRNA; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus; relative distribution to the nucleus increases upon DNA replication stress -S000033336 CDS YOR006C 15 338621 337680 C 2011-02-03 1996-07-31 -S000005533 ORF Verified YOR007C SGT2 chromosome 15 L000004506 15 339978 338938 C 2011-02-03 1996-07-31 Glutamine-rich cytoplasmic cochaperone; serves as a scaffold bringing together Get4, Get5p, and other TRC complex members that are required to mediate posttranslational insertion of tail-anchored proteins into the ER membrane; interacts with the prion domain of Sup35p; amyloid sensor; plays a role in targeting chaperones to prion aggregates; similar to human cochaperone SGT; forms cytoplasmic foci upon DNA replication stress -S000033384 CDS YOR007C 15 339978 338938 C 2011-02-03 1996-07-31 -S000006705 tRNA_gene tR(ACG)O chromosome 15 L000003718 15 340371 340299 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030451 noncoding_exon tR(ACG)O 15 340371 340299 C 2011-02-03 2000-05-19 -S000007153 long_terminal_repeat YORCdelta9 YOLCdelta9 chromosome 15 15 340898 340598 C 2011-02-03 2000-05-19 Ty1 LTR -S000005534 ORF Verified YOR008C SLG1 WSC1|HCS77 chromosome 15 L000003080 15 342414 341278 C 2011-02-03 1996-07-31 Sensor-transducer of the stress-activated PKC1-MPK1 kinase pathway; involved in maintenance of cell wall integrity; required for mitophagy; involved in organization of the actin cytoskeleton; secretory pathway Wsc1p is required for the arrest of secretion response -S000033455 CDS YOR008C 15 342414 341278 C 2011-02-03 1996-07-31 -S000006431 ORF Uncharacterized YOR008C-A chromosome 15 L000003931 15 343081 342857 C 2011-02-03 1999-07-17 Putative protein of unknown function; includes a potential transmembrane domain; deletion results in slightly lengthened telomeres; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000034860 CDS YOR008C-A 15 343081 342857 C 2011-02-03 1999-07-17 -S000007628 ORF Dubious YOR008W-B chromosome 15 15 343929 344030 W 2006-01-05 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037258 CDS YOR008W-B 15 343929 344030 W 2006-01-05 2001-02-26 -S000005535 ORF Verified YOR009W TIR4 chromosome 15 15 344335 345798 W 2006-01-05 1996-07-31 Cell wall mannoprotein; expressed under anaerobic conditions and required for anaerobic growth; transcription is also induced by cold shock; member of the Srp1p/Tip1p family of serine-alanine-rich proteins -S000033574 CDS YOR009W 15 344335 345798 W 2006-01-05 1996-07-31 -S000005536 ORF Verified YOR010C TIR2 putative GPI-anchored mannoprotein|SRP2 chromosome 15 L000002312 15 346950 346195 C 2006-01-05 1996-07-31 Putative cell wall mannoprotein; member of the Srp1p/Tip1p family of serine-alanine-rich proteins; transcription is induced by cold shock and anaerobiosis; TIR2 has a paralog, TIR3, that arose from the whole genome duplication -S000034479 CDS YOR010C 15 346950 346195 C 2006-01-05 1996-07-31 -S000005537 ORF Verified YOR011W AUS1 ATP-binding cassette sterol transporter AUS1 chromosome 15 15 349679 353863 W 2006-01-05 1996-07-31 Plasma membrane sterol transporter of the ATP-binding cassette family; required, along with Pdr11p, for uptake of exogenous sterols and their incorporation into the plasma membrane; activity is stimulated by phosphatidylserine; sterol uptake is required for anaerobic growth because sterol biosynthesis requires oxygen; AUS1 has a paralog, PDR11, that arose from the whole genome duplication -S000035557 CDS YOR011W 15 349679 353863 W 2006-01-05 1996-07-31 -S000006747 tRNA_gene tT(AGU)O2 chromosome 15 L000003717 15 354113 354041 C 2006-01-05 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000037535 noncoding_exon tT(AGU)O2 15 354113 354041 C 2006-01-05 2000-05-19 -S000007159 long_terminal_repeat YORWsigma2 YOLWsigma2 chromosome 15 15 354128 354466 W 2006-01-05 2000-05-19 Ty3 LTR -S000007157 long_terminal_repeat YORWdelta10 YOLWdelta10 chromosome 15 15 354681 354958 W 2006-01-05 2000-05-19 Ty1 LTR -S000028581 ORF Uncharacterized YOR011W-A chromosome 15 15 355652 355858 W 2006-01-05 2003-07-29 Putative protein of unknown function -S000031328 CDS YOR011W-A 15 355652 355858 W 2006-01-05 2003-07-29 -S000005538 ORF Uncharacterized YOR012W chromosome 15 15 356543 356956 W 2006-01-05 1996-07-31 Putative protein of unknown function -S000035636 CDS YOR012W 15 356543 356956 W 2006-01-05 1996-07-31 -S000005539 ORF Dubious YOR013W IRC11 chromosome 15 15 356751 357221 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YOR012C; null mutant displays increased levels of spontaneous Rad52 foci -S000035766 CDS YOR013W 15 356751 357221 W 2006-01-05 1996-07-31 -S000005540 ORF Verified YOR014W RTS1 protein phosphatase 2A regulatory subunit RTS1|SCS1 chromosome 15 L000001786 15 357674 359947 W 2006-01-05 1996-07-31 B-type regulatory subunit of protein phosphatase 2A (PP2A); Rts1p and Cdc55p are alternative regulatory subunits for PP2A catalytic subunits, Pph21p and Pph22p; PP2A-Rts1p protects cohesin when recruited by Sgo1p to the pericentromere; highly enriched at centromeres in the absence of Cdc55p; required for maintenance of septin ring organization during cytokinesis, for ring disassembly in G1 and for dephosphorylation of septin, Shs1p; homolog of the mammalian B' subunit of PP2A -S000036675 CDS YOR014W 15 357674 359947 W 2006-01-05 1996-07-31 -S000005541 ORF Uncharacterized YOR015W chromosome 15 15 359993 360352 W 2006-01-05 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOR015W is not an essential gene -S000036735 CDS YOR015W 15 359993 360352 W 2006-01-05 1996-07-31 -S000005542 ORF Verified YOR016C ERP4 chromosome 15 L000004681 15 361084 360461 C 2006-01-05 1996-07-31 Member of the p24 family involved in ER to Golgi transport; similar to Emp24p and Erv25p; ERP4 has a paralog, ERP2, that arose from the whole genome duplication -S000036758 CDS YOR016C 15 361084 360461 C 2006-01-05 1996-07-31 -S000005543 ORF Verified YOR017W PET127 chromosome 15 L000001399 15 361412 363814 W 5.5 2006-01-05 1996-07-31 Protein with a role in 5'-end processing of mitochondrial RNAs; located in the mitochondrial membrane -S000036848 CDS YOR017W 15 361412 363814 W 2006-01-05 1996-07-31 -S000005544 ORF Verified YOR018W ROD1 ART4 chromosome 15 L000003079 15 364369 366882 W 2006-01-05 1996-07-31 Alpha-arrestin involved in ubiquitin-dependent endocytosis; activating dephosphorylation relays glucose signaling to transporter endocytosis; calcineurin dephosphorylation is required for Rsp5p-dependent internalization of agonist-occupied Ste2p, as part of signal desensitization; recruits Rsp5p to Ste2p via its 2 PPXY motifs; protein abundance increases in response to DNA replication stress; ROD1 has a paralog, ROG3, that arose from the whole genome duplication -S000037590 CDS YOR018W 15 364369 366882 W 2006-01-05 1996-07-31 -S000005545 ORF Verified YOR019W chromosome 15 15 368127 370319 W 2006-01-05 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; YOR019W has a paralog, JIP4, that arose from the whole genome duplication -S000037647 CDS YOR019W 15 368127 370319 W 2006-01-05 1996-07-31 -S000005546 ORF Verified YOR020C HSP10 CPN10 chromosome 15 L000000815 15 370844 370524 C 2006-01-05 1996-07-31 Mitochondrial matrix co-chaperonin; inhibits the ATPase activity of Hsp60p, a mitochondrial chaperonin; involved in protein folding and sorting in the mitochondria; 10 kD heat shock protein with similarity to E. coli groES -S000037650 CDS YOR020C 15 370844 370524 C 2006-01-05 1996-07-31 -S000028526 ORF Uncharacterized YOR020W-A chromosome 15 15 371685 371957 W 2006-01-05 2003-07-29 Putative protein of unknown function; conserved in A. gossypii; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000030330 CDS YOR020W-A 15 371685 371957 W 2006-01-05 2003-07-29 -S000005547 ORF Verified YOR021C SFM1 protein-arginine N-methyltransferase SFM1 chromosome 15 15 373439 372798 C 2006-01-05 1996-07-31 SPOUT methyltransferase; catalyzes omega-monomethylation of Rps3p on Arg-146; not an essential gene; predicted to be involved in rRNA processing and ribosome biogenesis and in biopolymer catabolism -S000030445 CDS YOR021C 15 373439 372798 C 2006-01-05 1996-07-31 -S000005548 ORF Verified YOR022C DDL1 putative carboxylic ester hydrolase chromosome 15 15 375857 373710 C 2006-01-05 1996-07-31 DDHD domain-containing phospholipase A1; mitochondrial matrix enzyme with sn-1-specific activity, hydrolyzing cardiolipin, PE, PC, PG and PA; implicated in remodeling of mitochondrial phospholipids; antagonistically regulated by Aft1p and Aft2p; in humans, mutations in DDHD1 and DDHD2 genes cause specific types of hereditary spastic paraplegia, while DDL1-defective yeast share similar phenotypes such as mitochondrial dysfunction and defects in lipid metabolism -S000030587 CDS YOR022C 15 375857 373710 C 2006-01-05 1996-07-31 -S000005549 ORF Verified YOR023C AHC1 chromosome 15 15 377712 376012 C 2006-01-05 1996-07-31 Subunit of the Ada histone acetyltransferase complex; required for structural integrity of the complex; Ahc2p and Ahc1p are unique to the ADA complex and not shared with the related SAGA and SLIK complexes; Ahc2p may tether Ahc1p to the complex -S000030673 CDS YOR023C 15 377712 376012 C 2006-01-05 1996-07-31 -S000005550 ORF Dubious YOR024W IRC12 chromosome 15 15 377847 378170 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031578 CDS YOR024W 15 377847 378170 W 2006-01-05 1996-07-31 -S000005551 ORF Verified YOR025W HST3 NAD-dependent histone deacetylase HST3 chromosome 15 L000003042 15 378219 379562 W 2006-01-05 1996-07-31 Member of the Sir2 family of NAD(+)-dependent protein deacetylases; involved along with Hst4p in telomeric silencing, cell cycle progression, radiation resistance, genomic stability and short-chain fatty acid metabolism -S000031696 CDS YOR025W 15 378219 379562 W 2006-01-05 1996-07-31 -S000005552 ORF Verified YOR026W BUB3 PAC9 chromosome 15 L000000198 15 379781 380806 W 2006-01-05 1996-07-31 Kinetochore checkpoint WD40 repeat protein; localizes to kinetochores during prophase and metaphase, delays anaphase in the presence of unattached kinetochores; forms complexes with Mad1p-Bub1p and with Cdc20p, binds Mad2p and Mad3p; functions at kinetochore to activate APC/C-Cdc20p for normal mitotic progression -S000031797 CDS YOR026W 15 379781 380806 W 2006-01-05 1996-07-31 -S000005553 ORF Verified YOR027W STI1 Hsp90 cochaperone STI1 chromosome 15 L000002129 15 381053 382822 W 2006-01-05 1996-07-31 Hsp90 cochaperone; regulates spatial organization of amyloid-like proteins in the cytosol, thereby buffering the proteotoxicity caused by amyloid-like proteins; interacts with the Ssa group of the cytosolic Hsp70 chaperones and activates Ssa1p ATPase activity; interacts with Hsp90 chaperones and inhibits their ATPase activity; homolog of mammalian Hop -S000031906 CDS YOR027W 15 381053 382822 W 2006-01-05 1996-07-31 -S000005554 ORF Verified YOR028C CIN5 YAP4|HAL6 chromosome 15 L000000339|L000004263 15 384420 383533 C 2006-01-05 1996-07-31 Basic leucine zipper (bZIP) transcription factor of the yAP-1 family; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; mediates pleiotropic drug resistance and salt tolerance; nuclearly localized under oxidative stress and sequestered in the cytoplasm by Lot6p under reducing conditions; CIN5 has a paralog, YAP6, that arose from the whole genome duplication -S000032760 CDS YOR028C 15 384420 383533 C 2006-01-05 1996-07-31 -S000005555 ORF Uncharacterized YOR029W chromosome 15 15 384600 384935 W 2006-01-05 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOR029W is not an essential gene -S000032920 CDS YOR029W 15 384600 384935 W 2006-01-05 1996-07-31 -S000005556 ORF Verified YOR030W DFG16 ZRG12|ECM41 chromosome 15 L000003877 15 386825 388684 W 2006-01-05 1996-07-31 Probable multiple transmembrane protein; involved in diploid invasive and pseudohyphal growth upon nitrogen starvation; is glycosylated and phosphorylated; interacts with Rim21p and Rim9p in the plasma membrane to form a pH-sensing complex in the Rim101 pathway and is required to maintain Rim21p levels; required for accumulation of processed Rim101p -S000033591 CDS YOR030W 15 386825 388684 W 2006-01-05 1996-07-31 -S000005557 blocked_reading_frame YOR031W CRS5 metallothionein CRS5 chromosome 15 L000000421 15 389213 389422 W 2006-01-05 1996-07-31 Copper-binding metallothionein; required for wild-type copper resistance -S000033679 CDS YOR031W 15 389213 389422 W 2006-01-05 1996-07-31 -S000005558 ORF Verified YOR032C HMS1 chromosome 15 L000004441 15 391075 389771 C 2006-01-05 1996-07-31 bHLH protein with similarity to myc-family transcription factors; overexpression confers hyperfilamentous growth and suppresses the pseudohyphal filamentation defect of a diploid mep1 mep2 homozygous null mutant -S000033735 CDS YOR032C 15 391075 389771 C 2006-01-05 1996-07-31 -S000028710 ORF Uncharacterized YOR032W-A chromosome 15 15 392176 392376 W 2006-01-05 2003-07-29 Protein of unknown function; SWAT-GFP and seamless-GFP fusion proteins localize to the endoplasmic reticulum; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032675 CDS YOR032W-A 15 392176 392376 W 2006-01-05 2003-07-29 -S000005559 ORF Verified YOR033C EXO1 Rad2 family nuclease EXO1|DHS1 chromosome 15 L000000505|L000003929 15 394524 392416 C 2006-01-05 1996-07-31 5'-3' exonuclease and flap-endonuclease; involved in recombination, double-strand break repair, MMS2 error-free branch of the post replication (PRR) pathway and DNA mismatch repair; role in telomere maintenance; member of the Rad2p nuclease family, with conserved N and I nuclease domains; relative distribution to the nucleus increases upon DNA replication stress; EXO1 has a paralog, DIN7, that arose from the whole genome duplication -S000034621 CDS YOR033C 15 394524 392416 C 2006-01-05 1996-07-31 -S000005560 ORF Verified YOR034C AKR2 putative palmitoyltransferase AKR2 chromosome 15 L000004052 15 397086 394837 C 2006-01-05 1996-07-31 Ankyrin repeat-containing protein; member of a family of putative palmitoyltransferases containing an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain; possibly involved in constitutive endocytosis of Ste3p; AKR2 has a paralog, AKR1, that arose from the whole genome duplication -S000034777 CDS YOR034C 15 397086 394837 C 2006-01-05 1996-07-31 -S000028856 ORF Uncharacterized YOR034C-A chromosome 15 15 397668 397426 C 2006-01-05 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034569 CDS YOR034C-A 15 397668 397426 C 2006-01-05 2003-07-29 -S000005561 ORF Verified YOR035C SHE4 DIM1 chromosome 15 L000004572 15 400104 397735 C 2006-01-05 1996-07-31 Protein containing a UCS (UNC-45/CRO1/SHE4) domain; binds to myosin motor domains to regulate myosin function; involved in endocytosis, polarization of the actin cytoskeleton, and asymmetric mRNA localization -S000034897 CDS YOR035C 15 400104 397735 C 2006-01-05 1996-07-31 -S000005562 ORF Verified YOR036W PEP12 SNAP receptor PEP12|VPT13|VPS6|VPL6 chromosome 15 L000001379 15 400348 401214 W -5 2006-01-05 1996-07-31 Target membrane receptor (t-SNARE); for vesicular intermediates traveling between the Golgi apparatus and the vacuole; controls entry of biosynthetic, endocytic, and retrograde traffic into the prevacuolar compartment; syntaxin -S000035899 CDS YOR036W 15 400348 401214 W 2006-01-05 1996-07-31 -S000005563 ORF Verified YOR037W CYC2 oxidoreductase chromosome 15 L000000449 15 401555 402655 W 12 2006-01-05 2003-09-22|1996-07-31 Mitochondrial peripheral inner membrane protein; contains a FAD cofactor in a domain exposed in the intermembrane space; exhibits redox activity in vitro; likely participates in ligation of heme to acytochromes c and c1 (Cyc1p and Cyt1p) -S000036064 CDS YOR037W 15 401555 402655 W 2006-01-05 2003-09-22|1996-07-31 -S000005564 ORF Verified YOR038C HIR2 SPT1 chromosome 15 L000000777 15 405388 402761 C 2006-01-05 1996-07-31 Subunit of HIR nucleosome assembly complex; involved in regulation of histone gene transcription; recruits Swi-Snf complexes to histone gene promoters; promotes heterochromatic gene silencing with Asf1p; relocalizes to the cytosol in response to hypoxia -S000036118 CDS YOR038C 15 405388 402761 C 2006-01-05 1996-07-31 -S000005565 ORF Verified YOR039W CKB2 casein kinase 2 regulatory subunit CKB2 chromosome 15 L000000345 15 405768 406544 W 2006-01-05 1996-07-31 Beta' regulatory subunit of casein kinase 2 (CK2); a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerase -S000036946 CDS YOR039W 15 405768 406544 W 2006-01-05 1996-07-31 -S000005566 ORF Verified YOR040W GLO4 hydroxyacylglutathione hydrolase GLO4 chromosome 15 L000003489 15 407064 407921 W 2006-01-05 1996-07-31 Mitochondrial glyoxalase II; catalyzes the hydrolysis of S-D-lactoylglutathione into glutathione and D-lactate; GLO4 has a paralog, GLO2, that arose from the whole genome duplication -S000037742 CDS YOR040W 15 407064 407921 W 2006-01-05 1996-07-31 -S000007292 snoRNA_gene snR9 SNR9 chromosome 15 L000001964 15 408134 407948 C 2006-01-05 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2340 and U2345 -S000034330 noncoding_exon snR9 15 408134 407948 C 2006-01-05 2000-05-19 -S000005568 ORF Verified YOR042W CUE5 ubiquitin-binding protein CUE5 chromosome 15 15 408425 409660 W 2006-01-05 1996-07-31 Ubiquitin-binding protein; functions as ubiquitin-Atg8p adaptor in ubiquitin-dependent autophagy; serves as proteaphagy receptor for inactivated 26S proteasomes; contains CUE domain that binds ubiquitin, which may facilitate intramolecular monoubiquitination; CUE5 has a paralog, DON1, that arose from the whole genome duplication; human TOLLIP is a functional CUE-domain homolog, can complement yeast null mutant, rescuing hypersensitivity of cue5 null mutant cells to Htt-96Q -S000029840 CDS YOR042W 15 408425 409660 W 2006-01-05 1996-07-31 -S000005567 ORF Dubious YOR041C SRF5 chromosome 15 15 408789 408358 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 85% of ORF overlaps the uncharacterized gene CUE5; deletion in cyr1 mutant results in loss of stress resistance -S000037769 CDS YOR041C 15 408789 408358 C 2006-01-05 1996-07-31 -S000006453 snoRNA_gene snR62 SNR62 chromosome 15 L000004531 15 409864 409765 C 2006-01-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U1888 -S000030839 noncoding_exon snR62 15 409864 409765 C 2006-01-05 2000-05-19 -S000005569 ORF Verified YOR043W WHI2 chromosome 15 L000002485 15 410870 412330 W 9 2006-01-05 1996-07-31 Protein required for full activation of the general stress response; required with binding partner Psr1p, possibly through Msn2p dephosphorylation; regulates growth during the diauxic shift; negative regulator of G1 cyclin expression; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cell periphery -S000030841 CDS YOR043W 15 410870 412330 W 2006-01-05 1996-07-31 -S000005570 ORF Verified YOR044W IRC23 chromosome 15 15 413007 413480 W 2006-01-05 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion localizes to the ER; null mutant displays increased levels of spontaneous Rad52p foci; IRC23 has a paralog, BSC2, that arose from the whole genome duplication -S000030924 CDS YOR044W 15 413007 413480 W 2006-01-05 1996-07-31 -S000005571 ORF Verified YOR045W TOM6 MOM8B|ISP6 chromosome 15 L000000877 15 413852 414037 W 2006-01-05 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; promotes assembly and stability of the TOM complex -S000030996 CDS YOR045W 15 413852 414037 W 2006-01-05 1996-07-31 -S000005572 ORF Verified YOR046C DBP5 ATP-dependent RNA helicase DBP5|RAT8 chromosome 15 L000003292 15 415907 414459 C 2011-02-03 1996-07-31 Cytoplasmic ATP-dependent RNA helicase of the DEAD-box family; involved in mRNA export from the nucleus, remodeling messenger ribonucleoprotein particles (mRNPs), with ATPase activity stimulated by Gle1p, IP6 and Nup159p; involved in translation termination along with Sup45p (eRF1); role in the cellular response to heat stress -S000031032 CDS YOR046C 15 415907 414459 C 2011-02-03 1996-07-31 -S000005573 ORF Verified YOR047C STD1 SFS3|MSN3 chromosome 15 L000002111 15 417681 416347 C 2011-02-03 1996-07-31 Protein involved in control of glucose-regulated gene expression; interacts with kinase Snf1p, glucose sensors Snf3p and Rgt2p, TATA-binding Spt15p; regulator of transcription factor Rgt1p; interactions with Pma1p appear to propagate [GAR+]; STD1 has a paralog, MTH1, that arose from the whole genome duplication -S000032001 CDS YOR047C 15 417681 416347 C 2011-02-03 1996-07-31 -S000005574 ORF Verified YOR048C RAT1 ssRNA exonuclease RAT1|XRN2|TAP1|HKE1 chromosome 15 L000001584 15 421650 418630 C 17.1 2011-02-03 1996-07-31 Nuclear 5' to 3' single-stranded RNA exonuclease; involved in RNA metabolism, including rRNA and snoRNA processing, as well as poly (A+) dependent and independent mRNA transcription termination; required for cotranscriptional pre-rRNA cleavage; displaces Cdk1p from elongating transcripts, especially as RNAPII reaches the poly(A) site, negatively regulates phosphorylation of the CTD of RNAPII, and inhibits RNAPII transcriptional elongation -S000032091 CDS YOR048C 15 421650 418630 C 2011-02-03 1996-07-31 -S000005575 ORF Verified YOR049C RSB1 phospholipid-translocating ATPase RSB1 chromosome 15 15 423732 422668 C 2011-02-03 1996-07-31 Putative sphingoid long-chain base (LCB) efflux transporter; integral membrane transporter that localizes to the plasma membrane and may transport long chain bases (LCBs) from the cytoplasmic side toward the extracytoplasmic side of the membrane; role in glycerophospholipid translocation; suppressor of the sphingoid LCB sensitivity of an LCB-lyase mutation -S000032150 CDS YOR049C 15 423732 422668 C 2011-02-03 1996-07-31 -S000005576 ORF Dubious YOR050C YOR29-01 chromosome 15 15 424617 424270 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant is viable -S000033916 CDS YOR050C 15 424617 424270 C 2011-02-03 1996-07-31 -S000005577 ORF Verified YOR051C ETT1 NRO1|YOR29-02 chromosome 15 15 426084 424846 C 2011-02-03 1996-07-31 Nuclear protein that inhibits replication of Brome mosaic virus; S. cerevisiae is a model system for studying replication of positive-strand RNA viruses in their natural hosts; deletion increases stop codon readthrough -S000034062 CDS YOR051C 15 426084 424846 C 2011-02-03 1996-07-31 -S000005578 ORF Verified YOR052C TMC1 YOR29-03 chromosome 15 15 427224 426772 C 2011-02-03 1996-07-31 AN1-type zinc finger protein, effector of proteotoxic stress response; stress-inducible transcriptional target of Rpn4p; induced by nitrogen limitation, weak acid, misfolded proteins; short-lived protein, degraded by proteasome; may protect cells from trivalent metalloid induced proteotoxicity; contains PACE promoter element; ortholog of human AIRAP, which stimulates proteasome activity in response to arsenic; protein abundance increases under DNA replication stress -S000034154 CDS YOR052C 15 427224 426772 C 2011-02-03 1996-07-31 -S000005579 ORF Dubious YOR053W YOR29-04 chromosome 15 15 427817 428158 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene VHS3/YOR054C -S000035170 CDS YOR053W 15 427817 428158 W 2011-02-03 1996-07-31 -S000005581 ORF Dubious YOR055W YOR29-06 chromosome 15 15 429478 429912 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035354 CDS YOR055W 15 429478 429912 W 2011-02-03 1996-07-31 -S000005580 ORF Verified YOR054C VHS3 phosphopantothenoylcysteine decarboxylase complex subunit VHS3|YOR29-05 chromosome 15 15 429857 427833 C 2011-02-03 1996-07-31 Negative regulatory subunit of protein phosphatase 1 Ppz1p; involved in coenzyme A biosynthesis; subunit of the phosphopantothenoylcysteine decarboxylase (PPCDC; Cab3p, Sis2p, Vhs3p) complex and the CoA-Synthesizing Protein Complex (CoA-SPC: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p) -S000035210 CDS YOR054C 15 429857 427833 C 2011-02-03 1996-07-31 -S000005582 ORF Verified YOR056C NOB1 rRNA-binding endoribonuclease|YOR29-07 chromosome 15 15 431626 430247 C 2011-02-03 1996-07-31 Protein involved in proteasomal and 40S ribosomal subunit biogenesis; required for cleavage of the 20S pre-rRNA to generate the mature 18S rRNA; cleavage is activated by Fun12p, a GTPase and translation initiation factor; relocalizes from nucleus to nucleolus upon DNA replication stress -S000035381 CDS YOR056C 15 431626 430247 C 2011-02-03 1996-07-31 -S000005583 ORF Verified YOR057W SGT1 co-chaperone SGT1|YOR29-08 chromosome 15 L000003443|L000004087 15 432186 433373 W 2011-02-03 1996-07-31 Cochaperone protein; regulates activity of adenylyl cyclase Cyr1p; involved in kinetochore complex assembly; associates with the SCF (Skp1p/Cdc53p/F box protein) ubiquitin ligase complex; acts as a linker between Skp1p and HSP90 complexes; protein abundance increases in response to DNA replication stress -S000036316 CDS YOR057W 15 432186 433373 W 2011-02-03 1996-07-31 -S000005584 ORF Verified YOR058C ASE1 YOR29-09 chromosome 15 L000000125 15 436345 433688 C 2011-02-03 1996-07-31 Mitotic spindle midzone-localized microtubule bundling protein; microtubule-associated protein (MAP) family member; required for spindle elongation and stabilization; undergoes cell cycle-regulated degradation by anaphase promoting complex; potential Cdc28p substrate; relative distribution to microtubules decreases upon DNA replication stress -S000036352 CDS YOR058C 15 436345 433688 C 2011-02-03 1996-07-31 -S000007162 long_terminal_repeat YORCdelta11 chromosome 15 15 438483 438175 C 2011-02-03 2000-05-19 Ty1 LTR -S000006634 tRNA_gene tK(UUU)O chromosome 15 L000003707 15 438643 438738 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034218 intron tK(UUU)O 15 438680 438702 W 2011-02-03 2000-05-19 -S000034216 noncoding_exon tK(UUU)O 15 438643 438679 W 2011-02-03 2000-05-19 -S000034217 noncoding_exon tK(UUU)O 15 438703 438738 W 2011-02-03 2000-05-19 -S000005585 ORF Verified YOR059C LPL1 putative hydrolase|YOR29-10 chromosome 15 15 440258 438906 C 2011-02-03 1996-07-31 Phospholipase; contains lipase specific GXSXG motif; maintains lipid droplet (LD) morphology; induced by transcription factor Rpn4p; protein abundance increases in response to DNA replication stress -S000036452 CDS YOR059C 15 440258 438906 C 2011-02-03 1996-07-31 -S000005586 ORF Verified YOR060C SLD7 YOR29-11 chromosome 15 15 441163 440390 C 2011-02-03 1996-07-31 Protein with a role in chromosomal DNA replication; interacts with Sld3p and reduces its affinity for Cdc45p; deletion mutant has aberrant mitochondria -S000037458 CDS YOR060C 15 441163 440390 C 2011-02-03 1996-07-31 -S000005587 ORF Verified YOR061W CKA2 casein kinase 2 catalytic subunit CKA2|YOR29-12 chromosome 15 L000000344 15 441534 442553 W 2011-02-03 1996-07-31 Alpha' catalytic subunit of casein kinase 2 (CK2); CK2 is a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerases; protein abundance increases in response to DNA replication stress; regulates Fkh1p-mediated donor preference during mating-type switching -S000037585 CDS YOR061W 15 441534 442553 W 2011-02-03 1996-07-31 -S000005588 ORF Uncharacterized YOR062C YOR29-13 chromosome 15 15 443531 442725 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Reg1p; expression regulated by glucose and Rgt1p; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; YOR062C has a paralog, YKR075C, that arose from the whole genome duplication -S000037610 CDS YOR062C 15 443531 442725 C 2011-02-03 1996-07-31 -S000005589 ORF Verified YOR063W RPL3 uL3|ribosomal 60S subunit protein L3|rp1|YL1|L3|YOR29-14|TCM1|MAK8 chromosome 15 15 444686 445849 W 22 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L3; homologous to mammalian ribosomal protein L3 and bacterial L3; plays an important role in function of eIF5B in stimulating 3' end processing of 18S rRNA in context of 80S ribosomes that have not yet engaged in translation; involved in replication and maintenance of killer double stranded RNA virus -S000030496 CDS YOR063W 15 444686 445849 W 2011-02-03 1996-07-31 -S000005590 ORF Verified YOR064C YNG1 YOR29-15 chromosome 15 S000007517 15 446738 446079 C 2011-02-03 1996-07-31 Subunit of the NuA3 histone acetyltransferase complex; this complex acetylates histone H3; contains PHD finger domain that interacts with methylated histone H3; shares significant sequence identity with the human candidate tumor suppressor p33-ING1 in C-terminal region -S000030526 CDS YOR064C 15 446738 446079 C 2011-02-03 1996-07-31 -S000005591 ORF Verified YOR065W CYT1 ubiquinol--cytochrome-c reductase catalytic subunit CYT1|YOR29-16|CTC1 chromosome 15 L000000472 15 447439 448368 W 2011-02-03 1996-07-31 Cytochrome c1; component of the mitochondrial respiratory chain; expression is regulated by the heme-activated, glucose-repressed Hap2p/3p/4p/5p CCAAT-binding complex -S000030648 CDS YOR065W 15 447439 448368 W 2011-02-03 1996-07-31 -S000005592 ORF Verified YOR066W MSA1 YOR29-17 chromosome 15 15 449436 451325 W 2011-02-03 1996-07-31 Activator of G1-specific transcription factors MBF and SBF; involved in regulation of the timing of G1-specific gene transcription and cell cycle initiation; localization is cell-cycle dependent and regulated by Cdc28p phosphorylation; MSA1 has a paralog, MSA2, that arose from the whole genome duplication -S000030728 CDS YOR066W 15 449436 451325 W 2011-02-03 1996-07-31 -S000005593 ORF Verified YOR067C ALG8 dolichyl-P-Glc:Glc1Man(9)GlcNAc(2)-PP-dolichol alpha-1,3-glucosyltransferase|YOR29-18 chromosome 15 L000000079 15 453462 451729 C 2011-02-03 1996-07-31 Glucosyl transferase; involved in N-linked glycosylation; adds glucose to the dolichol-linked oligosaccharide precursor prior to transfer to protein during lipid-linked oligosaccharide biosynthesis; similar to Alg6p; human homolog ALG8 can complement yeast null mutant -S000030756 CDS YOR067C 15 453462 451729 C 2011-02-03 1996-07-31 -S000005595 ORF Verified YOR069W VPS5 sorting nexin 1|YOR29-20|VPT5|PEP10|GRD2 chromosome 15 L000002920 15 453768 455795 W 2011-02-03 2004-04-21|1996-07-31 Nexin-1 homolog; required for localizing membrane proteins from a prevacuolar/late endosomal compartment back to late Golgi; structural component of retromer membrane coat complex; forms a retromer subcomplex with Vps17p; required for recruiting the retromer complex to the endosome membranes; VPS5 has a paralog, YKR078W, that arose from the whole genome duplication -S000031779 CDS YOR069W 15 453768 455795 W 2011-02-03 2004-04-21|1996-07-31 -S000005594 ORF Verified YOR068C VAM10 YOR29-19 chromosome 15 15 454213 453869 C 2011-02-03 1996-07-31 Protein involved in vacuole morphogenesis; acts at an early step of homotypic vacuole fusion that is required for vacuole tethering -S000031602 CDS YOR068C 15 454213 453869 C 2011-02-03 1996-07-31 -S000005596 ORF Verified YOR070C GYP1 YOR29-21 chromosome 15 L000004377 15 457820 455907 C 2011-02-03 1996-07-31 Cis-golgi GTPase-activating protein (GAP) for yeast Rabs; the Rab family members are Ypt1p (in vivo) and for Ypt1p, Sec4p, Ypt7p, and Ypt51p (in vitro); involved in vesicle docking and fusion -S000033733 CDS YOR070C 15 457820 455907 C 2011-02-03 1996-07-31 -S000005597 ORF Verified YOR071C NRT1 nicotinamide riboside transporter|THI71|YOR29-22 chromosome 15 15 461276 459480 C 2011-02-03 1996-07-31 High-affinity nicotinamide riboside transporter; also transports thiamine with low affinity; major transporter for 5-aminoimidazole-4-carboxamide-1-beta-D-ribofuranoside (acadesine) uptake; shares sequence similarity with Thi7p and Thi72p; proposed to be involved in 5-fluorocytosine sensitivity -S000033867 CDS YOR071C 15 461276 459480 C 2011-02-03 1996-07-31 -S000005598 ORF Dubious YOR072W YOR29-23 chromosome 15 15 461502 461816 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious gene YOR072W-A; diploid deletion strains are methotrexate, paraquat and wortmannin sensitive -S000034814 CDS YOR072W 15 461502 461816 W 2011-02-03 1996-07-31 -S000028582 ORF Dubious YOR072W-A chromosome 15 15 461791 462039 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR072W; originally identified by fungal homology and RT-PCR -S000031329 CDS YOR072W-A 15 461791 462039 W 2011-02-03 2003-07-29 -S000006688 tRNA_gene tP(UGG)O2 SUF11 chromosome 15 L000002159|L000003708 15 464450 464551 W 30 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons -S000031047 intron tP(UGG)O2 15 464486 464515 W 2011-02-03 2000-05-19 -S000031045 noncoding_exon tP(UGG)O2 15 464450 464485 W 2011-02-03 2000-05-19 -S000031046 noncoding_exon tP(UGG)O2 15 464516 464551 W 2011-02-03 2000-05-19 -S000028516 ORF Uncharacterized YOR072W-B chromosome 15 15 464469 464630 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000030289 CDS YOR072W-B 15 464469 464630 W 2011-02-03 2003-07-29 -S000005599 ORF Verified YOR073W SGO1 YOR29-24 chromosome 15 15 464771 466543 W 2011-02-03 1996-07-31 Component of the spindle checkpoint; involved in sensing lack of tension on mitotic chromosomes; protects centromeric Rec8p at meiosis I; required for accurate chromosomal segregation at meiosis II and for mitotic chromosome stability; recruits condensin to the pericentric region of chromosomes during meiosis; dissociates from pericentromeres when sister kinetochores are under tension -S000034945 CDS YOR073W 15 464771 466543 W 2011-02-03 1996-07-31 -S000028583 ORF Dubious YOR073W-A chromosome 15 15 467390 467623 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially/completely overlaps the verified ORF CDC21/YOR074C; identified by RT-PCR -S000031330 CDS YOR073W-A 15 467390 467623 W 2011-02-03 2003-07-29 -S000005600 ORF Verified YOR074C CDC21 thymidylate synthase|YOR29-25|TMP1|CRT9 chromosome 15 L000000260 15 467589 466675 C 32 2011-02-03 1996-07-31|2005-12-01 Thymidylate synthase; required for de novo biosynthesis of pyrimidine deoxyribonucleotides; expression is induced at G1/S; human homolog TYMSOS can complement yeast cdc21 temperature-sensitive mutant at restrictive temperature -S000034991 CDS YOR074C 15 467589 466675 C 2011-02-03 1996-07-31|2005-12-01 -S000005601 ORF Verified YOR075W UFE1 YOR29-26 chromosome 15 L000002637 15 468212 469252 W 2011-02-03 1996-07-31 t-SNARE protein required for retrograde vesicular traffic; involved in Sey1p-independent homotypic ER fusion; required for efficient nuclear fusion during mating; forms a complex with the SNAREs Sec22p, Sec20p and Use1p to mediate fusion of Golgi-derived vesicles at the ER -S000035197 CDS YOR075W 15 468212 469252 W 2011-02-03 1996-07-31 -S000005602 ORF Verified YOR076C SKI7 YOR29-27 chromosome 15 15 471620 469377 C 2011-02-03 1996-07-31 GTP-binding protein that couples the Ski complex and exosome; putative pseudo-translational GTPase involved in 3'-to-5' mRNA decay pathway; interacts with both the cytoplasmic exosome and the Ski complex; eRF3-like domain targets nonstop mRNA for degradation; null mutants have a superkiller phenotype; SKI7 has a paralog, HBS1, that arose from the whole genome duplication -S000036014 CDS YOR076C 15 471620 469377 C 2011-02-03 1996-07-31 -S000005603 ORF Verified YOR077W RTS2 YOR29-28 chromosome 15 L000001787 15 471899 472597 W 2011-02-03 1996-07-31 Basic zinc-finger protein; similar to human and mouse Kin17 proteins which are chromatin-associated proteins involved in UV response and DNA replication -S000036174 CDS YOR077W 15 471899 472597 W 2011-02-03 1996-07-31 -S000005604 ORF Verified YOR078W BUD21 YOR29-29|UTP16 chromosome 15 15 472725 473369 W 2011-02-03 1996-07-31 Component of small ribosomal subunit (SSU) processosome; this complex contains U3 snoRNA; required at post-transcriptional step for efficient retrotransposition; absence results in decreased Ty1 Gag:GFP protein levels; originally isolated as bud-site selection mutant that displays a random budding pattern -S000036267 CDS YOR078W 15 472725 473369 W 2011-02-03 1996-07-31 -S000005605 ORF Verified YOR079C ATX2 Mn(2+) transporter ATX2|YOR29-30 chromosome 15 L000003290 15 474416 473475 C 2011-02-03 1996-07-31 Golgi membrane protein involved in manganese homeostasis; overproduction suppresses the sod1 (copper, zinc superoxide dismutase) null mutation -S000036294 CDS YOR079C 15 474416 473475 C 2011-02-03 1996-07-31 -S000005606 ORF Verified YOR080W DIA2 DNA-binding SCF ubiquitin ligase subunit DIA2|YOR29-31 chromosome 15 15 474594 476792 W 2011-02-03 1996-07-31|2010-01-05 Origin-binding F-box protein; forms SCF ubiquitin ligase complex with Skp1p and Cdc53p; functions in ubiquitination of silent chromatin structural protein Sir4p; required to target Cdc6p for destruction during G1 phase; required for deactivation of Rad53 checkpoint kinase, completion of DNA replication during recovery from DNA damage, assembly of RSC complex, RSC-mediated transcription regulation, and nucleosome positioning; involved in invasive and pseudohyphal growth -S000035995 CDS YOR080W 15 474594 476792 W 2011-02-03 1996-07-31|2010-01-05 -S000005607 ORF Verified YOR081C TGL5 STC2 chromosome 15 15 479188 476939 C 2011-02-03 1996-07-31 Bifunctional triacylglycerol lipase and LPA acyltransferase; lipid particle-localized triacylglycerol (TAG) lipase involved in triacylglycerol mobilization; catalyzes acylation of lysophosphatidic acid (LPA); potential Cdc28p substrate; TGL5 has a paralog, TGL4, that arose from the whole genome duplication -S000037799 CDS YOR081C 15 479188 476939 C 2011-02-03 1996-07-31 -S000005609 ORF Verified YOR083W WHI5 transcriptional repressor WHI5 chromosome 15 15 479533 480420 W 2011-02-03 1996-07-31 Repressor of G1 transcription; binds to SCB binding factor (SBF) at SCB target promoters in early G1; dilution of Whi5p concentration during cell growth determines cell size; phosphorylation of Whi5p by the CDK, Cln3p/Cdc28p relieves repression and promoter binding by Whi5, and contributes to both the determination of critical cell size at START and cell fate; periodically expressed in G1 -S000029953 CDS YOR083W 15 479533 480420 W 2011-02-03 1996-07-31 -S000005608 ORF Dubious YOR082C chromosome 15 15 479637 479296 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YOR083W -S000037872 CDS YOR082C 15 479637 479296 C 2011-02-03 1996-07-31 -S000005610 ORF Verified YOR084W LPX1 triglyceride lipase chromosome 15 15 480587 481750 W 2011-02-03 1996-07-31 Peroxisomal matrix-localized lipase; required for normal peroxisome morphology; contains a peroxisomal targeting signal type 1 (PTS1) and a lipase motif; peroxisomal import requires the PTS1 receptor, Pex5p and self-interaction; transcriptionally activated by Yrm1p along with genes involved in multidrug resistance; oleic acid inducible -S000030939 CDS YOR084W 15 480587 481750 W 2011-02-03 1996-07-31 -S000005611 ORF Verified YOR085W OST3 dolichyl-diphosphooligosaccharide--protein glycotransferase OST3 chromosome 15 L000002943 15 482033 483085 W 2011-02-03 1996-07-31 Gamma subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins; Ost3p is important for N-glycosylation of a subset of proteins -S000031015 CDS YOR085W 15 482033 483085 W 2011-02-03 1996-07-31 -S000005612 ORF Verified YOR086C TCB1 tricalbin chromosome 15 15 486779 483219 C 2011-02-03 1996-07-31 Lipid-binding ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to plasma membrane and regulate PI4P levels by controlling access of Sac1p phosphatase to its substrate PI4P in PM; contains 3 calcium and lipid binding domains; non-tagged protein also localizes to mitochondria; C-termini of Tcb1p, Tcb2p and Tcb3p interact; TCB1 has a paralog, TCB2, that arose from the whole genome duplication -S000031064 CDS YOR086C 15 486779 483219 C 2011-02-03 1996-07-31 -S000006676 tRNA_gene tN(GUU)O2 chromosome 15 L000003709 15 487439 487512 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000035653 noncoding_exon tN(GUU)O2 15 487439 487512 W 2011-02-03 2000-05-19 -S000005613 ORF Verified YOR087W YVC1 TRPY1|YOR088W chromosome 15 15 487707 489734 W 2011-02-03 2003-01-09|1996-07-31 Vacuolar cation channel; mediates release of Ca(2+) from the vacuole in response to hyperosmotic shock -S000031212 CDS YOR087W 15 487707 489734 W 2011-02-03 2003-01-09|1996-07-31 -S000007554 ARS ARS1501 ARS1514|ARS245 chromosome 15 15 489683 489942 2014-11-18 2000-10-17|2014-11-18 Autonomously Replicating Sequence -S000178184 ARS_consensus_sequence ARS1501 15 489891 489907 W 2014-11-18 2014-11-18 -S000005615 ORF Verified YOR089C VPS21 Rab family GTPase VPS21|YPT51|YPT21|VPT12|VPS12 chromosome 15 L000002474 15 490828 490196 C 2011-02-03 1996-07-31 Endosomal Rab family GTPase; required for endocytic transport and sorting of vacuolar hydrolases; required for endosomal localization of the CORVET complex; required with YPT52 for MVB biogenesis and sorting; involved in autophagy and ionic stress tolerance; geranylgeranylation required for membrane association; protein abundance increases in response to DNA replication stress; mammalian Rab5 homolog; VPS21 has a paralog, YPT53, that arose from the whole genome duplication -S000032213 CDS YOR089C 15 490828 490196 C 2011-02-03 1996-07-31 -S000005616 ORF Verified YOR090C PTC5 type 2C protein phosphatase PTC5|PPP1 chromosome 15 15 492841 491123 C 2011-02-03 1996-07-31 Mitochondrial type 2C protein phosphatase (PP2C); involved in regulation of pyruvate dehydrogenase activity by dephosphorylating the serine 133 of the Pda1p subunit; localizes to the intermembrane space and is imported via the presequence pathway and processed by the inner membrane protease (Imp1p-Imp2p); acts in concert with kinases Pkp1p and Pkp2p and phosphatase Ptc6p -S000031844 CDS YOR090C 15 492841 491123 C 2011-02-03 1996-07-31 -S000005617 ORF Verified YOR091W TMA46 RBF46 chromosome 15 15 493433 494470 W 2011-02-03 1996-07-31|2005-12-01 Protein of unknown function that associates with translating ribosomes; interacts with GTPase Rbg1p -S000032061 CDS YOR091W 15 493433 494470 W 2011-02-03 1996-07-31|2005-12-01 -S000005618 ORF Verified YOR092W ECM3 putative ATPase ECM3|YOR3165W chromosome 15 L000003879 15 495127 496968 W 2011-02-03 1996-07-31 Non-essential protein of unknown function; involved in signal transduction and the genotoxic response; induced rapidly in response to treatment with 8-methoxypsoralen and UVA irradiation; relocalizes from ER to cytoplasm upon DNA replication stress; ECM3 has a paralog, YNL095C, that arose from the whole genome duplication -S000032141 CDS YOR092W 15 495127 496968 W 2011-02-03 1996-07-31 -S000005619 ORF Uncharacterized YOR093C CMR2 chromosome 15 15 502452 497506 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion causes sensitivity to unfolded protein response-inducing agents -S000034073 CDS YOR093C 15 502452 497506 C 2011-02-03 1996-07-31 -S000005620 ORF Verified YOR094W ARF3 Arf family GTPase ARF3|ARL2 chromosome 15 L000000106 15 502795 503346 W 2011-02-03 1996-07-31 Glucose-repressible ADP-ribosylation factor; GTPase of Ras superfamily involved in regulating cell polarity and invasive growth; localizes to dynamic spots at plasma membrane and modulates PtdIns(4,5)P2 levels to facilitate endocytosis; required for localization of endocytic protein Lsb5p to correct cortical site in cells; also has mRNA binding activity; homolog of mammalian Arf6 -S000034255 CDS YOR094W 15 502795 503346 W 2011-02-03 1996-07-31 -S000005621 ORF Verified YOR095C RKI1 ribose-5-phosphate isomerase RKI1 chromosome 15 L000003519 15 504328 503552 C 2011-02-03 1996-07-31 Ribose-5-phosphate ketol-isomerase; catalyzes the interconversion of ribose 5-phosphate and ribulose 5-phosphate in the pentose phosphate pathway; participates in pyridoxine biosynthesis -S000034285 CDS YOR095C 15 504328 503552 C 2011-02-03 1996-07-31 -S000005622 ORF Verified YOR096W RPS7A eS7|ribosomal 40S subunit protein S7A|S7e|rp30|S7A|RPS30 chromosome 15 L000003300 15 505794 506767 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; interacts with Kti11p; deletion causes hypersensitivity to zymocin; homologous to mammalian ribosomal protein S7, no bacterial homolog; RPS7A has a paralog, RPS7B, that arose from the whole genome duplication -S000034377 CDS YOR096W 15 505794 505937 W 2011-02-03 1996-07-31 -S000034378 CDS YOR096W 15 506339 506767 W 2011-02-03 1996-07-31 -S000034379 intron YOR096W 15 505938 506338 W 2011-02-03 1996-07-31 -S000005623 ORF Uncharacterized YOR097C chromosome 15 15 507505 506978 C 2011-02-03 1996-07-31 Putative protein of unknown function; identified as interacting with Hsp82p in a high-throughput two-hybrid screen; YOR097C is not an essential gene -S000035307 CDS YOR097C 15 507505 506978 C 2011-02-03 1996-07-31 -S000005624 ORF Verified YOR098C NUP1 FG-nucleoporin NUP1 chromosome 15 L000001288 15 511178 507948 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of thenuclear pore complex (NPC) permeability barrier; possible karyopherin release factor that accelerates release of karyopherin-cargo complexes after transport across NPC; both NUP1 and NUP60 are homologous to human NUP153 -S000035367 CDS YOR098C 15 511178 507948 C 2011-02-03 1996-07-31 -S000005625 ORF Verified YOR099W KTR1 alpha-1,2-mannosyltransferase KTR1 chromosome 15 L000000924 15 511825 513006 W 54 2011-02-03 1996-07-31 Alpha-1,2-mannosyltransferase; involved in O- and N-linked protein glycosylation; type II membrane protein; member of the KRE2/MNT1 mannosyltransferase family; relocalizes from vacuole to cytoplasm upon DNA replication stress -S000035471 CDS YOR099W 15 511825 513006 W 2011-02-03 1996-07-31 -S000005626 ORF Verified YOR100C CRC1 carnitine:acyl carnitine antiporter chromosome 15 S000007462 15 514278 513295 C 2011-02-03 1996-07-31 Mitochondrial inner membrane carnitine transporter; required for carnitine-dependent transport of acetyl-CoA from peroxisomes to mitochondria during fatty acid beta-oxidation; human homolog SLC25A20 complements yeast null mutant -S000032610 CDS YOR100C 15 514278 513295 C 2011-02-03 1996-07-31 -S000005627 ORF Verified YOR101W RAS1 Ras family GTPase RAS1 chromosome 15 L000001582 15 515244 516173 W 53 2011-02-03 1996-07-31 GTPase involved in G-protein signaling in adenylate cyclase activation; plays a role in cell proliferation; localized to the plasma membrane; homolog of mammalian RAS proto-oncogenes; relative distribution to the nucleus increases upon DNA replication stress; RAS1 has a paralog, RAS2, that arose from the whole genome duplication -S000032754 CDS YOR101W 15 515244 516173 W 2011-02-03 1996-07-31 -S000005628 ORF Dubious YOR102W chromosome 15 15 516423 516773 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; extensively overlaps essential OST2 gene encoding a subunit of the ER lumen oligosaccharyltransferase complex -S000033499 CDS YOR102W 15 516423 516773 W 2011-02-03 1996-07-31 -S000005629 ORF Verified YOR103C OST2 dolichyl-diphosphooligosaccharide-protein glycotransferase chromosome 15 L000002942 15 516841 516449 C 2011-02-03 2003-09-22|1996-07-31 Epsilon subunit of the oligosaccharyltransferase complex; located in the ER lumen; catalyzes asparagine-linked glycosylation of newly synthesized proteins -S000033537 CDS YOR103C 15 516841 516449 C 2011-02-03 2003-09-22|1996-07-31 -S000005630 ORF Verified YOR104W PIN2 chromosome 15 15 517642 518490 W 2011-02-03 1996-07-31 Exomer-dependent cargo protein; induces appearance of [PIN+] prion when overproduced; prion-like domain serves as a retention signal in the trans-Golgi network; predicted to be palmitoylated -S000033687 CDS YOR104W 15 517642 518490 W 2011-02-03 1996-07-31 -S000005631 ORF Uncharacterized YOR105W chromosome 15 15 518195 518521 W 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels -S000033820 CDS YOR105W 15 518195 518521 W 2011-02-03 1996-07-31 -S000005632 ORF Verified YOR106W VAM3 SNAP receptor VAM3|PTH1 chromosome 15 L000003267|L000003302 15 519121 519972 W 2011-02-03 1996-07-31 Syntaxin-like vacuolar t-SNARE; functions with Vam7p in vacuolar protein trafficking; mediates docking/fusion of late transport intermediates with the vacuole; has an acidic di-leucine sorting signal and C-terminal transmembrane region -S000034700 CDS YOR106W 15 519121 519972 W 2011-02-03 1996-07-31 -S000005633 ORF Verified YOR107W RGS2 GTPase-activating protein RGS2 chromosome 15 15 521353 522282 W 2011-02-03 1996-07-31 Negative regulator of glucose-induced cAMP signaling; directly activates the GTPase activity of the heterotrimeric G protein alpha subunit Gpa2p -S000034847 CDS YOR107W 15 521353 522282 W 2011-02-03 1996-07-31 -S000005634 ORF Verified YOR108W LEU9 2-isopropylmalate synthase LEU9 chromosome 15 15 523027 524841 W 2011-02-03 1996-07-31 Alpha-isopropylmalate synthase II (2-isopropylmalate synthase); catalyzes the first step in the leucine biosynthesis pathway; the minor isozyme, responsible for the residual alpha-IPMS activity detected in a leu4 null mutant; LEU9 has a paralog, LEU4, that arose from the whole genome duplication -S000034978 CDS YOR108W 15 523027 524841 W 2011-02-03 1996-07-31 -S000028711 ORF Dubious YOR108C-A chromosome 15 15 524814 524605 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032677 CDS YOR108C-A 15 524814 524605 C 2011-02-03 2003-07-29 -S000005635 ORF Verified YOR109W INP53 phosphatidylinositol-3-/phosphoinositide 5-phosphatase INP53|SOP2|SJL3 chromosome 15 L000003984 15 525278 528601 W 2011-02-03 1996-07-31 Polyphosphatidylinositol phosphatase; dephosphorylates multiple phosphatidylinositol phosphates; involved in trans Golgi network-to-early endosome pathway; hyperosmotic stress causes translocation to actin patches; contains Sac1 and 5-ptase domains; INP53 has a paralog, INP52, that arose from the whole genome duplication -S000035927 CDS YOR109W 15 525278 528601 W 2011-02-03 1996-07-31 -S000005636 ORF Verified YOR110W TFC7 transcription factor TFIIIC subunit TFC7|tau 55 chromosome 15 15 528941 530248 W 2011-02-03 1996-07-31 RNA pol III transcription initiation factor complex (TFIIIC) subunit; part of the TauA globular domain of TFIIIC that binds DNA at the BoxA promoter sites of tRNA and similar genes; TFC7 has a paralog, YNL108C, that arose from the whole genome duplication -S000036863 CDS YOR110W 15 528941 530248 W 2011-02-03 1996-07-31 -S000005637 ORF Uncharacterized YOR111W chromosome 15 15 530429 531127 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000036919 CDS YOR111W 15 530429 531127 W 2011-02-03 1996-07-31 -S000005638 ORF Verified YOR112W CEX1 chromosome 15 15 531508 533793 W 2011-02-03 1996-07-31 Component of nuclear aminoacylation-dependent tRNA export pathway; cytoplasmic; interacts with nuclear pore component Nup116p; copurifies with tRNA export receptors Los1p and Msn5p, as well as eIF-1a; required for activation of RAN GTPase Gsp1p and dissociation of receptor-tRNA-Gsp1p export complex; recruits Rna1p from cytoplasm to NPC, facilitates Rna1p activation of Gsp1p GTPase activity by enabling Rna1p to gain access to Gsp1p-GTP bound to export receptor tRNA complex -S000036975 CDS YOR112W 15 531508 533793 W 2011-02-03 1996-07-31 -S000005639 ORF Verified YOR113W AZF1 chromosome 15 L000000158 15 534075 536819 W 2011-02-03 1996-07-31 Zinc-finger transcription factor; involved in diauxic shift; in the presence of glucose, activates transcription of genes involved in growth and carbon metabolism; in nonfermentable carbon sources, activates transcription of genes involved in maintenance of cell wall integrity; relocalizes to the cytosol in response to hypoxia -S000037745 CDS YOR113W 15 534075 536819 W 2011-02-03 1996-07-31 -S000005640 ORF Uncharacterized YOR114W chromosome 15 15 537570 538454 W 2011-02-03 1996-07-31 Putative protein of unknown function; null mutant is viable -S000037834 CDS YOR114W 15 537570 538454 W 2011-02-03 1996-07-31 -S000005641 ORF Verified YOR115C TRS33 chromosome 15 S000007434 15 539465 538659 C 2011-02-03 1996-07-31 Core component of TRAPP complexes I, II and IV; transport protein particle (TRAPP) complexes are related multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII, and IV); proposed subunit of a novel complex, TRAPPIV, that may function redundantly with TRAPPIII as a GEF that activates Ypt1 during autophagy -S000037875 CDS YOR115C 15 539465 538659 C 2011-02-03 1996-07-31 -S000005642 ORF Verified YOR116C RPO31 DNA-directed RNA polymerase III core subunit RPO31|C160|RPC160|RPC1 chromosome 15 L000001746|L000001694 15 544145 539763 C 59 2011-02-03 1996-07-31 RNA polymerase III largest subunit C160; part of core enzyme; similar to bacterial beta-prime subunit and to RPA190 and RPO21 -S000030813 CDS YOR116C 15 544145 539763 C 2011-02-03 1996-07-31 -S000005643 ORF Verified YOR117W RPT5 proteasome regulatory particle base subunit RPT5|YTA1 chromosome 15 L000002555 15 545029 546333 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; recruited to the GAL1-10 promoter region upon induction of transcription; similar to human TBP1 -S000030925 CDS YOR117W 15 545029 546333 W 2011-02-03 1996-07-31 -S000005644 ORF Verified YOR118W RTC5 chromosome 15 15 546857 548560 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; null mutation suppresses cdc13-1 temperature sensitivity -S000030998 CDS YOR118W 15 546857 548560 W 2011-02-03 1996-07-31 -S000005645 ORF Verified YOR119C RIO1 protein kinase RIO1|RRP10 chromosome 15 L000003989 15 550246 548792 C 2011-02-03 1996-07-31 Serine kinase involved in cell cycle regulation and rDNA integrity; associated with late pre-40S particles via its conserved C-terminal domain and participates in late 40S biogenesis; association with pre-40S particles regulated by its catalytic ATPase site and likely occurs after the release of Rio2p from these particles; involved in cell cycle progression and processing of the 20S pre-rRNA into mature 18S rRNA; phosphorylates Rpa43p in anaphase to remove Pol I from rDNA -S000031034 CDS YOR119C 15 550246 548792 C 2011-02-03 1996-07-31 -S000005646 ORF Verified YOR120W GCY1 glycerol 2-dehydrogenase (NADP(+)) GCY1|GCY chromosome 15 L000000694 15 551114 552052 W 2011-02-03 1996-07-31 Glycerol dehydrogenase; involved in an alternative pathway for glycerol catabolism used under microaerobic conditions; also has mRNA binding activity; member of the aldo-keto reductase (AKR) family; human homolog AKR1B1 can complement yeast null mutant; protein abundance increases in response to DNA replication stress; GCY1 has a paralog, YPR1, that arose from the whole genome duplication -S000033029 CDS YOR120W 15 551114 552052 W 2011-02-03 1996-07-31 -S000005647 ORF Dubious YOR121C chromosome 15 15 552103 551798 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene GCY1/YOR120W -S000033061 CDS YOR121C 15 552103 551798 C 2011-02-03 1996-07-31 -S000005648 ORF Verified YOR122C PFY1 profilin|CLS5|PRF1 chromosome 15 L000001407 15 552887 552298 C 64 2011-02-03 1996-07-31 Profilin; binds actin, phosphatidylinositol 4,5-bisphosphate, and polyproline regions; involved in cytoskeleton organization; required for normal timing of actin polymerization in response to thermal stress; protein abundance increases in response to DNA replication stress; highly conserved protein; human PFN1 (profilin 1) complements temperature sensitive pfy1 mutants, PFN1 mutations are a rare cause of ALS -S000033159 CDS YOR122C 15 552665 552298 C 2011-02-03 1996-07-31 -S000033158 CDS YOR122C 15 552887 552875 C 2011-02-03 1996-07-31 -S000033160 intron YOR122C 15 552874 552666 C 2011-02-03 1996-07-31 -S000005649 ORF Verified YOR123C LEO1 chromosome 15 L000000936 15 554570 553176 C 2011-02-03 1996-07-31 Component of the Paf1 complex; which associates with RNA polymerase II and is involved in histone methylation; plays a role in regulating Ty1 transposition; involved in transcription elongation as demonstrated by the G-less-based run-on (GLRO) assay -S000033954 CDS YOR123C 15 554570 553176 C 2011-02-03 1996-07-31 -S000005650 ORF Verified YOR124C UBP2 ubiquitin-specific protease UBP2 chromosome 15 L000002416 15 558642 554824 C 2011-02-03 1996-07-31 Ubiquitin-specific protease; removes ubiquitin from ubiquitinated proteins; controls K63 homeostasis during oxidative stress; deubiquitinates Rsp5p and is required for MVB sorting of membrane proteins; can cleave polyubiquitin and has isopeptidase activity -S000034064 CDS YOR124C 15 558642 554824 C 2011-02-03 1996-07-31 -S000005651 ORF Verified YOR125C CAT5 putative monooxygenase CAT5|COQ7 chromosome 15 L000000219 15 559731 559030 C 2011-02-03 2003-09-22|1996-07-31 Protein required for ubiquinone (Coenzyme Q) biosynthesis; localizes to the matrix face of the mitochondrial inner membrane in a large complex with ubiquinone biosynthetic enzymes; required for gluconeogenic gene activation -S000034156 CDS YOR125C 15 559731 559030 C 2011-02-03 2003-09-22|1996-07-31 -S000005652 ORF Verified YOR126C IAH1 isoamyl acetate-hydrolyzing esterase chromosome 15 L000003383 15 560677 559961 C 2011-02-03 1996-07-31 Isoamyl acetate-hydrolyzing esterase; required in balance with alcohol acetyltransferase to maintain optimal amounts of isoamyl acetate, which is particularly important in sake brewing -S000035099 CDS YOR126C 15 560677 559961 C 2011-02-03 1996-07-31 -S000005653 ORF Verified YOR127W RGA1 THE1|DBM1 chromosome 15 L000002626 15 561170 564193 W 2011-02-03 1996-07-31 GTPase-activating protein for polarity-establishment protein Cdc42p; implicated in control of septin organization, pheromone response, and haploid invasive growth; relocalizes from bud neck to cytoplasm upon DNA replication stress; RGA1 has a paralog, RGA2, that arose from the whole genome duplication -S000035296 CDS YOR127W 15 561170 564193 W 2011-02-03 1996-07-31 -S000005654 ORF Verified YOR128C ADE2 phosphoribosylaminoimidazole carboxylase ADE2 chromosome 15 L000000032 15 566191 564476 C 64 2011-02-03 1996-07-31 Phosphoribosylaminoimidazole carboxylase; catalyzes a step in the 'de novo' purine nucleotide biosynthetic pathway; red pigment accumulates in mutant cells deprived of adenine -S000035306 CDS YOR128C 15 566191 564476 C 2011-02-03 1996-07-31 -S000114843 ARS ARS1516 ARS1516 ARSXV-567|ADE2 ARS chromosome 15 15 566410 566643 2011-02-03 2006-04-12|2006-09-08 Autonomously Replicating Sequence -S000005655 ORF Verified YOR129C AFI1 chromosome 15 15 569558 566877 C 2011-02-03 1996-07-31 Arf3p polarization-specific docking factor; required for the polarized distribution of the ADP-ribosylation factor, Arf3p; participates in polarity development and maintenance of a normal haploid budding pattern; interacts with Cnm7p -S000035385 CDS YOR129C 15 569558 566877 C 2011-02-03 1996-07-31 -S000005656 ORF Verified YOR130C ORT1 ARG11 chromosome 15 L000003289 15 570807 569929 C 2011-02-03 1996-07-31|2011-02-03 Ornithine transporter of the mitochondrial inner membrane; exports ornithine from mitochondria as part of arginine biosynthesis; functionally complemented by human ortholog, SLC25A15, which is associated with hyperammonaemia-hyperornithinaemia-homocitrullinuria (HHH) syndrome, but HHH-associated variants fail to complement -S000031722 CDS YOR130C 15 570807 569929 C 2011-02-03 1996-07-31|2011-02-03 -S000006545 tRNA_gene tD(GUC)O chromosome 15 L000003710 15 571958 572029 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030425 noncoding_exon tD(GUC)O 15 571958 572029 W 2011-02-03 2000-05-19 -S000005657 ORF Verified YOR131C putative haloacid dehalogenase-like hydrolase chromosome 15 15 572838 572182 C 2011-02-03 1996-07-31 Putative haloacid dehalogenase-like hydrolase; non-essential gene; overexpression causes a cell cycle delay or arrest; protein abundance increases in response to DNA replication stress -S000031872 CDS YOR131C 15 572838 572182 C 2011-02-03 1996-07-31 -S000005658 ORF Verified YOR132W VPS17 retromer subunit VPS17|VPT3|PEP21 chromosome 15 L000002472|S000029642|L000002479 15 573175 574830 W 2011-02-03 1996-07-31 Subunit of the membrane-associated retromer complex; essential for endosome-to-Golgi retrograde protein transport; peripheral membrane protein that assembles onto the membrane with Vps5p to promote vesicle formation; required for recruiting the retromer complex to the endosome membranes -S000037422 CDS YOR132W 15 573175 574830 W 2011-02-03 1996-07-31 -S000005659 ORF Verified YOR133W EFT1 elongation factor 2 chromosome 15 L000000543 15 575098 577626 W 2011-02-03 1996-07-31 Elongation factor 2 (EF-2), also encoded by EFT2; catalyzes ribosomal translocation during protein synthesis; contains diphthamide, the unique posttranslationally modified histidine residue specifically ADP-ribosylated by diphtheria toxin; EFT1 has a paralog, EFT2, that arose from the whole genome duplication -S000037496 CDS YOR133W 15 575098 577626 W 2011-02-03 1996-07-31 -S000005660 ORF Verified YOR134W BAG7 chromosome 15 L000003395 15 578564 579793 W 2011-02-03 1996-07-31 Rho GTPase activating protein (RhoGAP); stimulates the intrinsic GTPase activity of Rho1p, which plays a bud growth by regulating actin cytoskeleton organization and cell wall biosynthesis, resulting in the downregulation of Rho1p; structurally and functionally related to Sac7p; BAG7 has a paralog, SAC7, that arose from the whole genome duplication -S000037586 CDS YOR134W 15 578564 579793 W 2011-02-03 1996-07-31 -S000005662 ORF Verified YOR136W IDH2 isocitrate dehydrogenase (NAD(+)) IDH2 chromosome 15 L000000850 15 580250 581359 W 2011-02-03 1996-07-31 Subunit of mitochondrial NAD(+)-dependent isocitrate dehydrogenase; complex catalyzes the oxidation of isocitrate to alpha-ketoglutarate in the TCA cycle; phosphorylated -S000030498 CDS YOR136W 15 580250 581359 W 2011-02-03 1996-07-31 -S000005661 ORF Dubious YOR135C IRC14 chromosome 15 15 580500 580159 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YOR136W; null mutant displays increased levels of spontaneous Rad52 foci -S000037633 CDS YOR135C 15 580500 580159 C 2011-02-03 1996-07-31 -S000005663 ORF Verified YOR137C SIA1 chromosome 15 15 583681 581813 C 2011-02-03 1996-07-31 Protein of unassigned function; involved in activation of the Pma1p plasma membrane H+-ATPase by glucose; contains peptide signal for membrane localization -S000030527 CDS YOR137C 15 583681 581813 C 2011-02-03 1996-07-31 -S000005664 ORF Verified YOR138C RUP1 chromosome 15 15 586324 584309 C 2011-02-03 1996-07-31 Protein that regulates ubiquitination of Rsp5p; has a WW domain consensus motif of PPPSY (residues 131-135) that mediates binding of Rsp5p to Ubp2p; contains an UBA domain; relative distribution to the nucleus increases upon DNA replication stress -S000030602 CDS YOR138C 15 586324 584309 C 2011-02-03 1996-07-31 -S000005666 ORF Verified YOR140W SFL1 chromosome 15 L000001869 15 586981 589281 W 2011-02-03 1996-07-31|2011-02-03 Transcriptional repressor and activator; involved in repression of flocculation-related genes, and activation of stress responsive genes; has direct role in INO1 transcriptional memory; negatively regulated by cAMP-dependent protein kinase A subunit Tpk2p; premature stop codon (C1430T, Q477-stop) in SK1 background is linked to the aggressively invasive phenotype of SK1 relative to BY4741 (S288C) -S000030239 CDS YOR140W 15 586981 589281 W 2011-02-03 1996-07-31|2011-02-03 -S000005665 ORF Dubious YOR139C chromosome 15 15 587342 586950 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SFL1/YOR140W -S000030683 CDS YOR139C 15 587342 586950 C 2011-02-03 1996-07-31 -S000005667 ORF Verified YOR141C ARP8 chromosome 15 L000003437 15 592587 589942 C 2011-02-03 1996-07-31 Nuclear actin-related protein involved in chromatin remodeling; component of chromatin-remodeling enzyme complexes; has mRNA binding activity -S000030308 CDS YOR141C 15 592587 589942 C 2011-02-03 1996-07-31 -S000005668 ORF Verified YOR142W LSC1 succinate--CoA ligase (GDP-forming) subunit alpha chromosome 15 L000004591 15 593057 594046 W 2011-02-03 1996-07-31 Alpha subunit of succinyl-CoA ligase; succinyl-CoA ligase is a mitochondrial enzyme of the TCA cycle that catalyzes the nucleotide-dependent conversion of succinyl-CoA to succinate; phosphorylated -S000033682 CDS YOR142W 15 593057 594046 W 2011-02-03 1996-07-31 -S000006573 tRNA_gene tG(CCC)O SUF5 chromosome 15 L000002153|L000003716 15 594425 594354 C 76 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000032361 noncoding_exon tG(CCC)O 15 594425 594354 C 2011-02-03 2000-05-19 -S000007169 long_terminal_repeat YORWdelta12 chromosome 15 15 594512 594819 W 2011-02-03 2000-05-19 Ty1 LTR -S000007170 long_terminal_repeat YORWdelta13 chromosome 15 15 594820 595151 W 2011-02-03 2000-05-19 Ty1 LTR -S000007182 LTR_retrotransposon YORWTy1-2 Ty1 chromosome 15 15 594820 600733 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007351 transposable_element_gene YOR142W-A gag protein chromosome 15 15 595112 596434 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000036110 CDS YOR142W-A 15 595112 596434 W 2011-02-03 1999-07-17 -S000007352 transposable_element_gene YOR142W-B gag-pol fusion protein chromosome 15 15 595112 600380 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000036113 CDS YOR142W-B 15 595112 596416 W 2011-02-03 1999-07-17 -S000036114 CDS YOR142W-B 15 596418 600380 W 2011-02-03 1999-07-17 -S000036115 plus_1_translational_frameshift YOR142W-B 15 596417 596417 W 2011-02-03 1999-07-17 -S000007171 long_terminal_repeat YORWdelta14 chromosome 15 15 600402 600733 W 2011-02-03 2000-05-19 Ty1 LTR -S000007643 ARS ARS1502 ARS1517 chromosome 15 15 600886 600960 2011-02-03 2001-03-06 Autonomously Replicating Sequence -S000005669 ORF Verified YOR143C THI80 thiamine diphosphokinase chromosome 15 L000002297 15 602342 601383 C 2011-02-03 1996-07-31 Thiamine pyrophosphokinase; phosphorylates thiamine to produce the coenzyme thiamine pyrophosphate (thiamine diphosphate) -S000033738 CDS YOR143C 15 602342 601383 C 2011-02-03 1996-07-31 -S000005670 ORF Verified YOR144C ELG1 RTT110 chromosome 15 S000007438 15 605092 602717 C 2011-02-03 1996-07-31 Subunit of an alternative replication factor C complex; important for DNA replication and genome integrity; suppresses spontaneous DNA damage; involved in homologous recombination-mediated repair and telomere homeostasis; required for PCNA (Pol30p) unloading during DNA replication -S000033871 CDS YOR144C 15 605092 602717 C 2011-02-03 1996-07-31 -S000005672 ORF Dubious YOR146W chromosome 15 15 605873 606178 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene PNO1/YOR145C -S000034948 CDS YOR146W 15 605873 606178 W 2011-02-03 1996-07-31 -S000005671 ORF Verified YOR145C PNO1 RRP20|DIM2 chromosome 15 15 606171 605347 C 2011-02-03 1996-07-31 Essential nucleolar protein required for pre-18S rRNA processing; interacts with Dim1p, an 18S rRNA dimethyltransferase, and also with Nob1p, which is involved in proteasome biogenesis; contains a KH domain -S000033985 CDS YOR145C 15 606171 605347 C 2011-02-03 1996-07-31 -S000005673 ORF Verified YOR147W MDM32 chromosome 15 15 606607 608475 W 2011-02-03 1996-07-31|2005-11-30 Mitochondrial inner membrane protein with similarity to Mdm31p; required for normal mitochondrial morphology and inheritance; interacts genetically with MMM1, MDM10, MDM12, and MDM34; variation between SK1 and S288C at residues 182 and 262 impacts invasive growth and mitochondrial network structure -S000035083 CDS YOR147W 15 606607 608475 W 2011-02-03 1996-07-31|2005-11-30 -S000005674 ORF Verified YOR148C SPP2 chromosome 15 L000002631 15 609197 608640 C 2011-02-03 1996-07-31 Essential protein that promotes the first step of splicing; required for the final stages of spliceosome maturation and activation; interacts with Prp2p, which may release Spp2p from the spliceosome following the first cleavage reaction; stimulates Prp2p ATPase activity -S000035131 CDS YOR148C 15 609197 608640 C 2011-02-03 1996-07-31 -S000005675 ORF Verified YOR149C SMP3 glycosylphosphatidylinositol-alpha 1,2 mannosyltransferase|SAP2|LAS2 chromosome 15 L000001935 15 611388 609838 C 2011-02-03 1996-07-31|2011-02-03 Alpha 1,2-mannosyltransferase; involved in glycosyl phosphatidyl inositol (GPI) biosynthesis; required for addition of the fourth, side branching mannose to the GPI core structure -S000036016 CDS YOR149C 15 611388 609838 C 2011-02-03 1996-07-31|2011-02-03 -S000005676 ORF Verified YOR150W MRPL23 mitochondrial 54S ribosomal protein YmL23|YmL23 chromosome 15 15 611999 612490 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; localizes to vacuole in response to H2O2 -S000034760 CDS YOR150W 15 611999 612490 W 2011-02-03 1996-07-31 -S000130136 ARS ARS1518 ARSXV-618 chromosome 15 15 616670 617517 2011-02-03 2009-05-05 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000005677 ORF Verified YOR151C RPB2 DNA-directed RNA polymerase II core subunit RPB2|B150|SOH2|SIT2|RPO22|RPB150 chromosome 15 L000001588|L000001676 15 616671 612997 C 80 2011-02-03 1996-07-31 RNA polymerase II second largest subunit B150; part of central core; similar to bacterial beta subunit -S000035654 CDS YOR151C 15 616671 612997 C 2011-02-03 1996-07-31 -S000005678 ORF Verified YOR152C ATG40 chromosome 15 15 618288 617518 C 2011-02-03 1996-07-31 Autophagy receptor with a role in endoplasmic reticulum degradation; involved specifically in autophagy of cortical and cytoplasmic ER in response to nitrogen starvation or rapamycin treatment; localizes to the cortical and cytoplasmic ER; similar to human FAM134B, which is also involved in ER autophagy and is associated with sensory neuropathy -S000035770 CDS YOR152C 15 618288 617518 C 2011-02-03 1996-07-31 -S000005679 ORF Verified YOR153W PDR5 ATP-binding cassette multidrug transporter PDR5|STS1|YDR1|LEM1 chromosome 15 L000001365|L000002136|L000002504 15 619840 624375 W 85 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; multidrug transporter actively regulated by Pdr1p; also involved in steroid transport, cation resistance, and cellular detoxification during exponential growth; PDR5 has a paralog, PDR15, that arose from the whole genome duplication -S000035997 CDS YOR153W 15 619840 624375 W 2011-02-03 1996-07-31 -S000005680 ORF Verified YOR154W SLP1 chromosome 15 15 624729 626492 W 2011-02-03 1996-07-31 Glycosylated integral ER membrane protein of unknown function; forms an ER-membrane associated protein complex with Emp65p; member of the SUN-like family of proteins; genetic interactions suggest a role in folding of ER membrane proteins; required for nuclear envelope localization of Mps3p -S000037835 CDS YOR154W 15 624729 626492 W 2011-02-03 1996-07-31 -S000005681 ORF Verified YOR155C ISN1 IMP 5'-nucleotidase chromosome 15 15 627980 626628 C 2011-02-03 1996-07-31 Inosine 5'-monophosphate (IMP)-specific 5'-nucleotidase; catalyzes the breakdown of IMP to inosine; responsible for production of nicotinamide riboside and nicotinic acid riboside; expression positively regulated by nicotinic acid and glucose availability; does not show similarity to known 5'-nucleotidases from other organisms -S000037874 CDS YOR155C 15 627980 626628 C 2011-02-03 1996-07-31 -S000005682 ORF Verified YOR156C NFI1 SUMO ligase NFI1|SIZ2 chromosome 15 L000002966 15 630540 628360 C 2011-02-03 1996-07-31 SUMO E3 ligase; catalyzes sumoylation of Yku70p/80p and Sir4p promoting telomere anchoring to the nuclear envelope and regulating telomerase activity; DNA-bound form catalyzes a DNA-damaged triggered sumoylation wave resulting in multisite modification of several DNA repair proteins, enhancing interactions between these proteins and accelerating repair; sumoylates Cse4p, a prerequisite for STUbL-mediated Ub-dependent degradation; role in telomere length maintenance -S000029894 CDS YOR156C 15 630540 628360 C 2011-02-03 1996-07-31 -S000005683 ORF Verified YOR157C PUP1 proteasome core particle subunit beta 2 chromosome 15 L000001530 15 631751 630966 C 84.6 2011-02-03 1996-07-31 Beta 2 subunit of the 20S proteasome; endopeptidase with trypsin-like activity that cleaves after basic residues; synthesized as a proprotein before being proteolytically processed for assembly into 20S particle; human homolog is subunit Z -S000029992 CDS YOR157C 15 631751 630966 C 2011-02-03 1996-07-31 -S000005684 ORF Verified YOR158W PET123 mitochondrial 37S ribosomal protein PET123 chromosome 15 L000001398 15 632164 633120 W 84.2 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; PET123 exhibits genetic interactions with PET122, which encodes a COX3 mRNA-specific translational activator -S000031031 CDS YOR158W 15 632164 633120 W 2011-02-03 1996-07-31 -S000005685 ORF Verified YOR159C SME1 mRNA splicing protein SME1|Sm E|SmE chromosome 15 L000004252 15 633566 633282 C 2011-02-03 1996-07-31 Core Sm protein Sm E; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Smd3p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm E -S000031069 CDS YOR159C 15 633566 633282 C 2011-02-03 1996-07-31 -S000005686 ORF Verified YOR160W MTR10 KAP111 chromosome 15 L000003296 15 633839 636757 W 2011-02-03 1996-07-31 Nuclear import receptor; mediates the nuclear localization of proteins involved in mRNA-nucleus export; promotes dissociation of mRNAs from the nucleus-cytoplasm mRNA shuttling protein Npl3p; required for retrograde import of mature tRNAs; relocalizes from cytoplasm to the nuclear periphery upon DNA replication stress -S000030698 CDS YOR160W 15 633839 636757 W 2011-02-03 1996-07-31 -S000028713 ORF Dubious YOR161W-A chromosome 15 15 637574 637654 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032680 CDS YOR161W-A 15 637574 637654 W 2011-02-03 2003-07-29 -S000028714 ORF Dubious YOR161W-B chromosome 15 15 637975 638235 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032682 CDS YOR161W-B 15 637975 638235 W 2011-02-03 2003-07-29 -S000005687 ORF Verified YOR161C PNS1 chromosome 15 15 638558 636939 C 2011-02-03 1996-07-31 Protein of unknown function; has similarity to Torpedo californica tCTL1p, which is postulated to be a choline transporter, neither null mutation nor overexpression affects choline transport -S000030748 CDS YOR161C 15 638558 636939 C 2011-02-03 1996-07-31 -S000028712 ORF Uncharacterized YOR161C-C chromosome 15 15 639267 639121 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032678 CDS YOR161C-C 15 639267 639121 C 2011-02-03 2003-07-29 -S000005688 ORF Verified YOR162C YRR1 PDR2 chromosome 15 L000004200|S000029349|L000001362 15 641992 639560 C 89 2011-02-03 1996-07-31 Zn2-Cys6 zinc-finger transcription factor; activates genes involved in multidrug resistance; paralog of Yrm1p, acting on an overlapping set of target genes; YRR1 has a paralog, PDR8, that arose from the whole genome duplication -S000030856 CDS YOR162C 15 641992 639560 C 2011-02-03 1996-07-31 -S000005689 ORF Verified YOR163W DDP1 polyphosphatase DDP1 chromosome 15 S000007498 15 642741 643307 W 2011-02-03 1996-07-31 Polyphosphate phosphatase; hydrolyzes diphosphorylated inositol polyphosphates and diadenosine polyphosphates; high specificity for diadenosine hexa- and pentaphosphates; contains endopolyphosphatase activity with a high affinity for polyphosphates, an activity also observed for its human DIPP homologs; possesses mRNA decapping activity; nudix hydrolase family member; protein abundance increases in response to DNA replication stress -S000031902 CDS YOR163W 15 642741 643307 W 2011-02-03 1996-07-31 -S000005690 ORF Verified YOR164C GET4 ENV8 chromosome 15 15 644332 643394 C 2011-02-03 1996-07-31 Protein involved in inserting tail-anchored proteins into ER membranes; forms a complex with Mdy2p; highly conserved across species and homologous to human gene C7orf20 -S000031981 CDS YOR164C 15 644332 643394 C 2011-02-03 1996-07-31 -S000005691 ORF Verified YOR165W SEY1 dynamin-like GTPase SEY1 chromosome 15 15 644566 646896 W 2011-02-03 1996-07-31 Dynamin-like GTPase that mediates homotypic ER fusion; has a role in ER morphology; interacts physically and genetically with Yop1p and Rtn1p; functional ortholog of the human atlastin ATL1, defects in which cause a form of the human disease hereditary spastic paraplegia; homolog of Arabidopsis RHD3 -S000034063 CDS YOR165W 15 644566 646896 W 2011-02-03 1996-07-31 -S000005692 ORF Verified YOR166C SWT1 mRNA-processing endoribonuclease chromosome 15 15 648502 647126 C 2011-02-03 1996-07-31 RNA endoribonuclease involved in perinuclear mRNP quality control; involved in perinuclear mRNP quality control via the turnover of aberrant, unprocessed pre-mRNAs; interacts with subunits of THO/TREX, TREX-2, and RNA polymerase II; contains a PIN (PilT N terminus) domain -S000034075 CDS YOR166C 15 648502 647126 C 2011-02-03 1996-07-31 -S000005693 ORF Verified YOR167C RPS28A eS28|ribosomal 40S subunit protein S28A|S28e|YS27|S33A|S28A|RPS33A chromosome 15 L000001767 15 649007 648804 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; has an extraribosomal function in regulation of RPS28B, in which Rps28Ap binds to a decapping complex via Edc3p, which then binds to RPS28B mRNA leading to its decapping and degradation; homologous to mammalian ribosomal protein S28, no bacterial homolog; RPS28A has a paralog, RPS28B, that arose from the whole genome duplication -S000034207 CDS YOR167C 15 649007 648804 C 2011-02-03 1996-07-31 -S000005694 ORF Verified YOR168W GLN4 glutamine--tRNA ligase chromosome 15 L000000711 15 649303 651732 W 88 2011-02-03 1996-07-31 Glutamine tRNA synthetase; monomeric class I tRNA synthetase that catalyzes the specific glutaminylation of tRNA(Gln); N-terminal domain proposed to be involved in enzyme-tRNA interactions -S000034317 CDS YOR168W 15 649303 651732 W 2011-02-03 1996-07-31 -S000005695 ORF Dubious YOR169C chromosome 15 15 651840 651376 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene GLN4/YOR168W -S000034343 CDS YOR169C 15 651840 651376 C 2011-02-03 1996-07-31 -S000005696 ORF Dubious YOR170W chromosome 15 15 651858 652163 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene LCB4 -S000033855 CDS YOR170W 15 651858 652163 W 2011-02-03 1996-07-31 -S000005697 ORF Verified YOR171C LCB4 sphinganine kinase LCB4 chromosome 15 L000004328 15 653884 652010 C 2011-02-03 1996-07-31 Sphingoid long-chain base kinase; responsible for synthesis of long-chain base phosphates, which function as signaling molecules, regulates synthesis of ceramide from exogenous long-chain bases, localizes to the Golgi and late endosomes; LCB4 has a paralog, LCB5, that arose from the whole genome duplication -S000033881 CDS YOR171C 15 653884 652010 C 2011-02-03 1996-07-31 -S000005698 ORF Verified YOR172W YRM1 chromosome 15 15 654210 656570 W 2011-02-03 1996-07-31 Zinc finger transcription factor involved in multidrug resistance; Zn(2)-Cys(6) zinc finger transcription factor; activates genes involved in multidrug resistance; paralog of Yrr1p, acting on an overlapping set of target genes -S000034873 CDS YOR172W 15 654210 656570 W 2011-02-03 1996-07-31 -S000118490 ARS ARS1519 ARSXV-657 chromosome 15 15 656701 656772 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000005699 ORF Verified YOR173W DCS2 5'-(N(7)-methyl 5'-triphosphoguanosine)-(mRNA) diphosphatase chromosome 15 15 657264 658325 W 2011-02-03 1996-07-31|2006-10-05 m(7)GpppX pyrophosphatase regulator; non-essential, stress induced regulatory protein; modulates m7G-oligoribonucleotide metabolism; inhibits Dcs1p; regulated by Msn2p, Msn4p, and the Ras-cAMP-cAPK signaling pathway; mutant has increased aneuploidy tolerance; DCS2 has a paralog, DCS1, that arose from the whole genome duplication -S000035026 CDS YOR173W 15 657264 658325 W 2011-02-03 1996-07-31|2006-10-05 -S000005700 ORF Verified YOR174W MED4 chromosome 15 L000003915 15 658747 659601 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation -S000035222 CDS YOR174W 15 658747 659601 W 2011-02-03 1996-07-31 -S000005701 ORF Verified YOR175C ALE1 lysophospholipid acyltransferase|LCA1|LPT1|SLC4 chromosome 15 15 661674 659815 C 2011-02-03 1996-07-31 Broad-specificity lysophospholipid acyltransferase; part of MBOAT family of membrane-bound O-acyltransferases; key component of Lands cycle; may have role in fatty acid exchange at sn-2 position of mature glycerophospholipids -S000035274 CDS YOR175C 15 661674 659815 C 2011-02-03 1996-07-31 -S000005702 ORF Verified YOR176W HEM15 ferrochelatase HEM15 chromosome 15 L000000766 15 662401 663582 W 2011-02-03 1996-07-31 Ferrochelatase; a mitochondrial inner membrane protein, catalyzes insertion of ferrous iron into protoporphyrin IX, the eighth and final step in the heme biosynthetic pathway; human homolog FECH can complement yeast mutant and allow growth of haploid null after sporulation of a heterozygous diploid -S000036250 CDS YOR176W 15 662401 663582 W 2011-02-03 1996-07-31 -S000006766 tRNA_gene tV(AAC)O chromosome 15 L000003715 15 663885 663812 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000032969 noncoding_exon tV(AAC)O 15 663885 663812 C 2011-02-03 2000-05-19 -S000007163 long_terminal_repeat YORCdelta15 chromosome 15 15 664324 664003 C 2011-02-03 2000-05-19 Ty1 LTR -S000007172 long_terminal_repeat YORWdelta16 chromosome 15 15 664325 664469 W 2011-02-03 2000-05-19 Ty1 LTR -S000007173 long_terminal_repeat YORWdelta17 chromosome 15 15 664813 665145 W 2011-02-03 2000-05-19 Ty2 LTR -S000005703 ORF Verified YOR177C MPC54 chromosome 15 15 667179 665785 C 2011-02-03 1996-07-31 Component of the meiotic outer plaque; a membrane-organizing center which is assembled on the cytoplasmic face of the spindle pole body during meiosis II and triggers the formation of the prospore membrane; potential Cdc28p substrate -S000036281 CDS YOR177C 15 667179 665785 C 2011-02-03 1996-07-31 -S000005704 ORF Verified YOR178C GAC1 protein phosphatase regulator GAC1 chromosome 15 L000000657 15 670241 667860 C 113 2011-02-03 1996-07-31 Regulatory subunit for Glc7p type-1 protein phosphatase (PP1); tethers Glc7p to Gsy2p glycogen synthase, binds Hsf1p heat shock transcription factor, required for induction of some HSF-regulated genes under heat shock; GAC1 has a paralog, PIG1, that arose from the whole genome duplication -S000036360 CDS YOR178C 15 670241 667860 C 2011-02-03 1996-07-31 -S000005705 ORF Verified YOR179C SYC1 cleavage polyadenylation factor subunit SYC1 chromosome 15 15 672411 671845 C 2011-02-03 1996-07-31 Subunit of the APT subcomplex of cleavage and polyadenylation factor; may have a role in 3' end formation of both polyadenylated and non-polyadenylated RNAs; SYC1 has a paralog, YSH1, that arose from the whole genome duplication -S000030078 CDS YOR179C 15 672411 671845 C 2011-02-03 1996-07-31 -S000005706 ORF Verified YOR180C DCI1 putative dodecenoyl-CoA isomerase DCI1|ECI2 chromosome 15 L000004175 15 675167 674352 C 2011-02-03 1996-07-31 Peroxisomal protein; identification as a delta(3,5)-delta(2,4)-dienoyl-CoA isomerase involved in fatty acid metabolism is disputed; DCI1 has a paralog, ECI1, that arose from the whole genome duplication -S000037854 CDS YOR180C 15 675167 674352 C 2011-02-03 1996-07-31 -S000005707 ORF Verified YOR181W LAS17 actin-binding protein LAS17|BEE1 chromosome 15 L000003068|L000003581 15 675939 677840 W 2011-02-03 1996-07-31 Actin assembly factor; C-terminal WCA domain activates Arp2/3 complex-mediated nucleation of branched actin filaments, polyproline domain nucleates actin filaments independent of Arp2/3; mutants are defective in endocytosis, bud site selection, cytokinesis; human homolog WAS (Wiskott-Aldrich Syndrome) implicated in severe immunodeficiency; human WAS complements yeast null mutant, but only in presence of WIPF1, which mediates localization of WAS to cortical patches -S000029943 CDS YOR181W 15 675939 677840 W 2011-02-03 1996-07-31 -S000005708 ORF Verified YOR182C RPS30B eS30|ribosomal 40S subunit protein S30B|S30e|S30B chromosome 15 L000003497 15 678793 678191 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S30, no bacterial homolog; RPS30B has a paralog, RPS30A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000030004 CDS YOR182C 15 678379 678191 C 2011-02-03 1996-07-31 -S000030003 CDS YOR182C 15 678793 678791 C 2011-02-03 1996-07-31 -S000030005 intron YOR182C 15 678790 678380 C 2011-02-03 1996-07-31 -S000005709 ORF Uncharacterized YOR183W FYV12 chromosome 15 15 678872 679261 W 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin -S000031055 CDS YOR183W 15 678872 679261 W 2011-02-03 1996-07-31 -S000005710 ORF Verified YOR184W SER1 O-phospho-L-serine:2-oxoglutarate transaminase|ADE9 chromosome 15 L000001865 15 679357 680544 W 98.2 2011-02-03 1996-07-31 3-phosphoserine aminotransferase; catalyzes the formation of phosphoserine from 3-phosphohydroxypyruvate, required for serine and glycine biosynthesis; regulated by the general control of amino acid biosynthesis mediated by Gcn4p; protein abundance increases in response to DNA replication stress -S000031176 CDS YOR184W 15 679357 680544 W 2011-02-03 1996-07-31 -S000007300 snoRNA_gene snR36 SNR36 chromosome 15 L000001974 15 680866 680685 C 2011-02-03 2000-05-19|2007-05-10 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at position U1187 -S000036766 noncoding_exon snR36 15 680866 680685 C 2011-02-03 2000-05-19|2007-05-10 -S000005711 ORF Verified YOR185C GSP2 Ran GTPase GSP2|CNR2 chromosome 15 L000000737 15 682106 681444 C 98.6 2011-02-03 1996-07-31 GTP binding protein (mammalian Ranp homolog); involved in the maintenance of nuclear organization, RNA processing and transport; interacts with Kap121p, Kap123p and Pdr6p (karyophilin betas); not required for viability; protein abundance increases in response to DNA replication stress; GSP2 has a paralog, GSP1, that arose from the whole genome duplication -S000031246 CDS YOR185C 15 682106 681444 C 2011-02-03 1996-07-31 -S000005712 ORF Uncharacterized YOR186W chromosome 15 15 683111 683545 W 2011-02-03 1996-07-31 Putative protein of unknown function; proper regulation of expression during heat stress is sphingolipid-dependent; mCherry fusion protein localizes to the vacuole; YOR186W has a paralog, YLR297W, that arose from the whole genome duplication -S000032297 CDS YOR186W 15 683111 683545 W 2011-02-03 1996-07-31 -S000028715 ORF Dubious YOR186C-A chromosome 15 15 683538 683329 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032684 CDS YOR186C-A 15 683538 683329 C 2011-02-03 2003-07-29 -S000005713 ORF Verified YOR187W TUF1 translation elongation factor Tu|tufM chromosome 15 L000002390 15 684030 685343 W 2011-02-03 1996-07-31 Mitochondrial translation elongation factor Tu (EF-Tu); involved in fundamental pathway of mtDNA homeostasis; comprises both GTPase and guanine nucleotide exchange factor activities, while these activities are found in separate proteins in S. pombe and humans; rare mutations in human mitochondrial elongation factor Tu (EFTu) associated with severe lactic acidosis, rapidly progressive fatal encephalopathy, severe infantile macrocystic leukodystrophy with micropolygyria -S000032398 CDS YOR187W 15 684030 685343 W 2011-02-03 1996-07-31 -S000005714 ORF Verified YOR188W MSB1 chromosome 15 L000001184 15 685767 689180 W 103 2011-02-03 1996-07-31 Protein of unknown function; may be involved in positive regulation of 1,3-beta-glucan synthesis and the Pkc1p-MAPK pathway; multicopy suppressor of temperature-sensitive mutations in CDC24 and CDC42, and of mutations in BEM4; potential Cdc28p substrate; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000032501 CDS YOR188W 15 685767 689180 W 2011-02-03 1996-07-31 -S000005715 ORF Verified YOR189W IES4 chromosome 15 15 689624 689974 W 2011-02-03 1996-07-31 Component of the INO80 chromatiin remodeling complex; target of the Mec1p/Tel1p DNA damage signaling pathway; proposed to link chromatin remodeling to replication checkpoint responses -S000034540 CDS YOR189W 15 689624 689974 W 2011-02-03 1996-07-31 -S000005716 ORF Verified YOR190W SPR1 glucan 1,3-beta-glucosidase|SSG1 chromosome 15 L000002020|L000002083 15 690695 692032 W 2011-02-03 1996-07-31 Sporulation-specific exo-1,3-beta-glucanase; contributes to ascospore thermoresistance; SPR1 has a paralog, EXG1, that arose from the whole genome duplication -S000033255 CDS YOR190W 15 690695 692032 W 2011-02-03 1996-07-31 -S000005717 ORF Verified YOR191W ULS1 translocase ULS1|RIS1|TID4|DIS1 chromosome 15 L000004381 15 692475 697334 W 2011-02-03 1996-07-31 Swi2/Snf2-related translocase, SUMO-Targeted Ubiquitin Ligase (STUbL); required for maintenance of NHEJ inhibition at telomeres; functions at telomeres to translocate and ubiquitinylate poly-sumoylated Rap1p for proteosomal degradation; plays role in antagonizing silencing during mating-type switching; only known STUbL with a translocase activity; contains RING finger domain; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000033303 CDS YOR191W 15 692475 697334 W 2011-02-03 1996-07-31 -S000005718 ORF Verified YOR192C THI72 thiamine transporter chromosome 15 15 700567 698768 C 2011-02-03 1996-07-31 Transporter of thiamine or related compound; contributes to uptake of 5-aminoimidazole-4-carboxamide-1-beta-D-ribofuranoside (acadesine); shares sequence similarity with Thi7p -S000034124 CDS YOR192C 15 700567 698768 C 2011-02-03 1996-07-31 -S000007164 long_terminal_repeat YORCdelta18 chromosome 15 15 703582 703429 C 2011-02-03 2000-05-19 Ty1 LTR -S000007174 long_terminal_repeat YORWdelta19 chromosome 15 15 703612 703762 W 2011-02-03 2000-05-19 Ty1 LTR -S000007180 long_terminal_repeat YORWtau2 chromosome 15 15 703772 704062 W 2011-02-03 2000-05-19 Ty4 LTR -S000028857 ORF Uncharacterized YOR192C-C chromosome 15 15 704224 703988 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034570 CDS YOR192C-C 15 704224 703988 C 2011-02-03 2003-07-29 -S000007165 long_terminal_repeat YORCdelta20 chromosome 15 15 704395 704063 C 2011-02-03 2000-05-19 Ty2 LTR -S000007354 transposable_element_gene YOR192C-B gag-pol fusion protein chromosome 15 S000029019 15 709732 704419 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034414 CDS YOR192C-B 15 708438 704419 C 2011-02-03 1999-07-17 -S000034413 CDS YOR192C-B 15 709732 708440 C 2011-02-03 1999-07-17 -S000034415 plus_1_translational_frameshift YOR192C-B 15 708439 708439 C 2011-02-03 1999-07-17 -S000007353 transposable_element_gene YOR192C-A gag protein chromosome 15 15 709732 708416 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034406 CDS YOR192C-A 15 709732 708416 C 2011-02-03 1999-07-17 -S000007168 LTR_retrotransposon YORCTy2-1 Ty2 chromosome 15 15 710023 704063 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007166 long_terminal_repeat YORCdelta21 chromosome 15 15 710023 709691 C 2011-02-03 2000-05-19 Ty2 LTR -S000007181 long_terminal_repeat YORWtau3 chromosome 15 15 710024 710107 W 2011-02-03 2000-05-19 Ty4 LTR -S000006665 tRNA_gene tM(CAU)O1 IMT1 chromosome 15 L000003711 15 710201 710272 W 2011-02-03 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation -S000032163 noncoding_exon tM(CAU)O1 15 710201 710272 W 2011-02-03 2000-05-19 -S000005719 ORF Verified YOR193W PEX27 chromosome 15 15 710446 711576 W 2011-02-03 1996-07-31 Peripheral peroxisomal membrane protein; involved in controlling peroxisome size and number, interacts with Pex25p; PEX27 has a paralog, PEX25, that arose from the whole genome duplication -S000034339 CDS YOR193W 15 710446 711576 W 2011-02-03 1996-07-31 -S000005720 ORF Verified YOR194C TOA1 transcription initiation factor IIA large subunit chromosome 15 L000002316 15 712543 711683 C 2011-02-03 1996-07-31 TFIIA large subunit; involved in transcriptional activation, acts as antirepressor or as coactivator; required, along with Toa2p, for ribosomal protein gene transcription in vivo; homologous to largest and second largest subunits of human and Drosophila TFIIA -S000034366 CDS YOR194C 15 712543 711683 C 2011-02-03 1996-07-31 -S000005721 ORF Verified YOR195W SLK19 chromosome 15 L000004340 15 712866 715331 W 2011-02-03 1996-07-31 Kinetochore-associated protein; required for chromosome segregation and kinetochore clustering; required for normal segregation of chromosomes in meiosis and mitosis; component of the FEAR regulatory network, which promotes Cdc14p release from the nucleolus during anaphase; potential Cdc28p substrate -S000035480 CDS YOR195W 15 712866 715331 W 2011-02-03 1996-07-31 -S000005722 ORF Verified YOR196C LIP5 putative lipoate synthase chromosome 15 L000002613 15 716837 715593 C 2011-02-03 1996-07-31 Protein involved in biosynthesis of the coenzyme lipoic acid; has similarity to E. coli lipoic acid synthase -S000035507 CDS YOR196C 15 716837 715593 C 2011-02-03 1996-07-31 -S000005723 ORF Verified YOR197W MCA1 Ca(2+)-dependent cysteine protease MCA1|YCA1 chromosome 15 15 717086 718384 W 2011-02-03 1996-07-31|2006-05-11 Ca2+-dependent cysteine protease; may cleave specific substrates during the stress response; regulates apoptosis upon H2O2 treatment; required for clearance of insoluble protein aggregates during normal growth; implicated in cell cycle dynamics and lifespan extension; undergoes autocatalytic processing; similar to mammalian metacaspases, but exists as a monomer due to an extra pair of anti-parallel beta-strands that block potential dimerization -S000035631 CDS YOR197W 15 717086 718384 W 2011-02-03 1996-07-31|2006-05-11 -S000005724 ORF Verified YOR198C BFR1 chromosome 15 L000000174 15 720065 718653 C 2011-02-03 1996-07-31 Component of mRNP complexes associated with polyribosomes; involved in localization of mRNAs to P bodies; implicated in secretion and nuclear segregation; multicopy suppressor of BFA (Brefeldin A) sensitivity -S000036502 CDS YOR198C 15 720065 718653 C 2011-02-03 1996-07-31 -S000005725 ORF Dubious YOR199W chromosome 15 15 720181 720510 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036654 CDS YOR199W 15 720181 720510 W 2011-02-03 1996-07-31 -S000005726 ORF Dubious YOR200W chromosome 15 15 720417 720815 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MRM1/YOR201c -S000036053 CDS YOR200W 15 720417 720815 W 2011-02-03 1996-07-31 -S000005727 ORF Verified YOR201C MRM1 PET56 chromosome 15 L000001392 15 721708 720470 C 112 2011-02-03 1996-07-31 Ribose methyltransferase; modifies a functionally critical, conserved nucleotide in mitochondrial 21S rRNA -S000036099 CDS YOR201C 15 721708 720470 C 2011-02-03 1996-07-31 -S000005728 ORF Verified YOR202W HIS3 imidazoleglycerol-phosphate dehydratase HIS3|HIS8|HIS10 chromosome 15 L000000780|S000029212|L000000785 15 721946 722608 W 112 2011-02-03 1996-07-31 Imidazoleglycerol-phosphate dehydratase; catalyzes the sixth step in histidine biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts; transcription is regulated by general amino acid control via Gcn4p -S000029880 CDS YOR202W 15 721946 722608 W 2011-02-03 1996-07-31 -S000005729 ORF Dubious YOR203W chromosome 15 15 722565 722918 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of essential DED1 gene required for translation initiation -S000031781 CDS YOR203W 15 722565 722918 W 2011-02-03 1996-07-31 -S000005730 ORF Verified YOR204W DED1 DEAD-box ATP-dependent RNA helicase DED1|SPP81 chromosome 15 L000000500 15 722911 724725 W 114 2011-02-03 1996-07-31 ATP-dependent DEAD (Asp-Glu-Ala-Asp)-box RNA helicase; required for translation initiation of all yeast mRNAs; binds to mRNA cap-associated factors, and binding stimulates Ded1p RNA-dependent ATPase activity; mutation in human homolog DBY is associated with male infertility; human homolog DDX3X complements ded1 null mutation; DED1 has a paralog, DBP1, that arose from the whole genome duplication -S000031924 CDS YOR204W 15 722911 724725 W 2011-02-03 1996-07-31 -S000005731 ORF Verified YOR205C GEP3 MTG3|AIM40|LRC5|FMP38 chromosome 15 15 727234 725564 C 2011-02-03 1996-07-31 Protein required for mitochondrial ribosome small subunit biogenesis; null mutant is defective in respiration and in maturation of 15S rRNA; protein is localized to the mitochondrial inner membrane; null mutant interacts synthetically with prohibitin (Phb1p) -S000031991 CDS YOR205C 15 727234 725564 C 2011-02-03 1996-07-31 -S000005732 ORF Verified YOR206W NOC2 mRNA-binding ribosome synthesis protein NOC2 chromosome 15 15 727512 729644 W 2011-02-03 1996-07-31 Protein involved in ribosome biogenesis; forms a nucleolar complex with Mak21p that binds to 90S and 66S pre-ribosomes; forms a nuclear complex with Noc3p that binds to 66S pre-ribosomes; both complexes mediate intranuclear transport of ribosomal precursors; acts as part of a Mak21p-Noc2p-Rrp5p module that associates with nascent pre-rRNA during transcription and has a role in bigenesis of the large ribosomal subunit -S000037497 CDS YOR206W 15 727512 729644 W 2011-02-03 1996-07-31 -S000118491 ARS ARS1521 ARSXV-730 chromosome 15 15 729740 729969 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178185 ARS_consensus_sequence ARS1521 15 729795 729811 W 2014-11-18 2014-11-18 -S000005733 ORF Verified YOR207C RET1 DNA-directed RNA polymerase III core subunit RET1|C128|RPC128|RPC2|PDS2 chromosome 15 L000001614 15 733457 730008 C 117 2011-02-03 1996-07-31 Second-largest subunit of RNA polymerase III; RNA polymerase III is responsible for the transcription of tRNA and 5S RNA genes, and other low molecular weight RNAs -S000037554 CDS YOR207C 15 733457 730008 C 2011-02-03 1996-07-31 -S000005734 ORF Verified YOR208W PTP2 tyrosine protein phosphatase PTP2 chromosome 15 L000001526 15 733925 736177 W 2011-02-03 1996-07-31 Nuclear phosphotyrosine-specific phosphatase involved in osmosensing; involved in the inactivation of mitogen-activated protein kinase (MAPK) during osmolarity sensing; dephosporylates Hog1p MAPK and regulates its localization; with Msg5p co-regulates the calcium signaling pathway -S000037667 CDS YOR208W 15 733925 736177 W 2011-02-03 1996-07-31 -S000005735 ORF Verified YOR209C NPT1 nicotinate phosphoribosyltransferase chromosome 15 L000001275 15 737726 736437 C 2011-02-03 1996-07-31 Nicotinate phosphoribosyltransferase; acts in the salvage pathway of NAD+ biosynthesis; required for silencing at rDNA and telomeres and has a role in silencing at mating-type loci; localized to the nucleus -S000030426 CDS YOR209C 15 737726 736437 C 2011-02-03 1996-07-31 -S000005736 ORF Verified YOR210W RPB10 DNA-directed RNA polymerase core subunit RPB10|ABC10-beta chromosome 15 L000001684 15 738320 738532 W 2011-02-03 1996-07-31 RNA polymerase subunit ABC10-beta; common to RNA polymerases I, II, and III -S000037369 CDS YOR210W 15 738320 738532 W 2011-02-03 1996-07-31 -S000005737 ORF Verified YOR211C MGM1 dynamin-related GTPase MGM1|MNA1 chromosome 15 L000001103 15 741569 738924 C 123 2011-02-03 1996-07-31|2006-10-03 Mitochondrial GTPase, present in complex with Ugo1p and Fzo1p; required for mitochondrial morphology, fusion, and genome maintenance; promotes membrane bending; exists as long and short form with different distributions; ratio of long to short forms is regulated by Psd1p; homolog of human OPA1 involved in autosomal dominant optic atrophy -S000037397 CDS YOR211C 15 741569 738924 C 2011-02-03 1996-07-31|2006-10-03 -S000005738 ORF Verified YOR212W STE4 G protein subunit beta|HMD2 chromosome 15 L000002114 15 742910 744181 W 124 2011-02-03 1996-07-31 G protein beta subunit; forms a dimer with Ste18p to activate mating signaling pathway, forms heterotrimer with Gpa1p and Ste18p to dampen signaling; pheromone-induced phosphorylation plays critical role in chemotropism; may recruit Rho1p to polarized growth site during mating; contains WD40 repeats -S000030085 CDS YOR212W 15 742910 744181 W 2011-02-03 1996-07-31 -S000005739 ORF Verified YOR213C SAS5 chromosome 15 L000004215 15 745281 744535 C 2011-02-03 1996-07-31 Subunit of the SAS complex (Sas2p, Sas4p, Sas5p); acetylates free histones and nucleosomes and regulates transcriptional silencing; stimulates Sas2p HAT activity -S000030141 CDS YOR213C 15 745281 744535 C 2011-02-03 1996-07-31 -S000005740 ORF Verified YOR214C SPR2 chromosome 15 S000029500|L000002021 15 746303 745593 C 2011-02-03 1996-07-31 Putative spore wall protein; expression increases during sporulation; not an essential gene; YOR214C has a paralog, SPO19, that arose from the whole genome duplication -S000030340 CDS YOR214C 15 746303 745593 C 2011-02-03 1996-07-31 -S000005741 ORF Verified YOR215C AIM41 chromosome 15 15 747282 746725 C 2011-02-03 1996-07-31 Protein of unknown function; the authentic protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays reduced frequency of mitochondrial genome loss -S000033625 CDS YOR215C 15 747282 746725 C 2011-02-03 1996-07-31 -S000005742 ORF Verified YOR216C RUD3 GRP1 chromosome 15 L000004185 15 748979 747525 C 2011-02-03 1996-07-31 Golgi matrix protein; involved in the structural organization of the cis-Golgi; interacts genetically with COG3 and USO1 -S000033741 CDS YOR216C 15 748979 747525 C 2011-02-03 1996-07-31 -S000005743 ORF Verified YOR217W RFC1 replication factor C subunit 1|CDC44 chromosome 15 L000000278 15 749301 751886 W 2011-02-03 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); RF-C is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon -S000033941 CDS YOR217W 15 749301 751886 W 2011-02-03 1996-07-31 -S000005744 ORF Dubious YOR218C chromosome 15 15 751895 751476 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene RFC1/YOR217W -S000033989 CDS YOR218C 15 751895 751476 C 2011-02-03 1996-07-31 -S000005745 ORF Verified YOR219C STE13 YCI1 chromosome 15 L000002120 15 755009 752214 C 129 2011-02-03 1996-07-31 Dipeptidyl aminopeptidase; Golgi integral membrane protein that cleaves on the carboxyl side of repeating -X-Ala- sequences, required for maturation of alpha factor, transcription is induced by a-factor -S000034857 CDS YOR219C 15 755009 752214 C 2011-02-03 1996-07-31 -S000005746 ORF Verified YOR220W RCN2 WSP1 chromosome 15 15 755328 756125 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; phosphorylated in response to alpha factor; protein abundance increases in response to DNA replication stress -S000033604 CDS YOR220W 15 755328 756125 W 2011-02-03 1996-07-31 -S000005747 ORF Verified YOR221C MCT1 [acyl-carrier-protein] S-malonyltransferase chromosome 15 15 757558 756476 C 2011-02-03 1996-07-31|2005-12-01 Predicted malonyl-CoA:ACP transferase; putative component of a type-II mitochondrial fatty acid synthase that produces intermediates for phospholipid remodeling -S000034462 CDS YOR221C 15 757558 756476 C 2011-02-03 1996-07-31|2005-12-01 -S000005748 ORF Verified YOR222W ODC2 mitochondrial 2-oxodicarboxylate carrier chromosome 15 15 758330 759253 W 2011-02-03 1996-07-31 Mitochondrial inner membrane transporter; 2-oxodicarboxylate transporter, exports 2-oxoadipate and 2-oxoglutarate from the mitochondrial matrix to the cytosol for use in lysine and glutamate biosynthesis and in lysine catabolism; ODC2 has a paralog, ODC1, that arose from the whole genome duplication -S000034614 CDS YOR222W 15 758330 759253 W 2011-02-03 1996-07-31 -S000007299 snoRNA_gene snR35 SNR35 chromosome 15 L000001973 15 759529 759326 C 2011-02-03 2000-05-19|2007-05-10 H/ACA box small nucleolar RNA (snoRNA); predicted to guide pseudouridylation of small subunit (SSU) rRNA at position 1191 -S000036764 noncoding_exon snR35 15 759529 759326 C 2011-02-03 2000-05-19|2007-05-10 -S000005749 ORF Verified YOR223W DSC3 chromosome 15 15 759782 760660 W 2011-02-03 1996-07-31 Subunit of the DSC ubiquitin ligase complex; protein of unknown function that localizes to the ER and vacuole lumen; overexpression affects endocytic protein trafficking; ortholog of fission yeast dsc3 -S000034765 CDS YOR223W 15 759782 760660 W 2011-02-03 1996-07-31 -S000005750 ORF Verified YOR224C RPB8 DNA-directed RNA polymerase core subunit RPB8|ABC14.5 chromosome 15 L000001682 15 761265 760825 C 2011-02-03 1996-07-31 RNA polymerase subunit ABC14.5; common to RNA polymerases I, II, and III -S000035658 CDS YOR224C 15 761265 760825 C 2011-02-03 1996-07-31 -S000005751 ORF Dubious YOR225W chromosome 15 15 761392 761721 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035836 CDS YOR225W 15 761392 761721 W 2011-02-03 1996-07-31 -S000005752 ORF Verified YOR226C ISU2 putative iron-binding protein ISU2|NUA2 chromosome 15 L000004770 15 762084 761614 C 2011-02-03 1996-07-31 Mitochondrial protein required for iron-sulfur protein synthesis; performs scaffolding function during Fe/S cluster assembly; involved in Fe-S cluster assembly for both mitochondrial and cytosolic proteins; protein abundance increases under DNA replication stress; ISU2 has a paralog, ISU1, that arose from the whole genome duplication; isu1 isu2 double mutant is inviable; human homolog ISCU implicated in mitochondrial myopathy, can complement isu1 isu2 double mutant -S000035907 CDS YOR226C 15 762084 761614 C 2011-02-03 1996-07-31 -S000005753 ORF Verified YOR227W HER1 chromosome 15 S000124018 15 762825 766565 W 2011-02-03 1996-07-31 Protein of unknown function; required for proliferation or remodeling of the ER that is caused by overexpression of Hmg2p; may interact with ribosomes, based on co-purification experiments; HER1 has a paralog, GIP3, that arose from the whole genome duplication -S000037838 CDS YOR227W 15 762825 766565 W 2011-02-03 1996-07-31 -S000118492 ARS ARS1523 ARSXV-767 chromosome 15 15 766605 766788 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000005754 ORF Verified YOR228C MCP1 chromosome 15 15 767777 766869 C 2011-02-03 1996-07-31 Mitochondrial protein of unknown function involved in lipid homeostasis; integral membrane protein that localizes to the mitochondrial outer membrane; involved in mitochondrial morphology; interacts genetically with MDM10, and other members of the ERMES complex; contains five predicted transmembrane domains -S000037878 CDS YOR228C 15 767777 766869 C 2011-02-03 1996-07-31 -S000077078 matrix_attachment_site ETC7 ETC7 chromosome 15 15 768106 768128 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; located between divergently transcribed genes MCP1 and WTM2 -S000005755 ORF Verified YOR229W WTM2 transcriptional modulator chromosome 15 L000003516 15 768409 769812 W 2011-02-03 1996-07-31 Transcriptional modulator; involved in regulation of meiosis, silencing, and expression of RNR genes; involved in response to replication stress; contains WD repeats; relocalizes to the cytosol in response to hypoxia; WTM2 has a paralog, UME1, that arose from the whole genome duplication -S000029954 CDS YOR229W 15 768409 769812 W 2011-02-03 1996-07-31 -S000005756 ORF Verified YOR230W WTM1 transcriptional modulator chromosome 15 L000003515 15 770800 772113 W 2011-02-03 1996-07-31 Transcriptional modulator; involved in regulation of meiosis, silencing, and expression of RNR genes; required for nuclear localization of the ribonucleotide reductase small subunit Rnr2p and Rnr4p; contains WD repeats -S000037695 CDS YOR230W 15 770800 772113 W 2011-02-03 1996-07-31 -S000005757 ORF Verified YOR231W MKK1 mitogen-activated protein kinase kinase MKK1|SSP32 chromosome 15 L000001117 15 772601 774127 W 2011-02-03 1996-07-31 MAPKK involved in the protein kinase C signaling pathway; involved in control of cell integrity; upon activation by Bck1p phosphorylates downstream target, Slt2p; functionally redundant with Mkk2p; MKK1 has a paralog, MKK2, that arose from the whole genome duplication -S000037755 CDS YOR231W 15 772601 774127 W 2011-02-03 1996-07-31 -S000028716 ORF Dubious YOR231C-A chromosome 15 15 773363 773163 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032687 CDS YOR231C-A 15 773363 773163 C 2011-02-03 2003-07-29 -S000005758 ORF Verified YOR232W MGE1 GRPE|YGE1 chromosome 15 L000000729|L000002638|L000001101 15 774573 775259 W 2011-02-03 1996-07-31 Mitochondrial matrix cochaperone; nucleotide release factor for Ssc1p in protein translocation and folding; also acts as cochaperone for Ssq1p in folding of Fe-S cluster proteins; acts as oxidative sensor to regulate mitochondrial Ssc1p; in presence of oxidative stress, dimeric Mge1p becomes a monomer and unable to regulate Ssc1p function; homolog of E. coli GrpE and human Mge1 (GRPEL1), which also responds to oxidative stress -S000030589 CDS YOR232W 15 774573 775259 W 2011-02-03 1996-07-31 -S000005759 ORF Verified YOR233W KIN4 putative serine/threonine protein kinase KIN4|KIN3|KIN31 chromosome 15 L000000904 15 775846 778248 W 2011-02-03 1996-07-31 Serine/threonine protein kinase; inhibits the mitotic exit network (MEN) when the spindle position checkpoint is activated; localized asymmetrically to mother cell cortex, spindle pole body and bud neck; KIN4 has a paralog, FRK1, that arose from the whole genome duplication -S000030703 CDS YOR233W 15 775846 778248 W 2011-02-03 1996-07-31 -S000005760 ORF Verified YOR234C RPL33B eL33|ribosomal 60S subunit protein L33B|L33e|rp47|Yl37|L37B|L33B|RPL37B chromosome 15 L000001729 15 779405 778555 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L33B; rpl33b null mutant exhibits normal growth while rpl33a rpl33b double null mutant is inviable; homologous to mammalian ribosomal protein L35A, no bacterial homolog; RPL33B has a paralog, RPL33A, that arose from the whole genome duplication -S000030771 CDS YOR234C 15 778859 778555 C 2011-02-03 1996-07-31 -S000030770 CDS YOR234C 15 779405 779387 C 2011-02-03 1996-07-31 -S000030772 intron YOR234C 15 779386 778860 C 2011-02-03 1996-07-31 -S000005761 ORF Dubious YOR235W IRC13 chromosome 15 15 779870 780184 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant displays increased levels of spontaneous Rad52 foci -S000031752 CDS YOR235W 15 779870 780184 W 2011-02-03 1996-07-31 -S000007294 snoRNA_gene snR17a SNR17A U3 chromosome 15 L000001966 15 780107 780596 W 136 2011-02-03 2000-05-19 Small nucleolar RNA (snoRNA) U3; part of Small ribosomal SubUnit (SSU) processosome; SNR17B also encodes snoRNA U3 -S000030175 intron snR17a 15 780121 780277 W 2011-02-03 2000-05-19 -S000030173 noncoding_exon snR17a 15 780107 780120 W 2011-02-03 2000-05-19 -S000030174 noncoding_exon snR17a 15 780278 780596 W 2011-02-03 2000-05-19 -S000005762 ORF Verified YOR236W DFR1 dihydrofolate reductase chromosome 15 L000000503 15 780906 781541 W 135 2011-02-03 1996-07-31 Dihydrofolate reductase involved in tetrahydrofolate biosynthesis; required for respiratory metabolism; mutation is functionally complemented by human DHFR -S000031908 CDS YOR236W 15 780906 781541 W 2011-02-03 1996-07-31 -S000005763 ORF Verified YOR237W HES1 oxysterol-binding protein related protein HES1|OSH5 chromosome 15 L000000767 15 781994 783298 W 2011-02-03 1996-07-31 Protein implicated in the regulation of ergosterol biosynthesis; one of a seven member gene family with a common essential function and non-essential unique functions; similar to human oxysterol binding protein (OSBP); SWAT-GFP and mCherry fusion proteins localize to the bud neck and vacuolar membrane; HES1 has a paralog, KES1, that arose from the whole genome duplication -S000032069 CDS YOR237W 15 781994 783298 W 2011-02-03 1996-07-31 -S000118493 ARS ARS1524 ARSXV-783 chromosome 15 15 783345 783563 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178186 ARS_consensus_sequence ARS1524 15 783386 783402 W 2014-11-18 2014-11-18 -S000005764 ORF Uncharacterized YOR238W chromosome 15 15 783677 784588 W 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000034067 CDS YOR238W 15 783677 784588 W 2011-02-03 2003-09-22|1996-07-31 -S000005765 ORF Verified YOR239W ABP140 TRM140|YOR240W chromosome 15 15 784857 786744 W 2011-02-03 2000-08-14|1996-07-31 AdoMet-dependent tRNA methyltransferase and actin binding protein; C-terminal domain is responsible for 3-methylcytidine modification of residue 32 of the tRNA anticodon loop of tRNA-Thr and tRNA-Ser and contains an S-adenosylmethionine (AdoMet) binding motif; N-terminal actin binding sequence interacts with actin filaments and localizes to actin patches and cables; N- and C-terminal domains are encoded in separate ORFs that are translated into one protein via a +1 frameshift -S000034147 CDS YOR239W 15 784857 785687 W 2011-02-03 2000-08-14|1996-07-31 -S000034148 CDS YOR239W 15 785689 786744 W 2011-02-03 2000-08-14 -S000034149 plus_1_translational_frameshift YOR239W 15 785688 785688 W 2011-02-03 2000-08-14 -S000005767 ORF Verified YOR241W MET7 tetrahydrofolate synthase|MET23 chromosome 15 L000001082 15 786995 788641 W 136 2011-02-03 1996-07-31 Folylpolyglutamate synthetase; catalyzes extension of the glutamate chains of the folate coenzymes, required for methionine synthesis and for maintenance of mitochondrial DNA; protein abundance increases in response to DNA replication stress -S000033075 CDS YOR241W 15 786995 788641 W 2011-02-03 1996-07-31 -S000005768 ORF Verified YOR242C SSP2 chromosome 15 L000004585 15 789857 788742 C 2011-02-03 1996-07-31 Sporulation specific protein that localizes to the spore wall; required for sporulation at a point after meiosis II and during spore wall formation; expression controlled by a tightly regulated middle-meiotic promoter that is activated by Ndt80p; translation of SSP2 mRNA is delayed, such that the mRNA is present as nuclear divisions are taking place but is not engaged by ribosomes until relatively late in meiotic development -S000033690 CDS YOR242C 15 789857 788742 C 2011-02-03 1996-07-31 -S000005769 ORF Verified YOR243C PUS7 pseudouridine synthase PUS7 chromosome 15 15 792241 790211 C 2011-02-03 1996-07-31 Pseudouridine synthase; catalyzes pseudouridylation at positions 35 and 56 in U2 snRNA, position 50 in 5S rRNA, position 13 in cytoplasmic tRNAs, and position 35 in pre-tRNA(Tyr); also pseudouridylates some mRNAs; relocates from nucleus to cytoplasm during heat shock and differentially modifies some mRNAs during heat shock; conserved in archaea, vertebrates, and some bacteria -S000033806 CDS YOR243C 15 792241 790211 C 2011-02-03 1996-07-31 -S000005770 ORF Verified YOR244W ESA1 NuA4 histone acetyltransferase complex catalytic subunit ESA1|KAT5|TAS1 chromosome 15 L000003952 15 792531 793868 W 2011-02-03 1996-07-31 Catalytic subunit of the histone acetyltransferase complex (NuA4); acetylates four conserved internal lysines of histone H4 N-terminal tail and can acetylate histone H2A; master regulator of cellular acetylation balance; required for cell cycle progression and transcriptional silencing at the rDNA locus and regulation of autophagy; human ortholog TIP60/KAT5 is implicated in cancer and other diseases, functionally complements lethality of the esa1 null mutation -S000033978 CDS YOR244W 15 792531 793868 W 2011-02-03 1996-07-31 -S000005771 ORF Verified YOR245C DGA1 diacylglycerol O-acyltransferase chromosome 15 15 795332 794076 C 2011-02-03 1996-07-31 Diacylglycerol acyltransferase; catalyzes the terminal step of triacylglycerol (TAG) formation, acylates diacylglycerol using acyl-CoA as an acyl donor; Lro1p and Dga1p can O-acylate ceramides; localized to lipid particles -S000034041 CDS YOR245C 15 795332 794076 C 2011-02-03 1996-07-31 -S000005772 ORF Verified YOR246C ENV9 chromosome 15 15 796793 795801 C 2011-02-03 1996-07-31 Protein proposed to be involved in vacuolar functions; mutant shows defect in CPY processing and defects in vacuolar morphology; has similarity to oxidoreductases, found in lipid particles; required for replication of Brome mosaic virus in S. cerevisiae, a model system for studying replication of positive-strand RNA viruses in their natural hosts -S000034930 CDS YOR246C 15 796793 795801 C 2011-02-03 1996-07-31 -S000005773 ORF Verified YOR247W SRL1 chromosome 15 L000004669 15 797676 798308 W 2011-02-03 1996-07-31 Mannoprotein that exhibits a tight association with the cell wall; required for cell wall stability in the absence of GPI-anchored mannoproteins; has a high serine-threonine content; expression is induced in cell wall mutants; SRL1 has a paralog, SVS1, that arose from the whole genome duplication -S000035223 CDS YOR247W 15 797676 798308 W 2011-02-03 1996-07-31 -S000005774 ORF Dubious YOR248W TOS11 chromosome 15 15 798013 798315 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036109 CDS YOR248W 15 798013 798315 W 2011-02-03 1996-07-31 -S000005775 ORF Verified YOR249C APC5 anaphase promoting complex subunit 5|RMC1 chromosome 15 L000004320 15 800731 798674 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the platform domain of the APC/C, based on structural analysis; relative distribution to nuclear foci decreases upon DNA replication stress -S000036169 CDS YOR249C 15 800731 798674 C 2011-02-03 1996-07-31 -S000005776 ORF Verified YOR250C CLP1 cleavage polyadenylation factor subunit CLP1 chromosome 15 L000004201 15 802307 800970 C 2011-02-03 1996-07-31 Component of the cleavage and polyadenylation factor I (CF I); CF 1, composed of the CF 1A complex (Rna14p, Rna15p, Clp1p, Pcf11p) and Hrp1, is involved in cleavage and polyadenylation of mRNA 3' ends; involved in both the endonucleolyitc cleavage and polyadenylation steps of mRNA 3'-end maturation and in gene looping which affects reinitiation of transcription -S000036960 CDS YOR250C 15 802307 800970 C 2011-02-03 1996-07-31 -S000005777 ORF Verified YOR251C TUM1 thiosulfate sulfurtransferase chromosome 15 15 803464 802550 C 2011-02-03 1996-07-31 Rhodanese domain sulfur transferase; accepts persulfite from Nfs1p and transfers it to Uba4p in the pathway for 2-thiolation of the wobble uridine base of tRNAs; also stimulates sulfur transfer by Nfs1p; may be mitochondrially localized -S000037035 CDS YOR251C 15 803464 802550 C 2011-02-03 1996-07-31 -S000005778 ORF Verified YOR252W TMA16 RBF17 chromosome 15 15 803667 804203 W 2011-02-03 1996-07-31|2006-01-05 Protein of unknown function that associates with ribosomes -S000037174 CDS YOR252W 15 803667 804203 W 2011-02-03 1996-07-31|2006-01-05 -S000005779 ORF Verified YOR253W NAT5 peptide alpha-N-acetyltransferase subunit NAT5|NAA50|ROG2|ARD2 chromosome 15 15 804377 804907 W 2011-02-03 1996-07-31 Subunit of protein N-terminal acetyltransferase NatA; NatA is comprised of Nat1p, Ard1p, and Nat5p; N-terminally acetylates many proteins, which influences multiple processes such as the cell cycle, heat-shock resistance, mating, sporulation, and telomeric silencing -S000029833 CDS YOR253W 15 804377 804907 W 2011-02-03 1996-07-31 -S000005780 ORF Verified YOR254C SEC63 protein-transporting protein SEC63|PTL1 chromosome 15 L000001854|L000001269 15 807023 805032 C 2011-02-03 1996-07-31 Essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; other members are Sec62p, Sec66p, and Sec72p -S000029878 CDS YOR254C 15 807023 805032 C 2011-02-03 1996-07-31 -S000005781 ORF Verified YOR255W OSW1 chromosome 15 15 807271 808107 W 2011-02-03 1996-07-31 Protein involved in sporulation; required for the construction of the outer spore wall layers; required for proper localization of Spo14p -S000030954 CDS YOR255W 15 807271 808107 W 2011-02-03 1996-07-31 -S000005782 ORF Verified YOR256C TRE2 putative zinc metalloprotease chromosome 15 15 810683 808254 C 2006-01-05 1996-07-31|2011-02-03 Transferrin receptor-like protein; functions with Tre1p to regulate ubiquitination and vacuolar degradation of the metal transporter Smf1p; inviability of null mutant in systematic studies is due to proximity to CDC31; TRE2 has a paralog, TRE1, that arose from the whole genome duplication -S000030990 CDS YOR256C 15 810683 808254 C 2006-01-05 1996-07-31|2011-02-03 -S000005783 ORF Verified YOR257W CDC31 centrin|DSK1 chromosome 15 L000000269 15 811008 811493 W 147 2006-01-05 1996-07-31 Calcium-binding component of the spindle pole body (SPB) half-bridge; required for SPB duplication in mitosis and meiosis II; homolog of mammalian centrin; binds multiubiquitinated proteins and is involved in proteasomal protein degradation -S000031201 CDS YOR257W 15 811008 811493 W 2006-01-05 1996-07-31 -S000005784 ORF Verified YOR258W HNT3 DNA 5'-adenosine monophosphate hydrolase chromosome 15 15 811671 812324 W 2006-01-05 1996-07-31 DNA 5' AMP hydrolase involved in DNA repair; member of the histidine triad (HIT) superfamily of nucleotide-binding proteins; homolog of Aprataxin, a Hint related protein that is mutated in individuals with ataxia with oculomotor apraxia; relative distribution to nuclear foci decreases upon DNA replication stress -S000032199 CDS YOR258W 15 811671 812324 W 2006-01-05 1996-07-31 -S000005785 ORF Verified YOR259C RPT4 proteasome regulatory particle base subunit RPT4|SUG2|PCS1|CRL13 chromosome 15 L000003423|L000003107|L000000413 15 813708 812395 C 143 2006-01-05 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in degradation of ubiquitinated substrates; contributes preferentially to ERAD; required for spindle pole body duplication; mainly nuclear localization -S000032229 CDS YOR259C 15 813708 812395 C 2006-01-05 1996-07-31 -S000005786 ORF Verified YOR260W GCD1 translation initiation factor eIF2B subunit gamma|TRA3 chromosome 15 L000000670 15 813984 815720 W 143 2006-01-05 1996-07-31 Gamma subunit of the translation initiation factor eIF2B; the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression -S000032270 CDS YOR260W 15 813984 815720 W 2006-01-05 1996-07-31 -S000005787 ORF Verified YOR261C RPN8 proteasome regulatory particle lid subunit RPN8 chromosome 15 L000004308 15 816931 815915 C 2006-01-05 1996-07-31 Essential non-ATPase regulatory subunit of the 26S proteasome; has similarity to the human p40 proteasomal subunit and to another S. cerevisiae regulatory subunit, Rpn11p -S000032281 CDS YOR261C 15 816931 815915 C 2006-01-05 1996-07-31 -S000005788 ORF Verified YOR262W GPN2 putative GTPase GPN2 chromosome 15 15 817292 818335 W 2011-02-03 1996-07-31 Putative GTPase with a role in biogenesis of RNA pol II and polIII; may be involved in assembly of RNA polymerases II and III and in their transport into the nucleus; contains a Gly-Pro-Asn motif in the G domain; similar to Npa3p and Gpn3p; highly conserved across species and homologous to human gene GPN2/ATPBD1B; required for establishment of sister chromatid cohesion -S000033195 CDS YOR262W 15 817292 818335 W 2011-02-03 1996-07-31 -S000005790 ORF Verified YOR264W DSE3 chromosome 15 15 818866 820158 W 2011-02-03 1996-07-31 Daughter cell-specific protein, may help establish daughter fate; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000033310 CDS YOR264W 15 818866 820158 W 2011-02-03 1996-07-31 -S000005789 ORF Dubious YOR263C chromosome 15 15 819164 818757 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF DES3/YOR264W -S000033220 CDS YOR263C 15 819164 818757 C 2011-02-03 1996-07-31 -S000005791 ORF Verified YOR265W RBL2 chromosome 15 L000002910 15 820454 820774 W 2011-02-03 1996-07-31 Protein involved in microtubule morphogenesis; required for protection from excess free beta-tubulin; proposed to be involved the folding of beta-tubulin; similar to mouse beta-tubulin cofactor A; protein abundance increases in response to DNA replication stress -S000034224 CDS YOR265W 15 820454 820774 W 2011-02-03 1996-07-31 -S000005792 ORF Verified YOR266W PNT1 chromosome 15 L000001460 15 821023 822294 W 2011-02-03 1996-07-31 Mitochondrial integral inner membrane protein; involved in membrane insertion of C-terminus of Cox2p, interacts genetically and physically with Cox18p; deletion mutant sensitive to the anti-Pneumocystis carinii drug pentamidine -S000034354 CDS YOR266W 15 821023 822294 W 2011-02-03 1996-07-31 -S000005793 ORF Verified YOR267C HRK1 putative serine/threonine protein kinase HRK1 chromosome 15 15 824867 822588 C 2011-02-03 1996-07-31 Protein kinase; implicated in activation of the plasma membrane H(+)-ATPase Pma1p in response to glucose metabolism; plays a role in ion homeostasis; protein abundance increases in response to DNA replication stress -S000034383 CDS YOR267C 15 824867 822588 C 2011-02-03 1996-07-31 -S000005794 ORF Uncharacterized YOR268C chromosome 15 15 825932 825534 C 2011-02-03 1996-07-31 Putative protein of unknown function; sporulation is abnormal in homozygous diploid; SWAT-GFP fusion protein localizes to the nucleus; YOR268C is not an essential gene -S000035396 CDS YOR268C 15 825932 825534 C 2011-02-03 1996-07-31 -S000005795 ORF Verified YOR269W PAC1 chromosome 15 L000001328 15 826385 827869 W 2011-02-03 1996-07-31 Involved in nuclear migration, part of the dynein/dynactin pathway; targets dynein to microtubule tips, which is necessary for sliding of microtubules along bud cortex; serves at interface between dynein's ATPase site and its microtubule binding stalk, causing individual dynein motors to remain attached to microtubules for long periods; synthetic lethal with bni1; homolog of human LIS1, mutations in which cause the severe brain disorder lissencephaly -S000035573 CDS YOR269W 15 826385 827869 W 2011-02-03 1996-07-31 -S000005796 ORF Verified YOR270C VPH1 H(+)-transporting V0 sector ATPase subunit a chromosome 15 L000002467 15 830574 828052 C 2011-02-03 1996-07-31 Subunit a of vacuolar-ATPase V0 domain; one of two isoforms (Vph1p and Stv1p); Vph1p is located in V-ATPase complexes of the vacuole while Stv1p is located in V-ATPase complexes of the Golgi and endosomes; relative distribution to the vacuolar membrane decreases upon DNA replication stress; human homolog ATP6V0A4 implicated in renal tubular acidosis, can complement yeast null mutant -S000036537 CDS YOR270C 15 830574 828052 C 2011-02-03 1996-07-31 -S000005797 ORF Uncharacterized YOR271C FSF1 chromosome 15 15 832042 831059 C 2011-02-03 1996-07-31 Putative protein; predicted to be an alpha-isopropylmalate carrier; belongs to the sideroblastic-associated protein family; non-tagged protein is detected in purified mitochondria; likely to play a role in iron homeostasis -S000036610 CDS YOR271C 15 832042 831059 C 2011-02-03 1996-07-31 -S000006497 snoRNA_gene snR8 SNR8 chromosome 15 L000001963 15 832332 832521 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U960 and U986 -S000034324 noncoding_exon snR8 15 832332 832521 W 2011-02-03 2000-05-19 -S000005798 ORF Verified YOR272W YTM1 CST14 chromosome 15 L000003547|L000002998|S000029121 15 832813 834195 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; forms a complex with Nop7p and Erb1p that is required for maturation of the large ribosomal subunit; has seven C-terminal WD repeats -S000037380 CDS YOR272W 15 832813 834195 W 2011-02-03 1996-07-31 -S000005799 ORF Verified YOR273C TPO4 chromosome 15 15 836431 834452 C 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; recognizes spermine, putrescine, and spermidine; localizes to the plasma membrane -S000037433 CDS YOR273C 15 836431 834452 C 2011-02-03 1996-07-31 -S000005800 ORF Verified YOR274W MOD5 tRNA dimethylallyltransferase|[MOD+] chromosome 15 L000001131 15 837674 838960 W 2011-02-03 1996-07-31 Delta 2-isopentenyl pyrophosphate:tRNA isopentenyl transferase; required for biosynthesis of isopentenyladenosine in mitochondrial and cytoplasmic tRNAs; also has a role in tRNA gene-mediated silencing; gene encodes two isozymic forms; converts to a prion form, prion conversion contributes to azole antifungal resistance by upregulating ergosterol biosynthesis; homolog of human TRIT1, a mutation in which is associated with severe combined respiratory chain defects -S000030255 CDS YOR274W 15 837674 838960 W 2011-02-03 1996-07-31 -S000005801 ORF Verified YOR275C RIM20 chromosome 15 15 841069 839084 C 2011-02-03 1996-07-31 Protein involved in proteolytic activation of Rim101p; part of response to alkaline pH; PalA/AIP1/Alix family member; interaction with the ESCRT-III subunit Snf7p suggests a relationship between pH response and multivesicular body formation -S000030312 CDS YOR275C 15 841069 839084 C 2011-02-03 1996-07-31 -S000005802 ORF Verified YOR276W CAF20 p20|CAP20|CAF2 chromosome 15 L000000208|L000003291 15 841333 841818 W 2011-02-03 1996-07-31 Phosphoprotein of the mRNA cap-binding complex; involved in translational control; repressor of cap-dependent translation initiation; competes with eIF4G for binding to eIF4E -S000030543 CDS YOR276W 15 841333 841818 W 2011-02-03 1996-07-31 -S000005803 ORF Dubious YOR277C chromosome 15 15 841823 841515 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene CAF20 -S000031370 CDS YOR277C 15 841823 841515 C 2011-02-03 1996-07-31 -S000007296 snoRNA_gene snR31 SNR31 chromosome 15 L000001969 15 842182 841958 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at position U999 -S000036752 noncoding_exon snR31 15 842182 841958 C 2011-02-03 2000-05-19 -S000007291 snoRNA_gene snR5 SNR5 chromosome 15 L000001960 15 842403 842606 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U1004 and U1124 -S000034319 noncoding_exon snR5 15 842403 842606 W 2011-02-03 2000-05-19 -S000005804 ORF Verified YOR278W HEM4 uroporphyrinogen-III synthase HEM4|SLU2 chromosome 15 L000002903 15 842817 843644 W 2011-02-03 1996-07-31 Uroporphyrinogen III synthase; catalyzes the conversion of hydroxymethylbilane to uroporphyrinogen III, the fourth step in heme biosynthesis; deficiency in the human homolog can result in the disease congenital erythropoietic porphyria -S000031577 CDS YOR278W 15 842817 843644 W 2011-02-03 1996-07-31 -S000005805 ORF Verified YOR279C RFM1 chromosome 15 15 844630 843698 C 2011-02-03 1996-07-31 Component of the Sum1p-Rfm1p-Hst1p complex; Rfm1p tethers the Hst1p histone deacetylase to the DNA-binding protein Sum1p; complex is involved in transcriptional repression of middle sporulation genes and in initiation of DNA replication -S000031617 CDS YOR279C 15 844630 843698 C 2011-02-03 1996-07-31 -S000005806 ORF Verified YOR280C FSH3 putative serine hydrolase chromosome 15 15 845792 844992 C 2011-02-03 1996-07-31 Putative serine hydrolase; likely target of Cyc8p-Tup1p-Rfx1p transcriptional regulation; sequence is similar to S. cerevisiae Fsh1p and Fsh2p and the human candidate tumor suppressor OVCA2 -S000031815 CDS YOR280C 15 845792 844992 C 2011-02-03 1996-07-31 -S000005808 ORF Dubious YOR282W chromosome 15 15 847000 847320 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps essential, verified gene PLP2/YOR281C -S000032900 CDS YOR282W 15 847000 847320 W 2011-02-03 1996-07-31 -S000005807 ORF Verified YOR281C PLP2 chromosome 15 15 847129 846269 C 2011-02-03 1996-07-31 Protein that interacts with the CCT complex to stimulate actin folding; has similarity to phosducins; null mutant lethality is complemented by mouse phosducin-like protein MgcPhLP; CCT is short for chaperonin containing TCP-1; essential gene -S000031925 CDS YOR281C 15 847129 846269 C 2011-02-03 1996-07-31 -S000005809 ORF Verified YOR283W phosphoglycerate mutase chromosome 15 15 847453 848145 W 2011-02-03 1996-07-31 Phosphatase with a broad substrate specificity; has some similarity to GPM1/YKL152C, a phosphoglycerate mutase; YOR283W is not an essential gene -S000032989 CDS YOR283W 15 847453 848145 W 2011-02-03 1996-07-31 -S000005810 ORF Verified YOR284W HUA2 chromosome 15 15 848478 849209 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; computational analysis of large-scale protein-protein interaction data suggests a possible role in actin patch assembly -S000033085 CDS YOR284W 15 848478 849209 W 2011-02-03 1996-07-31 -S000005811 ORF Verified YOR285W RDL1 thiosulfate sulfurtransferase RDL1 chromosome 15 15 849635 850054 W 2011-02-03 1996-07-31 Thiosulfate sulfurtransferase; contains a rhodanese-like domain; localized to the mitochondrial outer membrane; protein abundance increases in response to DNA replication stress; similar to the human TSTD gene -S000033844 CDS YOR285W 15 849635 850054 W 2011-02-03 1996-07-31 -S000005812 ORF Verified YOR286W RDL2 thiosulfate sulfurtransferase RDL2|AIM42|FMP31 chromosome 15 15 850280 850729 W 2011-02-03 1996-07-31 Protein with rhodanese activity; contains a rhodanese-like domain similar to Rdl1p, Uba4p, Tum1p, and Ych1p; overexpression causes a cell cycle delay; null mutant displays elevated frequency of mitochondrial genome loss -S000033993 CDS YOR286W 15 850280 850729 W 2011-02-03 1996-07-31 -S000005813 ORF Verified YOR287C RRP36 rRNA-processing protein RRP36 chromosome 15 15 851839 850937 C 2011-02-03 1996-07-31 Component of 90S preribosomes; involved in early cleavages of the 35S pre-rRNA and in production of the 40S ribosomal subunit -S000034025 CDS YOR287C 15 851839 850937 C 2011-02-03 1996-07-31 -S000005814 ORF Verified YOR288C MPD1 protein disulfide isomerase MPD1 chromosome 15 L000003038 15 853077 852121 C 2011-02-03 1996-07-31 Member of the protein disulfide isomerase (PDI) family; interacts with and inhibits the chaperone activity of Cne1p; MPD1 overexpression in a pdi1 null mutant suppresses defects in Pdi1p functions such as carboxypeptidase Y maturation -S000034906 CDS YOR288C 15 853077 852121 C 2011-02-03 1996-07-31 -S000005815 ORF Uncharacterized YOR289W chromosome 15 15 853357 854112 W 2011-02-03 1996-07-31 Putative protein of unknown function; transcription induced by the unfolded protein response; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000035198 CDS YOR289W 15 853357 854112 W 2011-02-03 1996-07-31 -S000006525 tRNA_gene tA(UGC)O chromosome 15 L000003714 15 854259 854187 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine -S000034894 noncoding_exon tA(UGC)O 15 854259 854187 C 2011-02-03 2000-05-19 -S000007178 long_terminal_repeat YORWsigma3 chromosome 15 15 854275 854614 W 2011-02-03 2000-05-19 Ty3 LTR -S000005816 ORF Verified YOR290C SNF2 SWI/SNF catalytic subunit SNF2|TYE3|SWI2|HAF1|GAM1 chromosome 15 L000001945 15 860258 855147 C 2011-02-03 1996-07-31 Catalytic subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; contains DNA-stimulated ATPase activity; functions interdependently in transcriptional activation with Snf5p and Snf6p -S000036380 CDS YOR290C 15 860258 855147 C 2011-02-03 1996-07-31 -S000005817 ORF Verified YOR291W YPK9 putative acid anhydride hydrolase chromosome 15 15 861175 865593 W 2011-02-03 1996-07-31 Vacuolar protein with a possible role in sequestering heavy metals; has similarity to the type V P-type ATPase Spf1p; homolog of human ATP13A2 (PARK9), mutations in which are associated with Parkinson disease and Kufor-Rakeb syndrome -S000037072 CDS YOR291W 15 861175 865593 W 2011-02-03 1996-07-31 -S000005818 ORF Uncharacterized YOR292C chromosome 15 15 866582 865653 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; YOR292C is not an essential gene -S000037114 CDS YOR292C 15 866582 865653 C 2011-02-03 1996-07-31 -S000005819 ORF Verified YOR293W RPS10A eS10|ribosomal 40S subunit protein S10A|S10e|S10A chromosome 15 L000004475 15 867098 867852 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S10, no bacterial homolog; RPS10A has a paralog, RPS10B, that arose from the whole genome duplication; mutations in the human homolog associated with Diamond-Blackfan anemia -S000037299 CDS YOR293W 15 867098 867149 W 2011-02-03 1996-07-31 -S000037300 CDS YOR293W 15 867587 867852 W 2011-02-03 1996-07-31 -S000037301 intron YOR293W 15 867150 867586 W 2011-02-03 1996-07-31 -S000028858 ORF Uncharacterized YOR293C-A chromosome 15 15 868147 867998 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034572 CDS YOR293C-A 15 868147 867998 C 2011-02-03 2003-07-29 -S000005820 ORF Verified YOR294W RRS1 chromosome 15 15 868340 868951 W 2011-02-03 1996-07-31 Essential protein that binds ribosomal protein L11; required for nuclear export of the 60S pre-ribosomal subunit during ribosome biogenesis; localizes to the nucleolus and in foci along nuclear periphery; cooperates with Ebp2p and Mps3p to mediate telomere clustering by binding Sir4p, but is not involved in telomere tethering; mouse homolog shows altered expression in Huntington's disease model mice -S000029945 CDS YOR294W 15 868340 868951 W 2011-02-03 1996-07-31 -S000005821 ORF Verified YOR295W UAF30 chromosome 15 15 869208 869894 W 2011-02-03 1996-07-31 Subunit of UAF (upstream activation factor) complex; UAF is an RNA polymerase I specific transcription stimulatory factor composed of Uaf30p, Rrn5p, Rrn9p, Rrn10p, histones H3 and H4; targeting factor for the UAF that facilitates activation of many rDNA genes; deletion decreases cellular growth rate; UAF30 has a paralog, TRI1, that arose from the whole genome duplication -S000030055 CDS YOR295W 15 869208 869894 W 2011-02-03 1996-07-31 -S000005822 ORF Uncharacterized YOR296W chromosome 15 15 870202 874071 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; expressed during copper starvation; YOR296W is not an essential gene -S000031083 CDS YOR296W 15 870202 874071 W 2011-02-03 1996-07-31 -S000118494 ARS ARS1526 ARSXV-874 chromosome 15 15 874251 874412 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000005823 ORF Verified YOR297C TIM18 chromosome 15 S000007448 15 875321 874743 C 2011-02-03 1996-07-31|2011-02-03 Component of the mitochondrial TIM22 complex; involved in insertion of polytopic proteins into the inner membrane; may mediate assembly or stability of the complex -S000031114 CDS YOR297C 15 875321 874743 C 2011-02-03 1996-07-31|2011-02-03 -S000005824 ORF Verified YOR298W MUM3 chromosome 15 15 875599 877038 W 2011-02-03 1996-07-31 Protein of unknown function involved in outer spore wall organization; has similarity to the tafazzins superfamily of acyltransferases -S000031297 CDS YOR298W 15 875599 877038 W 2011-02-03 1996-07-31 -S000007253 ORF Verified YOR298C-A MBF1 SUF13 chromosome 15 L000002160|L000004688 15 877685 877230 C 165 2011-02-03 2004-02-12|1999-07-17 Transcriptional coactivator; bridges the DNA-binding region of Gcn4p and TATA-binding protein Spt15p; suppressor of frameshift mutations; protein abundance increases in response to DNA replication stress -S000030828 CDS YOR298C-A 15 877685 877230 C 2011-02-03 2004-02-12|1999-07-17 -S000005825 ORF Verified YOR299W BUD7 exomer complex subunit chromosome 15 L000003554 15 878435 880675 W 2011-02-03 1996-07-31 Member of the ChAPs family (Chs5p-Arf1p-binding proteins); members include Bch1p, Bch2p, Bud7p, and Chs6p; ChAPs family proteins form the exomer complex with Chs5p to mediate export of specific cargo proteins, including Chs3p, from the Golgi to the plasma membrane; BUD7 has a paralog, BCH1, that arose from the whole genome duplication -S000031429 CDS YOR299W 15 878435 880675 W 2011-02-03 1996-07-31 -S000005826 ORF Dubious YOR300W HUF1 chromosome 15 15 880575 880883 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps with verified gene BUD7/YOR299W; mutation affects bipolar budding and bud site selection, though phenotype could be due to the mutation's effects on BUD7 -S000036845 CDS YOR300W 15 880575 880883 W 2011-02-03 1996-07-31 -S000005827 ORF Verified YOR301W RAX1 chromosome 15 15 880965 882272 W 2011-02-03 1996-07-31 Protein involved in bud site selection during bipolar budding; localization requires Rax2p; has similarity to members of the insulin-related peptide superfamily -S000037565 CDS YOR301W 15 880965 882272 W 2011-02-03 1996-07-31 -S000005828 ORF Verified YOR302W chromosome 15 15 882765 882842 W 2011-02-03 1996-07-31 CPA1 uORF; Arginine attenuator peptide, regulates translation of the CPA1 mRNA -S000037642 CDS YOR302W 15 882765 882842 W 2011-02-03 1996-07-31 -S000005829 ORF Verified YOR303W CPA1 carbamoyl-phosphate synthase (glutamine-hydrolyzing) CPA1 chromosome 15 L000000399 15 882899 884134 W 161 2011-02-03 1996-07-31 Small subunit of carbamoyl phosphate synthetase; carbamoyl phosphate synthetase catalyzes a step in the synthesis of citrulline, an arginine precursor; translationally regulated by an attenuator peptide encoded by YOR302W within the CPA1 mRNA 5'-leader -S000037697 CDS YOR303W 15 882899 884134 W 2011-02-03 1996-07-31 -S000005831 ORF Verified YOR304W ISW2 DNA translocase chromosome 15 L000004448 15 884514 887876 W 2011-02-03 1996-07-31 ATP-dependent DNA translocase involved in chromatin remodeling; ATPase component that, with Itc1p, forms a complex required for repression of a-specific genes, INO1, and early meiotic genes during mitotic growth; the Isw2 complex exhibits basal levels of chromatin binding throughout the genome as well as target-specific chromatin interactions; targeted by Ume6p- and Sua7p-dependent DNA looping to many loci genome-wide -S000037758 CDS YOR304W 15 884514 887876 W 2011-02-03 1996-07-31 -S000005830 ORF Verified YOR304C-A BIL1 EDO1 chromosome 15 15 888750 888520 C 2011-02-03 1997-07-01|1996-07-31 Protein that binds Bud6p and has a role in actin cable assembly; involved in the Bnr1p-dependent pathway of cable assembly; localizes to bud tip and bud neck -S000032659 CDS YOR304C-A 15 888750 888520 C 2011-02-03 1997-07-01|1996-07-31 -S000005832 ORF Verified YOR305W RRG7 chromosome 15 15 889022 889750 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO); YOR305W is not an essential gene -S000030593 CDS YOR305W 15 889022 889750 W 2011-02-03 1996-07-31 -S000005833 ORF Verified YOR306C MCH5 chromosome 15 15 891432 889867 C 2011-02-03 1996-07-31|2011-02-03 Plasma membrane riboflavin transporter; facilitates the uptake of vitamin B2; required for FAD-dependent processes; sequence similarity to mammalian monocarboxylate permeases, however mutants are not deficient in monocarboxylate transport -S000030631 CDS YOR306C 15 891432 889867 C 2011-02-03 1996-07-31|2011-02-03 -S000005834 ORF Verified YOR307C SLY41 chromosome 15 L000001925 15 894092 892731 C 2011-02-03 1996-07-31 Protein involved in ER-to-Golgi transport -S000030776 CDS YOR307C 15 894092 892731 C 2011-02-03 1996-07-31 -S000005835 ORF Verified YOR308C SNU66 U4/U6-U5 snRNP complex subunit SNU66 chromosome 15 15 896387 894624 C 2011-02-03 1996-07-31 Component of the U4/U6.U5 snRNP complex; involved in pre-mRNA splicing via spliceosome; also required for pre-5S rRNA processing and may act in concert with Rnh70p; has homology to human SART-1 -S000030861 CDS YOR308C 15 896387 894624 C 2011-02-03 1996-07-31 -S000005836 ORF Dubious YOR309C chromosome 15 15 897078 896698 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene NOP58 -S000031849 CDS YOR309C 15 897078 896698 C 2011-02-03 1996-07-31 -S000005837 ORF Verified YOR310C NOP58 RNA-processing protein NOP58|NOP5 chromosome 15 L000004000 15 898360 896825 C 2011-02-03 1996-07-31 Protein involved in producing mature rRNAs and snoRNAs; involved in pre-rRNA processing, 18S rRNA synthesis, and snoRNA synthesis; component of the small subunit processome complex, which is required for processing of pre-18S rRNA -S000031855 CDS YOR310C 15 898360 896825 C 2011-02-03 1996-07-31 -S000005838 ORF Verified YOR311C DGK1 diacylglycerol kinase|HSD1 chromosome 15 15 899928 899056 C 2011-02-03 1996-07-31 Diacylglycerol kinase; localized to the endoplasmic reticulum (ER); overproduction induces enlargement of ER-like membrane structures and suppresses a temperature-sensitive sly1 mutation; contains a CTP transferase domain -S000032742 CDS YOR311C 15 899928 899056 C 2011-02-03 1996-07-31 -S000005839 ORF Verified YOR312C RPL20B eL20|ribosomal 60S subunit protein L20B|L20e|L20B|L18B|RPL18A1 chromosome 15 L000003148 15 901194 900250 C 2011-02-03 1996-07-31|2007-07-10 Ribosomal 60S subunit protein L20B; homologous to mammalian ribosomal protein L18A, no bacterial homolog; RPL20B has a paralog, RPL20A, that arose from the whole genome duplication -S000032858 CDS YOR312C 15 900767 900250 C 2011-02-03 1996-07-31 -S000032857 CDS YOR312C 15 901194 901194 C 2011-02-03 1996-07-31|2007-07-10 -S000032859 intron YOR312C 15 901193 900768 C 2011-02-03 1996-07-31|2007-07-10 -S000005840 ORF Verified YOR313C SPS4 chromosome 15 L000002026 15 902874 901858 C 2011-02-03 1996-07-31 Protein whose expression is induced during sporulation; not required for sporulation; heterologous expression in E. coli induces the SOS response that senses DNA damage -S000032971 CDS YOR313C 15 902874 901858 C 2011-02-03 1996-07-31 -S000005841 ORF Dubious YOR314W chromosome 15 15 903043 903372 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033076 CDS YOR314W 15 903043 903372 W 2011-02-03 1996-07-31 -S000007629 ORF Dubious YOR314W-A chromosome 15 15 904458 904568 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037260 CDS YOR314W-A 15 904458 904568 W 2011-02-03 2001-02-26 -S000005842 ORF Verified YOR315W SFG1 chromosome 15 15 904760 905800 W 2011-02-03 1996-07-31 Nuclear protein putative transcription factor; required for growth of superficial pseudohyphae (which do not invade the agar substrate) but not for invasive pseudohyphal growth; may act together with Phd1p; potential Cdc28p substrate -S000033756 CDS YOR315W 15 904760 905800 W 2011-02-03 1996-07-31 -S000005843 ORF Verified YOR316C COT1 metal cation transporter COT1 chromosome 15 L000000382 15 907555 906236 C 2011-02-03 1996-07-31 Vacuolar transporter that mediates zinc transport into the vacuole; overexpression confers resistance to cobalt and rhodium; protein abundance increases in response to DNA replication stress; COT1 has a paralog, ZRC1, that arose from the whole genome duplication -S000033807 CDS YOR316C 15 907555 906236 C 2011-02-03 1996-07-31 -S000028584 ORF Uncharacterized YOR316C-A chromosome 15 15 907935 907726 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031332 CDS YOR316C-A 15 907935 907726 C 2011-02-03 2003-07-29 -S000118495 ARS ARS1528 ARSXV-908 chromosome 15 15 908296 908544 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178187 ARS_consensus_sequence ARS1528 15 908306 908322 W 2014-11-18 2014-11-18 -S000005844 ORF Verified YOR317W FAA1 long-chain fatty acid-CoA ligase FAA1 chromosome 15 L000000594 15 909343 911445 W 2011-02-03 1996-07-31 Long chain fatty acyl-CoA synthetase; activates fatty acids with a preference for C12:0-C16:0 chain lengths; role in the competitive import of long-chain fatty acids and sphingoid long-chain bases; accounts for most acyl-CoA synthetase activity; localizes to lipid particles and the plasma membrane; role in sphingolipid-to-glycerolipid metabolism; forms ER foci upon replication stress; faa1 faa4 double null complemented by any of human ACSBG1, ACSL1, 3, 4, 5, 6, SLC27A2, or 4 -S000034010 CDS YOR317W 15 909343 911445 W 2011-02-03 1996-07-31 -S000005845 ORF Dubious YOR318C chromosome 15 15 912436 911784 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcript is predicted to be spliced but there is no evidence that it is spliced in vivo -S000034044 CDS YOR318C 15 912085 911784 C 2011-02-03 1996-07-31 -S000034043 CDS YOR318C 15 912436 912433 C 2011-02-03 1996-07-31 -S000034045 intron YOR318C 15 912432 912086 C 2011-02-03 1996-07-31 -S000005846 ORF Verified YOR319W HSH49 U2 snRNP complex subunit HSH49 chromosome 15 L000003014 15 912822 913463 W 2011-02-03 1996-07-31 U2-snRNP associated splicing factor; similar to the mammalian splicing factor SAP49; proposed to function as a U2-snRNP assembly factor along with Hsh155p and binding partner Cus1p; contains two RNA recognition motifs (RRM) -S000035030 CDS YOR319W 15 912822 913463 W 2011-02-03 1996-07-31 -S000005847 ORF Verified YOR320C GNT1 glucose N-acetyltransferase chromosome 15 15 915094 913619 C 2011-02-03 1996-07-31 N-acetylglucosaminyltransferase; capable of modification of N-linked glycans in the Golgi apparatus -S000035936 CDS YOR320C 15 915094 913619 C 2011-02-03 1996-07-31 -S000005848 ORF Verified YOR321W PMT3 dolichyl-phosphate-mannose-protein mannosyltransferase PMT3 chromosome 15 L000002622 15 916030 918291 W 2011-02-03 1996-07-31 Protein O-mannosyltransferase; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; acts in a complex with Pmt5p, can instead interact with Pmt1p in some conditions; antifungal drug target; PMT3 has a paralog, PMT2, that arose from the whole genome duplication -S000036207 CDS YOR321W 15 916030 918291 W 2011-02-03 1996-07-31 -S000005849 ORF Verified YOR322C LDB19 ART1 chromosome 15 15 921062 918606 C 2011-02-03 1996-07-31 Alpha-arrestin involved in ubiquitin-dependent endocytosis; regulates endocytosis of plasma membrane proteins by recruiting the ubiquitin ligase Rsp5p to its targets; involved in the basal internalization and turnover of alpha-factor receptor Ste2p; recruits ubiquitin ligase Rsp5p to Ste2p via its 2 PPXY motifs; inhibited by Npr1p-mediated phosphorylation, which affects translocation between the cytosol and the plasma membrane -S000036901 CDS YOR322C 15 921062 918606 C 2011-02-03 1996-07-31 -S000005850 ORF Verified YOR323C PRO2 glutamate-5-semialdehyde dehydrogenase chromosome 15 L000001492 15 922905 921535 C 175 2011-02-03 1996-07-31 Gamma-glutamyl phosphate reductase; catalyzes the second step in proline biosynthesis -S000036961 CDS YOR323C 15 922905 921535 C 2011-02-03 1996-07-31 -S000005852 ORF Dubious YOR325W chromosome 15 15 924577 925050 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF FRT1 -S000037825 CDS YOR325W 15 924577 925050 W 2011-02-03 1996-07-31 -S000005851 ORF Verified YOR324C FRT1 HPH1 chromosome 15 15 925040 923232 C 2011-02-03 1996-07-31 Tail-anchored ER membrane protein of unknown function; substrate of the phosphatase calcineurin; interacts with homolog Frt2p; promotes cell growth in stress conditions, possibly via a role in posttranslational translocation; FRT1 has a paralog, FRT2, that arose from the whole genome duplication -S000037039 CDS YOR324C 15 925040 923232 C 2011-02-03 1996-07-31 -S000005853 ORF Verified YOR326W MYO2 myosin 2|CDC66 chromosome 15 L000001223 15 925721 930445 W 174 2011-02-03 1996-07-31 Type V myosin motor involved in actin-based transport of cargos; required for the polarized delivery of secretory vesicles, the vacuole, late Golgi elements, peroxisomes, and the mitotic spindle; MYO2 has a paralog, MYO4, that arose from the whole genome duplication -S000029839 CDS YOR326W 15 925721 930445 W 2011-02-03 1996-07-31 -S000005854 ORF Verified YOR327C SNC2 SNAP receptor SNC2 chromosome 15 L000001943 15 931081 930734 C 2011-02-03 1996-07-31 Vesicle membrane receptor protein (v-SNARE); involved in the fusion between Golgi-derived secretory vesicles with the plasma membrane; Snc2p levels regulated by Vps45p; member of the synaptobrevin/VAMP family of R-type v-SNARE proteins; SNC2 has a paralog, SNC1, that arose from the whole genome duplication -S000029884 CDS YOR327C 15 931081 930734 C 2011-02-03 1996-07-31 -S000005855 ORF Verified YOR328W PDR10 ATP-binding cassette multidrug transporter PDR10 chromosome 15 L000002865 15 931803 936497 W 2011-02-03 1996-07-31 ATP-binding cassette (ABC) transporter; multidrug transporter involved in the pleiotropic drug resistance network; regulated by Pdr1p and Pdr3p -S000030958 CDS YOR328W 15 931803 936497 W 2011-02-03 1996-07-31 -S000028585 ORF Dubious YOR329W-A chromosome 15 15 939348 939557 W 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR -S000031335 CDS YOR329W-A 15 939348 939557 W 2011-02-03 2003-07-29 -S000005856 ORF Verified YOR329C SCD5 SCD7|FTB1 chromosome 15 L000001805|S000029433|L000001807 15 939349 936731 C 2011-02-03 1996-07-31 Protein required for normal actin organization and endocytosis; targeting subunit for protein phosphatase type 1; undergoes Crm1p-dependent nuclear-cytoplasmic shuttling; multicopy suppressor of clathrin deficiency -S000030995 CDS YOR329C 15 939349 936731 C 2011-02-03 1996-07-31 -S000005857 ORF Verified YOR330C MIP1 DNA-directed DNA polymerase gamma MIP1 chromosome 15 L000001113 15 943385 939621 C 181 2011-02-03 1996-07-31|2005-11-30 Mitochondrial DNA polymerase gamma; single subunit of mitochondrial DNA polymerase in yeast, in contrast to metazoan complex of catalytic and accessory subunits; polymorphic in yeast, petites occur more frequently in some lab strains; human ortholog POLG complements yeast mip1 mutant; mutations in human POLG associated with Alpers-Huttenlocher syndrome (AHS), progressive external ophthalmoplegia (PEO), parkinsonism, other mitochondrial diseases -S000031997 CDS YOR330C 15 943385 939621 C 2011-02-03 1996-07-31|2005-11-30 -S000005859 ORF Verified YOR332W VMA4 H(+)-transporting V1 sector ATPase subunit E chromosome 15 L000002459 15 943656 944357 W 2011-02-03 1996-07-31 Subunit E of the V1 domain of the vacuolar H+-ATPase (V-ATPase); V-ATPase is an electrogenic proton pump found throughout the endomembrane system; V1 domain has eight subunits; required for the V1 domain to assemble onto the vacuolar membrane; protein abundance increases in response to DNA replication stress -S000032201 CDS YOR332W 15 943656 944357 W 2011-02-03 1996-07-31 -S000005858 ORF Dubious YOR331C chromosome 15 15 944122 943565 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene VMA4/YOR332W -S000032076 CDS YOR331C 15 944122 943565 C 2011-02-03 1996-07-31 -S000005861 ORF Verified YOR334W MRS2 chromosome 15 L000001178 15 944596 946008 W 2011-02-03 1996-07-31 Mitochondrial inner membrane Mg(2+) channel; required for maintenance of intramitochondrial Mg(2+) concentrations at the correct level to support splicing of group II introns; similar to bacterial CorA -S000033146 CDS YOR334W 15 944596 946008 W 2011-02-03 1996-07-31 -S000005860 ORF Dubious YOR333C SWF5 chromosome 15 15 944957 944541 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of MRS2 gene required for respiratory growth -S000032222 CDS YOR333C 15 944957 944541 C 2011-02-03 1996-07-31 -S000028717 ORF Dubious YOR335W-A chromosome 15 15 946568 946648 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene ALA1/YOR335C -S000032688 CDS YOR335W-A 15 946568 946648 W 2011-02-03 2003-07-29 -S000005862 ORF Verified YOR335C ALA1 alanine--tRNA ligase|CDC64 chromosome 15 L000000286|L000002757 15 949109 946233 C 188 2011-02-03 1996-07-31 Cytoplasmic and mitochondrial alanyl-tRNA synthetase; required for protein synthesis; point mutation (cdc64-1 allele) causes cell cycle arrest at G1; lethality of null mutation is functionally complemented by human homolog AARS; mutations in human homolog AARS are associated with autoimmune disease polymyositis/dermatomyositis -S000033157 CDS YOR335C 15 949109 946233 C 2011-02-03 1996-07-31 -S000005863 ORF Verified YOR336W KRE5 chromosome 15 L000000914 15 949773 953870 W 2011-02-03 1996-07-31 Protein required for beta-1,6 glucan biosynthesis; mutations result in aberrant morphology and severe growth defects -S000033259 CDS YOR336W 15 949773 953870 W 2011-02-03 1996-07-31 -S000005864 ORF Verified YOR337W TEA1 chromosome 15 L000003020 15 954344 956623 W 193 2011-02-03 1996-07-31 Ty1 enhancer activator involved in Ty enhancer-mediated transcription; required for full levels of Ty enhancer-mediated transcription; C6 zinc cluster DNA-binding protein -S000033317 CDS YOR337W 15 954344 956623 W 2011-02-03 1996-07-31 -S000005865 ORF Uncharacterized YOR338W chromosome 15 15 956898 957989 W 2011-02-03 1996-07-31 Putative protein of unknown function; YOR338W transcription is regulated by Azf1p and its transcript is a specific target of the G protein effector Scp160p; identified as being required for sporulation in a high-throughput mutant screen; YOR338W has a paralog, FUN19, that arose from the whole genome duplication -S000034225 CDS YOR338W 15 956898 957989 W 2011-02-03 1996-07-31 -S000005866 ORF Verified YOR339C UBC11 putative E2 ubiquitin-protein ligase UBC11 chromosome 15 L000004673 15 958832 958362 C 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme; most similar in sequence to Xenopus ubiquitin-conjugating enzyme E2-C, but not a true functional homolog of this E2; unlike E2-C, not required for the degradation of mitotic cyclin Clb2 -S000034261 CDS YOR339C 15 958832 958362 C 2011-02-03 1996-07-31 -S000005867 ORF Verified YOR340C RPA43 DNA-directed RNA polymerase I subunit RPA43|A43 chromosome 15 L000003029 15 960182 959202 C 2011-02-03 1996-07-31 RNA polymerase I subunit A43 -S000035445 CDS YOR340C 15 960182 959202 C 2011-02-03 1996-07-31 -S000005868 ORF Verified YOR341W RPA190 DNA-directed RNA polymerase I core subunit RPA190|A190|RRN1 chromosome 15 L000001675 15 960987 965981 W 192 2011-02-03 1996-07-31 RNA polymerase I largest subunit A190 -S000036421 CDS YOR341W 15 960987 965981 W 2011-02-03 1996-07-31 -S000005869 ORF Verified YOR342C chromosome 15 15 967625 966666 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; relocalizes from nucleus to cytoplasm upon DNA replication stress; YOR342C has a paralog, YAL037W, that arose from the whole genome duplication -S000036448 CDS YOR342C 15 967625 966666 C 2011-02-03 1996-07-31 -S000005870 ORF Dubious YOR343C chromosome 15 15 968474 968148 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036546 CDS YOR343C 15 968474 968148 C 2011-02-03 1996-07-31 -S000007179 long_terminal_repeat YORWsigma4 chromosome 15 15 968991 969301 W 2011-02-03 2000-05-19 Ty3 LTR -S000007175 long_terminal_repeat YORWdelta22 chromosome 15 15 969293 969431 W 2011-02-03 2000-05-19 Ty1 LTR -S000007176 long_terminal_repeat YORWdelta23 chromosome 15 15 970286 970617 W 2011-02-03 2000-05-19 Ty2 LTR -S000007183 LTR_retrotransposon YORWTy2-2 Ty2 chromosome 15 15 970286 976244 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007355 transposable_element_gene YOR343W-A gag protein|YOR343C-A chromosome 15 15 970578 971894 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000036395 CDS YOR343W-A 15 970578 971894 W 2011-02-03 1999-07-17 -S000007356 transposable_element_gene YOR343W-B gag-pol fusion protein|YOR343C-B chromosome 15 15 970578 975891 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000036396 CDS YOR343W-B 15 970578 971871 W 2011-02-03 1999-07-17 -S000036397 CDS YOR343W-B 15 971873 975891 W 2011-02-03 1999-07-17 -S000036398 plus_1_translational_frameshift YOR343W-B 15 971872 971872 W 2011-02-03 1999-07-17 -S000007177 long_terminal_repeat YORWdelta24 chromosome 15 15 975913 976244 W 2011-02-03 2000-05-19 Ty2 LTR -S000006666 tRNA_gene tM(CAU)O2 EMT2 chromosome 15 L000000552|L000003712 15 976421 976493 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis -S000032168 noncoding_exon tM(CAU)O2 15 976421 976493 W 2011-02-03 2000-05-19 -S000005871 ORF Verified YOR344C TYE7 SGC1 chromosome 15 L000002401 15 978069 977194 C 199 2011-02-03 1996-07-31 Serine-rich protein that contains a bHLH DNA binding motif; binds E-boxes of glycolytic genes and contributes to their activation; may function as a transcriptional activator in Ty1-mediated gene expression; bHLH stands for basic-helix-loop-helix -S000036612 CDS YOR344C 15 978069 977194 C 2011-02-03 1996-07-31 -S000007167 long_terminal_repeat YORCdelta25 chromosome 15 15 980590 980259 C 2011-02-03 2000-05-19 Ty1 LTR -S000006689 tRNA_gene tP(UGG)O3 chromosome 15 L000003713 15 980683 980787 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin -S000031061 intron tP(UGG)O3 15 980719 980751 W 2011-02-03 2000-05-19 -S000031059 noncoding_exon tP(UGG)O3 15 980683 980718 W 2011-02-03 2000-05-19 -S000031060 noncoding_exon tP(UGG)O3 15 980752 980787 W 2011-02-03 2000-05-19 -S000118496 ARS ARS1529 ARSXV-982 chromosome 15 15 981462 981697 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000005873 ORF Verified YOR346W REV1 deoxycytidyl transferase chromosome 15 L000001615 15 981828 984785 W 2011-02-03 1996-07-31 Deoxycytidyl transferase; involved in repair of abasic sites and adducted guanines in damaged DNA by translesion synthesis (TLS); forms a complex with the subunits of DNA polymerase zeta, Rev3p and Rev7p; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000037530 CDS YOR346W 15 981828 984785 W 2011-02-03 1996-07-31 -S000005872 ORF Dubious YOR345C chromosome 15 15 982162 981812 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene REV1; null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2 -S000037325 CDS YOR345C 15 982162 981812 C 2011-02-03 1996-07-31 -S000005874 ORF Verified YOR347C PYK2 pyruvate kinase PYK2 chromosome 15 L000004122 15 986462 984942 C 2011-02-03 1996-07-31 Pyruvate kinase; appears to be modulated by phosphorylation; transcription repressed by glucose, and Pyk2p may be active under low glycolytic flux; PYK2 has a paralog, CDC19, that arose from the whole genome duplication -S000037542 CDS YOR347C 15 986462 984942 C 2011-02-03 1996-07-31 -S000005875 ORF Verified YOR348C PUT4 proline permease PUT4 chromosome 15 L000001538 15 988782 986899 C 2011-02-03 1996-07-31 Proline permease; required for high-affinity transport of proline; also transports the toxic proline analog azetidine-2-carboxylate (AzC); PUT4 transcription is repressed in ammonia-grown cells -S000030314 CDS YOR348C 15 988782 986899 C 2011-02-03 1996-07-31 -S000005876 ORF Verified YOR349W CIN1 chromosome 15 L000000336 15 989789 992833 W 215 2011-02-03 1996-07-31 Tubulin folding factor D involved in beta-tubulin (Tub2p) folding; isolated as mutant with increased chromosome loss and sensitivity to benomyl -S000030549 CDS YOR349W 15 989789 992833 W 2011-02-03 1996-07-31 -S000005877 ORF Verified YOR350C MNE1 chromosome 15 L000003295 15 994855 992864 C 2011-02-03 1996-07-31 Protein involved in splicing Group I aI5-beta intron from COX1 mRNA; mitochondrial matrix protein -S000030755 CDS YOR350C 15 994855 992864 C 2011-02-03 1996-07-31 -S000005878 ORF Verified YOR351C MEK1 serine/threonine protein kinase MEK1|MRE4 chromosome 15 L000001062|L000001148 15 996511 995018 C 175 2011-02-03 1996-07-31 Meiosis-specific serine/threonine protein kinase; functions in meiotic checkpoint, promotes recombination between homologous chromosomes by suppressing double strand break repair between sister chromatids; stabilizes Hop1-Thr318 phosphorylation to promote interhomolog recombination and checkpoint responses during meiosis -S000031597 CDS YOR351C 15 996511 995018 C 2011-02-03 1996-07-31 -S000005879 ORF Verified YOR352W TFB6 TFIIH complex subunit TFB6 chromosome 15 15 997213 998244 W 2011-02-03 1996-07-31 Subunit of TFIIH complex; facilities dissociation of the Ssl2p helices from TFIIH; expression levels regulated by Arg5,6p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus -S000031766 CDS YOR352W 15 997213 998244 W 2011-02-03 1996-07-31 -S000005880 ORF Verified YOR353C SOG2 chromosome 15 15 1000828 998453 C 2011-02-03 1996-07-31 Key component of the RAM signaling network; required for proper cell morphogenesis and cell separation after mitosis -S000031817 CDS YOR353C 15 1000828 998453 C 2011-02-03 1996-07-31 -S000005881 ORF Verified YOR354C MSC6 chromosome 15 15 1003225 1001147 C 2011-02-03 1996-07-31 Multicopy suppressor of HER2 involved in mitochondrial translation; mutant is defective in directing meiotic recombination events to homologous chromatids -S000031931 CDS YOR354C 15 1003225 1001147 C 2011-02-03 1996-07-31 -S000005882 ORF Verified YOR355W GDS1 chromosome 15 L000002580 15 1005137 1006705 W 2011-02-03 1996-07-31 Protein of unknown function; required for growth on glycerol as a carbon source; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032902 CDS YOR355W 15 1005137 1006705 W 2011-02-03 1996-07-31 -S000005883 ORF Verified YOR356W CIR2 putative electron-transferring-flavoprotein dehydrogenase chromosome 15 15 1007221 1009116 W 2011-02-03 1996-07-31 Putative ortholog of human ETF-dH; found in a large supramolecular complex with other mitochondrial dehydrogenases; may have a role in oxidative stress response; ETF-dH is also known as electron transfer flavoprotein dehydrogenase -S000032990 CDS YOR356W 15 1007221 1009116 W 2011-02-03 1996-07-31 -S000005884 ORF Verified YOR357C SNX3 GRD19 chromosome 15 L000002931 15 1009712 1009224 C 2011-02-03 1996-07-31 Sorting nexin for late-Golgi enzymes; required to maintain late-Golgi resident enzymes in their proper location by recycling molecules from the prevacuolar compartment; contains a PX domain and sequence similarity to human Snx3p -S000033017 CDS YOR357C 15 1009712 1009224 C 2011-02-03 1996-07-31 -S000005885 ORF Verified YOR358W HAP5 chromosome 15 L000003021 15 1010161 1010889 W 2011-02-03 1996-07-31 Subunit of the Hap2p/3p/4p/5p CCAAT-binding complex; complex is heme-activated and glucose repressed; complex is a transcriptional activator and global regulator of respiratory gene expression; required for assembly and DNA binding activity of the complex -S000033859 CDS YOR358W 15 1010161 1010889 W 2011-02-03 1996-07-31 -S000005886 ORF Verified YOR359W VTS1 chromosome 15 15 1011189 1012760 W 2011-02-03 1996-07-31 Flap-structured DNA-binding and RNA-binding protein; stimulates deadenylation-dependent mRNA degradation mediated by the CCR4-NOT deadenylase complex; member of the Smaug (Smg) family of post-transcriptional regulators which bind RNA through a conserved sterile alpha motif (SAM) domain that interacts with Smg recognition element (SREs) containing transcripts; stimulates Dna2p endonuclease activity -S000033994 CDS YOR359W 15 1011189 1012760 W 2011-02-03 1996-07-31 -S000005887 ORF Verified YOR360C PDE2 3',5'-cyclic-nucleotide phosphodiesterase PDE2|SRA5 chromosome 15 L000002046 15 1014821 1013241 C 220 2011-02-03 1996-07-31 High-affinity cyclic AMP phosphodiesterase; component of the cAMP-dependent protein kinase signaling system, protects the cell from extracellular cAMP, contains readthrough motif surrounding termination codon -S000036087 CDS YOR360C 15 1014821 1013241 C 2011-02-03 1996-07-31 -S000005888 ORF Verified YOR361C PRT1 translation initiation factor eIF3 core subunit b|DNA26|CDC63 chromosome 15 L000001515 15 1017652 1015361 C 221 2011-02-03 1996-07-31 eIF3b subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; essential for translation; part of a subcomplex (Prt1p-Rpg1p-Nip1p) that stimulates binding of mRNA and tRNA(i)Met to ribosomes; eIF3 is also involved in programmed stop codon readthrough -S000036186 CDS YOR361C 15 1017652 1015361 C 2011-02-03 1996-07-31 -S000005889 ORF Verified YOR362C PRE10 proteasome core particle subunit alpha 7 chromosome 15 L000003146 15 1018746 1017880 C 2011-02-03 1996-07-31 Alpha 7 subunit of the 20S proteasome; protein abundance increases in response to DNA replication stress -S000036287 CDS YOR362C 15 1018746 1017880 C 2011-02-03 1996-07-31 -S000005890 ORF Verified YOR363C PIP2 oleate-activated transcription factor PIP2|OAF2 chromosome 15 L000003144 15 1023212 1020222 C 2011-02-03 1996-07-31 Autoregulatory, oleate-activated transcription factor; subunit of a heterodimeric complex with Oaf1p, which binds to oleate-response elements (ORE) in the promoter of genes involved in beta-oxidation of fatty acids, peroxisome organization and biogenesis, activating transcription in the presence of oleate; PIP2 has a paralog, OAF1, that arose from the whole genome duplication -S000036382 CDS YOR363C 15 1023212 1020222 C 2011-02-03 1996-07-31 -S000005891 ORF Dubious YOR364W chromosome 15 15 1023371 1023739 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR365C -S000037077 CDS YOR364W 15 1023371 1023739 W 2011-02-03 1996-07-31 -S000005893 ORF Dubious YOR366W chromosome 15 15 1025256 1025609 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR365C -S000037303 CDS YOR366W 15 1025256 1025609 W 2011-02-03 1996-07-31 -S000005892 ORF Uncharacterized YOR365C putative flavin adenine dinucleotide transporter chromosome 15 15 1025572 1023461 C 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential protein; YOR365C has a paralog, FLC2, that arose from the whole genome duplication -S000037119 CDS YOR365C 15 1025572 1023461 C 2011-02-03 1996-07-31 -S000005894 ORF Verified YOR367W SCP1 chromosome 15 L000004232 15 1026007 1026609 W 2011-02-03 1996-07-31 Component of yeast cortical actin cytoskeleton; binds and cross links actin filaments; originally identified by its homology to calponin (contains a calponin-like repeat) but the Scp1p domain structure is more similar to transgelin -S000029952 CDS YOR367W 15 1026007 1026609 W 2011-02-03 1996-07-31 -S000005895 ORF Verified YOR368W RAD17 chromosome 15 L000001566 15 1026843 1028048 W 214 2011-02-03 1996-07-31 Checkpoint protein; involved in the activation of the DNA damage and meiotic pachytene checkpoints; with Mec3p and Ddc1p, forms a clamp that is loaded onto partial duplex DNA; homolog of human and S. pombe Rad1 and U. maydis Rec1 proteins -S000030058 CDS YOR368W 15 1026843 1028048 W 2011-02-03 1996-07-31 -S000005896 ORF Verified YOR369C RPS12 eS12|ribosomal 40S subunit protein S12|S12e|S12 chromosome 15 L000002785 15 1028625 1028194 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S12, no bacterial homolog -S000030088 CDS YOR369C 15 1028625 1028194 C 2011-02-03 1996-07-31 -S000005897 ORF Verified YOR370C MRS6 GTPase-activating protein MRS6|MSI4 chromosome 15 L000001182|L000001194 15 1030994 1029183 C 2011-02-03 1996-07-31 Rab escort protein; forms a complex with the Ras-like small GTPase Ypt1p that is required for the prenylation of Ypt1p by protein geranylgeranyltransferase type II (Bet2p-Bet4p); sequence similarity to mammalian choroideraemia gene; relative distribution to the nucleus increases upon DNA replication stress -S000031162 CDS YOR370C 15 1030994 1029183 C 2011-02-03 1996-07-31 -S000005898 ORF Verified YOR371C GPB1 KRH2 chromosome 15 15 1034182 1031489 C 2011-02-03 1996-07-31 Multistep regulator of cAMP-PKA signaling; inhibits PKA downstream of Gpa2p and Cyr1p, thereby increasing cAMP dependency; promotes ubiquitin-dependent proteolysis of Ira2p; regulated by G-alpha protein Gpa2p; GPB1 has a paralog, GPB2, that arose from the whole genome duplication -S000031222 CDS YOR371C 15 1034182 1031489 C 2011-02-03 1996-07-31 -S000005899 ORF Verified YOR372C NDD1 chromosome 15 15 1036471 1034807 C 2011-02-03 1996-07-31 Transcriptional activator essential for nuclear division; localized to the nucleus; essential component of the mechanism that activates the expression of a set of late-S-phase-specific genes; turnover is tightly regulated during cell cycle and in response to DNA damage -S000032194 CDS YOR372C 15 1036471 1034807 C 2011-02-03 1996-07-31 -S000005900 ORF Verified YOR373W NUD1 chromosome 15 L000002752 15 1036834 1039389 W 2011-02-03 1996-07-31 Component of the spindle pole body outer plaque; acts through the mitotic exit network to specify asymmetric spindle pole body inheritance -S000032346 CDS YOR373W 15 1036834 1039389 W 2011-02-03 1996-07-31 -S000005901 ORF Verified YOR374W ALD4 aldehyde dehydrogenase (NADP(+)) ALD4|ALDH2|ALD7 chromosome 15 L000004220 15 1039840 1041399 W 2011-02-03 1996-07-31 Mitochondrial aldehyde dehydrogenase; required for growth on ethanol and conversion of acetaldehyde to acetate; phosphorylated; activity is K+ dependent; utilizes NADP+ or NAD+ equally as coenzymes; expression is glucose repressed; can substitute for cytosolic NADP-dependent aldehyde dehydrogenase when directed to the cytosol; human homolog ALDH2 can complement yeast ald4 mutant -S000033216 CDS YOR374W 15 1039840 1041399 W 2011-02-03 1996-07-31 -S000005902 ORF Verified YOR375C GDH1 glutamate dehydrogenase (NADP(+)) GDH1|DHE4|GDHA|GDH-A|URE1 chromosome 15 L000000696 15 1043042 1041678 C 2011-02-03 1996-07-31 NADP(+)-dependent glutamate dehydrogenase; synthesizes glutamate from ammonia and alpha-ketoglutarate; rate of alpha-ketoglutarate utilization differs from Gdh3p; expression regulated by nitrogen and carbon sources; GDH1 has a paralog, GDH3, that arose from the whole genome duplication -S000033231 CDS YOR375C 15 1043042 1041678 C 2011-02-03 1996-07-31 -S000005903 ORF Uncharacterized YOR376W chromosome 15 15 1043191 1043559 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOR376W is not an essential gene -S000033346 CDS YOR376W 15 1043191 1043559 W 2011-02-03 1996-07-31 -S000028586 ORF Uncharacterized YOR376W-A chromosome 15 15 1045196 1045351 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031336 CDS YOR376W-A 15 1045196 1045351 W 2011-02-03 2003-07-29 -S000005904 ORF Verified YOR377W ATF1 alcohol O-acetyltransferase chromosome 15 L000000138 15 1046226 1047803 W 2011-02-03 1996-07-31 Alcohol acetyltransferase; responsible for the major part of volatile acetate ester production during fermentation; main enzyme involved in terpenyl acetate synthesis; potential roles in lipid and sterol metabolism -S000033432 CDS YOR377W 15 1046226 1047803 W 2011-02-03 1996-07-31 -S000005905 ORF Verified YOR378W AMF1 chromosome 15 15 1049511 1051058 W 2011-02-03 1996-07-31 Low affinity NH4+ transporter; member of the DHA2 family of drug:H+ anti porters; putative paralog of ATR1; but not required for boron tolerance; non-essential gene -S000034342 CDS YOR378W 15 1049511 1051058 W 2011-02-03 1996-07-31 -S000005906 ORF Dubious YOR379C chromosome 15 15 1051064 1050726 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR378W -S000034365 CDS YOR379C 15 1051064 1050726 C 2011-02-03 1996-07-31 -S000005907 ORF Verified YOR380W RDR1 chromosome 15 15 1051290 1052930 W 2011-02-03 1996-07-31 Transcriptional repressor involved in regulating multidrug resistance; negatively regulates expression of the PDR5 gene; member of the Gal4p family of zinc cluster proteins -S000035338 CDS YOR380W 15 1051290 1052930 W 2011-02-03 1996-07-31 -S000005908 ORF Verified YOR381W FRE3 ferric-chelate reductase chromosome 15 L000003555 15 1055545 1057680 W 2011-02-03 1996-07-31 Ferric reductase; reduces siderophore-bound iron prior to uptake by transporters; expression induced by low iron levels -S000035406 CDS YOR381W 15 1055545 1057680 W 2011-02-03 1996-07-31 -S000028587 ORF Uncharacterized YOR381W-A chromosome 15 15 1058423 1058590 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031338 CDS YOR381W-A 15 1058423 1058590 W 2011-02-03 2003-07-29 -S000005909 ORF Verified YOR382W FIT2 chromosome 15 15 1059531 1059992 W 2011-02-03 1996-07-31 Mannoprotein that is incorporated into the cell wall; incorporated via a glycosylphosphatidylinositol (GPI) anchor; involved in the retention of siderophore-iron in the cell wall -S000035468 CDS YOR382W 15 1059531 1059992 W 2011-02-03 1996-07-31 -S000005910 ORF Verified YOR383C FIT3 chromosome 15 15 1061055 1060441 C 2011-02-03 1996-07-31 Mannoprotein that is incorporated into the cell wall; incorporated via a glycosylphosphatidylinositol (GPI) anchor; involved in the retention of siderophore-iron in the cell wall -S000035495 CDS YOR383C 15 1061055 1060441 C 2011-02-03 1996-07-31 -S000005911 ORF Verified YOR384W FRE5 putative ferric-chelate reductase chromosome 15 L000003557 15 1061564 1063648 W 2011-02-03 1996-07-31 Putative ferric reductase with similarity to Fre2p; expression induced by low iron levels; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000035594 CDS YOR384W 15 1061564 1063648 W 2011-02-03 1996-07-31 -S000005912 ORF Uncharacterized YOR385W chromosome 15 15 1065043 1065915 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YOR385W is not an essential gene -S000036492 CDS YOR385W 15 1065043 1065915 W 2011-02-03 1996-07-31 -S000005913 ORF Verified YOR386W PHR1 deoxyribodipyrimidine photo-lyase PHR1 chromosome 15 L000001432 15 1066839 1068536 W 205 2011-02-03 1996-07-31 DNA photolyase involved in photoreactivation; repairs pyrimidine dimers in the presence of visible light; induced by DNA damage; regulated by transcriptional repressor Rph1p -S000036613 CDS YOR386W 15 1066839 1068536 W 2011-02-03 1996-07-31 -S000005914 ORF Uncharacterized YOR387C chromosome 15 15 1070241 1069621 C 2011-02-03 1996-07-31 Putative protein of unknown function; regulated by the metal-responsive Aft1p transcription factor; highly inducible in zinc-depleted conditions; localizes to the soluble fraction; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; YOR387C has a paralog, VEL1, that arose from a single-locus duplication -S000036646 CDS YOR387C 15 1070241 1069621 C 2011-02-03 1996-07-31 -S000005915 ORF Verified YOR388C FDH1 formate dehydrogenase (NAD+) chromosome 15 L000004078 15 1072923 1071793 C 2011-02-03 1996-07-31 NAD(+)-dependent formate dehydrogenase; may protect cells from exogenous formate -S000036744 CDS YOR388C 15 1072923 1071793 C 2011-02-03 1996-07-31 -S000005916 ORF Uncharacterized YOR389W chromosome 15 15 1074213 1076087 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression regulated by copper levels -S000037549 CDS YOR389W 15 1074213 1076087 W 2011-02-03 1996-07-31 -S000005917 ORF Verified YOR390W FEX1 fluoride transporter chromosome 15 15 1076784 1077911 W 2011-02-03 1996-07-31 Protein involved in fluoride export; nearly identical to FEX2, and deletion of both proteins results in a large increase in fluoride sensitivity compared with the single mutant; contains two FEX domains connected by a linker; part of a widespread family of conserved fluoride export proteins -S000030291 CDS YOR390W 15 1076784 1077911 W 2011-02-03 1996-07-31 -S000005918 ORF Verified YOR391C HSP33 glutathione-independent methylglyoxalase family protein chromosome 15 15 1079258 1078545 C 2011-02-03 1996-07-31 Possible chaperone and cysteine protease; required for transcriptional reprogramming during the diauxic shift and for survival in stationary phase; similar to E. coli Hsp31 and S. cerevisiae Hsp31p, Hsp32p, and Sno4p; member of the DJ-1/ThiJ/PfpI superfamily, which includes human DJ-1 involved in Parkinson's disease and cancer -S000030329 CDS YOR391C 15 1079258 1078545 C 2011-02-03 1996-07-31 -S000005919 ORF Dubious YOR392W chromosome 15 15 1079282 1079725 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; gene expression induced by heat -S000031315 CDS YOR392W 15 1079282 1079725 W 2011-02-03 1996-07-31 -S000005920 ORF Verified YOR393W ERR1 phosphopyruvate hydratase ERR1 chromosome 15 L000002735 15 1080276 1081589 W 2011-02-03 1996-07-31 Putative phosphopyruvate hydratase -S000031378 CDS YOR393W 15 1080276 1081589 W 2011-02-03 1996-07-31 -S000005921 ORF Verified YOR394W PAU21 seripauperin PAU21 chromosome 15 15 1082718 1083212 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cytosol; identical to Pau22p; encodes two proteins that are translated from 2 different start codons -S000031488 CDS YOR394W 15 1082718 1083212 W 2011-02-03 1996-07-31 -S000028997 telomere TEL15R chromosome 15 15 1083922 1091291 W 229 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XV; composed of an X element core sequence, X element combinatorial repeats, a long Y' element, and a very short terminal stretch of telomeric repeats -S000028998 telomeric_repeat TEL15R 15 1091274 1091291 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XV -S000028999 X_element TEL15R 15 1083922 1084367 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YOR394C-A -S000029000 X_element_combinatorial_repeat TEL15R 15 1084368 1084620 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XV; contains repeats of the D, C, and B types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000029001 Y_prime_element TEL15R 15 1084621 1091273 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome XV; contains an ARS consensus sequence, a region of 36-bp repeats, and ORFs YOR396W and YOR396C-A -S000028718 ORF Uncharacterized YOR394C-A chromosome 15 15 1084369 1084202 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032689 CDS YOR394C-A 15 1084369 1084202 C 2011-02-03 2003-07-29 -S000007526 ORF Uncharacterized YOR396W YRF1-8 Y' element ATP-dependent helicase protein 1 copy 8 chromosome 15 15 1085473 1090863 W 2011-02-03 2000-07-14|2007-02-07 One of several telomeric Y' element-encoded DNA helicases; known as Y'-Help1 (Y'-HELicase Protein 1) -S000037061 CDS YOR396W 15 1085473 1090863 W 2011-02-03 2000-07-14|2007-02-07 -S000028719 ORF Dubious YOR396C-A chromosome 15 15 1090497 1090015 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032691 CDS YOR396C-A 15 1090497 1090015 C 2011-02-03 2003-07-29 -S000028724 ORF Dubious YPL283W-B chromosome 16 16 643 1125 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032709 CDS YPL283W-B 16 643 1125 W 2003-07-29 2003-07-29 -S000028723 ORF Dubious YPL283W-A chromosome 16 16 1426 2001 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032706 CDS YPL283W-A 16 1426 2001 W 2003-07-29 2003-07-29 -S000006204 ORF Verified YPL283C YRF1-7 Y' element ATP-dependent helicase protein 1 copy 7|YRF1 chromosome 16 16 6007 280 C 1996-07-31 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p -S000036889 CDS YPL283C 16 5840 280 C 1996-07-31 1996-07-31 -S000036888 CDS YPL283C 16 6007 5989 C 1996-07-31 1996-07-31 -S000036890 intron YPL283C 16 5988 5841 C 1996-07-31 1996-07-31 -S000028933 telomere TEL16L chromosome 16 16 7223 1 C -169 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XVI; annotated components include an X element core sequence, X element combinatorial repeats, and a long Y' element; TEL16L does have telomeric repeats (TEL16L-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly -S000028934 X_element TEL16L 16 7223 6778 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XVI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028935 X_element_combinatorial_repeat TEL16L 16 6777 6525 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XVI; contains repeats of the D, C and B types; formerly called SubTelomeric Repeats -S000028936 Y_prime_element TEL16L 16 6524 1 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome XVI; contains an ARS consensus sequence, a region of 36-bp repeats, and ORFs YRF1-7/YPL283C, YPL283W-A, YPL283W-B -S000006203 ORF Verified YPL282C PAU22 seripauperin PAU22 chromosome 16 16 8427 7933 C 1996-07-31 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole; identical to Pau21p; encodes two proteins that are translated from two different start codons -S000036818 CDS YPL282C 16 8427 7933 C 1996-07-31 1996-07-31 -S000006202 ORF Verified YPL281C ERR2 phosphopyruvate hydratase ERR2 chromosome 16 L000004075 16 10870 9557 C 1996-07-31 1996-07-31 Enolase, a phosphopyruvate hydratase; catalyzes the conversion of 2-phosphoglycerate to phosphoenolpyruvate; complements the growth defect of an ENO1 ENO2 double mutant -S000035948 CDS YPL281C 16 10870 9557 C 1996-07-31 1996-07-31 -S000006201 ORF Verified YPL280W HSP32 glutathione-independent methylglyoxalase family protein chromosome 16 16 11887 12600 W 1996-07-31 1996-07-31 Possible chaperone and cysteine protease; required for transcriptional reprogramming during the diauxic shift and for survival in stationary phase; similar to E. coli Hsp31 and S. cerevisiae Hsp31p, Hsp33p, and Sno4p; member of the DJ-1/ThiJ/PfpI superfamily, which includes human DJ-1 involved in Parkinson's disease and cancer -S000035901 CDS YPL280W 16 11887 12600 W 1996-07-31 1996-07-31 -S000006200 ORF Verified YPL279C FEX2 fluoride transporter chromosome 16 16 14355 13228 C 1996-07-31 1996-07-31 Protein involved in fluoride export; nearly identical to FEX1, and deletion of both proteins results in a large increase in fluoride sensitivity compared with the single mutant; contains two FEX domains connected by a linker; part of a widespread family of conserved fluoride export proteins -S000034797 CDS YPL279C 16 14355 13228 C 1996-07-31 1996-07-31 -S000006199 ORF Uncharacterized YPL278C chromosome 16 16 15355 15053 C 1996-07-31 1996-07-31 Putative protein of unknown function; gene expression regulated by copper levels -S000034632 CDS YPL278C 16 15355 15053 C 1996-07-31 1996-07-31 -S000006198 ORF Uncharacterized YPL277C chromosome 16 16 16868 15405 C 1996-07-31 1996-07-31 Putative protein of unknown function; localized to the membranes; gene expression regulated by copper levels -S000033762 CDS YPL277C 16 16868 15405 C 1996-07-31 1996-07-31 -S000006197 pseudogene YPL276W FDH2 chromosome 16 16 17948 18385 W 1996-07-31 1996-07-31 NAD(+)-dependent formate dehydrogenase; may protect cells from exogenous formate; YPL275W and YPL276W comprise a continuous open reading frame in some S. cerevisiae strains but not in the genomic reference strain S288C -S000033699 CDS YPL276W 16 17948 18385 W 1996-07-31 1996-07-31 -S000006196 pseudogene YPL275W FDH2 chromosome 16 16 18369 19079 W 1996-07-31 1996-07-31 NAD(+)-dependent formate dehydrogenase; may protect cells from exogenous formate; YPL275W and YPL276W comprise a continuous open reading frame in some S. cerevisiae strains but not in the genomic reference strain S288C -S000033615 CDS YPL275W 16 18369 19079 W 1996-07-31 1996-07-31 -S000130195 ARS ARS1603 chromosome 16 16 18370 19069 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006195 ORF Verified YPL274W SAM3 bifunctional polyamine/amino acid permease SAM3 chromosome 16 L000004875 16 22938 24701 W 1996-07-31 1996-07-31 High-affinity S-adenosylmethionine permease; required for utilization of S-adenosylmethionine as a sulfur source; has similarity to S-methylmethionine permease Mmp1p -S000033506 CDS YPL274W 16 22938 24701 W 1996-07-31 1996-07-31 -S000006194 ORF Verified YPL273W SAM4 S-adenosylmethionine-homocysteine S-methyltransferase SAM4 chromosome 16 16 25087 26064 W 1996-07-31 1996-07-31 S-adenosylmethionine-homocysteine methyltransferase; functions along with Mht1p in the conversion of S-adenosylmethionine (AdoMet) to methionine to control the methionine/AdoMet ratio; SAM4 has a paralog, YMR321C, that arose from a single-locus duplication -S000032785 CDS YPL273W 16 25087 26064 W 1996-07-31 1996-07-31 -S000006193 ORF Uncharacterized YPL272C PBI1 chromosome 16 16 28164 26611 C 1996-07-31 1996-07-31 Putative protein of unknown function; gene expression induced in response to ketoconazole; YPL272C is not an essential gene -S000032642 CDS YPL272C 16 28164 26611 C 1996-07-31 1996-07-31 -S000006192 ORF Verified YPL271W ATP15 F1F0 ATP synthase subunit epsilon|ATPEPSILON chromosome 16 L000000151|L000000152 16 30079 30267 W 1996-07-31 1996-07-31 Epsilon subunit of the F1 sector of mitochondrial F1F0 ATP synthase; which is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated -S000032564 CDS YPL271W 16 30079 30267 W 1996-07-31 1996-07-31 -S000006191 ORF Verified YPL270W MDL2 ATP-binding cassette permease MDL2 chromosome 16 L000001050 16 30482 32803 W 2003-09-22 2003-09-22|1996-07-31 Mitochondrial inner membrane half-type ABC transporter; required for respiratory growth at high temperature; localizes to vacuole membrane in response to H2O2; similar to human TAP1 and TAP2 implicated in bare lymphocyte syndrome and Wegener-like granulomatosis -S000031583 CDS YPL270W 16 30482 32803 W 2003-09-22 2003-09-22|1996-07-31 -S000006190 ORF Verified YPL269W KAR9 chromosome 16 L000002932 16 33013 34947 W 1996-07-31 1996-07-31 Spindle positioning factor; orients astral microtubules, connecting them to actin cables at the cortex with Bim1p and Myo2, resulting in proper spindle positioning; targeted for StuBL-dependent degradation at kinetochores by Slx5p-Slx8p, ensuring chromosome transmission fidelity and correct spindle positioning; role in karyogamy; localizes to the shmoo tip, the growing bud-tip, the nucleus, the kinetochore, the spindle and microtubules; homolog of adenomatous polyposis coli -S000031613 CDS YPL269W 16 33013 34947 W 1996-07-31 1996-07-31 -S000006189 ORF Verified YPL268W PLC1 phosphatidylinositol phospholipase C chromosome 16 L000001448 16 35236 37845 W -167.2 1996-07-31 1996-07-31 Phospholipase C; hydrolyzes phosphatidylinositol 4,5-biphosphate (PIP2) to generate the signaling molecules inositol 1,4,5-triphosphate (IP3) and 1,2-diacylglycerol (DAG); involved in regulating many cellular processes; Plc1p and inositol polyphosphates are required for acetyl-CoA homeostasis which regulates global histone acetylation -S000031510 CDS YPL268W 16 35236 37845 W 1996-07-31 1996-07-31 -S000006188 ORF Verified YPL267W ACM1 chromosome 16 16 38169 38798 W 1996-07-31 1996-07-31 Pseudosubstrate inhibitor of the APC/C; suppresses APC/C [Cdh1]-mediated proteolysis of mitotic cyclins; associates with Cdh1p, Bmh1p and Bmh2p; cell cycle regulated protein; the anaphase-promoting complex/cyclosome is also known as APC/C -S000030663 CDS YPL267W 16 38169 38798 W 1996-07-31 1996-07-31 -S000006187 ORF Verified YPL266W DIM1 putative dimethyladenosine transferase|CDH1 chromosome 16 L000002579 16 39121 40077 W 1996-07-31 1996-07-31 Essential 18S rRNA dimethylase (dimethyladenosine transferase); responsible for conserved m6(2)Am6(2)A dimethylation in 3'-terminal loop of 18S rRNA, part of 90S and 40S pre-particles in nucleolus, involved in pre-ribosomal RNA processing; human homolog DIMT1 complements yeast dim1 mutant -S000030548 CDS YPL266W 16 39121 40077 W 1996-07-31 1996-07-31 -S000006186 ORF Verified YPL265W DIP5 chromosome 16 L000003178 16 41043 42869 W 1996-07-31 1996-07-31 Dicarboxylic amino acid permease; mediates high-affinity and high-capacity transport of L-glutamate and L-aspartate; also a transporter for Gln, Asn, Ser, Ala, and Gly; relocalizes from plasma membrane to vacuole upon DNA replication stress -S000030403 CDS YPL265W 16 41043 42869 W 1996-07-31 1996-07-31 -S000118411 ARS ARS1604 ARSXVI-43 chromosome 16 16 42977 43212 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178190 ARS_consensus_sequence ARS1604 16 43163 43147 C 2014-11-18 2014-11-18 -S000006185 ORF Uncharacterized YPL264C chromosome 16 16 44344 43283 C 1996-07-31 1996-07-31 Putative membrane protein of unknown function; physically interacts with Hsp82p; YPL264C is not an essential gene -S000037545 CDS YPL264C 16 44344 43283 C 1996-07-31 1996-07-31 -S000006184 ORF Verified YPL263C KEL3 chromosome 16 16 46506 44551 C 1996-07-31 1996-07-31 Cytoplasmic protein of unknown function -S000037435 CDS YPL263C 16 46506 44551 C 1996-07-31 1996-07-31 -S000006183 ORF Verified YPL262W FUM1 fumarase FUM1 chromosome 16 L000000632 16 47336 48802 W 1996-07-31 1996-07-31 Fumarase; converts fumaric acid to L-malic acid in the TCA cycle; cytosolic and mitochondrial distribution determined by the N-terminal targeting sequence, protein conformation, and status of glyoxylate shunt; phosphorylated in mitochondria -S000037382 CDS YPL262W 16 47336 48802 W 1996-07-31 1996-07-31 -S000006181 ORF Verified YPL260W CUB1 chromosome 16 16 49303 50958 W 1996-07-31 1996-07-31 Conserved fungal gene linked to DNA repair and proteasome function; putative substrate of cAMP-dependent protein kinase (PKA); green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YPL260W is not an essential gene; protein abundance increases in response to DNA replication stress -S000036555 CDS YPL260W 16 49303 50958 W 1996-07-31 1996-07-31 -S000006182 ORF Uncharacterized YPL261C chromosome 16 16 49304 48996 C 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YPL261C is not an essential gene; partially overlaps verified ORF YPL260W -S000036608 CDS YPL261C 16 49304 48996 C 1996-07-31 1996-07-31 -S000006180 ORF Verified YPL259C APM1 YAP54 chromosome 16 L000002494 16 52671 51244 C 1996-07-31 1996-07-31 Mu1-like medium subunit of the AP-1 complex; binds clathrin; involved in clathrin-dependent Golgi protein sorting; the AP-1 complex is the clathrin-associated protein complex -S000036655 CDS YPL259C 16 52671 51244 C 1996-07-31 1996-07-31 -S000006179 ORF Verified YPL258C THI21 bifunctional hydroxymethylpyrimidine kinase/phosphomethylpyrimidine kinase chromosome 16 16 55153 53498 C 1996-07-31 1996-07-31 Hydroxymethylpyrimidine (HMP) and HMP-phosphate kinase; involved in thiamine biosynthesis; member of a gene family with THI20 and THI22; functionally redundant with Thi20p -S000035722 CDS YPL258C 16 55153 53498 C 1996-07-31 1996-07-31 -S000007184 long_terminal_repeat YPLCdelta1 chromosome 16 16 55858 55657 C 2000-05-19 2000-05-19 Ty1 LTR -S000006776 tRNA_gene tW(CCA)P chromosome 16 L000003737 16 56274 56169 C 2000-05-19 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis -S000034120 intron tW(CCA)P 16 56238 56205 C 2000-05-19 2000-05-19 -S000034119 noncoding_exon tW(CCA)P 16 56204 56169 C 2000-05-19 2000-05-19 -S000034118 noncoding_exon tW(CCA)P 16 56274 56239 C 2000-05-19 2000-05-19 -S000007198 long_terminal_repeat YPLWsigma1 chromosome 16 16 56290 56358 W 2000-05-19 2000-05-19 Ty3 LTR -S000007189 long_terminal_repeat YPLWdelta2 chromosome 16 16 56409 56451 W 2000-05-19 2000-05-19 Ty1 LTR -S000007190 long_terminal_repeat YPLWdelta3 chromosome 16 16 56452 56788 W 2000-05-19 2000-05-19 Ty1 LTR -S000007199 LTR_retrotransposon YPLWTy1-1 Ty1 chromosome 16 16 56452 62375 W 2000-05-19 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007357 transposable_element_gene YPL257W-A gag protein chromosome 16 16 56748 58070 W 1996-07-31 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000033164 CDS YPL257W-A 16 56748 58070 W 1996-07-31 1996-07-31 -S000007358 transposable_element_gene YPL257W-B gag-pol fusion protein chromosome 16 16 56748 62016 W 1997-07-17 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000033173 CDS YPL257W-B 16 56748 58052 W 1997-07-17 1997-07-17 -S000033174 CDS YPL257W-B 16 58054 62016 W 1997-07-17 1997-07-17 -S000033175 plus_1_translational_frameshift YPL257W-B 16 58053 58053 W 1997-07-17 1997-07-17 -S000007191 long_terminal_repeat YPLWdelta4 chromosome 16 16 62039 62375 W 2000-05-19 2000-05-19 Ty1 LTR -S000007192 long_terminal_repeat YPLWdelta5 chromosome 16 16 62389 62720 W 2000-05-19 2000-05-19 Ty2 LTR -S000007193 long_terminal_repeat YPLWdelta6 chromosome 16 16 62724 63006 W 2000-05-19 2000-05-19 Ty1 LTR -S000006178 ORF Uncharacterized YPL257W chromosome 16 16 63279 63860 W 1996-07-31 1996-07-31 Putative protein of unknown function; homozygous diploid deletion strain exhibits low budding index; physically interacts with Hsp82p; YPL257W is not an essential gene -S000035666 CDS YPL257W 16 63279 63860 W 1996-07-31 1996-07-31 -S000006177 ORF Verified YPL256C CLN2 cyclin CLN2 chromosome 16 L000000358 16 66614 64977 C 1996-07-31 1996-07-31 G1 cyclin involved in regulation of the cell cycle; activates Cdc28p kinase to promote the G1 to S phase transition; late G1 specific expression depends on transcription factor complexes, MBF (Swi6p-Mbp1p) and SBF (Swi6p-Swi4p); CLN2 has a paralog, CLN1, that arose from the whole genome duplication; cell cycle arrest phenotype of the cln1 cln2 cln3 triple null mutant is complemented by any of human cyclins CCNA2, CCNB1, CCNC, CCND1, or CCNE1 -S000035542 CDS YPL256C 16 66614 64977 C 1996-07-31 1996-07-31 -S000006176 ORF Verified YPL255W BBP1 chromosome 16 L000003060 16 67725 68882 W 1996-07-31 1996-07-31 Protein required for the spindle pole body (SPB) duplication; localizes at the cytoplasmic side of the central plaque periphery of the SPB; forms a complex with a nuclear envelope protein Mps2p and SPB components Spc29p and Kar1p; required for mitotic functions of Cdc5p -S000035492 CDS YPL255W 16 67725 68882 W 1996-07-31 1996-07-31 -S000006175 ORF Verified YPL254W HFI1 GAN1|SRM12|SUP110|ADA1 chromosome 16 L000003094 16 69485 70951 W 1996-07-31 1996-07-31 Adaptor protein required for structural integrity of the SAGA complex; a histone acetyltransferase-coactivator complex that is involved in global regulation of gene expression through acetylation and transcription functions -S000034469 CDS YPL254W 16 69485 70951 W 1996-07-31 1996-07-31 -S000006174 ORF Verified YPL253C VIK1 chromosome 16 L000004276 16 73006 71063 C 1996-07-31 1996-07-31 Protein that forms a kinesin-14 heterodimeric motor with Kar3p; localizes Kar3p at mitotic spindle poles; has a structure similar to a kinesin motor domain but lacks an ATP-binding site and is catalytically inactive; binds microtubules; required for sister chromatid cohesion; VIK1 has a paralog, CIK1, that arose from the whole genome duplication -S000034335 CDS YPL253C 16 73006 71063 C 1996-07-31 1996-07-31 -S000118412 ARS ARS1605 ARSXVI-73 chromosome 16 16 73032 73227 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000006172 ORF Dubious YPL251W chromosome 16 16 73625 73927 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps 5' end of the verified, essential gene YAH1/YPL252C -S000033368 CDS YPL251W 16 73625 73927 W 1996-07-31 1996-07-31 -S000006173 ORF Verified YPL252C YAH1 adrenodoxin chromosome 16 L000004699 16 73881 73363 C 1996-07-31 1996-07-31 Ferredoxin of the mitochondrial matrix; required for formation of cellular iron-sulfur proteins; involved in heme A biosynthesis; human homolog FDX1L can complement yeast by allowing growth during down-regulation of yeast YAH1 -S000033428 CDS YPL252C 16 73881 73363 C 1996-07-31 1996-07-31 -S000006171 ORF Verified YPL250C ATG41 ICY2 chromosome 16 S000007528 16 74719 74309 C 1996-07-31 1996-07-31 Protein of unknown function; required for selective and nonselective autophagy, and mitophagy; regulates the rate of autophagosome formation; interacts with Atg9p, and has a similar peri-mitochondrial localization; elevated Gcn4p-dependent expression under autophagy-inducing conditions; mobilized into polysomes upon a shift from a fermentable to nonfermentable carbon source; potential Cdc28p substrate; ATG41 has a paralog, ICY1, that arose from the whole genome duplication -S000033279 CDS YPL250C 16 74719 74309 C 1996-07-31 1996-07-31 -S000028589 ORF Dubious YPL250W-A chromosome 16 16 75702 75989 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified ORF RPL36B/YPL249C-A; identified by fungal homology and RT-PCR -S000031342 CDS YPL250W-A 16 75702 75989 W 2003-07-29 2003-07-29 -S000006438 ORF Verified YPL249C-A RPL36B eL36|ribosomal 60S subunit protein L36B|L36e|YL39|L39|L36B chromosome 16 L000004515 16 76239 75699 C 1999-07-17 1999-07-17 Ribosomal 60S subunit protein L36B; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L36, no bacterial homolog; RPL36B has a paralog, RPL36A, that arose from the whole genome duplication -S000032350 CDS YPL249C-A 16 75985 75699 C 1997-07-17 1997-07-17 -S000032349 CDS YPL249C-A 16 76239 76224 C 1999-07-17 1999-07-17 -S000032351 intron YPL249C-A 16 76223 75986 C 1997-07-17 1997-07-17 -S000006170 ORF Verified YPL249C GYP5 chromosome 16 16 79353 76669 C 1996-07-31 1996-07-31 GTPase-activating protein (GAP) for yeast Rab family members; involved in ER to Golgi trafficking; exhibits GAP activity toward Ypt1p that is stimulated by Gyl1p, also acts on Sec4p; interacts with Gyl1p, Rvs161p and Rvs167p; involved in recruiting Rvs167p to the bud tip during polarized growth; relocalizes from bud neck to cytoplasm upon DNA replication stress; GYP5 has a paralog, GYL1, that arose from the whole genome duplication -S000032543 CDS YPL249C 16 79353 76669 C 1996-07-31 1996-07-31 -S000006169 ORF Verified YPL248C GAL4 galactose-responsive transcription factor GAL4|GAL81 chromosome 16 L000000661 16 82356 79711 C -143 1996-07-31 1996-07-31 DNA-binding transcription factor required for activating GAL genes; responds to galactose; repressed by Gal80p and activated by Gal3p -S000032436 CDS YPL248C 16 82356 79711 C 1996-07-31 1996-07-31 -S000006168 ORF Uncharacterized YPL247C chromosome 16 16 84196 82625 C 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; similar to the petunia WD repeat protein an11; overexpression causes a cell cycle delay or arrest -S000031428 CDS YPL247C 16 84196 82625 C 1996-07-31 1996-07-31 -S000006167 ORF Verified YPL246C RBD2 putative rhomboid protease RBD2 chromosome 16 16 85297 84509 C 1996-07-31 1996-07-31 Possible rhomboid protease; has similarity to eukaryotic rhomboid proteases including Pcp1p -S000031296 CDS YPL246C 16 85297 84509 C 1996-07-31 1996-07-31 -S000006166 ORF Uncharacterized YPL245W chromosome 16 16 85586 86950 W 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the nucleus and the cytoplasm -S000031264 CDS YPL245W 16 85586 86950 W 1996-07-31 1996-07-31 -S000006165 ORF Verified YPL244C HUT1 chromosome 16 16 88033 87014 C 1996-07-31 1996-07-31 Protein with a role in UDP-galactose transport to the Golgi lumen; has similarity to human UDP-galactose transporter UGTrel1, exhibits a genetic interaction with S. cerevisiae ERO1 -S000031081 CDS YPL244C 16 88033 87014 C 1996-07-31 1996-07-31 -S000006164 ORF Verified YPL243W SRP68 signal recognition particle subunit SRP68 chromosome 16 L000002065 16 88517 90316 W 1996-07-31 1996-07-31 Core component of the signal recognition particle (SRP) complex; SRP complex functions in targeting nascent secretory proteins to the endoplasmic reticulum (ER) membrane; relocalizes from cytoplasm to the nuclear periphery upon DNA replication stress -S000030136 CDS YPL243W 16 88517 90316 W 1996-07-31 1996-07-31 -S000006163 ORF Verified YPL242C IQG1 CYK1 chromosome 16 L000004180 16 95109 90622 C 1996-07-31 1996-07-31 Essential protein required for determination of budding pattern; promotes localization of axial markers Bud4p and Cdc12p and functionally interacts with Sec3p, localizes to the contractile ring during anaphase, member of the IQGAP family; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000029942 CDS YPL242C 16 95109 90622 C 1996-07-31 1996-07-31 -S000006162 ORF Verified YPL241C CIN2 GTPase-activating protein CIN2 chromosome 16 L000000337 16 96258 95372 C -143 1996-07-31 1996-07-31 GTPase-activating protein (GAP) for Cin4p; tubulin folding factor C involved in beta-tubulin (Tub2p) folding; mutants display increased chromosome loss and benomyl sensitivity; human homolog RP2 complements yeast null mutant -S000037281 CDS YPL241C 16 96153 95372 C 1996-07-31 1996-07-31 -S000037280 CDS YPL241C 16 96258 96234 C 1996-07-31 1996-07-31 -S000037282 intron YPL241C 16 96233 96154 C 1996-07-31 1996-07-31 -S000006161 ORF Verified YPL240C HSP82 Hsp90 family chaperone HSP82|HSP90 chromosome 16 L000000822 16 98625 96496 C -137 1996-07-31 1996-07-31 Hsp90 chaperone; redundant in function with Hsc82p; required for pheromone signaling, negative regulation of Hsf1p; docks with Tom70p for mitochondrial preprotein delivery; promotes telomerase DNA binding, nucleotide addition; protein abundance increases in response to DNA replication stress; contains two acid-rich unstructured regions that promote solubility of chaperone-substrate complexes; HSP82 has a paralog, HSC82, that arose from the whole genome duplication -S000037196 CDS YPL240C 16 98625 96496 C 1996-07-31 1996-07-31 -S000006160 ORF Verified YPL239W YAR1 chromosome 16 L000002496 16 99484 100086 W 1996-07-31 1996-07-31 Ankyrin-repeat containing, nucleocytoplasmic shuttling chaperone; prevents aggregation of Rps3p in the cytoplasm, associates with nascent Rps3p during its translation in the cytoplasm and delivers it to the 90S in the nucleus; required for 40S ribosomal subunit export, biogenesis and adaptation to osmotic and oxidative stress; expression repressed by heat shock -S000036306 CDS YPL239W 16 99484 100086 W 1996-07-31 1996-07-31 -S000006158 ORF Verified YPL237W SUI3 translation initiation factor eIF2 subunit beta chromosome 16 L000002179 16 100496 101353 W 1996-07-31 1996-07-31 Beta subunit of the translation initiation factor eIF2; involved in the identification of the start codon; proposed to be involved in mRNA binding -S000035286 CDS YPL237W 16 100496 101353 W 1996-07-31 1996-07-31 -S000006159 ORF Dubious YPL238C chromosome 16 16 100863 100474 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps 5' end of the verified essential gene SUI3/YPL237W -S000036133 CDS YPL238C 16 100863 100474 C 1996-07-31 1996-07-31 -S000006157 ORF Verified YPL236C ENV7 putative serine/threonine protein kinase ENV7 chromosome 16 16 102702 101608 C 1996-07-31 1996-07-31 Vacuolar membrane protein kinase; negatively regulates membrane fusion; associates with vacuolar membrane through palmitoylation of one or more cysteines in consensus sequence; vacuolar membrane association is essential to its kinase activity; mutant shows defect in CPY processing; ortholog of human serine/threonine kinase 16 (STK16) -S000035042 CDS YPL236C 16 102702 101608 C 1996-07-31 1996-07-31 -S000006156 ORF Verified YPL235W RVB2 RuvB family ATP-dependent DNA helicase reptin|TIP48|TIH2|TIP49B chromosome 16 S000007484 16 103232 104647 W 1996-07-31 1996-07-31 ATP-dependent DNA helicase, also known as reptin; member of the AAA+ and RuvB protein families, similar to Rvb1p; conserved component of multiple complexes including the INO80 complex, the Swr1 complex, and the R2TP complex (Rvb1-Rvb2-Tah1-Pih1); involved in multiple processes such as chromatin remodeling, box C/D snoRNP assembly, and RNA polymerase II assembly -S000034953 CDS YPL235W 16 103232 104647 W 1996-07-31 1996-07-31 -S000006155 ORF Verified YPL234C VMA11 H(+)-transporting V0 sector ATPase subunit c'|TFP3|CLS9 chromosome 16 L000002290|L000002464 16 105440 104946 C 1996-07-31 1996-07-31 Vacuolar ATPase V0 domain subunit c'; involved in proton transport activity; hydrophobic integral membrane protein (proteolipid) containing four transmembrane segments; N and C termini are in the vacuolar lumen -S000033991 CDS YPL234C 16 105440 104946 C 1996-07-31 1996-07-31 -S000006154 ORF Verified YPL233W NSL1 MIND complex subunit NSL1 chromosome 16 L000004652 16 106172 106822 W 1996-07-31 1996-07-31 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; required for accurate chromosome segregation; complex consists of Mtw1p Including Nnf1p-Nsl1p-Dsn1p (MIND) -S000033898 CDS YPL233W 16 106172 106822 W 1996-07-31 1996-07-31 -S000006153 ORF Verified YPL232W SSO1 syntaxin chromosome 16 L000002089 16 107275 108147 W 1996-07-31 1996-07-31 Plasma membrane t-SNARE; involved in fusion of secretory vesicles at the plasma membrane and in vesicle fusion during sporulation; forms a complex with Sec9p that binds v-SNARE Snc2p; syntaxin homolog; functionally redundant with Sso2p; SSO1 has a paralog, SSO2, that arose from the whole genome duplication -S000033777 CDS YPL232W 16 107275 108147 W 1996-07-31 1996-07-31 -S000006152 ORF Verified YPL231W FAS2 trifunctional fatty acid synthase subunit FAS2 chromosome 16 L000000602 16 108652 114315 W -125 1996-07-31 1996-07-31 Alpha subunit of fatty acid synthetase; complex catalyzes the synthesis of long-chain saturated fatty acids; contains the acyl-carrier protein domain and beta-ketoacyl reductase, beta-ketoacyl synthase and self-pantetheinylation activities -S000033048 CDS YPL231W 16 108652 114315 W 1996-07-31 1996-07-31 -S000006151 ORF Verified YPL230W USV1 NSF1 chromosome 16 L000004623 16 115312 116487 W 1996-07-31 1996-07-31 Putative transcription factor containing a C2H2 zinc finger; mutation affects transcriptional regulation of genes involved in growth on non-fermentable carbon sources, response to salt stress and cell wall biosynthesis; USV1 has a paralog, RGM1, that arose from the whole genome duplication -S000032959 CDS YPL230W 16 115312 116487 W 1996-07-31 1996-07-31 -S000122111 five_prime_UTR_intron YPL230W 16 115219 115293 W 2007-04-04 2007-04-04 -S000118413 ARS ARS1607 ARSXVI-117 chromosome 16 16 116566 116680 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178191 ARS_consensus_sequence ARS1607 16 116593 116609 W 2014-11-18 2014-11-18 -S000006150 ORF Uncharacterized YPL229W chromosome 16 16 117067 117687 W 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; not an essential gene; YPL229W has a paralog, YMR181C, that arose from the whole genome duplication -S000032811 CDS YPL229W 16 117067 117687 W 1996-07-31 1996-07-31 -S000006149 ORF Verified YPL228W CET1 polynucleotide 5'-phosphatase|CES5 chromosome 16 L000004278 16 118382 120031 W 1996-07-31 1996-07-31 RNA 5'-triphosphatase involved in mRNA 5' capping; subunit of mRNA capping enzyme, which is a heterotetramer composed of a Cet1p homodimer and two molecules of guanylyltransferase Ceg1p; Cet1p also has a role in regulation of RNAPII pausing at promoter-proximal sites; interaction between Cet1p and Ceg1p is required for Ceg1p nuclear import; mammalian enzyme is single bifunctional polypeptide; human homolog RNGTT can complement yeast cet1 null mutant -S000032710 CDS YPL228W 16 118382 120031 W 1996-07-31 1996-07-31 -S000006148 ORF Verified YPL227C ALG5 dolichyl-phosphate beta-glucosyltransferase chromosome 16 L000000077 16 121167 120163 C 1996-07-31 1996-07-31 UDP-glucose:dolichyl-phosphate glucosyltransferase; involved in asparagine-linked glycosylation in the endoplasmic reticulum; human ortholog ALG5 can partially complement yeast alg5 mutant -S000032583 CDS YPL227C 16 121167 120163 C 1996-07-31 1996-07-31 -S000006147 ORF Verified YPL226W NEW1 chromosome 16 S000007490 16 121767 125357 W 1996-07-31 1996-07-31 ATP binding cassette protein; cosediments with polysomes and is required for biogenesis of the small ribosomal subunit; Asn/Gln-rich rich region supports [NU+] prion formation and susceptibility to [PSI+] prion induction -S000031654 CDS YPL226W 16 121767 125357 W 1996-07-31 1996-07-31 -S000006146 ORF Verified YPL225W chromosome 16 16 126006 126446 W 1996-07-31 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; protein abundance increases in response to DNA replication stress -S000031511 CDS YPL225W 16 126006 126446 W 1996-07-31 1996-07-31 -S000006145 ORF Verified YPL224C MMT2 MFT2 chromosome 16 L000004108 16 128088 126634 C 2011-02-03 1996-07-31|2011-02-03 Putative metal transporter involved in mitochondrial iron accumulation; MMT2 has a paralog, MMT1, that arose from the whole genome duplication -S000030540 CDS YPL224C 16 128088 126634 C 2011-02-03 1996-07-31|2011-02-03 -S000006144 ORF Verified YPL223C GRE1 chromosome 16 L000004176 16 129138 128632 C 2011-02-03 1996-07-31 Hydrophilin essential in desiccation-rehydration process; stress induced (osmotic, ionic, oxidative, heat shock and heavy metals); regulated by the HOG pathway; GRE1 has a paralog, SIP18, that arose from the whole genome duplication -S000030402 CDS YPL223C 16 129138 128632 C 2011-02-03 1996-07-31 -S000006143 ORF Uncharacterized YPL222W FMP40 chromosome 16 16 130162 132228 W 2011-02-03 1996-07-31 Putative protein of unknown function; proposed to be involved in responding to environmental stresses; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000030350 CDS YPL222W 16 130162 132228 W 2011-02-03 1996-07-31 -S000028722 ORF Dubious YPL222C-A chromosome 16 16 132115 131870 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032704 CDS YPL222C-A 16 132115 131870 C 2011-02-03 2003-07-29 -S000006142 ORF Verified YPL221W FLC1 flavin adenine dinucleotide transporter|BOP1|HUF1 chromosome 16 L000004721 16 133043 135424 W 2011-02-03 1996-07-31 Flavin adenine dinucleotide transporter; required for uptake of FAD into endoplasmic reticulum; involved in cell wall maintenance; FLC1 has a paralog, FLC3, that arose from the whole genome duplication -S000030150 CDS YPL221W 16 133043 135424 W 2011-02-03 1996-07-31 -S000006141 ORF Verified YPL220W RPL1A uL1|PUB2|ribosomal 60S subunit protein L1A|L1|L1A|SSM1 chromosome 16 L000002657 16 135790 136443 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L1A; N-terminally acetylated; homologous to mammalian ribosomal protein L10A and bacterial L1; RPL1A has a paralog, RPL1B, that arose from the whole genome duplication; rpl1a rpl1b double null mutation is lethal -S000037448 CDS YPL220W 16 135790 136443 W 2011-02-03 1996-07-31 -S000006140 ORF Verified YPL219W PCL8 chromosome 16 L000004040 16 136750 138228 W 2011-02-03 1996-07-31 Cyclin; interacts with Pho85p cyclin-dependent kinase (Cdk) to phosphorylate and regulate glycogen synthase, also activates Pho85p for Glc8p phosphorylation; PCL8 has a paralog, PCL10, that arose from the whole genome duplication -S000036617 CDS YPL219W 16 136750 138228 W 2011-02-03 1996-07-31 -S000006139 ORF Verified YPL218W SAR1 Arf family GTPase SAR1 chromosome 16 L000001801 16 138698 139409 W 2011-02-03 1996-07-31 ARF family GTPase; component of the COPII vesicle coat; required for transport vesicle formation during ER to Golgi protein transport; lowers membrane rigidity aiding vesicle formation; localizes to ER-mitochondrial contact sites where it enhances membrane curvature, thereby reducing contact size via its N-terminal amphipathic helix; regulates mitochondrial fission and fusion dynamics -S000036527 CDS YPL218W 16 138698 138725 W 2011-02-03 1996-07-31 -S000036528 CDS YPL218W 16 138865 139409 W 2011-02-03 1996-07-31 -S000036529 intron YPL218W 16 138726 138864 W 2011-02-03 1996-07-31 -S000006138 ORF Verified YPL217C BMS1 GTPase BMS1 chromosome 16 16 143171 139620 C 2011-02-03 1996-07-31 GTPase required for ribosomal subunit synthesis and rRNA processing; required for synthesis of 40S ribosomal subunits and for processing the 35S pre-rRNA at sites A0, A1, and A2; interacts with Rcl1p, which stimulates its GTPase and U3 snoRNA binding activities; has similarity to Tsr1p -S000035571 CDS YPL217C 16 143171 139620 C 2011-02-03 1996-07-31 -S000006137 ORF Uncharacterized YPL216W chromosome 16 16 143821 147129 W 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential gene; YPL216W has a paralog, ITC1, that arose from the whole genome duplication -S000035522 CDS YPL216W 16 143821 147129 W 2011-02-03 1996-07-31 -S000006136 ORF Verified YPL215W CBP3 chromosome 16 L000000226 16 147416 148423 W 2011-02-03 1996-07-31 Mitochondrial protein required for assembly of cytochrome bc1 complex; forms a complex with Cbp6p that binds to mt ribosomes near the polypeptide tunnel exit and promotes efficient translation of the COB mRNA; Cbp3p-Cbp6p complex also interacts with newly synthesized cytochrome b (Cobp) and Cbp4p to promote assembly of Cobp into the cytochrome bc1 complex; Cbp3p-Cbp6p complex is sequestered if assembly of Complex III is blocked, downregulating COB mRNA translation -S000035433 CDS YPL215W 16 147416 148423 W 2011-02-03 1996-07-31 -S000006135 ORF Verified YPL214C THI6 bifunctional hydroxyethylthiazole kinase/thiamine-phosphate diphosphorylase chromosome 16 L000002634 16 150191 148569 C 2011-02-03 1996-07-31 Thiamine-phosphate diphosphorylase and hydroxyethylthiazole kinase; required for thiamine biosynthesis; GFP-fusion protein localizes to the cytoplasm in a punctate pattern -S000034353 CDS YPL214C 16 150191 148569 C 2011-02-03 1996-07-31 -S000006134 ORF Verified YPL213W LEA1 U2 snRNP complex subunit LEA1 chromosome 16 16 150614 151330 W 2011-02-03 1996-07-31 Component of U2 snRNP complex; disruption causes reduced U2 snRNP levels; physically interacts with Msl1p; putative homolog of human U2A' snRNP protein -S000034273 CDS YPL213W 16 150614 151330 W 2011-02-03 1996-07-31 -S000006133 ORF Verified YPL212C PUS1 pseudouridine synthase PUS1 chromosome 16 L000003360 16 153149 151515 C 2011-02-03 1996-07-31 tRNA:pseudouridine synthase; introduces pseudouridines at positions 26-28, 34-36, 65, and 67 of tRNA; also acts on U2 snRNA; also pseudouridylates some mRNAs, and pseudouridylation level varies with growth phase; nuclear protein that appears to be involved in tRNA export; PUS1 has a paralog, PUS2, that arose from the whole genome duplication -S000033309 CDS YPL212C 16 153149 151515 C 2011-02-03 1996-07-31 -S000006132 ORF Verified YPL211W NIP7 ribosome biosynthesis protein NIP7 chromosome 16 L000004183 16 153495 154040 W 2011-02-03 1996-07-31 Nucleolar protein required for 60S ribosome subunit biogenesis; constituent of 66S pre-ribosomal particles; physically interacts with Nop8p and the exosome subunit Rrp43p -S000033280 CDS YPL211W 16 153495 154040 W 2011-02-03 1996-07-31 -S000006131 ORF Verified YPL210C SRP72 signal recognition particle subunit SRP72 chromosome 16 L000002066 16 156212 154290 C 2011-02-03 2003-09-22|1996-07-31 Core component of the signal recognition particle (SRP); the SRP is a ribonucleoprotein (RNP) complex that functions in targeting nascent secretory proteins to the endoplasmic reticulum (ER) membrane -S000033194 CDS YPL210C 16 156212 154290 C 2011-02-03 2003-09-22|1996-07-31 -S000006130 ORF Verified YPL209C IPL1 aurora kinase|PAC15 chromosome 16 L000000871 16 157593 156490 C -116 2011-02-03 1996-07-31 Aurora kinase of chromosomal passenger complex; mediates release of mono-oriented kinetochores from microtubules in meiosis I, and kinetochore release from SPB clusters at meiotic exit; helps maintain condensed chromosomes during anaphase; required for SPB cohesion and prevention of multipolar spindle formation; promotes telomerase release at G2/M; Iocalizes to nuclear foci that diffuse upon DNA replication stress; required for inhibition of karyopherin Pse1p upon SAC arrest -S000032505 CDS YPL209C 16 157593 156490 C 2011-02-03 1996-07-31 -S000006129 ORF Verified YPL208W RKM1 protein-lysine N-methyltransferase chromosome 16 16 157842 159593 W 2011-02-03 1996-07-31 SET-domain lysine-N-methyltransferase; catalyzes the formation of dimethyllysine residues on the large ribosomal subunit proteins L23 (Rpl23Ap and Rpl23Bp) and monomethyllysine residues on L18 (Rps18Ap and Rps18Bp) -S000032466 CDS YPL208W 16 157842 159593 W 2011-02-03 1996-07-31 -S000006128 ORF Verified YPL207W TYW1 putative tRNA 4-demethylwyosine synthase chromosome 16 16 159909 162341 W 2011-02-03 1996-07-31 Iron-sulfer protein required for synthesis of Wybutosine modified tRNA; Wybutosine is a modified guanosine found at the 3'-position adjacent to the anticodon of phenylalanine tRNA which supports reading frame maintenance by stabilizing codon-anticodon interactions; induction by Yap5p in response to iron provides protection from high iron toxicity; overexpression results in increased cellular iron -S000032365 CDS YPL207W 16 159909 162341 W 2011-02-03 1996-07-31 -S000130196 ARS ARS1608 chromosome 16 16 162341 162632 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006127 ORF Verified YPL206C PGC1 phosphatidylglycerol phospholipase chromosome 16 16 163597 162632 C 2011-02-03 1996-07-31 Phosphatidylglycerol phospholipase C; regulates phosphatidylglycerol (PG) accumulation via a phospholipase C-type degradation mechanism; PG levels affect mitochondrial function; contains glycerophosphodiester phosphodiesterase motifs -S000032198 CDS YPL206C 16 163597 162632 C 2011-02-03 1996-07-31 -S000006126 ORF Dubious YPL205C chromosome 16 16 164266 163922 C 2011-02-03 1996-07-31 Hypothetical protein; deletion of locus affects telomere length -S000031200 CDS YPL205C 16 164266 163922 C 2011-02-03 1996-07-31 -S000006125 ORF Verified YPL204W HRR25 serine/threonine protein kinase HRR25|KTI14 chromosome 16 L000000810 16 164276 165760 W 2011-02-03 1996-07-31 Conserved casein kinase; regulates diverse events including: vesicular traffic, DNA repair, the CVT pathway, monopolar attachment of sister kinetochores at meiosis I, and ribosomal subunit biogenesis; monopolin subunit; binds the RNAPII CTD; phosphorylates COPII coat subunits; interacts with Sit4p phosphatase; antagonizes calcineurin signaling, reducing nuclear accumulation of Crz1p; phosphorylates Dsn1p, the kinetochore receptor for monopolin; homolog of mammalian CK1delta -S000031120 CDS YPL204W 16 164276 165760 W 2011-02-03 1996-07-31 -S000006124 ORF Verified YPL203W TPK2 cAMP-dependent protein kinase catalytic subunit TPK2|PKA3|YKR1|PKA2 chromosome 16 L000001445 16 166256 167398 W -120 2011-02-03 1996-07-31 cAMP-dependent protein kinase catalytic subunit; promotes vegetative growth in response to nutrients via the Ras-cAMP signaling pathway; partially redundant with Tpk1p and Tpk3p; localizes to P-bodies during stationary phase; relocalizes to the cytosol in response to hypoxia -S000031020 CDS YPL203W 16 166256 167398 W 2011-02-03 1996-07-31 -S000006123 ORF Verified YPL202C AFT2 chromosome 16 16 169338 168088 C 2011-02-03 1996-07-31 Iron-regulated transcriptional activator; activates genes involved in intracellular iron use and required for iron homeostasis and resistance to oxidative stress; AFT2 has a paralog, AFT1, that arose from the whole genome duplication -S000029960 CDS YPL202C 16 169338 168088 C 2011-02-03 1996-07-31 -S000006122 ORF Verified YPL201C YIG1 chromosome 16 16 171155 169770 C 2011-02-03 1996-07-31 Protein that interacts with glycerol 3-phosphatase; plays a role in anaerobic glycerol production; localizes to the nucleus and cytosol -S000029831 CDS YPL201C 16 171155 169770 C 2011-02-03 1996-07-31 -S000006121 ORF Verified YPL200W CSM4 chromosome 16 16 171484 171954 W 2011-02-03 1996-07-31 Protein required for accurate chromosome segregation during meiosis; involved in meiotic telomere clustering (bouquet formation) and telomere-led rapid prophase movements; functions with meiosis-specific telomere-binding protein Ndj1p; CSM4 has a paralog, MPS2, that arose from the whole genome duplication -S000037884 CDS YPL200W 16 171484 171954 W 2011-02-03 1996-07-31 -S000006120 ORF Uncharacterized YPL199C chromosome 16 16 172755 172033 C 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to be palmitoylated -S000031860 CDS YPL199C 16 172755 172033 C 2011-02-03 1996-07-31 -S000006119 ORF Verified YPL198W RPL7B uL30|ribosomal 60S subunit protein L7B|YL8|L7B|L6B|L30|rp11 chromosome 16 L000003304 16 173152 174702 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L7B; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; contains a conserved C-terminal Nucleic acid Binding Domain (NDB2); binds to Domain II of 25S and 5.8S rRNAs; homologous to mammalian ribosomal protein L7 and bacterial L30; RPL7B has a paralog, RPL7A, that arose from the whole genome duplication -S000031808 CDS YPL198W 16 173152 173162 W 2011-02-03 1996-07-31 -S000031809 CDS YPL198W 16 173572 173665 W 2011-02-03 1996-07-31 -S000031810 CDS YPL198W 16 174073 174702 W 2011-02-03 1996-07-31 -S000031811 intron YPL198W 16 173163 173571 W 2011-02-03 1996-07-31 -S000031812 intron YPL198W 16 173666 174072 W 2011-02-03 1996-07-31 -S000006450 snoRNA_gene snR59 SNR59 chromosome 16 L000004528 16 173827 173904 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A807 -S000030766 noncoding_exon snR59 16 173827 173904 W 2011-02-03 2000-05-19 -S000006118 ORF Dubious YPL197C chromosome 16 16 174756 174343 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the ribosomal gene RPL7B -S000031658 CDS YPL197C 16 174756 174343 C 2011-02-03 1996-07-31 -S000006117 ORF Verified YPL196W OXR1 chromosome 16 16 175043 175864 W 2011-02-03 1996-07-31 Protein of unknown function required for oxidative damage resistance; required for normal levels of resistance to oxidative damage; null mutants are sensitive to hydrogen peroxide; member of a conserved family of proteins found in eukaryotes -S000031609 CDS YPL196W 16 175043 175864 W 2011-02-03 1996-07-31 -S000006116 ORF Verified YPL195W APL5 YKS4 chromosome 16 L000003037 16 176223 179021 W 2011-02-03 1996-07-31 Delta adaptin-like subunit of the clathrin associated protein complex; functions in transport of alkaline phosphatase to the vacuole via the alternate pathway; suppressor of loss of casein kinase 1 function; the clathrin associated protein complex is also known as AP-3 -S000031504 CDS YPL195W 16 176223 179021 W 2011-02-03 1996-07-31 -S000006115 ORF Verified YPL194W DDC1 chromosome 16 L000004256 16 179277 181115 W 2011-02-03 1996-07-31 DNA damage checkpoint protein; part of a PCNA-like complex required for DNA damage response, required for pachytene checkpoint to inhibit cell cycle in response to unrepaired recombination intermediates; potential Cdc28p substrate; forms nuclear foci upon DNA replication stress -S000030638 CDS YPL194W 16 179277 181115 W 2011-02-03 1996-07-31 -S000006114 ORF Verified YPL193W RSA1 chromosome 16 L000004919 16 181403 182548 W 2011-02-03 1996-07-31 Protein involved in the assembly of 60S ribosomal subunits; functionally interacts with Dbp6p; functions in a late nucleoplasmic step of the assembly -S000030542 CDS YPL193W 16 181403 182548 W 2011-02-03 1996-07-31 -S000006113 ORF Verified YPL192C PRM3 pheromone-regulated protein PRM3 chromosome 16 16 183056 182655 C 2011-02-03 1996-07-31 Protein required for nuclear envelope fusion during karyogamy; pheromone-regulated; peripheral protein of the nuclear membrane; interacts with Kar5p at the spindle pole body -S000030353 CDS YPL192C 16 183056 182655 C 2011-02-03 1996-07-31 -S000006112 ORF Verified YPL191C chromosome 16 16 184679 183597 C 2011-02-03 1996-07-31 Protein of unknown function; diploid deletion strain exhibits high budding index; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YPL191C has a paralog, YGL082W, that arose from the whole genome duplication -S000037541 CDS YPL191C 16 184679 183597 C 2011-02-03 1996-07-31 -S000006111 ORF Verified YPL190C NAB3 HMD1 chromosome 16 L000001228 16 187725 185317 C 2011-02-03 1996-07-31 RNA-binding protein, subunit of Nrd1 complex (Nrd1p-Nab3p-Sen1p); complex interacts with exosome to mediate 3'-end formation of some mRNAs, snRNAs, snoRNAs, and CUTs; required for termination of non-poly(A) transcripts and efficient splicing; Nrd1-Nab3 pathway appears to have a role in rapid suppression of some genes when cells are shifted to poor growth conditions, indicating role for Nrd1-Nab3 in regulating cellular response to nutrient availability -S000037419 CDS YPL190C 16 187725 185317 C 2011-02-03 1996-07-31 -S000028527 ORF Verified YPL189C-A COA2 chromosome 16 16 188513 188307 C 2011-02-03 2003-07-29 Cytochrome oxidase assembly factor; null mutation results in respiratory deficiency with specific loss of cytochrome oxidase activity; functions downstream of assembly factors Mss51p and Coa1p and interacts with assembly factor Shy1p -S000030331 CDS YPL189C-A 16 188513 188307 C 2011-02-03 2003-07-29 -S000006110 ORF Verified YPL189W GUP2 putative O-acyltransferase chromosome 16 16 189154 190983 W 2011-02-03 1996-07-31 Probable membrane protein; possible role in proton symport of glycerol; member of the MBOAT family of putative membrane-bound O-acyltransferases; homolog of the mammalian Hedgehog pathway modulator HHAT; GUP2 has a paralog, GUP1, that arose from the whole genome duplication -S000036867 CDS YPL189W 16 189154 190983 W 2011-02-03 1996-07-31 -S000006109 ORF Verified YPL188W POS5 NADH kinase chromosome 16 L000002651 16 191406 192650 W 2011-02-03 1996-07-31 Mitochondrial NADH kinase; phosphorylates NADH; also phosphorylates NAD(+) with lower specificity; required for the response to oxidative stress -S000036799 CDS YPL188W 16 191406 192650 W 2011-02-03 1996-07-31 -S000006108 ORF Verified YPL187W MF(ALPHA)1 chromosome 16 L000001094 16 193648 194145 W -115 2011-02-03 1996-07-31 Mating pheromone alpha-factor, made by alpha cells; interacts with mating type a cells to induce cell cycle arrest and other responses leading to mating; also encoded by MF(ALPHA)2, although MF(ALPHA)1 produces most alpha-factor; binds copper(II) ions -S000036743 CDS YPL187W 16 193648 194145 W 2011-02-03 1996-07-31 -S000006106 ORF Dubious YPL185W chromosome 16 16 195253 195648 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene UIP4/YPL186C -S000035778 CDS YPL185W 16 195253 195648 W 2011-02-03 1996-07-31 -S000006107 ORF Verified YPL186C UIP4 chromosome 16 16 195426 194512 C 2011-02-03 1996-07-31 Protein that interacts with Ulp1p; a Ubl (ubiquitin-like protein)-specific protease for Smt3p protein conjugates; detected in a phosphorylated state in the mitochondrial outer membrane; also detected in ER and nuclear envelope -S000036644 CDS YPL186C 16 195426 194512 C 2011-02-03 1996-07-31 -S000006105 ORF Verified YPL184C MRN1 PTR69 chromosome 16 16 197788 195950 C 2011-02-03 1996-07-31 RNA-binding protein that may be involved in translational regulation; binds specific categories of mRNAs, including those that contain upstream open reading frames (uORFs) and internal ribosome entry sites (IRES); interacts genetically with chromatin remodelers and splicing factors, linking chromatin state, splicing and as a result mRNA maturation -S000035615 CDS YPL184C 16 197788 195950 C 2011-02-03 1996-07-31 -S000007224 ORF Verified YPL183W-A RTC6 putative mitochondrial 54S ribosomal protein RTC6|TAE4|GON5 chromosome 16 16 199095 199376 W 2011-02-03 1999-07-17 Protein involved in translation; mutants have defects in biogenesis of nuclear ribosomes; sequence similar to prokaryotic ribosomal protein L36, may be a mitochondrial ribosomal protein; protein abundance increases in response to DNA replication stress -S000035617 CDS YPL183W-A 16 199095 199376 W 2011-02-03 1999-07-17 -S000006104 ORF Verified YPL183C RTT10 TRM734|ERE2 chromosome 16 16 202536 199495 C 2011-02-03 1996-07-31 WD40 domain-containing protein involved in endosomal recycling; forms a complex with Rrt2p that functions in the retromer-mediated pathway for recycling internalized cell-surface proteins; interacts with Trm7p for 2'-O-methylation of N34 of substrate tRNAs; has a role in regulation of Ty1 transposition; human ortholog is WDR6 -S000035538 CDS YPL183C 16 202536 199495 C 2011-02-03 1996-07-31 -S000006102 ORF Verified YPL181W CTI6 RXT1 chromosome 16 16 203421 204941 W 2011-02-03 1996-07-31 Component of the Rpd3L histone deacetylase complex; relieves transcriptional repression by binding to the Cyc8p-Tup1p corepressor and recruiting the SAGA complex to the repressed promoter; contains a PHD finger domain -S000034453 CDS YPL181W 16 203421 204941 W 2011-02-03 1996-07-31 -S000006103 ORF Dubious YPL182C chromosome 16 16 203689 203306 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CTI6/YPL181W -S000034519 CDS YPL182C 16 203689 203306 C 2011-02-03 1996-07-31 -S000006101 ORF Verified YPL180W TCO89 chromosome 16 16 205248 207647 W 2011-02-03 1996-07-31 Subunit of TORC1 (Tor1p or Tor2p-Kog1p-Lst8p-Tco89p); regulates global H3K56ac; TORC1 complex regulates growth in response to nutrient availability; cooperates with Ssd1p in the maintenance of cellular integrity; deletion strains are hypersensitive to rapamycin -S000034375 CDS YPL180W 16 205248 207647 W 2011-02-03 1996-07-31 -S000006100 ORF Verified YPL179W PPQ1 SAL6 chromosome 16 L000001797|L000001474 16 208157 209806 W 2011-02-03 1996-07-31 Protein phosphatase that regulates the mating response; negatively regulates the MAP kinase signaling cascade during mating; member of the serine/threonine phosphatase PP1 family -S000033429 CDS YPL179W 16 208157 209806 W 2011-02-03 1996-07-31 -S000006561 tRNA_gene tE(UUC)P chromosome 16 L000003736 16 210263 210192 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin -S000036031 noncoding_exon tE(UUC)P 16 210263 210192 C 2011-02-03 2000-05-19 -S000007194 long_terminal_repeat YPLWdelta7 chromosome 16 16 210451 210771 W 2011-02-03 2000-05-19 Ty1 LTR -S000007195 long_terminal_repeat YPLWdelta8 chromosome 16 16 211577 211898 W 2011-02-03 2000-05-19 Ty2 LTR -S000006099 ORF Verified YPL178W CBC2 CBP20|SAE1|MUD13 chromosome 16 L000002891|L000004111 16 212158 212784 W 2011-02-03 1996-07-31 Small subunit of the heterodimeric cap binding complex with Sto1p; interacts with Npl3p, possibly to package mRNA for export from the nucleus; may have a role in telomere maintenance; contains an RNA-binding motif -S000033362 CDS YPL178W 16 212158 212784 W 2011-02-03 1996-07-31 -S000006098 ORF Verified YPL177C CUP9 chromosome 16 L000000442 16 213962 213042 C 2011-02-03 1996-07-31 Homeodomain-containing transcriptional repressor; regulates expression of PTR2, which encodes a major peptide transporter; imported peptides activate ubiquitin-dependent proteolysis, resulting in degradation of Cup9p and de-repression of PTR2 transcription; CUP9 has a paralog, TOS8, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000032622 CDS YPL177C 16 213962 213042 C 2011-02-03 1996-07-31 -S000006097 ORF Verified YPL176C TRE1 chromosome 16 16 218363 216012 C 2011-02-03 1996-07-31 Transferrin receptor-like protein; plasma membrane protein that binds Bsd2p and regulates ubiquitination and vacuolar degradation of the metal transporter Smf1p; functionally redundant with Tre2p; TRE1 has a paralog, TRE2, that arose from the whole genome duplication -S000032515 CDS YPL176C 16 218363 216012 C 2011-02-03 1996-07-31 -S000006096 ORF Verified YPL175W SPT14 phosphatidylinositol N-acetylglucosaminyltransferase SPT14|GPI3|CWH6 chromosome 16 L000002036 16 218630 220088 W -113 2011-02-03 2000-07-14|1996-07-31 UDP-glycosyltransferase subunit of the GPI-GnT complex; UDP-GlcNAc-binding and catalytic subunit of the enzyme that mediates the first step in glycosylphosphatidylinositol (GPI) biosynthesis, mutations cause defects in transcription and in biogenesis of cell wall proteins -S000032480 CDS YPL175W 16 218630 218646 W 2011-02-03 2000-07-14|1996-07-31 -S000032481 CDS YPL175W 16 218747 220088 W 2011-02-03 2000-07-14|1996-07-31 -S000032482 intron YPL175W 16 218647 218746 W 2011-02-03 2000-07-14|1996-07-31 -S000130197 ARS ARS1611 chromosome 16 16 220088 220167 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006095 ORF Verified YPL174C NIP100 PAC13 chromosome 16 L000001254 16 222773 220167 C 2011-02-03 1996-07-31 Large subunit of the dynactin complex; dynactin is involved in partitioning the mitotic spindle between mother and daughter cells; putative ortholog of mammalian p150(glued) -S000031426 CDS YPL174C 16 222773 220167 C 2011-02-03 1996-07-31 -S000006094 ORF Verified YPL173W MRPL40 mitochondrial 54S ribosomal protein YmL40|YmL40 chromosome 16 L000002696 16 223143 224036 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000031355 CDS YPL173W 16 223143 224036 W 2011-02-03 1996-07-31 -S000006093 ORF Verified YPL172C COX10 protoheme IX farnesyltransferase chromosome 16 L000000394 16 225741 224353 C 2011-02-03 1996-07-31 Heme A:farnesyltransferase; catalyzes first step in conversion of protoheme to heme A prosthetic group required for cytochrome c oxidase activity; human ortholog COX10 can complement yeast cox10 null mutant; human ortholog COX10 is associated with mitochondrial disorders -S000031181 CDS YPL172C 16 225741 224353 C 2011-02-03 1996-07-31 -S000006092 ORF Verified YPL171C OYE3 NADPH dehydrogenase|ZRG6 chromosome 16 L000001326 16 227371 226169 C 2011-02-03 1996-07-31 Conserved NADPH oxidoreductase containing flavin mononucleotide (FMN); homologous to Oye2p with different ligand binding and catalytic properties; has potential roles in oxidative stress response and programmed cell death -S000030238 CDS YPL171C 16 227371 226169 C 2011-02-03 1996-07-31 -S000006091 ORF Verified YPL170W DAP1 chromosome 16 16 228314 228772 W 2011-02-03 1996-07-31 Heme-binding protein; involved in regulation of cytochrome P450 protein Erg11p; damage response protein, related to mammalian membrane progesterone receptors; mutations lead to defects in telomeres, mitochondria, and sterol synthesis -S000030129 CDS YPL170W 16 228314 228772 W 2011-02-03 1996-07-31 -S000006090 ORF Verified YPL169C MEX67 chromosome 16 L000004314 16 230838 229039 C 2011-02-03 1996-07-31 Poly(A)RNA binding protein involved in nuclear mRNA export; component of the nuclear pore; ortholog of human TAP -S000037096 CDS YPL169C 16 230838 229039 C 2011-02-03 1996-07-31 -S000006089 ORF Uncharacterized YPL168W MRX4 chromosome 16 16 231217 232509 W 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; expression may be cell cycle-regulated -S000036477 CDS YPL168W 16 231217 232509 W 2011-02-03 1996-07-31 -S000006088 ORF Verified YPL167C REV3 PSO1 chromosome 16 L000001616 16 237107 232593 C -102 2011-02-03 1996-07-31 Catalytic subunit of DNA polymerase zeta; involved in translesion synthesis during post-replication repair; required for mutagenesis induced by DNA damage; involved in double-strand break repair; forms a complex with Rev7p, Pol31p and Pol32p -S000036379 CDS YPL167C 16 237107 232593 C 2011-02-03 1996-07-31 -S000006087 ORF Verified YPL166W ATG29 chromosome 16 16 237338 237979 W 2011-02-03 1996-07-31 Autophagy-specific protein; required for recruiting other ATG proteins to the pre-autophagosomal structure (PAS); interacts with Atg17p and localizas to the PAS in a manner interdependent with Atg17p and Cis1p; not conserved; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000036304 CDS YPL166W 16 237338 237979 W 2011-02-03 1996-07-31 -S000006086 ORF Verified YPL165C SET6 chromosome 16 16 239077 237956 C 2011-02-03 1996-07-31 SET domain protein of unknown function; deletion heterozygote is sensitive to compounds that target ergosterol biosynthesis, may be involved in compound availability -S000036129 CDS YPL165C 16 239077 237956 C 2011-02-03 1996-07-31 -S000006085 ORF Verified YPL164C MLH3 mismatch repair protein MLH3 chromosome 16 16 241497 239350 C 2011-02-03 1996-07-31 Protein involved in DNA mismatch repair and meiotic recombination; involved in crossing-over during meiotic recombination; forms a complex with Mlh1p; mammalian homolog is implicated mammalian microsatellite instability -S000035196 CDS YPL164C 16 241497 239350 C 2011-02-03 1996-07-31 -S000006084 ORF Verified YPL163C SVS1 chromosome 16 L000002750 16 242700 241918 C 2011-02-03 1996-07-31 Cell wall and vacuolar protein; required for wild-type resistance to vanadate; SVS1 has a paralog, SRL1, that arose from the whole genome duplication -S000035038 CDS YPL163C 16 242700 241918 C 2011-02-03 1996-07-31 -S000006083 ORF Uncharacterized YPL162C chromosome 16 16 244027 243206 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the membrane of vacuole with cell cycle-correlated morphology -S000034090 CDS YPL162C 16 244027 243206 C 2011-02-03 1996-07-31 -S000006082 ORF Verified YPL161C BEM4 ROM7 chromosome 16 L000000170 16 246220 244319 C 2011-02-03 1996-07-31 Protein involved in establishment of cell polarity and bud emergence; interacts with the Rho1p small GTP-binding protein and with the Rho-type GTPase Cdc42p; involved in maintenance of proper telomere length -S000033986 CDS YPL161C 16 246220 244319 C 2011-02-03 1996-07-31 -S000006081 ORF Verified YPL160W CDC60 leucine--tRNA ligase CDC60|LeuRS chromosome 16 L000000283 16 246990 250262 W -65 2011-02-03 1996-07-31 Cytosolic leucyl tRNA synthetase; ligates leucine to the appropriate tRNA; human homolog LARS can complement yeast temperature-sensitive mutant at restrictive temperature -S000033896 CDS YPL160W 16 246990 250262 W 2011-02-03 1996-07-31 -S000006080 ORF Verified YPL159C PET20 chromosome 16 16 251668 250907 C 2011-02-03 1996-07-31 Mitochondrial protein; required for respiratory growth under some conditions and for stability of the mitochondrial genome -S000034917 CDS YPL159C 16 251668 250907 C 2011-02-03 1996-07-31 -S000006079 ORF Verified YPL158C AIM44 GPS1 chromosome 16 16 254310 252034 C 2011-02-03 1996-07-31 Protein that regulates Cdc42p and Rho1p; functions in the late steps of cytokinesis and cell separation; sustains Rho1p at the cell division site after actomyosin ring contraction; inhibits the activation of Cdc42-Cla4 at the cell division site to prevent budding inside the old bud neck; transcription is regulated by Swi5p; null mutant displays elevated frequency of mitochondrial genome loss; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000034827 CDS YPL158C 16 254310 252034 C 2011-02-03 1996-07-31 -S000006078 ORF Verified YPL157W TGS1 RNA methyltransferase chromosome 16 16 254814 255761 W 2011-02-03 1996-07-31 Trimethyl guanosine synthase, conserved nucleolar methyl transferase; converts the m(7)G cap structure of snRNAs, snoRNAs, and telomerase TLC1 RNA to m(2,2,7)G; also required for nucleolar assembly and splicing of meiotic pre-mRNAs; interacts with Swm2p, which may confer substrate specificity on Tgs1p -S000032912 CDS YPL157W 16 254814 255761 W 2011-02-03 1996-07-31 -S000006077 ORF Verified YPL156C PRM4 pheromone-regulated protein PRM4 chromosome 16 16 256767 255913 C 2011-02-03 1996-07-31 Pheromone-regulated protein proposed to be involved in mating; predicted to have 1 transmembrane segment; transcriptionally regulated by Ste12p during mating and by Cat8p during the diauxic shift -S000032757 CDS YPL156C 16 256767 255913 C 2011-02-03 1996-07-31 -S000006076 ORF Verified YPL155C KIP2 chromosome 16 L000000908 16 259336 257216 C 2011-02-03 1996-07-31 Kinesin-related motor protein involved in mitotic spindle positioning; stabilizes microtubules by targeting Bik1p to the plus end; functions as a microtubule polymerase and catastrophe inhibitor in vitro; Kip2p levels are controlled during the cell cycle -S000032676 CDS YPL155C 16 259336 257216 C 2011-02-03 1996-07-31 -S000006075 ORF Verified YPL154C PEP4 proteinase A|yscA|PRA1|PHO9 chromosome 16 L000001375 16 260931 259714 C -95 2011-02-03 1996-07-31 Vacuolar aspartyl protease (proteinase A); required for posttranslational precursor maturation of vacuolar proteinases; important for protein turnover after oxidative damage; plays a protective role in acetic acid induced apoptosis; synthesized as a zymogen, self-activates -S000031707 CDS YPL154C 16 260931 259714 C 2011-02-03 1996-07-31 -S000130198 ARS ARS1612 chromosome 16 16 260931 261727 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006074 ORF Verified YPL153C RAD53 serine/threonine/tyrosine protein kinase RAD53|SPK1|MEC2|LSD1 chromosome 16 L000001573 16 264192 261727 C -109 2011-02-03 1996-07-31 DNA damage response protein kinase; required for cell-cycle arrest, regulation of copper genes in response to DNA damage; phosphorylates nuclear pores to counteract gene gating, preventing aberrant transitions at forks approaching transcribed genes; activates downstream kinase Dun1p; differentially senses mtDNA depletion, mitochondrial ROS; relocalizes to cytosol under hypoxia; human homolog CHEK2 implicated in breast cancer can complement yeast null mutant -S000031574 CDS YPL153C 16 264192 261727 C 2011-02-03 1996-07-31 -S000028721 ORF Uncharacterized YPL152W-A chromosome 16 16 264602 264700 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032702 CDS YPL152W-A 16 264602 264700 W 2011-02-03 2003-07-29 -S000006073 ORF Verified YPL152W RRD2 peptidylprolyl isomerase RRD2|YPA2 chromosome 16 L000004484 16 265028 266104 W 2011-02-03 1996-07-31 Peptidyl-prolyl cis/trans-isomerase; also activates the phosphotyrosyl phosphatase activity of protein phosphatase 2A (PP2A); regulates G1 phase progression, the osmoresponse, microtubule dynamics; subunit of the Tap42p-Pph21p-Rrd2p complex; protein abundance increases in response to DNA replication stress -S000031507 CDS YPL152W 16 265028 266104 W 2011-02-03 1996-07-31 -S000006072 ORF Verified YPL151C PRP46 mRNA splicing protein PRP46|NTC50 chromosome 16 16 267535 266180 C 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs -S000030537 CDS YPL151C 16 267535 266180 C 2011-02-03 1996-07-31 -S000006071 ORF Uncharacterized YPL150W non-specific serine/threonine protein kinase chromosome 16 16 268188 270893 W 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; binds phosphatidylinositols and cardiolipin in a large-scale study -S000030474 CDS YPL150W 16 268188 270893 W 2011-02-03 1996-07-31 -S000006070 ORF Verified YPL149W ATG5 APG5 chromosome 16 L000003303 16 271310 272194 W 2011-02-03 1996-07-31 Conserved protein involved in autophagy and the Cvt pathway; undergoes conjugation with Atg12p to form a complex involved in Atg8p lipidation; Atg5p-Atg12p conjugate enhances E2 activity of Atg3 by rearranging its catalytic site, also forms a complex with Atg16p; the Atg5-Atg12/Atg16 complex binds to membranes and is essential for autophagosome formation; also involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner -S000030694 CDS YPL149W 16 271310 272194 W 2011-02-03 1996-07-31 -S000006069 ORF Verified YPL148C PPT2 holo-[acyl-carrier-protein] synthase chromosome 16 L000004400 16 272815 272294 C 2011-02-03 2003-09-22|1996-07-31 Phosphopantetheine:protein transferase (PPTase); activates mitochondrial acyl carrier protein (Acp1p) by phosphopantetheinylation -S000036734 CDS YPL148C 16 272815 272294 C 2011-02-03 2003-09-22|1996-07-31 -S000006068 ORF Verified YPL147W PXA1 ATP-binding cassette long-chain fatty acid transporter PXA1|SSH2|PAT2|PAL1|LPI1 chromosome 16 L000001541 16 273255 275867 W 2011-02-03 1996-07-31 Subunit of heterodimeric peroxisomal ABC transport complex, with Pxa2p; required for import of long-chain fatty acids into peroxisomes; similar to human adrenoleukodystrophy transporters ABCD1and ABCD2, and ALD-related proteins; mutations in ABCD1 cause X-linked adrenoleukodystrophy (X-ALD), a peroxisomal disorder; human ABCD1 and ABCD2 can each partially complement yeast pxa1 pxa2 double null mutant -S000036715 CDS YPL147W 16 273255 275867 W 2011-02-03 1996-07-31 -S000006067 ORF Verified YPL146C NOP53 RRP16 chromosome 16 16 277529 276162 C 2011-02-03 1996-07-31 Nucleolar protein; involved in biogenesis of the 60S subunit of the ribosome; interacts with rRNA processing factors Cbf5p and Nop2p and with the nucleolar proteins Nop17p and Nip7p; null mutant is viable but growth is severely impaired -S000036573 CDS YPL146C 16 277529 276162 C 2011-02-03 1996-07-31 -S000006066 ORF Verified YPL145C KES1 oxysterol-binding protein KES1|BSR3|OSH4|LPI3 chromosome 16 L000000894 16 279699 278395 C 2011-02-03 1996-07-31 One of seven members of the yeast oxysterol binding protein family; involved in negative regulation of Sec14p-dependent Golgi complex secretory functions, peripheral membrane protein that localizes to the Golgi complex; KES1 has a paralog, HES1, that arose from the whole genome duplication -S000035629 CDS YPL145C 16 279699 278395 C 2011-02-03 1996-07-31 -S000006065 ORF Verified YPL144W POC4 DMP1|PBA4 chromosome 16 16 280480 280926 W 2011-02-03 1996-07-31 Component of a heterodimeric Poc4p-Irc25p chaperone; involved in assembly of alpha subunits into the 20S proteasome; may regulate formation of proteasome isoforms with alternative subunits under different conditions; upregulates proteasome assembly in response to the unfolded protein response activated by mistargeting of proteins (UPRam) -S000035609 CDS YPL144W 16 280480 280926 W 2011-02-03 1996-07-31 -S000007441 snoRNA_gene snR17b SNR17B U3 chromosome 16 L000004247 16 281517 281056 C 2011-02-03 2000-05-19 Small nucleolar RNA (snoRNA) U3; part of small (ribosomal) subunit (SSU) processosome; SNR17A also encodes snoRNA U3 -S000030181 intron snR17b 16 281503 281374 C 2011-02-03 2000-05-19 -S000030180 noncoding_exon snR17b 16 281373 281056 C 2011-02-03 2000-05-19 -S000030179 noncoding_exon snR17b 16 281517 281504 C 2011-02-03 2000-05-19 -S000006064 ORF Verified YPL143W RPL33A eL33|ribosomal 60S subunit protein L33A|L33e|rp47|l37A|YL37|L33A|RPL37A chromosome 16 L000001728 16 282122 282970 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L33A; N-terminally acetylated; rpl33a null mutant exhibits slow growth while rpl33a rpl33b double null mutant is inviable; homologous to mammalian ribosomal protein L35A, no bacterial homolog; RPL33A has a paralog, RPL33B, that arose from the whole genome duplication -S000035517 CDS YPL143W 16 282122 282140 W 2011-02-03 1996-07-31 -S000035518 CDS YPL143W 16 282666 282970 W 2011-02-03 1996-07-31 -S000035519 intron YPL143W 16 282141 282665 W 2011-02-03 1996-07-31 -S000006063 ORF Dubious YPL142C chromosome 16 16 283003 282686 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF RPL33A/YPL143W, a component of the large (60S) ribosomal subunit -S000035342 CDS YPL142C 16 283003 282686 C 2011-02-03 1996-07-31 -S000006062 ORF Verified YPL141C FRK1 protein kinase FRK1 chromosome 16 16 286061 283464 C 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; interacts with rRNA transcription and ribosome biogenesis factors and the long chain fatty acyl-CoA synthetase Faa3p; FRK1 has a paralog, KIN4, that arose from the whole genome duplication -S000034336 CDS YPL141C 16 286061 283464 C 2011-02-03 1996-07-31 -S000006061 ORF Verified YPL140C MKK2 putative mitogen-activated protein kinase kinase MKK2|SSP33|LPI6 chromosome 16 L000001118 16 289034 287514 C 2011-02-03 1996-07-31 MAPKK involved in the protein kinase C signaling pathway; involved in control of cell integrity; upon activation by Bck1p phosphorylates downstream target, Slt2p; functionally redundant with Mkk1p; MKK2 has a paralog, MKK1, that arose from the whole genome duplication -S000034223 CDS YPL140C 16 289034 287514 C 2011-02-03 1996-07-31 -S000118414 ARS ARS1614 ARSXVI-290 chromosome 16 16 289485 289705 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178192 ARS_consensus_sequence ARS1614 16 289530 289546 W 2014-11-18 2014-11-18 -S000006060 ORF Verified YPL139C UME1 WTM3 chromosome 16 L000003500 16 291051 289669 C 2011-02-03 1996-07-31 Component of both the Rpd3S and Rpd3L histone deacetylase complexes; negative regulator of meiosis; required for repression of a subset of meiotic genes during vegetative growth, binding of histone deacetylase Rpd3p required for activity, contains a NEE box and a WD repeat motif; homologous with Wtm1p; UME1 has a paralog, WTM2, that arose from the whole genome duplication -S000034691 CDS YPL139C 16 291051 289669 C 2011-02-03 1996-07-31 -S000006059 ORF Verified YPL138C SPP1 SAF41|CPS40 chromosome 16 16 292427 291366 C 2011-02-03 1996-07-31 Subunit of COMPASS (Set1C); a complex which methylates histone H3 on lysine 4 and is required in telomeric transcriptional silencing; promotes meiotic DSB formation by interacting with H3K4me3 and Rec107p, a protein required for Spo11p-catalyzed DSB formation located on chromosome axes; interacts with Orc2p; PHD finger domain protein similar to human CGBP, an unmethylated CpG binding protein; relocalizes to cytosol in response to hypoxia -S000034627 CDS YPL138C 16 292427 291366 C 2011-02-03 1996-07-31 -S000006057 ORF Dubious YPL136W chromosome 16 16 296286 296654 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene GIP3/YPL137C -S000034466 CDS YPL136W 16 296286 296654 W 2011-02-03 1996-07-31 -S000006058 ORF Verified YPL137C GIP3 protein phosphatase regulator GIP3 chromosome 16 16 296647 292817 C 2011-02-03 1996-07-31 Cytoplasmic protein that regulates protein phosphatase 1 Glc7p; overexpression relocalizes Glc7p from the nucleus and prevents chromosome segregation; may interact with ribosomes, based on co-purification experiments; GIP3 has a paralog, HER1, that arose from the whole genome duplication -S000034539 CDS YPL137C 16 296647 292817 C 2011-02-03 1996-07-31 -S000006056 ORF Verified YPL135W ISU1 iron-binding protein ISU1|NUA1 chromosome 16 L000004769 16 297553 298050 W 2011-02-03 1996-07-31 Conserved protein of the mitochondrial matrix; performs a scaffolding function during assembly of iron-sulfur clusters, interacts physically and functionally with yeast frataxin (Yfh1p); ISU1 has a paralog, ISU2, that arose from the whole genome duplication; isu1 isu2 double mutant is inviable; human homolog ISCU implicated in mitochondrial myopathy, can complement isu1 isu2 double mutant -S000032464 CDS YPL135W 16 297553 298050 W 2011-02-03 1996-07-31 -S000028720 ORF Dubious YPL135C-A chromosome 16 16 297851 297678 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032700 CDS YPL135C-A 16 297851 297678 C 2011-02-03 2003-07-29 -S000006055 ORF Verified YPL134C ODC1 mitochondrial 2-oxodicarboxylate carrier chromosome 16 S000007520 16 299503 298571 C 2011-02-03 1996-07-31 Mitochondrial inner membrane transporter; 2-oxodicarboxylate transporter, exports 2-oxoadipate and 2-oxoglutarate from the mitochondrial matrix to the cytosol for lysine and glutamate biosynthesis and lysine catabolism; suppresses, in multicopy, an fmc1 null mutation; ODC1 has a paralog, ODC2, that arose from the whole genome duplication -S000032295 CDS YPL134C 16 299503 298571 C 2011-02-03 1996-07-31 -S000006054 ORF Verified YPL133C RDS2 chromosome 16 16 301228 299888 C 2011-02-03 1996-07-31 Transcription factor involved in regulating gluconeogenesis; also involved in the regulation of glyoxylate cycle genes; member of the zinc cluster family of proteins; confers resistance to ketoconazole -S000032197 CDS YPL133C 16 301228 299888 C 2011-02-03 1996-07-31 -S000006053 ORF Verified YPL132W COX11 PSO7|LPI13 chromosome 16 L000000395|L000004044 16 301716 302618 W 2011-02-03 1996-07-31 Protein required for delivery of copper to Cox1p; mitochondrial inner membrane protein; association with mitochondrial ribosomes suggests that copper delivery may occur during translation of Cox1p -S000031257 CDS YPL132W 16 301716 302618 W 2011-02-03 1996-07-31 -S000006052 ORF Verified YPL131W RPL5 uL18|ribosomal 60S subunit protein L5|L18|YL3|L5|L1a|RPL1|LPI14 chromosome 16 L000001699 16 303121 304014 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L5; nascent Rpl5p is bound by specific chaperone Syo1p during translation; homologous to mammalian ribosomal protein L5 and bacterial L18; binds 5S rRNA and is required for 60S subunit assembly -S000031118 CDS YPL131W 16 303121 304014 W 2011-02-03 1996-07-31 -S000006051 ORF Verified YPL130W SPO19 chromosome 16 16 304387 305058 W 2011-02-03 1996-07-31 Meiosis-specific prospore protein; required to produce bending force necessary for proper assembly of the prospore membrane during sporulation; identified as a weak high-copy suppressor of the spo1-1 ts mutation; SPO19 has a paralog, YOR214C, that arose from the whole genome duplication -S000031018 CDS YPL130W 16 304387 305058 W 2011-02-03 1996-07-31 -S000006050 ORF Verified YPL129W TAF14 TATA-binding protein-associated factor TAF14|TafII30|ANC1|TFG3|TAF30|SWP29 chromosome 16 L000000086 16 305298 306137 W 2011-02-03 1996-07-31 Subunit of TFIID, TFIIF, INO80, SWI/SNF, and NuA3 complexes; involved in RNA polymerase II transcription initiation and in chromatin modification; contains a YEATS domain -S000031306 CDS YPL129W 16 305298 305306 W 2011-02-03 1996-07-31 -S000031307 CDS YPL129W 16 305412 306137 W 2011-02-03 1996-07-31 -S000031308 intron YPL129W 16 305307 305411 W 2011-02-03 1996-07-31 -S000006049 ORF Verified YPL128C TBF1 LPI16 chromosome 16 L000002264 16 308221 306533 C -81.5 2011-02-03 1996-07-31 Telobox-containing general regulatory factor; binds TTAGGG repeats within subtelomeric anti-silencing regions (STARs), blocking silent chromatin propagation; binds majority of snoRNA gene promoters, required for full snoRNA expression; caps DSB flanked by long T2AG3 repeats and blocks checkpoint activation -S000030320 CDS YPL128C 16 308221 306533 C 2011-02-03 1996-07-31 -S000006048 ORF Verified YPL127C HHO1 histone H1 chromosome 16 L000003354 16 309604 308828 C 2011-02-03 1996-07-31 Histone H1, linker histone with roles in meiosis and sporulation; decreasing levels early in sporulation may promote meiosis, and increasing levels during sporulation facilitate compaction of spore chromatin; binds to promoters and within genes in mature spores; may be recruited by Ume6p to promoter regions, contributing to transcriptional repression outside of meiosis; suppresses DNA repair involving homologous recombination -S000030125 CDS YPL127C 16 309604 308828 C 2011-02-03 1996-07-31 -S000006047 ORF Verified YPL126W NAN1 UTP17 chromosome 16 16 310210 312900 W 2011-02-03 1996-07-31 U3 snoRNP protein; component of the small (ribosomal) subunit (SSU) processosome containing U3 snoRNA; required for the biogenesis of18S rRNA -S000030112 CDS YPL126W 16 310210 312900 W 2011-02-03 1996-07-31 -S000006046 ORF Verified YPL125W KAP120 LPH2 chromosome 16 16 313388 316486 W 2011-02-03 1996-07-31 Karyopherin responsible for the nuclear import of Rpf1p; Rpf1p is a ribosome maturation factor -S000036402 CDS YPL125W 16 313388 316486 W 2011-02-03 1996-07-31 -S000006045 ORF Verified YPL124W SPC29 NIP29|LPH3 chromosome 16 L000001253 16 316755 317516 W 2011-02-03 1996-07-31 Inner plaque spindle pole body (SPB) component; links the central plaque component Spc42p to the inner plaque component Spc110p; required for SPB duplication -S000036286 CDS YPL124W 16 316755 317516 W 2011-02-03 1996-07-31 -S000006044 ORF Verified YPL123C RNY1 ribonuclease T2 chromosome 16 16 318945 317641 C 2011-02-03 1996-07-31 Vacuolar RNase of the T(2) family; relocalizes to the cytosol where it cleaves tRNAs upon oxidative or stationary phase stress; required for tRNA-specific translational pausing suring oxidative stress; promotes apoptosis under stress conditions and this function is independent of Rny1p catalytic activity -S000036104 CDS YPL123C 16 318945 317641 C 2011-02-03 1996-07-31 -S000006043 ORF Verified YPL122C TFB2 TFIIH/NER complex subunit TFB2 chromosome 16 L000003495 16 320767 319226 C 2011-02-03 1996-07-31 Subunit of TFIIH and nucleotide excision repair factor 3 complexes; involved in transcription initiation, required for nucleotide excision repair, similar to 52 kDa subunit of human TFIIH -S000035221 CDS YPL122C 16 320767 319226 C 2011-02-03 1996-07-31 -S000006042 ORF Verified YPL121C MEI5 LPH6 chromosome 16 L000001061 16 321630 320962 C 2011-02-03 1996-07-31 Meiosis-specific protein involved in meiotic recombination; involved in DMC1-dependent meiotic recombination; forms heterodimer with Sae3p; proposed to be an assembly factor for Dmc1p -S000035025 CDS YPL121C 16 321630 320962 C 2011-02-03 1996-07-31 -S000006041 ORF Verified YPL120W VPS30 beclin 1|ATG6|VPT30|APG6 chromosome 16 L000003545 16 322071 323744 W 2011-02-03 1996-07-31 Subunit of phosphatidylinositol (PtdIns) 3-kinase complexes I and II; Complex I is essential in autophagy, Complex II is required for vacuolar protein sorting; required for overflow degradation of misfolded proteins when ERAD is saturated; C-terminus has novel globular fold essential for autophagy through the targeting of the PI3-kinase complex I to the pre-autophagosomal structure; ortholog of higher eukaryote gene Beclin 1; human BECN1 can complement yeast null mutant -S000034961 CDS YPL120W 16 322071 323744 W 2011-02-03 1996-07-31 -S000028859 ORF Uncharacterized YPL119C-A chromosome 16 16 324287 324024 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034573 CDS YPL119C-A 16 324287 324024 C 2011-02-03 2003-07-29 -S000006040 ORF Verified YPL119C DBP1 putative DEAD-box ATP-dependent RNA helicase DBP1|LPH8 chromosome 16 L000000492 16 326264 324411 C 2011-02-03 1996-07-31 Putative ATP-dependent RNA helicase of the DEAD-box protein family; mutants show reduced stability of the 40S ribosomal subunit scanning through 5' untranslated regions of mRNAs; protein abundance increases in response to DNA replication stress; DBP1 has a paralog, DED1, that arose from the whole genome duplication -S000035431 CDS YPL119C 16 326264 324411 C 2011-02-03 1996-07-31 -S000006039 ORF Verified YPL118W MRP51 mitochondrial 37S ribosomal protein MRP51 chromosome 16 L000003325 16 326628 327662 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; MRP51 exhibits genetic interactions with mutations in the COX2 and COX3 mRNA 5'-untranslated leader sequences -S000035395 CDS YPL118W 16 326628 327662 W 2011-02-03 1996-07-31 -S000006038 ORF Verified YPL117C IDI1 isopentenyl-diphosphate delta-isomerase IDI1|LPH10|BOT2 chromosome 16 L000000851 16 328730 327864 C -69.8 2011-02-03 1996-07-31 Isopentenyl diphosphate:dimethylallyl diphosphate isomerase; catalyzes an essential activation step in the isoprenoid biosynthetic pathway; required for viability; isopentenyl diphosphate:dimethylallyl diphosphate isomerase is also known as IPP isomerase -S000034380 CDS YPL117C 16 328730 327864 C 2011-02-03 1996-07-31 -S000006037 ORF Verified YPL116W HOS3 histone deacetylase chromosome 16 L000004093 16 329606 331699 W 2011-02-03 1996-07-31 Trichostatin A-insensitive homodimeric histone deacetylase (HDAC); specificity in vitro for histones H3, H4, H2A, and H2B; similar to Hda1p, Rpd3p, Hos1p, and Hos2p; deletion results in increased histone acetylation at rDNA repeats -S000034349 CDS YPL116W 16 329606 331699 W 2011-02-03 1996-07-31 -S000130199 ARS ARS1617 chromosome 16 16 331699 332100 2011-02-03 2009-05-08 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000006036 ORF Verified YPL115C BEM3 chromosome 16 L000000169 16 335486 332100 C 2011-02-03 1996-07-31 Rho GTPase activating protein (RhoGAP); involved in control of the cytoskeleton organization; targets the essential Rho-GTPase Cdc42p, which controls establishment and maintenance of cell polarity, including bud-site assembly -S000034256 CDS YPL115C 16 335486 332100 C 2011-02-03 1996-07-31 -S000006035 ORF Dubious YPL114W chromosome 16 16 335948 336367 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; largely overlaps ORF YPL113C; diploid deletion in BY4743 strain background exhibits high budding index -S000034237 CDS YPL114W 16 335948 336367 W 2011-02-03 1996-07-31 -S000006034 ORF Verified YPL113C glyoxylate reductase chromosome 16 16 337143 335953 C 2011-02-03 1996-07-31 Glyoxylate reductase; acts on glyoxylate and hydroxypyruvate substrates; YPL113C is not an essential gene -S000032142 CDS YPL113C 16 337143 335953 C 2011-02-03 1996-07-31 -S000006033 ORF Verified YPL112C PEX25 chromosome 16 16 338620 337436 C 2011-02-03 1996-07-31 Peripheral peroxisomal membrane peroxin; required for the regulation of peroxisome size and maintenance, recruits GTPase Rho1p to peroxisomes, induced by oleate, interacts with Pex27p; PEX25 has a paralog, PEX27, that arose from the whole genome duplication -S000032062 CDS YPL112C 16 338620 337436 C 2011-02-03 1996-07-31 -S000006667 tRNA_gene tM(CAU)P IMT2 chromosome 16 L000003735 16 338919 338848 C 2011-02-03 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation -S000034575 noncoding_exon tM(CAU)P 16 338919 338848 C 2011-02-03 2000-05-19 -S000006032 ORF Verified YPL111W CAR1 arginase|cargA|LPH15 chromosome 16 L000000216 16 339944 340945 W -75 2011-02-03 1996-07-31 Arginase, catabolizes arginine to ornithine and urea; expression responds to both induction by arginine and nitrogen catabolite repression; disruption decreases production of carcinogen ethyl carbamate during wine fermentation and also enhances freeze tolerance -S000031989 CDS YPL111W 16 339944 340945 W 2011-02-03 1996-07-31 -S000006031 ORF Verified YPL110C GDE1 glycerophosphocholine phosphodiesterase chromosome 16 16 344739 341068 C 2011-02-03 1996-07-31 Glycerophosphocholine (GroPCho) phosphodiesterase; hydrolyzes GroPCho to choline and glycerolphosphate, for use as a phosphate source and as a precursor for phosphocholine synthesis; may interact with ribosomes -S000031745 CDS YPL110C 16 344739 341068 C 2011-02-03 1996-07-31 -S000006030 ORF Uncharacterized YPL109C chromosome 16 16 347389 345264 C 2011-02-03 2004-07-21|1996-07-31|2003-09-27 UbiB family protein; contains transmembrane domain and mitochondrial targeting sequence; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000032179 CDS YPL109C 16 345444 345264 C 2011-02-03 2003-09-27 -S000032178 CDS YPL109C 16 347389 345597 C 2011-02-03 2004-07-21|1996-07-31|2003-09-27 -S000032180 intron YPL109C 16 345596 345445 C 2011-02-03 2003-09-27 -S000006029 ORF Uncharacterized YPL108W chromosome 16 16 348446 348952 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; non-essential gene that is induced in a GDH1 deleted strain with altered redox metabolism; GFP-fusion protein is induced in response to the DNA-damaging agent MMS -S000032152 CDS YPL108W 16 348446 348952 W 2011-02-03 1996-07-31 -S000006028 ORF Uncharacterized YPL107W chromosome 16 16 349119 349865 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YPL107W is not an essential gene -S000031186 CDS YPL107W 16 349119 349865 W 2011-02-03 1996-07-31 -S000006027 ORF Verified YPL106C SSE1 adenyl-nucleotide exchange factor SSE1|MSI3|LPG3 chromosome 16 L000002078 16 352275 350194 C 2011-02-03 1996-07-31 ATPase component of heat shock protein Hsp90 chaperone complex; serves as nucleotide exchange factor to load ATP onto the SSA class of cytosolic Hsp70s; plays a role in prion propagation and determining prion variants; binds unfolded proteins; member of Hsp110 subclass of HSP70 proteins; deletion results in spindle elongation in S phase; SSE1 has a paralog, SSE2, that arose from the whole genome duplication -S000031029 CDS YPL106C 16 352275 350194 C 2011-02-03 1996-07-31 -S000006026 ORF Verified YPL105C SYH1 MYR1 chromosome 16 16 355412 352863 C 2011-02-03 1996-07-31 Protein of unknown function that influences nuclear pore distribution; co-purifies with ribosomes; contains a GYF domain, which bind proline-rich sequences; deletion extends chronological lifespan; SYH1 has a paralog, SMY2, that arose from the whole genome duplication -S000030941 CDS YPL105C 16 355412 352863 C 2011-02-03 1996-07-31 -S000006025 ORF Verified YPL104W MSD1 aspartate--tRNA ligase MSD1|LPG5 chromosome 16 L000001186 16 355700 357676 W 2011-02-03 1996-07-31 Mitochondrial aspartyl-tRNA synthetase; required for acylation of aspartyl-tRNA; yeast and bacterial aspartyl-, asparaginyl-, and lysyl-tRNA synthetases contain regions with high sequence similarity, suggesting a common ancestral gene -S000030906 CDS YPL104W 16 355700 357676 W 2011-02-03 1996-07-31 -S000006024 ORF Verified YPL103C FMP30 N-acetylphosphatidylethanolamine-hydrolyzing phospholipase D chromosome 16 16 359406 358000 C 2011-02-03 1996-07-31 Protein with a role in maintaining mitochondrial morphology; also involved in maintaining normal cardiolipin levels; mitochondrial inner membrane protein; proposed to be involved in N-acylethanolamine metabolism; related to mammalian N-acylPE-specific phospholipase D -S000029844 CDS YPL103C 16 359406 358000 C 2011-02-03 1996-07-31 -S000006022 ORF Verified YPL101W ELP4 Elongator subunit ELP4|KTI9|TOT7|HAP1 chromosome 16 16 360209 361579 W 2011-02-03 1996-07-31 Subunit of hexameric RecA-like ATPase Elp456 Elongator subcomplex; which is required for modification of wobble nucleosides in tRNA; required for Elongator structural integrity; null mutation is functionally complemented by human ELP4 -S000037803 CDS YPL101W 16 360209 361579 W 2011-02-03 1996-07-31 -S000006023 ORF Dubious YPL102C chromosome 16 16 360305 360003 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion mutation enhances replication of Brome mosaic virus in S. cerevisiae, but this is likely due to effects on the overlapping gene ELP4 -S000037833 CDS YPL102C 16 360305 360003 C 2011-02-03 1996-07-31 -S000006021 ORF Verified YPL100W ATG21 HSV1|MAI1 chromosome 16 16 361872 363362 W 2011-02-03 1996-07-31 Phosphoinositide binding protein; required for vesicle formation in the cytoplasm-to-vacuole targeting (Cvt) pathway; binds both phosphatidylinositol (3,5)-bisphosphate and phosphatidylinositol 3-phosphate; WD-40 repeat protein -S000035919 CDS YPL100W 16 361872 363362 W 2011-02-03 1996-07-31 -S000006020 ORF Verified YPL099C INA17 AIM43|FMP14 chromosome 16 16 364068 363520 C 2011-02-03 1996-07-31 F1F0 ATPase synthase peripheral stalk assembly factor; subunit of the matrix-exposed inner mitochondrial membrane localized INA complex (Ina22p-Ina17p) involved in assembly of the F1F0 peripheral stalk; co-purifies with Ina22p and ATP synthase subunits; null mutant displays elevated frequency of mitochondrial genome loss and has a respiratory growth defect -S000037350 CDS YPL099C 16 364068 363520 C 2011-02-03 1996-07-31 -S000006019 ORF Verified YPL098C MGR2 chromosome 16 16 364727 364386 C 2011-02-03 1996-07-31 Subunit of the TIM23 translocase complex; acts to couple Tim21p with the core Tim23 translocase; provides quality control for insertion of membrane proteins by regulating their release into the inner membrane by the TIM23 complex; absolutely required for mitochondrial import of presequence-containing proteins at elevated temperature; required for viability of cells lacking the mitochondrial genome (petite-negative phenotype) -S000037279 CDS YPL098C 16 364727 364386 C 2011-02-03 1996-07-31 -S000006018 ORF Verified YPL097W MSY1 tyrosine--tRNA ligase MSY1 chromosome 16 L000002838 16 364952 366430 W 2011-02-03 1996-07-31 Mitochondrial tyrosyl-tRNA synthetase -S000037246 CDS YPL097W 16 364952 366430 W 2011-02-03 1996-07-31 -S000028423 ORF Verified YPL096C-A ERI1 RIN1 chromosome 16 S000028417 16 366735 366529 C 2011-02-03 2002-06-20 Endoplasmic reticulum membrane protein that binds and inhibits Ras2p; binds to and inhibits GTP-bound Ras2p at the endoplasmic reticulum (ER); component of the GPI-GnT complex which catalyzes the first step in GPI-anchor biosynthesis; probable homolog of mammalian PIG-Y protein -S000029959 CDS YPL096C-A 16 366735 366529 C 2011-02-03 2002-06-20 -S000006017 ORF Verified YPL096W PNG1 peptide-N4-(N-acetyl-beta-glucosaminyl)asparagine amidase chromosome 16 16 366927 368018 W 2011-02-03 1996-07-31 Conserved peptide N-glycanase; deglycosylating enzyme that cleaves N-glycans that are attached to misfolded ERAD substrate glycoproteins prior to proteasome-dependent degradation; localizes to the cytoplasm and nucleus; activity is enhanced by interaction with Rad23p; human ortholog NGLY1 is associated with a syndrome characterized by developmental delays, epilepsy, absence of tears and liver disease -S000037168 CDS YPL096W 16 366927 368018 W 2011-02-03 1996-07-31 -S000006016 ORF Verified YPL095C EEB1 medium-chain fatty acid ethyl ester synthase/esterase chromosome 16 16 369441 368071 C 2011-02-03 1996-07-31 Acyl-coenzymeA:ethanol O-acyltransferase; responsible for the major part of medium-chain fatty acid ethyl ester biosynthesis during fermentation; possesses short-chain esterase activity; may be involved in lipid metabolism and detoxification; EEB1 has a paralog, EHT1, that arose from the whole genome duplication -S000036441 CDS YPL095C 16 369441 368071 C 2011-02-03 1996-07-31 -S000006015 ORF Verified YPL094C SEC62 Sec63 complex subunit SEC62|LPG14 chromosome 16 L000001853 16 370663 369839 C 2011-02-03 2004-01-09|1996-07-31 Essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; cotranslationally N-acetylated by NatA; other members are Sec63p, Sec66p, and Sec72p -S000036372 CDS YPL094C 16 370663 369839 C 2011-02-03 2004-01-09|1996-07-31 -S000006014 ORF Verified YPL093W NOG1 putative GTPase NOG1 chromosome 16 16 370978 372921 W 2011-02-03 1996-07-31 Putative GTPase; associates with free 60S ribosomal subunits in the nucleolus and is required for 60S ribosomal subunit biogenesis; constituent of 66S pre-ribosomal particles; member of the ODN family of nucleolar G-proteins -S000036303 CDS YPL093W 16 370978 372921 W 2011-02-03 1996-07-31 -S000006013 ORF Verified YPL092W SSU1 LPG16 chromosome 16 L000002094 16 373793 375169 W 2011-02-03 1996-07-31 Plasma membrane sulfite pump involved in sulfite metabolism; required for efficient sulfite efflux; major facilitator superfamily protein -S000036190 CDS YPL092W 16 373793 375169 W 2011-02-03 1996-07-31 -S000006012 ORF Verified YPL091W GLR1 glutathione-disulfide reductase GLR1|LPG17 chromosome 16 L000000714 16 375502 376953 W 2011-02-03 1996-07-31 Cytosolic and mitochondrial glutathione oxidoreductase; converts oxidized glutathione to reduced glutathione; cytosolic Glr1p is the main determinant of the glutathione redox state of the mitochondrial intermembrane space; mitochondrial Glr1p has a role in resistance to hyperoxia; protein abundance increases in response to DNA replication stress -S000035283 CDS YPL091W 16 375502 376953 W 2011-02-03 1996-07-31 -S000006011 ORF Verified YPL090C RPS6A eS6|ribosomal 40S subunit protein S6A|S6e|rp9|YS4|S6A|S10A chromosome 16 L000004472 16 378395 377291 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S6, no bacterial homolog; phosphorylated on S233 by Ypk3p in a TORC1-dependent manner, and on S232 in a TORC1/2-dependent manner by Ypk1/2/3p; RPS6A has a paralog, RPS6B, that arose from the whole genome duplication -S000035035 CDS YPL090C 16 377995 377291 C 2011-02-03 1996-07-31 -S000035034 CDS YPL090C 16 378395 378390 C 2011-02-03 1996-07-31 -S000035036 intron YPL090C 16 378389 377996 C 2011-02-03 1996-07-31 -S000006010 ORF Verified YPL089C RLM1 chromosome 16 L000003028 16 381150 379120 C 2011-02-03 1996-07-31 MADS-box transcription factor; component of the protein kinase C-mediated MAP kinase pathway involved in the maintenance of cell integrity; phosphorylated and activated by the MAP-kinase Slt2p; RLM1 has a paralog, SMP1, that arose from the whole genome duplication -S000035262 CDS YPL089C 16 381150 379120 C 2011-02-03 1996-07-31 -S000006009 ORF Uncharacterized YPL088W aldo-keto reductase superfamily protein chromosome 16 16 381965 382993 W 2011-02-03 1996-07-31 Putative aryl alcohol dehydrogenase; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance -S000035218 CDS YPL088W 16 381965 382993 W 2011-02-03 1996-07-31 -S000006008 ORF Verified YPL087W YDC1 alkaline dihydroceramidase chromosome 16 16 383455 384408 W 2011-02-03 1996-07-31 Alkaline dihydroceramidase, involved in sphingolipid metabolism; preferentially hydrolyzes dihydroceramide to a free fatty acid and dihydrosphingosine; has a minor reverse activity; YDC1 has a paralog, YPC1, that arose from the whole genome duplication -S000035115 CDS YPL087W 16 383455 384408 W 2011-02-03 1996-07-31 -S000118415 ARS ARS1618 ARSXVI-385 chromosome 16 16 384542 384789 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178193 ARS_consensus_sequence ARS1618 16 384592 384608 W 2014-11-18 2014-11-18 -S000006007 ORF Verified YPL086C ELP3 Elongator subunit ELP3|KAT9|KTI8|TOT3|HPA1 chromosome 16 L000004378 16 386446 384773 C 2011-02-03 1996-07-31 Subunit of Elongator complex; Elongator is required for modification of wobble nucleosides in tRNA; exhibits histone acetyltransferase activity that is directed to histones H3 and H4; disruption confers resistance to K. lactis zymotoxin; human homolog ELP3 can partially complement yeast elp3 null mutant -S000034914 CDS YPL086C 16 386446 384773 C 2011-02-03 1996-07-31 -S000006006 ORF Verified YPL085W SEC16 LPF1 chromosome 16 L000003051 16 387067 393654 W 2011-02-03 1996-07-31 COPII vesicle coat protein required for ER transport vesicle budding; essential factor in endoplasmic reticulum exit site (ERES) formation, as well as in COPII-mediated ER-to-Golgi traffic; bound to periphery of ER membranes and may act to stabilize initial COPII complexes; interacts with Sec23p, Sec24p and Sec31p -S000034866 CDS YPL085W 16 387067 393654 W 2011-02-03 1996-07-31 -S000006005 ORF Verified YPL084W BRO1 NPI3|ASI6|VPS31|LPF2 chromosome 16 L000003061 16 394038 396572 W 2011-02-03 1996-07-31 Cytoplasmic class E vacuolar protein sorting (VPS) factor; coordinates deubiquitination in the multivesicular body (MVB) pathway by recruiting Doa4p to endosomes -S000032909 CDS YPL084W 16 394038 396572 W 2011-02-03 1996-07-31 -S000006004 ORF Verified YPL083C SEN54 tRNA splicing endonuclease subunit SEN54 chromosome 16 L000003974 16 398105 396702 C 2011-02-03 1996-07-31 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface -S000032739 CDS YPL083C 16 398105 396702 C 2011-02-03 1996-07-31 -S000006003 ORF Verified YPL082C MOT1 DNA-binding ATPase|END10|BTAF1|LPF4|BUR3 chromosome 16 L000001136|L000004559|S000029158 16 404083 398480 C 2011-02-03 1996-07-31 Essential protein involved in regulation of transcription; removes Spt15p (TBP) from DNA via its C-terminal ATPase activity; may have a role in ensuring that soluble TBP is available to bind TATA-less promoters; forms a complex with TBP that binds TATA DNA with high affinity but with altered specificity; the Mot1p-Spt15p-DNA ternary complex contains unbent DNA; coregulates transcription with Spt16p through assembly of preinitiation complex and organization of nucleosomes -S000032674 CDS YPL082C 16 404083 398480 C 2011-02-03 1996-07-31 -S000006002 ORF Verified YPL081W RPS9A uS4|ribosomal 40S subunit protein S9A|rp21|YS11|S9A|S4|S13 chromosome 16 L000004474 16 404950 406044 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S9 and bacterial S4; RPS9A has a paralog, RPS9B, that arose from the whole genome duplication -S000032631 CDS YPL081W 16 404950 404956 W 2011-02-03 1996-07-31 -S000032632 CDS YPL081W 16 405458 406044 W 2011-02-03 1996-07-31 -S000032633 intron YPL081W 16 404957 405457 W 2011-02-03 1996-07-31 -S000006001 ORF Dubious YPL080C chromosome 16 16 406498 406172 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031568 CDS YPL080C 16 406498 406172 C 2011-02-03 1996-07-31 -S000006000 ORF Verified YPL079W RPL21B eL21|ribosomal 60S subunit protein L21B|L21e|L21B chromosome 16 L000004459 16 406636 407539 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L21B; homologous to mammalian ribosomal protein L21, no bacterial homolog; RPL21B has a paralog, RPL21A, that arose from the whole genome duplication -S000031935 CDS YPL079W 16 406636 406646 W 2011-02-03 1996-07-31 -S000031936 CDS YPL079W 16 407068 407539 W 2011-02-03 1996-07-31 -S000031937 intron YPL079W 16 406647 407067 W 2011-02-03 1996-07-31 -S000005999 ORF Verified YPL078C ATP4 F1F0 ATP synthase subunit 4|LPF7 chromosome 16 L000000144 16 408744 408010 C 2011-02-03 1996-07-31 Subunit b of the stator stalk of mitochondrial F1F0 ATP synthase; ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; contributes to the oligomerization of the complex, which in turn determines the shape of inner membrane cristae; phosphorylated -S000030814 CDS YPL078C 16 408744 408010 C 2011-02-03 1996-07-31 -S000005998 ORF Uncharacterized YPL077C chromosome 16 16 410090 409368 C 2011-02-03 1996-07-31 Putative protein of unknown function; regulates PIS1 expression; mutant displays spore wall assembly defect in ether sensitivity screen; YPL077C is not an essential gene; YPL077C has a paralog, YBR197C, that arose from the whole genome duplication -S000030729 CDS YPL077C 16 410090 409368 C 2011-02-03 1996-07-31 -S000005997 ORF Verified YPL076W GPI2 phosphatidylinositol N-acetylglucosaminyltransferase|GCR4 chromosome 16 L000002807 16 410443 411285 W 2011-02-03 1996-07-31 Protein involved in the synthesis of GlcNAc-PI; GlcNAc-PI is the first intermediate in the synthesis of glycosylphosphatidylinositol (GPI) anchors; homologous to the human PIG-C protein; GlcNAc-PI stands for N-acetylglucosaminyl phosphatidylinositol -S000030692 CDS YPL076W 16 410443 411285 W 2011-02-03 1996-07-31 -S000005996 ORF Verified YPL075W GCR1 transcription regulator GCR1|SIT3|LPF10 chromosome 16 L000000690|S000029447|L000001900 16 412254 415362 W 2011-02-03 1997-10-20|1996-07-31 Transcriptional activator of genes involved in glycolysis; DNA-binding protein that interacts and functions with the transcriptional activator Gcr2p -S000036778 CDS YPL075W 16 412254 412261 W 2011-02-03 1997-10-20|1996-07-31 -S000036779 CDS YPL075W 16 413013 415362 W 2011-02-03 1997-10-20 -S000036780 intron YPL075W 16 412262 413012 W 2011-02-03 1997-10-20 -S000005995 ORF Verified YPL074W YTA6 putative AAA family ATPase YTA6 chromosome 16 L000002560 16 415763 418027 W 2011-02-03 1996-07-31 Putative ATPase of the CDC48/PAS1/SEC18 (AAA) family; localized to the cortex of mother cells but not to daughter cells; relocalizes from cytoplasm to plasma membrane foci upon DNA replication stress -S000036699 CDS YPL074W 16 415763 418027 W 2011-02-03 1996-07-31 -S000118416 ARS ARS1619 ARSXVI-418 chromosome 16 16 418138 418364 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178194 ARS_consensus_sequence ARS1619 16 418178 418194 W 2014-11-18 2014-11-18 -S000005993 ORF Verified YPL072W UBP16 putative ubiquitin-specific protease UBP16 chromosome 16 L000004590 16 418512 420011 W 2011-02-03 1996-07-31 Deubiquitinating enzyme anchored to the outer mitochondrial membrane; probably not important for general mitochondrial functioning, but may perform a more specialized function at mitochondria -S000036526 CDS YPL072W 16 418512 420011 W 2011-02-03 1996-07-31 -S000005994 ORF Dubious YPL073C chromosome 16 16 418984 418499 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with verified gene UBP16/YPL072W; may interact with ribosome based on co-purification experiments -S000036568 CDS YPL073C 16 418984 418499 C 2011-02-03 1996-07-31 -S000005992 ORF Uncharacterized YPL071C chromosome 16 16 420518 420048 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000035569 CDS YPL071C 16 420518 420048 C 2011-02-03 1996-07-31 -S000005991 ORF Verified YPL070W MUK1 guanine nucleotide exchange factor MUK1 chromosome 16 16 420948 422786 W 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF); involved in vesicle-mediated vacuolar transport, including Golgi-endosome trafficking and sorting through the multivesicular body (MVB); specifically stimulates the intrinsic guanine nucleotide exchange activity of Rab family members (Vps21p/Ypt52p/Ypt53p); partially redundant with GEF VPS9; required for localization of the CORVET complex to endosomes; contains a VPS9 domain -S000035514 CDS YPL070W 16 420948 422786 W 2011-02-03 1996-07-31 -S000130200 ARS ARS1620 chromosome 16 16 422786 422885 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000005990 ORF Verified YPL069C BTS1 farnesyltranstransferase chromosome 16 L000003062 16 423892 422885 C 2011-02-03 1996-07-31 Geranylgeranyl diphosphate synthase (GGPS); increases the intracellular pool of geranylgeranyl diphosphate, suppressor of bet2 mutation that causes defective geranylgeranylation of small GTP-binding proteins that mediate vesicular traffic -S000035752 CDS YPL069C 16 423892 422885 C 2011-02-03 1996-07-31 -S000005989 ORF Uncharacterized YPL068C chromosome 16 16 425096 424215 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and is induced in response to the DNA-damaging agent MMS -S000035679 CDS YPL068C 16 425096 424215 C 2011-02-03 1996-07-31 -S000005988 ORF Uncharacterized YPL067C chromosome 16 16 425847 425251 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YPL067C is not an essential gene -S000034754 CDS YPL067C 16 425847 425251 C 2011-02-03 1996-07-31 -S000005987 ORF Verified YPL066W RGL1 chromosome 16 16 426233 427672 W 2011-02-03 1996-07-31 Regulator of Rho1p signaling, cofactor of Tus1p; required for the localization of Tus1p during all phases of cytokinesis; green fluorescent protein (GFP)-fusion protein localizes to the bud neck and cytoplasm; null mutant is viable and exhibits growth defect on a non-fermentable (respiratory) carbon source -S000034712 CDS YPL066W 16 426233 427672 W 2011-02-03 1996-07-31 -S000005986 ORF Verified YPL065W VPS28 ESCRT-I subunit protein VPS28|VPL13|VPT28 chromosome 16 L000003228 16 427927 428655 W 2011-02-03 1996-07-31 Component of the ESCRT-I complex; complex is involved in ubiquitin-dependent sorting of proteins into the endosome; conserved C-terminal domain interacts with ESCRT-III subunit Vps20p; other members include Stp22p, Srn2p, Vps28p, and Mvb12p -S000034662 CDS YPL065W 16 427927 428655 W 2011-02-03 1996-07-31 -S000005985 ORF Verified YPL064C CWC27 putative peptidylprolyl isomerase CWC27 chromosome 16 16 429616 428711 C 2011-02-03 1996-07-31 Component of a complex containing Cef1p; putatively involved in pre-mRNA splicing; has similarity to S. pombe Cwf27p; protein abundance increases in response to DNA replication stress -S000034538 CDS YPL064C 16 429616 428711 C 2011-02-03 1996-07-31 -S000005984 ORF Verified YPL063W TIM50 protein translocase subunit TIM50 chromosome 16 16 429939 431369 W 2011-02-03 1996-07-31 Essential component of the TIM23 complex; acts as receptor for the translocase of the inner mitochondrial membrane (TIM23) complex guiding incoming precursors from the TOM complex; may control the gating of the Tim23p-Tim17p channel -S000034464 CDS YPL063W 16 429939 431369 W 2011-02-03 1996-07-31 -S000005983 ORF Dubious YPL062W chromosome 16 16 431895 432299 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YPL062W is not an essential gene; homozygous diploid mutant shows a decrease in glycogen accumulation -S000032441 CDS YPL062W 16 431895 432299 W 2011-02-03 1996-07-31 -S000005982 ORF Verified YPL061W ALD6 aldehyde dehydrogenase (NADP(+)) ALD6|ALD1 chromosome 16 L000003206 16 432588 434090 W 2011-02-03 1996-07-31 Cytosolic aldehyde dehydrogenase; activated by Mg2+ and utilizes NADP+ as the preferred coenzyme; required for conversion of acetaldehyde to acetate; constitutively expressed; locates to the mitochondrial outer surface upon oxidative stress -S000032358 CDS YPL061W 16 432588 434090 W 2011-02-03 1996-07-31 -S000005981 ORF Verified YPL060W MFM1 LPE10 chromosome 16 16 434523 435764 W 2011-02-03 1996-07-31 Mitochondrial inner membrane magnesium transporter; involved in maintenance of mitochondrial magnesium concentrations and membrane potential; indirectly affects splicing of group II introns; functionally and structurally related to Mrs2p -S000032240 CDS YPL060W 16 434523 435764 W 2011-02-03 1996-07-31 -S000006528 tRNA_gene tC(GCA)P1 chromosome 16 L000003734 16 435964 435893 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis -S000037832 noncoding_exon tC(GCA)P1 16 435964 435893 C 2011-02-03 2000-05-19 -S000007196 long_terminal_repeat YPLWdelta9 chromosome 16 16 436068 436249 W 2011-02-03 2000-05-19 Ty1 LTR -S000007185 long_terminal_repeat YPLCdelta10 chromosome 16 16 436587 436250 C 2011-02-03 2000-05-19 Ty1 LTR -S000007197 long_terminal_repeat YPLWdelta11 chromosome 16 16 436594 436731 W 2011-02-03 2000-05-19 Ty1 LTR -S000007186 long_terminal_repeat YPLCtau1 chromosome 16 16 437260 436890 C 2011-02-03 2000-05-19 Ty4 LTR -S000007388 transposable_element_gene YPL060C-A chromosome 16 16 442742 437333 C 2015-01-13 1999-07-17|2014-11-18|2015-01-13 TyA Gag protein; the main structural constituent of virus-like particles (VLPs); Gag processing produces capsid proteins -S000178189 CDS YPL060C-A 16 439427 437333 C 2015-01-13 2014-11-18|2015-01-13 -S000036843 CDS YPL060C-A 16 442742 439429 C 2015-01-13 1999-07-17|2015-01-13 -S000178188 plus_1_translational_frameshift YPL060C-A 16 439428 439428 C 2015-01-13 2014-11-18|2015-01-13 -S000007188 LTR_retrotransposon YPLCTy4-1 Ty4 chromosome 16 16 443112 436890 C 2011-02-03 2000-05-19 Ty4 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007187 long_terminal_repeat YPLCtau2 chromosome 16 16 443112 442742 C 2011-02-03 2000-05-19 Ty4 LTR -S000005980 ORF Verified YPL059W GRX5 monothiol glutaredoxin GRX5 chromosome 16 S000007446 16 444579 445031 W 2011-02-03 1996-07-31 Glutathione-dependent oxidoreductase; mitochondrial matrix protein involved at an early step in the biogenesis of iron-sulfur centers along with Bol1p; hydroperoxide and superoxide-radical responsive; monothiol glutaredoxin subfamily member along with Grx3p and Grx4p -S000031521 CDS YPL059W 16 444579 445031 W 2011-02-03 1996-07-31 -S000005979 ORF Verified YPL058C PDR12 ATP-binding cassette multidrug transporter PDR12 chromosome 16 L000003205 16 450377 445842 C 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; weak-acid-inducible multidrug transporter required for weak organic acid resistance; induced by sorbate and benzoate and regulated by War1p; mutants exhibit sorbate hypersensitivity -S000031386 CDS YPL058C 16 450377 445842 C 2011-02-03 1996-07-31 -S000005978 ORF Verified YPL057C SUR1 mannosylinositol phosphorylceramide synthase catalytic subunit SUR1|LPE15|CSG1|BCL21 chromosome 16 L000002243 16 453057 451909 C 2011-02-03 1996-07-31 Mannosylinositol phosphorylceramide (MIPC) synthase catalytic subunit; forms a complex with regulatory subunit Csg2p; function in sphingolipid biosynthesis is overlapping with that of Csh1p; SUR1 has a paralog, CSH1, that arose from the whole genome duplication -S000031334 CDS YPL057C 16 453057 451909 C 2011-02-03 1996-07-31 -S000005977 ORF Uncharacterized YPL056C LCL1 chromosome 16 16 453735 453430 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant is fluconazole resistant and has long chronological lifespan -S000030453 CDS YPL056C 16 453735 453430 C 2011-02-03 1996-07-31 -S000005976 ORF Verified YPL055C LGE1 chromosome 16 16 454990 453992 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant forms abnormally large cells, and homozygous diploid null mutant displays delayed premeiotic DNA synthesis and reduced efficiency of meiotic nuclear division -S000030299 CDS YPL055C 16 454990 453992 C 2011-02-03 1996-07-31 -S000005975 ORF Verified YPL054W LEE1 chromosome 16 L000002859 16 455759 456664 W 2011-02-03 1996-07-31 Zinc-finger protein of unknown function -S000030275 CDS YPL054W 16 455759 456664 W 2011-02-03 1996-07-31 -S000119038 ARS ARS1633 ARSXVI-457|ARS1620.5 chromosome 16 16 456563 456810 2011-02-03 2006-10-04 Autonomously Replicating Sequence -S000005974 ORF Verified YPL053C KTR6 putative mannosyltransferase|MNN6 chromosome 16 L000003131 16 458458 457118 C 2011-02-03 1996-07-31 Probable mannosylphosphate transferase; involved in the synthesis of core oligosaccharides in protein glycosylation pathway; member of the KRE2/MNT1 mannosyltransferase family; KTR6 has a paralog, KRE2, that arose from the whole genome duplication -S000036430 CDS YPL053C 16 458458 457118 C 2011-02-03 1996-07-31 -S000005973 ORF Verified YPL052W OAZ1 YPL052W-A chromosome 16 16 458799 459678 W 2011-02-03 1996-07-31|2005-12-14 Regulator of ornithine decarboxylase Spe1p; antizyme that binds to Spe1p to stimulate ubiquitin-independent degradation by the proteasome; binding of polyamines to nascent Oaz1p during translation stimulates +1 ribosomal frameshifting, allowing translation of full-length Oaz1p -S000036401 CDS YPL052W 16 458799 459005 W 2011-02-03 1996-07-31|2005-12-14 -S000113788 CDS YPL052W 16 459007 459678 W 2011-02-03 2005-12-14 -S000113787 plus_1_translational_frameshift YPL052W 16 459006 459006 W 2011-02-03 2005-12-14 -S000005972 ORF Verified YPL051W ARL3 Arf family GTPase ARL3 chromosome 16 L000004809 16 459963 460559 W 2011-02-03 1996-07-31 ARF-like small GTPase of the RAS superfamily; required for recruitment of Arl1p, a GTPase that regulates membrane traffic, to the Golgi apparatus; NatC-catalyzed N-terminal acetylation regulates Golgi membrane association mediated by interaction with membrane receptor, Sys1p; similar to ADP-ribosylation factor and orthologous to mammalian ARFRP1 -S000036285 CDS YPL051W 16 459963 460559 W 2011-02-03 1996-07-31 -S000005971 ORF Verified YPL050C MNN9 mannosyltransferase complex subunit MNN9 chromosome 16 L000001129 16 461966 460779 C 2011-02-03 1996-07-31 Subunit of Golgi mannosyltransferase complex; this complex mediates elongation of the polysaccharide mannan backbone; forms a separate complex with Van1p that is also involved in backbone elongation; this complex also contains Anp1p, Mnn10p, Mnn11p, and Hoc1p -S000036103 CDS YPL050C 16 461966 460779 C 2011-02-03 1996-07-31 -S000005970 ORF Verified YPL049C DIG1 RST1 chromosome 16 L000003122 16 463839 462481 C 2011-02-03 1996-07-31 MAP kinase-responsive inhibitor of the Ste12p transcription factor; involved in the regulation of mating-specific genes and the invasive growth pathway; related regulators Dig1p and Dig2p bind to Ste12p; DIG1 has a paralog, DIG2, that arose from the whole genome duplication -S000036451 CDS YPL049C 16 463839 462481 C 2011-02-03 1996-07-31 -S000005969 ORF Verified YPL048W CAM1 translation elongation factor EF1B gamma|CPBP|TEF3 chromosome 16 L000000212|L000002279 16 464401 465648 W -27.3 2011-02-03 1996-07-31 One of two isoforms of the gamma subunit of eEF1B; stimulates the release of GDP from eEF1A (Tef1p/Tef2p) post association with the ribosomal complex with eEF1Balpha subunit; nuclear protein required for transcription of MXR1; binds the MXR1 promoter in the presence of other nuclear factors; binds calcium and phospholipids -S000035577 CDS YPL048W 16 464401 465648 W 2011-02-03 1996-07-31 -S000005968 ORF Verified YPL047W SGF11 SAGA histone acetyltransferase complex subunit SGF11 chromosome 16 16 465962 466261 W 2011-02-03 1996-07-31 Integral subunit of SAGA histone acetyltransferase complex; regulates transcription of a subset of SAGA-regulated genes, required for the Ubp8p association with SAGA and for H2B deubiquitylation -S000035515 CDS YPL047W 16 465962 466261 W 2011-02-03 1996-07-31 -S000005967 ORF Verified YPL046C ELC1 elongin C chromosome 16 L000004351 16 466943 466644 C 2011-02-03 1996-07-31 Elongin C, conserved among eukaryotes; forms a complex with Cul3p that polyubiquitylates monoubiquitylated RNA polymerase II to trigger its proteolysis; plays a role in global genomic repair -S000035426 CDS YPL046C 16 466943 466644 C 2011-02-03 1996-07-31 -S000005966 ORF Verified YPL045W VPS16 tethering complex subunit VPS16|CVT15|VPT16|VAM9|SVL6 chromosome 16 L000002471|L000003119|L000004766|S000029128 16 467260 469656 W 2011-02-03 1996-07-31 Subunit of the HOPS and the CORVET complexes; part of the Class C Vps complex essential for membrane docking and fusion at Golgi-to-endosome and endosome-to-vacuole protein transport stages -S000035390 CDS YPL045W 16 467260 469656 W 2011-02-03 1996-07-31 -S000005964 ORF Verified YPL043W NOP4 mRNA-binding ribosome biosynthesis protein NOP4|NOP77 chromosome 16 L000001262|L000001263 16 469939 471996 W 2011-02-03 1996-07-31 Nucleolar protein; essential for processing and maturation of 27S pre-rRNA and large ribosomal subunit biogenesis; constituent of 66S pre-ribosomal particles; contains four RNA recognition motifs (RRMs) -S000034348 CDS YPL043W 16 469939 471996 W 2011-02-03 1996-07-31 -S000005965 ORF Dubious YPL044C chromosome 16 16 470474 469926 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene NOP4/YPL043W -S000034376 CDS YPL044C 16 470474 469926 C 2011-02-03 1996-07-31 -S000005963 ORF Verified YPL042C SSN3 cyclin-dependent serine/threonine protein kinase SSN3|URR1|SSX7|CDK8|RYE5|UME5|SRB10|NUT7|GIG2 chromosome 16 L000002795|S000029631|L000002443|S000029520|L000002103 16 474707 473040 C 2011-02-03 1996-07-31 Cyclin-dependent protein kinase; component of RNA polymerase II holoenzyme; involved in phosphorylation of the RNA polymerase II C-terminal domain; involved in glucose repression -S000034254 CDS YPL042C 16 474707 473040 C 2011-02-03 1996-07-31 -S000005962 ORF Uncharacterized YPL041C MRX11 chromosome 16 16 475741 475118 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; SWAT-GFP and mCherry fusion proteins localize to the mitochondria; involved in maintenance of telomere length -S000034145 CDS YPL041C 16 475741 475118 C 2011-02-03 1996-07-31 -S000005961 ORF Verified YPL040C ISM1 isoleucine--tRNA ligase ISM1 chromosome 16 L000002648 16 479001 475993 C 2011-02-03 1996-07-31 Mitochondrial isoleucyl-tRNA synthetase; null mutant is deficient in respiratory growth; human homolog IARS2 implicated in mitochondrial diseases, can partially complement yeast null mutant -S000032140 CDS YPL040C 16 479001 475993 C 2011-02-03 1996-07-31 -S000005960 ORF Uncharacterized YPL039W chromosome 16 16 479225 480175 W 2011-02-03 1996-07-31 Putative protein of unknown function; YPL039W is not an essential gene -S000033263 CDS YPL039W 16 479225 480175 W 2011-02-03 1996-07-31 -S000028588 ORF Uncharacterized YPL038W-A chromosome 16 16 480182 480373 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031340 CDS YPL038W-A 16 480182 480373 W 2011-02-03 2003-07-29 -S000005959 ORF Verified YPL038W MET31 chromosome 16 L000003469 16 480535 481068 W 2011-02-03 1996-07-31 Zinc-finger DNA-binding transcription factor; targets strong transcriptional activator Met4p to promoters of sulfur metabolic genes; involved in transcriptional regulation of the methionine biosynthetic genes; feedforward loop controlling expression of MET32 and the lack of such a loop for MET31 may account for the differential actions of Met31p and Met32p; MET31 has a paralog, MET32, that arose from the whole genome duplication -S000032414 CDS YPL038W 16 480535 481068 W 2011-02-03 1996-07-31 -S000005958 ORF Verified YPL037C EGD1 chromosome 16 L000000545 16 481901 481428 C 2011-02-03 1996-07-31 Subunit beta1 of the nascent polypeptide-associated complex (NAC); involved in protein targeting, associated with cytoplasmic ribosomes; enhances DNA binding of the Gal4p activator; homolog of human BTF3b; EGD1 has a paralog, BTT1, that arose from the whole genome duplication -S000032253 CDS YPL037C 16 481901 481428 C 2011-02-03 1996-07-31 -S000005957 ORF Verified YPL036W PMA2 H(+)-exporting P2-type ATPase PMA2 chromosome 16 L000001450 16 482843 485686 W 2011-02-03 1996-07-31 Plasma membrane H+-ATPase; isoform of Pma1p, involved in pumping protons out of the cell; regulator of cytoplasmic pH and plasma membrane potential -S000032226 CDS YPL036W 16 482843 485686 W 2011-02-03 1996-07-31 -S000005955 ORF Uncharacterized YPL034W chromosome 16 16 486712 487209 W 2011-02-03 1996-07-31 Putative protein of unknown function; YPL034W is not essential gene -S000031184 CDS YPL034W 16 486712 487209 W 2011-02-03 1996-07-31 -S000005956 ORF Dubious YPL035C chromosome 16 16 486911 486564 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YPL034W; YPL035C is not an essential gene -S000031189 CDS YPL035C 16 486911 486564 C 2011-02-03 1996-07-31 -S000005954 ORF Verified YPL033C SRL4 chromosome 16 16 488207 487362 C 2011-02-03 1996-07-31 Protein of unknown function; involved in regulation of dNTP production; null mutant suppresses the lethality of lcd1 and rad53 mutations; expression is induced by Kar4p -S000031014 CDS YPL033C 16 488207 487362 C 2011-02-03 1996-07-31 -S000005953 ORF Verified YPL032C SVL3 chromosome 16 L000004235 16 491364 488887 C 2011-02-03 1996-07-31 Protein of unknown function; mutant phenotype suggests a potential role in vacuolar function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery, cytoplasm, bud, and bud neck; relocalizes from bud neck to cytoplasm upon DNA replication stress; SVL3 has a paralog, PAM1, that arose from the whole genome duplication -S000030938 CDS YPL032C 16 491364 488887 C 2011-02-03 1996-07-31 -S000005952 ORF Verified YPL031C PHO85 cyclin-dependent serine/threonine-protein kinase PHO85|phoU|LDB15 chromosome 16 L000001431 16 493037 492018 C -34 2011-02-03 1996-07-31 Cyclin-dependent kinase; has ten cyclin partners; involved in regulating the cellular response to nutrient levels and environmental conditions and progression through the cell cycle; human lissencephaly-associated homolog CDK5 functionally complements null mutation -S000029949 CDS YPL031C 16 492918 492018 C 2011-02-03 1996-07-31 -S000029948 CDS YPL031C 16 493037 493021 C 2011-02-03 1996-07-31 -S000029950 intron YPL031C 16 493020 492919 C 2011-02-03 1996-07-31 -S000005951 ORF Verified YPL030W TRM44 tRNA (uracil) methyltransferase chromosome 16 16 493543 495246 W 2011-02-03 1996-07-31 tRNA(Ser) Um(44) 2'-O-methyltransferase; involved in maintaining levels of the tRNA-Ser species tS(CGA) and tS(UGA); conserved among metazoans and fungi but there does not appear to be a homolog in plants; TRM44 is a non-essential gene -S000029895 CDS YPL030W 16 493543 495246 W 2011-02-03 1996-07-31 -S000005950 ORF Verified YPL029W SUV3 ATP-dependent RNA helicase SUV3|LPB2 chromosome 16 L000002247 16 495506 497719 W 2011-02-03 1996-07-31 ATP-dependent RNA helicase; component of the mitochondrial degradosome along with the RNase Dss1p; the degradosome associates with the ribosome and mediates RNA turnover; also required during splicing of the COX1 AI5_beta intron; expression of a processed form of human homolog SUPV3L1 carrying an N-terminal deletion of 46 amino acids rescues yeast suv3 null mutant -S000037169 CDS YPL029W 16 495506 497719 W 2011-02-03 1996-07-31 -S000005949 ORF Verified YPL028W ERG10 acetyl-CoA C-acetyltransferase|TSM0115|LPB3 chromosome 16 L000000576 16 498096 499292 W -22 2011-02-03 1996-07-31 Acetyl-CoA C-acetyltransferase (acetoacetyl-CoA thiolase); cytosolic enzyme that transfers an acetyl group from one acetyl-CoA molecule to another, forming acetoacetyl-CoA; involved in the first step in mevalonate biosynthesis; human ACAT1 functionally complements the growth defect caused by repression of ERG10 expression -S000037054 CDS YPL028W 16 498096 499292 W 2011-02-03 1996-07-31 -S000005948 ORF Verified YPL027W SMA1 chromosome 16 16 499665 500402 W 2011-02-03 1996-07-31 Protein of unknown function involved in prospore membrane assembly; involved in the assembly of the prospore membrane during sporulation; interacts with Spo14p -S000036999 CDS YPL027W 16 499665 500402 W 2011-02-03 1996-07-31 -S000005947 ORF Verified YPL026C SKS1 putative serine/threonine protein kinase SKS1|SHA3 chromosome 16 L000004139|L000002824 16 502183 500675 C 2011-02-03 1996-07-31 Putative serine/threonine protein kinase; involved in the adaptation to low concentrations of glucose independent of the SNF3 regulated pathway; SKS1 has a paralog, VHS1, that arose from the whole genome duplication -S000036265 CDS YPL026C 16 502183 500675 C 2011-02-03 1996-07-31 -S000005946 ORF Dubious YPL025C chromosome 16 16 503030 502473 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036171 CDS YPL025C 16 503030 502473 C 2011-02-03 1996-07-31 -S000005945 ORF Verified YPL024W RMI1 NCE4 chromosome 16 L000004399 16 503517 504242 W 2011-02-03 1996-07-31 Subunit of the RecQ (Sgs1p) - Topo III (Top3p) complex; stimulates superhelical relaxing, DNA catenation/decatenation and ssDNA binding activities of Top3p; involved in response to DNA damage; functions in S phase-mediated cohesion establishment via a pathway involving the Ctf18-RFC complex and Mrc1p; stimulates Top3p DNA catenation/decatenation activity; null mutants display increased rates of recombination and delayed S phase -S000036120 CDS YPL024W 16 503517 504242 W 2011-02-03 1996-07-31 -S000005944 ORF Verified YPL023C MET12 methylenetetrahydrofolate reductase (NAD(P)H) MET12 chromosome 16 L000003571 16 506312 504339 C 2011-02-03 1996-07-31 Protein with MTHFR activity in vitro; null mutant has no phenotype and is prototrophic for methionine; MET13 encodes major isozyme of methylenetetrahydrofolate reductase (MTHFR) -S000035195 CDS YPL023C 16 506312 504339 C 2011-02-03 1996-07-31 -S000005943 ORF Verified YPL022W RAD1 RAD12|ssDNA endodeoxyribonuclease RAD1|LPB9 chromosome 16 L000001555 16 506697 509999 W -18 2011-02-03 1996-07-31 Single-stranded DNA endonuclease (with Rad10p); cleaves single-stranded DNA during nucleotide excision repair and double-strand break repair; subunit of Nucleotide Excision Repair Factor 1 (NEF1); homolog of human XPF protein -S000035144 CDS YPL022W 16 506697 509999 W 2011-02-03 1996-07-31 -S000005942 ORF Verified YPL021W ECM23 SRD2 chromosome 16 L000003366 16 511101 511664 W 2011-02-03 1996-07-31 Non-essential protein of unconfirmed function; affects pre-rRNA processing, may act as a negative regulator of the transcription of genes involved in pseudohyphal growth; homologous to Srd1p -S000035028 CDS YPL021W 16 511101 511664 W 2011-02-03 1996-07-31 -S000118417 ARS ARS1621 ARSXVI-512 chromosome 16 16 511636 511793 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178195 ARS_consensus_sequence ARS1621 16 511704 511720 W 2014-11-18 2014-11-18 -S000005941 ORF Verified YPL020C ULP1 SUMO protease ULP1|NIB1 chromosome 16 S000029323|L000001249 16 514178 512313 C 2011-02-03 1996-07-31 Protease that specifically cleaves Smt3p protein conjugates; required for cell cycle progression; associates with nucleoporins and may interact with septin rings during telophase; sequestered to the nucleolus under stress conditions -S000034812 CDS YPL020C 16 514178 512313 C 2011-02-03 1996-07-31 -S000005940 ORF Verified YPL019C VTC3 vacuolar transporter chaperone|PHM2 chromosome 16 S000007512 16 517018 514511 C 2011-02-03 1996-07-31 Regulatory subunit of the vacuolar transporter chaperone (VTC) complex; involved in membrane trafficking, vacuolar polyphosphate accumulation, microautophagy and non-autophagic vacuolar fusion; VTC3 has a paralog, VTC2, that arose from the whole genome duplication -S000032833 CDS YPL019C 16 517018 514511 C 2011-02-03 1996-07-31 -S000005939 ORF Verified YPL018W CTF19 MCM18 chromosome 16 L000003420 16 517651 518760 W 2011-02-03 1996-07-31 Outer kinetochore protein, needed for accurate chromosome segregation; component of kinetochore sub-complex COMA (Ctf19p, Okp1p, Mcm21p, Ame1p) that functions as platform for kinetochore assembly; required for spindle assembly checkpoint; minimizes potentially deleterious centromere-proximal crossovers by preventing meiotic DNA break formation proximal to centromere; homolog of human centromere constitutive-associated network (CCAN) subunit CENP-P and fission yeast fta2 -S000031967 CDS YPL018W 16 517651 518760 W 2011-02-03 1996-07-31 -S000005938 ORF Verified YPL017C IRC15 chromosome 16 16 520233 518734 C 2011-02-03 1996-07-31 Microtubule associated protein; regulates microtubule dynamics; required for accurate meiotic chromosome segregation; null mutant displays large budded cells due to delayed mitotic progression, increased levels of spontaneous Rad52 foci; IRC15 has a paralog, LPD1, that arose from the whole genome duplication -S000031777 CDS YPL017C 16 520233 518734 C 2011-02-03 1996-07-31 -S000005937 ORF Verified YPL016W SWI1 [SWI(+)]|[SWI+]|LPA1|GAM3|ADR6 chromosome 16 L000000052|L000002250 16 521014 524958 W 2011-02-03 1996-07-31|2011-02-03 Subunit of the SWI/SNF chromatin remodeling complex; regulates transcription by remodeling chromatin; required for transcription of many genes, including ADH1, ADH2, GAL1, HO, INO1 and SUC2; self-assembles to form [SWI+] prion and to alter expression pattern; human homolog ARID1A is a candidate tumor suppressor gene in breast cancer -S000031725 CDS YPL016W 16 521014 524958 W 2011-02-03 1996-07-31|2011-02-03 -S000005936 ORF Verified YPL015C HST2 histone deacetylase HST2 chromosome 16 L000003041 16 526883 525810 C 2011-02-03 1996-07-31 Cytoplasmic NAD(+)-dependent protein deacetylase; deacetylation targets are primarily cytoplasmic proteins; member of the silencing information regulator 2 (Sir2) family of NAD(+)-dependent protein deacetylases; modulates nucleolar (rDNA) and telomeric silencing; possesses NAD(+)-dependent histone deacetylase activity in vitro; contains a nuclear export signal (NES); function regulated by its nuclear export -S000031593 CDS YPL015C 16 526883 525810 C 2011-02-03 1996-07-31 -S000005935 ORF Verified YPL014W CIP1 chromosome 16 16 527547 528692 W 2011-02-03 1996-07-31 Cyclin-dependent kinase inhibitor; interacts with and inhibits the Cdc28p/Cln2p, G1/S phase cyclin-dependent kinase complex but not S-phase, or M-phase complexes; overexpression blocks cells in G1 phase and stabilizes the Cdc28p inhibitor Sic1p, while disruption accelerates the G1/S phase transition; phosphorylated during S phase in a Cdc28p-dependent manner; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to the nucleus -S000031551 CDS YPL014W 16 527547 528692 W 2011-02-03 1996-07-31 -S000005934 ORF Verified YPL013C MRPS16 mitochondrial 37S ribosomal protein MRPS16 chromosome 16 16 529350 528985 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000030647 CDS YPL013C 16 529350 528985 C 2011-02-03 1996-07-31 -S000005933 ORF Verified YPL012W RRP12 mRNA-binding protein RRP12 chromosome 16 16 529723 533409 W 2011-02-03 1996-07-31 Protein required for export of the ribosomal subunits; associates with the RNA components of the pre-ribosomes; has a role in nuclear import in association with Pse1p; also plays a role in the cell cycle and the DNA damage response; contains HEAT-repeats -S000030606 CDS YPL012W 16 529723 533409 W 2011-02-03 1996-07-31 -S000005932 ORF Verified YPL011C TAF3 TafII47|TAF47 chromosome 16 L000004154 16 534703 533642 C 2011-02-03 1996-07-31 TFIID subunit (47 kDa); involved in promoter binding and RNA polymerase II transcription initiation -S000030495 CDS YPL011C 16 534703 533642 C 2011-02-03 1996-07-31 -S000005931 ORF Verified YPL010W RET3 coatomer subunit zeta chromosome 16 L000004128 16 535018 535587 W 2011-02-03 1996-07-31 Zeta subunit of the coatomer complex (COPI); COPI coats Golgi-derived transport vesicles; involved in retrograde transport between Golgi and ER -S000030459 CDS YPL010W 16 535018 535587 W 2011-02-03 1996-07-31 -S000005930 ORF Verified YPL009C RQC2 TAE2 chromosome 16 16 538936 535820 C 2011-02-03 1996-07-31 Component of RQC, which mediates nascent chain degradation; RQC (ribosome quality control complex) is a ribosome-bound complex required for degradation of polypeptides arising from stalled translation; recruits alanine- and threonine-charged tRNA to the A site and directs the elongation of nascent chains independently of mRNA or 40S subunits; monitors translation stress and signals this to Hsf1p -S000037295 CDS YPL009C 16 538936 535820 C 2011-02-03 1996-07-31 -S000005929 ORF Verified YPL008W CHL1 MCM12|LPA9|CTF1 chromosome 16 L000000318 16 539385 541970 W -6 2011-02-03 1996-07-31 Probable DNA helicase; involved in sister-chromatid cohesion and genome integrity and interstrand cross-link repair; interacts with ECO1 and CTF18; mutants are defective in silencing, rDNA recombination, aging and the heat shock response; FANCJ-like helicase family member; mutations in the human homolog, DDX11/ChLR1, cause Warsaw breakage syndrome -S000037256 CDS YPL008W 16 539385 541970 W 2011-02-03 1996-07-31 -S000005928 ORF Verified YPL007C TFC8 transcription factor TFIIIC subunit TFC8|tau 60 chromosome 16 16 543848 542082 C 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of RNA polymerase III transcription initiation factor complex (TFIIIC); part of TFIIIC TauB domain that binds BoxB promoter sites of tRNA and other genes; linker between TauB and TauA domains; human homolog is TFIIIC-90 -S000036517 CDS YPL007C 16 543848 542082 C 2011-02-03 1996-07-31 -S000005927 ORF Verified YPL006W NCR1 sphingolipid transporter chromosome 16 L000003596 16 544631 548143 W 2011-02-03 1996-07-31 Vacuolar membrane protein; transits through the biosynthetic vacuolar protein sorting pathway, involved in sphingolipid metabolism; cells lacking Ncr1p exhibit high levels of long chain bases (LCB), similar to the accumulation of high amounts of lipids observed in patients with Neimann-Pick C, a disease caused by loss-of-function mutations in NPC1, the functional ortholog of Ncr1p -S000036461 CDS YPL006W 16 544631 548143 W 2011-02-03 1996-07-31 -S000005926 ORF Verified YPL005W AEP3 chromosome 16 16 548486 550306 W 2011-02-03 1996-07-31 Peripheral mitochondrial inner membrane protein; may facilitate use of unformylated tRNA-Met in mitochondrial translation initiation; stabilizes the bicistronic AAP1-ATP6 mRNA -S000036393 CDS YPL005W 16 548486 550306 W 2011-02-03 1996-07-31 -S000005925 ORF Verified YPL004C LSP1 lipid-binding protein LSP1 chromosome 16 16 551657 550632 C 2011-02-03 1996-07-31 Eisosome core component; eisosomes are large immobile patch structures at the cell cortex associated with endocytosis; phosphorylated on Thr233 upon Pkc1p hyperactivation in a Slt2p MAPK-dependent fashion; null mutants show activation of Pkc1p/Ypk1p stress resistance pathways; member of the BAR domain family -S000035436 CDS YPL004C 16 551657 550632 C 2011-02-03 1996-07-31 -S000005924 ORF Verified YPL003W ULA1 ENR2 chromosome 16 L000004374 16 552020 553408 W 2011-02-03 1996-07-31 Protein that activates Rub1p (NEDD8) before neddylation; acts together with Uba3p; may play a role in protein degradation -S000035402 CDS YPL003W 16 552020 553408 W 2011-02-03 1996-07-31 -S000005923 ORF Verified YPL002C SNF8 ESCRT-II subunit protein SNF8|VPL14|VPS22 chromosome 16 L000001951 16 554328 553627 C 2011-02-03 1996-07-31 Component of the ESCRT-II complex; ESCRT-II is involved in ubiquitin-dependent sorting of proteins into the endosome; appears to be functionally related to SNF7; involved in glucose derepression -S000035294 CDS YPL002C 16 554328 553627 C 2011-02-03 1996-07-31 -S000005922 ORF Verified YPL001W HAT1 histone acetyltransferase catalytic subunit HAT1|KAT1 chromosome 16 L000003002 16 554605 555729 W 2011-02-03 1996-07-31 Catalytic subunit of the Hat1p-Hat2p histone acetyltransferase complex; uses the cofactor acetyl coenzyme A to acetylate free nuclear and cytoplasmic histone H4; involved in telomeric silencing and DNA double-strand break repair -S000035246 CDS YPL001W 16 554605 555729 W 2011-02-03 1996-07-31 -S000006477 centromere CEN16 CEN16 chromosome 16 L000000309 16 555957 556073 W 0 2011-02-03 2000-05-19|2006-05-09 Chromosome XVI centromere -S000077281 centromere_DNA_Element_I CEN16 16 555957 555966 W 2011-02-03 2004-10-05 -S000077282 centromere_DNA_Element_II CEN16 16 555967 556048 W 2011-02-03 2004-10-05 -S000077283 centromere_DNA_Element_III CEN16 16 556049 556073 W 2011-02-03 2004-10-05 -S000006205 ORF Verified YPR001W CIT3 citrate (Si)-synthase CIT3 chromosome 16 L000002855 16 556377 557837 W 2011-02-03 1996-07-31 Dual specificity mitochondrial citrate and methylcitrate synthase; catalyzes the condensation of acetyl-CoA and oxaloacetate to form citrate and that of propionyl-CoA and oxaloacetate to form 2-methylcitrate -S000030627 CDS YPR001W 16 556377 557837 W 2011-02-03 1996-07-31 -S000006206 ORF Verified YPR002W PDH1 putative 2-methylcitrate dehydratase chromosome 16 16 558385 559935 W 2011-02-03 1996-07-31 Putative 2-methylcitrate dehydratase; mitochondrial protein that participates in respiration; induced by diauxic shift; homologous to E. coli PrpD, may take part in the conversion of 2-methylcitrate to 2-methylisocitrate -S000030711 CDS YPR002W 16 558385 559935 W 2011-02-03 1996-07-31 -S000006570 tRNA_gene tF(GAA)P1 chromosome 16 L000003733 16 560289 560198 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035230 intron tF(GAA)P1 16 560252 560234 C 2011-02-03 2000-05-19 -S000035229 noncoding_exon tF(GAA)P1 16 560233 560198 C 2011-02-03 2000-05-19 -S000035228 noncoding_exon tF(GAA)P1 16 560289 560253 C 2011-02-03 2000-05-19 -S000007210 long_terminal_repeat YPRWdelta12 chromosome 16 16 560481 560812 W 2011-02-03 2000-05-19 Ty1 LTR -S000007254 ORF Dubious YPR002C-A chromosome 16 16 560766 560569 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the Ty1 long terminal repeat, YPRWdelta12 -S000031182 CDS YPR002C-A 16 560766 560569 C 2011-02-03 1999-07-17 -S000006207 ORF Uncharacterized YPR003C chromosome 16 16 563768 561504 C 2011-02-03 1996-07-31 Putative sulfate permease; physically interacts with Hsp82p; green fluorescent protein (GFP)-fusion protein localizes to the ER; YPR003C is not an essential gene -S000031534 CDS YPR003C 16 563768 561504 C 2011-02-03 1996-07-31 -S000118418 ARS ARS1622 ARSXVI-564 chromosome 16 16 563852 563967 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178196 ARS_consensus_sequence ARS1622 16 563877 563893 W 2014-11-18 2014-11-18 -S000006208 ORF Verified YPR004C AIM45 chromosome 16 16 565041 564007 C 2011-02-03 1996-07-31 Putative ortholog of mammalian ETF-alpha; interacts with frataxin, Yfh1p; null mutant displays elevated frequency of mitochondrial genome loss; may have a role in oxidative stress response; ETF-alpha is an electron transfer flavoprotein complex subunit -S000031622 CDS YPR004C 16 565041 564007 C 2011-02-03 1996-07-31 -S000119040 ARS ARS1634 ARSXVI-565|ARS1622.5 chromosome 16 16 565052 565294 2011-02-03 2006-10-04 Autonomously Replicating Sequence -S000006209 ORF Verified YPR005C HAL1 chromosome 16 L000000750 16 566671 565787 C 2011-02-03 1996-07-31 Cytoplasmic protein involved in halotolerance; decreases intracellular Na+ (via Ena1p) and increases intracellular K+ by decreasing efflux; expression repressed by Ssn6p-Tup1p and Sko1p and induced by NaCl, KCl, and sorbitol through Gcn4p -S000031706 CDS YPR005C 16 566671 565787 C 2011-02-03 1996-07-31 -S000006210 ORF Verified YPR006C ICL2 methylisocitrate lyase ICL2 chromosome 16 L000004095 16 568996 567269 C 2011-02-03 1996-07-31 2-methylisocitrate lyase of the mitochondrial matrix; functions in the methylcitrate cycle to catalyze the conversion of 2-methylisocitrate to succinate and pyruvate; ICL2 transcription is repressed by glucose and induced by ethanol -S000031857 CDS YPR006C 16 568996 567269 C 2011-02-03 1996-07-31 -S000006211 ORF Verified YPR007C REC8 SPO69 chromosome 16 L000004667 16 571378 569336 C 2011-02-03 1996-07-31 Meiosis-specific component of the sister chromatid cohesion complex; alpha-kleisin family member that maintains cohesion between sister chromatids during meiosis I; maintains cohesion between centromeres of sister chromatids until meiosis II; independent of its role in sister chromatid cohesion, Rec8p promotes allelic collisions and prevents nonspecific chromosome interactions; homolog of S. pombe Rec8p -S000032749 CDS YPR007C 16 571378 569336 C 2011-02-03 1996-07-31 -S000007200 long_terminal_repeat YPRCdelta13 chromosome 16 16 572173 571845 C 2011-02-03 2000-05-19 Ty1 LTR -S000006588 tRNA_gene tG(GCC)P1 chromosome 16 L000003721 16 572269 572339 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000031679 noncoding_exon tG(GCC)P1 16 572269 572339 W 2011-02-03 2000-05-19 -S000006212 ORF Verified YPR008W HAA1 chromosome 16 16 573018 575102 W 2011-02-03 1996-07-31 Transcriptional activator involved in adaptation to weak acid stress; activates transcription of TPO2, YRO2, and other genes encoding membrane stress proteins; HAA1 has a paralog, CUP2, that arose from the whole genome duplication; relocalizes from cytoplasm to nucleus upon DNA replication stress -S000032911 CDS YPR008W 16 573018 575102 W 2011-02-03 1996-07-31 -S000006213 ORF Verified YPR009W SUT2 chromosome 16 16 576552 577358 W 2011-02-03 1996-07-31 Zn2Cys6 family transcription factor; positively regulates sterol uptake under anaerobic conditions with SUT1; represses filamentation-inducing genes during non-starvation conditions; positively regulates mating along with SUT1 by repressing the expression of genes (PRR2, NCE102 and RHO5) which function as mating inhibitors; multicopy suppressor of mutations that cause low activity of the cAMP/PKA pathway; SUT2 has a paralog, SUT1, that arose from the whole genome duplication -S000033007 CDS YPR009W 16 576552 577358 W 2011-02-03 1996-07-31 -S000006214 ORF Verified YPR010C RPA135 DNA-directed RNA polymerase I core subunit RPA135|A135|SRP3|RRN2|RPA2 chromosome 16 L000001674 16 581196 577585 C 2011-02-03 1996-07-31 RNA polymerase I second largest subunit A135 -S000033628 CDS YPR010C 16 581196 577585 C 2011-02-03 1996-07-31 -S000006628 tRNA_gene tK(CUU)P chromosome 16 L000003722 16 582062 582134 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000036081 noncoding_exon tK(CUU)P 16 582062 582134 W 2011-02-03 2000-05-19 -S000122558 ORF Uncharacterized YPR010C-A chromosome 16 16 582734 582373 C 2011-02-03 2007-05-09 Putative protein of unknown function; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cytosol; conserved among Saccharomyces sensu stricto species -S000122561 CDS YPR010C-A 16 582558 582373 C 2011-02-03 2007-05-09 -S000122559 CDS YPR010C-A 16 582734 582702 C 2011-02-03 2007-05-09 -S000122560 intron YPR010C-A 16 582701 582559 C 2011-02-03 2007-05-09 -S000006215 ORF Verified YPR011C chromosome 16 16 584042 583062 C 2011-02-03 1996-07-31 Mitochondrial transporter; major substrates are adenosine 5'-phosphosulfate (APS) and 3'-phospho-adenosine 5'-phosphosulfate (PAPS); member of the mitochondrial carrier family; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033732 CDS YPR011C 16 584042 583062 C 2011-02-03 1996-07-31 -S000006216 ORF Dubious YPR012W chromosome 16 16 584309 584563 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YPR012W is not an essential gene -S000034684 CDS YPR012W 16 584309 584563 W 2011-02-03 1996-07-31 -S000006217 ORF Uncharacterized YPR013C CMR3 chromosome 16 16 585585 584632 C 2011-02-03 1996-07-31 Putative zinc finger protein; YPR013C is not an essential gene -S000034773 CDS YPR013C 16 585585 584632 C 2011-02-03 1996-07-31 -S000006218 ORF Dubious YPR014C chromosome 16 16 587518 587189 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YPR014C is not an essential gene -S000034892 CDS YPR014C 16 587518 587189 C 2011-02-03 1996-07-31 -S000006219 ORF Uncharacterized YPR015C chromosome 16 16 591026 590283 C 2011-02-03 1996-07-31 Putative zinc finger transcription factor; binds DNA in sequence-specific manner; overexpression causes a cell cycle delay or arrest -S000035843 CDS YPR015C 16 591026 590283 C 2011-02-03 1996-07-31 -S000006220 ORF Verified YPR016C TIF6 translation initiation factor 6|CDC95 chromosome 16 L000004376 16 593069 592332 C 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; has similarity to human translation initiation factor 6 (eIF6); may be involved in the biogenesis and or stability of 60S ribosomal subunits -S000035939 CDS YPR016C 16 593069 592332 C 2011-02-03 1996-07-31 -S000007630 ORF Dubious YPR016W-A chromosome 16 16 593096 593356 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037261 CDS YPR016W-A 16 593096 593356 W 2011-02-03 2001-02-26 -S000006221 ORF Verified YPR017C DSS4 guanine nucleotide exchange factor DSS4 chromosome 16 L000000529 16 593917 593486 C 2011-02-03 1996-07-31 Guanine nucleotide dissociation stimulator for Sec4p; functions in the post-Golgi secretory pathway; binds zinc, found both on membranes and in the cytosol -S000036108 CDS YPR017C 16 593917 593486 C 2011-02-03 1996-07-31 -S000006222 ORF Verified YPR018W RLF2 CAC1 chromosome 16 L000003990 16 594476 596296 W 2011-02-03 1996-07-31 Largest subunit (p90) of the Chromatin Assembly Complex (CAF-1); chromatin assembly by CAF-1 is important for multiple processes including silencing at telomeres, mating type loci, and rDNA; maintenance of kinetochore structure; deactivation of the DNA damage checkpoint after DNA repair; chromatin dynamics during transcription; and repression of divergent noncoding transcription -S000036938 CDS YPR018W 16 594476 596296 W 2011-02-03 1996-07-31 -S000006223 ORF Verified YPR019W MCM4 MCM DNA helicase complex subunit MCM4|CDC54|HCD21 chromosome 16 L000002761 16 596750 599551 W 2011-02-03 1996-07-31 Essential helicase component of heterohexameric MCM2-7 complexes; MCM2-7 complexes bind pre-replication complexes on DNA and melt DNA prior to replication; forms an Mcm4p-6p-7p subcomplex; shows nuclear accumulation in G1; homolog of S. pombe Cdc21p -S000036996 CDS YPR019W 16 596750 599551 W 2011-02-03 1996-07-31 -S000006224 ORF Verified YPR020W ATP20 F1F0 ATP synthase subunit g chromosome 16 L000004738 16 599870 600217 W 2011-02-03 1996-07-31 Subunit g of the mitochondrial F1F0 ATP synthase; reversibly phosphorylated on two residues; unphosphorylated form is required for dimerization of the ATP synthase complex, which in turn determines oligomerization of the complex and the shape of inner membrane cristae -S000037811 CDS YPR020W 16 599870 600217 W 2011-02-03 1996-07-31 -S000006225 ORF Verified YPR021C AGC1 amino acid transporter AGC1 chromosome 16 16 603357 600649 C 2011-02-03 1996-07-31 Mitochondrial amino acid transporter; acts both as a glutamate uniporter and as an aspartate-glutamate exchanger; involved in nitrogen metabolism and nitrogen compound biosynthesis; human homolog SLC25A13 complements yeast null mutant -S000037867 CDS YPR021C 16 603357 600649 C 2011-02-03 1996-07-31 -S000006226 ORF Verified YPR022C SDD4 chromosome 16 16 607312 603911 C 2011-02-03 1996-07-31 Putative transcription factor, as suggested by computational analysis; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus and is induced in response to the DNA-damaging agent MMS; overproduction of a truncation allele suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P -S000030796 CDS YPR022C 16 607312 603911 C 2011-02-03 1996-07-31 -S000006227 ORF Verified YPR023C EAF3 chromosome 16 16 610031 608826 C 2011-02-03 1996-07-31 Component of the Rpd3S histone deacetylase complex; Esa1p-associated factor, nonessential component of the NuA4 acetyltransferase complex, homologous to Drosophila dosage compensation protein MSL3; plays a role in regulating Ty1 transposition -S000030882 CDS YPR023C 16 610031 608826 C 2011-02-03 1996-07-31 -S000006228 ORF Verified YPR024W YME1 i-AAA protease YME1|YTA11|OSD1 chromosome 16 L000002522 16 610481 612724 W 2011-02-03 1996-07-31 Catalytic subunit of i-AAA protease complex; complex is located in mitochondrial inner membrane; responsible for degradation of unfolded or misfolded mitochondrial gene products; serves as nonconventional translocation motor to pull PNPase into intermembrane space; also has role in intermembrane space protein folding; mutation causes elevated rate of mitochondrial turnover; human homolog YME1L1 can complement yeast null mutant -S000030985 CDS YPR024W 16 610481 612724 W 2011-02-03 1996-07-31 -S000006229 ORF Verified YPR025C CCL1 TFIIH complex kinase subunit CCL1 chromosome 16 L000000237 16 614558 613377 C 2011-02-03 1996-07-31 Cyclin associated with protein kinase Kin28p; Kin28p is the TFIIH-associated carboxy-terminal domain (CTD) kinase involved in transcription initiation at RNA polymerase II promoters; human homolog CCNH allows growth of yeast ccl1 temperature-sensitive mutant at restrictive temperature -S000031028 CDS YPR025C 16 614558 613377 C 2011-02-03 1996-07-31 -S000006230 ORF Verified YPR026W ATH1 alpha,alpha-trehalase ATH1 chromosome 16 L000003059 16 615379 619014 W 2011-02-03 1996-07-31 Acid trehalase required for utilization of extracellular trehalose; involved in intracellular trehalose degradation during growth recovery after saline stress -S000032041 CDS YPR026W 16 615379 619014 W 2011-02-03 1996-07-31 -S000006231 ORF Uncharacterized YPR027C chromosome 16 16 621258 620425 C 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP and seamless-GFP fusion proteins localize to the endoplasmic reticulum, while the mCherry fusion protein localizes to the vacuole -S000032081 CDS YPR027C 16 621258 620425 C 2011-02-03 1996-07-31 -S000006571 tRNA_gene tF(GAA)P2 chromosome 16 L000003732 16 622631 622540 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035233 intron tF(GAA)P2 16 622594 622576 C 2011-02-03 2000-05-19 -S000035232 noncoding_exon tF(GAA)P2 16 622575 622540 C 2011-02-03 2000-05-19 -S000035231 noncoding_exon tF(GAA)P2 16 622631 622595 C 2011-02-03 2000-05-19 -S000006232 ORF Verified YPR028W YOP1 YIP2 chromosome 16 L000004674 16 623527 624202 W 2011-02-03 1996-07-31 Reticulon-interacting protein; ER integral membrane protein involved in the generation of tubular ER morphology; promotes membrane curvature; forms tubules in vitro; regulates the ER asymmetry-induced inheritance block during ER stress; role in ER-derived peroxisomal biogenesis; interacts with Yip1p to mediate membrane traffic and with Sey1p to maintain ER morphology; facilitates lipid exchange between the ER and mitochondria; forms ER foci upon DNA replication stress -S000032203 CDS YPR028W 16 623527 623577 W 2011-02-03 1996-07-31 -S000032204 CDS YPR028W 16 623711 624202 W 2011-02-03 1996-07-31 -S000032205 intron YPR028W 16 623578 623710 W 2011-02-03 1996-07-31 -S000006233 ORF Verified YPR029C APL4 chromosome 16 L000004054 16 626967 624469 C 2011-02-03 1996-07-31 Gamma-adaptin; large subunit of the clathrin-associated protein (AP-1) complex; binds clathrin; involved in vesicle mediated transport -S000032228 CDS YPR029C 16 626967 624469 C 2011-02-03 1996-07-31 -S000006234 ORF Verified YPR030W CSR2 ART8|MRG19 chromosome 16 S000007450 16 627880 631245 W 2011-02-03 1996-07-31 Nuclear ubiquitin protein ligase binding protein; may regulate utilization of nonfermentable carbon sources and endocytosis of plasma membrane proteins; overproduction suppresses chs5 spa2 lethality at high temp; ubiquitinated by Rsp5p, deubiquitinated by Ubp2p; CSR2 has a paralog, ECM21, that arose from the whole genome duplication -S000034095 CDS YPR030W 16 627880 631245 W 2011-02-03 1996-07-31 -S000006235 ORF Verified YPR031W NTO1 chromosome 16 16 631515 633761 W 2011-02-03 1996-07-31 Subunit of the NuA3 histone acetyltransferase complex; this complex acetylates histone H3; contains PHD finger domain that interacts with methylated histone H3 -S000034190 CDS YPR031W 16 631515 633761 W 2011-02-03 1996-07-31 -S000118419 ARS ARS1623 ARSXVI-634 chromosome 16 16 633874 634122 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178197 ARS_consensus_sequence ARS1623 16 633921 633937 W 2014-11-18 2014-11-18 -S000006236 ORF Verified YPR032W SRO7 Rab GTPase-binding protein SRO7|SOP1|SNI1 chromosome 16 L000003105|L000004193 16 634123 637224 W 2011-02-03 1996-07-31 Effector of Rab GTPase Sec4p; forms a complex with Sec4p and t-SNARE Sec9p; involved in exocytosis and docking and fusion of post-Golgi vesicles with plasma membrane; regulates cell proliferation and colony development via the Rho1-Tor1 pathway; homolog of Drosophila lgl tumor suppressor; SRO7 has a paralog, SRO77, that arose from the whole genome duplication -S000035166 CDS YPR032W 16 634123 637224 W 2011-02-03 1996-07-31 -S000006237 ORF Verified YPR033C HTS1 TS4572|histidine--tRNA ligase|TSM4572 chromosome 16 L000000832|S000029607|L000002364 16 639019 637379 C 26 2011-02-03 1996-07-31 Cytoplasmic and mitochondrial histidine tRNA synthetase; efficient mitochondrial localization requires both a presequence and an amino-terminal sequence; mutations in human ortholog HARS2 are associated with Perrault syndrome -S000035204 CDS YPR033C 16 639019 637379 C 2011-02-03 1996-07-31 -S000006238 ORF Verified YPR034W ARP7 RSC11|SWP61 chromosome 16 L000003436 16 639525 640958 W 2011-02-03 1996-07-31 Component of both the SWI/SNF and RSC chromatin remodeling complexes; actin-related protein involved in transcriptional regulation -S000035348 CDS YPR034W 16 639525 640958 W 2011-02-03 1996-07-31 -S000006239 ORF Verified YPR035W GLN1 glutamate--ammonia ligase chromosome 16 L000000709 16 642208 643320 W 29 2011-02-03 1996-07-31|2011-02-03 Glutamine synthetase (GS); synthesizes glutamine from glutamate and ammonia; with Glt1p, forms the secondary pathway for glutamate biosynthesis from ammonia; expression regulated by nitrogen source and by amino acid limitation; forms filaments of back-to-back stacks of cylindrical homo-decamers at low pH, leading to enzymatic inactivation and storage during states of advanced cellular starvation; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000035425 CDS YPR035W 16 642208 643320 W 2011-02-03 1996-07-31|2011-02-03 -S000006240 ORF Verified YPR036W VMA13 H(+)-transporting V1 sector ATPase subunit H|CLS11 chromosome 16 L000002465 16 643836 645272 W 2011-02-03 1996-07-31 Subunit H of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; serves as an activator or a structural stabilizer of the V-ATPase; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits -S000036312 CDS YPR036W 16 643836 645272 W 2011-02-03 1996-07-31 -S000028425 ORF Verified YPR036W-A SPO24 chromosome 16 16 645950 646153 W 2011-02-03 2002-07-25 Small (67 amino acids) protein involved in sporulation; localizes to the prospore membrane; phosphorylated during meiosis; a longer, 5'-extended mRNA is also transcribed beginning in mid-meiosis, regulated by two MSEs (middle sporulation elements), and includes an uORF of 15 codons in its 5'-UTR; evidence transcription is regulated by Pdr1p -S000029999 CDS YPR036W-A 16 645950 646153 W 2011-02-03 2002-07-25 -S000006242 ORF Dubious YPR038W IRC16 chromosome 16 16 646836 647195 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene YPR037C; null mutant displays increased levels of spontaneous Rad52p foci -S000036501 CDS YPR038W 16 646836 647195 W 2011-02-03 1996-07-31 -S000006243 ORF Dubious YPR039W chromosome 16 16 647012 647347 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified non essential genes ERV2/YPR037C and TIP41/YPR040W -S000036592 CDS YPR039W 16 647012 647347 W 2011-02-03 1996-07-31 -S000006241 ORF Verified YPR037C ERV2 flavin-linked sulfhydryl oxidase chromosome 16 16 647038 646448 C 2011-02-03 1996-07-31 Flavin-linked sulfhydryl oxidase localized to the ER lumen; involved in disulfide bond formation within the endoplasmic reticulum (ER) -S000036350 CDS YPR037C 16 647038 646448 C 2011-02-03 1996-07-31 -S000006244 ORF Verified YPR040W TIP41 chromosome 16 16 647305 648375 W 2011-02-03 1996-07-31 Protein that interacts with Tap42p, which regulates PP2A; component of the TOR (target of rapamycin) signaling pathway; protein abundance increases in response to DNA replication stress -S000037582 CDS YPR040W 16 647305 648375 W 2011-02-03 1996-07-31 -S000006245 ORF Verified YPR041W TIF5 translation initiation factor eIF5|SUI5 chromosome 16 L000002305 16 648704 649921 W 2011-02-03 1996-07-31 Translation initiation factor eIF5; functions both as a GTPase-activating protein to mediate hydrolysis of ribosome-bound GTP and as a GDP dissociation inhibitor to prevent recycling of eIF2 -S000037662 CDS YPR041W 16 648704 649921 W 2011-02-03 1996-07-31 -S000006246 ORF Verified YPR042C PUF2 chromosome 16 16 653662 650435 C 2011-02-03 1996-07-31 PUF family mRNA-binding protein; Pumilio homology domain confers RNA binding activity; preferentially binds mRNAs encoding membrane-associated proteins; binding site composed of two UAAU tetranucleotides, separated by a 3-nt linker; PUF2 has a paralog, JSN1, that arose from the whole genome duplication -S000037689 CDS YPR042C 16 653662 650435 C 2011-02-03 1996-07-31 -S000006247 ORF Verified YPR043W RPL43A eL43|ribosomal 60S subunit protein L43A|L43e|L43A chromosome 16 L000004469 16 654166 654847 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L43A; null mutation confers a dominant lethal phenotype; homologous to mammalian ribosomal protein L37A, no bacterial homolog; RPL43A has a paralog, RPL43B, that arose from the whole genome duplication -S000030558 CDS YPR043W 16 654166 654167 W 2011-02-03 1996-07-31 -S000030559 CDS YPR043W 16 654571 654847 W 2011-02-03 1996-07-31 -S000030560 intron YPR043W 16 654168 654570 W 2011-02-03 1996-07-31 -S000006248 ORF Dubious YPR044C OPI11 chromosome 16 16 654877 654524 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; largely overlaps verified gene RPL43A/YPR043W; deletion confers sensitivity to GSAO -S000030601 CDS YPR044C 16 654877 654524 C 2011-02-03 1996-07-31 -S000006249 ORF Verified YPR045C THP3 MNI2 chromosome 16 16 656552 655140 C 2011-02-03 1996-07-31 Protein that may have a role in transcription elongation; forms a complex with Csn12p that is recruited to transcribed genes; possibly involved in splicing based on pre-mRNA accumulation defect for many intron-containing genes -S000030682 CDS YPR045C 16 656552 655140 C 2011-02-03 1996-07-31 -S000006250 ORF Verified YPR046W MCM16 chromosome 16 L000003997 16 656799 657344 W 2011-02-03 1996-07-31 Component of the Ctf19 complex and the COMA subcomplex; involved in kinetochore-microtubule mediated chromosome segregation; binds to centromere DNA; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-H and fission yeast fta3 -S000031562 CDS YPR046W 16 656799 657344 W 2011-02-03 1996-07-31 -S000006251 ORF Verified YPR047W MSF1 phenylalanine--tRNA ligase chromosome 16 L000001187 16 657529 658938 W 2011-02-03 2003-09-22|1996-07-31 Mitochondrial phenylalanyl-tRNA synthetase; active as a monomer, unlike the cytoplasmic subunit which is active as a dimer complexed to a beta subunit dimer; similar to the alpha subunit of E. coli phenylalanyl-tRNA synthetase -S000031671 CDS YPR047W 16 657529 658938 W 2011-02-03 2003-09-22|1996-07-31 -S000006252 ORF Verified YPR048W TAH18 NAPDH-dependent diflavin reductase chromosome 16 L000004734 16 659182 661053 W 2011-02-03 1996-07-31 Conserved NAPDH-dependent diflavin reductase; component of an early step in the cytosolic Fe-S protein assembly (CIA) machinery; transfers electrons from NADPH to the Fe-S cluster of Dre2p; plays a pro-death role under oxidative stress; Tah18p-dependent nitric oxide synthesis confers high-temperature stress tolerance; possible target for development of antifungal drugs -S000031770 CDS YPR048W 16 659182 661053 W 2011-02-03 1996-07-31 -S000006253 ORF Verified YPR049C ATG11 autophagy protein ATG11|CVT3|CVT9 chromosome 16 L000004760|L000004756|S000029130 16 664673 661137 C 2011-02-03 1996-07-31 Adapter protein for pexophagy and the Cvt targeting pathway; directs receptor-bound cargo to the phagophore assembly site (PAS) for packaging into vesicles; required for recruiting other proteins to the PAS; recruits Dnm1p to facilitate fission of mitochondria that are destined for removal by mitophagy -S000031821 CDS YPR049C 16 664673 661137 C 2011-02-03 1996-07-31 -S000006255 ORF Verified YPR051W MAK3 peptide alpha-N-acetyltransferase MAK3|NAA30 chromosome 16 L000000977 16 664960 665490 W 34 2011-02-03 1996-07-31 Catalytic subunit of the NatC type N-terminal acetyltransferase (NAT); involved in subcellular targeting of select N-terminally acetylated substrates to the Golgi apparatus (Arl3p and Grh1p) and the inner nuclear membrane (Trm1p); required for replication of dsRNA virus; human NatC ortholog, Naa60, functionally complements the null, requiring either auxiliary subunit Mak10p or co-expression of human ortholog, Naa35; Naa60, the human NatF gene, also complements the null allele -S000034802 CDS YPR051W 16 664960 665490 W 2011-02-03 1996-07-31 -S000006254 ORF Dubious YPR050C chromosome 16 16 665366 664953 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF MAK3/YPR051W -S000033860 CDS YPR050C 16 665366 664953 C 2011-02-03 1996-07-31 -S000006256 ORF Verified YPR052C NHP6A high-mobility group nucleosome-binding protein chromosome 16 L000001244|L000001245 16 665974 665693 C 2011-02-03 1996-07-31 High-mobility group (HMG) protein; binds to and remodels nucleosomes; involved in recruiting FACT and other chromatin remodelling complexes to chromosomes; functionally redundant with Nhp6Bp; required for transcriptional initiation fidelity of some tRNA genes; homologous to mammalian HMGB1 and HMGB2; NHP6A has a paralog, NHP6B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000034851 CDS YPR052C 16 665974 665693 C 2011-02-03 1996-07-31 -S000006257 ORF Uncharacterized YPR053C chromosome 16 16 666243 665788 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YPR053C is not an essential gene; partially overlaps verified ORF NHP6A/YPR052C -S000034981 CDS YPR053C 16 666243 665788 C 2011-02-03 1996-07-31 -S000006258 ORF Verified YPR054W SMK1 mitogen-activated protein kinase SMK1 chromosome 16 L000001933 16 666280 667446 W 2011-02-03 1996-07-31 Middle sporulation-specific mitogen-activated protein kinase (MAPK); required for production of the outer spore wall layers; negatively regulates activity of the glucan synthase subunit Gsc2p -S000035191 CDS YPR054W 16 666280 667446 W 2011-02-03 1996-07-31 -S000006259 ORF Verified YPR055W SEC8 exocyst subunit SEC8 chromosome 16 L000001834 16 667676 670873 W 2011-02-03 1996-07-31 Essential 121 kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion; involved in ER and Golgi inheritance in small buds; relocalizes away from bud neck upon DNA replication stress -S000036048 CDS YPR055W 16 667676 670873 W 2011-02-03 1996-07-31 -S000006260 ORF Verified YPR056W TFB4 TFIIH/NER complex subunit TFB4 chromosome 16 L000004156 16 671126 672142 W 2011-02-03 1996-07-31 Subunit of TFIIH complex; involved in transcription initiation, similar to 34 kDa subunit of human TFIIH; interacts with Ssl1p -S000036167 CDS YPR056W 16 671126 672142 W 2011-02-03 1996-07-31 -S000006261 ORF Verified YPR057W BRR1 chromosome 16 L000004059 16 672471 673496 W 2011-02-03 1996-07-31 snRNP protein component of spliceosomal snRNPs; required for pre-mRNA splicing and snRNP biogenesis; in null mutant newly-synthesized snRNAs are destabilized and 3'-end processing is slowed -S000036258 CDS YPR057W 16 672471 673496 W 2011-02-03 1996-07-31 -S000006262 ORF Verified YPR058W YMC1 organic acid transporter chromosome 16 L000002520 16 673751 674674 W 39.7 2011-02-03 1996-07-31 Secondary mitochondrial inner membrane glycine transporter; required with HEM25 for the transport of glycine into mitochondria for the initiation of heme biosynthesis; proposed role in oleate metabolism and glutamate biosynthesis; member of the mitochondrial carrier (MCF) family; localizes to the vacuole in response to H2O2; YMC1 has a paralog, YMC2, that arose from the whole genome duplication -S000036364 CDS YPR058W 16 673751 674674 W 2011-02-03 1996-07-31 -S000006263 ORF Dubious YPR059C chromosome 16 16 674700 674314 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YMC1/YPR058W -S000036983 CDS YPR059C 16 674700 674314 C 2011-02-03 1996-07-31 -S000006264 ORF Verified YPR060C ARO7 chorismate mutase ARO7|TYR7|OSM2|HGS1 chromosome 16 L000000120 16 675631 674861 C 39.4 2011-02-03 1996-07-31 Chorismate mutase; catalyzes the conversion of chorismate to prephenate to initiate the tyrosine/phenylalanine-specific branch of aromatic amino acid biosynthesis -S000037791 CDS YPR060C 16 675631 674861 C 2011-02-03 1996-07-31 -S000006265 ORF Verified YPR061C JID1 chromosome 16 16 676882 675977 C 2011-02-03 1996-07-31 Probable Hsp40p co-chaperone; has a DnaJ-like domain and appears to be involved in ER-associated degradation of misfolded proteins containing a tightly folded cytoplasmic domain; inhibits replication of Brome mosaic virus in S. cerevisiae -S000037866 CDS YPR061C 16 676882 675977 C 2011-02-03 1996-07-31 -S000006266 ORF Verified YPR062W FCY1 cytosine deaminase|yCD chromosome 16 L000003485 16 677165 677641 W 2011-02-03 1996-07-31 Cytosine deaminase; zinc metalloenzyme that catalyzes the hydrolytic deamination of cytosine to uracil; of biomedical interest because it also catalyzes the deamination of 5-fluorocytosine (5FC) to form anticancer drug 5-fluorouracil (5FU) -S000029927 CDS YPR062W 16 677165 677641 W 2011-02-03 1996-07-31 -S000006267 ORF Uncharacterized YPR063C chromosome 16 16 678320 677812 C 2011-02-03 1996-07-31 ER-localized protein of unknown function -S000029984 CDS YPR063C 16 678193 677812 C 2011-02-03 1996-07-31 -S000029983 CDS YPR063C 16 678320 678280 C 2011-02-03 1996-07-31 -S000029985 intron YPR063C 16 678279 678194 C 2011-02-03 1996-07-31 -S000006268 ORF Uncharacterized YPR064W chromosome 16 16 678951 679370 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YPR064W is not an essential gene -S000031009 CDS YPR064W 16 678951 679370 W 2011-02-03 1996-07-31 -S000006269 ORF Verified YPR065W ROX1 REO1 chromosome 16 L000001661 16 679693 680799 W 2011-02-03 1996-07-31 Heme-dependent repressor of hypoxic genes; mediates aerobic transcriptional repression of hypoxia induced genes such as COX5b and CYC7; repressor function regulated through decreased promoter occupancy in response to oxidative stress; contains an HMG domain that is responsible for DNA bending activity; involved in the hyperosmotic stress resistance -S000031123 CDS YPR065W 16 679693 680799 W 2011-02-03 1996-07-31 -S000006270 ORF Verified YPR066W UBA3 NEDD8-activating protein UBA3 chromosome 16 L000004373 16 681213 682112 W 2011-02-03 1996-07-31 Protein that activates Rub1p (NEDD8) before neddylation; acts together with Ula1p; may play a role in protein degradation; GFP-fusion protein localizes to the cytoplasm in a punctate pattern -S000031188 CDS YPR066W 16 681213 682112 W 2011-02-03 1996-07-31 -S000006271 ORF Verified YPR067W ISA2 chromosome 16 L000004955 16 682220 682777 W 2011-02-03 1996-07-31 Protein required for maturation of mitochondrial [4Fe-4S] proteins; functions in a complex with Isa1p and possibly Iba57p; localizes to the mitochondrial intermembrane space, overexpression of ISA2 suppresses grx5 mutations -S000032172 CDS YPR067W 16 682220 682777 W 2011-02-03 1996-07-31 -S000006272 ORF Verified YPR068C HOS1 histone deacetylase|CST3 chromosome 16 L000004091|S000029124|L000002993 16 684353 682941 C 2011-02-03 1996-07-31 Class I histone deacetylase (HDAC) family member; deacetylates Smc3p on lysine residues at anaphase onset; has sequence similarity to Hda1p, Rpd3p, Hos2p, and Hos3p; interacts with the Tup1p-Ssn6p corepressor complex -S000032210 CDS YPR068C 16 684353 682941 C 2011-02-03 1996-07-31 -S000118420 ARS ARS1624 ARSXVI-684 chromosome 16 16 684389 684637 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178198 ARS_consensus_sequence ARS1624 16 684405 684421 W 2014-11-18 2014-11-18 -S000006273 ORF Verified YPR069C SPE3 spermidine synthase chromosome 16 L000003328 16 685437 684556 C 2011-02-03 1996-07-31 Spermidine synthase; involved in biosynthesis of spermidine and also in biosynthesis of pantothenic acid; spermidine is required for growth of wild-type cells -S000032285 CDS YPR069C 16 685437 684556 C 2011-02-03 1996-07-31 -S000006274 ORF Verified YPR070W MED1 chromosome 16 16 685898 687598 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation -S000032028 CDS YPR070W 16 685898 687598 W 2011-02-03 1996-07-31 -S000006275 ORF Uncharacterized YPR071W chromosome 16 16 688172 688807 W 2011-02-03 1996-07-31 Putative membrane protein; YPR071W is not an essential gene; YPR071W has a paralog, YIL029C, that arose from a single-locus duplication -S000032138 CDS YPR071W 16 688172 688807 W 2011-02-03 1996-07-31 -S000006736 tRNA_gene tS(UGA)P SUP16 SUQ5 chromosome 16 L000003723|S000029556|L000002242|L000002190 16 689565 689646 W 48 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000034846 noncoding_exon tS(UGA)P 16 689565 689646 W 2011-02-03 2000-05-19 -S000006276 ORF Verified YPR072W NOT5 CCR4-NOT core subunit NOT5 chromosome 16 L000004651 16 690107 691789 W 2011-02-03 1996-07-31 Component of the CCR4-NOT core complex, involved in mRNA decapping; involved intranscription initiation and elongation and in mRNA degradation; conserved lysine in human homolog of Not5p and Not3p is mutated in cancers -S000034137 CDS YPR072W 16 690107 691789 W 2011-02-03 1996-07-31 -S000006277 ORF Verified YPR073C LTP1 tyrosine protein phosphatase LTP1 chromosome 16 L000000957 16 692418 691933 C 2011-02-03 1996-07-31 Protein phosphotyrosine phosphatase of unknown cellular role; activated by adenine -S000034196 CDS YPR073C 16 692418 691933 C 2011-02-03 1996-07-31 -S000006278 ORF Verified YPR074C TKL1 transketolase TKL1 chromosome 16 L000002313 16 694838 692796 C 2011-02-03 1996-07-31 Transketolase; catalyzes conversion of xylulose-5-phosphate and ribose-5-phosphate to sedoheptulose-7-phosphate and glyceraldehyde-3-phosphate in the pentose phosphate pathway; needed for synthesis of aromatic amino acids; TKL1 has a paralog, TKL2, that arose from the whole genome duplication -S000034281 CDS YPR074C 16 694838 692796 C 2011-02-03 1996-07-31 -S000007631 ORF Dubious YPR074W-A chromosome 16 16 695018 695188 W 2011-02-03 2001-02-26 Hypothetical protein identified by homology -S000037262 CDS YPR074W-A 16 695018 695188 W 2011-02-03 2001-02-26 -S000118421 ARS ARS1625 ARSXVI-696 chromosome 16 16 695461 695574 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178199 ARS_consensus_sequence ARS1625 16 695465 695481 W 2014-11-18 2014-11-18 -S000006280 ORF Dubious YPR076W chromosome 16 16 696476 696850 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035349 CDS YPR076W 16 696476 696850 W 2011-02-03 1996-07-31 -S000006279 ORF Verified YPR075C OPY2 chromosome 16 L000004017 16 696819 695737 C 2011-02-03 1996-07-31 Integral membrane protein that acts as a membrane anchor for Ste50p; involved in the signaling branch of the high-osmolarity glycerol (HOG) pathway and as a regulator of the filamentous growth pathway; overproduction blocks cell cycle arrest in the presence of mating pheromone; relocalizes from vacuole to plasma membrane upon DNA replication stress -S000034338 CDS YPR075C 16 696819 695737 C 2011-02-03 1996-07-31 -S000006281 ORF Dubious YPR077C chromosome 16 16 697502 697131 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; expression increased by deletion of NAP1 -S000035364 CDS YPR077C 16 697502 697131 C 2011-02-03 1996-07-31 -S000006282 ORF Uncharacterized YPR078C chromosome 16 16 698265 697147 C 2011-02-03 1996-07-31 Putative protein of unknown function; possible role in DNA metabolism and/or in genome stability; expression is heat-inducible -S000035444 CDS YPR078C 16 698265 697147 C 2011-02-03 1996-07-31 -S000006283 ORF Verified YPR079W MRL1 chromosome 16 16 698869 700014 W 2011-02-03 1996-07-31 Membrane protein; has similarity to mammalian mannose-6-phosphate receptors; possibly functions as a sorting receptor in the delivery of vacuolar hydrolases; protein abundance increases in response to DNA replication stress -S000035534 CDS YPR079W 16 698869 700014 W 2011-02-03 1996-07-31 -S000006284 ORF Verified YPR080W TEF1 translation elongation factor EF-1 alpha|eEF1A|EF-1 alpha chromosome 16 L000002277 16 700594 701970 W 46 2011-02-03 1996-07-31 Translational elongation factor EF-1 alpha; in the GTP-bound active form, binds to and delivers aminoacylated tRNA to the A-site of ribosomes for elongation of nascent polypeptides; associates with vacuolar Rho1p GTPase; may also have a role in tRNA re-export from the nucleus; TEF1 has a paralog, TEF2, that arose from the whole genome duplication -S000035186 CDS YPR080W 16 700594 701970 W 2011-02-03 1996-07-31 -S000006285 ORF Verified YPR081C GRS2 putative glycine--tRNA ligase chromosome 16 16 703970 702114 C 2011-02-03 1996-07-31 Glycine-tRNA synthetase, not expressed under normal growth conditions; expression is induced under heat, oxidative, pH, or ethanol stress conditions; more stable than the major glycine-tRNA synthetase Grs1p at 37 deg C; GRS2 has a paralog, GRS1, that arose from the whole genome duplication -S000035269 CDS YPR081C 16 703970 702114 C 2011-02-03 1996-07-31 -S000006286 ORF Verified YPR082C DIB1 U4/U6-U5 snRNP complex subunit DIB1|SNU16 chromosome 16 L000004542 16 704656 704225 C 2011-02-03 1996-07-31 17-kDa component of the U4/U6aU5 tri-snRNP; plays an essential role in pre-mRNA splicing; human ortholog TXNL4A (the human U5-specific 15-kDa protein) complements yeast dib1 null mutant -S000036157 CDS YPR082C 16 704656 704225 C 2011-02-03 1996-07-31 -S000006287 ORF Verified YPR083W MDM36 chromosome 16 16 704854 706593 W 2011-02-03 1996-07-31 Mitochondrial protein; required for normal mitochondrial morphology and inheritance; component of the mitochondria-ER-cortex-ancor (MECA); interacts with Num1p to link the ER and mitochondria at the cell cortex; proposed involvement in the formation of Dnm1p and Num1p-containing cortical anchor complexes that promote mitochondrial fission -S000036324 CDS YPR083W 16 704854 706593 W 2011-02-03 1996-07-31 -S000006288 ORF Uncharacterized YPR084W chromosome 16 16 706972 708342 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000036408 CDS YPR084W 16 706972 708342 W 2011-02-03 1996-07-31 -S000006289 ORF Verified YPR085C ASA1 chromosome 16 16 709828 708497 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; telomere length regulator involved in the stability or biogenesis of PIKKs such as TORC1 -S000030072 CDS YPR085C 16 709828 708497 C 2011-02-03 2003-09-22|1996-07-31 -S000006290 ORF Verified YPR086W SUA7 transcription factor TFIIB|TFIIB|SOH4 chromosome 16 L000002141 16 710101 711138 W 2011-02-03 1996-07-31 Transcription factor TFIIB; a general transcription factor required for transcription initiation and start site selection by RNA polymerase II -S000030297 CDS YPR086W 16 710101 711138 W 2011-02-03 1996-07-31 -S000006291 ORF Dubious YPR087W VPS69 chromosome 16 16 711354 711674 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 85% of ORF overlaps the verified gene SRP54; deletion causes a vacuolar protein sorting defect -S000030448 CDS YPR087W 16 711354 711674 W 2011-02-03 1996-07-31 -S000006292 ORF Verified YPR088C SRP54 RNA-binding signal recognition particle subunit SRP54|SRH1 chromosome 16 L000002064 16 713028 711403 C 2011-02-03 1996-07-31 Signal recognition particle (SRP) subunit (homolog of mammalian SRP54); contains the signal sequence-binding activity of SRP, interacts with the SRP RNA, and mediates binding of SRP to signal receptor; contains GTPase domain -S000030479 CDS YPR088C 16 713028 711403 C 2011-02-03 1996-07-31 -S000006293 ORF Uncharacterized YPR089W YPR090W chromosome 16 16 713275 715941 W 2011-02-03 2003-09-29|1996-07-31 Protein of unknown function; exhibits genetic interaction with ERG11 and protein-protein interaction with Hsp82p -S000031385 CDS YPR089W 16 713275 715941 W 2011-02-03 2003-09-29|1996-07-31 -S000006296 ORF Dubious YPR092W chromosome 16 16 718379 718684 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032289 CDS YPR092W 16 718379 718684 W 2011-02-03 1996-07-31 -S000006295 ORF Verified YPR091C NVJ2 chromosome 16 16 718468 716156 C 2011-02-03 1996-07-31 Lipid-binding ER protein, enriched at nucleus-vacuolar junctions (NVJ); may be involved in sterol metabolism or signaling at the NVJ; contains a synaptotagmin-like-mitochondrial-lipid binding protein (SMP) domain; binds phosphatidylinositols and other lipids in a large-scale study; may interact with ribosomes, based on co-purification experiments -S000031211 CDS YPR091C 16 718468 716156 C 2011-02-03 1996-07-31 -S000006442 snoRNA_gene snR51 SNR51 chromosome 16 L000004520 16 718806 718700 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2729 and small subunit (SSU) rRNA at position A100 -S000030732 noncoding_exon snR51 16 718806 718700 C 2011-02-03 2000-05-19 -S000006461 snoRNA_gene snR70 SNR70 chromosome 16 L000004539 16 719050 718887 C 2011-02-03 2000-05-19|2007-05-09 C/D box small nucleolar RNA (snoRNA); predicted to guide 2'-O-methylation of small subunit (SSU) rRNA at position C1639 -S000031744 noncoding_exon snR70 16 719050 718887 C 2011-02-03 2000-05-19|2007-05-09 -S000007305 snoRNA_gene snR41 SNR41 chromosome 16 L000003056 16 719242 719148 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at positions A541 and G1126 -S000030612 noncoding_exon snR41 16 719242 719148 C 2011-02-03 2000-05-19 -S000006297 ORF Verified YPR093C ASR1 ubiquitin-protein ligase ASR1 chromosome 16 16 720424 719558 C 2011-02-03 2003-09-22|1996-07-31 Ubiquitin ligase that modifies and regulates RNA Pol II; involved in a putative alcohol-responsive signaling pathway; accumulates in the nucleus under alcohol stress; has a role in organization of septins and the actin cytoskeleton; contains a Ring/PHD finger domain similar to the mammalian rA9 protein -S000032333 CDS YPR093C 16 720424 719558 C 2011-02-03 2003-09-22|1996-07-31 -S000006298 ORF Verified YPR094W RDS3 U2 snRNP complex subunit RDS3 chromosome 16 16 720637 720960 W 2011-02-03 1996-07-31 Component of the SF3b subcomplex of the U2 snRNP; zinc cluster protein involved in pre-mRNA splicing and cycloheximide resistance -S000032497 CDS YPR094W 16 720637 720960 W 2011-02-03 1996-07-31 -S000006299 ORF Verified YPR095C SYT1 Arf family guanine nucleotide exchange factor SYT1 chromosome 16 L000004575 16 724717 721037 C 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Arf proteins; promotes activation of Arl1p, which recruits Imh1p to the Golgi; involved in vesicular transport; member of the Sec7-domain family; contains a PH domain -S000034455 CDS YPR095C 16 724717 721037 C 2011-02-03 1996-07-31 -S000006300 ORF Verified YPR096C chromosome 16 16 725144 724842 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments -S000034576 CDS YPR096C 16 725144 724842 C 2011-02-03 1996-07-31 -S000006301 ORF Verified YPR097W chromosome 16 16 725394 728615 W 2011-02-03 1996-07-31|2011-02-03 Protein that contains a PX domain and binds phosphoinositides; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; PX stands for Phox homology -S000034675 CDS YPR097W 16 725394 728615 W 2011-02-03 1996-07-31|2011-02-03 -S000006302 ORF Verified YPR098C chromosome 16 16 729528 728947 C 2011-02-03 2003-09-27|1996-07-31 Protein of unknown function; localized to the mitochondrial outer membrane -S000034698 CDS YPR098C 16 729385 728947 C 2011-02-03 2003-09-27 -S000034697 CDS YPR098C 16 729528 729482 C 2011-02-03 2003-09-27|1996-07-31 -S000034699 intron YPR098C 16 729481 729386 C 2011-02-03 2003-09-27 -S000006304 ORF Verified YPR100W MRPL51 mitochondrial 54S ribosomal protein MRPL51 chromosome 16 16 729791 730213 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000033115 CDS YPR100W 16 729791 730213 W 2011-02-03 1996-07-31 -S000006303 ORF Dubious YPR099C chromosome 16 16 730113 729757 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene MRPL51/YPR100W -S000035639 CDS YPR099C 16 730113 729757 C 2011-02-03 1996-07-31 -S000006305 ORF Verified YPR101W SNT309 NTC25 chromosome 16 L000004269 16 730492 731019 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; interacts physically and genetically with Prp19p -S000033189 CDS YPR101W 16 730492 731019 W 2011-02-03 1996-07-31 -S000006306 ORF Verified YPR102C RPL11A uL5|ribosomal 60S subunit protein L11A|rp39A|YL22|L5|L16B|L11A chromosome 16 L000004453 16 731748 731224 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L11A; expressed at twice the level of Rpl11Bp; involved in ribosomal assembly; depletion causes degradation of 60S proteins and RNA; homologous to mammalian ribosomal protein L11 and bacterial L5; RPL11A has a paralog, RPL11B, that arose from the whole genome duplication -S000033914 CDS YPR102C 16 731748 731224 C 2011-02-03 1996-07-31 -S000006307 ORF Verified YPR103W PRE2 proteasome core particle subunit beta 5|SRR2|PRG1|DOA3 chromosome 16 L000001484 16 732349 733212 W 2011-02-03 1996-07-31 Beta 5 subunit of the 20S proteasome; responsible for the chymotryptic activity of the proteasome -S000034099 CDS YPR103W 16 732349 733212 W 2011-02-03 1996-07-31 -S000006308 ORF Verified YPR104C FHL1 SPP42 chromosome 16 L000000612 16 736433 733623 C 2011-02-03 1996-07-31 Regulator of ribosomal protein (RP) transcription; has forkhead associated domain that binds phosphorylated proteins; recruits coactivator Ifh1p or corepressor Crf1p to RP gene promoters; also has forkhead DNA-binding domain though in vitro DNA binding assays give inconsistent results; computational analyses suggest it binds DNA directly at highly active RP genes and indirectly through Rap1p motifs at others; suppresses RNA pol III and splicing factor prp4 mutants -S000034142 CDS YPR104C 16 736433 733623 C 2011-02-03 1996-07-31 -S000006309 ORF Verified YPR105C COG4 Golgi transport complex subunit COG4|SGF1|SEC38|COD1 chromosome 16 S000007660 16 739569 736984 C 2011-02-03 1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000035097 CDS YPR105C 16 739569 736984 C 2011-02-03 1996-07-31 -S000006310 ORF Verified YPR106W ISR1 putative protein kinase ISR1 chromosome 16 L000004210 16 740061 741392 W 2011-02-03 1996-07-31 Predicted protein kinase; overexpression causes sensitivity to staurosporine, which is a potent inhibitor of protein kinase C -S000035292 CDS YPR106W 16 740061 741392 W 2011-02-03 1996-07-31 -S000006311 ORF Verified YPR107C YTH1 cleavage polyadenylation factor RNA-binding subunit YTH1 chromosome 16 L000003546 16 742064 741438 C 2011-02-03 1996-07-31 Essential RNA-binding component of cleavage and polyadenylation factor; contains five zinc fingers; required for pre-mRNA 3'-end processing and polyadenylation; relocalizes to the cytosol in response to hypoxia -S000035304 CDS YPR107C 16 742064 741438 C 2011-02-03 1996-07-31 -S000006312 ORF Verified YPR108W RPN7 proteasome regulatory particle lid subunit RPN7 chromosome 16 L000004307 16 742454 743743 W 2011-02-03 1996-07-31 Essential non-ATPase regulatory subunit of the 26S proteasome; similar to another S. cerevisiae regulatory subunit, Rpn5p, as well as to mammalian proteasome subunits -S000035430 CDS YPR108W 16 742454 743743 W 2011-02-03 1996-07-31 -S000028590 ORF Uncharacterized YPR108W-A chromosome 16 16 744175 744387 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031362 CDS YPR108W-A 16 744175 744387 W 2011-02-03 2003-07-29 -S000006752 tRNA_gene tT(UGU)P chromosome 16 L000003724 16 744284 744355 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000036277 noncoding_exon tT(UGU)P 16 744284 744355 W 2011-02-03 2000-05-19 -S000006313 ORF Uncharacterized YPR109W chromosome 16 16 744689 745573 W 2011-02-03 1996-07-31 Predicted membrane protein; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; diploid deletion strain has high budding index -S000036314 CDS YPR109W 16 744689 745573 W 2011-02-03 1996-07-31 -S000006314 ORF Verified YPR110C RPC40 DNA-directed RNA polymerase core subunit RPC40|RPC5 chromosome 16 L000001690|L000002890 16 746835 745828 C 72 2011-02-03 1996-07-31 RNA polymerase subunit AC40; common to RNA polymerase I and III; predominant determinant targeting Ty1 integration upstream of Pol III-transcribed genes -S000031868 CDS YPR110C 16 746835 745828 C 2011-02-03 1996-07-31 -S000006315 ORF Verified YPR111W DBF20 serine/threonine-protein kinase DBF20 chromosome 16 L000000490 16 747306 749000 W 66 2011-02-03 1999-07-17|1996-07-31 Ser/Thr kinase involved in late nuclear division; one of the mitotic exit network (MEN) proteins; necessary for the execution of cytokinesis; also plays a role in regulating the stability of SWI5 and CLB2 mRNAs; DBF20 has a paralog, DBF2, that arose from the whole genome duplication -S000032040 CDS YPR111W 16 747306 749000 W 2011-02-03 1999-07-17|1996-07-31 -S000118422 ARS ARS1626 ARSXVI-749 chromosome 16 16 749099 749345 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178200 ARS_consensus_sequence ARS1626 16 749117 749133 W 2014-11-18 2014-11-18 -S000006316 ORF Verified YPR112C MRD1 RNA-binding ribosome biosynthesis protein MRD1 chromosome 16 S000007482 16 751919 749256 C 2011-02-03 1996-07-31 Essential conserved small ribosomal subunit (40s) synthesis factor; component of the 90S preribosome; required for production of 18S rRNA and small ribosomal subunit; contains five consensus RNA-binding domains and binds to the pre-rRNA at two sites within the 18S region -S000037455 CDS YPR112C 16 751919 749256 C 2011-02-03 1996-07-31 -S000006317 ORF Verified YPR113W PIS1 CDP-diacylglycerol--inositol 3-phosphatidyltransferase chromosome 16 L000001444 16 752257 752919 W 2011-02-03 1996-07-31 Phosphatidylinositol synthase; required for biosynthesis of phosphatidylinositol, which is a precursor for polyphosphoinositides, sphingolipids, and glycolipid anchors for some of the plasma membrane proteins -S000037583 CDS YPR113W 16 752257 752919 W 2011-02-03 1996-07-31 -S000006318 ORF Uncharacterized YPR114W chromosome 16 16 753301 754248 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000037664 CDS YPR114W 16 753301 754248 W 2011-02-03 1996-07-31 -S000006319 ORF Verified YPR115W RGC1 GCA1 chromosome 16 16 754877 758128 W 2011-02-03 1996-07-31 Putative regulator of the Fps1p glycerol channel; multiply phosphorylated by Hog1p under osmotic stress; contains a pleckstrin homology domain; forms homodimers and heterodimerizes with paralog Ask10p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000030470 CDS YPR115W 16 754877 758128 W 2011-02-03 1996-07-31 -S000006320 ORF Verified YPR116W RRG8 chromosome 16 16 758648 759481 W 2011-02-03 1996-07-31 Protein of unknown function; required for mitochondrial genome maintenance; null mutation results in a decrease in plasma membrane electron transport -S000030562 CDS YPR116W 16 758648 759481 W 2011-02-03 1996-07-31 -S000006321 ORF Uncharacterized YPR117W BSH1 chromosome 16 16 760025 767494 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000030644 CDS YPR117W 16 760025 767494 W 2011-02-03 1996-07-31 -S000006322 ORF Verified YPR118W MRI1 S-methyl-5-thioribose-1-phosphate isomerase MRI1 chromosome 16 16 767752 768987 W 2011-02-03 1996-07-31 5'-methylthioribose-1-phosphate isomerase; catalyzes the isomerization of 5-methylthioribose-1-phosphate to 5-methylthioribulose-1-phosphate in the methionine salvage pathway -S000030727 CDS YPR118W 16 767752 768987 W 2011-02-03 1996-07-31 -S000006635 tRNA_gene tK(UUU)P chromosome 16 L000003731 16 769302 769207 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034222 intron tK(UUU)P 16 769265 769243 C 2011-02-03 2000-05-19 -S000034221 noncoding_exon tK(UUU)P 16 769242 769207 C 2011-02-03 2000-05-19 -S000034220 noncoding_exon tK(UUU)P 16 769302 769266 C 2011-02-03 2000-05-19 -S000007216 long_terminal_repeat YPRWsigma2 chromosome 16 16 769319 769659 W 2011-02-03 2000-05-19 Ty3 LTR -S000006323 ORF Verified YPR119W CLB2 B-type cyclin CLB2 chromosome 16 L000000350 16 771653 773128 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the transition from G2 to M phase; accumulates during G2 and M, then targeted via a destruction box motif for ubiquitin-mediated degradation by the proteasome; CLB2 has a paralog, CLB1, that arose from the whole genome duplication -S000031564 CDS YPR119W 16 771653 773128 W 2011-02-03 1996-07-31 -S000006324 ORF Verified YPR120C CLB5 B-type cyclin CLB5 chromosome 16 L000000353 16 775182 773875 C 2011-02-03 1996-07-31 B-type cyclin involved in DNA replication during S phase; activates Cdc28p to promote initiation of DNA synthesis; functions in formation of mitotic spindles along with Clb3p and Clb4p; most abundant during late G1 phase; CLB5 has a paralog, CLB6, that arose from the whole genome duplication -S000030306 CDS YPR120C 16 775182 773875 C 2011-02-03 1996-07-31 -S000006529 tRNA_gene tC(GCA)P2 chromosome 16 L000003730 16 775836 775765 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis -S000037837 noncoding_exon tC(GCA)P2 16 775836 775765 C 2011-02-03 2000-05-19 -S000007211 long_terminal_repeat YPRWdelta14 chromosome 16 16 776093 776413 W 2011-02-03 2000-05-19 Ty1 LTR -S000007201 long_terminal_repeat YPRCdelta15 chromosome 16 16 776796 776667 C 2011-02-03 2000-05-19 Ty1 LTR -S000119041 ARS ARS1635 ARSXVI-777|ARS1626.5 chromosome 16 16 776926 777156 2011-02-03 2006-10-04 Autonomously Replicating Sequence -S000119042 ARS_consensus_sequence ARS1635 16 777098 777084 C 2011-02-03 2006-10-04 -S000007212 long_terminal_repeat YPRWdelta16 chromosome 16 16 777832 778154 W 2011-02-03 2000-05-19 Ty1 LTR -S000006325 ORF Verified YPR121W THI22 putative phosphomethylpyrimidine kinase chromosome 16 16 778583 780301 W 2011-02-03 1996-07-31|2011-02-03 Protein with similarity to hydroxymethylpyrimidine phosphate kinases; member of a gene family with THI20 and THI21; not required for thiamine biosynthesis; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000033668 CDS YPR121W 16 778583 780301 W 2011-02-03 1996-07-31|2011-02-03 -S000006326 ORF Verified YPR122W AXL1 STE22|FUS5 chromosome 16 L000002601 16 782045 785671 W 2011-02-03 1996-07-31 Haploid specific endoprotease of a-factor mating pheromone; performs one of two N-terminal cleavages during maturation of a-factor mating pheromone; required for axial budding pattern of haploid cells -S000033830 CDS YPR122W 16 782045 785671 W 2011-02-03 1996-07-31 -S000006328 ORF Verified YPR124W CTR1 high-affinity Cu transporter CTR1 chromosome 16 L000003063 16 786208 787428 W 2011-02-03 1996-07-31 High-affinity copper transporter of plasma membrane; mediates nearly all copper uptake under low copper conditions; transcriptionally induced at low copper levels and degraded at high copper levels; protein increases in abundance and relocalizes from nucleus to plasma membrane upon DNA replication stress; human homolog SLC31A1 can complement a yeast ctr1 ctr3 double deletion -S000034806 CDS YPR124W 16 786208 787428 W 2011-02-03 1996-07-31 -S000006327 ORF Dubious YPR123C chromosome 16 16 786575 786141 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially/completely overlaps the verified ORF CTR -S000033865 CDS YPR123C 16 786575 786141 C 2011-02-03 1996-07-31 -S000006329 ORF Verified YPR125W YLH47 MRS7 chromosome 16 16 787961 789325 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; exposed to the mitochondrial matrix; associates with mitochondrial ribosomes; NOT required for respiratory growth; homolog of human Letm1, a protein implicated in Wolf-Hirschhorn syndrome -S000034935 CDS YPR125W 16 787961 789325 W 2011-02-03 1996-07-31 -S000006330 ORF Dubious YPR126C chromosome 16 16 789385 789077 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034988 CDS YPR126C 16 789385 789077 C 2011-02-03 1996-07-31 -S000006331 ORF Verified YPR127W pyridoxine 4-dehydrogenase chromosome 16 16 790083 791120 W 2011-02-03 1996-07-31 Putative pyridoxine 4-dehydrogenase; differentially expressed during alcoholic fermentation; expression activated by transcription factor YRM1/YOR172W; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000035194 CDS YPR127W 16 790083 791120 W 2011-02-03 1996-07-31 -S000006332 ORF Verified YPR128C ANT1 chromosome 16 16 792204 791218 C 2011-02-03 1996-07-31 Peroxisomal adenine nucleotide transporter; involved in beta-oxidation of medium-chain fatty acid; required for peroxisome proliferation -S000036009 CDS YPR128C 16 792204 791218 C 2011-02-03 1996-07-31 -S000006333 ORF Verified YPR129W SCD6 LSM13 chromosome 16 L000001806 16 792687 793736 W 2011-02-03 1996-07-31 Repressor of translation initiation; binds eIF4G through its RGG domain and inhibits recruitment of the preinitiation complex; also contains an Lsm domain; may have a role in RNA processing; overproduction suppresses null mutation in clathrin heavy chain gene CHC1; forms cytoplasmic foci upon DNA replication stress -S000036168 CDS YPR129W 16 792687 793736 W 2011-02-03 1996-07-31 -S000006334 ORF Dubious YPR130C chromosome 16 16 793781 793374 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035652 CDS YPR130C 16 793781 793374 C 2011-02-03 1996-07-31 -S000006335 ORF Verified YPR131C NAT3 peptide alpha-N-acetyltransferase complex B subunit NAT3|RAD56|NAA20 chromosome 16 S000007464|S000029405|L000001576 16 794498 793911 C 84.8 2011-02-03 2003-05-23|1996-07-31 Catalytic subunit of the NatB N-terminal acetyltransferase; NatB catalyzes acetylation of the amino-terminal methionine residues of all proteins beginning with Met-Asp or Met-Glu and of some proteins beginning with Met-Asn or Met-Met -S000035762 CDS YPR131C 16 794498 793911 C 2011-02-03 2003-05-23|1996-07-31 -S000006336 ORF Verified YPR132W RPS23B uS12|ribosomal 40S subunit protein S23B|rp37|YS14|S28B|S23B|S12 chromosome 16 L000001765 16 794965 795767 W 2011-02-03 1996-07-31 Ribosomal protein 28 (rp28) of the small (40S) ribosomal subunit; required for translational accuracy; homologous to mammalian ribosomal protein S23 and bacterial S12; RPS23B has a paralog, RPS23A, that arose from the whole genome duplication; deletion of both RPS23A and RPS23B is lethal -S000035959 CDS YPR132W 16 794965 795029 W 2011-02-03 1996-07-31 -S000035960 CDS YPR132W 16 795395 795767 W 2011-02-03 1996-07-31 -S000035961 intron YPR132W 16 795030 795394 W 2011-02-03 1996-07-31 -S000006337 ORF Verified YPR133C SPN1 IWS1 chromosome 16 16 797210 795978 C 2011-02-03 1996-07-31 Protein involved in RNA polymerase II transcription; is constitutively recruited to the CYC1 promoter and is required for recruitment of chromatin remodeling factors for the expression of CYC1 gene; interacts genetically or physically with RNAP II, TBP, TFIIS, and chromatin remodelling factors; central domain highly conserved throughout eukaryotes; mutations confer an Spt- phenotype -S000037797 CDS YPR133C 16 797210 795978 C 2011-02-03 1996-07-31 -S000006433 ORF Verified YPR133W-A TOM5 MOM8A chromosome 16 L000003249 16 797557 797709 W 2011-02-03 1999-07-17 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import of all mitochondrially directed proteins; involved in transfer of precursors from the Tom70p and Tom20p receptors to the Tom40p pore -S000036542 CDS YPR133W-A 16 797557 797709 W 2011-02-03 1999-07-17 -S000006338 ORF Verified YPR134W MSS18 chromosome 16 L000001204 16 798051 798857 W 2011-02-03 1996-07-31 Nuclear encoded protein needed for splicing of mitochondrial intron; required for efficient splicing of mitochondrial COX1 aI5beta intron; mss18 mutations block cleavage of 5' exon - intron junction; phenotype of intronless strain suggests additional functions -S000029836 CDS YPR134W 16 798051 798857 W 2011-02-03 1996-07-31 -S000006339 ORF Verified YPR135W CTF4 chromatin-binding protein CTF4|POB1|CHL15 chromosome 16 L000000326 16 799234 802017 W 103 2011-02-03 1996-07-31 Chromatin-associated protein; required for sister chromatid cohesion; interacts with DNA polymerase alpha (Pol1p) and may link DNA synthesis to sister chromatid cohesion -S000029940 CDS YPR135W 16 799234 802017 W 2011-02-03 1996-07-31 -S000006341 ORF Verified YPR137W RRP9 chromosome 16 S000007466 16 802359 804080 W 2011-02-03 1996-07-31 Protein involved in pre-rRNA processing; associated with U3 snRNP; component of small ribosomal subunit (SSU) processosome; ortholog of the human U3-55k protein -S000031011 CDS YPR137W 16 802359 804080 W 2011-02-03 1996-07-31 -S000006340 ORF Dubious YPR136C chromosome 16 16 802837 802325 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF RRP9 -S000029987 CDS YPR136C 16 802837 802325 C 2011-02-03 1996-07-31 -S000007213 long_terminal_repeat YPRWdelta17 chromosome 16 16 804511 804638 W 2011-02-03 2000-05-19 Ty1 LTR -S000007202 long_terminal_repeat YPRCdelta18 chromosome 16 16 804978 804645 C 2011-02-03 2000-05-19 Ty1 LTR -S000007360 transposable_element_gene YPR137C-B gag-pol fusion protein chromosome 16 S000029020 16 810269 805001 C 2011-02-03 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034188 CDS YPR137C-B 16 808963 805001 C 2011-02-03 1997-07-17 -S000034187 CDS YPR137C-B 16 810269 808965 C 2011-02-03 1997-07-17 -S000034189 plus_1_translational_frameshift YPR137C-B 16 808964 808964 C 2011-02-03 1997-07-17 -S000007359 transposable_element_gene YPR137C-A gag protein chromosome 16 16 810269 808947 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034186 CDS YPR137C-A 16 810269 808947 C 2011-02-03 1996-07-31 -S000007208 LTR_retrotransposon YPRCTy1-2 Ty1 chromosome 16 16 810562 804645 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007203 long_terminal_repeat YPRCdelta19 chromosome 16 16 810562 810229 C 2011-02-03 2000-05-19 Ty1 LTR -S000006677 tRNA_gene tN(GUU)P chromosome 16 L000003725 16 810676 810749 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000030747 noncoding_exon tN(GUU)P 16 810676 810749 W 2011-02-03 2000-05-19 -S000006342 ORF Verified YPR138C MEP3 ammonium permease MEP3 chromosome 16 L000004105 16 812453 810984 C 2011-02-03 1996-07-31 Ammonium permease of high capacity and low affinity; belongs to a ubiquitous family of cytoplasmic membrane proteins that transport only ammonium (NH4+); expression is under the nitrogen catabolite repression regulation ammonia permease; MEP3 has a paralog, MEP1, that arose from the whole genome duplication -S000031048 CDS YPR138C 16 812453 810984 C 2011-02-03 1996-07-31 -S000006343 ORF Verified YPR139C LOA1 lysophosphatidic acid acyltransferase LOA1|VPS66 chromosome 16 16 814058 813156 C 2011-02-03 1996-07-31 Lysophosphatidic acid acyltransferase; involved in triacelglyceride homeostasis and lipid droplet formation; localized to lipid droplets and the ER; specificity for oleoyl-CoA -S000031180 CDS YPR139C 16 814058 813156 C 2011-02-03 1996-07-31 -S000006344 ORF Verified YPR140W TAZ1 lysophosphatidylcholine acyltransferase chromosome 16 16 814391 815536 W 2011-02-03 1996-07-31 Lyso-phosphatidylcholine acyltransferase; required for normal phospholipid content of mitochondrial membranes; major determinant of the final acyl chain composition of the mitochondrial-specific phospholipid cardiolipin; mutations in human ortholog tafazzin (TAZ) cause Barth syndrome, a rare X-linked disease characterized by skeletal and cardiomyopathy and bouts of cyclic neutropenia; a specific splice variant of human TAZ can complement yeast null mutant -S000030806 CDS YPR140W 16 814391 815536 W 2011-02-03 1996-07-31 -S000006345 ORF Verified YPR141C KAR3 OSR11 chromosome 16 L000000888 16 817923 815734 C 94.4 2011-02-03 1996-07-31 Minus-end-directed microtubule motor; functions in mitosis and meiosis, localizes to the spindle pole body and localization is dependent on functional Cik1p, required for nuclear fusion during mating; potential Cdc28p substrate -S000030832 CDS YPR141C 16 817923 815734 C 2011-02-03 1996-07-31 -S000006347 ORF Verified YPR143W RRP15 chromosome 16 16 818323 819075 W 2011-02-03 1996-07-31 Nucleolar protein; constituent of pre-60S ribosomal particles; required for proper processing of the 27S pre-rRNA at the A3 and B1 sites to yield mature 5.8S and 25S rRNAs -S000032060 CDS YPR143W 16 818323 819075 W 2011-02-03 1996-07-31 -S000006346 ORF Dubious YPR142C chromosome 16 16 818693 818130 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RRP15, which is required for ribosomal RNA processing -S000031843 CDS YPR142C 16 818693 818130 C 2011-02-03 1996-07-31 -S000118423 ARS ARS1627 ARSXVI-819 chromosome 16 16 819160 819399 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178201 ARS_consensus_sequence ARS1627 16 819340 819324 C 2014-11-18 2014-11-18 -S000006611 tRNA_gene tI(AAU)P1 chromosome 16 L000003726 16 819529 819602 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000035185 noncoding_exon tI(AAU)P1 16 819529 819602 W 2011-02-03 2000-05-19 -S000006348 ORF Verified YPR144C NOC4 ribosome biosynthesis protein NOC4|UTP19 chromosome 16 16 821423 819765 C 2011-02-03 1996-07-31 Nucleolar protein; forms a complex with Nop14p that mediates maturation and nuclear export of 40S ribosomal subunits; relocalizes to the cytosol in response to hypoxia -S000032106 CDS YPR144C 16 821423 819765 C 2011-02-03 1996-07-31 -S000006505 snoRNA_gene snR45 SNR45 chromosome 16 L000003412 16 821732 821903 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA) but not shown to be active; no target site is predicted within the ribosomal RNAs -S000030617 noncoding_exon snR45 16 821732 821903 W 2011-02-03 2000-05-19 -S000006349 ORF Verified YPR145W ASN1 asparagine synthase (glutamine-hydrolyzing) 1 chromosome 16 L000002732 16 822620 824338 W 2011-02-03 1996-07-31 Asparagine synthetase; catalyzes the synthesis of L-asparagine from L-aspartate in the asparagine biosynthetic pathway; ASN1 has a paralog, ASN2, that arose from the whole genome duplication -S000034141 CDS YPR145W 16 822620 824338 W 2011-02-03 1996-07-31 -S000113589 ORF Uncharacterized YPR145C-A chromosome 16 16 824926 824690 C 2011-02-03 2005-11-21 Putative protein of unknown function -S000113590 CDS YPR145C-A 16 824926 824690 C 2011-02-03 2005-11-21 -S000006350 ORF Dubious YPR146C chromosome 16 16 825676 825347 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034200 CDS YPR146C 16 825676 825347 C 2011-02-03 1996-07-31 -S000006351 ORF Verified YPR147C chromosome 16 16 826559 825645 C 2011-02-03 1996-07-31 Protein of unknown function; may have a role in lipid metabolism, based on localization to lipid droplets; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and is induced in response to the DNA-damaging agent MMS -S000034283 CDS YPR147C 16 826559 825645 C 2011-02-03 1996-07-31 -S000006352 ORF Verified YPR148C chromosome 16 16 828140 826833 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000034341 CDS YPR148C 16 828140 826833 C 2011-02-03 1996-07-31 -S000006353 ORF Verified YPR149W NCE102 NCE2 chromosome 16 L000003098 16 829918 830439 W 2011-02-03 1996-07-31 Protein of unknown function; contains transmembrane domains; involved in secretion of proteins that lack classical secretory signal sequences; component of the detergent-insoluble glycolipid-enriched complexes (DIGs); NCE102 has a paralog, FHN1, that arose from the whole genome duplication -S000035352 CDS YPR149W 16 829918 830439 W 2011-02-03 1996-07-31 -S000006354 ORF Dubious YPR150W chromosome 16 16 830999 831520 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SUE1/YPR151C -S000033972 CDS YPR150W 16 830999 831520 W 2011-02-03 1996-07-31 -S000006355 ORF Verified YPR151C SUE1 chromosome 16 16 831675 831055 C 2011-02-03 1996-07-31 Protein required for degradation of unstable forms of cytochrome c; located in the mitochondria -S000034039 CDS YPR151C 16 831675 831055 C 2011-02-03 1996-07-31 -S000006356 ORF Verified YPR152C URN1 chromosome 16 16 833458 832061 C 2011-02-03 1996-07-31 Protein of unknown function containing WW and FF domains; overexpression causes accumulation of cells in G1 phase -S000034921 CDS YPR152C 16 833458 832061 C 2011-02-03 1996-07-31 -S000006357 ORF Verified YPR153W MAY24 chromosome 16 16 833689 834245 W 2011-02-03 1996-07-31|2007-07-10 Protein of unknown function -S000035217 CDS YPR153W 16 833689 833693 W 2011-02-03 1996-07-31|2007-07-10 -S000123277 CDS YPR153W 16 833828 834245 W 2011-02-03 2007-07-10 -S000123276 intron YPR153W 16 833694 833827 W 2011-02-03 2007-07-10 -S000006358 ORF Verified YPR154W PIN3 LSB2 chromosome 16 16 834565 835212 W 2011-02-03 1996-07-31 Negative regulator of actin nucleation-promoting factor activity; interacts with Las17p, a homolog of human Wiskott-Aldrich Syndrome protein (WASP), via an N-terminal SH3 domain, and along with LSB1 cooperatively inhibits the nucleation of actin filaments; short-lived protein whose levels increase in response to thermal stress; induces the formation of the [PIN+] and [RNQ+] prions when overproduced; PIN3 has a paralog, LSB1, that arose from the whole genome duplication -S000036101 CDS YPR154W 16 834565 835212 W 2011-02-03 1996-07-31 -S000006359 ORF Verified YPR155C NCA2 chromosome 16 L000003161 16 837413 835563 C 2011-02-03 1996-07-31 Protein that regulates expression of Fo-F1 ATP synthase subunits; involved in the regulation of mitochondrial expression of subunits 6 (Atp6p) and 8 (Atp8p) of the Fo-F1 ATP synthase; functions with Nca3p -S000036159 CDS YPR155C 16 837413 835563 C 2011-02-03 1996-07-31 -S000006360 ORF Verified YPR156C TPO3 spermine transporter chromosome 16 16 839777 837909 C 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; specific for spermine; localizes to the plasma membrane; TPO3 has a paralog, TPO2, that arose from the whole genome duplication -S000036260 CDS YPR156C 16 839777 837909 C 2011-02-03 1996-07-31 -S000006361 ORF Uncharacterized YPR157W TDA6 chromosome 16 16 841266 842669 W 2011-02-03 1996-07-31 Putative protein of unknown function; induced by treatment with 8-methoxypsoralen and UVA irradiation; null mutant is sensitive to expression of the top1-T722A allele; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole; TDA6 has a paralog, VPS62, that arose from the whole genome duplication -S000036428 CDS YPR157W 16 841266 842669 W 2011-02-03 1996-07-31 -S000118424 ARS ARS1628 ARSXVI-843 chromosome 16 16 842653 842900 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178202 ARS_consensus_sequence ARS1628 16 842708 842724 W 2014-11-18 2014-11-18 -S000006362 ORF Verified YPR158W CUR1 chromosome 16 16 843262 844020 W 2011-02-03 1996-07-31 Sorting factor, central regulator of spatial protein quality control; physically and functionally interacts with chaperones to promote sorting and deposition of misfolded proteins into cytosolic compartments; involved in destabilization of [URE3] prions; CUR1 has a paralog, BTN2, that arose from the whole genome duplication -S000030121 CDS YPR158W 16 843262 844020 W 2011-02-03 1996-07-31 -S000007214 long_terminal_repeat YPRWdelta20 chromosome 16 16 844412 844749 W 2011-02-03 2000-05-19 Ty1 LTR -S000007220 LTR_retrotransposon YPRWTy1-3 Ty1 chromosome 16 16 844412 850340 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007363 transposable_element_gene YPR158W-A gag protein chromosome 16 16 844709 846031 W 2011-02-03 1999-07-17|1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000037619 CDS YPR158W-A 16 844709 846031 W 2011-02-03 1999-07-17 -S000007364 transposable_element_gene YPR158W-B gag-pol fusion protein chromosome 16 16 844709 849980 W 2011-02-03 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000037621 CDS YPR158W-B 16 844709 846013 W 2011-02-03 1997-07-17 -S000037622 CDS YPR158W-B 16 846015 849980 W 2011-02-03 1997-07-17 -S000037623 plus_1_translational_frameshift YPR158W-B 16 846014 846014 W 2011-02-03 1997-07-17 -S000007215 long_terminal_repeat YPRWdelta21 chromosome 16 16 850003 850340 W 2011-02-03 2000-05-19 Ty1 LTR -S000007204 long_terminal_repeat YPRCdelta22 chromosome 16 16 850512 850357 C 2011-02-03 2000-05-19 Ty1 LTR -S000130201 ARS ARS1629 chromosome 16 16 850512 850629 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000007205 long_terminal_repeat YPRCdelta23 chromosome 16 16 850966 850629 C 2011-02-03 2000-05-19 Ty1 LTR -S000007362 transposable_element_gene YPR158C-D gag-pol fusion protein chromosome 16 S000029021 16 856257 850989 C 2011-02-03 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000035820 CDS YPR158C-D 16 854951 850989 C 2011-02-03 1997-07-17 -S000035819 CDS YPR158C-D 16 856257 854953 C 2011-02-03 1997-07-17 -S000035821 plus_1_translational_frameshift YPR158C-D 16 854952 854952 C 2011-02-03 1997-07-17 -S000007361 transposable_element_gene YPR158C-C gag protein chromosome 16 16 856257 854935 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035816 CDS YPR158C-C 16 856257 854935 C 2011-02-03 1999-07-17 -S000007217 long_terminal_repeat YPRWsigma3 chromosome 16 16 856545 856885 W 2011-02-03 2000-05-19 Ty3 LTR -S000007209 LTR_retrotransposon YPRCTy1-4 Ty1 chromosome 16 16 856554 850629 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007206 long_terminal_repeat YPRCdelta24 chromosome 16 16 856554 856217 C 2011-02-03 2000-05-19 Ty1 LTR -S000006520 tRNA_gene tA(AGC)P chromosome 16 L000003727 16 856902 856974 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032310 noncoding_exon tA(AGC)P 16 856902 856974 W 2011-02-03 2000-05-19 -S000006363 ORF Verified YPR159W KRE6 beta-glucan synthesis-associated protein KRE6|CWH48 chromosome 16 L000000915 16 857583 859745 W 95.9 2011-02-03 1996-07-31 Type II integral membrane protein; required for beta-1,6 glucan biosynthesis; putative beta-glucan synthase; localizes to ER, plasma membrane, sites of polarized growth and secretory vesicles; functionally redundant with Skn1p; KRE6 has a paralog, SKN1, that arose from the whole genome duplication -S000030298 CDS YPR159W 16 857583 859745 W 2011-02-03 1996-07-31 -S000006589 tRNA_gene tG(GCC)P2 chromosome 16 L000003728 16 860379 860449 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000031683 noncoding_exon tG(GCC)P2 16 860379 860449 W 2011-02-03 2000-05-19 -S000028725 ORF Uncharacterized YPR159C-A chromosome 16 16 860415 860314 C 2011-02-03 2003-07-29 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cytosol; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032712 CDS YPR159C-A 16 860415 860314 C 2011-02-03 2003-07-29 -S000006364 ORF Verified YPR160W GPH1 glycogen phosphorylase chromosome 16 L000000724 16 861306 864014 W 2011-02-03 1996-07-31 Glycogen phosphorylase required for the mobilization of glycogen; non-essential; regulated by cyclic AMP-mediated phosphorylation; phosphorylation by Cdc28p may coordinately regulate carbohydrate metabolism and the cell cycle; expression is regulated by stress-response elements and by the HOG MAP kinase pathway -S000029939 CDS YPR160W 16 861306 864014 W 2011-02-03 1996-07-31 -S000028860 ORF Dubious YPR160W-A chromosome 16 16 861934 862014 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry -S000034591 CDS YPR160W-A 16 861934 862014 W 2011-02-03 2003-07-29 -S000028726 ORF Dubious YPR160C-A chromosome 16 16 862861 862577 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032715 CDS YPR160C-A 16 862861 862577 C 2011-02-03 2003-07-29 -S000006365 ORF Verified YPR161C SGV1 cyclin-dependent serine/threonine protein kinase SGV1|BUR1 chromosome 16 L000001878 16 866422 864449 C 2011-02-03 1996-07-31 Cyclin (Bur2p)-dependent protein kinase; part of the BUR kinase complex which functions in transcriptional regulation; phosphorylates the carboxy-terminal domain (CTD) of Rpo21p and the C-terminal repeat domain of Spt5p; recruits Spt6p to the CTD at the onset of transcription; regulated by Cak1p; similar to metazoan CDK9 proteins -S000030002 CDS YPR161C 16 866422 864449 C 2011-02-03 1996-07-31 -S000006366 ORF Verified YPR162C ORC4 origin recognition complex subunit 4 chromosome 16 L000003075 16 868304 866715 C 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing; ORC4 has a paralog, RIF2, that arose from the whole genome duplication -S000030984 CDS YPR162C 16 868304 866715 C 2011-02-03 1996-07-31 -S000006367 ORF Verified YPR163C TIF3 eIF4B|STM1|RBL3 chromosome 16 L000002304 16 869955 868645 C 2011-02-03 1996-07-31 Translation initiation factor eIF-4B; contains an RNA recognition motif and binds to single-stranded RNA; has RNA annealing activity; interacts with Rps20p at the head of the 40S ribosomal subunit and alters the structure of the mRNA entry channel -S000031085 CDS YPR163C 16 869955 868645 C 2011-02-03 1996-07-31 -S000006368 ORF Verified YPR164W MMS1 SLM6|RTT108 chromosome 16 L000003933 16 870703 874926 W 2011-02-03 1996-07-31 Subunit of E3 ubiquitin ligase complex involved in replication repair; stabilizes protein components of the replication fork such as the fork-pausing complex and leading strand polymerase, preventing fork collapse and promoting efficient recovery during replication stress; regulates Ty1 transposition; involved with Rtt101p in nonfunctional rRNA decay -S000032195 CDS YPR164W 16 870703 874926 W 2011-02-03 1996-07-31 -S000006369 ORF Verified YPR165W RHO1 Rho family GTPase RHO1 chromosome 16 L000001630 16 875368 875997 W 2011-02-03 1996-07-31 GTP-binding protein of the rho subfamily of Ras-like proteins; involved in establishment of cell polarity; regulates protein kinase C (Pkc1p) and the cell wall synthesizing enzyme 1,3-beta-glucan synthase (Fks1p and Gsc2p) -S000032291 CDS YPR165W 16 875368 875997 W 2011-02-03 1996-07-31 -S000006370 ORF Verified YPR166C MRP2 mitochondrial 37S ribosomal protein MRP2 chromosome 16 L000001153 16 876629 876282 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000032335 CDS YPR166C 16 876629 876282 C 2011-02-03 1996-07-31 -S000006371 ORF Verified YPR167C MET16 phosphoadenylyl-sulfate reductase (thioredoxin) chromosome 16 L000001087 16 877632 876847 C 2011-02-03 1996-07-31 3'-phosphoadenylsulfate reductase; reduces 3'-phosphoadenylyl sulfate to adenosine-3',5'-bisphosphate and free sulfite using reduced thioredoxin as cosubstrate, involved in sulfate assimilation and methionine metabolism -S000032426 CDS YPR167C 16 877632 876847 C 2011-02-03 1996-07-31 -S000006372 ORF Verified YPR168W NUT2 mediator complex subunit NUT2|MED10 chromosome 16 L000003447|L000004593 16 878076 878549 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for transcriptional activation and has a role in basal transcription; protein abundance increases in response to DNA replication stress -S000034534 CDS YPR168W 16 878076 878549 W 2011-02-03 1996-07-31 -S000006373 ORF Verified YPR169W JIP5 chromosome 16 16 878690 880168 W 2011-02-03 1996-07-31|2005-12-01 Protein required for biogenesis of the large ribosomal subunit; required for biogenesis of the large ribosomal subunit; interacts with proteins involved in RNA processing, ribosome biogenesis, ubiquitination and demethylation; similar to WDR55, a human WD repeat protein; essential gene -S000034622 CDS YPR169W 16 878690 880168 W 2011-02-03 1996-07-31|2005-12-01 -S000006612 tRNA_gene tI(AAU)P2 chromosome 16 L000003729 16 880369 880296 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000035187 noncoding_exon tI(AAU)P2 16 880369 880296 C 2011-02-03 2000-05-19 -S000007218 long_terminal_repeat YPRWsigma4 chromosome 16 16 880386 880726 W 2011-02-03 2000-05-19 Ty3 LTR -S000118425 ARS ARS1630 ARSXVI-881 chromosome 16 16 880861 881108 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178203 ARS_consensus_sequence ARS1630 16 880905 880921 W 2014-11-18 2014-11-18 -S000007207 long_terminal_repeat YPRCtau3 chromosome 16 16 881830 881487 C 2011-02-03 2000-05-19 Ty4 LTR -S000028591 ORF Dubious YPR169W-A chromosome 16 16 883239 883457 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps two other dubious ORFs: YPR170C and YPR170W-B -S000031363 CDS YPR169W-A 16 883239 883457 W 2011-02-03 2003-07-29 -S000028515 ORF Uncharacterized YPR170W-B chromosome 16 16 883239 883595 W 2011-02-03 2003-07-29 Putative protein of unknown function; conserved in fungi; SWAT-GFP fusion protein localizes to the vacuole membrane; partially overlaps the dubious genes YPR169W-A, YPR170W-A and YRP170C -S000030284 CDS YPR170W-B 16 883239 883387 W 2011-02-03 2003-07-29 -S000030285 CDS YPR170W-B 16 883487 883595 W 2011-02-03 2003-07-29 -S000030286 intron YPR170W-B 16 883388 883486 W 2011-02-03 2003-07-29 -S000006374 ORF Dubious YPR170C chromosome 16 16 883318 882983 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORFs YPR169W-A and YPR170W-B -S000033271 CDS YPR170C 16 883318 882983 C 2011-02-03 1996-07-31 -S000028861 ORF Dubious YPR170W-A chromosome 16 16 883378 883563 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry -S000034592 CDS YPR170W-A 16 883378 883563 W 2011-02-03 2003-07-29 -S000006375 ORF Verified YPR171W BSP1 chromosome 16 16 883828 885558 W 2011-02-03 1996-07-31 Adapter that links synaptojanins to the cortical actin cytoskeleton; the synaptojanins are Inp52p and Inp53p -S000034199 CDS YPR171W 16 883828 885558 W 2011-02-03 1996-07-31 -S000006376 ORF Uncharacterized YPR172W pyridoxal 5'-phosphate synthase chromosome 16 16 885796 886398 W 2011-02-03 1996-07-31 Protein of unknown function; predicted to encode a pyridoxal 5'-phosphate synthase based on sequence similarity but purified protein does not possess this activity, nor does it bind flavin mononucleotide (FMN); transcriptionally activated by Yrm1p along with genes involved in multidrug resistance; YPR172W has a paralog, YLR456W, that arose from the whole genome duplication -S000034326 CDS YPR172W 16 885796 886398 W 2011-02-03 1996-07-31 -S000006377 ORF Verified YPR173C VPS4 AAA family ATPase VPS4|DID6|VPT10|VPL4|GRD13|END13|CSC1 chromosome 16 L000002956 16 887837 886524 C 2011-02-03 1996-07-31 AAA-ATPase involved in multivesicular body (MVB) protein sorting; ATP-bound Vps4p localizes to endosomes and catalyzes ESCRT-III disassembly and membrane release; ATPase activity is activated by Vta1p; regulates cellular sterol metabolism -S000034362 CDS YPR173C 16 887837 886524 C 2011-02-03 1996-07-31 -S000006378 ORF Verified YPR174C chromosome 16 16 888708 888043 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nuclear periphery; potential Cdc28p substrate; binds phosphatidylinositols and phosphatidylethanolamine in a large-scale study; relative distribution to foci at the nuclear periphery increases upon DNA replication stress; YPR174C has a paralog, NBP1, that arose from the whole genome duplication -S000035379 CDS YPR174C 16 888708 888043 C 2011-02-03 1996-07-31 -S000006379 ORF Verified YPR175W DPB2 DNA polymerase epsilon noncatalytic subunit chromosome 16 L000000519 16 888974 891043 W 2011-02-03 2003-09-22|1996-07-31 Second largest subunit of DNA polymerase II (DNA polymerase epsilon); required for maintenance of fidelity of chromosomal replication; essential motif in C-terminus is required for formation of the four-subunit Pol epsilon; expression peaks at the G1/S phase boundary; Cdc28p substrate -S000035567 CDS YPR175W 16 888974 891043 W 2011-02-03 2003-09-22|1996-07-31 -S000006380 ORF Verified YPR176C BET2 Rab geranylgeranyltransferase BET2 chromosome 16 L000000172 16 892078 891101 C 2011-02-03 1996-07-31 Beta subunit of Type II geranylgeranyltransferase; required for vesicular transport between the endoplasmic reticulum and the Golgi; provides a membrane attachment moiety to Rab-like proteins Ypt1p and Sec4p; human homolog RABGGTB can complement yeast BET2 mutant -S000035598 CDS YPR176C 16 892078 891101 C 2011-02-03 1996-07-31 -S000006382 ORF Verified YPR178W PRP4 U4/U6-U5 snRNP complex subunit PRP4|RNA4 chromosome 16 L000001497 16 892332 893729 W 2011-02-03 1996-07-31 Splicing factor; component of the U4/U6-U5 snRNP complex -S000036653 CDS YPR178W 16 892332 893729 W 2011-02-03 1996-07-31 -S000006381 ORF Dubious YPR177C chromosome 16 16 892684 892313 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the 5' end of the essential PRP4 gene encoding a component of the U4/U6-U5 snRNP complex -S000036500 CDS YPR177C 16 892684 892313 C 2011-02-03 1996-07-31 -S000006383 ORF Verified YPR179C HDA3 PLO1 chromosome 16 16 895764 893797 C 2011-02-03 1996-07-31 Subunit of the HDA1 histone deacetylase complex; possibly tetrameric trichostatin A-sensitive class II histone deacetylase complex contains Hda1p homodimer and an Hda2p-Hda3p heterodimer; required for the activity of the complex; relocalizes to the cytosol in response to hypoxia; similar to Hda2p -S000036672 CDS YPR179C 16 895764 893797 C 2011-02-03 1996-07-31 -S000006384 ORF Verified YPR180W AOS1 E1 ubiquitin-activating protein AOS1|RHC31 chromosome 16 L000004031 16 895961 897004 W 2011-02-03 1996-07-31 Subunit of heterodimeric nuclear SUMO activating enzyme E1 with Uba2p; activates Smt3p (SUMO) before its conjugation to proteins (sumoylation), which may play a role in protein targeting; essential for viability; relocalizes to the cytosol in response to hypoxia -S000030253 CDS YPR180W 16 895961 897004 W 2011-02-03 1996-07-31 -S000006385 ORF Verified YPR181C SEC23 GTPase-activating protein SEC23 chromosome 16 L000001846|S000028412 16 899667 897361 C 2011-02-03 1996-07-31 GTPase-activating protein, stimulates the GTPase activity of Sar1p; component of the Sec23p-Sec24p heterodimer of the COPII vesicle coat, involved in ER to Golgi transport; substrate of Ubp3/Bre5 complex; ubiquitylated by Ub-ligase Rsp5p; proteasome-mediated degradation of Sec23p is regulated by Cdc48p -S000030311 CDS YPR181C 16 899667 897361 C 2011-02-03 1996-07-31 -S000006386 ORF Verified YPR182W SMX3 mRNA splicing protein SMX3|Sm F|SmF chromosome 16 L000002786 16 900194 900454 W 2011-02-03 1996-07-31 Core Sm protein Sm F; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Smd3p, Sme1p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm F -S000030535 CDS YPR182W 16 900194 900454 W 2011-02-03 1996-07-31 -S000006387 ORF Verified YPR183W DPM1 dolichyl-phosphate beta-D-mannosyltransferase|SED3 chromosome 16 L000000524 16 900755 901558 W 2011-02-03 1996-07-31 Dolichol phosphate mannose (Dol-P-Man) synthase of ER membrane; catalyzes formation of Dol-P-Man from Dol-P and GDP-Man; required for biosynthesis of glycosyl phosphatidylinositol (GPI) membrane anchor, as well as O-mannosylation and protein N- and O-linked glycosylation; human homolog DPM1 can complement yeast mutant strains -S000031445 CDS YPR183W 16 900755 901558 W 2011-02-03 1996-07-31 -S000006388 ORF Verified YPR184W GDB1 bifunctional 4-alpha-glucanotransferase/amylo-alpha-1,6-glucosidase chromosome 16 16 902044 906654 W 2011-02-03 1996-07-31 Glycogen debranching enzyme; contains glucanotranferase and alpha-1,6-amyloglucosidase activities; required for glycogen degradation; phosphorylated in mitochondria; activity is inhibited by Igd1p; protein abundance increases in response to DNA replication stress -S000031566 CDS YPR184W 16 902044 906654 W 2011-02-03 1996-07-31 -S000006389 ORF Verified YPR185W ATG13 serine/threonine protein kinase regulatory subunit ATG13|APG13 chromosome 16 L000003956 16 907218 909434 W 2011-02-03 1996-07-31 Regulatory subunit of the Atg1p signaling complex; stimulates Atg1p kinase activity; required for vesicle formation during autophagy and the cytoplasm-to-vacuole targeting (Cvt) pathway; contains a HORMA domain required for autophagy and for recruitment of the phosphatidylinositol 3-kinase complex subunit Atg14p to the pre-autophagosomal structure -S000031704 CDS YPR185W 16 907218 909434 W 2011-02-03 1996-07-31 -S000006390 ORF Verified YPR186C PZF1 TFC2 chromosome 16 L000002286|L000001544 16 911022 909733 C 2011-02-03 1996-07-31 Transcription factor IIIA (TFIIIA); essential DNA binding protein required for transcription of 5S rRNA by RNA polymerase III; not involved in transcription of other RNAP III genes; nine conserved zinc fingers; may also bind 5S rRNA -S000032601 CDS YPR186C 16 911022 909733 C 2011-02-03 1996-07-31 -S000006391 ORF Verified YPR187W RPO26 DNA-directed RNA polymerase core subunit RPO26|ABC23|RPB6 chromosome 16 L000001745 16 911257 911800 W 2011-02-03 1996-07-31 RNA polymerase subunit ABC23; common to RNA polymerases I, II, and III; part of central core; similar to bacterial omega subunit -S000032734 CDS YPR187W 16 911257 911276 W 2011-02-03 1996-07-31 -S000032735 CDS YPR187W 16 911353 911800 W 2011-02-03 1996-07-31 -S000032736 intron YPR187W 16 911277 911352 W 2011-02-03 1996-07-31 -S000006392 ORF Verified YPR188C MLC2 chromosome 16 S000007532 16 912479 911988 C 2011-02-03 1996-07-31 Regulatory light chain for the type II myosin Myo1p; binds to an IQ motif of Myo1p, localization to the bud neck depends on Myo1p; involved in the disassembly of the Myo1p ring -S000032770 CDS YPR188C 16 912479 911988 C 2011-02-03 1996-07-31 -S000006393 ORF Verified YPR189W SKI3 SKI complex subunit tetratricopeptide repeat protein SKI3|SKI5 chromosome 16 L000001904 16 912664 916962 W 2011-02-03 1996-07-31 Ski complex component and TPR protein; mediates 3'-5' RNA degradation by the cytoplasmic exosome; null mutants have superkiller phenotype of increased viral dsRNAs and are synthetic lethal with mutations in 5'-3' mRNA decay; mutations in the human ortholog, TTC37, causes Syndromic diarrhea/Trichohepatoenteric (SD/THE) syndrome -S000034826 CDS YPR189W 16 912664 916962 W 2011-02-03 1996-07-31 -S000006394 ORF Verified YPR190C RPC82 DNA-directed RNA polymerase III subunit C82|RPC80|RPC3 chromosome 16 L000001693|S000029422|L000001692 16 919041 917077 C 2011-02-03 1996-07-31 RNA polymerase III subunit C82 -S000033015 CDS YPR190C 16 919041 917077 C 2011-02-03 1996-07-31 -S000006395 ORF Verified YPR191W QCR2 ubiquinol--cytochrome-c reductase subunit 2|UCR2|COR2 chromosome 16 L000001545 16 919381 920487 W 2011-02-03 1996-07-31 Subunit 2 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; phosphorylated; transcription is regulated by Hap1p, Hap2p/Hap3p, and heme -S000033835 CDS YPR191W 16 919381 920487 W 2011-02-03 1996-07-31 -S000006396 ORF Verified YPR192W AQY1 chromosome 16 L000004720 16 921860 922777 W 2011-02-03 1996-07-31 Spore-specific water channel; mediates the transport of water across cell membranes, developmentally controlled; may play a role in spore maturation, probably by allowing water outflow, may be involved in freeze tolerance -S000033980 CDS YPR192W 16 921860 922777 W 2011-02-03 1996-07-31 -S000006397 ORF Verified YPR193C HPA2 histone acetyltransferase|KAT10 chromosome 16 L000004379 16 923379 922909 C 2011-02-03 1996-07-31 Tetrameric histone acetyltransferase; has similarity to Gcn5p, Hat1p, Elp3p, and Hpa3p; acetylates histones H3 and H4 in vitro and exhibits autoacetylation activity; also acetylates polyamines -S000034022 CDS YPR193C 16 923379 922909 C 2011-02-03 1996-07-31 -S000006398 ORF Verified YPR194C OPT2 chromosome 16 16 926937 924304 C 2011-02-03 1996-07-31 Oligopeptide transporter; localized to peroxisomes and affects glutathione redox homeostasis; also localizes to the plasma membrane (PM) and to the late Golgi, and has a role in maintenance of lipid asymmetry between the inner and outer leaflets of the PM; member of the OPT family, with potential orthologs in S. pombe and C. albicans; also plays a role in formation of mature vacuoles and in polarized cell growth -S000034902 CDS YPR194C 16 926937 924304 C 2011-02-03 1996-07-31 -S000006399 ORF Dubious YPR195C chromosome 16 16 928294 927965 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035080 CDS YPR195C 16 928294 927965 C 2011-02-03 1996-07-31 -S000006400 ORF Uncharacterized YPR196W putative maltose-responsive transcription factor chromosome 16 16 931376 932788 W 2011-02-03 1996-07-31 Putative maltose-responsive transcription factor -S000036124 CDS YPR196W 16 931376 932788 W 2011-02-03 1996-07-31 -S000118426 ARS ARS1631 ARSXVI-933 chromosome 16 16 932983 933229 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178204 ARS_consensus_sequence ARS1631 16 933165 933149 C 2014-11-18 2014-11-18 -S000007219 long_terminal_repeat YPRWtau4 chromosome 16 16 933071 933404 W 2011-02-03 2000-05-19 Ty4 LTR -S000006402 ORF Verified YPR198W SGE1 NOR1 chromosome 16 L000001876 16 934034 935665 W 84.8 2011-02-03 1996-07-31 Plasma membrane multidrug transporter; member of the major facilitator superfamily; acts as an extrusion permease; partial multicopy suppressor of gal11 mutations -S000036370 CDS YPR198W 16 934034 935665 W 2011-02-03 1996-07-31 -S000006401 ORF Dubious YPR197C chromosome 16 16 934461 933898 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SGE1/YPR198W -S000036181 CDS YPR197C 16 934461 933898 C 2011-02-03 1996-07-31 -S000006403 ORF Verified YPR199C ARR1 ACR1|YAP8 chromosome 16 L000004292 16 939032 938148 C 2011-02-03 1996-07-31 Transcriptional activator of the basic leucine zipper (bZIP) family; required for transcription of genes involved in resistance to arsenic compounds; directly binds trivalent arsenic (As(III)) as does K. lactis ortholog, KIYAP8 -S000036409 CDS YPR199C 16 939032 938148 C 2011-02-03 1996-07-31 -S000006404 ORF Verified YPR200C ARR2 ACR2 chromosome 16 L000004293|L000004290 16 939671 939279 C 2011-02-03 1996-07-31 Arsenate reductase required for arsenate resistance; converts arsenate to arsenite which can then be exported from cells by Arr3p -S000034447 CDS YPR200C 16 939671 939279 C 2011-02-03 1996-07-31 -S000006405 ORF Verified YPR201W ARR3 ACR3 chromosome 16 L000004323 16 939922 941136 W 2011-02-03 1996-07-31 Plasma membrane metalloid/H+ antiporter; member of bile/arsenite/riboflavin transporter (BART) superfamily; transports arsenite and antimonite; required for resistance to arsenic compounds; transcription is activated by Arr1p in the presence of arsenite -S000034611 CDS YPR201W 16 939922 941136 W 2011-02-03 1996-07-31 -S000130202 ARS ARS1632 chromosome 16 16 942084 943032 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000029002 telomere TEL16R chromosome 16 16 942396 948010 W 106 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the right arm of Chromosome XVI; annotated components include an X element core sequence and a short Y' element; TEL16R does have telomeric repeats (TEL16R-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly -S000029003 X_element TEL16R 16 942396 942771 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XVI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000029004 Y_prime_element TEL16R 16 942810 948010 W 2011-02-03 2003-09-09|2011-02-03 Telomeric short Y' element on the right arm of Chromosome XVI; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs YPR202W, YPR203W, YPR204W, and YPR204C-A -S000006406 ORF Uncharacterized YPR202W chromosome 16 16 943032 943896 W 2011-02-03 1996-07-31 Putative protein of unknown function; similar to telomere-encoded helicases; down-regulated at low calcium levels; YPR202W is not an essential gene; transcript is predicted to be spliced but there is no evidence that it is spliced in vivo -S000034726 CDS YPR202W 16 943032 943050 W 2011-02-03 1996-07-31 -S000034727 CDS YPR202W 16 943199 943896 W 2011-02-03 1996-07-31 -S000034728 intron YPR202W 16 943051 943198 W 2011-02-03 1996-07-31 -S000006407 ORF Uncharacterized YPR203W chromosome 16 16 943880 944188 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000035720 CDS YPR203W 16 943880 944188 W 2011-02-03 1996-07-31 -S000006408 ORF Verified YPR204W Y' -Help1|Y' element ATP-dependent helicase chromosome 16 16 944603 947701 W 2011-02-03 1996-07-31 DNA helicase encoded within the telomeric Y' element; Y' -helicase protein 1 -S000035834 CDS YPR204W 16 944603 947701 W 2011-02-03 1996-07-31 -S000028727 ORF Dubious YPR204C-A chromosome 16 16 947338 946856 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032717 CDS YPR204C-A 16 947338 946856 C 2011-02-03 2003-07-29 -S000007328 tRNA_gene tP(UGG)Q chromosome 17 L000004903 17 731 802 W 2000-05-19 2000-05-19 Mitochondrial proline tRNA (tRNA-Pro) -S000036040 noncoding_exon tP(UGG)Q 17 731 802 W 2000-05-19 2000-05-19 -S000007257 ORF Dubious Q0010 ORF6 chromosome 17 L000004921 17 3952 4338 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF Q0017 -S000036184 CDS Q0010 17 3952 4338 W 2000-05-19 2000-05-19 -S000007258 ORF Dubious Q0017 ORF7 chromosome 17 L000004922 17 4254 4415 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF Q0010 -S000036188 CDS Q0017 17 4254 4415 W 2000-05-19 2000-05-19 -S000029667 origin_of_replication ORI1 ORI1 chromosome 17 L000001308 17 4312 4012 C 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007287 rRNA_gene Q0020 15S_RRNA 14s rRNA|15S_RRNA_2 chromosome 17 L000004882 17 6546 8194 W 2000-05-19 2000-05-19 Ribosomal RNA of the small mitochondrial ribosomal subunit; MSU1 allele suppresses ochre stop mutations in mitochondrial protein-coding genes -S000037488 noncoding_exon Q0020 17 6546 8194 W 2000-05-19 2000-05-19 -S000007337 tRNA_gene tW(UCA)Q chromosome 17 L000004912 17 9374 9447 W 2000-05-19 2000-05-19 Mitochondrial tRNA, annotated as tryptophanyl tRNA (tRNA-Trp); predicted by tRNAscan-SE analysis to have specificity for selenocysteine -S000031464 noncoding_exon tW(UCA)Q 17 9374 9447 W 2000-05-19 2000-05-19 -S000007259 ORF Dubious Q0032 ORF8 chromosome 17 L000004923 17 11667 11957 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036376 CDS Q0032 17 11667 11957 W 2000-05-19 2000-05-19 -S000029331 origin_of_replication ORI8 ORI8 chromosome 17 L000003958 17 12780 12510 C 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007261 ORF Verified Q0050 AI1 intron-encoded reverse transcriptase aI1 chromosome 17 L000000066|L000004925 17 13818 16322 W 2000-05-19 2000-05-19 Reverse transcriptase required for splicing of the COX1 pre-mRNA; encoded by a mobile group II intron within the mitochondrial COX1 gene -S000037112 CDS Q0050 17 13818 16322 W 2000-05-19 2000-05-19 -S000007262 ORF Verified Q0055 AI2 intron-encoded reverse transcriptase aI2 chromosome 17 L000004926|L000000067 17 13818 18830 W 2000-05-19 2000-05-19 Reverse transcriptase required for splicing of the COX1 pre-mRNA; encoded by a mobile group II intron within the mitochondrial COX1 gene -S000037125 CDS Q0055 17 13818 13986 W 2000-05-19 2000-05-19 -S000037126 CDS Q0055 17 16435 18830 W 2000-05-19 2000-05-19 -S000037127 intron Q0055 17 13987 16434 W 2000-05-19 2000-05-19 -S000007263 ORF Verified Q0060 AI3 intron-encoded DNA endonuclease aI3|I-SceIII chromosome 17 L000004927|L000000068 17 13818 19996 W 2000-05-19 2000-05-19|2006-01-12 Endonuclease I-SceIII; encoded by a mobile group I intron within the mitochondrial COX1 gene -S000037203 CDS Q0060 17 13818 13986 W 2000-05-19 2000-05-19 -S000114045 CDS Q0060 17 16435 16470 W 2006-01-12 2006-01-12 -S000037204 CDS Q0060 17 18954 19996 W 2000-05-19 2000-05-19 -S000037205 intron Q0060 17 13987 16434 W 2006-01-12 2000-05-19|2006-01-12 -S000114046 intron Q0060 17 16471 18953 W 2006-01-12 2006-01-12 -S000007264 ORF Verified Q0065 AI4 intron-encoded DNA endonuclease aI4|I-SceII chromosome 17 L000004928|L000004885 17 13818 21935 W 2000-05-19 2000-05-19|2006-01-12 Endonuclease I-SceII; encoded by a mobile group I intron within the mitochondrial COX1 gene; intron is normally spliced by the BI4p maturase but AI4p can mutate to acquire the same maturase activity -S000037224 CDS Q0065 17 13818 13986 W 2000-05-19 2000-05-19 -S000114047 CDS Q0065 17 16435 16470 W 2006-01-12 2006-01-12 -S000037225 CDS Q0065 17 18954 18991 W 2000-05-19 2000-05-19 -S000037226 CDS Q0065 17 20508 21935 W 2000-05-19 2000-05-19 -S000037227 intron Q0065 17 13987 16434 W 2006-01-12 2000-05-19|2006-01-12 -S000114048 intron Q0065 17 16471 18953 W 2006-01-12 2006-01-12 -S000037228 intron Q0065 17 18992 20507 W 2000-05-19 2000-05-19 -S000007265 ORF Verified Q0070 AI5_ALPHA intron-encoded DNA endonuclease aI5 alpha chromosome 17 L000004929|L000004886 17 13818 23167 W 2000-05-19 2000-05-19 Endonuclease I-SceIV; involved in intron mobility; encoded by a mobile group I intron within the mitochondrial COX1 gene -S000029861 CDS Q0070 17 13818 13986 W 2000-05-19 2000-05-19 -S000029862 CDS Q0070 17 16435 16470 W 2000-05-19 2000-05-19 -S000029863 CDS Q0070 17 18954 18991 W 2000-05-19 2000-05-19 -S000029864 CDS Q0070 17 20508 20984 W 2000-05-19 2000-05-19 -S000029865 CDS Q0070 17 21995 23167 W 2000-05-19 2000-05-19 -S000029866 intron Q0070 17 13987 16434 W 2000-05-19 2000-05-19 -S000029867 intron Q0070 17 16471 18953 W 2000-05-19 2000-05-19 -S000029868 intron Q0070 17 18992 20507 W 2000-05-19 2000-05-19 -S000029869 intron Q0070 17 20985 21994 W 2000-05-19 2000-05-19 -S000007260 ORF Verified Q0045 COX1 cytochrome c oxidase subunit 1|OXI3 chromosome 17 L000004924|L000000383|L000001321 17 13818 26701 W 2000-05-19 2000-05-19 Subunit I of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; one of three mitochondrially-encoded subunits -S000037020 CDS Q0045 17 13818 13986 W 2000-05-19 2000-05-19 -S000037021 CDS Q0045 17 16435 16470 W 2000-05-19 2000-05-19 -S000037022 CDS Q0045 17 18954 18991 W 2000-05-19 2000-05-19 -S000037023 CDS Q0045 17 20508 20984 W 2000-05-19 2000-05-19 -S000037024 CDS Q0045 17 21995 22246 W 2000-05-19 2000-05-19 -S000037025 CDS Q0045 17 23612 23746 W 2000-05-19 2000-05-19 -S000037026 CDS Q0045 17 25318 25342 W 2000-05-19 2000-05-19 -S000037027 CDS Q0045 17 26229 26701 W 2000-05-19 2000-05-19 -S000037028 intron Q0045 17 13987 16434 W 2000-05-19 2000-05-19 -S000037029 intron Q0045 17 16471 18953 W 2000-05-19 2000-05-19 -S000037030 intron Q0045 17 18992 20507 W 2000-05-19 2000-05-19 -S000037031 intron Q0045 17 20985 21994 W 2000-05-19 2000-05-19 -S000037032 intron Q0045 17 22247 23611 W 2000-05-19 2000-05-19 -S000037033 intron Q0045 17 23747 25317 W 2000-05-19 2000-05-19 -S000037034 intron Q0045 17 25343 26228 W 2000-05-19 2000-05-19 -S000007266 ORF Uncharacterized Q0075 AI5_BETA intron-encoded DNA endonuclease aI5 beta chromosome 17 L000004887|L000004930 17 24156 25255 W 2000-05-19 2000-05-19 Protein of unknown function; encoded within an intron of the mitochondrial COX1 gene; translational initiation codon is predicted to be ATA rather than ATG -S000029881 CDS Q0075 17 24156 24870 W 2000-05-19 2000-05-19 -S000029882 CDS Q0075 17 24906 25255 W 2000-05-19 2000-05-19 -S000029883 intron Q0075 17 24871 24905 W 2000-05-19 2000-05-19 -S000007267 ORF Verified Q0080 ATP8 F1F0 ATP synthase subunit 8|AAP1 chromosome 17 L000004931|L000002723|L000002797 17 27666 27812 W 2000-05-19 2000-05-19 Subunit 8 of the F0 sector of mitochondrial F1F0 ATP synthase; encoded on the mitochondrial genome; ATP8 and ATP6 mRNAs are not translated in the absence of the F1 sector of ATPase -S000029967 CDS Q0080 17 27666 27812 W 2000-05-19 2000-05-19 -S000007268 ORF Verified Q0085 ATP6 F1F0 ATP synthase subunit a|PHO1|OLI4|OLI2 chromosome 17 L000004932|L000001300|L000002722|L000001418|L000001299 17 28487 29266 W 2000-05-19 2000-05-19 Subunit a of the F0 sector of mitochondrial F1F0 ATP synthase; mitochondrially encoded; translation is specifically activated by Atp22p; ATP6 and ATP8 mRNAs are not translated in the absence of the F1 sector of ATPase; mutations in human ortholog MT-ATP6 are associated with neurodegenerative disorders such as Neurogenic Ataxia and Retinitis Pigmentosa (NARP), Leigh syndrome (LS), Charcot-Marie-Tooth (CMT), and ataxia telangiectasia -S000029982 CDS Q0085 17 28487 29266 W 2000-05-19 2000-05-19 -S000029673 origin_of_replication ORI7 ORI7 chromosome 17 L000001314 17 30220 30594 W 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007269 ORF Dubious Q0092 ORF5 chromosome 17 L000004933 17 30874 31014 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030082 CDS Q0092 17 30874 31014 W 2000-05-19 2000-05-19 -S000029668 origin_of_replication ORI2 ORI2 chromosome 17 L000001309 17 32231 32501 W 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007318 tRNA_gene tE(UUC)Q chromosome 17 L000004893 17 35373 35444 W 2000-05-19 2000-05-19 Mitochondrial glutamate tRNA (tRNA-Glu); predicted by tRNAscan-SE analysis -S000036036 noncoding_exon tE(UUC)Q 17 35373 35444 W 2000-05-19 2000-05-19 -S000007271 ORF Verified Q0110 BI2 cytochrome b mRNA maturase bI2 chromosome 17 L000004935|L000004888 17 36540 38579 W 2000-05-19 2000-05-19 Mitochondrial mRNA maturase with a role in splicing; encoded by both exon and intron sequences of partially processed COB mRNA -S000031214 CDS Q0110 17 36540 36954 W 2000-05-19 2000-05-19 -S000031215 CDS Q0110 17 37723 38579 W 2000-05-19 2000-05-19 -S000031216 intron Q0110 17 36955 37722 W 2000-05-19 2000-05-19 -S000007272 ORF Verified Q0115 BI3 cytochrome b mRNA maturase bI3 chromosome 17 L000004936|L000000176 17 36540 40265 W 2000-05-19 2000-05-19 Mitochondrial mRNA maturase; forms a complex with Mrs1p to mediate splicing of the bI3 intron of the COB gene; encoded by both exon and intron sequences of partially processed COB mRNA -S000031224 CDS Q0115 17 36540 36954 W 2000-05-19 2000-05-19 -S000031225 CDS Q0115 17 37723 37736 W 2000-05-19 2000-05-19 -S000031226 CDS Q0115 17 39141 40265 W 2000-05-19 2000-05-19 -S000031227 intron Q0115 17 36955 37722 W 2000-05-19 2000-05-19 -S000031228 intron Q0115 17 37737 39140 W 2000-05-19 2000-05-19 -S000007273 ORF Verified Q0120 BI4 intron-encoded RNA maturase bI4 chromosome 17 L000000177|L000004937 17 36540 42251 W 2000-05-19 2000-05-19 Mitochondrial mRNA maturase; forms a complex with Nam2p to mediate splicing of the bI4 intron of the COB gene; encoded by both exon and intron sequences of partially processed COB mRNA -S000032184 CDS Q0120 17 36540 36954 W 2000-05-19 2000-05-19 -S000032185 CDS Q0120 17 37723 37736 W 2000-05-19 2000-05-19 -S000032186 CDS Q0120 17 39141 39217 W 2000-05-19 2000-05-19 -S000032187 CDS Q0120 17 40841 42251 W 2000-05-19 2000-05-19 -S000032188 intron Q0120 17 36955 37722 W 2000-05-19 2000-05-19 -S000032189 intron Q0120 17 37737 39140 W 2000-05-19 2000-05-19 -S000032190 intron Q0120 17 39218 40840 W 2000-05-19 2000-05-19 -S000007270 ORF Verified Q0105 COB cytochrome b|CYTB|COB1 chromosome 17 L000004934|L000000376 17 36540 43647 W 2000-05-19 2000-05-19 Cytochrome b; mitochondrially encoded subunit of the ubiquinol-cytochrome c reductase complex which includes Cobp, Rip1p, Cyt1p, Cor1p, Qcr2p, Qcr6p, Qcr7p, Qcr8p, Qcr9p, and Qcr10p -S000031165 CDS Q0105 17 36540 36954 W 2000-05-19 2000-05-19 -S000031166 CDS Q0105 17 37723 37736 W 2000-05-19 2000-05-19 -S000031167 CDS Q0105 17 39141 39217 W 2000-05-19 2000-05-19 -S000031168 CDS Q0105 17 40841 41090 W 2000-05-19 2000-05-19 -S000031169 CDS Q0105 17 42508 42558 W 2000-05-19 2000-05-19 -S000031170 CDS Q0105 17 43297 43647 W 2000-05-19 2000-05-19 -S000031171 intron Q0105 17 36955 37722 W 2000-05-19 2000-05-19 -S000031172 intron Q0105 17 37737 39140 W 2000-05-19 2000-05-19 -S000031173 intron Q0105 17 39218 40840 W 2000-05-19 2000-05-19 -S000031174 intron Q0105 17 41091 42507 W 2000-05-19 2000-05-19 -S000031175 intron Q0105 17 42559 43296 W 2000-05-19 2000-05-19 -S000029672 origin_of_replication ORI6 ORI6 chromosome 17 L000001313 17 45227 47927 W 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007274 ORF Verified Q0130 OLI1 F0 ATP synthase subunit c|OLI3|ATP9 chromosome 17 L000004938|L000001298|L000002724 17 46723 46953 W 2000-05-19 2000-05-19 F0-ATP synthase subunit c (ATPase-associated proteolipid); encoded on the mitochondrial genome; mutation confers oligomycin resistance; expression is specifically dependent on the nuclear genes AEP1 and AEP2 -S000032266 CDS Q0130 17 46723 46953 W 2000-05-19 2000-05-19 -S000007333 tRNA_gene tS(UGA)Q2 chromosome 17 L000004908 17 48201 48290 W 2000-05-19 2000-05-19 Mitochondrial serine tRNA (tRNA-Ser); predicted by tRNAscan-SE analysis -S000031361 noncoding_exon tS(UGA)Q2 17 48201 48290 W 2000-05-19 2000-05-19 -S000007275 ORF Verified Q0140 VAR1 mitochondrial 37S ribosomal protein VAR1|VARI chromosome 17 L000004939|L000002456|L000002455 17 48901 50097 W 2000-05-19 2000-05-19 Mitochondrial ribosomal protein of the small subunit; mitochondrially-encoded; polymorphic in different strains due to variation in number of AAT (asparagine) codons; translated near the mitochondrial inner membrane; may have a role in loss of mitochondrial DNA under stress conditions -S000032355 CDS Q0140 17 48901 50097 W 2000-05-19 2000-05-19 -S000007276 ORF Dubious Q0142 ORF9 chromosome 17 L000004940 17 51052 51228 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious open reading frame Q0143 -S000032370 CDS Q0142 17 51052 51228 W 2000-05-19 2000-05-19 -S000007277 ORF Dubious Q0143 ORF10 chromosome 17 L000004941 17 51277 51429 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032373 CDS Q0143 17 51277 51429 W 2000-05-19 2000-05-19 -S000007278 ORF Dubious Q0144 chromosome 17 L000004942 17 54109 54438 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032378 CDS Q0144 17 54109 54438 W 2000-05-19 2000-05-19 -S000029669 origin_of_replication ORI3 ORI3 chromosome 17 L000001310 17 54840 54567 C 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000029670 origin_of_replication ORI4 ORI4 chromosome 17 L000001311 17 56832 56567 C 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007288 rRNA_gene Q0158 21S_RRNA 21S_rRNA_4|21S_rRNA_3 chromosome 17 L000004883 17 58009 62447 W 2000-05-19 2000-05-19 Mitochondrial 21S rRNA; intron encodes the I-SceI DNA endonuclease -S000034078 intron Q0158 17 60725 61867 W 2000-05-19 2000-05-19 -S000034076 noncoding_exon Q0158 17 58009 60724 W 2000-05-19 2000-05-19 -S000034077 noncoding_exon Q0158 17 61868 62447 W 2000-05-19 2000-05-19 -S000007279 ORF Verified Q0160 SCEI intron-encoded endonuclease I-SceI|I-SceIV|OMEGA chromosome 17 L000004889|L000001858 17 61022 61729 W 2000-05-19 2000-05-19 I-SceI DNA endonuclease; encoded by the mitochondrial group I intron of the 21S_rRNA gene; mediates gene conversion that propagates the intron into intron-less copies of the 21S_rRNA gene -S000033285 CDS Q0160 17 61022 61729 W 2000-05-19 2000-05-19 -S000007334 tRNA_gene tT(UGU)Q1 chromosome 17 L000004909 17 63862 63937 W 2000-05-19 2000-05-19 Mitochondrial threonine tRNA (tRNA-Thr); predicted by tRNAscan-SE analysis -S000033404 noncoding_exon tT(UGU)Q1 17 63862 63937 W 2000-05-19 2000-05-19 -S000007316 tRNA_gene tC(GCA)Q chromosome 17 L000004891 17 64415 64490 W 2000-05-19 2000-05-19 Mitochondrial cysteine tRNA (tRNA-Cys) -S000035255 noncoding_exon tC(GCA)Q 17 64415 64490 W 2000-05-19 2000-05-19 -S000007321 tRNA_gene tH(GUG)Q chromosome 17 L000004896 17 64596 64670 W 2000-05-19 2000-05-19 Mitochondrial histidine tRNA (tRNA-His); predicted by tRNAscan-SE analysis -S000033926 noncoding_exon tH(GUG)Q 17 64596 64670 W 2000-05-19 2000-05-19 -S000007280 ORF Dubious Q0182 ORF11 chromosome 17 L000004944 17 65770 66174 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034264 CDS Q0182 17 65770 66174 W 2000-05-19 2000-05-19 -S000007324 tRNA_gene tL(UAA)Q chromosome 17 L000004899 17 66095 66179 W 2000-05-19 2000-05-19 Mitochondrial leucine tRNA (tRNA-Leu); predicted by tRNAscan-SE analysis; required for mitochondrial translation and indirectly for maintenance of the mitochondrial genome; mutations in the orthologous human gene cause the neurological disease MELAS -S000037434 noncoding_exon tL(UAA)Q 17 66095 66179 W 2000-05-19 2000-05-19 -S000007329 tRNA_gene tQ(UUG)Q chromosome 17 L000004904 17 66210 66285 W 2000-05-19 2000-05-19 Mitochondrial glutamine tRNA (tRNA-Gln); predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000032591 noncoding_exon tQ(UUG)Q 17 66210 66285 W 2000-05-19 2000-05-19 -S000007323 tRNA_gene tK(UUU)Q chromosome 17 L000004898 17 67061 67134 W 2000-05-19 2000-05-19 Mitochondrial lysine tRNA (tRNA-Lys); predicted by tRNAscan-SE analysis; modification of wobble base U34 is decreased at elevated temperatures, decreasing ability to decode AAG codons; this function is performed at high temperature by imported cytoplasmic tRNA-Lys with CUU anticodon -S000034232 noncoding_exon tK(UUU)Q 17 67061 67134 W 2000-05-19 2000-05-19 -S000007331 tRNA_gene tR(UCU)Q1 chromosome 17 L000004906 17 67309 67381 W 2000-05-19 2000-05-19 Mitochondrial arginine tRNA (tRNA-Arg); predicted by tRNAscan-SE analysis -S000032809 noncoding_exon tR(UCU)Q1 17 67309 67381 W 2000-05-19 2000-05-19 -S000007320 tRNA_gene tG(UCC)Q chromosome 17 L000004895 17 67468 67542 W 2000-05-19 2000-05-19 Mitochondrial glycine tRNA (tRNA-Gly); predicted by tRNAscan-SE analysis -S000037571 noncoding_exon tG(UCC)Q 17 67468 67542 W 2000-05-19 2000-05-19 -S000007317 tRNA_gene tD(GUC)Q chromosome 17 L000004892 17 68322 68396 W 2000-05-19 2000-05-19 Mitochondrial aspartate tRNA (tRNA-Asp); predicted by tRNAscan-SE analysis -S000030428 noncoding_exon tD(GUC)Q 17 68322 68396 W 2000-05-19 2000-05-19 -S000007332 tRNA_gene tS(GCU)Q1 chromosome 17 L000004907 17 69203 69288 W 2000-05-19 2000-05-19 Mitochondrial serine tRNA (tRNA-Ser); predicted by tRNAscan-SE analysis -S000030614 noncoding_exon tS(GCU)Q1 17 69203 69288 W 2000-05-19 2000-05-19 -S000007330 tRNA_gene tR(ACG)Q2 chromosome 17 L000004905 17 69289 69362 W 2000-05-19 2000-05-19 Mitochondrial arginine tRNA (tRNA-Arg); predicted by tRNAscan-SE analysis -S000034929 noncoding_exon tR(ACG)Q2 17 69289 69362 W 2000-05-19 2000-05-19 -S000007315 tRNA_gene tA(UGC)Q chromosome 17 L000004890 17 69846 69921 W 2000-05-19 2000-05-19 Mitochondrial alanine tRNA (tRNA-Ala); predicted by tRNAscan-SE analysis -S000034925 noncoding_exon tA(UGC)Q 17 69846 69921 W 2000-05-19 2000-05-19 -S000007322 tRNA_gene tI(GAU)Q chromosome 17 L000004897 17 70162 70237 W 2000-05-19 2000-05-19 Mitochondrial isoleucine tRNA (tRNA-Ile); predicted by tRNAscan-SE analysis; mutations in human ortholog are linked to conditions such as progressive encephalopathy, metabolic syndrome, and hypomagnesaemia -S000036091 noncoding_exon tI(GAU)Q 17 70162 70237 W 2000-05-19 2000-05-19 -S000007338 tRNA_gene tY(GUA)Q chromosome 17 L000004913 17 70824 70907 W 2000-05-19 2000-05-19 Mitochondrial tyrosine tRNA (tRNA-Tyr) -S000034742 noncoding_exon tY(GUA)Q 17 70824 70907 W 2000-05-19 2000-05-19 -S000007327 tRNA_gene tN(GUU)Q chromosome 17 L000004902 17 71433 71503 W 2000-05-19 2000-05-19 Mitochondrial asparagine tRNA (tRNA-Asn); predicted by tRNAscan-SE analysis -S000030750 noncoding_exon tN(GUU)Q 17 71433 71503 W 2000-05-19 2000-05-19 -S000007325 tRNA_gene tM(CAU)Q1 chromosome 17 L000004900 17 72630 72705 W 2000-05-19 2000-05-19 Mitochondrial methionine tRNA (tRNA-Met); predicted by tRNAscan-SE analysis -S000032341 noncoding_exon tM(CAU)Q1 17 72630 72705 W 2000-05-19 2000-05-19 -S000007281 ORF Verified Q0250 COX2 cytochrome c oxidase subunit 2|OXII|OXI1 chromosome 17 L000004945|L000000384|L000001322|L000003004 17 73758 74513 W 2000-05-19 2000-05-19 Subunit II of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; one of three mitochondrially-encoded subunits -S000036455 CDS Q0250 17 73758 74513 W 2000-05-19 2000-05-19 -S000007282 ORF Uncharacterized Q0255 maturase-like protein|RF1|ORF1 chromosome 17 L000004946 17 74495 75984 W 2000-05-19 2000-05-19 Maturase-like protein -S000036463 CDS Q0255 17 74495 75622 W 2000-05-19 2000-05-19 -S000036464 CDS Q0255 17 75663 75872 W 2000-05-19 2000-05-19 -S000036465 CDS Q0255 17 75904 75984 W 2000-05-19 2000-05-19 -S000036466 intron Q0255 17 75623 75662 W 2000-05-19 2000-05-19 -S000036467 intron Q0255 17 75873 75903 W 2000-05-19 2000-05-19 -S000007319 tRNA_gene tF(GAA)Q chromosome 17 L000004894 17 77431 77505 W 2000-05-19 2000-05-19 Mitochondrial phenylalanine tRNA (tRNA-Phe); predicted by tRNAscan-SE analysis -S000035453 noncoding_exon tF(GAA)Q 17 77431 77505 W 2000-05-19 2000-05-19 -S000007335 tRNA_gene tT(UAG)Q2 tT(XXX)Q2 chromosome 17 L000004910 17 78162 78089 C 2000-05-19 2000-05-19 Mitochondrial threonine tRNA (tRNA-Thr); decodes CUA codons as threonine rather than leucine; has an unusual enlarged 8-nt anticodon loop; may be evolutionarily derived from mitochondrial tRNA-His; conserved in some genera of budding yeasts -S000032409 noncoding_exon tT(UAG)Q2 17 78162 78089 C 2000-05-19 2000-05-19 -S000007336 tRNA_gene tV(UAC)Q chromosome 17 L000004911 17 78533 78608 W 2000-05-19 2000-05-19 Mitochondrial valine tRNA (tRNA-Val); predicted by tRNAscan-SE analysis -S000036325 noncoding_exon tV(UAC)Q 17 78533 78608 W 2000-05-19 2000-05-19 -S000007283 ORF Verified Q0275 COX3 cytochrome c oxidase subunit 3|OXI2 chromosome 17 L000004947|L000000385|L000001320 17 79213 80022 W 2000-05-19 2000-05-19 Subunit III of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; one of three mitochondrially-encoded subunits -S000036648 CDS Q0275 17 79213 80022 W 2000-05-19 2000-05-19 -S000029671 origin_of_replication ORI5 ORI5 chromosome 17 L000001312 17 82329 82600 W 2014-11-18 2014-11-18 Mitochondrial origin of replication -S000007326 tRNA_gene tM(CAU)Q2 chromosome 17 L000004901 17 85035 85112 W 2000-05-19 2000-05-19 Mitochondrial formylated methionine tRNA (tRNA-fMet); predicted by tRNAscan-SE analysis -S000032348 noncoding_exon tM(CAU)Q2 17 85035 85112 W 2000-05-19 2000-05-19 -S000029023 ncRNA_gene Q0285 RPM1 chromosome 17 L000004810 17 85295 85777 W 2003-12-02 2003-12-02 RNA component of mitochondrial RNase P; mitochondrial RNase P also contains the protein subunit Rpm2p; RNase P removes 5' extensions from mitochondrial tRNA precursors; RPM1 is conserved in bacteria, fungi, and protozoa -S000035976 noncoding_exon Q0285 17 85295 85777 W 2003-12-02 2003-12-02 -S000007284 ORF Dubious Q0297 ORF12 chromosome 17 L000004948 17 85554 85709 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene RPM1 -S000037483 CDS Q0297 17 85554 85709 W 2000-05-19 2000-05-19 -S000029683 gene_group MAL3 MAL3 chromosome 2 L000001002 2 144 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL33 trans-acting MAL-activator, MAL31 maltose permease, and MAL32 maltase -S000178039 ARS ARS200 chromosome 2 2 40 202 2014-11-18 2014-11-18 Autonomously replicating sequence -S000028599 ORF Dubious YBL113W-A chromosome 2 2 646 1128 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031383 CDS YBL113W-A 2 646 1128 W 2003-07-29 2003-07-29 -S000002153 ORF Uncharacterized YBL113C chromosome 2 2 2658 280 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element -S000036166 CDS YBL113C 2 2658 280 C 1996-07-31 1996-07-31 -S000002152 ORF Uncharacterized YBL112C chromosome 2 2 2899 2582 C 1996-07-31 1996-07-31 Putative protein of unknown function; YBL112C is contained within TEL02L -S000035974 CDS YBL112C 2 2899 2582 C 1996-07-31 1996-07-31 -S000002151 ORF Verified YBL111C chromosome 2 2 5009 2907 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element; relocalizes from mitochondrion to cytoplasm upon DNA replication stress -S000035858 CDS YBL111C 2 4116 2907 C 1996-07-31 1996-07-31 -S000035857 CDS YBL111C 2 5009 4216 C 1996-07-31 1996-07-31 -S000035859 intron YBL111C 2 4215 4117 C 1996-07-31 1996-07-31 -S000002150 ORF Dubious YBL109W chromosome 2 2 5790 6125 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034042 CDS YBL109W 2 5790 6125 W 1996-07-31 1996-07-31 -S000178040 ARS ARS201 chromosome 2 2 6498 6620 2014-11-18 2014-11-18 Autonomously replicating sequence -S000028867 telomere TEL02L chromosome 2 2 6608 1 C -80 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome II; annotated components include an X element core sequence, X element combinatorial repeats, and a short Y' element; TEL02L does have telomeric repeats (TEL02L-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly -S000028868 X_element TEL02L 2 6608 6139 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome II; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028869 X_element_combinatorial_repeat TEL02L 2 6138 5849 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr II; contains repeats of the D, C, B and A types, Tbf1p binding sites, and ORF YBL109W; formerly called SubTelomeric Repeats -S000028870 Y_prime_element TEL02L 2 5848 1 C 2003-09-09 2003-09-09 Telomeric short Y' element on the left arm of Chromosome II; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs (YBL111C, YBL112C, YBL113C, YBL113W-A) -S000007592 ORF Verified YBL108C-A PAU9 seripauperin PAU9 chromosome 2 2 7733 7605 C 2001-02-26 2001-02-26 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000037104 CDS YBL108C-A 2 7733 7605 C 2001-02-26 2001-02-26 -S000000204 ORF Dubious YBL108W chromosome 2 2 8177 8482 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033883 CDS YBL108W 2 8177 8482 W 1996-07-31 1996-07-31 -S000006798 long_terminal_repeat YBLWdelta1 chromosome 2 2 8848 9092 W 2000-05-19 2000-05-19 Ty1 LTR -S000006799 long_terminal_repeat YBLWdelta2 chromosome 2 2 9093 9424 W 2000-05-19 2000-05-19 Ty2 LTR -S000007229 ORF Dubious YBL107W-A chromosome 2 2 9268 9372 W 1999-07-17 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the Ty2 LTR YBLWdelta2; YBL107W-A has a paralog, YER138W-A, that arose from a single-locus duplication -S000036010 CDS YBL107W-A 2 9268 9372 W 1999-07-17 1999-07-17 -S000006800 long_terminal_repeat YBLWdelta3 chromosome 2 2 9425 9518 W 2000-05-19 2000-05-19 Ty1 LTR -S000006647 tRNA_gene tL(UAA)B1 chromosome 2 L000003738 2 9583 9666 W 2000-05-19 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000035755 noncoding_exon tL(UAA)B1 2 9583 9666 W 2000-05-19 2000-05-19 -S000000203 ORF Verified YBL107C MIX23 MIC23 chromosome 2 2 10551 9961 C 1996-07-31 1996-07-31 Mitochondrial intermembrane space protein of unknown function; imported via the MIA import machinery; contains an unusual twin cysteine motif (CX13C CX14C) -S000033751 CDS YBL107C 2 10551 9961 C 1996-07-31 1996-07-31 -S000000202 ORF Verified YBL106C SRO77 putative Rab GTPase-binding protein SRO77|SNI2|SOP2 chromosome 2 L000004194 2 13879 10847 C 1996-07-31 1996-07-31|2011-02-03 Protein with roles in exocytosis and cation homeostasis; functions in docking and fusion of post-Golgi vesicles with plasma membrane; regulates cell proliferation and colony development via the Rho1-Tor1 pathway; interacts with SNARE protein Sec9p; homolog of Drosophila lethal giant larvae tumor suppressor; SRO77 has a paralog, SRO7, that arose from the whole genome duplication -S000033072 CDS YBL106C 2 13879 10847 C 1996-07-31 1996-07-31|2011-02-03 -S000000201 ORF Verified YBL105C PKC1 protein kinase C|CLY7|CLY5|STT1|HPO2|CLY15 chromosome 2 L000001446|L000000362|S000029091 2 17696 14241 C -79 1996-07-31 1996-07-31|2011-02-03 Protein serine/threonine kinase; essential for cell wall remodeling during growth; localized to sites of polarized growth and the mother-daughter bud neck; homolog of the alpha, beta, and gamma isoforms of mammalian protein kinase C (PKC) -S000032980 CDS YBL105C 2 17696 14241 C 1996-07-31 1996-07-31|2011-02-03 -S000000200 ORF Verified YBL104C SEA4 YBL103C-A chromosome 2 2 21293 18177 C 2004-01-26 2004-01-26|1996-07-31 Subunit of SEACAT, a subcomplex of the SEA complex; Sea4p, along with Rtc1p and Mtc5p, redundantly inhibit the TORC1 inhibitory role of the Iml1p/SEACIT (Iml1p-Npr2p-Npr3p) subcomplex, a GAP for GTPase Gtr1p (EGOC subunit) in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; contains an N-terminal beta-propeller fold and a C-terminal RING motif -S000032891 CDS YBL104C 2 21293 18177 C 2004-01-26 2004-01-26|1996-07-31 -S000000199 ORF Verified YBL103C RTG3 chromosome 2 L000003152 2 23536 22076 C 2011-02-03 1997-07-27|1997-01-28 bHLH/Zip transcription factor for retrograde (RTG) and TOR pathways; forms a complex with another bHLH/Zip protein, Rtg1p, to activate the pathways; target of Hog1p -S000032786 CDS YBL103C 2 23536 22076 C 2011-02-03 1997-07-27|1997-01-28 -S000000198 ORF Verified YBL102W SFT2 chromosome 2 L000002950 2 24098 24745 W 2004-01-26 1997-01-28 Tetra-spanning membrane protein found mostly in the late Golgi; non-essential; can suppress some sed5 alleles; may be part of the transport machinery, but precise function is unknown; similar to mammalian syntaxin 5 -S000032738 CDS YBL102W 2 24098 24745 W 2004-01-26 1997-01-28 -S000000197 ORF Verified YBL101C ECM21 ART2 chromosome 2 L000003896 2 28299 24946 C 2004-01-26 1998-09-13|1997-01-28 Protein involved in regulating endocytosis of plasma membrane proteins; identified as a substrate for ubiquitination by Rsp5p and deubiquitination by Ubp2p; promoter contains several Gcn4p binding elements; ECM21 has a paralog, CSR2, that arose from the whole genome duplication -S000031747 CDS YBL101C 2 28299 24946 C 2004-01-26 1998-09-13|1997-01-28 -S000028598 ORF Uncharacterized YBL100W-C YBL101W-C chromosome 2 2 28427 28546 W 2004-01-26 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031381 CDS YBL100W-C 2 28427 28546 W 2004-01-26 2003-07-29 -S000118996 ARS ARS230 ARSII-29|ARS201.5 chromosome 2 2 28942 29160 2011-02-03 2006-10-02 Autonomously Replicating Sequence -S000006801 long_terminal_repeat YBLWdelta4 chromosome 2 2 29644 29975 W 2011-02-03 2000-05-19 Ty2 LTR -S000006809 LTR_retrotransposon YBLWTy2-1 Ty2 chromosome 2 2 29644 35602 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000002148 transposable_element_gene YBL100W-A gag protein|TY2A_B|YBL101W-A chromosome 2 2 29935 31251 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000032385 CDS YBL100W-A 2 29935 31251 W 2011-02-03 1997-01-28 -S000002149 transposable_element_gene YBL100W-B gag-pol fusion protein|TY2B_B|YBL101W-B chromosome 2 2 29935 35248 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032404 CDS YBL100W-B 2 29935 31227 W 2011-02-03 1997-01-28 -S000032405 CDS YBL100W-B 2 31229 35248 W 2011-02-03 1997-01-28 -S000032406 plus_1_translational_frameshift YBL100W-B 2 31228 31228 W 2011-02-03 1997-01-28 -S000006802 long_terminal_repeat YBLWdelta5 chromosome 2 2 35271 35602 W 2011-02-03 2000-05-19 Ty2 LTR -S000006803 long_terminal_repeat YBLWdelta6 chromosome 2 2 35604 35796 W 2011-02-03 2000-05-19 Ty1 LTR -S000006807 long_terminal_repeat YBLCtau1 YBLWtau1 chromosome 2 2 36221 35851 C 2011-02-03 2000-05-19|2007-04-05 Ty4 LTR -S000006562 tRNA_gene tF(GAA)B chromosome 2 L000003739 2 36398 36488 W 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035371 intron tF(GAA)B 2 36435 36452 W 2011-02-03 2000-05-19 -S000035369 noncoding_exon tF(GAA)B 2 36398 36434 W 2011-02-03 2000-05-19 -S000035370 noncoding_exon tF(GAA)B 2 36453 36488 W 2011-02-03 2000-05-19 -S000000195 ORF Verified YBL099W ATP1 F1F0 ATP synthase subunit alpha chromosome 2 L000000141 2 37053 38690 W 2011-02-03 1997-01-28|2011-02-03 Alpha subunit of the F1 sector of mitochondrial F1F0 ATP synthase; which is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated; N-terminally propionylated in vivo -S000034558 CDS YBL099W 2 37053 38690 W 2011-02-03 1997-01-28|2011-02-03 -S000000196 ORF Dubious YBL100C chromosome 2 2 37303 36989 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the 5' end of ATP1 -S000031662 CDS YBL100C 2 37303 36989 C 2011-02-03 1997-01-28 -S000000194 ORF Verified YBL098W BNA4 kynurenine 3-monooxygenase chromosome 2 2 39145 40527 W 2011-02-03 1997-01-28 Kynurenine 3-monooxygenase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p; putative therapeutic target for Huntington disease -S000034424 CDS YBL098W 2 39145 40527 W 2011-02-03 1997-01-28 -S000000193 ORF Verified YBL097W BRN1 condensin subunit BRN1 chromosome 2 L000004324 2 40831 43095 W 2011-02-03 2004-01-29|1997-01-28|2011-02-03 Subunit of the condensin complex; required for chromosome condensation and for clustering of tRNA genes at the nucleolus; may influence multiple aspects of chromosome transmission -S000034364 CDS YBL097W 2 40831 43095 W 2011-02-03 2004-01-29|1997-01-28|2011-02-03 -S000000191 ORF Uncharacterized YBL095W MRX3 chromosome 2 2 43277 44089 W 2011-02-03 1997-01-28 Protein that associates with mitochondrial ribosome; likely functions in cristae junction formation; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033361 CDS YBL095W 2 43277 44089 W 2011-02-03 1997-01-28 -S000000192 ORF Dubious YBL096C chromosome 2 2 43482 43174 C 2011-02-03 1997-01-28 Non-essential protein of unknown function -S000033392 CDS YBL096C 2 43482 43174 C 2011-02-03 1997-01-28 -S000000190 ORF Dubious YBL094C chromosome 2 2 44097 43765 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YBL095W -S000033262 CDS YBL094C 2 44097 43765 C 2011-02-03 1997-01-28 -S000000189 ORF Verified YBL093C ROX3 SSX2|MED19|SSN7|NUT3 chromosome 2 L000001662|S000029515|L000002098 2 44918 44256 C 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme -S000032413 CDS YBL093C 2 44918 44256 C 2011-02-03 1997-01-28 -S000000188 ORF Verified YBL092W RPL32 eL32|ribosomal 60S subunit protein L32|L32e|L32 chromosome 2 L000004464 2 45978 46370 W 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L32; overexpression disrupts telomeric silencing; homologous to mammalian ribosomal protein L32, no bacterial homolog -S000032377 CDS YBL092W 2 45978 46370 W 2011-02-03 1997-01-28 -S000122091 five_prime_UTR_intron YBL092W 2 45645 45977 W 2011-02-03 2007-04-04 -S000007228 ORF Verified YBL091C-A SCS22 phospholipid metabolism-regulating protein SCS22 chromosome 2 2 47180 46565 C 2011-02-03 2004-01-07|1999-07-17 Protein involved in regulation of phospholipid metabolism; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect the ER and plasma membrane (PM); regulates PM PI4P levels by controlling access of the Sac1p phosphatase to its substrate, PI4P; human VAP homolog; similar to D. melanogaster inturned protein; SWAT-GFP and mCherry fusion proteins localize to the cytosol; SCS22 has a paralog, SCS2, that arose from the whole genome duplication -S000037851 CDS YBL091C-A 2 47058 46565 C 2011-02-03 2004-01-07|1999-07-17 -S000037850 CDS YBL091C-A 2 47180 47147 C 2011-02-03 2004-01-07 -S000037852 intron YBL091C-A 2 47146 47059 C 2011-02-03 2004-01-07 -S000000187 ORF Verified YBL091C MAP2 methionine aminopeptidase chromosome 2 L000003044 2 48628 47363 C 2011-02-03 1997-07-27|1997-01-28|2011-02-03 Methionine aminopeptidase; catalyzes the cotranslational removal of N-terminal methionine from nascent polypeptides; function is partially redundant with that of Map1p -S000032224 CDS YBL091C 2 48628 47363 C 2011-02-03 1997-07-27|1997-01-28|2011-02-03 -S000000186 ORF Verified YBL090W MRP21 mitochondrial 37S ribosomal protein MRP21|MRP50 chromosome 2 L000003275 2 48825 49358 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit; MRP21 exhibits genetic interactions with mutations in the COX2 and COX3 mRNA 5'-untranslated leader sequences -S000032193 CDS YBL090W 2 48825 49358 W 2011-02-03 1997-01-28 -S000000185 ORF Verified YBL089W AVT5 amino acid transporter chromosome 2 2 49574 50953 W 2011-02-03 2003-09-22|1997-01-28 Putative transporter; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters; AVT5 has a paralog, AVT6, that arose from the whole genome duplication -S000031223 CDS YBL089W 2 49574 50953 W 2011-02-03 2003-09-22|1997-01-28 -S000000184 ORF Verified YBL088C TEL1 DNA-binding protein kinase TEL1 chromosome 2 L000002281 2 59382 51019 C -60 2011-02-03 1997-01-28|2011-02-03 Protein kinase primarily involved in telomere length regulation; contributes to cell cycle checkpoint control in response to DNA damage; acts with Red1p and Mec1p to promote interhomolog recombination by phosphorylation of Hop1; functionally redundant with Mec1p; regulates P-body formation induced by replication stress; homolog of human ataxia-telangiectasia mutated (ATM) gene -S000030193 CDS YBL088C 2 59382 51019 C 2011-02-03 1997-01-28|2011-02-03 -S000000183 ORF Verified YBL087C RPL23A uL14|ribosomal 60S subunit protein L23A|L14|YL32|L23A|L17aA chromosome 2 L000001716 2 60739 59822 C 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L23A; homologous to mammalian ribosomal protein L23 and bacterial L14; RPL23A has a paralog, RPL23B, that arose from the whole genome duplication -S000030032 CDS YBL087C 2 60193 59822 C 2011-02-03 1997-01-28 -S000030031 CDS YBL087C 2 60739 60698 C 2011-02-03 1997-01-28 -S000030033 intron YBL087C 2 60697 60194 C 2011-02-03 1997-01-28 -S000000182 ORF Uncharacterized YBL086C chromosome 2 2 62602 61202 C 2011-02-03 1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery -S000029917 CDS YBL086C 2 62602 61202 C 2011-02-03 1997-01-28 -S000118344 ARS ARS202 ARSII-63 chromosome 2 2 63259 63381 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000000181 ORF Verified YBL085W BOI1 BOB1|GIN7 chromosome 2 L000000191|L000000703 2 63876 66818 W 2011-02-03 1997-01-28 Protein implicated in polar growth; functionally redundant with Boi2p; interacts with bud-emergence protein Bem1p; contains an SH3 (src homology 3) domain and a PH (pleckstrin homology) domain; relocalizes from bud neck to cytoplasm upon DNA replication stress; BOI1 has a paralog, BOI2, that arose from the whole genome duplication -S000029876 CDS YBL085W 2 63876 66818 W 2011-02-03 1997-01-28 -S000000180 ORF Verified YBL084C CDC27 anaphase promoting complex subunit CDC27|SNB1|APC3 chromosome 2 L000000266 2 69445 67169 C -58 2011-02-03 1997-01-28|2011-02-03 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition -S000037167 CDS YBL084C 2 69445 67169 C 2011-02-03 1997-01-28|2011-02-03 -S000000179 ORF Dubious YBL083C chromosome 2 2 70138 69713 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps verified ORF ALG3 -S000037052 CDS YBL083C 2 70138 69713 C 2011-02-03 1997-01-28 -S000000178 ORF Verified YBL082C ALG3 dolichyl-P-Man:Man(5)GlcNAc(2)-PP-dolichol alpha-1,3-mannosyltransferase|RHK1 chromosome 2 L000002668 2 71127 69751 C 2011-02-03 1997-01-28 Dolichol-P-Man dependent alpha(1-3) mannosyltransferase; involved in synthesis of dolichol-linked oligosaccharide donor for N-linked glycosylation of proteins; G353A missense mutation in human ortholog ALG3 implicated in carbohydrate deficient glycoprotein syndrome type IV, which is characterized by microcephaly, severe epilepsy, minimal psychomotor development, partial deficiency of sialic acids in serum glycoproteins; wild-type human ALG3 can complement yeast alg3 mutant -S000036997 CDS YBL082C 2 71127 69751 C 2011-02-03 1997-01-28 -S000000177 ORF Uncharacterized YBL081W chromosome 2 2 71866 72972 W 2011-02-03 1997-01-28 Non-essential protein of unknown function; null mutation results in a decrease in plasma membrane electron transport -S000036378 CDS YBL081W 2 71866 72972 W 2011-02-03 1997-01-28 -S000000176 ORF Verified YBL080C PET112 glutamyl-tRNA(Gln) amidotransferase subunit PET112 chromosome 2 L000001394 2 74695 73070 C 2011-02-03 1997-01-28|2011-02-03 Subunit of the trimeric GatFAB AmidoTransferase(AdT) complex; involved in the formation of Q-tRNAQ; mutation is functionally complemented by the bacterial GatB ortholog -S000036223 CDS YBL080C 2 74695 73070 C 2011-02-03 1997-01-28|2011-02-03 -S000000175 ORF Verified YBL079W NUP170 NLE3 chromosome 2 L000001256|L000003140 2 75259 79767 W 2011-02-03 1997-01-28 Subunit of inner ring of nuclear pore complex (NPC); contributes to NPC assembly and nucleocytoplasmic transport; interacts with genomic regions that contain ribosomal protein and subtelomeric genes, where it functions in nucleosome positioning and as a repressor of transcription; both Nup170p and NUP157p are similar to human Nup155p; NUP170 has a paralog, NUP157, that arose from the whole genome duplication -S000034905 CDS YBL079W 2 75259 79767 W 2011-02-03 1997-01-28 -S000000174 ORF Verified YBL078C ATG8 ubiquitin-like protein ATG8|AUT7|CVT5|APG8 chromosome 2 L000004607|L000004604 2 80731 80378 C 2011-02-03 1997-01-28 Component of autophagosomes and Cvt vesicles; regulator of Atg1p, targets it to autophagosomes; binds the Atg1p-Atg13p complex, triggering its vacuolar degradation; unique ubiquitin-like protein whose conjugation target is lipid phosphatidylethanolamine (PE); Atg8p-PE is anchored to membranes, is involved in phagophore expansion, and may mediate membrane fusion during autophagosome formation; deconjugation of Atg8p-PE is required for efficient autophagosome biogenesis -S000033940 CDS YBL078C 2 80731 80378 C 2011-02-03 1997-01-28 -S000000173 ORF Dubious YBL077W chromosome 2 2 80897 81328 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene ILS1/YBL076C -S000033872 CDS YBL077W 2 80897 81328 W 2011-02-03 1997-01-28 -S000000172 ORF Verified YBL076C ILS1 isoleucine--tRNA ligase ILS1 chromosome 2 L000000856 2 84261 81043 C -43 2011-02-03 1997-01-28 Cytoplasmic isoleucine-tRNA synthetase; target of the G1-specific inhibitor reveromycin A -S000033054 CDS YBL076C 2 84261 81043 C 2011-02-03 1997-01-28 -S000000171 ORF Verified YBL075C SSA3 Hsp70 family ATPase SSA3|YG106 chromosome 2 L000002071|L000000820 2 86448 84499 C 2011-02-03 1997-01-28 ATPase involved in protein folding and the response to stress; plays a role in SRP-dependent cotranslational protein-membrane targeting and translocation; member of the heat shock protein 70 (HSP70) family; localized to the cytoplasm; SSA3 has a paralog, SSA4, that arose from the whole genome duplication -S000032985 CDS YBL075C 2 86448 84499 C 2011-02-03 1997-01-28 -S000000169 ORF Dubious YBL073W chromosome 2 2 87646 87957 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential gene AAR2/YBL074C -S000032838 CDS YBL073W 2 87646 87957 W 2011-02-03 1997-01-28 -S000000170 ORF Verified YBL074C AAR2 U5 snRNP complex subunit AAR2 chromosome 2 L000000008 2 87789 86722 C 2011-02-03 1997-01-28 Component of the U5 snRNP complex; required for splicing of U3 precursors; originally described as a splicing factor specifically required for splicing pre-mRNA of the MATa1 cistron -S000032869 CDS YBL074C 2 87789 86722 C 2011-02-03 1997-01-28 -S000006447 snoRNA_gene snR56 SNR56 chromosome 2 L000004525 2 88190 88277 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position G1428 -S000030761 noncoding_exon snR56 2 88190 88277 W 2011-02-03 2000-05-19 -S000000168 ORF Verified YBL072C RPS8A eS8|ribosomal 40S subunit protein S8A|S8e|rp19|YS9|S8A|S14A chromosome 2 L000001752|L000001753 2 89125 88523 C 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S8, no bacterial homolog; RPS8A has a paralog, RPS8B, that arose from the whole genome duplication -S000031871 CDS YBL072C 2 89125 88523 C 2011-02-03 1997-01-28 -S000122090 five_prime_UTR_intron YBL072C 2 89440 89133 C 2011-02-03 2007-04-04|2011-02-03 -S000028597 ORF Uncharacterized YBL071C-B chromosome 2 2 89556 89458 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031379 CDS YBL071C-B 2 89556 89458 C 2011-02-03 2003-07-29 -S000007587 ORF Verified YBL071W-A KTI11 DPH3 chromosome 2 2 89978 90226 W 2011-02-03 2001-01-30 Zn-ribbon protein that co-purifies with Dph1 and Dph2; in a complex required for synthesis of diphthamide on translation factor eEF2 and with Elongator subunits Iki3p, Elp2p, and Elp3p; involved in modification of wobble nucleosides in tRNAs; forms a stable heterodimer with Ats1p -S000037098 CDS YBL071W-A 2 89978 90226 W 2011-02-03 2001-01-30 -S000000167 ORF Uncharacterized YBL071C chromosome 2 2 90531 90223 C 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YBL071C is not an essential gene -S000031723 CDS YBL071C 2 90531 90223 C 2011-02-03 1997-01-28 -S000000165 ORF Verified YBL069W AST1 chromosome 2 L000000133 2 90741 92030 W 2011-02-03 2001-05-29|1997-01-28 Lipid raft associated protein; interacts with the plasma membrane ATPase Pma1p and has a role in its targeting to the plasma membrane by influencing its incorporation into lipid rafts; sometimes classified in the medium-chain dehydrogenase/reductases (MDRs) superfamily; AST1 has a paralog, AST2, that arose from the whole genome duplication -S000031495 CDS YBL069W 2 90741 92030 W 2011-02-03 2001-05-29|1997-01-28 -S000000166 ORF Dubious YBL070C chromosome 2 2 90925 90605 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031635 CDS YBL070C 2 90925 90605 C 2011-02-03 1997-01-28 -S000028530 ORF Dubious YBL068W-A chromosome 2 2 91794 92030 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by fungal homology and RT-PCR -S000031139 CDS YBL068W-A 2 91794 92030 W 2011-02-03 2003-07-29 -S000000164 ORF Verified YBL068W PRS4 ribose phosphate diphosphokinase subunit PRS4 chromosome 2 L000001513 2 92414 93394 W 2011-02-03 2003-09-22|1997-01-28|2011-02-03 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase, synthesizes PRPP; which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes; PRS4 has a paralog, PRS2, that arose from the whole genome duplication; a missense mutation in the conserved residue R196 of its human homolog PRPS1 is pathogenic -S000031367 CDS YBL068W 2 92414 93394 W 2011-02-03 2003-09-22|1997-01-28|2011-02-03 -S000178041 ARS ARS203 chromosome 2 2 93435 93519 2014-11-18 2014-11-18 Autonomously replicating sequence -S000000163 ORF Verified YBL067C UBP13 ubiquitin-specific protease UBP13 chromosome 2 L000003172 2 95882 93639 C 2011-02-03 2004-07-16|1997-01-28|1999-04-26|2011-02-03 Ubiquitin-specific protease that cleaves Ub-protein fusions; UBP13 has a paralog, UBP9, that arose from the whole genome duplication -S000030367 CDS YBL067C 2 95882 93639 C 2011-02-03 2004-07-16|1997-01-28|1999-04-26|2011-02-03 -S000000161 ORF Dubious YBL065W chromosome 2 2 99963 100307 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF SEF1/YBL066C; YBL065W is a non-essential gene -S000037539 CDS YBL065W 2 99963 100307 W 2011-02-03 1997-01-28 -S000000162 ORF Verified YBL066C SEF1 chromosome 2 L000003318 2 100115 96669 C 2011-02-03 2004-07-16|1999-04-26|1997-01-28 Putative transcription factor; has homolog in Kluyveromyces lactis -S000030204 CDS YBL066C 2 100115 96669 C 2011-02-03 2004-07-16|1997-01-28|1999-04-26 -S000000160 ORF Verified YBL064C PRX1 thioredoxin peroxidase PRX1 chromosome 2 2 101156 100371 C 2011-02-03 1997-01-28 Mitochondrial peroxiredoxin with thioredoxin peroxidase activity; has a role in reduction of hydroperoxides; reactivation requires Trr2p and glutathione; induced during respiratory growth and oxidative stress; phosphorylated; protein abundance increases in response to DNA replication stress -S000037361 CDS YBL064C 2 101156 100371 C 2011-02-03 1997-01-28 -S000000159 ORF Verified YBL063W KIP1 CIN9 chromosome 2 L000000907 2 101886 105221 W 2011-02-03 1997-01-28 Kinesin-related motor protein; required for mitotic spindle assembly, chromosome segregation, and 2 micron plasmid partitioning; functionally redundant with Cin8p for chromosomal but not plasmid functions -S000037298 CDS YBL063W 2 101886 105221 W 2011-02-03 1997-01-28 -S000000158 ORF Dubious YBL062W chromosome 2 2 105308 105688 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036607 CDS YBL062W 2 105308 105688 W 2011-02-03 1997-01-28 -S000000157 ORF Verified YBL061C SKT5 CSD4|CHS4|CAL2 chromosome 2 L000001911|L000000332 2 107406 105316 C 2011-02-03 1997-01-28 Activator of Chs3p (chitin synthase III) during vegetative growth; recruits Chs3p to the bud neck via interaction with Bni4p; SKT5 has a paralog, SHC1, that arose from the whole genome duplication -S000036460 CDS YBL061C 2 107406 105316 C 2011-02-03 1997-01-28 -S000000156 ORF Verified YBL060W YEL1 Arf family guanine nucleotide exchange factor YEL1 chromosome 2 2 107932 109995 W 2011-02-03 1997-01-28 Guanine nucleotide exchange factor specific for Arf3p; localized to the bud neck and tip; required for localization of Arf3p to the bud neck and tip -S000036446 CDS YBL060W 2 107932 109995 W 2011-02-03 1997-01-28 -S000007488 ORF Verified YBL059C-A CMC2 chromosome 2 2 110539 110125 C 2011-02-03 2000-12-01 Protein involved in respiratory chain complex assembly or maintenance; protein of the mitochondrial intermembrane space; contains twin Cx9C motifs that can form coiled coil-helix-coiled-coil helix fold -S000032274 CDS YBL059C-A 2 110420 110125 C 2011-02-03 2000-12-01 -S000032273 CDS YBL059C-A 2 110539 110506 C 2011-02-03 2000-12-01 -S000032275 intron YBL059C-A 2 110505 110421 C 2011-02-03 2000-12-01 -S000000155 ORF Uncharacterized YBL059W chromosome 2 2 110594 111244 W 2011-02-03 1997-01-28 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YBL059W has a paralog, YER093C-A, that arose from the whole genome duplication -S000035392 CDS YBL059W 2 110594 110879 W 2011-02-03 1997-01-28 -S000035393 CDS YBL059W 2 110949 111244 W 2011-02-03 1997-01-28 -S000035394 intron YBL059W 2 110880 110948 W 2011-02-03 1997-01-28 -S000000154 ORF Verified YBL058W SHP1 protein phosphatase regulator SHP1|UBX1 chromosome 2 L000002746 2 111437 112708 W 2011-02-03 1997-01-28 UBX domain-containing substrate adaptor for Cdc48p; ubiquitin regulatory X domain-containing protein that acts as a substrate recruiting cofactor for Cdc48p; positively regulates Glc7p PPase activity to promote growth and mitotic progression in complex with Cdc48p; ubiquitinated protein interactor involved in ER-associated degradation (ERAD); regulated by nuclear Ub-dependent degradation (INMAD pathway) independent of the Asi and Doa10 complexes; homolog of human p47 (NSFL1C) -S000034369 CDS YBL058W 2 111437 112708 W 2011-02-03 1997-01-28 -S000000153 ORF Verified YBL057C PTH2 aminoacyl-tRNA hydrolase chromosome 2 2 113427 112801 C 2011-02-03 1997-01-28|2011-02-03 One of two mitochondrially-localized peptidyl-tRNA hydrolases; negatively regulates the ubiquitin-proteasome pathway via interactions with ubiquitin-like ubiquitin-associated proteins; dispensable for cell growth; see also PTH1 -S000034185 CDS YBL057C 2 113427 112801 C 2011-02-03 1997-01-28|2011-02-03 -S000000152 ORF Verified YBL056W PTC3 type 2C protein phosphatase PTC3 chromosome 2 L000003426 2 113762 115168 W 2011-02-03 1997-01-28|2011-02-03 Type 2C protein phosphatase (PP2C); dephosphorylates Hog1p (see also Ptc2p) to limit maximal kinase activity induced by osmotic stress; dephosphorylates T169 phosphorylated Cdc28p (see also Ptc2p); role in DNA damage checkpoint inactivation; PTC3 has a paralog, PTC2, that arose from the whole genome duplication -S000034127 CDS YBL056W 2 113762 115168 W 2011-02-03 1997-01-28|2011-02-03 -S000000151 ORF Verified YBL055C 3'-5'-exodeoxyribonuclease|Tat-D chromosome 2 2 116829 115573 C 2011-02-03 1997-01-28 3'-->5' exonuclease and endonuclease with a possible role in apoptosis; has similarity to mammalian and C. elegans apoptotic nucleases -S000033245 CDS YBL055C 2 116829 115573 C 2011-02-03 1997-01-28 -S000000150 ORF Verified YBL054W TOD6 PBF1 chromosome 2 2 117589 119166 W 2011-02-03 1997-01-28 PAC motif binding protein involved in rRNA and ribosome biogenesis; subunit of the RPD3L histone deacetylase complex; Myb-like HTH transcription factor; hypophosphorylated by rapamycin treatment in a Sch9p-dependent manner; activated in stochastic pulses of nuclear localization -S000033217 CDS YBL054W 2 117589 119166 W 2011-02-03 1997-01-28 -S000000149 ORF Dubious YBL053W chromosome 2 2 119335 119709 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033156 CDS YBL053W 2 119335 119709 W 2011-02-03 1997-01-28 -S000000148 ORF Verified YBL052C SAS3 KAT6 chromosome 2 L000003280 2 121874 119379 C 2011-02-03 1997-01-28 Histone acetyltransferase catalytic subunit of NuA3 complex; acetylates histone H3, involved in transcriptional silencing; homolog of the mammalian MOZ proto-oncogene; mutant has aneuploidy tolerance; sas3gcn5 double mutation is lethal -S000032250 CDS YBL052C 2 121874 119379 C 2011-02-03 1997-01-28 -S000000147 ORF Verified YBL051C PIN4 MDT1 chromosome 2 2 124759 122753 C 2011-02-03 1997-01-28 Protein involved in G2/M phase progression and response to DNA damage; interacts with Rad53p; contains an RNA recognition motif, a nuclear localization signal, and several SQ/TQ cluster domains; hyperphosphorylated in response to DNA damage -S000032171 CDS YBL051C 2 124759 122753 C 2011-02-03 1997-01-28 -S000000146 ORF Verified YBL050W SEC17 RNS3 chromosome 2 L000001841 2 125125 126119 W 2011-02-03 1997-01-28 Alpha-SNAP cochaperone; SNARE-complex adaptor for Sec18 (NSF) during the disassembly of postfusion cis-SNARE complexes; stimulates the ATPase activity of Sec18p; peripheral membrane protein required for vesicular transport between ER and Golgi, the 'priming' step in homotypic vacuole fusion, and autophagy; similar to mammalian alpha-SNAP -S000032144 CDS YBL050W 2 125125 125154 W 2011-02-03 1997-01-28 -S000032145 CDS YBL050W 2 125271 126119 W 2011-02-03 1997-01-28 -S000032146 intron YBL050W 2 125155 125270 W 2011-02-03 1997-01-28 -S000000145 ORF Verified YBL049W MOH1 chromosome 2 2 126828 127244 W 2011-02-03 1997-01-28 Protein of unknown function, essential for stationary phase survival; not required for growth on nonfermentable carbon sources; possibly linked with vacuolar transport -S000031247 CDS YBL049W 2 126828 127244 W 2011-02-03 1997-01-28 -S000000144 ORF Dubious YBL048W RRT1 chromosome 2 2 127299 127610 W 2011-02-03 1997-01-28 Protein of unknown function; identified in a screen for mutants with increased levels of rDNA transcription; dubious open reading frame unlikely to encode a protein, based on experimental and comparative sequence data -S000031090 CDS YBL048W 2 127299 127610 W 2011-02-03 1997-01-28 -S000000143 ORF Verified YBL047C EDE1 BUD15 chromosome 2 2 132040 127895 C 2011-02-03 1997-01-28 Scaffold protein involved in the formation of early endocytic sites; putative regulator of cytokinesis; homo-oligomerization is required for localization to and organization of endocytic sites; has a network of interactions with other endocytic proteins; binds membranes in a ubiquitin-dependent manner; may also bind ubiquitinated membrane-associated proteins; interacts with Cmk2 and functions upstream of CMK2 in regulating non-apoptotic cell death; homolog of mammalian Eps15 -S000030056 CDS YBL047C 2 132040 127895 C 2011-02-03 1997-01-28 -S000000142 ORF Verified YBL046W PSY4 HSM6 chromosome 2 2 132424 133749 W 2011-02-03 1997-01-28 Regulatory subunit of protein phosphatase PP4; presence of Psy4p in the PP4 complex (along with catalytic subunit Pph3p and Psy2p) is required for dephosphorylation of the histone variant H2AX, but not for dephosphorylation of Rad53p, during recovery from the DNA damage checkpoint; localization is cell-cycle dependent and regulated by Cdc28p phosphorylation; required for cisplatin resistance; homolog of mammalian R2 -S000030008 CDS YBL046W 2 132424 133749 W 2011-02-03 1997-01-28 -S000000141 ORF Verified YBL045C COR1 ubiquinol--cytochrome-c reductase subunit COR1|QCR1 chromosome 2 L000000381 2 135516 134143 C 2011-02-03 1997-01-28 Core subunit of the ubiquinol-cytochrome c reductase complex; the ubiquinol-cytochrome c reductase complex (bc1 complex) is a component of the mitochondrial inner membrane electron transport chain -S000037896 CDS YBL045C 2 135516 134143 C 2011-02-03 1997-01-28 -S000000140 ORF Uncharacterized YBL044W chromosome 2 2 135998 136366 W 2011-02-03 1997-01-28 Putative protein of unknown function; YBL044W is not an essential protein -S000037855 CDS YBL044W 2 135998 136366 W 2011-02-03 1997-01-28 -S000000139 ORF Verified YBL043W ECM13 chromosome 2 L000003888 2 136688 137461 W 2011-02-03 1997-01-28 Non-essential protein of unknown function; induced by treatment with 8-methoxypsoralen and UVA irradiation; ECM13 has a paralog, YJR115W, that arose from the whole genome duplication -S000037081 CDS YBL043W 2 136688 137461 W 2011-02-03 1997-01-28 -S000000138 ORF Verified YBL042C FUI1 uridine permease chromosome 2 L000004437 2 140260 138341 C 2011-02-03 1997-01-28 High affinity uridine permease, localizes to the plasma membrane; also mediates low but significant transport of the cytotoxic nucleoside analog 5-fluorouridine; not involved in uracil transport; relative distribution to the vacuole increases upon DNA replication stress -S000036981 CDS YBL042C 2 140260 138341 C 2011-02-03 1997-01-28 -S000000137 ORF Verified YBL041W PRE7 proteasome core particle subunit beta 6|PRS3 chromosome 2 L000002699 2 141247 141972 W 2011-02-03 1997-01-28 Beta 6 subunit of the 20S proteasome -S000036959 CDS YBL041W 2 141247 141972 W 2011-02-03 1997-01-28 -S000000136 ORF Verified YBL040C ERD2 chromosome 2 L000000567 2 142868 142112 C 2011-02-03 1997-01-28 HDEL receptor; an integral membrane protein that binds to the HDEL motif in proteins destined for retention in the endoplasmic reticulum; has a role in maintenance of normal levels of ER-resident proteins -S000036161 CDS YBL040C 2 142749 142112 C 2011-02-03 1997-01-28 -S000036160 CDS YBL040C 2 142868 142847 C 2011-02-03 1997-01-28 -S000036162 intron YBL040C 2 142846 142750 C 2011-02-03 1997-01-28 -S000028517 ORF Uncharacterized YBL039W-B YBL039W-A chromosome 2 2 143393 143572 W 2011-02-03 2003-07-29 Putative protein of unknown function; mCherry fusion protein localizes to the vacuole -S000030292 CDS YBL039W-B 2 143393 143572 W 2011-02-03 2003-07-29 -S000178042 ARS ARS206 chromosome 2 2 143658 143745 2014-11-18 2014-11-18 Autonomously replicating sequence -S000028814 ORF Dubious YBL039C-A chromosome 2 2 145031 144948 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF URA7; identified by expression profiling and mass spectrometry -S000033616 CDS YBL039C-A 2 145031 144948 C 2011-02-03 2003-07-29 -S000000135 ORF Verified YBL039C URA7 CTP synthase URA7 chromosome 2 L000002436 2 145728 143989 C 2011-02-03 1997-01-28 Major CTP synthase isozyme (see also URA8); catalyzes the ATP-dependent transfer of the amide nitrogen from glutamine to UTP, forming CTP, the final step in de novo biosynthesis of pyrimidines; involved in phospholipid biosynthesis; capable of forming cytoplasmic filaments termed cytoophidium, especially during conditions of glucose depletion; URA7 has a paralog, URA8, that arose from the whole genome duplication -S000035182 CDS YBL039C 2 145728 143989 C 2011-02-03 1997-01-28 -S000000134 ORF Verified YBL038W MRPL16 RML16|mitochondrial 54S ribosomal protein YmL47|YmL47 chromosome 2 L000001165 2 146187 146885 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; homologous to bacterial L16 ribosomal protein; synthetic lethality with hac1 mutation suggests a possible role in synthesis of precursors for protein glycosylation -S000035077 CDS YBL038W 2 146187 146885 W 2011-02-03 1997-01-28 -S000000133 ORF Verified YBL037W APL3 chromosome 2 L000003322 2 147209 150286 W 2011-02-03 1997-01-28 Alpha-adaptin; large subunit of the clathrin associated protein complex (AP-2); involved in vesicle mediated transport -S000034928 CDS YBL037W 2 147209 150286 W 2011-02-03 1997-01-28 -S000000132 ORF Verified YBL036C chromosome 2 2 151220 150447 C 2011-02-03 1997-01-28 Putative non-specific single-domain racemase; based on structural similarity; binds pyridoxal 5'-phosphate; expression of GFP-fusion protein induced in response to the DNA-damaging agent MMS -S000033968 CDS YBL036C 2 151220 150447 C 2011-02-03 1997-01-28 -S000000131 ORF Verified YBL035C POL12 DNA-directed DNA polymerase alpha subunit POL12 chromosome 2 L000002698 2 153610 151493 C 2011-02-03 1997-01-28 B subunit of DNA polymerase alpha-primase complex; required for initiation of DNA replication during mitotic and premeiotic DNA synthesis; also functions in telomere capping and length regulation -S000033851 CDS YBL035C 2 153610 151493 C 2011-02-03 1997-01-28 -S000000130 ORF Verified YBL034C STU1 chromosome 2 L000002138 2 158389 153848 C 2011-02-03 1997-01-28 Component of the mitotic spindle; binds to interpolar microtubules via its association with beta-tubulin (Tub2p); required for interpolar microtubules to provide an outward force on the spindle poles -S000033728 CDS YBL034C 2 158389 153848 C 2011-02-03 1997-01-28 -S000000129 ORF Verified YBL033C RIB1 GTP cyclohydrolase II chromosome 2 L000001634 2 159693 158656 C 2011-02-03 1999-04-22|1997-01-28 GTP cyclohydrolase II; catalyzes the first step of the riboflavin biosynthesis pathway -S000033070 CDS YBL033C 2 159693 158656 C 2011-02-03 1999-04-22|1997-01-28 -S000000128 ORF Verified YBL032W HEK2 KHD1 chromosome 2 2 160184 161329 W 2011-02-03 1997-01-28 RNA binding protein involved in asymmetric localization of ASH1 mRNA; represses translation of ASH1 mRNA, an effect reversed by Yck1p-dependent phosphoryation; regulates telomere position effect and length; similarity to hnRNP-K -S000033035 CDS YBL032W 2 160184 161329 W 2011-02-03 1997-01-28 -S000000127 ORF Verified YBL031W SHE1 chromosome 2 L000002867 2 161699 162715 W 2011-02-03 1997-01-28 Mitotic spindle protein; interacts with components of the Dam1 (DASH) complex, its effector Sli15p, and microtubule-associated protein Bim1p; also localizes to nuclear microtubules and to the bud neck in a ring-shaped structure; inhibits dynein function -S000032946 CDS YBL031W 2 161699 162715 W 2011-02-03 1997-01-28 -S000000126 ORF Verified YBL030C PET9 ADP/ATP carrier protein PET9|OP1|ANC2|AAC2 chromosome 2 L000000004|L000001386|L000004346 2 163997 163041 C -20 2011-02-03 1997-01-28 Major ADP/ATP carrier of the mitochondrial inner membrane; exchanges cytosolic ADP for mitochondrially synthesized ATP; also imports heme and ATP; required for viability in many lab strains that carry a sal1 mutation; PET9 has a paralog, AAC3, that arose from the whole genome duplication; human homolog SLC25A4 implicated in progressive external ophthalmoplegia can complement yeast null mutant -S000032782 CDS YBL030C 2 163997 163041 C 2011-02-03 1997-01-28 -S000007591 ORF Verified YBL029C-A chromosome 2 S000029022 2 164772 164488 C 2011-02-03 2001-02-26 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery; protein abundance increases in response to DNA replication stress; has potential orthologs in Saccharomyces species and in Yarrowia lipolytica -S000037103 CDS YBL029C-A 2 164772 164488 C 2011-02-03 2001-02-26 -S000000125 ORF Uncharacterized YBL029W chromosome 2 2 166134 167264 W 2011-02-03 1997-01-28 Non-essential protein of unknown function -S000032107 CDS YBL029W 2 166134 167264 W 2011-02-03 1997-01-28 -S000000124 ORF Verified YBL028C chromosome 2 2 167838 167518 C 2011-02-03 1997-01-28 Protein of unknown function that may interact with ribosomes; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; predicted to be involved in ribosome biogenesis -S000031894 CDS YBL028C 2 167838 167518 C 2011-02-03 1997-01-28 -S000000123 ORF Verified YBL027W RPL19B eL19|ribosomal 60S subunit protein L19B|L19e|rpl5L|YL14|L23B|L19B chromosome 2 L000001719|L000001718 2 168423 169376 W 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L19B; rpl19a and rpl19b single null mutations result in slow growth, while the double null mutation is lethal; homologous to mammalian ribosomal protein L19, no bacterial homolog; RPL19B has a paralog, RPL19A, that arose from the whole genome duplication -S000031846 CDS YBL027W 2 168423 168424 W 2011-02-03 1997-01-28 -S000031847 CDS YBL027W 2 168809 169376 W 2011-02-03 1997-01-28 -S000031848 intron YBL027W 2 168425 168808 W 2011-02-03 1997-01-28 -S000118345 ARS ARS207 ARSII-170 chromosome 2 2 170173 170279 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178043 ARS_consensus_sequence ARS207 2 170223 170207 C 2014-11-18 2014-11-18 -S000000122 ORF Verified YBL026W LSM2 Sm-like protein LSM2|SNP3|SMX5 chromosome 2 L000003168 2 170623 171038 W 2011-02-03 1997-01-28 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000030858 CDS YBL026W 2 170623 170676 W 2011-02-03 1997-01-28 -S000030859 CDS YBL026W 2 170805 171038 W 2011-02-03 1997-01-28 -S000030860 intron YBL026W 2 170677 170804 W 2011-02-03 1997-01-28 -S000000121 ORF Verified YBL025W RRN10 chromosome 2 L000003279 2 171481 171918 W 2011-02-03 1997-01-28 Protein involved in promoting high level transcription of rDNA; subunit of UAF (upstream activation factor) for RNA polymerase I -S000030749 CDS YBL025W 2 171481 171918 W 2011-02-03 1997-01-28 -S000000120 ORF Verified YBL024W NCL1 tRNA (cytosine-C5-)-methyltransferase|TRM4 chromosome 2 2 172534 174588 W 2011-02-03 1997-01-28 S-adenosyl-L-methionine-dependent tRNA: m5C-methyltransferase; methylates cytosine to m5C at several positions in tRNAs and intron-containing pre-tRNAs; increases proportion of tRNALeu(CAA) with m5C at wobble position in response to hydrogen peroxide, causing selective translation of mRNA from genes enriched in TTG codon; loss of NCL1 confers hypersensitivity to oxidative stress; similar to Nop2p and human proliferation associated nucleolar protein p120 -S000030630 CDS YBL024W 2 172534 174588 W 2011-02-03 1997-01-28 -S000000119 ORF Verified YBL023C MCM2 MCM DNA helicase complex subunit MCM2 chromosome 2 L000001038 2 177526 174920 C -31 2011-02-03 1997-01-28 Protein involved in DNA replication; component of the Mcm2-7 hexameric helicase complex that binds chromatin as a part of the pre-replicative complex; relative distribution to the nucleus increases upon DNA replication stress -S000037739 CDS YBL023C 2 177526 174920 C 2011-02-03 1997-01-28 -S000000118 ORF Verified YBL022C PIM1 ATP-dependent Lon protease PIM1|LON1 chromosome 2 L000000949|L000001440 2 181275 177874 C 2011-02-03 1997-01-28 ATP-dependent Lon protease; involved in degradation of misfolded proteins in mitochondria; required for biogenesis and maintenance of mitochondria -S000037690 CDS YBL022C 2 181275 177874 C 2011-02-03 1997-01-28 -S000000117 ORF Verified YBL021C HAP3 chromosome 2 L000000753 2 182094 181660 C 2011-02-03 1997-01-28 Subunit of the Hap2p/3p/4p/5p CCAAT-binding complex; complex is heme-activated and glucose-repressed; complex is a transcriptional activator and global regulator of respiratory gene expression; contains sequences contributing to both complex assembly and DNA binding -S000037614 CDS YBL021C 2 182094 181660 C 2011-02-03 1997-01-28 -S000000116 ORF Verified YBL020W RFT1 glycolipid translocation protein chromosome 2 L000001626 2 182401 184125 W 2011-02-03 1997-01-28 Membrane protein required for translocation of Man5GlcNac2-PP-Dol; required for translocation of Man5GlcNac2-PP-Dol from the cytoplasmic side to the lumenal side of the ER membrane but is not the flippase; mutation is suppressed by expression of human p53 protein; essential gene -S000037598 CDS YBL020W 2 182401 184125 W 2011-02-03 1997-01-28 -S000000115 ORF Verified YBL019W APN2 DNA-(apurinic or apyrimidinic site) lyase APN2|ETH1 chromosome 2 L000004434 2 184353 185915 W 2011-02-03 1997-01-28 Class II abasic (AP) endonuclease involved in repair of DNA damage; homolog of human HAP1 and E. coli exoIII -S000037877 CDS YBL019W 2 184353 185915 W 2011-02-03 1997-01-28 -S000000114 ORF Verified YBL018C POP8 ribonuclease P chromosome 2 L000004304 2 186474 185998 C 2011-02-03 1997-01-28 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; relocalizes to the cytosol in response to hypoxia -S000035953 CDS YBL018C 2 186352 185998 C 2011-02-03 1997-01-28 -S000035952 CDS YBL018C 2 186474 186428 C 2011-02-03 1997-01-28 -S000035954 intron YBL018C 2 186427 186353 C 2011-02-03 1997-01-28 -S000000113 ORF Verified YBL017C PEP1 type I sorting receptor|VPT1|VPS10 chromosome 2 L000001373 2 191583 186844 C -8 2011-02-03 1997-01-28 Type I transmembrane sorting receptor for multiple vacuolar hydrolases; cycles between the late-Golgi and prevacuolar endosome-like compartments -S000035832 CDS YBL017C 2 191583 186844 C 2011-02-03 1997-01-28 -S000000112 ORF Verified YBL016W FUS3 mitogen-activated serine/threonine-protein kinase FUS3|DAC2 chromosome 2 L000000655 2 192451 193512 W -5 2011-02-03 1997-01-28 Mitogen-activated serine/threonine protein kinase involved in mating; phosphoactivated by Ste7p; substrates include Ste12p, Far1p, Bni1p, Sst2p; inhibits invasive growth during mating by phosphorylating Tec1p, promoting its; inhibits recruitment of Ste5p, Cdc42p-mediated asymmetry and mating morphogenesis -S000035775 CDS YBL016W 2 192451 193512 W 2011-02-03 1997-01-28 -S000000111 ORF Verified YBL015W ACH1 acetyl-CoA hydrolase chromosome 2 L000000021 2 194122 195702 W 2011-02-03 1997-01-28 Protein with CoA transferase activity; particularly for CoASH transfer from succinyl-CoA to acetate; has minor acetyl-CoA-hydrolase activity; phosphorylated; required for acetate utilization and for diploid pseudohyphal growth -S000035656 CDS YBL015W 2 194122 195702 W 2011-02-03 1997-01-28 -S000006796 long_terminal_repeat YBLCdelta7 chromosome 2 2 197320 197016 C 2011-02-03 2000-05-19|2007-04-05 Ty1 LTR -S000006600 tRNA_gene tI(AAU)B chromosome 2 L000003740 2 197494 197567 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000030373 noncoding_exon tI(AAU)B 2 197494 197567 W 2011-02-03 2000-05-19 -S000006574 tRNA_gene tG(GCC)B chromosome 2 L000003750 2 197699 197629 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000037887 noncoding_exon tG(GCC)B 2 197699 197629 C 2011-02-03 2000-05-19 -S000006797 long_terminal_repeat YBLWsigma1 YBLCsigma1 chromosome 2 2 197714 198054 W 2011-02-03 2000-05-19 Ty3 LTR -S000118997 ARS ARS231 ARSII-198|ARS207.5 chromosome 2 2 198313 198473 2014-11-18 2014-11-18|2006-10-02 Autonomously Replicating Sequence -S000178044 ARS_consensus_sequence ARS231 2 198385 198369 C 2014-11-18 2014-11-18 -S000000110 ORF Verified YBL014C RRN6 chromosome 2 L000001772 2 201748 199064 C 2011-02-03 1997-01-28|2011-02-03 Component of the core factor (CF) rDNA transcription factor complex; CF is required for transcription of 35S rRNA genes by RNA polymerase I and is composed of Rrn6p, Rrn7p, and Rrn11p -S000034605 CDS YBL014C 2 201748 199064 C 2011-02-03 1997-01-28|2011-02-03 -S000000109 ORF Verified YBL013W FMT1 methionyl-tRNA formyltransferase chromosome 2 2 202056 203261 W 2011-02-03 2004-01-29|1997-01-28 Methionyl-tRNA formyltransferase; catalyzes the formylation of initiator Met-tRNA in mitochondria; potential Cdc28p substrate -S000034585 CDS YBL013W 2 202056 203261 W 2011-02-03 2004-01-29|1997-01-28 -S000000107 ORF Verified YBL011W SCT1 bifunctional glycerol-3-phosphate/glycerone-phosphate O-acyltransferase SCT1|GAT2 chromosome 2 L000001820 2 203538 205817 W 2011-02-03 1997-01-28 Glycerol 3-phosphate/dihydroxyacetone phosphate sn-1 acyltransferase; dual substrate-specific acyltransferase of the glycerolipid biosynthesis pathway; prefers 16-carbon fatty acids; similar to Gpt2p; gene is constitutively transcribed -S000033576 CDS YBL011W 2 203538 205817 W 2011-02-03 1997-01-28 -S000000108 ORF Dubious YBL012C chromosome 2 2 203807 203406 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033578 CDS YBL012C 2 203807 203406 C 2011-02-03 1997-01-28 -S000000106 ORF Uncharacterized YBL010C chromosome 2 2 206949 206107 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein colocalizes with clathrin-coated vesicles -S000033474 CDS YBL010C 2 206949 206107 C 2011-02-03 1997-01-28 -S000000105 ORF Verified YBL009W ALK2 protein kinase ALK2 chromosome 2 2 207194 209224 W 2011-02-03 1997-01-28 Protein kinase; along with its paralog, ALK1, required for proper spindle positioning and nuclear segregation following mitotic arrest, proper organization of cell polarity factors in mitosis, proper localization of formins and polarity factors, and survival in cells that activate spindle assembly checkpoint; phosphorylated in response to DNA damage; ALK2 has a paralog, ALK1, that arose from the whole genome duplication; similar to mammalian haspins -S000033987 CDS YBL009W 2 207194 209224 W 2011-02-03 1997-01-28 -S000028529 ORF Uncharacterized YBL008W-A chromosome 2 2 209409 209648 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000030335 CDS YBL008W-A 2 209409 209648 W 2011-02-03 2003-07-29 -S000000104 ORF Verified YBL008W HIR1 chromosome 2 L000000776 2 209653 212175 W 2011-02-03 1997-01-28|2011-02-03 Subunit of the HIR complex; HIR is a nucleosome assembly complex involved in regulation of histone gene transcription; contributes to nucleosome formation, heterochromatic gene silencing, and formation of functional kinetochores -S000033882 CDS YBL008W 2 209653 212175 W 2011-02-03 1997-01-28|2011-02-03 -S000000103 ORF Verified YBL007C SLA1 cytoskeletal protein-binding protein SLA1 chromosome 2 L000001912 2 216366 212632 C 2011-02-03 1997-01-28 Cytoskeletal protein binding protein; required for assembly of the cortical actin cytoskeleton; interacts with proteins regulating actin dynamics and proteins required for endocytosis; found in the nucleus and cell cortex; has 3 SH3 domains -S000033661 CDS YBL007C 2 216366 212632 C 2011-02-03 1997-01-28 -S000028596 ORF Dubious YBL006W-A chromosome 2 2 216711 216860 W 2011-02-03 2004-01-29|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene LDB7/YBL006C -S000031377 CDS YBL006W-A 2 216711 216860 W 2011-02-03 2004-01-29|2003-07-29 -S000000102 ORF Verified YBL006C LDB7 RSC14 chromosome 2 2 217129 216587 C 2011-02-03 2004-01-29|1997-01-28 Component of the RSC chromatin remodeling complex; interacts with Rsc3p, Rsc30p, Npl6p, and Htl1p to form a module important for a broad range of RSC functions -S000030377 CDS YBL006C 2 217129 216587 C 2011-02-03 2004-01-29|1997-01-28 -S000000101 ORF Verified YBL005W PDR3 drug-responsive transcription factor PDR3|TPE2|AMY2 chromosome 2 L000002985|L000001363 2 217470 220400 W -10 2011-02-03 1997-01-28 Transcriptional activator of the pleiotropic drug resistance network; regulates expression of ATP-binding cassette (ABC) transporters through binding to cis-acting PDRE sites (PDR responsive elements); has a role in response to drugs and organic solvents; post-translationally up-regulated in cells lacking functional mitochondrial genome; involved in diauxic shift; relative distribution to nucleus increases upon DNA replication stress; APCC(Cdh1) substrate -S000030309 CDS YBL005W 2 217470 220400 W 2011-02-03 1997-01-28 -S000006804 long_terminal_repeat YBLWdelta8 chromosome 2 2 220895 221036 W 2011-02-03 2000-05-19 Ty1 LTR -S000006805 long_terminal_repeat YBLWdelta9 chromosome 2 2 221037 221370 W 2011-02-03 2000-05-19 Ty1 LTR -S000006808 LTR_retrotransposon YBLWTy1-1 Ty1 chromosome 2 2 221037 226952 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000002146 transposable_element_gene YBL005W-A gag protein chromosome 2 2 221330 222652 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000032539 CDS YBL005W-A 2 221330 222652 W 2011-02-03 1997-01-28 -S000002147 transposable_element_gene YBL005W-B gag-pol fusion protein chromosome 2 2 221330 226598 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032555 CDS YBL005W-B 2 221330 222634 W 2011-02-03 1997-01-28 -S000032556 CDS YBL005W-B 2 222636 226598 W 2011-02-03 1997-01-28 -S000032557 plus_1_translational_frameshift YBL005W-B 2 222635 222635 W 2011-02-03 1997-01-28 -S000006806 long_terminal_repeat YBLWdelta10 chromosome 2 2 226621 226952 W 2011-02-03 2000-05-19 Ty1 LTR -S000006720 tRNA_gene tS(AGA)B chromosome 2 L000003741 2 227075 227156 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032344 noncoding_exon tS(AGA)B 2 227075 227156 W 2011-02-03 2000-05-19 -S000000100 ORF Verified YBL004W UTP20 chromosome 2 2 227636 235117 W 2011-02-03 2001-05-29|1997-01-28 Component of the small-subunit (SSU) processome; SSU processome is involved in the biogenesis of the 18S rRNA -S000030137 CDS YBL004W 2 227636 235117 W 2011-02-03 2001-05-29|1997-01-28 -S000000099 ORF Verified YBL003C HTA2 histone H2A|H2A2 chromosome 2 L000000749|L000000828 2 235792 235394 C .2 2011-02-03 1997-01-28 Histone H2A; core histone protein required for chromatin assembly and chromosome function; one of two nearly identical (see also HTA1) subtypes; DNA damage-dependent phosphorylation by Mec1p facilitates DNA repair; acetylated by Nat4p -S000029974 CDS YBL003C 2 235792 235394 C 2011-02-03 1997-01-28 -S000000098 ORF Verified YBL002W HTB2 histone H2B chromosome 2 L000000830 2 236492 236887 W .2 2011-02-03 1997-01-28 Histone H2B; core histone protein required for chromatin assembly and chromosome function; nearly identical to HTB1; Rad6p-Bre1p-Lge1p mediated ubiquitination regulates reassembly after DNA replication, transcriptional activation, meiotic DSB formation and H3 methylation -S000037396 CDS YBL002W 2 236492 236887 W 2011-02-03 1997-01-28 -S000000097 ORF Verified YBL001C ECM15 chromosome 2 L000003890 2 237467 237153 C 2011-02-03 1997-01-28 Non-essential protein of unknown function; likely exists as tetramer, may be regulated by the binding of small-molecule ligands (possibly sulfate ions), may have a role in yeast cell-wall biogenesis -S000037284 CDS YBL001C 2 237467 237153 C 2011-02-03 1997-01-28 -S000118346 ARS ARS208 ARSII-238 chromosome 2 2 237787 237900 2014-11-18 2014-11-18|2006-08-30|2011-02-03 Autonomously Replicating Sequence -S000178045 ARS_consensus_sequence ARS208 2 237835 237819 C 2014-11-18 2014-11-18 -S000006464 centromere CEN2 CEN2 chromosome 2 L000000295 2 238207 238323 W 0 2011-02-03 2000-05-19 Chromosome II centromere -S000077260 centromere_DNA_Element_I CEN2 2 238207 238216 W 2011-02-03 2004-10-04 -S000077261 centromere_DNA_Element_II CEN2 2 238217 238298 W 2011-02-03 2004-10-04 -S000077262 centromere_DNA_Element_III CEN2 2 238299 238323 W 2011-02-03 2004-10-04 -S000000205 ORF Verified YBR001C NTH2 alpha,alpha-trehalase NTH2 chromosome 2 L000001281 2 241283 238941 C 2011-02-03 1997-01-28 Putative neutral trehalase, required for thermotolerance; may mediate resistance to other cellular stresses; NTH2 has a paralog, NTH1, that arose from the whole genome duplication -S000034705 CDS YBR001C 2 241283 238941 C 2011-02-03 1997-01-28 -S000000206 ORF Verified YBR002C RER2 ditrans,polycis-polyprenyl diphosphate synthase chromosome 2 L000004874 2 242568 241708 C 2011-02-03 1997-01-28 Forms the dehydrodolichyl diphosphate syntase (DDS) complex with NUS1; major enzyme of polyprenol synthesis in both the endoplasmic reticulum (ER) and in lipid droplets; participates in ER protein sorting; human ortholog DHDDS functionally complements the heat sensitive growth defect of a ts allele, and is associated with retinitis pigmentosa -S000035641 CDS YBR002C 2 242568 241708 C 2011-02-03 1997-01-28 -S000000207 ORF Verified YBR003W COQ1 trans-hexaprenyltranstransferase chromosome 2 L000000378 2 242809 244230 W 2011-02-03 1997-01-28 Hexaprenyl pyrophosphate synthetase; catalyzes the first step in ubiquinone (coenzyme Q) biosynthesis -S000035753 CDS YBR003W 2 242809 244230 W 2011-02-03 1997-01-28 -S000000208 ORF Verified YBR004C GPI18 GPI-anchor transamidase GPI18|FMP44 chromosome 2 2 245667 244366 C 2011-02-03 1997-01-28|2011-02-03 Functional ortholog of human PIG-V; PIG-V is a mannosyltransferase that transfers the second mannose in glycosylphosphatidylinositol biosynthesis; the authentic, non-tagged protein was localized to mitochondria -S000035794 CDS YBR004C 2 245667 244366 C 2011-02-03 1997-01-28|2011-02-03 -S000000209 ORF Verified YBR005W RCR1 SSH6 chromosome 2 2 245906 246547 W 2011-02-03 1997-01-28 Protein of the ER membrane involved in cell wall chitin deposition; may function in the endosomal-vacuolar trafficking pathway, helping determine whether plasma membrane proteins are degraded or routed to the plasma membrane; RCR1 has a paralog, RCR2, that arose from the whole genome duplication -S000035989 CDS YBR005W 2 245906 246547 W 2011-02-03 1997-01-28 -S000000210 ORF Verified YBR006W UGA2 succinate-semialdehyde dehydrogenase (NAD(P)(+))|UGA5 chromosome 2 S000007516 2 247010 248503 W 2011-02-03 1999-04-26|1997-01-28 Succinate semialdehyde dehydrogenase; involved in the utilization of gamma-aminobutyrate (GABA) as a nitrogen source; part of the 4-aminobutyrate and glutamate degradation pathways; localized to the cytoplasm -S000036842 CDS YBR006W 2 247010 248503 W 2011-02-03 1999-04-26|1997-01-28 -S000000211 ORF Verified YBR007C DSF2 chromosome 2 2 251016 248806 C 2011-02-03 1997-01-28|2011-02-03 Deletion suppressor of mpt5 mutation; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000036880 CDS YBR007C 2 251016 248806 C 2011-02-03 1997-01-28|2011-02-03 -S000000212 ORF Verified YBR008C FLR1 chromosome 2 L000003532 2 254209 252563 C 2011-02-03 1997-01-28 Plasma membrane transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; involved in efflux of fluconazole, diazaborine, benomyl, methotrexate, and other drugs; expression induced in cells treated with the mycotoxin patulin; relocalizes from nucleus to plasma membrane upon DNA replication stress -S000036932 CDS YBR008C 2 254209 252563 C 2011-02-03 1997-01-28 -S000114517 ARS ARS209 ARS209 chromosome 2 2 254998 255083 2014-11-18 2014-11-18|2006-03-02|2011-02-03 Autonomously Replicating Sequence; originally referred to as H4 ARS -S000178046 ARS_consensus_sequence ARS209 2 255041 255025 C 2014-11-18 2014-11-18 -S000000213 ORF Verified YBR009C HHF1 histone H4 chromosome 2 L000000770 2 255684 255373 C 2011-02-03 1997-01-28 Histone H4; core histone protein required for chromatin assembly and chromosome function; one of two identical histone proteins (see also HHF2); contributes to telomeric silencing; N-terminal domain involved in maintaining genomic integrity -S000037700 CDS YBR009C 2 255684 255373 C 2011-02-03 1997-01-28 -S000000214 ORF Verified YBR010W HHT1 histone H3|SIN2|BUR5 chromosome 2 L000000772 2 256331 256741 W 2011-02-03 1997-01-28 Histone H3; core histone protein required for chromatin assembly, part of heterochromatin-mediated telomeric and HM silencing; one of two identical histone H3 proteins (see HHT2); regulated by acetylation, methylation, and phosphorylation; H3K14 acetylation plays an important role in the unfolding of strongly positioned nucleosomes during repair of UV damage -S000030575 CDS YBR010W 2 256331 256741 W 2011-02-03 1997-01-28 -S000000215 ORF Verified YBR011C IPP1 inorganic diphosphatase IPP1|PPA1 chromosome 2 L000000872 2 257975 257112 C 2011-02-03 1997-01-28 Cytoplasmic inorganic pyrophosphatase (PPase); homodimer that catalyzes the rapid exchange of oxygens from Pi with water, highly expressed and essential for viability, active-site residues show identity to those from E. coli PPase -S000030655 CDS YBR011C 2 257975 257112 C 2011-02-03 1997-01-28 -S000006810 long_terminal_repeat YBRCdelta11 chromosome 2 2 258976 258670 C 2011-02-03 2000-05-19|2007-04-05 Ty1 LTR -S000000216 ORF Dubious YBR012C chromosome 2 2 259566 259147 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; expression induced by iron-regulated transcriptional activator Aft2p -S000030768 CDS YBR012C 2 259566 259147 C 2011-02-03 1997-01-28 -S000006815 long_terminal_repeat YBRWdelta12 chromosome 2 2 259578 259909 W 2011-02-03 2000-05-19 Ty1 LTR -S000006821 LTR_retrotransposon YBRWTy1-2 Ty1 chromosome 2 2 259578 265494 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000002154 transposable_element_gene YBR012W-A gag protein chromosome 2 2 259869 261191 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000031588 CDS YBR012W-A 2 259869 261191 W 2011-02-03 1997-01-28 -S000002155 transposable_element_gene YBR012W-B gag-pol fusion protein chromosome 2 2 259869 265140 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000031594 CDS YBR012W-B 2 259869 261173 W 2011-02-03 1997-01-28 -S000031595 CDS YBR012W-B 2 261175 265140 W 2011-02-03 1997-01-28 -S000031596 plus_1_translational_frameshift YBR012W-B 2 261174 261174 W 2011-02-03 1997-01-28 -S000006816 long_terminal_repeat YBRWdelta13 chromosome 2 2 265163 265494 W 2011-02-03 2000-05-19 Ty1 LTR -S000000217 ORF Uncharacterized YBR013C chromosome 2 2 265881 265492 C 2011-02-03 1997-01-28 Putative protein of unknown function; haploid deletion mutant exhibits synthetic phenotype with alpha-synuclein; SWAT-GFP fusion protein localizes to the endoplasmic reticulum while mCherry fusion protein localizes to both the endoplasmic reticulum and vacuole -S000030875 CDS YBR013C 2 265881 265492 C 2011-02-03 1997-01-28 -S000006811 long_terminal_repeat YBRCdelta14 chromosome 2 2 266256 266178 C 2007-04-05 2000-05-19|2007-04-05 Ty1 LTR -S000006737 tRNA_gene tT(AGU)B chromosome 2 L000003742 2 266378 266450 W 2004-07-16 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000032147 noncoding_exon tT(AGU)B 2 266378 266450 W 2004-07-16 2000-05-19 -S000000218 ORF Verified YBR014C GRX7 glutathione-disulfide reductase GRX7 chromosome 2 2 267336 266725 C 2004-07-16 1997-01-28 Cis-golgi localized monothiol glutaredoxin; more similar in activity to dithiol than other monothiol glutaredoxins; involved in the oxidative stress response; does not bind metal ions; GRX7 has a paralog, GRX6, that arose from the whole genome duplication -S000031840 CDS YBR014C 2 267336 266725 C 2004-07-16 1997-01-28 -S000000219 ORF Verified YBR015C MNN2 alpha-1,2-mannosyltransferase MNN2|LDB8|CRV4|TTP1 chromosome 2 L000002385 2 269503 267710 C 2004-07-16 1997-01-28 Alpha-1,2-mannosyltransferase; responsible for addition of the first alpha-1,2-linked mannose to form the branches on the mannan backbone of oligosaccharides, localizes to an early Golgi compartment -S000032017 CDS YBR015C 2 269503 267710 C 2004-07-16 1997-01-28 -S000000220 ORF Verified YBR016W chromosome 2 2 270247 270633 W 2004-07-16 1997-01-28 Tail-anchored plasma membrane protein with a conserved CYSTM module; predicted to be palmitoylated; has similarity to hydrophilins, which are involved in the adaptive response to hyperosmotic conditions; YBR016W has a paralog, YDL012C, that arose from the whole genome duplication -S000032998 CDS YBR016W 2 270247 270633 W 2004-07-16 1997-01-28 -S000000221 ORF Verified YBR017C KAP104 chromosome 2 L000003444 2 273703 270947 C 2004-07-16 1997-01-28 Transportin or cytosolic karyopherin beta 2; functions in the rg-nuclear localization signal-mediated nuclear import/reimport of mRNA-binding proteins Nab2p and Hrp1p; regulates asymmetric protein synthesis in daughter cells during mitosis -S000033056 CDS YBR017C 2 273703 270947 C 2004-07-16 1997-01-28 -S000000222 ORF Verified YBR018C GAL7 UDP-glucose:hexose-1-phosphate uridylyltransferase chromosome 2 L000000662 2 275527 274427 C 7 2004-07-16 1997-01-28 Galactose-1-phosphate uridyl transferase; synthesizes glucose-1-phosphate and UDP-galactose from UDP-D-glucose and alpha-D-galactose-1-phosphate in the second step of galactose catabolism; human homolog UGP2 can complement yeast null mutant -S000033134 CDS YBR018C 2 275527 274427 C 2004-07-16 1997-01-28 -S000000223 ORF Verified YBR019C GAL10 bifunctional UDP-glucose 4-epimerase/aldose 1-epimerase chromosome 2 L000000663 2 278352 276253 C 7 2004-07-16 1997-01-28 UDP-glucose-4-epimerase; catalyzes interconversion of UDP-galactose and UDP-D-glucose in galactose metabolism; also catalyzes conversion of alpha-D-glucose or alpha-D-galactose to their beta-anomers; human homolog GALE implicated in galactosemia, can complement yeast null mutant -S000033206 CDS YBR019C 2 278352 276253 C 2004-07-16 1997-01-28 -S000000224 ORF Verified YBR020W GAL1 galactokinase chromosome 2 L000000658 2 279021 280607 W 7 2004-07-16 1997-01-28 Galactokinase; phosphorylates alpha-D-galactose to alpha-D-galactose-1-phosphate in the first step of galactose catabolism; expression regulated by Gal4p; human homolog GALK2 complements yeast null mutant; GAL1 has a paralog, GAL3, that arose from the whole genome duplication -S000034916 CDS YBR020W 2 279021 280607 W 2004-07-16 1997-01-28 -S000000225 ORF Verified YBR021W FUR4 uracil permease chromosome 2 L000000652 2 281443 283344 W 8 2004-07-16 1997-01-28 Plasma membrane localized uracil permease; expression is tightly regulated by uracil levels and environmental cues; conformational alterations induced by unfolding or substrate binding result in Rsp5p-mediated ubiquitination and degradation -S000035064 CDS YBR021W 2 281443 283344 W 2004-07-16 1997-01-28 -S000000226 ORF Verified YBR022W POA1 ADP-ribose 1''-phosphate phosphatase chromosome 2 2 283738 284271 W 2004-07-16 1997-01-28 Phosphatase that is highly specific for ADP-ribose 1''-phosphate; a tRNA splicing metabolite; may have a role in regulation of tRNA splicing -S000035171 CDS YBR022W 2 283738 284271 W 2004-07-16 1997-01-28 -S000000227 ORF Verified YBR023C CHS3 chitin synthase CHS3|KTI2|DIT101|CSD2|CAL1 chromosome 2 L000000331 2 287925 284428 C 9 2004-07-16 1997-01-28 Chitin synthase III; catalyzes the transfer of N-acetylglucosamine (GlcNAc) to chitin; required for synthesis of the majority of cell wall chitin, the chitin ring during bud emergence, and spore wall chitosan; contains overlapping di-leucine and di-acidic signals that mediate, respectively, intracellular trafficking by AP-1 and trafficking to plasma membrane by exomer complex; requires AP-3 complex for its intracellular retention -S000035205 CDS YBR023C 2 287925 284428 C 2004-07-16 1997-01-28 -S000000228 ORF Verified YBR024W SCO2 putative thioredoxin peroxidase SCO2 chromosome 2 L000001816 2 289445 290350 W 2004-07-16 1997-01-28 Protein anchored to mitochondrial inner membrane; may have a redundant function with Sco1p in delivery of copper to cytochrome c oxidase; interacts with Cox2p; SCO2 has a paralog, SCO1, that arose from the whole genome duplication -S000036144 CDS YBR024W 2 289445 290350 W 2004-07-16 1997-01-28 -S000000229 ORF Verified YBR025C OLA1 Obg-like ATPase chromosome 2 2 291865 290681 C 2004-07-16 1997-01-28 P-loop ATPase with similarity to human OLA1 and bacterial YchF; identified as specifically interacting with the proteasome; null mutant displays increased translation rate and increased readthrough of premature stop codons; protein abundance increases in response to hydrogen peroxide and to DNA replication stress -S000036196 CDS YBR025C 2 291865 290681 C 2004-07-16 1997-01-28 -S000000230 ORF Verified YBR026C ETR1 MRF1'|MRF1 chromosome 2 L000002810 2 294019 292877 C 2004-07-16 1997-01-28 2-enoyl thioester reductase; member of the medium chain dehydrogenase/reductase family; localized to mitochondria, where it has a probable role in fatty acid synthesis; human MECR functionally complements the respiratory growth defect of the null mutant -S000031678 CDS YBR026C 2 294019 292877 C 2004-07-16 1997-01-28 -S000000231 ORF Uncharacterized YBR027C chromosome 2 2 294356 294024 C 2004-07-16 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YBR027C is not an essential gene -S000031824 CDS YBR027C 2 294356 294024 C 2004-07-16 1997-01-28 -S000000232 ORF Verified YBR028C YPK3 putative protein kinase YPK3 chromosome 2 2 296002 294425 C 2004-07-16 1997-01-28 AGC kinase; phosphorylated by cAMP-dependent protein kinase (PKA) in a TORC1-dependent manner; directly phosphorylated by TORC1; phosphorylates ribosomal protein Rps6a/b (S6), in a TORC-dependent manner; undergoes autophosphorylation -S000031957 CDS YBR028C 2 296002 294425 C 2004-07-16 1997-01-28 -S000000233 ORF Verified YBR029C CDS1 phosphatidate cytidylyltransferase|CDG1 chromosome 2 L000002673 2 297742 296369 C 2004-07-16 1997-01-28 Phosphatidate cytidylyltransferase (CDP-diglyceride synthetase); an enzyme that catalyzes that conversion of CTP + phosphate into diphosphate + CDP-diaclglyerol, a critical step in the synthesis of all major yeast phospholipids; human homolog CDS1 can complement yeast cds1 null mutant -S000037428 CDS YBR029C 2 297742 296369 C 2004-07-16 1997-01-28 -S000000234 ORF Verified YBR030W RKM3 protein-lysine N-methyltransferase chromosome 2 2 298292 299950 W 2004-07-16 1997-01-28 Ribosomal lysine methyltransferase; specific for monomethylation of Rpl42ap and Rpl42bp (lysine 40); nuclear SET domain containing protein; relocalizes to the cytosol in response to hypoxia -S000037095 CDS YBR030W 2 298292 299950 W 2004-07-16 1997-01-28 -S000000235 ORF Verified YBR031W RPL4A uL4|ribosomal 60S subunit protein L4A|L4|rp2|YL2|L4A|L2A chromosome 2 L000001701 2 300166 301254 W 2004-07-16 1997-01-28 Ribosomal 60S subunit protein L4A; N-terminally acetylated; homologous to mammalian ribosomal protein L4 and bacterial L4; RPL4A has a paralog, RPL4B, that arose from the whole genome duplication -S000037181 CDS YBR031W 2 300166 301254 W 2004-07-16 1997-01-28 -S000000236 ORF Uncharacterized YBR032W chromosome 2 2 301519 301821 W 2004-07-16 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YBR032W is not an essential gene -S000037283 CDS YBR032W 2 301519 301821 W 2004-07-16 1997-01-28 -S000000237 ORF Uncharacterized YBR033W EDS1 chromosome 2 2 301944 304703 W 2004-07-16 1997-01-28 Putative zinc cluster protein, predicted to be a transcription factor; not an essential gene; EDS1 has a paralog, RGT1, that arose from the whole genome duplication -S000037351 CDS YBR033W 2 301944 304703 W 2004-07-16 1997-01-28 -S000000238 ORF Verified YBR034C HMT1 protein-arginine omega-N methyltransferase HMT1|RMT1|ODP1|HCP1 chromosome 2 L000002808|L000001296 2 305976 304930 C 2004-07-16 1997-01-28 Nuclear SAM-dependent mono- and asymmetric methyltransferase; modifies hnRNPs, including Npl3p and Hrp1p, affecting their activity and nuclear export; methylates U1 snRNP protein Snp1p, ribosomal protein Rps2p, and histones H3 and H4; interacts genetically with genes encoding components of Rpd3(L) and this interaction is important for Rpd3 recruitment to the subtelomeric region -S000037372 CDS YBR034C 2 305976 304930 C 2004-07-16 1997-01-28 -S000000239 ORF Verified YBR035C PDX3 pyridoxamine-phosphate oxidase PDX3 chromosome 2 L000001371 2 306955 306269 C 2004-07-16 1997-01-28 Pyridoxine (pyridoxamine) phosphate oxidase; has homologs in E. coli and Myxococcus xanthus; transcription is under the general control of nitrogen metabolism -S000030013 CDS YBR035C 2 306955 306269 C 2004-07-16 1997-01-28 -S000087162 snoRNA_gene snR161 SNR161 chromosome 2 2 307345 307185 C 2005-11-10 2005-11-10 H/ACA small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at positions U632 and U766 -S000087163 noncoding_exon snR161 2 307345 307185 C 2005-11-10 2005-11-10 -S000006657 telomerase_RNA_gene TLC1 TLC1 TER1 chromosome 2 L000002315 2 307587 308887 W 2004-07-16 2000-05-19 RNA template component of telomerase; flexible scaffold that tethers telomerase holoenzyme protein subunits to the complex; contains template sequence that Est2p uses to add irregular repeats of TG(1-3) residues onto a DNA end; promoter regulated by the cell cycle dependent transcriptional activators Swi4p/Swi6p and Mbp1p/Swi6p -S000033066 noncoding_exon TLC1 2 307587 308887 W 2004-07-16 2000-05-19 -S000000240 ORF Verified YBR036C CSG2 mannosylinositol phosphorylceramide synthase regulatory subunit|CLS2 chromosome 2 L000002979|L000000427 2 310313 309081 C 2004-07-16 1997-01-28 Endoplasmic reticulum membrane protein; required for mannosylation of inositolphosphorylceramide and for growth at high calcium concentrations; protein abundance increases in response to DNA replication stress -S000030091 CDS YBR036C 2 310313 309081 C 2004-07-16 1997-01-28 -S000000241 ORF Verified YBR037C SCO1 Cu-binding protein SCO1|PET161 chromosome 2 L000001815 2 311452 310565 C 2011-02-03 1997-01-28 Copper-binding protein of mitochondrial inner membrane; required for cytochrome c oxidase activity and respiration; may function to deliver copper to cytochrome c oxidase; similar to thioredoxins; SCO1 has a paralog, SCO2, that arose from the whole genome duplication -S000030247 CDS YBR037C 2 311452 310565 C 2011-02-03 1997-01-28 -S000000242 ORF Verified YBR038W CHS2 chitin synthase CHS2 chromosome 2 L000000330 2 311898 314789 W 2011-02-03 1997-01-28 Chitin synthase II; catalyzes transfer of N-acetylglucosamine (GlcNAc) to chitin upon activation of zymogenic form; required for chitin synthesis in the primary septum during cytokinesis; localization regulated by Cdk1p during mitosis; phosphorylation by Dbf2p kinase regulates its dynamics and chitin synthesis during cytokinesis -S000033656 CDS YBR038W 2 311898 314789 W 2011-02-03 1997-01-28 -S000000243 ORF Verified YBR039W ATP3 F1F0 ATP synthase subunit gamma chromosome 2 L000000143 2 315575 316510 W 2004-07-16 1997-01-28 Gamma subunit of the F1 sector of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis -S000033784 CDS YBR039W 2 315575 316510 W 2004-07-16 1997-01-28 -S000000244 ORF Verified YBR040W FIG1 chromosome 2 L000003311 2 316968 317864 W 2004-07-16 1997-01-28 Integral membrane protein required for efficient mating; may participate in or regulate the low affinity Ca2+ influx system, which affects intracellular signaling and cell-cell fusion during mating -S000033389 CDS YBR040W 2 316968 317864 W 2004-07-16 1997-01-28 -S000000245 ORF Verified YBR041W FAT1 long-chain fatty acid transporter FAT1 chromosome 2 L000003201 2 318266 320275 W 2004-07-16 2004-01-21|1997-01-28 Very long chain fatty acyl-CoA synthetase and fatty acid transporter; activates imported fatty acids with a preference for very long lengths (C20-C26); has a separate function in the transport of long chain fatty acids -S000033461 CDS YBR041W 2 318266 320275 W 2004-07-16 2004-01-21|1997-01-28 -S000000246 ORF Verified YBR042C CST26 putative acyltransferase|PSI1 chromosome 2 2 321609 320416 C 2004-07-16 1997-01-28 Acyltransferase; enzyme mainly responsible for the introduction of saturated very long chain fatty acids into neo-synthesized molecules of phosphatidylinositol; required for incorporation of stearic acid into phosphatidylinositol; affects chromosome stability when overexpressed; CST26 has a paralog, YDR018C, that arose from the whole genome duplication -S000033482 CDS YBR042C 2 321609 320416 C 2004-07-16 1997-01-28 -S000000247 ORF Verified YBR043C QDR3 AQR2 chromosome 2 2 323945 321876 C 2004-07-16 1997-01-28|2011-02-03 Multidrug transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; has a role in polyamine homeostasis; involved in spore wall asembly; sequence similarity to DTR1 and QDR1, and the triple mutant dtr1 qdr1 qdr3 exhibits reduced dityrosine fluorescence relative to the single mutants; expression is upregulated under polyamine stress; required for resistance to quinidine, barban, cisplatin, and bleomycin -S000033571 CDS YBR043C 2 323945 321876 C 2004-07-16 1997-01-28|2011-02-03 -S000000248 ORF Verified YBR044C TCM62 chromosome 2 2 326059 324341 C 2011-02-03 1997-01-28|2011-02-03 Protein involved in assembly of the succinate dehydrogenase complex; mitochondrial; putative chaperone -S000033606 CDS YBR044C 2 326059 324341 C 2011-02-03 1997-01-28|2011-02-03 -S000118347 ARS ARS211 ARSII-326 chromosome 2 2 326140 326375 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178047 ARS_consensus_sequence ARS211 2 326153 326169 W 2014-11-18 2014-11-18 -S000006769 tRNA_gene tV(UAC)B chromosome 2 L000003749 2 326865 326792 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000036275 noncoding_exon tV(UAC)B 2 326865 326792 C 2011-02-03 2000-05-19 -S000006817 long_terminal_repeat YBRWdelta15 chromosome 2 2 327069 327394 W 2011-02-03 2000-05-19 Ty1 LTR -S000006818 long_terminal_repeat YBRWdelta16 chromosome 2 2 327390 327704 W 2011-02-03 2000-05-19 Ty1 LTR -S000000249 ORF Verified YBR045C GIP1 protein phosphatase regulator GIP1 chromosome 2 L000003092 2 330092 328173 C 2011-02-03 1997-01-28|2011-02-03 Meiosis-specific regulatory subunit of the Glc7p protein phosphatase; regulates spore wall formation and septin organization, required for expression of some late meiotic genes and for normal localization of Glc7p -S000034552 CDS YBR045C 2 330092 328173 C 2011-02-03 1997-01-28|2011-02-03 -S000000250 ORF Verified YBR046C ZTA1 NADPH:quinone reductase chromosome 2 L000004168 2 331511 330507 C 2011-02-03 1997-01-28 NADPH-dependent quinone reductase; GFP-tagged protein localizes to the cytoplasm and nucleus; has similarity to E. coli quinone oxidoreductase and to human zeta-crystallin -S000034640 CDS YBR046C 2 331511 330507 C 2011-02-03 1997-01-28 -S000000251 ORF Uncharacterized YBR047W FMP23 chromosome 2 2 331833 332360 W 2011-02-03 1997-01-28 Putative protein of unknown function; proposed to be involved in iron or copper homeostasis; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000035689 CDS YBR047W 2 331833 332360 W 2011-02-03 1997-01-28 -S000000252 ORF Verified YBR048W RPS11B uS17|ribosomal 40S subunit protein S11B|S17|rp41B|YS12|S18B|S11B chromosome 2 L000001758 2 332831 333812 W 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S11 and bacterial S17; RPS11B has a paralog, RPS11A, that arose from the whole genome duplication -S000035808 CDS YBR048W 2 332831 332875 W 2011-02-03 1997-01-28 -S000035809 CDS YBR048W 2 333387 333812 W 2011-02-03 1997-01-28 -S000035810 intron YBR048W 2 332876 333386 W 2011-02-03 1997-01-28 -S000000253 ORF Verified YBR049C REB1 DNA-binding protein REB1|GRF2 chromosome 2 L000001601 2 336818 334386 C 2011-02-03 1997-01-28 RNA polymerase I enhancer binding protein; DNA binding protein that binds to genes transcribed by both RNA polymerase I and RNA polymerase II; required for termination of RNA polymerase I transcription; Reb1p bound to DNA acts to block RNA polymerase II readthrough transcription -S000035873 CDS YBR049C 2 336818 334386 C 2011-02-03 1997-01-28 -S000000255 ORF Dubious YBR051W chromosome 2 2 337988 338338 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the REG2/YBR050C regulatory subunit of the Glc7p type-1 protein phosphatase -S000036875 CDS YBR051W 2 337988 338338 W 2011-02-03 1997-01-28 -S000000254 ORF Verified YBR050C REG2 protein phosphatase regulator REG2 chromosome 2 L000004126 2 338199 337183 C 2011-02-03 1997-01-28 Regulatory subunit of the Glc7p type-1 protein phosphatase; involved with Reg1p, Glc7p, and Snf1p in regulation of glucose-repressible genes, also involved in glucose-induced proteolysis of maltose permease; REG2 has a paralog, REG1, that arose from the whole genome duplication -S000036783 CDS YBR050C 2 338199 337183 C 2011-02-03 1997-01-28 -S000000256 ORF Verified YBR052C RFS1 flavodoxin-like fold family protein chromosome 2 2 339352 338720 C 2011-02-03 1997-01-28 Protein of unknown function; member of a flavodoxin-like fold protein family that includes Pst2p and Ycp4p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; RFS1 has a paralog, PST2, that arose from the whole genome duplication -S000037575 CDS YBR052C 2 339352 338720 C 2011-02-03 1997-01-28 -S000000257 ORF Uncharacterized YBR053C chromosome 2 2 340751 339675 C 2011-02-03 1997-01-28 Putative protein of unknown function; induced by cell wall perturbation -S000037643 CDS YBR053C 2 340751 339675 C 2011-02-03 1997-01-28 -S000000258 ORF Verified YBR054W YRO2 chromosome 2 L000002548 2 343101 344135 W 2011-02-03 1997-01-28 Protein with a putative role in response to acid stress; null mutant is sensitive to acetic acid; transcription is regulated by Haa1p and induced in the presence of acetic acid; protein observed in plasma membrane foci in the presence of acetic acid; the authentic, non-tagged protein is detected in a phosphorylated state in highly purified mitochondria in high-throughput studies -S000037737 CDS YBR054W 2 343101 344135 W 2011-02-03 1997-01-28 -S000000259 ORF Verified YBR055C PRP6 U4/U6-U5 snRNP complex subunit PRP6|TSM7269|RNA6 chromosome 2 L000001499 2 347301 344602 C 33 2011-02-03 1997-01-28 Splicing factor; component of the U4/U6-U5 snRNP complex -S000037759 CDS YBR055C 2 347301 344602 C 2011-02-03 1997-01-28 -S000006648 tRNA_gene tL(UAA)B2 chromosome 2 L000003743 2 347603 347686 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000035757 noncoding_exon tL(UAA)B2 2 347603 347686 W 2011-02-03 2000-05-19 -S000000260 ORF Verified YBR056W 17-beta-hydroxysteroid dehydrogenase-like protein chromosome 2 2 347879 349384 W 2011-02-03 1997-01-28 Putative glycoside hydrolase of the mitochondrial intermembrane space -S000030661 CDS YBR056W 2 347879 349384 W 2011-02-03 1997-01-28 -S000006819 long_terminal_repeat YBRWdelta17 chromosome 2 2 350459 350751 W 2011-02-03 2000-05-19 Ty1 LTR -S000006691 tRNA_gene tQ(UUG)B chromosome 2 L000003744 2 350827 350898 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000031659 noncoding_exon tQ(UUG)B 2 350827 350898 W 2011-02-03 2000-05-19 -S000028736 ORF Uncharacterized YBR056W-A chromosome 2 2 351255 351455 W 2011-02-03 2003-07-29 Protein of unknown function; mRNA identified as translated by ribosome profiling data; partially overlaps dubious ORF YBR056C-B; YBR056W-A has a paralog, YDR034W-B, that arose from the whole genome duplication -S000033380 CDS YBR056W-A 2 351255 351455 W 2011-02-03 2003-07-29 -S000087087 ORF Dubious YBR056C-B chromosome 2 2 351451 351293 C 2011-02-03 2005-11-08 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the dubious ORF YBR056W-A -S000087088 CDS YBR056C-B 2 351451 351293 C 2011-02-03 2005-11-08 -S000000261 ORF Verified YBR057C MUM2 SPOT8 chromosome 2 L000003595|L000002013 2 353293 352193 C 31 2011-02-03 1997-01-28 Protein essential for meiotic DNA replication and sporulation; cytoplasmic protein; subunit of the MIS complex which controls mRNA methylation during during the induction of sporulation; also interacts with Orc2p, which is a component of the origin recognition complex -S000030712 CDS YBR057C 2 353293 352193 C 2011-02-03 1997-01-28 -S000000262 ORF Verified YBR058C UBP14 ubiquitin-specific protease UBP14|GID6 chromosome 2 L000003173 2 356017 353672 C 2011-02-03 2003-09-22|1997-01-28 Ubiquitin-specific protease; specifically disassembles unanchored ubiquitin chains; involved in fructose-1,6-bisphosphatase (Fbp1p) degradation; similar to human isopeptidase T -S000030826 CDS YBR058C 2 356017 353672 C 2011-02-03 2003-09-22|1997-01-28 -S000007521 ORF Verified YBR058C-A TSC3 chromosome 2 2 356566 356324 C 2011-02-03 2000-06-19 Protein that stimulates the activity of serine palmitoyltransferase; involved in sphingolipid biosynthesis; Lcb1p and Lcb2p are the two components of serine palmitoyltransferase -S000036279 CDS YBR058C-A 2 356566 356324 C 2011-02-03 2000-06-19 -S000000263 ORF Verified YBR059C AKL1 serine/threonine protein kinase AKL1 chromosome 2 S000007479 2 360187 356861 C 2011-02-03 1997-01-28 Ser-Thr protein kinase; member (with Ark1p and Prk1p) of the Ark kinase family; involved in endocytosis and actin cytoskeleton organization -S000031795 CDS YBR059C 2 360187 356861 C 2011-02-03 1997-01-28 -S000000264 ORF Verified YBR060C ORC2 origin recognition complex subunit 2|SIR5|RRR1 chromosome 2 L000001776 2 362514 360652 C 2011-02-03 1997-01-28 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing; interacts with Spp1p and with trimethylated histone H3; phosphorylated by Cdc28p -S000031761 CDS YBR060C 2 362514 360652 C 2011-02-03 1997-01-28 -S000000265 ORF Verified YBR061C TRM7 tRNA methyltransferase TRM7 chromosome 2 2 365719 364787 C 2011-02-03 1997-01-28 2'-O-ribose methyltransferase; methylates the 2'-O-ribose of tRNA-Phe, tRNA-Trp, and tRNA-Leu at positions C32 and N34 of tRNA anticodon loop; crucial biological role likely modification of tRNA-Phe; interacts with Trm732p and Rtt10p in 2'-O-methylation of C32 and N34 substrate tRNAs, respectively; yeast null mutant can be functionally complemented by human FTSJ1, mutations in which have been implicated in nonsyndromic X-linked intellectual disability (NSXLID) -S000031905 CDS YBR061C 2 365719 364787 C 2011-02-03 1997-01-28 -S000000266 ORF Uncharacterized YBR062C chromosome 2 2 366600 365976 C 2011-02-03 2004-07-16|1997-01-28 Protein of unknown function that interacts with Msb2p; may play a role in activation of the filamentous growth pathway -S000032827 CDS YBR062C 2 366502 365976 C 2011-02-03 2004-07-16|1997-01-28 -S000032826 CDS YBR062C 2 366600 366585 C 2011-02-03 2004-07-16 -S000032828 intron YBR062C 2 366584 366503 C 2011-02-03 2004-07-16 -S000000268 ORF Dubious YBR064W chromosome 2 2 367763 368191 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YBR063C -S000033067 CDS YBR064W 2 367763 368191 W 2011-02-03 1997-01-28 -S000000267 ORF Uncharacterized YBR063C chromosome 2 2 368184 366970 C 2011-02-03 1997-01-28 Putative protein of unknown function; YBR063C is not an essential gene -S000032899 CDS YBR063C 2 368184 366970 C 2011-02-03 1997-01-28 -S000000269 ORF Verified YBR065C ECM2 SLT11 chromosome 2 L000003878 2 369678 368584 C 2011-02-03 1997-01-28 Pre-mRNA splicing factor; facilitates the cooperative formation of U2/U6 helix II in association with stem II in the spliceosome, function may be regulated by Slu7p -S000033674 CDS YBR065C 2 369678 368584 C 2011-02-03 1997-01-28 -S000000270 ORF Verified YBR066C NRG2 chromosome 2 L000004599 2 370699 370037 C 2011-02-03 1997-01-28 Transcriptional repressor; mediates glucose repression and negatively regulates filamentous growth; activated in stochastic pulses of nuclear localization in response to low glucose -S000033763 CDS YBR066C 2 370699 370037 C 2011-02-03 1997-01-28 -S000000271 ORF Verified YBR067C TIP1 putative lipase chromosome 2 L000002311 2 372735 372103 C 2011-02-03 1997-01-28 Major cell wall mannoprotein with possible lipase activity; transcription is induced by heat- and cold-shock; member of the Srp1p/Tip1p family of serine-alanine-rich proteins -S000033875 CDS YBR067C 2 372735 372103 C 2011-02-03 1997-01-28 -S000000272 ORF Verified YBR068C BAP2 branched-chain amino acid permease BAP2 chromosome 2 L000003157 2 375690 373861 C 2011-02-03 1997-01-28|2011-02-03 High-affinity leucine permease; functions as a branched-chain amino acid permease involved in uptake of leucine, isoleucine and valine; contains 12 predicted transmembrane domains; BAP2 has a paralog, BAP3, that arose from the whole genome duplication -S000034014 CDS YBR068C 2 375690 373861 C 2011-02-03 1997-01-28|2011-02-03 -S000000273 ORF Verified YBR069C TAT1 amino acid transporter TAT1|VAP1|TAP1 chromosome 2 L000002454|L000002262 2 378433 376574 C 2011-02-03 1997-01-28 Amino acid transporter for valine, leucine, isoleucine, and tyrosine; low-affinity tryptophan and histidine transporter; overexpression confers FK506 and FTY720 resistance; protein abundance increases in response to DNA replication stress -S000034884 CDS YBR069C 2 378433 376574 C 2011-02-03 1997-01-28 -S000130151 ARS ARS212 ARSII-379 chromosome 2 2 379221 379912 2011-02-03 2009-05-07 Autonomously Replicating Sequence -S000000274 ORF Verified YBR070C ALG14 N-acetylglucosaminyldiphosphodolichol N-acetylglucosaminyltransferase anchoring subunit ALG14 chromosome 2 2 379934 379221 C 2011-02-03 1997-01-28 Component of UDP-GlcNAc transferase; required for second step of dolichyl-linked oligosaccharide synthesis; anchors catalytic subunit Alg13p to ER membrane; similar to bacterial and human glycosyltransferases; both human homologs ALG13 and ALG14 are required to complement yeast alg14 mutant -S000035895 CDS YBR070C 2 379934 379221 C 2011-02-03 1997-01-28 -S000000275 ORF Verified YBR071W chromosome 2 2 380411 381046 W 2011-02-03 1997-01-28 Protein of unknown function found in the cytoplasm and bud neck; mRNA expression may be regulated by the cell cycle and/or cell wall stress; overexpression of YBR071W affects endocytic protein trafficking -S000036135 CDS YBR071W 2 380411 381046 W 2011-02-03 1997-01-28 -S000000276 ORF Verified YBR072W HSP26 chaperone protein HSP26 chromosome 2 L000000817 2 382030 382674 W 2011-02-03 1997-01-28 Small heat shock protein (sHSP) with chaperone activity; forms hollow, sphere-shaped oligomers that suppress unfolded proteins aggregation; long-lived protein that is preferentially retained in mother cells and forms cytoplasmic foci; oligomer activation requires heat-induced conformational change; also has mRNA binding activity -S000036920 CDS YBR072W 2 382030 382674 W 2011-02-03 1997-01-28 -S000028532 ORF Uncharacterized YBR072C-A chromosome 2 2 383021 382860 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031141 CDS YBR072C-A 2 383021 382860 C 2011-02-03 2003-07-29 -S000000277 ORF Verified YBR073W RDH54 DNA-dependent ATPase RDH54|TID1 chromosome 2 L000002988|L000003224 2 383112 385988 W 2011-02-03 2003-09-22|1997-01-28|2009-05-07|2011-02-03 DNA-dependent ATPase; DNA recombination/repair translocase, supercoils DNA and promotes DNA strand opening; stimulates strand exchange by modifying dsDNA topology; involved in recombinational repair of DNA double-strand breaks (DSBs) during mitosis and meiosis; phosphorylated in Mec1p-, Rad53p-dependent way in response to one DSB; contributes to remodelling of nucleosomes; proposed to be involved in crossover interference; interacts with Dmc1p; stimulates Dmc1p and Rad51p -S000036971 CDS YBR073W 2 383112 385988 W 2011-02-03 2003-09-22|1997-01-28|2009-05-07|2011-02-03 -S000000278 ORF Verified YBR074W PFF1 YBR075W chromosome 2 2 386286 389216 W 2011-02-03 2003-09-29|1997-01-28|2011-02-03 Multi-spanning vacuolar membrane protease; glycosylated transmembrane protein bearing homology to the M28 family of metalloproteases; has a lumenal-facing protease domain; proposed role in vacuole physiology -S000037055 CDS YBR074W 2 386286 389216 W 2011-02-03 2003-09-29|1997-01-28|2011-02-03 -S000130152 ARS ARS213 ARSII-390 chromosome 2 2 389212 390371 2011-02-03 2009-05-07|2011-02-03 Autonomously Replicating Sequence -S000000280 ORF Verified YBR076W ECM8 chromosome 2 L000003883 2 390227 391291 W 2011-02-03 1997-01-28|2011-02-03 Non-essential protein of unknown function -S000037886 CDS YBR076W 2 390227 391291 W 2011-02-03 1997-01-28|2011-02-03 -S000028533 ORF Dubious YBR076C-A chromosome 2 2 391617 391351 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene ECM8; identified by fungal homology and RT-PCR -S000031142 CDS YBR076C-A 2 391617 391351 C 2011-02-03 2003-07-29 -S000000281 ORF Verified YBR077C SLM4 GSE1|NIR1|EGO3 chromosome 2 2 392293 391805 C 2011-02-03 1997-01-28 Component of the EGO and GSE complexes; essential for integrity and function of EGO; EGO is involved in the regulation of microautophagy and GSE is required for proper sorting of amino acid permease Gap1p; gene exhibits synthetic genetic interaction with MSS4 -S000029854 CDS YBR077C 2 392293 391805 C 2011-02-03 1997-01-28 -S000000282 ORF Verified YBR078W ECM33 chromosome 2 L000003902 2 393123 394742 W 2011-02-03 1997-01-28|2011-02-03 GPI-anchored protein of unknown function; possible role in apical bud growth; GPI-anchoring on the plasma membrane crucial to function; phosphorylated in mitochondria; similar to Sps2p; ECM33 has a paralog, PST1, that arose from the whole genome duplication -S000030046 CDS YBR078W 2 393123 393180 W 2011-02-03 1997-01-28 -S000030047 CDS YBR078W 2 393511 394742 W 2011-02-03 1997-01-28|2011-02-03 -S000030048 intron YBR078W 2 393181 393510 W 2011-02-03 1997-01-28 -S000000283 ORF Verified YBR079C RPG1 translation initiation factor eIF3 core subunit a|TIF32 chromosome 2 L000004268 2 398277 395383 C 2011-02-03 1997-01-28 eIF3a subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; essential for translation; part of a Prt1p-Rpg1p-Nip1p subcomplex that stimulates binding of mRNA and tRNA(i)Met to ribosomes; involved in translation reinitiation; eIF3 is also involved in programmed stop codon readthrough -S000030963 CDS YBR079C 2 398277 395383 C 2011-02-03 1997-01-28 -S000000284 ORF Verified YBR080C SEC18 AAA family ATPase SEC18|ANU4 chromosome 2 L000001842 2 400890 398614 C 48 2011-02-03 1997-01-28 AAA ATPase and SNARE disassembly chaperone; required for vesicular transport between ER and Golgi, the 'priming' step in homotypic vacuole fusion, autophagy, and protein secretion; releases Sec17p from SNAP complexes; has similarity to mammalian N-ethylmaleimide-sensitive factor (NSF) -S000031072 CDS YBR080C 2 400890 398614 C 2011-02-03 1997-01-28 -S000000285 ORF Verified YBR081C SPT7 SAGA histone acetyltransferase complex subunit SPT7|GIT2 chromosome 2 L000002033 2 405251 401253 C 46 2011-02-03 1997-01-28 Subunit of the SAGA transcriptional regulatory complex; involved in proper assembly of the complex; also present as a C-terminally truncated form in the SLIK/SALSA transcriptional regulatory complex -S000032039 CDS YBR081C 2 405251 401253 C 2011-02-03 1997-01-28 -S000006708 tRNA_gene tR(UCU)B chromosome 2 L000003745 2 405878 405949 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA); decodes AGA codons into arginine; one of 19 nuclear tRNAs for arginine; part of dicistronic transcript with tD(GUC)B -S000037831 noncoding_exon tR(UCU)B 2 405878 405949 W 2011-02-03 2000-05-19 -S000006530 tRNA_gene tD(GUC)B chromosome 2 L000003746 2 405960 406031 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000037666 noncoding_exon tD(GUC)B 2 405960 406031 W 2011-02-03 2000-05-19 -S000000286 ORF Verified YBR082C UBC4 E2 ubiquitin-conjugating protein UBC4 chromosome 2 L000002407 2 407169 406628 C 2011-02-03 1997-01-28 Ubiquitin-conjugating enzyme (E2); key E2 partner with Ubc1p for the anaphase-promoting complex (APC); mediates degradation of abnormal or excess proteins, including calmodulin and histone H3; regulates levels of DNA Polymerase-{alpha} to promote efficient and accurate DNA replication; interacts with many SCF ubiquitin protein ligases; component of the cellular stress response; UBC4 has a paralog, UBC5, that arose from the whole genome duplication -S000032123 CDS YBR082C 2 407027 406628 C 2011-02-03 1997-01-28 -S000032122 CDS YBR082C 2 407169 407123 C 2011-02-03 1997-01-28 -S000032124 intron YBR082C 2 407122 407028 C 2011-02-03 1997-01-28 -S000118348 ARS ARS214 ARSII-408 chromosome 2 2 407953 408068 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178048 ARS_consensus_sequence ARS214 2 408004 407988 C 2014-11-18 2014-11-18 -S000000287 ORF Verified YBR083W TEC1 ROC1 chromosome 2 L000002276|L000001658 2 409169 410629 W 2011-02-03 1997-01-28 Transcription factor targeting filamentation genes and Ty1 expression; Ste12p activation of most filamentation gene promoters depends on Tec1p and Tec1p transcriptional activity is dependent on its association with Ste12p; binds to TCS elements upstream of filamentation genes, which are regulated by Tec1p/Ste12p/Dig1p complex; competes with Dig2p for binding to Ste12p/Dig1p; positive regulator of chronological life span; TEA/ATTS DNA-binding domain family member -S000032249 CDS YBR083W 2 409169 410629 W 2011-02-03 1997-01-28 -S000000288 ORF Verified YBR084W MIS1 trifunctional formate-tetrahydrofolate ligase/methenyltetrahydrofolate cyclohydrolase/methylenetetrahydrofolate dehydrogenase MIS1 chromosome 2 L000001115 2 411054 413981 W 2011-02-03 1997-01-28 Mitochondrial C1-tetrahydrofolate synthase; involved in interconversion between different oxidation states of tetrahydrofolate (THF); provides activities of formyl-THF synthetase, methenyl-THF cyclohydrolase, and methylene-THF dehydrogenase -S000033123 CDS YBR084W 2 411054 413981 W 2011-02-03 1997-01-28 -S000002156 ORF Verified YBR084C-A RPL19A eL19|ribosomal 60S subunit protein L19A|L19e|rpl5L|YL14|L23A|L19A chromosome 2 L000001720 2 415261 414186 C 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L19A; rpl19a and rpl19b single null mutations result in slow growth, while the double null mutation is lethal; homologous to mammalian ribosomal protein L19, no bacterial homolog; RPL19A has a paralog, RPL19B, that arose from the whole genome duplication -S000033730 CDS YBR084C-A 2 414753 414186 C 2011-02-03 1997-01-28 -S000033729 CDS YBR084C-A 2 415261 415260 C 2011-02-03 1997-01-28 -S000033731 intron YBR084C-A 2 415259 414754 C 2011-02-03 1997-01-28 -S000000289 ORF Verified YBR085W AAC3 ADP/ATP carrier protein AAC3|ANC3 chromosome 2 L000000005 2 415983 416906 W 2011-02-03 1997-01-28 Mitochondrial inner membrane ADP/ATP translocator; exchanges cytosolic ADP for mitochondrially synthesized ATP; expressed under anaerobic conditions; similar to Aac1p; has roles in maintenance of viability and in respiration; AAC3 has a paralog, PET9, that arose from the whole genome duplication -S000033180 CDS YBR085W 2 415983 416906 W 2011-02-03 1997-01-28 -S000118349 ARS ARS215 ARSII-418 chromosome 2 2 417784 418079 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication origin of very weak function -S000007522 ORF Verified YBR085C-A chromosome 2 2 419164 418907 C 2011-02-03 2000-07-14 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to the nucleus; protein abundance increases in response to DNA replication stress -S000037060 CDS YBR085C-A 2 419164 418907 C 2011-02-03 2000-07-14 -S000000290 ORF Verified YBR086C IST2 chromosome 2 2 423041 420201 C 2011-02-03 2003-01-03|1997-01-28 Cortical ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to the plasma membrane (PM) and regulate PM phosphatidylinositol-4-phosphate (PI4P) levels by controlling access of Sac1p phosphatase to its substrate PI4P in the PM; localizes to the mother cell in small-budded cells and to the bud in medium- and large-budded cells; mRNA is transported to the bud tip by an actomyosin-driven process -S000033202 CDS YBR086C 2 423041 420201 C 2011-02-03 2003-01-03|1997-01-28 -S000000291 ORF Verified YBR087W RFC5 replication factor C subunit 5 chromosome 2 L000002843 2 423765 424829 W 2011-02-03 1997-01-28 Subunit of heteropentameric Replication factor C (RF-C); RF-C is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon -S000033291 CDS YBR087W 2 423765 424829 W 2011-02-03 1997-01-28 -S000000293 ORF Dubious YBR089W chromosome 2 2 425183 425782 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene POL30 -S000034297 CDS YBR089W 2 425183 425782 W 2011-02-03 1997-01-28 -S000000292 ORF Verified YBR088C POL30 proliferating cell nuclear antigen|PCNA chromosome 2 L000001463 2 425766 424990 C 2011-02-03 1997-01-28 Proliferating cell nuclear antigen (PCNA); functions as the sliding replication clamp for DNA polymerase delta; may function as a docking site for other proteins required for mitotic and meiotic chromosomal DNA replication and for DNA repair; PCNA ubiquitination at K164 plays a crucial role during Okazaki fragment processing -S000033330 CDS YBR088C 2 425766 424990 C 2011-02-03 1997-01-28 -S000002157 ORF Verified YBR089C-A NHP6B high-mobility group nucleosome-binding protein|YBR090C-A chromosome 2 L000001246 2 426489 426190 C 2011-02-03 1997-01-28|2011-02-03 High-mobility group (HMG) protein; binds to and remodels nucleosomes; involved in recruiting FACT and other chromatin remodelling complexes to the chromosomes; functionally redundant with Nhp6Ap; required for transcriptional initiation fidelity of some tRNA genes; homologous to mammalian HMGB1 and HMGB2; NHP6B has a paralog, NHP6A, that arose from the whole genome duplication -S000031885 CDS YBR089C-A 2 426489 426190 C 2011-02-03 1997-01-28|2011-02-03 -S000122092 five_prime_UTR_intron YBR089C-A 2 426873 426517 C 2011-02-03 2007-04-04 -S000000294 ORF Uncharacterized YBR090C chromosome 2 2 427058 426333 C 2011-02-03 1997-01-28|2011-02-03 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus -S000035423 CDS YBR090C 2 426516 426333 C 2011-02-03 1997-01-28|2011-02-03 -S000035422 CDS YBR090C 2 427058 426874 C 2011-02-03 1997-01-28 -S000035424 intron YBR090C 2 426873 426517 C 2011-02-03 1997-01-28 -S000000295 ORF Verified YBR091C TIM12 MRS5 chromosome 2 L000001181 2 427484 427155 C 2011-02-03 1997-01-28 Essential protein of the inner mitochondrial membrane; peripherally localized; component of the TIM22 complex, which is a twin-pore translocase that mediates insertion of numerous multispanning inner membrane proteins -S000036311 CDS YBR091C 2 427484 427155 C 2011-02-03 1997-01-28 -S000000296 ORF Verified YBR092C PHO3 acid phosphatase PHO3|phoC chromosome 2 L000001419 2 429101 427698 C 47 2011-02-03 1997-01-28 Constitutively expressed acid phosphatase similar to Pho5p; brought to the cell surface by transport vesicles; hydrolyzes thiamin phosphates in the periplasmic space, increasing cellular thiamin uptake; expression is repressed by thiamin -S000036423 CDS YBR092C 2 429101 427698 C 2011-02-03 1997-01-28 -S000000297 ORF Verified YBR093C PHO5 acid phosphatase PHO5|phoE chromosome 2 L000001421 2 430951 429548 C 47 2011-02-03 1997-01-28 Repressible acid phosphatase; 1 of 3 repressible acid phosphatases that also mediates extracellular nucleotide-derived phosphate hydrolysis; secretory pathway derived cell surface glycoprotein; induced by phosphate starvation and coordinately regulated by PHO4 and PHO2 -S000036491 CDS YBR093C 2 430951 429548 C 2011-02-03 1997-01-28 -S000000298 ORF Verified YBR094W PBY1 putative tubulin tyrosine ligase chromosome 2 2 432036 434297 W 2011-02-03 1997-01-28|2011-02-03 Putative tubulin tyrosine ligase associated with P-bodies; may have a role in mRNA metabolism; yeast knockout collection strain identified as a pby1 null mutant is actually wild-type for PBY1 and deleted for mms4 -S000037253 CDS YBR094W 2 432036 434297 W 2011-02-03 1997-01-28|2011-02-03 -S000000299 ORF Verified YBR095C RXT2 RAF60 chromosome 2 2 435698 434406 C 2011-02-03 2003-09-22|1997-01-28 Component of the histone deacetylase Rpd3L complex; possibly involved in cell fusion and invasive growth; relocalizes to the cytosol in response to hypoxia -S000037292 CDS YBR095C 2 435698 434406 C 2011-02-03 2003-09-22|1997-01-28 -S000000300 ORF Uncharacterized YBR096W chromosome 2 2 436021 436713 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the ER -S000037475 CDS YBR096W 2 436021 436713 W 2011-02-03 1997-01-28 -S000000301 ORF Verified YBR097W VPS15 ubiquitin-binding serine/threonine protein kinase VPS15|VPT15|VPS40|VPL19|VAC4|GRD8 chromosome 2 L000002470|L000002924|S000029641|L000002480 2 436951 441315 W 2011-02-03 1997-01-28|2011-02-03 Serine/threonine protein kinase involved in vacuolar protein sorting; functions as a membrane-associated complex with Vps34p; active form recruits Vps34p to the Golgi membrane; interacts with the GDP-bound form of Gpa1p; myristoylated; a fraction is localized, with Vps34p, to nuclear pores at nucleus-vacuole junctions and may facilitate transcription elongation for genes positioned at the nuclear periphery -S000030201 CDS YBR097W 2 436951 441315 W 2011-02-03 1997-01-28|2011-02-03 -S000000302 ORF Verified YBR098W MMS4 YBR100W|SLX2 chromosome 2 2 441515 443590 W 2011-02-03 2003-01-03|1997-01-28 Subunit of structure-specific Mms4p-Mus81p endonuclease; cleaves branched DNA; involved in recombination, DNA repair, and joint molecule formation/resolution during meiotic recombination; phosphorylation of the non-catalytic subunit Mms4p by Cdc28p and Cdc5p during mitotic cell cycle activates the function of Mms4p-Mus81p -S000030360 CDS YBR098W 2 441515 443590 W 2011-02-03 2003-01-03|1997-01-28 -S000000303 ORF Dubious YBR099C chromosome 2 2 443307 442924 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene MMS4 -S000030430 CDS YBR099C 2 443307 442924 C 2011-02-03 1997-01-28 -S000000305 ORF Verified YBR101C FES1 chromosome 2 2 444693 443821 C 2011-02-03 1997-01-28 Hsp70 (Ssa1p) nucleotide exchange factor; required for the release of misfolded proteins from the Hsp70 system to the Ub-proteasome machinery for destruction; cytosolic homolog of Sil1p, which is the nucleotide exchange factor for BiP (Kar2p) in the endoplasmic reticulum; protein abundance increases in response to DNA replication stress -S000036293 CDS YBR101C 2 444693 443821 C 2011-02-03 1997-01-28 -S000000306 ORF Verified YBR102C EXO84 exocyst subunit EXO84|USA3 chromosome 2 S000007470|L000003227 2 447323 445062 C 2011-02-03 1997-01-28 Exocyst subunit with dual roles in exocytosis and spliceosome assembly; subunit of the the exocyst complex which mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane (PM) prior to SNARE-mediated fusion; required for exocyst assembly and targeting the complex to specific sites on the bud tip PM; associates the U1 snRNP; role in pre-mRNA splicing and prespliceosome formation; possible Cdc28 substrate -S000036412 CDS YBR102C 2 447323 445062 C 2011-02-03 1997-01-28 -S000000307 ORF Verified YBR103W SIF2 EMB1 chromosome 2 2 447709 449316 W 2011-02-03 1997-01-28 WD40 repeat-containing subunit of Set3C histone deacetylase complex; complex represses early/middle sporulation genes; antagonizes telomeric silencing; binds specifically to the Sir4p N-terminus -S000037118 CDS YBR103W 2 447709 449316 W 2011-02-03 1997-01-28 -S000007593 ORF Dubious YBR103C-A chromosome 2 2 449463 449320 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by homology to related yeast -S000037105 CDS YBR103C-A 2 449463 449320 C 2011-02-03 2001-02-26 -S000000308 ORF Verified YBR104W YMC2 organic acid transporter chromosome 2 L000002521 2 449667 450656 W 2011-02-03 1997-01-28 Putative mitochondrial inner membrane transporter; proposed role in oleate metabolism and glutamate biosynthesis; member of the mitochondrial carrier (MCF) family; YMC2 has a paralog, YMC1, that arose from the whole genome duplication -S000037195 CDS YBR104W 2 449667 450656 W 2011-02-03 1997-01-28 -S000000309 ORF Verified YBR105C VID24 glucose-induced degradation complex subunit VID24|GID4 chromosome 2 L000004624 2 451969 450881 C 2011-02-03 1997-01-28 GID Complex regulatory subunit; binds GID Complex in response to glucose through interactions with complex member Vid28p; regulates fructose-1,6-bisphosphatase (FBPase) targeting to the vacuole; promotes proteasome-dependent catabolite degradation of FBPase; peripheral membrane protein located at Vid (vacuole import and degradation) vesicles -S000037212 CDS YBR105C 2 451969 450881 C 2011-02-03 1997-01-28 -S000000310 ORF Verified YBR106W PHO88 SND3 chromosome 2 L000003995 2 452658 453224 W 2011-02-03 1997-01-28 Protein involved in SRP-independent targeting of substrates to the ER; component of an alternative ER targeting pathway that has partial functional redundancy with the GET pathway; preference for substrates with downstream transmembrane domains; interacts with Snd1p, Env10p/Snd2p, and Sec61p-translocon subunits; can compensate for loss of SRP; role in phosphate transport, interacting with pho88, and in the maturation of secretory proteins -S000037352 CDS YBR106W 2 452658 453224 W 2011-02-03 1997-01-28 -S000000311 ORF Verified YBR107C IML3 MCM19 chromosome 2 L000004778 2 454530 453793 C 2011-02-03 1997-01-28 Outer kinetochore protein and component of the Ctf19 complex; involved in the establishment of pericentromeric cohesion during mitosis; prevents non-disjunction of sister chromatids during meiosis II; forms a stable complex with Chl4p; required for localization of Sgo1p to pericentric sites during meiosis I; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-L and fission yeast fta1 -S000037374 CDS YBR107C 2 454530 453793 C 2011-02-03 1997-01-28 -S000000312 ORF Verified YBR108W AIM3 chromosome 2 2 454822 457665 W 2011-02-03 2004-07-09|1997-01-28|2011-02-03 Protein that inhibits barbed-end actin filament elongation; interacts with Rvs167p; null mutant is viable and displays elevated frequency of mitochondrial genome loss -S000030057 CDS YBR108W 2 454822 457665 W 2011-02-03 2004-07-09|1997-01-28|2011-02-03 -S000000313 ORF Verified YBR109C CMD1 calmodulin|CaM chromosome 2 L000000365 2 458362 457919 C 53 2011-02-03 1997-01-28 Calmodulin; Ca2+ binding protein that regulates Ca2+ independent processes (mitosis, bud growth, actin organization, endocytosis, etc.) and Ca2+ dependent processes (stress-activated pathways), targets include Nuf1p, Myo2p and calcineurin; binds to the Hog1p MAPK in response to hyperosmotic stress; potentiates membrane tubulation and constriction mediated by the Rvs161p-Rvs167p complex; human CALM1 or CALM2 functionally complement repression induced inviability -S000030094 CDS YBR109C 2 458362 457919 C 2011-02-03 1997-01-28 -S000028737 ORF Dubious YBR109W-A chromosome 2 2 458608 458832 W 2011-02-03 2003-07-29 Putative protein of unknown function; questionable ORF from MIPS -S000033381 CDS YBR109W-A 2 458608 458832 W 2011-02-03 2003-07-29 -S000000314 ORF Verified YBR110W ALG1 chitobiosyldiphosphodolichol beta-1,4 mannosyltransferase chromosome 2 L000000076 2 458872 460221 W 54 2011-02-03 1997-01-28 Mannosyltransferase; involved in asparagine-linked glycosylation in the endoplasmic reticulum (ER); essential for viability; human homolog ALG1 complements yeast null mutant -S000032542 CDS YBR110W 2 458872 460221 W 2011-02-03 1997-01-28 -S000000315 ORF Verified YBR111C YSA1 ADP-ribose diphosphatase|RMA2 chromosome 2 L000002551 2 461873 461178 C 2011-02-03 1997-01-28 Nudix hydrolase family member with ADP-ribose pyrophosphatase activity; shown to metabolize O-acetyl-ADP-ribose to AMP and acetylated ribose 5'-phosphate -S000032550 CDS YBR111C 2 461873 461178 C 2011-02-03 1997-01-28 -S000028510 ORF Verified YBR111W-A SUS1 chromosome 2 2 462139 462579 W 2011-02-03 2003-12-17|2003-07-29 Component of both the SAGA histone acetylase and TREX-2 complexes; interacts with RNA polymerase II; involved in mRNA export coupled transcription activation and elongation; involved in post-transcriptional tethering of active genes to the nuclear periphery and to non-nascent mRNP -S000030260 CDS YBR111W-A 2 462139 462209 W 2011-02-03 2003-12-17|2003-07-29 -S000030261 CDS YBR111W-A 2 462290 462429 W 2011-02-03 2003-12-17|2003-07-29 -S000030263 CDS YBR111W-A 2 462500 462579 W 2011-02-03 2003-12-17 -S000030262 intron YBR111W-A 2 462210 462289 W 2011-02-03 2003-12-17|2003-07-29 -S000030264 intron YBR111W-A 2 462430 462499 W 2011-02-03 2003-12-17 -S000000317 ORF Dubious YBR113W chromosome 2 2 465566 466048 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CYC8 -S000033391 CDS YBR113W 2 465566 466048 W 2011-02-03 1997-01-28 -S000000316 ORF Verified YBR112C CYC8 transcription regulator CYC8|[OCT]|[OCT1+]|SSN6|CRT8 chromosome 2 L000000452 2 465770 462870 C 56 2011-02-03 1997-01-28 General transcriptional co-repressor; acts together with Tup1p; also acts as part of a transcriptional co-activator complex that recruits the SWI/SNF and SAGA complexes to promoters; can form the prion [OCT+] -S000032660 CDS YBR112C 2 465770 462870 C 2011-02-03 1997-01-28 -S000000318 ORF Verified YBR114W RAD16 DNA repair protein RAD16|PSO5 chromosome 2 L000004121|L000001565 2 467248 469620 W 58 2011-02-03 1997-01-28 Nucleotide excision repair (NER) protein; binds damaged DNA during NER; binds DNA in an ATP-dependent manner (with Rad7p) during NER; required for NER of non-transcribed chromatin; subunit of Nucleotide Excision Repair Factor 4 (NEF4) and the Elongin-Cullin-Socs (ECS) ligase complex -S000033462 CDS YBR114W 2 467248 469620 W 2011-02-03 1997-01-28 -S000000319 ORF Verified YBR115C LYS2 L-aminoadipate-semialdehyde dehydrogenase chromosome 2 L000000965 2 473926 469748 C 59 2011-02-03 1997-01-28 Alpha aminoadipate reductase; catalyzes the reduction of alpha-aminoadipate to alpha-aminoadipate 6-semialdehyde, which is the fifth step in biosynthesis of lysine; activation requires posttranslational phosphopantetheinylation by Lys5p -S000033483 CDS YBR115C 2 473926 469748 C 2011-02-03 1997-01-28 -S000000320 ORF Dubious YBR116C chromosome 2 2 474726 474199 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene TKL2 -S000033572 CDS YBR116C 2 474726 474199 C 2011-02-03 1997-01-28 -S000000321 ORF Verified YBR117C TKL2 transketolase TKL2 chromosome 2 L000002314 2 476437 474392 C 2011-02-03 1997-01-28 Transketolase; catalyzes conversion of xylulose-5-phosphate and ribose-5-phosphate to sedoheptulose-7-phosphate and glyceraldehyde-3-phosphate in the pentose phosphate pathway; needed for synthesis of aromatic amino acids; TKL2 has a paralog, TKL1, that arose from the whole genome duplication -S000033608 CDS YBR117C 2 476437 474392 C 2011-02-03 1997-01-28 -S000000322 ORF Verified YBR118W TEF2 translation elongation factor EF-1 alpha|eEF1A|EF-1 alpha chromosome 2 L000002278 2 477671 479047 W 61 2011-02-03 1997-01-28 Translational elongation factor EF-1 alpha; in the GTP-bound active form, binds to and delivers aminoacylated tRNA to the A-site of ribosomes for elongation of nascent polypeptides; associates with vacuolar Rho1p GTPase; TEF2-RFP levels increase during replicative aging; may also have a role in tRNA re-export from the nucleus; TEF2 has a paralog, TEF1, that arose from the whole genome duplication -S000034590 CDS YBR118W 2 477671 479047 W 2011-02-03 1997-01-28 -S000000323 ORF Verified YBR119W MUD1 U1A|U1-A chromosome 2 L000001217 2 479338 480323 W 2011-02-03 1997-01-28 U1 snRNP A protein; homolog of human U1-A; involved in nuclear mRNA splicing -S000034715 CDS YBR119W 2 479338 479345 W 2011-02-03 1997-01-28 -S000034716 CDS YBR119W 2 479435 480323 W 2011-02-03 1997-01-28 -S000034717 intron YBR119W 2 479346 479434 W 2011-02-03 1997-01-28 -S000000324 ORF Verified YBR120C CBP6 chromosome 2 L000000228 2 480923 480435 C 2011-02-03 1997-01-28 Mitochondrial protein required for translation of the COB mRNA; forms a complex with Cbp3p that binds to mt ribosomes near the polypeptide tunnel exit and promotes efficient translation of the COB mRNA; Cbp3p-Cbp6p complex also interacts with newly synthesized cytochrome b (Cobp) and Cbp4p to promote assembly of Cobp into the cytochrome bc1 complex; Cbp3p-Cbp6p complex is sequestered if assembly of Complex III is blocked, downregulating COB mRNA translation -S000035739 CDS YBR120C 2 480923 480435 C 2011-02-03 1997-01-28 -S000028815 ORF Dubious YBR121C-A chromosome 2 2 482484 482326 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely contained within the verified gene GRS1; identified by expression profiling and mass spectrometry -S000033618 CDS YBR121C-A 2 482484 482326 C 2011-02-03 2003-07-29 -S000000325 ORF Verified YBR121C GRS1 glycine--tRNA ligase chromosome 2 L000000738|L000000731 2 483367 481364 C 2011-02-03 1997-01-28|2011-02-03 Cytoplasmic and mitochondrial glycyl-tRNA synthase; ligates glycine to the cognate anticodon-bearing tRNA; transcription termination factor that may interact with the 3'-end of pre-mRNA to promote 3'-end formation; GRS1 has a paralog, GRS2, that arose from the whole genome duplication; human homolog GARS implicated in Charcot-Marie-Tooth disease, can complement yeast null mutant -S000036674 CDS YBR121C 2 483367 481364 C 2011-02-03 1997-01-28|2011-02-03 -S000000326 ORF Verified YBR122C MRPL36 mitochondrial 54S ribosomal protein YmL36|YmL36 chromosome 2 L000002531|L000001171 2 484503 483970 C 2011-02-03 2003-09-22|1997-01-28 Mitochondrial ribosomal protein of the large subunit; overproduction suppresses mutations in the COX2 leader peptide-encoding region -S000036725 CDS YBR122C 2 484503 483970 C 2011-02-03 2003-09-22|1997-01-28 -S000000328 ORF Dubious YBR124W chromosome 2 2 486507 486866 W 2011-02-03 1997-01-28 Putative protein of unknown function -S000037559 CDS YBR124W 2 486507 486866 W 2011-02-03 1997-01-28 -S000000327 ORF Verified YBR123C TFC1 transcription factor TFIIIC subunit TFC1|tau 95 chromosome 2 L000002285 2 486691 484742 C 2011-02-03 1997-01-28 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of the RNA polymerase III transcription initiation factor complex (TFIIIC); part of the TauA globular domain of TFIIIC that binds DNA at the BoxA promoter sites of tRNA and similar genes; human homolog is TFIIIC-63 -S000036794 CDS YBR123C 2 486691 484742 C 2011-02-03 1997-01-28 -S000118350 ARS ARS216 ARSII-487 chromosome 2 2 486707 486954 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178049 ARS_consensus_sequence ARS216 2 486859 486843 C 2014-11-18 2014-11-18 -S000000329 ORF Verified YBR125C PTC4 type 2C protein phosphatase PTC4|GCT1 chromosome 2 2 488380 487199 C 2011-02-03 1997-01-28 Cytoplasmic type 2C protein phosphatase (PP2C); identified as a high-copy number suppressor of cnb1 mpk1 synthetic lethality; overexpression decreases high-osmolarity induced Hog1p phosphorylation and kinase activity -S000037589 CDS YBR125C 2 488380 487199 C 2011-02-03 1997-01-28 -S000000330 ORF Verified YBR126C TPS1 alpha,alpha-trehalose-phosphate synthase (UDP-forming) TPS1|TSS1|GLC6|GGS1|FDP1|CIF1|BYP1 chromosome 2 L000002330 2 490392 488905 C 41 2011-02-03 1997-01-28 Synthase subunit of trehalose-6-P synthase/phosphatase complex; synthesizes the storage carbohydrate trehalose, which is critically important for survival of long-term desiccation; also found in a monomeric form; expression is induced by the stress response and repressed by the Ras-cAMP pathway; protein abundance increases in response to DNA replication stress and in response to prolonged exposure to boric acid -S000037645 CDS YBR126C 2 490392 488905 C 2011-02-03 1997-01-28 -S000028600 ORF Verified YBR126W-A MEO1 chromosome 2 2 490850 491056 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray analysis, and genome-wide homology searches; mRNA identified as translated by ribosome profiling data; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; partially overlaps the dubious ORF YBR126W-B -S000031400 CDS YBR126W-A 2 490850 491056 W 2011-02-03 2003-07-29 -S000028738 ORF Dubious YBR126W-B chromosome 2 2 490927 491070 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YBR126W-A; identified by SAGE -S000033382 CDS YBR126W-B 2 490927 491070 W 2011-02-03 2003-07-29 -S000000331 ORF Verified YBR127C VMA2 H(+)-transporting V1 sector ATPase subunit B|ATPSV|VAT2 chromosome 2 L000002458 2 492822 491269 C 2011-02-03 1997-01-28 Subunit B of V1 peripheral membrane domain of vacuolar H+-ATPase; electrogenic proton pump found throughout the endomembrane system; contains nucleotide binding sites; also detected in the cytoplasm; protein abundance increases in response to DNA replication stress; human homolog ATP6V1B1, implicated in autosomal-recessive distal renal tubular acidosis (RTA) with sensorineural deafness, complements yeast null mutant -S000037698 CDS YBR127C 2 492822 491269 C 2011-02-03 1997-01-28 -S000000332 ORF Verified YBR128C ATG14 APG14|CVT12 chromosome 2 L000004763|L000004641 2 494115 493081 C 2011-02-03 1997-01-28 Autophagy-specific subunit of phosphatidylinositol 3-kinase complex I; Atg14p targets complex I to the phagophore assembly site (PAS); required for localizing additional ATG proteins to the PAS; required for overflow degradation of misfolded proteins when ERAD is saturated; homolog of human Barkor; other members are Vps34, Vps15, and Vps30p -S000037772 CDS YBR128C 2 494115 493081 C 2011-02-03 1997-01-28 -S000000333 ORF Verified YBR129C OPY1 chromosome 2 L000004016 2 495339 494353 C 2011-02-03 1997-01-28 Protein of unknown function; overproduction blocks cell cycle arrest in the presence of mating pheromone; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000030622 CDS YBR129C 2 495339 494353 C 2011-02-03 1997-01-28 -S000000334 ORF Verified YBR130C SHE3 chromosome 2 L000004189|L000002868 2 496869 495592 C 2011-02-03 1997-01-28 Protein adaptor between Myo4p and the She2p-mRNA complex; part of the mRNA localization machinery that restricts accumulation of certain proteins to the bud; also required for cortical ER inheritance -S000030714 CDS YBR130C 2 496869 495592 C 2011-02-03 1997-01-28 -S000000335 ORF Verified YBR131W CCZ1 CVT16 chromosome 2 L000004556|L000004776|S000029129 2 497163 499277 W 2011-02-03 1997-01-28 Subunit of a heterodimeric guanine nucleotide exchange factor (GEF); subunit of the Mon1-Ccz1 GEF complex, which stimulates nucleotide exchange and activation of Ypt7p, a Rab family GTPase involved in membrane tethering and fusion events at the late endosome and vacuole; GEF activity is stimulated by membrane association and anionic phospholipids; involved in localizing Ypt7p to the vacuolar membrane; required for macroautophagy, the CVT pathway and mitophagy -S000031661 CDS YBR131W 2 497163 499277 W 2011-02-03 1997-01-28 -S000028601 ORF Dubious YBR131C-A chromosome 2 2 497739 497650 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YBR131W; identified by gene-trapping, microarray analysis, and genome-wide homology searches -S000031403 CDS YBR131C-A 2 497739 497650 C 2011-02-03 2003-07-29 -S000000336 ORF Verified YBR132C AGP2 chromosome 2 L000003947 2 501442 499652 C 2011-02-03 1997-01-28 Plasma membrane regulator of polyamine and carnitine transport; has similarity to transporters but lacks transport activity; may act as a sensor that transduces environmental signals; has a positive or negative regulatory effect on transcription of many transporter genes -S000031670 CDS YBR132C 2 501442 499652 C 2011-02-03 1997-01-28 -S000000338 ORF Dubious YBR134W chromosome 2 2 504243 504644 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032775 CDS YBR134W 2 504243 504644 W 2011-02-03 1997-01-28 -S000000337 ORF Verified YBR133C HSL7 protein arginine N-methyltransferase chromosome 2 L000003130 2 504287 501804 C 2011-02-03 1997-01-28 Protein arginine N-methyltransferase; exhibits septin and Hsl1p-dependent localization to the bud neck in budded cells and periodic Hsl1p-dependent phosphorylation; required with Hsl1p, and Elm1p for the mother-bud neck recruitment, phosphorylation, and degradation of Swe1p; interacts directly with Swe1p; relocalizes away from bud neck upon DNA replication stress; human homolog PRMT5 can complement yeast hsl7 mutant -S000031794 CDS YBR133C 2 504287 501804 C 2011-02-03 1997-01-28 -S000000339 ORF Verified YBR135W CKS1 cyclin-dependent protein kinase regulatory subunit CKS1 chromosome 2 L000000347 2 504854 505306 W 73 2011-02-03 1997-01-28 Cyclin-dependent protein kinase regulatory subunit and adaptor; interacts with Cdc28p (aka Cdk1p); required for G1/S and G2/M phase transitions and budding; mediates phosphorylation and degradation of Sic1p; modulates proteolysis of M-phase targets through interactions with the proteasome; role in transcriptional regulation, recruiting proteasomal subunits to target gene promoters; human homologs CKS1B and CKS2 can each complement yeast cks1 null mutant -S000032889 CDS YBR135W 2 504854 505306 W 2011-02-03 1997-01-28 -S000000340 ORF Verified YBR136W MEC1 protein kinase MEC1|RAD31|SAD3|ESR1 chromosome 2 L000000586|S000029404|S000007656 2 505668 512774 W 2011-02-03 1997-01-28 Genome integrity checkpoint protein and PI kinase superfamily member; Mec1p and Dun1p function in same pathway to regulate dNTP pools and telomere length; signal transducer required for cell cycle arrest and transcriptional responses to damaged or unreplicated DNA; facilitates replication fork progression and regulates P-body formation under replication stress; promotes interhomolog recombination by phosphorylating Hop1p; associates with shortened, dysfunctional telomeres -S000032977 CDS YBR136W 2 505668 512774 W 2011-02-03 1997-01-28 -S000000341 ORF Verified YBR137W chromosome 2 2 513044 513583 W 2011-02-03 1997-01-28|2011-02-03 Protein with a role in ER delivery of tail-anchored membrane proteins; interacts with Sgt2p; binds to the TRC complex, which inserts proteins into the ER membrane; interacts with Msn5p karyopherin; YBR137W is not an essential gene -S000033068 CDS YBR137W 2 513044 513583 W 2011-02-03 1997-01-28|2011-02-03 -S000000342 ORF Uncharacterized YBR138C HDR1 chromosome 2 L000003401 2 515336 513762 C 2011-02-03 1997-01-28|2011-02-03 Cytoplasmic protein of unknown function; APCC(Cdh1) substrate; potentially phosphorylated by Cdc28p; YBR138C is not an essential gene -S000033676 CDS YBR138C 2 515336 513762 C 2011-02-03 1997-01-28|2011-02-03 -S000000343 ORF Verified YBR139W carboxypeptidase C chromosome 2 2 515664 517190 W 2011-02-03 1997-01-28 Putative serine type carboxypeptidase; role in phytochelatin synthesis; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; expression induced by nitrogen limitation in a GLN3, GAT1-independent manner -S000033849 CDS YBR139W 2 515664 517190 W 2011-02-03 1997-01-28 -S000178050 ARS ARS217 chromosome 2 2 517185 517386 2014-11-18 2014-11-18 Autonomously replicating sequence -S000178051 ARS_consensus_sequence ARS217 2 517263 517247 C 2014-11-18 2014-11-18 -S000000344 ORF Verified YBR140C IRA1 GTPase-activating protein IRA1|PPD1|GLC1 chromosome 2 L000000704|L000000873 2 526628 517350 C 78 2011-02-03 1997-01-28 GTPase-activating protein; negatively regulates RAS by converting it from GTP- to the GDP-bound inactive form, required for reducing cAMP levels under nutrient limiting conditions, mediates membrane association of adenylate cyclase; mutations cause catalase T deficiency, defective glycogen synthesis and defective trehalose accumulation; IRA1 has a paralog, IRA2, that arose from the whole genome duplication; defects in human homolog NF1 are associated with neurofibromatosis -S000034687 CDS YBR140C 2 526628 517350 C 2011-02-03 1997-01-28 -S000028602 ORF Dubious YBR141W-A chromosome 2 2 527167 527262 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized ORF YBR141C; identified by gene-trapping, microarray analysis, and genome-wide homology searching -S000031405 CDS YBR141W-A 2 527167 527262 W 2011-02-03 2003-07-29 -S000000345 ORF Verified YBR141C BMT2 25S rRNA (adenine2142-N1)-methyltransferase chromosome 2 2 528038 527025 C 2011-02-03 1997-01-28|2011-02-03 Nucleolar S-adenosylmethionine-dependent rRNA methyltransferase; methylates adenine (m1A) of the large subunit (LSU) rRNA at position 2142; belongs to Rossmann fold superfamily; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; YBR141C is not an essential gene -S000034839 CDS YBR141C 2 528038 527025 C 2011-02-03 1997-01-28|2011-02-03 -S000000346 ORF Verified YBR142W MAK5 putative ATP-dependent RNA helicase chromosome 2 L000000979 2 528317 530638 W 80 2011-02-03 1997-01-28 Essential nucleolar protein; putative DEAD-box RNA helicase required for maintenance of M1 dsRNA virus; involved in biogenesis of large (60S) ribosomal subunits -S000035850 CDS YBR142W 2 528317 530638 W 2011-02-03 1997-01-28 -S000000347 ORF Verified YBR143C SUP45 translation termination factor eRF1|eRF1|SUP47|SUP1|SAL4 chromosome 2 L000002258|L000002206|S000029305|L000001134 2 532182 530869 C 81 2011-02-03 1997-01-28 Polypeptide release factor (eRF1) in translation termination; mutant form acts as a recessive omnipotent suppressor; methylated by Mtq2p-Trm112p in ternary complex eRF1-eRF3-GTP; mutation of methylation site confers resistance to zymocin; has a role in cytokinesis through interaction with Mlc1p -S000035896 CDS YBR143C 2 532182 530869 C 2011-02-03 1997-01-28 -S000000348 ORF Dubious YBR144C chromosome 2 2 533549 533235 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YBR144C is not an essential gene -S000036039 CDS YBR144C 2 533549 533235 C 2011-02-03 1997-01-28 -S000000349 ORF Verified YBR145W ADH5 alcohol dehydrogenase ADH5 chromosome 2 L000000045 2 533762 534817 W 2011-02-03 1997-01-28 Alcohol dehydrogenase isoenzyme V; involved in ethanol production; ADH5 has a paralog, ADH1, that arose from the whole genome duplication -S000036921 CDS YBR145W 2 533762 534817 W 2011-02-03 1997-01-28 -S000000350 ORF Verified YBR146W MRPS9 mitochondrial 37S ribosomal protein MRPS9 chromosome 2 L000001175 2 535260 536096 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit -S000036972 CDS YBR146W 2 535260 536096 W 2011-02-03 1997-01-28 -S000000351 ORF Verified YBR147W RTC2 cationic amino acid transporter|YPQ3|RRT11 chromosome 2 2 536575 537465 W 2011-02-03 1997-01-28 Putative vacuolar membrane transporter for cationic amino acids; likely contributes to amino acid homeostasis by exporting cationic amino acids from the vacuole; positive regulation by Lys14p suggests that lysine may be the primary substrate; member of the PQ-loop family, with seven transmembrane domains; similar to mammalian PQLC2 vacuolar transporter; RTC2 has a paralog, YPQ1, that arose from the whole genome duplication -S000037067 CDS YBR147W 2 536575 537465 W 2011-02-03 1997-01-28 -S000000352 ORF Verified YBR148W YSW1 chromosome 2 L000002553 2 537876 539705 W 2011-02-03 1997-01-28 Protein required for normal prospore membrane formation; interacts with Gip1p, which is the meiosis-specific regulatory subunit of the Glc7p protein phosphatase; expressed specifically in spores and localizes to the prospore membrane; YSW1 has a paralog, SPO21, that arose from the whole genome duplication -S000037151 CDS YBR148W 2 537876 539705 W 2011-02-03 1997-01-28 -S000000353 ORF Verified YBR149W ARA1 D-arabinose 1-dehydrogenase (NAD(P)(+)) ARA1 chromosome 2 L000004642 2 539987 541021 W 2011-02-03 1997-01-28 NADP+ dependent arabinose dehydrogenase; involved in carbohydrate metabolism; purified as homodimer; naturally occurs with a N-terminus degradation product -S000037890 CDS YBR149W 2 539987 541021 W 2011-02-03 1997-01-28 -S000000354 ORF Verified YBR150C TBS1 chromosome 2 2 544493 541209 C 2011-02-03 1997-01-28 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; TBS1 has a paralog, HAL9, that arose from the whole genome duplication -S000030836 CDS YBR150C 2 544493 541209 C 2011-02-03 1997-01-28 -S000000355 ORF Verified YBR151W APD1 chromosome 2 2 545028 545978 W 2011-02-03 1997-01-28 Protein of unknown function; required for normal localization of actin patches and for normal tolerance of sodium ions and hydrogen peroxide; localizes to both cytoplasm and nucleus -S000030957 CDS YBR151W 2 545028 545978 W 2011-02-03 1997-01-28 -S000000356 ORF Verified YBR152W SPP381 U4/U6-U5 snRNP complex subunit SPP381 chromosome 2 L000004711 2 546376 547251 W 2011-02-03 1997-01-28 mRNA splicing factor, component of U4/U6.U5 tri-snRNP; interacts genetically and physically with Prp38p; relocalizes to the cytosol in response to hypoxia -S000031058 CDS YBR152W 2 546376 547251 W 2011-02-03 1997-01-28 -S000000357 ORF Verified YBR153W RIB7 2,5-diamino-6-(ribosylamino)-4(3H)-pyrimidinone 5'-phosphate reductase chromosome 2 L000001637 2 547460 548194 W 2011-02-03 1997-01-28 Diaminohydroxyphoshoribosylaminopyrimidine deaminase; catalyzes the second step of the riboflavin biosynthesis pathway -S000032010 CDS YBR153W 2 547460 548194 W 2011-02-03 1997-01-28 -S000000358 ORF Verified YBR154C RPB5 DNA-directed RNA polymerase core subunit RPB5|ABC27 chromosome 2 L000001590|L000001679 2 549009 548362 C 2011-02-03 1997-01-28 RNA polymerase subunit ABC27; common to RNA polymerases I, II, and III; contacts DNA and affects transactivation -S000032044 CDS YBR154C 2 549009 548362 C 2011-02-03 1997-01-28 -S000077079 matrix_attachment_site ETC8 ETC8 chromosome 2 2 549229 549251 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; located between divergently transcribed genes RPB5 and CNS1 -S000000359 ORF Verified YBR155W CNS1 HSP70/90 family co-chaperone CNS1 chromosome 2 L000004495 2 549771 550928 W 2011-02-03 1997-01-28 TPR-containing co-chaperone; binds both Hsp82p (Hsp90) and Ssa1p (Hsp70); stimulates ATPase activity of Ssa1p; ts mutants reduce Hsp82p function, overexpression suppresses phenotypes of HSP82 ts allele and cpr7 deletion; human homolog TTC4 complements yeast cns1 mutant -S000032166 CDS YBR155W 2 549771 550928 W 2011-02-03 1997-01-28 -S000000360 ORF Verified YBR156C SLI15 chromosome 2 L000003320 2 553200 551104 C 2011-02-03 1997-01-28 Subunit of the conserved chromosomal passenger complex (CPC); complex regulates kinetochore-microtubule attachments, activation of the spindle tension checkpoint, and mitotic spindle disassembly; other complex members are Ipl1p, Bir1p, and Nbl1p -S000032209 CDS YBR156C 2 553200 551104 C 2011-02-03 1997-01-28 -S000000361 ORF Verified YBR157C ICS2 chromosome 2 2 554310 553543 C 2011-02-03 2004-01-21|1997-01-28 Protein of unknown function; null mutation does not confer any obvious defects in growth, spore germination, viability, or carbohydrate utilization -S000032276 CDS YBR157C 2 554310 553543 C 2011-02-03 2004-01-21|1997-01-28 -S000000362 ORF Verified YBR158W AMN1 CST13|ICS4 chromosome 2 L000002997 2 556549 558198 W 2011-02-03 1997-01-28 Protein required for daughter cell separation; multiple mitotic checkpoints, and chromosome stability; contains 12 degenerate leucine-rich repeat motifs; expression is induced by the Mitotic Exit Network (MEN) -S000033182 CDS YBR158W 2 556549 558198 W 2011-02-03 1997-01-28 -S000000363 ORF Verified YBR159W IFA38 ketoreductase chromosome 2 2 558685 559728 W 2011-02-03 1997-01-28 Microsomal beta-keto-reductase; contains oleate response element (ORE) sequence in the promoter region; mutants exhibit reduced VLCFA synthesis, accumulate high levels of dihydrosphingosine, phytosphingosine and medium-chain ceramides -S000033243 CDS YBR159W 2 558685 559728 W 2011-02-03 1997-01-28 -S000000364 ORF Verified YBR160W CDC28 cyclin-dependent serine/threonine-protein kinase CDC28|SRM5|HSL5|CDK1 chromosome 2 L000000267 2 560078 560974 W 90 2011-02-03 1997-01-28 Cyclin-dependent kinase (CDK) catalytic subunit; master regulator of mitotic and meiotic cell cycles; alternately associates with G1, S, G2/M phase cyclins, which provide substrate specificity; regulates metabolism, basal transcription, chromosome dynamics, growth and morphogenesis; transcript induction in osmostress involves antisense RNA; human homologs CDK1, CDK2, CDK3 can complement yeast conditional cdc28 mutants; human CDK1, CDK2 can complement yeast cdc28 null mutant -S000035243 CDS YBR160W 2 560078 560974 W 2011-02-03 1997-01-28 -S000000365 ORF Verified YBR161W CSH1 mannosylinositol phosphorylceramide synthase catalytic subunit CSH1 chromosome 2 2 561634 562764 W 2011-02-03 1997-01-28 Mannosylinositol phosphorylceramide (MIPC) synthase catalytic subunit; forms a complex with regulatory subunit Csg2p; function in sphingolipid biosynthesis is overlapping with that of Sur1p; CSH1 has a paralog, SUR1, that arose from the whole genome duplication -S000035322 CDS YBR161W 2 561634 562764 W 2011-02-03 1997-01-28 -S000000366 ORF Verified YBR162C TOS1 chromosome 2 2 564570 563203 C 2011-02-03 1997-01-28 Covalently-bound cell wall protein of unknown function; identified as a cell cycle regulated SBF target gene; deletion mutants are highly resistant to treatment with beta-1,3-glucanase; has sequence similarity to YJL171C -S000035351 CDS YBR162C 2 564570 563203 C 2011-02-03 1997-01-28 -S000002158 ORF Verified YBR162W-A YSY6 chromosome 2 L000002554 2 565231 565428 W 2011-02-03 1997-01-28 Protein of unknown function; expression suppresses a secretory pathway mutation in E. coli; has similarity to the mammalian RAMP4 protein involved in secretion -S000032375 CDS YBR162W-A 2 565231 565428 W 2011-02-03 1997-01-28 -S000000367 ORF Verified YBR163W EXO5 DEM1 chromosome 2 2 565723 567480 W 2011-02-03 1997-01-28 Mitochondrial 5'-3' exonuclease and sliding exonuclease; required for mitochondrial genome maintenance; distantly related to the RecB nuclease domain of bacterial RecBCD recombinases; may be regulated by the transcription factor Ace2 -S000035461 CDS YBR163W 2 565723 567480 W 2011-02-03 1997-01-28 -S000000368 ORF Verified YBR164C ARL1 Arf family GTPase ARL1|DLP2 chromosome 2 L000002832 2 568426 567875 C 2011-02-03 1997-01-28 Soluble GTPase with a role in regulation of membrane traffic; regulates potassium influx; role in membrane organization at trans-Golgi network; required for delivery of Atg9p to the phagophore assembly site during autophagy under high temperature stress; required with Ypt6p for starvation-induced autophagy; required for the CVT pathway under non-starvation conditions; G protein of the Ras superfamily, similar to ADP-ribosylation factor -S000036313 CDS YBR164C 2 568426 567875 C 2011-02-03 1997-01-28 -S000000369 ORF Verified YBR165W UBS1 chromosome 2 L000003544 2 568852 569685 W 2011-02-03 1997-01-28 Ubiquitin-conjugating enzyme suppressor that regulates Cdc34p; functions as a general positive regulator of Cdc34p activity; nuclear protein that may represent a link between nucleocytoplasmic transport and ubiquitin ligase activity -S000036458 CDS YBR165W 2 568852 569685 W 2011-02-03 1997-01-28 -S000000370 ORF Verified YBR166C TYR1 prephenate dehydrogenase (NADP(+)) chromosome 2 L000002359|L000002402 2 571200 569842 C 97 2011-02-03 1997-01-28 Prephenate dehydrogenase involved in tyrosine biosynthesis; expression is dependent on phenylalanine levels -S000036504 CDS YBR166C 2 571200 569842 C 2011-02-03 1997-01-28 -S000000371 ORF Verified YBR167C POP7 ribonuclease P/MRP protein subunit POP7|RPP2 chromosome 2 L000004303|L000004505 2 571890 571468 C 2011-02-03 1997-01-28 Subunit of RNase MRP, nuclear RNase P and telomerase; forms a soluble heterodimer with Pop6p that binds P3 domain of RNase MRP and RNase P RNAs; RNase MRP cleaves pre-rRNA, nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs, while telomerase replenishes telomeric DNA -S000036597 CDS YBR167C 2 571890 571468 C 2011-02-03 1997-01-28 -S000000372 ORF Verified YBR168W PEX32 chromosome 2 2 572371 573612 W 2011-02-03 1997-01-28 Peroxisomal integral membrane protein; involved in negative regulation of peroxisome size; partially functionally redundant with Pex31p; genetic interactions suggest action at a step downstream of steps mediated by Pex28p and Pex29p -S000037359 CDS YBR168W 2 572371 573612 W 2011-02-03 1997-01-28 -S000000373 ORF Verified YBR169C SSE2 adenyl-nucleotide exchange factor SSE2 chromosome 2 L000002079 2 575996 573915 C 2011-02-03 1997-01-28 Member of Hsp110 subclass of the heat shock protein 70 (HSP70) family; serves as nucleotide exchange factor to load ATP onto the SSA class of cytosolic Hsp70s; may be involved in protein folding; localized to the cytoplasm; SSE2 has a paralog, SSE1, that arose from the whole genome duplication -S000037401 CDS YBR169C 2 575996 573915 C 2011-02-03 1997-01-28 -S000000374 ORF Verified YBR170C NPL4 HRD4 chromosome 2 L000001271 2 578086 576344 C 2011-02-03 1997-01-28 Substrate-recruiting cofactor of the Cdc48p-Npl4p-Ufd1p segregase; assists Cdc48p in the dislocation of misfolded, polyubiquitinated ERAD substrates that are subsequently delivered to the proteasome for degradation; also involved in the regulated destruction of resident ER membrane proteins, such as HMG-CoA reductase (Hmg1/2p) and cytoplasmic proteins (Fbp1p); role in mobilizing membrane bound transcription factors by regulated ubiquitin/proteasome-dependent processing (RUP) -S000030469 CDS YBR170C 2 578086 576344 C 2011-02-03 1997-01-28 -S000000375 ORF Verified YBR171W SEC66 KAR7|Sec63 complex subunit SEC66|SEC71|HSS1 chromosome 2 L000001856 2 578364 578984 W 2011-02-03 1997-01-28 Non-essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; other members are Sec63p, Sec62p, and Sec72p -S000030603 CDS YBR171W 2 578364 578984 W 2011-02-03 1997-01-28 -S000000376 ORF Verified YBR172C SMY2 chromosome 2 L000001941 2 581372 579150 C 2011-02-03 2003-09-22|1997-01-28 GYF domain protein; involved in COPII vesicle formation; interacts with the Sec23p/Sec24p subcomplex; overexpression suppresses the temperature sensitivity of a myo2 mutant; similar to S. pombe Mpd2; SMY2 has a paralog, SYH1, that arose from the whole genome duplication -S000030643 CDS YBR172C 2 581372 579150 C 2011-02-03 2003-09-22|1997-01-28 -S000000377 ORF Verified YBR173C UMP1 RNS2 chromosome 2 L000004429 2 582172 581726 C 2011-02-03 1997-01-28 Chaperone required for correct maturation of the 20S proteasome; short-lived chaperone; may inhibit premature dimerization of proteasome half-mers; degraded by proteasome upon completion of its assembly -S000030726 CDS YBR173C 2 582172 581726 C 2011-02-03 1997-01-28 -S000000379 ORF Verified YBR175W SWD3 SAF35|CPS30 chromosome 2 2 582408 583355 W 2011-02-03 1997-01-28 Essential subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3 on lysine 4 and is required in transcriptional silencing near telomeres; WD40 beta propeller superfamily member and ortholog of mammalian WDR5 -S000031715 CDS YBR175W 2 582408 583355 W 2011-02-03 1997-01-28 -S000000378 ORF Dubious YBR174C chromosome 2 2 582652 582338 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YBR175W; null mutant is viable and sporulation defective -S000031563 CDS YBR174C 2 582652 582338 C 2011-02-03 1997-01-28 -S000000380 ORF Verified YBR176W ECM31 3-methyl-2-oxobutanoate hydroxymethyltransferase chromosome 2 L000003901 2 583720 584658 W 2011-02-03 1997-01-28 Ketopantoate hydroxymethyltransferase; required for pantothenic acid biosynthesis, converts 2-oxoisovalerate into 2-dehydropantoate -S000031869 CDS YBR176W 2 583720 584658 W 2011-02-03 1997-01-28 -S000000382 ORF Dubious YBR178W chromosome 2 2 586071 586445 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YBR177C -S000032865 CDS YBR178W 2 586071 586445 W 2011-02-03 1997-01-28 -S000000381 ORF Verified YBR177C EHT1 medium-chain fatty acid ethyl ester synthase/esterase chromosome 2 2 586162 584807 C 2011-02-03 1997-01-28 Acyl-coenzymeA:ethanol O-acyltransferase; plays a minor role in medium-chain fatty acid ethyl ester biosynthesis; possesses short-chain esterase activity; localizes to lipid particles and the mitochondrial outer membrane; EHT1 has a paralog, EEB1, that arose from the whole genome duplication -S000031916 CDS YBR177C 2 586162 584807 C 2011-02-03 1997-01-28 -S000000383 ORF Verified YBR179C FZO1 mitofusin chromosome 2 L000004083 2 589114 586547 C 2011-02-03 1997-01-28 Mitofusin; integral membrane protein involved in mitochondrial outer membrane tethering and fusion; role in mitochondrial genome maintenance; efficient tethering and degradation of Fzo1p requires an intact N-terminal GTPase domain; targeted for destruction by the ubiquitin ligase SCF-Mdm30p and the cytosolic ubiquitin-proteasome system -S000032906 CDS YBR179C 2 589114 586547 C 2011-02-03 1997-01-28 -S000000384 ORF Verified YBR180W DTR1 chromosome 2 2 589741 591459 W 2011-02-03 1997-01-28 Putative dityrosine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; required for spore wall synthesis; sequence similarity to QDR1 and QDR3, and the triple mutant dtr1 qdr1 qdr3 exhibits reduced dityrosine fluorescence relative to the single mutants; expressed during sporulation -S000035007 CDS YBR180W 2 589741 591459 W 2011-02-03 1997-01-28 -S000000385 ORF Verified YBR181C RPS6B eS6|ribosomal 40S subunit protein S6B|S6e|RPS102|RPS101|LPG18 chromosome 2 L000002721 2 592774 591712 C 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S6, no bacterial homolog; phosphorylated on S233 by Ypk3p in a TORC1-dependent manner, and on S232 in a TORC1/2-dependent manner by Ypk1/2/3p; RPS6B has a paralog, RPS6A, that arose from the whole genome duplication -S000035075 CDS YBR181C 2 592416 591712 C 2011-02-03 1997-01-28 -S000035074 CDS YBR181C 2 592774 592769 C 2011-02-03 1997-01-28 -S000035076 intron YBR181C 2 592768 592417 C 2011-02-03 1997-01-28 -S000000386 ORF Verified YBR182C SMP1 chromosome 2 L000004146 2 594864 593506 C 2011-02-03 1997-01-28 MADS-box transcription factor involved in osmotic stress response; SMP1 has a paralog, RLM1, that arose from the whole genome duplication -S000035193 CDS YBR182C 2 594864 593506 C 2011-02-03 1997-01-28 -S000028603 ORF Uncharacterized YBR182C-A chromosome 2 2 595555 595361 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031408 CDS YBR182C-A 2 595555 595361 C 2011-02-03 2003-07-29 -S000000387 ORF Verified YBR183W YPC1 phytoceramidase chromosome 2 2 596115 597065 W 2011-02-03 1997-01-28 Alkaline ceramidase; also has reverse (CoA-independent) ceramide synthase activity; catalyzes both breakdown and synthesis of phytoceramide; overexpression confers fumonisin B1 resistance; YPC1 has a paralog, YDC1, that arose from the whole genome duplication -S000036119 CDS YBR183W 2 596115 597065 W 2011-02-03 1997-01-28 -S000000388 ORF Uncharacterized YBR184W chromosome 2 2 597363 598934 W 2011-02-03 1997-01-28 Putative protein of unknown function; YBR184W is not an essential gene -S000036220 CDS YBR184W 2 597363 598934 W 2011-02-03 1997-01-28 -S000000389 ORF Verified YBR185C MBA1 chromosome 2 L000002809 2 599959 599123 C 2011-02-03 1997-01-28 Membrane-associated mitochondrial ribosome receptor; forms a complex with Mdm38p that may facilitate recruitment of mRNA-specific translational activators to ribosomes; possible role in protein export from the matrix to inner membrane -S000036261 CDS YBR185C 2 599959 599123 C 2011-02-03 1997-01-28 -S000000390 ORF Verified YBR186W PCH2 chromosome 2 L000004274 2 600553 602360 W 2011-02-03 2000-07-14|1997-01-28 Hexameric ring ATPase that remodels chromosome axis protein Hop1p; nucleolar component of the pachytene checkpoint, which prevents chromosome segregation when recombination and chromosome synapsis are defective; also represses meiotic interhomolog recombination in rDNA; required for meiotic double-stranded break formation -S000036993 CDS YBR186W 2 600553 602103 W 2011-02-03 2000-07-14|1997-01-28 -S000036994 CDS YBR186W 2 602217 602360 W 2011-02-03 2000-07-14 -S000036995 intron YBR186W 2 602104 602216 W 2011-02-03 2000-07-14 -S000000391 ORF Verified YBR187W GDT1 putative ribosome biosynthesis protein GDT1 chromosome 2 2 602634 603476 W 2011-02-03 1997-01-28 Calcium transporter localized to the cis- and medial-Golgi apparatus; required for protein glycosylation; GFP-fusion protein localizes to the vacuole; TMEM165, a human gene which causes Congenital Disorders of Glycosylation is orthologous and functionally complements the null allele; expression pattern and physical interactions suggest a possible role in ribosome biogenesis; expression reduced in a gcr1 null mutant -S000037050 CDS YBR187W 2 602634 603476 W 2011-02-03 1997-01-28 -S000000392 ORF Verified YBR188C NTC20 chromosome 2 L000004267 2 604107 603685 C 2011-02-03 1997-01-28 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs -S000037089 CDS YBR188C 2 604107 603685 C 2011-02-03 1997-01-28 -S000000393 ORF Verified YBR189W RPS9B ribosomal 40S subunit protein S9B|rp21|YS11|S9B|S4|S13|SUP46|RPS13A chromosome 2 L000002207|S000029306|L000001135 2 604508 605508 W 106 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S9 and bacterial S4; RPS9B has a paralog, RPS9A, that arose from the whole genome duplication -S000037264 CDS YBR189W 2 604508 604514 W 2011-02-03 1997-01-28 -S000037265 CDS YBR189W 2 604928 605508 W 2011-02-03 1997-01-28 -S000037266 intron YBR189W 2 604515 604927 W 2011-02-03 1997-01-28 -S000000394 ORF Dubious YBR190W chromosome 2 2 605966 606277 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ribosomal protein gene RPL21A/YBR191W -S000029997 CDS YBR190W 2 605966 606277 W 2011-02-03 1997-01-28 -S000000395 ORF Verified YBR191W RPL21A eL21|ribosomal 60S subunit protein L21A|L21e|L21A|URP1 chromosome 2 L000002441 2 606270 607140 W 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L21A; homologous to mammalian ribosomal protein L21, no bacterial homolog; RPL21A has a paralog, RPL21B, that arose from the whole genome duplication -S000030992 CDS YBR191W 2 606270 606280 W 2011-02-03 1997-01-28 -S000030993 CDS YBR191W 2 606669 607140 W 2011-02-03 1997-01-28 -S000030994 intron YBR191W 2 606281 606668 W 2011-02-03 1997-01-28 -S000007594 ORF Dubious YBR191W-A chromosome 2 2 607149 607223 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037106 CDS YBR191W-A 2 607149 607223 W 2011-02-03 2001-02-26 -S000000396 ORF Verified YBR192W RIM2 PYT1 chromosome 2 L000001641 2 607652 608785 W 2011-02-03 1997-01-28 Mitochondrial pyrimidine nucleotide transporter; imports pyrimidine nucleoside triphosphates and exports pyrimidine nucleoside monophosphates; member of the mitochondrial carrier family -S000031077 CDS YBR192W 2 607652 608785 W 2011-02-03 1997-01-28 -S000000397 ORF Verified YBR193C MED8 chromosome 2 L000003917 2 609753 609082 C 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation -S000031128 CDS YBR193C 2 609753 609082 C 2011-02-03 1997-01-28 -S000000398 ORF Verified YBR194W AIM4 SOY1 chromosome 2 2 610038 610409 W 2011-02-03 1997-01-28 Protein proposed to be associated with the nuclear pore complex; null mutant is viable, displays elevated frequency of mitochondrial genome loss and is sensitive to freeze-thaw stress -S000032148 CDS YBR194W 2 610038 610409 W 2011-02-03 1997-01-28 -S000000399 ORF Verified YBR195C MSI1 CAC3 chromosome 2 L000001193 2 611882 610614 C 89 2011-02-03 1997-01-28 Subunit of chromatin assembly factor I (CAF-1); chromatin assembly by CAF-1 affects multiple processes including silencing at telomeres, mating type loci, and rDNA; maintenance of kinetochore structure; deactivation of DNA damage checkpoint after DNA repair; chromatin dynamics during transcription; and repression of divergent noncoding transcription; Msi1p localizes to nucleus and cytoplasm and independently regulates the RAS/cAMP pathway via sequestration of Npr1p kinase -S000032175 CDS YBR195C 2 611882 610614 C 2011-02-03 1997-01-28 -S000000400 ORF Verified YBR196C PGI1 glucose-6-phosphate isomerase|CDC30 chromosome 2 L000001410|L000001409 2 613900 612236 C 89 2011-02-03 1997-01-28 Glycolytic enzyme phosphoglucose isomerase; catalyzes the interconversion of glucose-6-phosphate and fructose-6-phosphate; required for cell cycle progression and completion of the gluconeogenic events of sporulation -S000032251 CDS YBR196C 2 613900 612236 C 2011-02-03 1997-01-28 -S000028534 ORF Uncharacterized YBR196C-A chromosome 2 2 614173 614024 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031143 CDS YBR196C-A 2 614173 614024 C 2011-02-03 2003-07-29 -S000028816 ORF Uncharacterized YBR196C-B chromosome 2 2 614630 614526 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000033621 CDS YBR196C-B 2 614630 614526 C 2011-02-03 2003-07-29 -S000000401 ORF Verified YBR197C chromosome 2 2 615856 615203 C 2011-02-03 1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YBR197C is not an essential gene; relative distribution to the nucleus increases upon DNA replication stress; YBR197C has a paralog, YPL077C, that arose from the whole genome duplication -S000032354 CDS YBR197C 2 615856 615203 C 2011-02-03 1997-01-28 -S000000402 ORF Verified YBR198C TAF5 chromatin modification protein|TafII90|TAF90 chromosome 2 L000004155 2 618523 616127 C 2011-02-03 1997-01-28 Subunit (90 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification -S000033223 CDS YBR198C 2 618523 616127 C 2011-02-03 1997-01-28 -S000000403 ORF Verified YBR199W KTR4 putative mannosyltransferase chromosome 2 L000000927 2 618909 620303 W 2011-02-03 1997-01-28 Glycosyltransferase involved in protein glycosylation; transfers GDP-mannose to methyl-alpha-mannoside in vitro; member of the KRE2/MNT1 mannosyltransferase family of type II membrane proteins with a short cytoplasmic N-terminus, a membrane-spanning region and a highly conserved catalytic lumenal domain -S000033316 CDS YBR199W 2 618909 620303 W 2011-02-03 1997-01-28 -S000000404 ORF Verified YBR200W BEM1 phosphatidylinositol-3-phosphate-binding protein BEM1|SRO1 chromosome 2 L000000167 2 620872 622527 W 102 2011-02-03 1997-01-28 Protein containing SH3-domains; involved in establishing cell polarity and morphogenesis; functions as a scaffold protein for complexes that include Cdc24p, Ste5p, Ste20p, and Rsr1p -S000030486 CDS YBR200W 2 620872 622527 W 2011-02-03 1997-01-28 -S000118351 ARS ARS220 ARSII-623 chromosome 2 2 622671 622939 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000028535 ORF Uncharacterized YBR200W-A chromosome 2 2 622983 623147 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031144 CDS YBR200W-A 2 622983 623147 W 2011-02-03 2003-07-29 -S000000405 ORF Verified YBR201W DER1 derlin chromosome 2 L000002800 2 623576 624211 W 2011-02-03 1999-04-26|1997-01-28 ER membrane protein that promotes export of misfolded polypeptides; required for ER-associated protein degradation of misfolded or unassembled proteins; initiates export of aberrant polypeptides from ER lumen by threading them into ER membrane and routing them to Hrd1p for ubiquitination; function normally requires N-terminal acetylation by NatB; N- and C- termini protrude into cytoplasm; similar to Dfm1p; homolog of mammalian derlin-1 -S000030597 CDS YBR201W 2 623576 624211 W 2011-02-03 1999-04-26|1997-01-28 -S000087085 ORF Uncharacterized YBR201C-A chromosome 2 2 624696 624493 C 2011-02-03 2005-11-08 Putative protein of unknown function -S000087086 CDS YBR201C-A 2 624696 624493 C 2011-02-03 2005-11-08 -S000000406 ORF Verified YBR202W MCM7 mini-chromosome maintenance complex protein 7|CDC47 chromosome 2 L000002760 2 625772 628309 W 2011-02-03 1997-01-28|2011-02-03 Component of the Mcm2-7 hexameric helicase complex; MCM2-7 primes origins of DNA replication in G1 and becomes an active ATP-dependent helicase that promotes DNA melting and elongation in S-phase; forms an Mcm4p-6p-7p subcomplex -S000030677 CDS YBR202W 2 625772 628309 W 2011-02-03 1997-01-28|2011-02-03 -S000000407 ORF Verified YBR203W COS111 chromosome 2 2 629168 631942 W 2011-02-03 1997-01-28|2011-02-03 Protein required for antifungal drug ciclopirox olamine resistance; not related to the subtelomerically-encoded COS family; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000031550 CDS YBR203W 2 629168 631942 W 2011-02-03 1997-01-28|2011-02-03 -S000130153 ARS ARS221 ARSII-632 chromosome 2 2 631939 632251 2011-02-03 2009-05-07|2011-02-03 Autonomously Replicating Sequence -S000178052 ARS_consensus_sequence ARS221 2 632005 632021 W 2014-11-18 2014-11-18 -S000000408 ORF Verified YBR204C LDH1 triacylglycerol lipase chromosome 2 2 633381 632254 C 2011-02-03 1997-01-28|2011-02-03 Serine hydrolase; exhibits active esterase plus weak triacylglycerol lipase activities; proposed role in lipid homeostasis, regulating phospholipid and non-polar lipid levels and required for mobilization of LD-stored lipids; localizes to the lipid droplet (LD) surface; contains a classical serine containing catalytic triad (GxSxG motif) -S000031575 CDS YBR204C 2 633381 632254 C 2011-02-03 1997-01-28|2011-02-03 -S000000409 ORF Verified YBR205W KTR3 mannosyltransferase KTR3 chromosome 2 L000000926 2 633622 634836 W 2011-02-03 1997-01-28 Putative alpha-1,2-mannosyltransferase; involved in O- and N-linked protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; Svp26p mediates uptake of Ktr3p into COPII vesicles; relocalizes from nucleus to vacuole upon DNA replication stress -S000031710 CDS YBR205W 2 633622 634836 W 2011-02-03 1997-01-28 -S000000410 ORF Dubious YBR206W chromosome 2 2 634601 634924 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene KTR3 -S000031861 CDS YBR206W 2 634601 634924 W 2011-02-03 1997-01-28 -S000000411 ORF Verified YBR207W FTH1 chromosome 2 L000003065 2 635146 636543 W 2011-02-03 1997-01-28|2011-02-03 Putative high affinity iron transporter; involved in transport of intravacuolar stores of iron; forms complex with Fet5p; expression is regulated by iron; proposed to play indirect role in endocytosis; protein abundance increases in response to DNA replication stress -S000032783 CDS YBR207W 2 635146 636543 W 2011-02-03 1997-01-28|2011-02-03 -S000000412 ORF Verified YBR208C DUR1,2 bifunctional urea carboxylase/allophanate hydrolase|DUR80 chromosome 2 L000000532|L000000533|L000000536 2 642210 636703 C 112 2011-02-03 1997-01-28 Urea amidolyase; contains both urea carboxylase and allophanate hydrolase activities, degrades urea to CO2 and NH3; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation; protein abundance increases in response to DNA replication stress -S000032849 CDS YBR208C 2 642210 636703 C 2011-02-03 1997-01-28 -S000000413 ORF Dubious YBR209W chromosome 2 2 642583 642900 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YBR209W is not an essential gene -S000032978 CDS YBR209W 2 642583 642900 W 2011-02-03 1997-01-28 -S000006526 tRNA_gene tC(GCA)B chromosome 2 L000003748 2 643078 643007 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis -S000035208 noncoding_exon tC(GCA)B 2 643078 643007 C 2011-02-03 2000-05-19 -S000006820 long_terminal_repeat YBRCtau2 YBRWtau2 chromosome 2 2 643858 643488 C 2011-02-03 2000-05-19|2007-04-05 Ty4 LTR -S000006812 long_terminal_repeat YBRWdelta18 YBRCdelta18 chromosome 2 2 643859 644002 W 2011-02-03 2000-05-19 Ty1 LTR -S000006813 long_terminal_repeat YBRCdelta19 chromosome 2 2 644603 644362 C 2011-02-03 2000-05-19|2007-04-05 Ty1 LTR -S000006548 tRNA_gene tE(UUC)B chromosome 2 L000003747 2 645167 645238 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000035972 noncoding_exon tE(UUC)B 2 645167 645238 W 2011-02-03 2000-05-19 -S000000414 ORF Verified YBR210W ERV15 chromosome 2 2 645550 645978 W 2011-02-03 1997-01-28 Protein involved in export of proteins from the endoplasmic reticulum; ERV15 has a paralog, ERV14, that arose from the whole genome duplication -S000033653 CDS YBR210W 2 645550 645978 W 2011-02-03 1997-01-28 -S000000415 ORF Verified YBR211C AME1 ARP100 chromosome 2 L000004725 2 647132 646158 C 2011-02-03 1997-01-28 Essential kinetochore protein associated with microtubules and SPBs; component of the kinetochore sub-complex COMA (Ctf19p, Okp1p, Mcm21p, Ame1p); involved in spindle checkpoint maintenance; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-U and fission yeast Mis17; relative distribution to the nucleus increases upon DNA replication stress -S000033678 CDS YBR211C 2 647132 646158 C 2011-02-03 1997-01-28 -S000000416 ORF Verified YBR212W NGR1 RBP1 chromosome 2 L000001242 2 647886 649904 W 2011-02-03 1997-01-28 RNA binding protein that negatively regulates growth rate; interacts with the 3' UTR of the mitochondrial porin (POR1) mRNA and enhances its degradation; overexpression impairs mitochondrial function; interacts with Dhh1p to mediate POR1 mRNA decay; expressed in stationary phase -S000034651 CDS YBR212W 2 647886 649904 W 2011-02-03 1997-01-28 -S000000417 ORF Verified YBR213W MET8 bifunctional precorrin-2 dehydrogenase/sirohydrochlorin ferrochelatase MET8 chromosome 2 L000001083 2 650368 651192 W 119 2011-02-03 1997-01-28 Bifunctional dehydrogenase and ferrochelatase; involved in the biosynthesis of siroheme, a prosthetic group used by sulfite reductase; required for sulfate assimilation and methionine biosynthesis -S000034801 CDS YBR213W 2 650368 651192 W 2011-02-03 1997-01-28 -S000000418 ORF Verified YBR214W SDS24 chromosome 2 L000004811 2 651415 652998 W 2011-02-03 1997-01-28 Protein involved in cell separation during budding; one of two S. cerevisiae homologs (Sds23p and Sds24p) of the S. pombe Sds23 protein, which is implicated in APC/cyclosome regulation; may play an indirect role in fluid-phase endocytosis; protein abundance increases in response to DNA replication stress; SDS24 has a paralog, SDS23, that arose from the whole genome duplication -S000034936 CDS YBR214W 2 651415 652998 W 2011-02-03 1997-01-28 -S000000419 ORF Verified YBR215W HPC2 chromosome 2 L000000804 2 653356 655317 W 2011-02-03 1997-01-28|2007-07-09 Subunit of the HIR complex; HIR is a nucleosome assembly complex involved in regulation of histone gene transcription; mutants display synthetic defects with subunits of FACT, a complex that allows passage of RNA Pol II through nucleosomes -S000035856 CDS YBR215W 2 653356 653368 W 2011-02-03 1997-01-28|2007-07-09 -S000123275 CDS YBR215W 2 653453 655317 W 2011-02-03 2007-07-09 -S000123274 intron YBR215W 2 653369 653452 W 2011-02-03 2007-07-09 -S000000420 ORF Verified YBR216C YBP1 chromosome 2 2 657600 655576 C 2011-02-03 1997-01-28 Protein involved in cellular response to oxidative stress; required for oxidation of specific cysteine residues of transcription factor Yap1p, resulting in nuclear localization of Yap1p in response to stress; YBP1 has a paralog, YBP2, that arose from the whole genome duplication -S000035897 CDS YBR216C 2 657600 655576 C 2011-02-03 1997-01-28 -S000000421 ORF Verified YBR217W ATG12 APG12 chromosome 2 L000004702 2 657832 658392 W 2011-02-03 1997-01-28 Ubiquitin-like modifier involved in autophagy and the Cvt pathway; conserved; conjugated to Atg5p to form a complex involved in Atg8p lipidation; Atg5p-Atg12p conjugate enhances E2 activity of Atg3p by rearranging its catalytic site, also forms a complex with Atg16p; the Atg5-Atg12/Atg16 complex binds to membranes and is essential for autophagosome formation -S000036158 CDS YBR217W 2 657832 658392 W 2011-02-03 1997-01-28 -S000000422 ORF Verified YBR218C PYC2 pyruvate carboxylase 2 chromosome 2 L000001543 2 662249 658707 C 2011-02-03 1997-01-28 Pyruvate carboxylase isoform; cytoplasmic enzyme that converts pyruvate to oxaloacetate; differentially regulated than isoform Pyc1p; mutations in the human homolog are associated with lactic acidosis; PYC2 has a paralog, PYC1, that arose from the whole genome duplication -S000036216 CDS YBR218C 2 662249 658707 C 2011-02-03 1997-01-28 -S000000423 ORF Uncharacterized YBR219C chromosome 2 2 663303 662499 C 2011-02-03 1997-01-28 Putative protein of unknown function; YBR219C is not an essential gene -S000036941 CDS YBR219C 2 662581 662499 C 2011-02-03 1997-01-28 -S000036940 CDS YBR219C 2 663303 663003 C 2011-02-03 1997-01-28 -S000036942 intron YBR219C 2 663002 662582 C 2011-02-03 1997-01-28 -S000000424 ORF Uncharacterized YBR220C chromosome 2 2 664677 662995 C 2011-02-03 1997-01-28 Putative protein of unknown function; YBR220C is not an essential gene -S000037728 CDS YBR220C 2 664677 662995 C 2011-02-03 1997-01-28 -S000000425 ORF Verified YBR221C PDB1 pyruvate dehydrogenase (acetyl-transferring) subunit E1 beta chromosome 2 L000001353 2 666253 665153 C 2011-02-03 1997-01-28 E1 beta subunit of the pyruvate dehydrogenase (PDH) complex; PDH is an evolutionarily conserved multi-protein complex found in mitochondria -S000037817 CDS YBR221C 2 666253 665153 C 2011-02-03 1997-01-28 -S000028817 ORF Uncharacterized YBR221W-A chromosome 2 2 666538 666642 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000033623 CDS YBR221W-A 2 666538 666642 W 2011-02-03 2003-07-29 -S000000426 ORF Verified YBR222C PCS60 FAT2 chromosome 2 L000003238 2 668351 666720 C 2011-02-03 1997-01-28 Oxalyl-CoA synthetase; capable of catalyzing conversion of oxalate to oxalyl-CoA; catalyzes first step in pathway of oxalate degradation that functions to protect yeast from inhibitory effects of oxalate; peroxisomal protein that binds mRNA; localizes to both peroxisomal peripheral membrane and matrix, expression is highly inducible by oleic acid; similar to E. coli long chain acyl-CoA synthetase -S000029826 CDS YBR222C 2 668351 666720 C 2011-02-03 1997-01-28 -S000028604 ORF Dubious YBR223W-A chromosome 2 2 668721 668840 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps YBR223C; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031411 CDS YBR223W-A 2 668721 668840 W 2011-02-03 2003-07-29 -S000000428 ORF Dubious YBR224W chromosome 2 2 670125 670640 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene TDP1 -S000030960 CDS YBR224W 2 670125 670640 W 2011-02-03 1997-01-28 -S000000427 ORF Verified YBR223C TDP1 tyrosyl-DNA phosphodiesterase 1 chromosome 2 S000007461 2 670297 668663 C 2011-02-03 1997-01-28 Tyrosyl-DNA phosphodiesterase I; hydrolyzes 3' and 5'-phosphotyrosyl bonds; involved in the repair of DNA lesions created by topo I and topo II; mutations in the human homolog, TDP1, result in the a neurodegenerative disease, spinocerebellar ataxia with axonal neuropathy (SCAN1); yeast cells and human rhabdomyosarcoma lines that overexpress TDP1 both exhibit elevated dosage chromosomal instability (dCIN) -S000030837 CDS YBR223C 2 670297 668663 C 2011-02-03 1997-01-28 -S000000429 ORF Uncharacterized YBR225W chromosome 2 2 670627 673329 W 2011-02-03 1997-01-28 Putative protein of unknown function; non-essential gene identified in a screen for mutants affected in mannosylphophorylation of cell wall components -S000031063 CDS YBR225W 2 670627 673329 W 2011-02-03 1997-01-28 -S000000430 ORF Dubious YBR226C chromosome 2 2 673565 673155 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YBR225W -S000031074 CDS YBR226C 2 673565 673155 C 2011-02-03 1997-01-28 -S000000431 ORF Verified YBR227C MCX1 chromosome 2 2 675134 673572 C 2011-02-03 1997-01-28 Non-proteolytic ATPase of the AAA family; stimulates incorporation of the pyridoxal phosphate cofactor into Hem1p (5-aminolevulinic acid synthase); localized to the mitochondrial matrix; ortholog of vertebrate CLPX, which promotes erythropoiesis -S000032046 CDS YBR227C 2 675134 673572 C 2011-02-03 1997-01-28 -S000000432 ORF Verified YBR228W SLX1 endonuclease chromosome 2 2 675313 676227 W 2011-02-03 1997-01-28 Endonuclease involved in DNA recombination and repair; subunit of a complex, with Slx4p, that hydrolyzes 5' branches from duplex DNA in response to stalled or converging replication forks; function overlaps with that of Sgs1p-Top3p -S000032169 CDS YBR228W 2 675313 676227 W 2011-02-03 1997-01-28 -S000000433 ORF Verified YBR229C ROT2 glucan 1,3-alpha-glucosidase ROT2|GLS2 chromosome 2 L000003405 2 679221 676357 C 2011-02-03 1997-01-28 Glucosidase II catalytic subunit; required to trim the final glucose in N-linked glycans; required for normal cell wall synthesis; mutations in rot2 suppress tor2 mutations, and are synthetically lethal with rot1 mutations -S000032215 CDS YBR229C 2 679221 676357 C 2011-02-03 1997-01-28 -S000000434 ORF Verified YBR230C OM14 chromosome 2 2 680050 679549 C 2011-02-03 1997-01-28 Mitochondrial outer membrane receptor for cytosolic ribosomes; integral protein of the outer membrane that interacts with the nascent chain-associated complex (NAC) bound to ribosomes, contributing to co-translational mitochondrial import; interacts with porin (Por1p) and Om45p; abundance is decreased in cells grown in glucose relative to other carbon sources -S000034001 CDS YBR230C 2 679942 679549 C 2011-02-03 1997-01-28 -S000034000 CDS YBR230C 2 680050 680040 C 2011-02-03 1997-01-28 -S000034002 intron YBR230C 2 680039 679943 C 2011-02-03 1997-01-28 -S000029722 ORF Uncharacterized YBR230W-A chromosome 2 2 680362 680562 W 2011-02-03 2004-04-01 Putative protein of unknown function; YBR230W-A has a paralog, COQ8, that arose from the whole genome duplication -S000036857 CDS YBR230W-A 2 680362 680562 W 2011-02-03 2004-04-01 -S000006478 snRNA_gene LSR1 LSR1 U2|snR20 chromosome 2 L000000954 2 681862 680688 C 2011-02-03 2000-05-19|2006-10-04 U2 spliceosomal RNA (U2 snRNA), component of the spliceosome; pairs with the branchpoint sequence; functionally equivalent to mammalian U2 snRNA; stress-induced pseudouridylations at positions 56 and 93 may contribute to regulation of splicing -S000030971 noncoding_exon LSR1 2 681862 680688 C 2011-02-03 2000-05-19|2006-10-04 -S000000435 ORF Verified YBR231C SWC5 AOR1 chromosome 2 L000004001 2 683090 682179 C 2011-02-03 1997-01-28 Component of the SWR1 complex; complex exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia -S000034102 CDS YBR231C 2 683090 682179 C 2011-02-03 1997-01-28 -S000000437 ORF Verified YBR233W PBP2 HEK1 chromosome 2 L000004512 2 683428 684669 W 2011-02-03 1997-01-28 RNA binding protein; has similarity to mammalian heterogeneous nuclear RNP K protein, involved in the regulation of telomere position effect and telomere length; relative distribution to the nucleus increases upon DNA replication stress -S000035244 CDS YBR233W 2 683428 684669 W 2011-02-03 1997-01-28 -S000000436 ORF Dubious YBR232C chromosome 2 2 683732 683373 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034194 CDS YBR232C 2 683732 683373 C 2011-02-03 1997-01-28 -S000007595 ORF Verified YBR233W-A DAD3 chromosome 2 2 684977 685261 W 2011-02-03 2001-02-26 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis -S000037141 CDS YBR233W-A 2 684977 685261 W 2011-02-03 2001-02-26 -S000000438 ORF Verified YBR234C ARC40 chromosome 2 L000004788 2 686592 685438 C 2011-02-03 1997-01-28 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches -S000035293 CDS YBR234C 2 686592 685438 C 2011-02-03 1997-01-28 -S000000439 ORF Verified YBR235W VHC1 chromosome 2 2 686901 690263 W 2011-02-03 1997-01-28 Vacuolar membrane cation-chloride cotransporter (CCC); likely mediates K+ and Cl- cotransport into the vacuole; has a role in potassium homeostasis and salt tolerance; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs); similar to mammalian electroneutral Na(+)-(K+)-C1- cotransporter family -S000035401 CDS YBR235W 2 686901 690263 W 2011-02-03 1997-01-28 -S000000440 ORF Verified YBR236C ABD1 mRNA (guanine-N7)-methyltransferase chromosome 2 L000000011 2 691693 690383 C 2011-02-03 1997-01-28 Methyltransferase; catalyzes the transfer of a methyl group from S-adenosylmethionine to the GpppN terminus of capped mRNA; nuclear protein that relocalizes to the cytosol in response to hypoxia -S000035435 CDS YBR236C 2 691693 690383 C 2011-02-03 1997-01-28 -S000000441 ORF Verified YBR237W PRP5 DEAD-box RNA helicase PRP5|RNA5 chromosome 2 L000001498 2 691969 694518 W 138 2011-02-03 1997-01-28 RNA helicase in the DEAD-box family; necessary for prespliceosome formation, bridges U1 and U2 snRNPs and enables stable U2 snRNP association with intron RNA -S000036392 CDS YBR237W 2 691969 694518 W 2011-02-03 1997-01-28 -S000000442 ORF Verified YBR238C chromosome 2 2 697302 695107 C 2011-02-03 1997-01-28 Mitochondrial membrane protein; not required for respiratory growth but causes a synthetic respiratory defect in combination with rmd9 mutations; transcriptionally up-regulated by TOR; deletion increases life span; YBR238C has a paralog, RMD9, that arose from the whole genome duplication -S000036425 CDS YBR238C 2 697302 695107 C 2011-02-03 1997-01-28 -S000000443 ORF Verified YBR239C ERT1 chromosome 2 2 699943 698354 C 2011-02-03 1997-01-28 Transcriptional regulator; involved in regulation of gluconeogenesis and fermentable carbon utilization; GFP-fusion protein localizes to cytoplasm, nucleus; null mutation affects periodicity of transcriptional and metabolic oscillation; plays role in restricting Ty1 transposition; member of the zinc cluster family of proteins, similar to Rds2p -S000036512 CDS YBR239C 2 699943 698354 C 2011-02-03 1997-01-28 -S000000444 ORF Verified YBR240C THI2 phoF|PHO6 chromosome 2 L000003526 2 701842 700490 C 2011-02-03 1997-01-28 Transcriptional activator of thiamine biosynthetic genes; interacts with regulatory factor Thi3p to control expression of thiamine biosynthetic genes with respect to thiamine availability; acts together with Pdc2p to respond to thiaminediphosphate demand, possibly as related to carbon source availability; zinc finger protein of the Zn(II)2Cys6 type -S000037494 CDS YBR240C 2 701842 700490 C 2011-02-03 1997-01-28 -S000000445 ORF Uncharacterized YBR241C chromosome 2 2 704055 702589 C 2011-02-03 1997-01-28 Putative transporter, member of the sugar porter family; green fluorescent protein (GFP)-fusion protein localizes to the vacuolar membrane; YBR241C is not an essential gene; YBR241C has a paralog, VPS73, that arose from the whole genome duplication -S000037584 CDS YBR241C 2 704055 702589 C 2011-02-03 1997-01-28 -S000118352 ARS ARS222 ARSII-704 chromosome 2 2 704296 704566 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000000446 ORF Uncharacterized YBR242W chromosome 2 L000004757 2 704670 705386 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YBR242W is not an essential gene; YBR242W has a paralog, YGL101W, that arose from the whole genome duplication -S000030457 CDS YBR242W 2 704670 705386 W 2011-02-03 1997-01-28 -S000000447 ORF Verified YBR243C ALG7 UDP-N-acetylglucosamine--dolichyl-phosphate N-acetylglucosaminephosphotransferase|TUR1 chromosome 2 L000000078 2 706793 705447 C 2011-02-03 1997-01-28 UDP-N-acetyl-glucosamine-1-P transferase; transfers Glc-Nac-P from UDP-GlcNac to Dol-P in the ER in the first step of the dolichol pathway of protein asparagine-linked glycosylation; inhibited by tunicamycin; human homolog DPAGT1 can complement yeast ALG7 mutant -S000030493 CDS YBR243C 2 706793 705447 C 2011-02-03 1997-01-28 -S000000448 ORF Verified YBR244W GPX2 glutathione peroxidase GPX2|AMI1 chromosome 2 2 707528 708016 W 2011-02-03 1997-01-28 Phospholipid hydroperoxide glutathione peroxidase; protects cells from phospholipid hydroperoxides and nonphospholipid peroxides during oxidative stress; induced by glucose starvation; protein abundance increases in response to DNA replication stress -S000030605 CDS YBR244W 2 707528 708016 W 2011-02-03 1997-01-28 -S000000449 ORF Verified YBR245C ISW1 chromatin-remodeling ATPase ISW1|SGN2 chromosome 2 L000004447 2 711539 708150 C 2011-02-03 1997-01-28 ATPase subunit of imitation-switch (ISWI) class chromatin remodelers; with Ioc3p forms Isw1a complex involved in repression of transcription initiation; with Ioc2p and Ioc4p forms Isw1b complex involved in regulation of transcription elongation; Isw1b recruited to ORFs by H3K36 methylation and acts with Chd1p to prevent trans-histone exchange over coding regions; Isw1p import into nucleus depends on C-terminal bipartite nuclear targeting signal KRIR X19 KKAK -S000030646 CDS YBR245C 2 711539 708150 C 2011-02-03 1997-01-28 -S000000450 ORF Verified YBR246W RRT2 DPH7|diphthamide synthase|ERE1 chromosome 2 2 711591 712754 W 2011-02-03 1997-01-28 Methylesterase performing penultimate step of diphthamide biosynthesis; hydrolyzes methylated diphthine to produce diphthine and allows Dph6-catalyzed amidation reaction to occur; deletion leads to resistance to sordarin and accumulation of methylatediphthine; WD40 domain-containing protein; involved in endosomal recycling; forms complex with Rtt10p that functions in retromer-mediated pathway for recycling internalized cell-surface proteins -S000030760 CDS YBR246W 2 711591 712754 W 2011-02-03 1997-01-28 -S000000451 ORF Verified YBR247C ENP1 snoRNA-binding rRNA-processing protein ENP1|MEG1 chromosome 2 L000003200|L000001059 2 714455 713004 C 2011-02-03 1997-01-28 Protein associated with U3 and U14 snoRNAs; required for pre-rRNA processing and 40S ribosomal subunit synthesis; localized in the nucleus and concentrated in the nucleolus; human BYSL functionally complements the heat sensitivity of an enp1 ts mutant -S000031591 CDS YBR247C 2 714455 713004 C 2011-02-03 1997-01-28 -S000000452 ORF Verified YBR248C HIS7 imidazoleglycerol-phosphate synthase chromosome 2 L000000784 2 716465 714807 C 146 2011-02-03 1997-01-28 Imidazole glycerol phosphate synthase; glutamine amidotransferase:cyclase that catalyzes the fifth step of histidine biosynthesis and also produces 5-aminoimidazole-4-carboxamide ribotide (AICAR), a purine precursor -S000031672 CDS YBR248C 2 716465 714807 C 2011-02-03 1997-01-28 -S000000453 ORF Verified YBR249C ARO4 3-deoxy-7-phosphoheptulonate synthase ARO4 chromosome 2 L000000119 2 717994 716882 C 2011-02-03 1997-01-28 3-deoxy-D-arabino-heptulosonate-7-phosphate (DAHP) synthase; catalyzes the first step in aromatic amino acid biosynthesis and is feedback-inhibited by tyrosine or high concentrations of phenylalanine or tryptophan; relative distribution to the nucleus increases upon DNA replication stress -S000031774 CDS YBR249C 2 717994 716882 C 2011-02-03 1997-01-28 -S000000454 ORF Verified YBR250W SPO23 chromosome 2 2 719033 720604 W 2011-02-03 1997-01-28 Protein of unknown function; associates with meiosis-specific protein Spo1p -S000033891 CDS YBR250W 2 719033 720604 W 2011-02-03 1997-01-28 -S000000455 ORF Verified YBR251W MRPS5 mitochondrial 37S ribosomal protein MRPS5 chromosome 2 L000001174 2 721390 722313 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit -S000034780 CDS YBR251W 2 721390 722313 W 2011-02-03 1997-01-28 -S000000456 ORF Verified YBR252W DUT1 bifunctional dITP/dUTP diphosphatase chromosome 2 L000000537 2 722611 723054 W 2011-02-03 1997-01-28 Deoxyuridine triphosphate diphosphatase (dUTPase); catalyzes hydrolysis of dUTP to dUMP and PPi, thereby preventing incorporation of uracil into DNA during replication; critical for the maintenance of genetic stability; also has diphosphatase activity on deoxyinosine triphosphate; human homolog DUT allows growth of yeast haploid dut1 null mutant after sporulation of heterozygous diploid -S000034888 CDS YBR252W 2 722611 723054 W 2011-02-03 1997-01-28 -S000000457 ORF Verified YBR253W SRB6 MED22 chromosome 2 L000002053 2 723270 723635 W 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation -S000035009 CDS YBR253W 2 723270 723635 W 2011-02-03 1997-01-28 -S000000458 ORF Verified YBR254C TRS20 TRAPP subunit TRS20 chromosome 2 S000007431 2 724263 723736 C 2011-02-03 1997-01-28 Core component of transport protein particle (TRAPP) complexes I-III; TRAPPs are multimeric guanine nucleotide-exchange factors for GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); mutation leads to defects in endocytic recycling, block in sporulation/meiosis; mutations in human homolog TRAPPC2 cause spondyloepiphyseal dysplasia tarda, TRAPPC2 can complement yeast null mutant -S000035081 CDS YBR254C 2 724263 723736 C 2011-02-03 1997-01-28 -S000000459 ORF Verified YBR255W MTC4 chromosome 2 2 724456 726540 W 2011-02-03 1997-01-28 Protein of unknown function; required for normal growth rate at 15 degrees C; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; mtc4 is synthetically sick with cdc13-1 -S000036028 CDS YBR255W 2 724456 726540 W 2011-02-03 1997-01-28 -S000007649 ORF Uncharacterized YBR255C-A RCF3 chromosome 2 2 727074 726618 C 2011-02-03 2003-12-17|2001-06-26 Putative protein of unknown function; may interact with respiratory chain complexes III (ubiquinol-cytochrome c reductase) or IV (cytochrome c oxidase); identified by sequence comparison with hemiascomycetous yeast species -S000037335 CDS YBR255C-A 2 726917 726618 C 2011-02-03 2003-12-17|2001-06-26 -S000037334 CDS YBR255C-A 2 727074 727012 C 2011-02-03 2003-12-17|2001-06-26 -S000037336 intron YBR255C-A 2 727011 726918 C 2011-02-03 2003-12-17|2001-06-26 -S000000460 ORF Verified YBR256C RIB5 riboflavin synthase chromosome 2 L000001636 2 728102 727386 C 150 2011-02-03 1997-01-28 Riboflavin synthase; catalyzes the last step of the riboflavin biosynthesis pathway -S000036049 CDS YBR256C 2 728102 727386 C 2011-02-03 1997-01-28 -S000000461 ORF Verified YBR257W POP4 RNase P/RNase MRP complex subunit chromosome 2 L000003537 2 728885 729724 W 2011-02-03 1997-01-28 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; binds to the RPR1 RNA subunit in RNase P -S000036225 CDS YBR257W 2 728885 729724 W 2011-02-03 1997-01-28 -S000000462 ORF Verified YBR258C SHG1 CPS15 chromosome 2 2 730162 729734 C 2011-02-03 1997-01-28 Subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3 on lysine 4 and is required in transcriptional silencing near telomeres -S000036263 CDS YBR258C 2 730162 729734 C 2011-02-03 1997-01-28 -S000000463 ORF Verified YBR259W chromosome 2 2 730387 732453 W 2011-02-03 1997-01-28 Protein of unknown function; YBR259W is not an essential gene; forms cytoplasmic foci upon DNA replication stress -S000036998 CDS YBR259W 2 730387 732453 W 2011-02-03 1997-01-28 -S000000464 ORF Verified YBR260C RGD1 chromosome 2 2 734639 732639 C 2011-02-03 1997-01-28 GTPase-activating protein (RhoGAP) for Rho3p and Rho4p; possibly involved in control of actin cytoskeleton organization -S000035993 CDS YBR260C 2 734639 732639 C 2011-02-03 1997-01-28 -S000000465 ORF Verified YBR261C TAE1 N-terminal protein methyltransferase|NTM1 chromosome 2 2 735530 734832 C 2011-02-03 1997-01-28 AdoMet-dependent proline methyltransferase; catalyzes the dimethylation of ribosomal proteins Rpl12 and Rps25 at N-terminal proline residues; has a role in protein synthesis; fusion protein localizes to the cytoplasm -S000037822 CDS YBR261C 2 735530 734832 C 2011-02-03 1997-01-28 -S000000466 ORF Verified YBR262C MIC12 AIM5|MCS12|FMP51 chromosome 2 2 736040 735720 C 2011-02-03 1997-01-28 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; forms a subcomplex with Mic10p and Mic27p whose assembly and stability requires cardiolipin -S000029843 CDS YBR262C 2 736040 735720 C 2011-02-03 1997-01-28 -S000000467 ORF Verified YBR263W SHM1 glycine hydroxymethyltransferase SHM1|TMP3|SHMT1 chromosome 2 L000001883 2 736264 737736 W 2011-02-03 2003-09-22|1997-01-28 Mitochondrial serine hydroxymethyltransferase; converts serine to glycine plus 5,10 methylenetetrahydrofolate; involved in generating precursors for purine, pyrimidine, amino acid, and lipid biosynthesis; reverse reaction generates serine -S000030905 CDS YBR263W 2 736264 737736 W 2011-02-03 2003-09-22|1997-01-28 -S000000468 ORF Verified YBR264C YPT10 Rab family GTPase YPT10 chromosome 2 2 738369 737770 C 2011-02-03 2003-09-22|1997-01-28 Rab family GTP-binding protein; contains the PEST signal sequence specific for proteolytic enzymes; may be involved in vesicular transport; overexpression leads to accumulation of Golgi-like cisternae with budding vesicles -S000030937 CDS YBR264C 2 738369 737770 C 2011-02-03 2003-09-22|1997-01-28 -S000000469 ORF Verified YBR265W TSC10 3-dehydrosphinganine reductase chromosome 2 2 738582 739544 W 2011-02-03 1997-01-28|2011-02-03 3-ketosphinganine reductase; catalyzes the second step in phytosphingosine synthesis; essential for growth in the absence of exogenous dihydrosphingosine or phytosphingosine; localized to lipid droplets; member of short chain dehydrogenase/reductase protein family -S000031091 CDS YBR265W 2 738582 739544 W 2011-02-03 1997-01-28|2011-02-03 -S000000471 ORF Verified YBR267W REI1 chromosome 2 2 739841 741022 W 2011-02-03 1999-04-26|1997-01-28|2011-02-03 Cytoplasmic pre-60S factor; required for the correct recycling of shuttling factors Alb1, Arx1 and Tif6 at the end of the ribosomal large subunit biogenesis; involved in bud growth in the mitotic signaling network -S000032151 CDS YBR267W 2 739841 741022 W 2011-02-03 1999-04-26|1997-01-28|2011-02-03 -S000000470 ORF Dubious YBR266C SLM6 chromosome 2 2 740388 739936 C 2011-02-03 1999-04-26|1997-01-28|2011-02-03 Protein with a potential role in actin cytoskeleton organization; gene exhibits synthetic genetic interaction with MSS4 encoding phosphatidylinositol 4-phosphate kinase -S000031132 CDS YBR266C 2 740388 739936 C 2011-02-03 1999-04-26|1997-01-28|2011-02-03 -S000000472 ORF Verified YBR268W MRPL37 mitochondrial 54S ribosomal protein YmL37|YmL37 chromosome 2 L000001172 2 741299 741616 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit -S000032225 CDS YBR268W 2 741299 741616 W 2011-02-03 1997-01-28 -S000118353 ARS ARS224 ARSII-742 chromosome 2 2 741681 741797 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178053 ARS_consensus_sequence ARS224 2 741742 741726 C 2014-11-18 2014-11-18 -S000000473 ORF Verified YBR269C SDH8 FMP21 chromosome 2 2 742576 742160 C 2011-02-03 2004-01-09|1997-01-28 Protein required for assembly of succinate dehydrogenase; interacts with flavinylated Sdh1p and may function as a chaperone for free Sdh1p, protecting its FAD cofactor from redox reactions before assembly of the complex; soluble protein of the mitochondrial matrix; respiratory defect of null mutant is functionally complemented by Drosophila and human orthologs -S000032252 CDS YBR269C 2 742576 742160 C 2011-02-03 2004-01-09|1997-01-28 -S000000474 ORF Verified YBR270C BIT2 chromosome 2 2 744398 742761 C 2011-02-03 1997-01-28|2011-02-03 Subunit of TORC2 membrane-associated complex; involved in regulation of actin cytoskeletal dynamics during polarized growth and cell wall integrity; interacts with Slm1p and Slm2p, homologous PH domain-containing TORC2 substrates; BIT2 has a paralog, BIT61, that arose from the whole genome duplication -S000031901 CDS YBR270C 2 744398 742761 C 2011-02-03 1997-01-28|2011-02-03 -S000000475 ORF Verified YBR271W EFM2 S-adenosylmethionine-dependent methyltransferase chromosome 2 2 744852 746111 W 2011-02-03 1997-01-28 S-adenosylmethionine-dependent methyltransferase; seven-beta-strand lysine methyltransferase which dimethylates translation elongation factor EF2 (Eft1p and Eft2p) at lysine 613 and methylates EF3 (Yef3p) at lysine 187; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; involved in regulation of translational termination; predicted involvement in ribosome biogenesis -S000032109 CDS YBR271W 2 744852 746111 W 2011-02-03 1997-01-28 -S000000476 ORF Verified YBR272C HSM3 chromosome 2 L000004729 2 747803 746361 C 2011-02-03 1997-01-28 Evolutionarily conserved 19S regulatory particle assembly-chaperone; involved in the assembly of the base subcomplex of the 19S proteasomal regulatory particle (RP); involved in DNA mismatch repair during slow growth; weak similarity to Msh1p; structural study suggests Hsm3p is a scaffold protein for Rpt1p-Rpt2p complex formation; ortholog of human 19S subunit S5b -S000032139 CDS YBR272C 2 747803 746361 C 2011-02-03 1997-01-28 -S000000477 ORF Verified YBR273C UBX7 CUI3 chromosome 2 2 749371 748061 C 2011-02-03 1997-01-28 UBX (ubiquitin regulatory X) domain-containing protein; interacts with Cdc48p; UBX7 has a paralog, UBX6, that arose from the whole genome duplication -S000034143 CDS YBR273C 2 749371 748061 C 2011-02-03 1997-01-28 -S000000478 ORF Verified YBR274W CHK1 serine/threonine protein kinase CHK1 chromosome 2 L000004861 2 749594 751177 W 2011-02-03 1997-01-28 Serine/threonine kinase and DNA damage checkpoint effector; mediates cell cycle arrest via phosphorylation of Pds1p; phosphorylated by checkpoint signal transducer Mec1p; homolog of S. pombe and mammalian Chk1 checkpoint kinase -S000034288 CDS YBR274W 2 749594 751177 W 2011-02-03 1997-01-28 -S000000479 ORF Verified YBR275C RIF1 DNA-binding protein RIF1 chromosome 2 L000001639 2 757106 751356 C 2011-02-03 1997-01-28|2011-02-03 Protein that binds to the Rap1p C-terminus; acts synergistically with Rif2p to help control telomere length and establish telomeric silencing; involved in control of DNA replication; contributes to resection of DNA double strand breaks (DSBs); deletion results in telomere elongation -S000034316 CDS YBR275C 2 757106 751356 C 2011-02-03 1997-01-28|2011-02-03 -S000118354 ARS ARS225 ARSII-757 chromosome 2 2 757437 757667 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication origin of very weak function -S000000480 ORF Verified YBR276C PPS1 tyrosine/serine/threonine protein phosphatase PPS1 chromosome 2 L000003522 2 760043 757620 C 2011-02-03 1997-01-28 Protein phosphatase; has specificity for serine, threonine, and tyrosine residues; has a role in the DNA synthesis phase of the cell cycle -S000034373 CDS YBR276C 2 760043 757620 C 2011-02-03 1997-01-28 -S000000482 ORF Verified YBR278W DPB3 DNA polymerase epsilon noncatalytic subunit chromosome 2 L000000520 2 760294 760899 W 2011-02-03 1997-01-28 Third-largest subunit of DNA polymerase II (DNA polymerase epsilon); required to maintain fidelity of chromosomal replication and also for inheritance of telomeric silencing; stabilizes the interaction of Pol epsilon with primer-template DNA, positively affecting the processivity of the polymerase and exonuclease activities of Pol epsilon; mRNA abundance peaks at the G1/S boundary of the cell cycle; DPB3 has a paralog, DLS1, that arose from the whole genome duplication -S000035459 CDS YBR278W 2 760294 760899 W 2011-02-03 1997-01-28 -S000000481 ORF Dubious YBR277C chromosome 2 2 760616 760215 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YBR278W -S000035356 CDS YBR277C 2 760616 760215 C 2011-02-03 1997-01-28 -S000000483 ORF Verified YBR279W PAF1 chromosome 2 L000002621 2 761257 762594 W 2011-02-03 1997-01-28 Component of the Paf1p complex involved in transcription elongation; binds to and modulates the activity of RNA polymerases I and II; required for expression of a subset of genes, including cell cycle-regulated genes; involved in SER3 repression by helping to maintain SRG1 transcription-dependent nucleosome occupancy; homolog of human PD2/hPAF1 -S000035503 CDS YBR279W 2 761257 762594 W 2011-02-03 1997-01-28 -S000000484 ORF Verified YBR280C SAF1 SCF ubiquitin ligase complex subunit SAF1 chromosome 2 2 764697 762784 C 2011-02-03 2003-09-22|1997-01-28 F-Box protein involved in proteasome-dependent degradation of Aah1p; involved in proteasome-dependent degradation of Aah1p during entry of cells into quiescence; interacts with Skp1 -S000035024 CDS YBR280C 2 764697 762784 C 2011-02-03 2003-09-22|1997-01-28 -S000000485 ORF Verified YBR281C DUG2 glutamine amidotransferase subunit DUG2 chromosome 2 2 767606 764970 C 2011-02-03 1997-01-28 Component of glutamine amidotransferase (GATase II); forms a complex with Dug3p to degrade glutathione (GSH) and other peptides containing a gamma-glu-X bond in an alternative pathway to GSH degradation by gamma-glutamyl transpeptidase (Ecm38p) -S000035219 CDS YBR281C 2 767606 764970 C 2011-02-03 1997-01-28 -S000000486 ORF Verified YBR282W MRPL27 mitochondrial 54S ribosomal protein YmL27|YmL27 chromosome 2 L000002528|L000001167 2 768240 768680 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; homolog of human Bcl-2 interacting protein BMRP -S000036203 CDS YBR282W 2 768240 768680 W 2011-02-03 1997-01-28 -S000000487 ORF Verified YBR283C SSH1 chromosome 2 L000003994 2 770415 768943 C 2011-02-03 1997-01-28 Subunit of the Ssh1 translocon complex; Sec61p homolog involved in co-translational pathway of protein translocation; not essential -S000036248 CDS YBR283C 2 770415 768943 C 2011-02-03 1997-01-28 -S000000488 ORF Uncharacterized YBR284W metallo-dependent hydrolase superfamily protein chromosome 2 2 771239 773632 W 2011-02-03 1997-01-28 Putative metallo-dependent hydrolase superfamily protein; similar to AMP deaminases but lacks key catalytic residues and does not rescue purine nucleotide metabolic defect of quadruple aah1 ade8 amd1 his1 mutant; null mutant exhibits longer telomeres, altered Ty mobility, decreased resistance to rapamycin and wortmannin; induced in response to hydrostatic pressure; not an essential gene; YBR284W has a paralog, YJL070C, that arose from the whole genome duplication -S000036400 CDS YBR284W 2 771239 773632 W 2011-02-03 1997-01-28 -S000000489 ORF Uncharacterized YBR285W chromosome 2 2 773922 774356 W 2011-02-03 1997-01-28|2011-02-03 Putative protein of unknown function; YBR285W is not an essential gene -S000030111 CDS YBR285W 2 773922 774356 W 2011-02-03 1997-01-28|2011-02-03 -S000000490 ORF Verified YBR286W APE3 APY1 chromosome 2 L000000093 2 774700 776313 W 2011-02-03 1997-01-28|2005-11-07 Vacuolar aminopeptidase Y; processed to mature form by Prb1p -S000030229 CDS YBR286W 2 774700 776313 W 2011-02-03 1997-01-28|2005-11-07 -S000000491 ORF Uncharacterized YBR287W ZSP1 chromosome 2 2 776571 777854 W 2011-02-03 1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the ER; YBR287W is not an essential gene -S000030366 CDS YBR287W 2 776571 777854 W 2011-02-03 1997-01-28 -S000000492 ORF Verified YBR288C APM3 YKS6 chromosome 2 L000002758 2 779463 778012 C 2011-02-03 1997-01-28|2011-02-03 Mu3-like subunit of the clathrin associated protein complex (AP-3); functions in transport of alkaline phosphatase to the vacuole via the alternate pathway -S000030452 CDS YBR288C 2 779463 778012 C 2011-02-03 1997-01-28|2011-02-03 -S000000493 ORF Verified YBR289W SNF5 TYE4|SWI10|HAF4 chromosome 2 L000001948 2 779667 782384 W 2011-02-03 1997-01-28|2011-02-03 Subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; functions interdependently in transcriptional activation with Snf2p and Snf6p; relocates to the cytosol under hypoxic conditions -S000031369 CDS YBR289W 2 779667 782384 W 2011-02-03 1997-01-28|2011-02-03 -S000000494 ORF Verified YBR290W BSD2 chromosome 2 L000000194 2 782591 783556 W 2011-02-03 1997-01-28 Heavy metal ion homeostasis protein; facilitates trafficking of Smf1p and Smf2p metal transporters to vacuole where they are degraded; acts as an adaptor protein with Rsp5p in the regulated endocytosis of Smf1p and is itself ubiquitylated by Rsp5p; controls metal ion transport, prevents metal hyperaccumulation, functions in copper detoxification -S000031117 CDS YBR290W 2 782591 783556 W 2011-02-03 1997-01-28 -S000000495 ORF Verified YBR291C CTP1 chromosome 2 L000003310 2 784572 783673 C 2011-02-03 1997-01-28 Mitochondrial inner membrane citrate transporter; member of the mitochondrial carrier family -S000031161 CDS YBR291C 2 784572 783673 C 2011-02-03 1997-01-28 -S000000496 ORF Dubious YBR292C chromosome 2 2 785073 784702 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YBR292C is not an essential gene -S000032196 CDS YBR292C 2 785073 784702 C 2011-02-03 1997-01-28 -S000000497 ORF Verified YBR293W VBA2 chromosome 2 2 787006 788430 W 2011-02-03 1997-01-28 Permease of basic amino acids in the vacuolar membrane -S000032357 CDS YBR293W 2 787006 788430 W 2011-02-03 1997-01-28 -S000000498 ORF Verified YBR294W SUL1 sulfate permease|SFP2 chromosome 2 L000002180 2 789235 791814 W 2011-02-03 1999-04-26|1997-01-28 High affinity sulfate permease of the SulP anion transporter family; sulfate uptake is mediated by specific sulfate transporters Sul1p and Sul2p, which control the concentration of endogenous activated sulfate intermediates -S000032440 CDS YBR294W 2 789235 791814 W 2011-02-03 1999-04-26|1997-01-28 -S000118355 ARS ARS228 ARSII-792 chromosome 2 2 792218 792310 2014-11-18 2014-11-18|2006-08-30|2011-02-03 Autonomously Replicating Sequence -S000000499 ORF Verified YBR295W PCA1 cation-transporting P-type ATPase PCA1|PAY2|CAD2 chromosome 2 L000001347|L000000207 2 792849 796499 W 161 2011-02-03 1997-01-28|2011-02-03 Cadmium transporting P-type ATPase; may also have a role in copper and iron homeostasis; stabilized by Cd binding, which prevents ubiquitination; S288C and other lab strains contain a G970R mutation which eliminates Cd transport function -S000034460 CDS YBR295W 2 792849 796499 W 2011-02-03 1997-01-28|2011-02-03 -S000000500 ORF Verified YBR296C PHO89 ITN1 chromosome 2 2 798522 796798 C 2011-02-03 1997-01-28 Plasma membrane Na+/Pi cotransporter; active in early growth phase; similar to phosphate transporters of Neurospora crassa; transcription regulated by inorganic phosphate concentrations and Pho4p; mutations in related human transporter genes hPit1 and hPit2 are associated with hyperphosphatemia-induced calcification of vascular tissue and familial idiopathic basal ganglia calcification -S000034537 CDS YBR296C 2 798522 796798 C 2011-02-03 1997-01-28 -S000028605 ORF Uncharacterized YBR296C-A chromosome 2 2 800242 800123 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031414 CDS YBR296C-A 2 800242 800123 C 2011-02-03 2003-07-29 -S000000501 ORF Verified YBR297W MAL33 transcription factor MAL33|MALR|MAL3R chromosome 2 L000001016 2 800523 801929 W 2011-02-03 1997-01-28 MAL-activator protein; part of complex locus MAL3; nonfunctional in genomic reference strain S288C -S000034658 CDS YBR297W 2 800523 801929 W 2011-02-03 1997-01-28 -S000000502 ORF Verified YBR298C MAL31 maltose permease|MALT|MAL3T chromosome 2 L000001014 2 804475 802631 C 2011-02-03 1997-01-28 Maltose permease; high-affinity maltose transporter (alpha-glucoside transporter); encoded in the MAL3 complex locus; member of the 12 transmembrane domain superfamily of sugar transporters; functional in genomic reference strain S288C -S000034677 CDS YBR298C 2 804475 802631 C 2011-02-03 1997-01-28 -S000028606 ORF Uncharacterized YBR298C-A chromosome 2 2 805256 805035 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031416 CDS YBR298C-A 2 805256 805035 C 2011-02-03 2003-07-29 -S000000503 ORF Verified YBR299W MAL32 alpha-glucosidase MAL32|MALS|MAL3S chromosome 2 L000001015 2 805351 807105 W 2011-02-03 1997-01-28 Maltase (alpha-D-glucosidase); inducible protein involved in maltose catabolism; encoded in the MAL3 complex locus; functional in genomic reference strain S288C; hydrolyzes the disaccharides maltose, turanose, maltotriose, and sucrose -S000035668 CDS YBR299W 2 805351 807105 W 2011-02-03 1997-01-28 -S000000505 ORF Verified YBR301W PAU24 seripauperin PAU24|DAN3 chromosome 2 2 809057 809419 W 2011-02-03 1997-01-28 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; member of the seripauperin multigene family encoded mainly in subtelomeric regions; expressed under anaerobic conditions, completely repressed during aerobic growth -S000033172 CDS YBR301W 2 809057 809419 W 2011-02-03 1997-01-28 -S000000504 ORF Dubious YBR300C chromosome 2 2 809097 808600 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YBR301W; YBR300C is not an essential gene -S000033026 CDS YBR300C 2 809097 808600 C 2011-02-03 1997-01-28 -S000000506 ORF Verified YBR302C COS2 chromosome 2 L000004716 2 811479 810340 C 2011-02-03 1997-01-28 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000033196 CDS YBR302C 2 811479 810340 C 2011-02-03 1997-01-28 -S000028940 telomere TEL02R chromosome 2 2 812379 813184 W 166 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome II; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028941 telomeric_repeat TEL02R 2 813138 813184 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome II -S000028942 X_element TEL02R 2 812379 812848 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome II; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028943 X_element_combinatorial_repeat TEL02R 2 812849 813137 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr II; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000029654 ORF Verified R0010W FLP1 2-micron L000000619 2-micron 252 1523 W 2006-10-06 2004-02-11 Site-specific recombinase encoded on the 2-micron plasmid; required for 2-micron plasmid propagation as part of a plasmid amplification system that compensates for any copy number decreases caused by missegregation events -S000119086 CDS R0010W 2-micron 252 1523 W 2006-10-06 2004-02-11 -S000029675 ORF Verified R0020C REP1 2-micron L000001611 2-micron 3008 1887 C 2006-10-06 2004-02-11 Master regulator that regulates transcript levels of the FLP1 gene; acts in concert with Rep2p to regulate transcript levels of the FLP1 gene that promotes plasmid copy amplification and 2-micron plasmid-inheritance; also autoregulates levels of its own transcript; both Rep1p and Rep2p are sumoylated which is important for function -S000119087 CDS R0020C 2-micron 3008 1887 C 2006-10-06 2004-02-11 -S000029674 ORF Verified R0030W RAF1 2-micron S000007507 2-micron 3271 3816 W 2006-10-06 2004-02-11 Anti-repressor that increases 2 micron plasmid copy number; increases 2 micron plasmid copy number by relieving repression of the FLP1 site-specific recombinase caused by the Rep1-Rep2p trascription regulator; also itself repressed by the Rep1p-Rep2p complex -S000119088 CDS R0030W 2-micron 3271 3816 W 2006-10-06 2004-02-11 -S000029676 ORF Verified R0040C REP2 2-micron L000001612 2-micron 6198 5308 C 2006-10-06 2004-02-11 Master regulator that regulates transcript levels of the FLP1 gene; acts in concert with Rep1p to regulate transcript levels of the FLP1 gene that promotes plasmid copy amplification and 2-micron plasmid-inheritance; also autoregulates levels of its own transcript; required for Rep1p stability; both Rep1p and Rep2p are sumoylated which is important for function -S000119089 CDS R0040C 2-micron 6198 5308 C 2006-10-06 2004-02-11 -S000028476 ARS ARS300 ARS300 chromosome 3 3 989 1068 2014-11-18 2003-03-31|2014-11-18 Autonomously Replicating Sequence -S000030118 ARS_consensus_sequence ARS300 3 1060 1050 C 2003-03-31 2003-03-31 -S000028871 telomere TEL03L chromosome 3 3 1098 1 C -50 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome III; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats -S000028872 telomeric_repeat TEL03L 3 360 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome III -S000028873 X_element TEL03L 3 1098 640 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome III; contains an ARS consensus sequence and an Abf1p binding site -S000028874 X_element_combinatorial_repeat TEL03L 3 639 361 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr III; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000006828 long_terminal_repeat YCLWomega1 chromosome 3 3 1179 1429 W 2000-09-13 2000-05-19 Ty5 LTR -S000006831 LTR_retrotransposon YCLWTy5-1 Ty5 chromosome 3 3 1179 4322 W 2000-09-13 2000-05-19 Ty5 element, LTR retrotransposon of the Copia (Pseudoviridae) group; this is the only near-full length Ty5 retrotransposon in S288C and it is non-functional -S000000581 ORF Dubious YCL076W chromosome 3 3 1392 2135 W 2000-09-13 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034360 CDS YCL076W 3 1392 2135 W 2000-09-13 2000-09-13|1997-01-28 -S000000580 pseudogene YCL075W chromosome 3 3 2126 2566 W 2000-09-13 1997-01-28 Pseudogene: encodes fragment of Ty Pol protein -S000033443 CDS YCL075W 3 2126 2566 W 2000-09-13 1997-01-28 -S000000579 pseudogene YCL074W chromosome 3 3 2824 3750 W 2000-09-13 2000-09-13|1997-01-28 Pseudogene: encodes fragment of Ty Pol protein -S000033352 CDS YCL074W 3 2824 3750 W 2000-09-13 2000-09-13|1997-01-28 -S000006829 long_terminal_repeat YCLWomega2 chromosome 3 3 4073 4322 W 2000-09-13 2000-05-19 Ty5 LTR -S000000575 ORF Verified YCL073C GEX1 glutathione exchanger chromosome 3 3 8326 6479 C 2000-09-13 2000-09-13|1997-01-28 Proton:glutathione antiporter; localized to the vacuolar and plasma membranes; imports glutathione from the vacuole and exports it through the plasma membrane; has a role in resistance to oxidative stress and modulation of the PKA pathway; GEX1 has a paralog, GEX2, that arose from a segmental duplication -S000033250 CDS YCL073C 3 8326 6479 C 2000-09-13 2000-09-13|1997-01-28 -S000000574 ORF Verified YCL069W VBA3 basic amino acid transporter chromosome 3 3 9706 11082 W 2000-09-13 1997-01-28 Permease of basic amino acids in the vacuolar membrane; VBA3 has a paralog, VBA5, that arose from a segmental duplication -S000031320 CDS YCL069W 3 9706 11082 W 2000-09-13 1997-01-28 -S000028477 ARS ARS301 ARS301 HML-E ARS chromosome 3 3 11146 11401 2003-03-31 2003-03-31 Inactive replication origin linked to the silent mating type locus HML; functions as a transcriptional silencer -S000030120 ARS_consensus_sequence ARS301 3 11257 11267 W 2003-03-31 2003-03-31 -S000029214 silent_mating_type_cassette_array silenced_gene HML HML chromosome 3 L000000791 3 11146 14849 W -49 2007-12-10 2007-12-10 Mating type cassette - left; unexpressed complete copy of the mating-type genes, silenced by the Sir2 histone deacetylase and its associated SIR1, SIR3 and SIR4 proteins; mating-type switching involves replacement of the Ya or Yalpha sequences present at the MAT locus with either the a or alpha genes located at one of the HM loci in a process stimulated by the HO endonuclease; sequence replacement occurs by gene conversion, leaving the donor unaltered -S000124942 W_region HML 3 11509 12238 W 2007-12-10 2007-12-10 -S000124943 X_region HML 3 12239 12943 W 2007-12-10 2007-12-10 -S000124944 Y_region HML 3 12944 13690 W 2007-12-10 2007-12-10 -S000124945 Z1_region HML 3 13691 13929 W 2007-12-10 2007-12-10 -S000124946 Z2_region HML 3 13930 14017 W 2007-12-10 2007-12-10 -S000000573 ORF Uncharacterized YCL068C chromosome 3 3 12285 11503 C 2000-09-13 2000-09-13|1997-01-28 Putative protein of unknown function -S000031134 CDS YCL068C 3 12285 11503 C 2000-09-13 2000-09-13|1997-01-28 -S000000572 ORF Verified|silenced_gene YCL067C HMLALPHA2 homeodomain mating type protein alpha2|ALPHA2 chromosome 3 3 13018 12386 C 2000-09-13 1997-01-28 Silenced copy of ALPHA2 at HML; homeobox-domain protein that associates with Mcm1p in haploid cells to repress a-specific gene expression and interacts with a1p in diploid cells to repress haploid-specific gene expression -S000030191 CDS YCL067C 3 13018 12386 C 2000-09-13 1997-01-28 -S000000571 ORF Verified|silenced_gene YCL066W HMLALPHA1 transcriptional co-activator mating type protein alpha|ALPHA1 chromosome 3 3 13282 13809 W 2000-09-13 1997-01-28 Silenced copy of ALPHA1 at HML; ALPHA1 encodes a transcriptional coactivator involved in the regulation of mating-type alpha-specific gene expression -S000030081 CDS YCL066W 3 13282 13809 W 2000-09-13 1997-01-28 -S000000570 ORF Dubious YCL065W chromosome 3 3 13751 14119 W 2000-09-13 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps HMLALPHA1 -S000029969 CDS YCL065W 3 13751 14119 W 2000-09-13 2000-09-13|1997-01-28 -S000028478 ARS ARS302 ARS302 HML-I ARS chromosome 3 3 14575 14849 2003-03-31 2003-03-31 Inactive replication origin linked to the silent mating type locus HML; functions as a transcriptional silencer -S000030152 ARS_consensus_sequence ARS302 3 14701 14711 W 2003-03-31 2003-03-31 -S000028479 ARS ARS303 ARS303 chromosome 3 3 14871 15213 2003-03-31 2003-03-31 Autonomously Replicating Sequence on Chromosome III; inactive as replication origin at native locus near HML -S000030154 ARS_consensus_sequence ARS303 3 15196 15186 C 2003-03-31 2003-03-31 -S000028480 ARS ARS320 ARS320 chromosome 3 3 15214 16274 2003-03-31 2003-03-31 Autonomously Replicating Sequence on Chromosome III; inactive as replication origin at native locus near HML -S000030156 ARS_consensus_sequence ARS320 3 15298 15308 W 2003-03-31 2003-03-31 -S000000569 ORF Verified YCL064C CHA1 L-serine/L-threonine ammonia-lyase CHA1 chromosome 3 L000000316 3 16880 15798 C -46 2000-09-13 2000-09-13|1997-01-28 Catabolic L-serine (L-threonine) deaminase; catalyzes the degradation of both L-serine and L-threonine; required to use serine or threonine as the sole nitrogen source, transcriptionally induced by serine and threonine -S000037243 CDS YCL064C 3 16880 15798 C 2000-09-13 2000-09-13|1997-01-28 -S000000568 ORF Verified YCL063W VAC17 YCL062W chromosome 3 3 17290 18561 W 2000-09-13 2000-09-13|1997-01-28 Phosphoprotein involved in vacuole inheritance; degraded in late M phase of the cell cycle; acts as a vacuole-specific receptor for myosin Myo2p; involved in regulation of asymmetric inheritance of aggregated/misfolded proteins and age reset -S000037206 CDS YCL063W 3 17290 18561 W 2000-09-13 2000-09-13|1997-01-28 -S000000566 ORF Verified YCL061C MRC1 chromatin-modulating protein MRC1|YCL060C chromosome 3 3 22106 18816 C 2000-09-13 2000-09-13|1997-01-28 S-phase checkpoint protein required for DNA replication; couples DNA helicase and polymerase; interacts with and stabilizes Pol2p at stalled replication forks during stress, where it forms a pausing complex with Tof1p and is phosphorylated by Mec1p; defines a novel S-phase checkpoint with Hog1p that coordinates DNA replication and transcription upon osmostress; protects uncapped telomeres; Dia2p-dependent degradation mediates checkpoint recovery; mammalian claspin homolog -S000036990 CDS YCL061C 3 22106 18816 C 2000-09-13 2000-09-13|1997-01-28 -S000000564 ORF Verified YCL059C KRR1 ribosome biosynthesis protein KRR1 chromosome 3 L000004098 3 23379 22429 C 2000-09-13 1997-01-28 Nucleolar protein required for rRNA synthesis and ribosomal assembly; required for the synthesis of 18S rRNA and for the assembly of 40S ribosomal subunit; essential gene -S000034984 CDS YCL059C 3 23379 22429 C 2000-09-13 1997-01-28 -S000028518 ORF Verified YCL058W-A ADF1 chromosome 3 3 23584 23925 W 2006-01-11 2003-07-29|2006-01-11 Transcriptional repressor encoded by the FYV5 antisense strand; negatively regulates transcription of FYV5 by binding to the promoter on the sense strand -S000030294 CDS YCL058W-A 3 23584 23925 W 2006-01-11 2003-07-29|2006-01-11 -S000000563 ORF Verified YCL058C FYV5 MDF1 chromosome 3 3 23981 23523 C 2000-09-13 1997-01-28 Protein involved in regulation of the mating pathway; binds with Matalpha2p to promoters of haploid-specific genes; required for survival upon exposure to K1 killer toxin; involved in ion homeostasis -S000034080 CDS YCL058C 3 23981 23523 C 2000-09-13 1997-01-28 -S000007547 ORF Verified YCL057C-A MIC10 MOS1|MCS10|MIO10 chromosome 3 3 24325 24032 C 2000-09-14 2000-09-14 Conserved component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; forms a subcomplex with Mic12p and Mic27p whose assembly and stability requires cardiolipin; homo-oligomers cause membrane bending; ortholog of human MINOS1 -S000037065 CDS YCL057C-A 3 24325 24032 C 2000-09-14 2000-09-14 -S000000562 ORF Verified YCL057W PRD1 metalloendopeptidase chromosome 3 L000003155 3 24768 26906 W 2000-09-13 1997-01-28 Zinc metalloendopeptidase; found in the cytoplasm and intermembrane space of mitochondria; with Cym1p, involved in degradation of mitochondrial proteins and of presequence peptides cleaved from imported proteins; protein abundance increases in response to DNA replication stress -S000034023 CDS YCL057W 3 24768 26906 W 2000-09-13 1997-01-28 -S000000561 ORF Verified YCL056C PEX34 chromosome 3 3 27359 26925 C 2000-09-13 1997-01-28 Protein that regulates peroxisome populations; peroxisomal integral membrane protein; interacts with Pex11p, Pex25p, and Pex27p to control both constitutive peroxisome division and peroxisome morphology and abundance during peroxisome proliferation -S000033789 CDS YCL056C 3 27359 26925 C 2000-09-13 1997-01-28 -S000000560 ORF Verified YCL055W KAR4 chromosome 3 L000003481 3 27929 28936 W 2000-09-13 1997-01-28 Transcription factor required for response to pheromones; also required during meiosis; exists in two forms, a slower-migrating form more abundant during vegetative growth and a faster-migrating form induced by pheromone -S000033110 CDS YCL055W 3 27929 28936 W 2000-09-13 1997-01-28 -S000028481 ARS ARS304 ARS304 chromosome 3 3 30200 30657 2003-03-31 2003-03-31 Autonomously Replicating Sequence on Chromosome III -S000030159 ARS_consensus_sequence ARS304 3 30439 30429 C 2003-03-31 2003-03-31 -S000178054 ORF Uncharacterized YCL054W-A RDT1 chromosome 3 3 30910 30996 W 2014-11-18 2014-11-18 Short open reading frame, shows evidence of translation; may be new protein-coding gene that originated de novo from noncoding sequence; same allele found in at least 33 other S. cerevisiae strains; at least 3 strains have a second allele with three nucleotide substitutions leading to two amino acid differences -S000178055 CDS YCL054W-A 3 30910 30996 W 2014-11-18 2014-11-18 -S000000559 ORF Verified YCL054W SPB1 27S pre-rRNA (guanosine2922-2'-O)-methyltransferase chromosome 3 L000001990 3 31449 33974 W 2000-09-13 1999-07-17|1997-01-28 AdoMet-dependent methyltransferase; involved in rRNA processing and 60S ribosomal subunit maturation; methylates G2922 in the tRNA docking site of the large subunit rRNA and in the absence of snR52, U2921; suppressor of PAB1 mutants -S000033016 CDS YCL054W 3 31449 33974 W 2000-09-13 1999-07-17|1997-01-28 -S000000557 ORF Verified YCL052C PBN1 chromosome 3 L000003219 3 35393 34143 C 2000-09-13 1997-01-28 Component of glycosylphosphatidylinositol-mannosyltransferase I; essential component; required for the autocatalytic post-translational processing of the protease B precursor Prb1p; localizes to ER in lumenal orientation; homolog of mammalian PIG-X -S000031965 CDS YCL052C 3 35393 34143 C 2000-09-13 1997-01-28 -S000000556 ORF Verified YCL051W LRE1 chromosome 3 L000003355 3 35865 37616 W 2000-09-13 2000-09-13|1997-01-28 Protein involved in control of cell wall structure and stress response; direct inhibitor of the nuclear Dbf2 related (NDR) kinase Cbk1p-Mob2p; overproduction confers resistance to cell-wall degrading enzymes; exhibits genetic interactions with genes involved in the cell wall integrity pathway; LRE1 has a paralog, HLR1, that arose from the whole genome duplication -S000031923 CDS YCL051W 3 35865 37616 W 2000-09-13 2000-09-13|1997-01-28 -S000000555 ORF Verified YCL050C APA1 bifunctional AP-4-A phosphorylase/ADP sulfurylase|DTP1 chromosome 3 L000000090 3 38801 37836 C -33 2000-09-13 2000-09-13|1997-01-28 AP4A phosphorylase; bifunctional diadenosine 5',5'''-P1,P4-tetraphosphate phosphorylase and ADP sulfurylase involved in catabolism of bis(5'-nucleosidyl) tetraphosphates; catalyzes phosphorolysis of dinucleoside oligophosphates, cleaving substrates' alpha/beta-anhydride bond and introducing Pi into the beta-position of the corresponding NDP formed; protein abundance increases under DNA replication stress; APA1 has a paralog, APA2, that arose from the whole genome duplication -S000031713 CDS YCL050C 3 38801 37836 C 2000-09-13 2000-09-13|1997-01-28 -S000028482 ARS ARS305 ARS305 chromosome 3 3 39508 39595 2014-11-18 2003-03-31|2014-11-18 Efficient early-firing replication origin on Chromosome III -S000030162 ARS_consensus_sequence ARS305 3 39589 39579 C 2003-03-31 2003-03-31 -S000000554 ORF Uncharacterized YCL049C chromosome 3 3 40724 39786 C 2000-09-13 2000-09-13|1997-01-28 Protein of unknown function; localizes to membrane fraction; YCL049C is not an essential gene -S000031529 CDS YCL049C 3 40724 39786 C 2000-09-13 2000-09-13|1997-01-28 -S000087203 ORF Uncharacterized YCL048W-A chromosome 3 3 41488 41727 W 2005-11-14 2005-11-14 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole; YCL048W-A has a paralog, YDR524C-B, that arose from the whole genome duplication -S000087204 CDS YCL048W-A 3 41488 41727 W 2005-11-14 2005-11-14 -S000000553 ORF Verified YCL048W SPS22 chromosome 3 3 42165 43556 W 2000-09-13 1997-01-28 Protein of unknown function; SPS22 has a paralog, SPS2, that arose from the whole genome duplication; redundant with Sps2p for the organization of the beta-glucan layer of the spore wall -S000031494 CDS YCL048W 3 42165 43556 W 2000-09-13 1997-01-28 -S000000552 ORF Verified YCL047C POF1 nicotinamide-nucleotide adenylyltransferase chromosome 3 3 44437 43661 C 2000-09-13 1997-01-28 Nicotinamide mononucleotide-specific adenylyltransferase (NMNAT); catalyzes the conversion of nicotinamide mononucleotide (NMN) to nicotinamide adenine dinucleotide (NAD+); role in the nicotinamide riboside (NR) salvage pathway of NAD+ biosynthesis; involved in NR and NAD+ homeostasis; ATPase involved in protein quality control and filamentation pathways; interacts physically with Kss1p and suppresses the filamentation defect of a kss1 deletion -S000030504 CDS YCL047C 3 44437 43661 C 2000-09-13 1997-01-28 -S000000551 ORF Dubious YCL046W chromosome 3 3 46640 46963 W 2000-09-13 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YCL045C -S000030444 CDS YCL046W 3 46640 46963 W 2000-09-13 1997-01-28 -S000000550 ORF Verified YCL045C EMC1 chromosome 3 3 46905 44623 C 2000-09-13 1997-01-28 Member of conserved endoplasmic reticulum membrane complex; involved in efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; interacts with Gal80p; homologous to worm H17B01.4/EMC-1, fly CG2943, and human KIAA0090 -S000030200 CDS YCL045C 3 46905 44623 C 2000-09-13 1997-01-28 -S000000549 ORF Verified YCL044C MGR1 chromosome 3 3 48364 47111 C 2000-09-13 1997-01-28 Subunit of the mitochondrial (mt) i-AAA protease supercomplex; i-AAA degrades misfolded mitochondrial proteins; forms a subcomplex with Mgr3p that binds to substrates to facilitate proteolysis; required for growth of cells lacking mtDNA -S000037468 CDS YCL044C 3 48364 47111 C 2000-09-13 1997-01-28 -S000000548 ORF Verified YCL043C PDI1 protein disulfide isomerase PDI1|TRG1|MFP1 chromosome 3 L000001360 3 50221 48653 C 2000-09-13 1997-01-28 Protein disulfide isomerase; multifunctional oxidoreductase of the ER lumen, essential for disulfide bond formation in secretory and cell-surface proteins, processing of non-native disulfide bonds; Ero1p activator; complexes with exomannosidase, Mnl1p to facilitate the recognition of misfolded glycoproteins and the trimming of glycan Man8GlcNAc2 to Man7GlcNAc2 on substrates, thereby accelerating ERAD; PDI1 has a paralog, EUG1, that arose from the whole genome duplication -S000037357 CDS YCL043C 3 50221 48653 C 2000-09-13 1997-01-28 -S000000547 ORF Uncharacterized YCL042W chromosome 3 3 50584 50943 W 2000-09-13 2000-09-13|1997-01-28 Putative protein of unknown function; epitope-tagged protein localizes to the cytoplasm -S000037297 CDS YCL042W 3 50584 50943 W 2000-09-13 2000-09-13|1997-01-28 -S000000546 ORF Dubious YCL041C chromosome 3 3 50627 50133 C 2000-09-13 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps both the verified gene PDI1/YCL043C and the uncharacterized gene YCL042W -S000036569 CDS YCL041C 3 50627 50133 C 2000-09-13 1997-01-28 -S000000545 ORF Verified YCL040W GLK1 glucokinase|HOR3 chromosome 3 L000000708 3 50838 52340 W -47 2000-09-13 1997-01-28 Glucokinase; catalyzes the phosphorylation of glucose at C6 in the first irreversible step of glucose metabolism; one of three glucose phosphorylating enzymes; expression regulated by non-fermentable carbon sources; GLK1 has a paralog, EMI2, that arose from the whole genome duplication -S000036534 CDS YCL040W 3 50838 52340 W 2000-09-13 1997-01-28 -S000000544 ORF Verified YCL039W GID7 glucose-induced degradation complex subunit GID7|MOH2 chromosome 3 3 52645 54882 W 2000-09-13 1999-07-17|1997-01-28 Subunit of GID Complex that binds directly to central component Vid30p; GID complex is involved in proteasome-dependent catabolite inactivation of fructose-1,6-bisphosphatase; Gid7p contains six WD40 repeats; computational analysis suggests that Gid7p and Moh1p have similar functions -S000035505 CDS YCL039W 3 52645 54882 W 2000-09-13 1999-07-17|1997-01-28 -S000000543 ORF Verified YCL038C ATG22 AUT4 chromosome 3 L000004750 3 56527 54941 C 2000-09-13 1997-01-28 Vacuolar integral membrane protein required for efflux of amino acids; required for efflux of amino acids during autophagic body breakdown in the vacuole; null mutation causes a gradual loss of viability during starvation -S000034405 CDS YCL038C 3 56527 54941 C 2000-09-13 1997-01-28 -S000000542 ORF Verified YCL037C SRO9 chromosome 3 L000003106 3 58678 57374 C 2003-09-22 2003-09-22|1997-01-28 Cytoplasmic RNA-binding protein; shuttles between nucleus and cytoplasm and is exported from the nucleus in an mRNA export-dependent manner; associates with translating ribosomes; involved in heme regulation of Hap1p as a component of the HMC complex, also involved in the organization of actin filaments; contains a La motif; SRO9 has a paralog, SLF1, that arose from the whole genome duplication -S000034295 CDS YCL037C 3 58678 57374 C 2003-09-22 2003-09-22|1997-01-28 -S000000541 ORF Verified YCL036W GFD2 YCD6 chromosome 3 L000004631 3 59026 60726 W 2000-09-13 1997-01-28 Protein of unknown function; identified as a high-copy suppressor of a dbp5 mutation; GFD2 has a paralog, YDR514C, that arose from the whole genome duplication -S000034257 CDS YCL036W 3 59026 60726 W 2000-09-13 1997-01-28 -S000000540 ORF Verified YCL035C GRX1 dithiol glutaredoxin GRX1 chromosome 3 3 61173 60841 C 2000-09-13 1997-01-28 Glutathione-dependent disulfide oxidoreductase; hydroperoxide and superoxide-radical responsive, heat-stable, with active site cysteine pair; protects cells from oxidative damage; GRX1 has a paralog, GRX2, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000033290 CDS YCL035C 3 61173 60841 C 2000-09-13 1997-01-28 -S000000539 ORF Verified YCL034W LSB5 chromosome 3 3 61658 62722 W 2000-09-13 2000-09-13|1997-01-28 Protein involved in membrane-trafficking events at plasma membrane; interacts with actin regulators Sla1p and Las17p, ubiquitin, Arf3p to couple actin dynamics to membrane trafficking processes; similar structure to GGA family of proteins with N-terminal VHS domain and GAT domain; binds Las17p, which is homolog of human Wiskott-Aldrich Syndrome protein involved in actin patch assembly, actin polymerization; may mediate disassembly of Pan1 complex from endocytic coat -S000033272 CDS YCL034W 3 61658 62722 W 2000-09-13 2000-09-13|1997-01-28 -S000000538 ORF Verified YCL033C MXR2 MSRB chromosome 3 3 63282 62776 C 2000-09-13 1997-01-28 Methionine-R-sulfoxide reductase; involved in the response to oxidative stress; protects iron-sulfur clusters from oxidative inactivation along with MXR1; involved in the regulation of lifespan -S000033176 CDS YCL033C 3 63282 62776 C 2000-09-13 1997-01-28 -S000000537 ORF Verified YCL032W STE50 chromosome 3 L000002125 3 63441 64481 W -22 2000-09-13 1997-01-28 Adaptor protein for various signaling pathways; involved in mating response, invasive/filamentous growth, osmotolerance; acts as an adaptor that links G protein-associated Cdc42p-Ste20p complex to the effector Ste11p to modulate signal transduction -S000033154 CDS YCL032W 3 63441 64481 W 2000-09-13 1997-01-28 -S000000536 ORF Verified YCL031C RRP7 chromosome 3 L000004251 3 65568 64675 C 2000-09-13 1997-01-28 Essential protein involved in rRNA processing and ribosome biogenesis; protein abundance increases in response to DNA replication stress -S000032244 CDS YCL031C 3 65568 64675 C 2000-09-13 1997-01-28 -S000000535 ORF Verified YCL030C HIS4 trifunctional histidinol dehydrogenase/phosphoribosyl-AMP cyclohydrolase/phosphoribosyl-ATP diphosphatase chromosome 3 L000000781 3 68333 65934 C -22 2000-09-13 2000-09-13|1997-01-28 Multifunctional enzyme containing phosphoribosyl-ATP pyrophosphatase; phosphoribosyl-AMP cyclohydrolase, and histidinol dehydrogenase activities; catalyzes the second, third, ninth and tenth steps in histidine biosynthesis -S000032161 CDS YCL030C 3 68333 65934 C 2000-09-13 2000-09-13|1997-01-28 -S000000534 ORF Verified YCL029C BIK1 PAC14|ARM5 chromosome 3 L000000178 3 69921 68599 C -21 2000-09-13 2000-09-13|1997-01-28 Microtubule-associated protein; component of the interface between microtubules and kinetochore, involved in sister chromatid separation; essential in polyploid cells but not in haploid or diploid cells; ortholog of mammalian CLIP-170 -S000031278 CDS YCL029C 3 69921 68599 C 2000-09-13 2000-09-13|1997-01-28 -S000000533 ORF Verified YCL028W RNQ1 prion domain-containing protein RNQ1|[PIN(+)] chromosome 3 S000007471 3 70150 71367 W 2000-09-13 2000-09-13|1997-01-28 [PIN(+)] prion; an infectious protein conformation that is generally an ordered protein aggregate -S000031217 CDS YCL028W 3 70150 71367 W 2000-09-13 2000-09-13|1997-01-28 -S000000532 ORF Verified YCL027W FUS1 chromosome 3 L000000653 3 71803 73341 W -21 2000-09-13 2000-09-13|1997-01-28 Membrane protein localized to the shmoo tip; required for cell fusion; expression regulated by mating pheromone; proposed to coordinate signaling, fusion, and polarization events required for fusion; potential Cdc28p substrate -S000031087 CDS YCL027W 3 71803 73341 W 2000-09-13 2000-09-13|1997-01-28 -S000007548 ORF Verified YCL026C-B HBN1 putative nitroreductase|YCL027C-A chromosome 3 3 73986 73405 C 2000-09-14 2000-09-14 Protein of unknown function; similar to bacterial nitroreductases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; protein becomes insoluble upon intracellular iron depletion; protein abundance increases in response to DNA replication stress -S000037064 CDS YCL026C-B 3 73986 73405 C 2000-09-14 2000-09-14 -S000028483 ARS ARS306 ARS306 chromosome 3 3 74458 74677 2003-03-31 2003-03-31 Early-firing autonomously replicating sequence on Chromosome III -S000030165 ARS_consensus_sequence ARS306 3 74521 74531 W 2003-03-31 2003-03-31 -S000000589 ORF Verified YCL026C-A FRM2 type II nitroreductase|YCLX08C chromosome 3 L000004082 3 75285 74704 C 2000-09-13 2000-09-13|1997-01-28 Type II nitroreductase, using NADH as reductant; mutants are defective in fatty acid mediated repression of genes involved in fatty acid biosynthesis indicative of a role in lipid signaling; involved in the oxidative stress response; transcription induction by cadmium and selenite indicates a possible role in the metal stress response; expression induced in cells treated with the mycotoxin patulin -S000032741 CDS YCL026C-A 3 75285 74704 C 2000-09-13 2000-09-13|1997-01-28 -S000000530 ORF Verified YCL025C AGP1 amino acid transporter AGP1|YCC5 chromosome 3 L000003271 3 77919 76018 C 2006-01-12 2000-09-13|1997-01-28|2006-01-12 Low-affinity amino acid permease with broad substrate range; involved in uptake of asparagine, glutamine, and other amino acids; expression regulated by SPS plasma membrane amino acid sensor system (Ssy1p-Ptr3p-Ssy5p); AGP1 has a paralog, GNP1, that arose from the whole genome duplication -S000029928 CDS YCL025C 3 77919 76018 C 2006-01-12 2000-09-13|1997-01-28|2006-01-12 -S000000529 ORF Verified YCL024W KCC4 serine/threonine protein kinase chromosome 3 3 79162 82275 W 2006-01-12 2000-09-13|1997-01-28 Protein kinase of the bud neck involved in the septin checkpoint; associates with septin proteins, negatively regulates Swe1p by phosphorylation, shows structural homology to bud neck kinases Gin4p and Hsl1p; KCC4 has a paralog, GIN4, that arose from the whole genome duplication -S000029873 CDS YCL024W 3 79162 82275 W 2006-01-12 2000-09-13|1997-01-28 -S000000528 ORF Dubious YCL023C chromosome 3 3 79296 78949 C 2006-01-12 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF KCC4 -S000037128 CDS YCL023C 3 79296 78949 C 2006-01-12 1997-01-28 -S000000527 ORF Dubious YCL022C chromosome 3 3 82085 81570 C 2006-01-12 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene KCC4/YCL024W -S000037053 CDS YCL022C 3 82085 81570 C 2006-01-12 2000-09-13|1997-01-28 -S000006549 tRNA_gene tE(UUC)C chromosome 3 L000003760 3 82533 82462 C 2006-01-12 2000-05-19 Glutamine tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000035973 noncoding_exon tE(UUC)C 3 82533 82462 C 2006-01-12 2000-05-19 -S000126593 long_terminal_repeat YCLWdelta15 chromosome 3 3 82700 83036 W 2008-06-04 2008-06-04 Ty1 LTR -S000006822 long_terminal_repeat YCLCdelta1 chromosome 3 3 83194 83055 C 2007-04-02 2000-05-19|2007-04-02 Ty1 LTR -S000007549 ORF Uncharacterized YCL021W-A chromosome 3 3 83620 83997 W 2006-01-12 2000-09-14 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the vacuole -S000037066 CDS YCL021W-A 3 83620 83997 W 2006-01-12 2000-09-14 -S000006823 long_terminal_repeat YCLWdelta2a chromosome 3 3 84069 84294 W 2006-01-12 2000-05-19 Ty1 LTR -S000006825 long_terminal_repeat YCLWdelta3 chromosome 3 3 84295 84626 W 2006-01-12 2000-05-19 Ty1 LTR -S000006824 long_terminal_repeat YCLWdelta2b chromosome 3 3 84630 84718 W 2006-01-12 2000-05-19 Ty1 LTR -S000006826 long_terminal_repeat YCLWdelta4 chromosome 3 3 84811 85142 W 2006-01-12 2000-05-19 Ty2 LTR -S000006830 LTR_retrotransposon YCLWTy2-1 Ty2 chromosome 3 3 84811 90769 W 2006-01-12 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000000525 transposable_element_gene YCL020W gag protein chromosome 3 3 85102 86418 W 2006-01-12 2000-09-13|1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000036953 CDS YCL020W 3 85102 86418 W 2006-01-12 2000-09-13|1997-01-28 -S000000524 transposable_element_gene YCL019W gag-pol fusion protein chromosome 3 3 85102 90415 W 2006-01-12 2000-12-01|1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000036163 CDS YCL019W 3 85102 86391 W 2006-01-12 2000-12-01 -S000036164 CDS YCL019W 3 86393 90415 W 2006-01-12 2000-12-01|1997-01-28 -S000036165 plus_1_translational_frameshift YCL019W 3 86392 86392 W 2006-01-12 2000-12-01 -S000006827 long_terminal_repeat YCLWdelta5 chromosome 3 3 90438 90769 W 2006-01-12 2000-05-19 Ty2 LTR -S000006637 tRNA_gene tL(CAA)C SUP53 chromosome 3 L000002210|L000003751 3 90859 90972 W -10 2006-01-12 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations -S000033768 intron tL(CAA)C 3 90897 90928 W 2006-01-12 2000-05-19 -S000033766 noncoding_exon tL(CAA)C 3 90859 90896 W 2006-01-12 2000-05-19 -S000033767 noncoding_exon tL(CAA)C 3 90929 90972 W 2006-01-12 2000-05-19 -S000000523 ORF Verified YCL018W LEU2 3-isopropylmalate dehydrogenase chromosome 3 L000000943 3 91324 92418 W -5 2006-01-12 2000-09-13|1997-01-28 Beta-isopropylmalate dehydrogenase (IMDH); catalyzes the third step in the leucine biosynthesis pathway; can additionally catalyze the conversion of beta-ethylmalate into alpha-ketovalerate -S000035270 CDS YCL018W 3 91324 92418 W 2006-01-12 2000-09-13|1997-01-28 -S000000522 ORF Verified YCL017C NFS1 SPL1 chromosome 3 L000001240 3 94270 92777 C 2006-01-12 2000-09-13|1997-01-28 Cysteine desulfurase; involved in iron-sulfur cluster (Fe/S) biogenesis and in thio-modification of mitochondrial and cytoplasmic tRNAs; essential protein located predominantly in mitochondria -S000034976 CDS YCL017C 3 94270 92777 C 2006-01-12 2000-09-13|1997-01-28 -S000000521 ORF Verified YCL016C DCC1 chromosome 3 3 95763 94621 C 2006-01-12 2000-09-13|1997-01-28 Subunit of a complex with Ctf8p and Ctf18p; shares some components with Replication Factor C; required for sister chromatid cohesion and telomere length maintenance -S000034840 CDS YCL016C 3 95763 94621 C 2006-01-12 2000-09-13|1997-01-28 -S000000520 ORF Verified YCL014W BUD3 YCL012W chromosome 3 L000000200 3 96281 101191 W -9 2006-01-12 2000-09-13|1997-01-28 Guanine nucleotide exchange factor (GEF) for Cdc42p; activates Cdc42p in early G1, accounting for the first stage of biphasic activation, with Cdc24p accounting for the second stage in late G1; involved in the Cdc42p-mediated assembly of the axial landmark that dictates the site for the next round of budding, resulting in the axial budding pattern observed in haploids; localizes with septins to the bud neck contractile ring in mitosis -S000033879 CDS YCL014W 3 96281 101191 W 2006-01-12 2000-09-13|1997-01-28 -S000029705 ORF Verified YCL012C YCL011C-A chromosome 3 3 101788 101317 C 2006-01-12 2004-02-20|2011-02-03 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; orthologs are present in S. bayanus, S. paradoxus and Ashbya gossypii; YCL012C is not an essential gene -S000036814 CDS YCL012C 3 101633 101317 C 2006-01-12 2004-02-20 -S000036813 CDS YCL012C 3 101788 101701 C 2006-01-12 2004-02-20 -S000036815 intron YCL012C 3 101700 101634 C 2006-01-12 2004-02-20|2011-02-03 -S000000517 ORF Verified YCL011C GBP2 single-stranded telomeric DNA-binding/mRNA-binding protein|RLF6 chromosome 3 L000002609|L000003049 3 103358 102075 C 2006-01-12 1997-01-28 Poly(A+) RNA-binding protein; key surveillance factor for the selective export of spliced mRNAs from the nucleus to the cytoplasm; preference for intron-containing genes; similar to Npl3p; also binds single-stranded telomeric repeat sequence in vitro; relocalizes to the cytosol in response to hypoxia; GBP2 has a paralog, HRB1, that arose from the whole genome duplication -S000032976 CDS YCL011C 3 103358 102075 C 2006-01-12 1997-01-28 -S000000516 ORF Verified YCL010C SGF29 chromosome 3 3 104350 103571 C 2006-01-12 1999-07-17|1997-01-28 Component of the HAT/Core module of the SAGA, SLIK, and ADA complexes; HAT/Core module also contains Gcn5p, Ngg1p, and Ada2p; binds methylated histone H3K4; involved in transcriptional regulation through SAGA and TBP recruitment to target promoters and H3 acetylation -S000032887 CDS YCL010C 3 104350 103571 C 2006-01-12 1999-07-17|1997-01-28 -S000000515 ORF Verified YCL009C ILV6 acetolactate synthase regulatory subunit chromosome 3 L000004096 3 105548 104619 C 2006-01-12 1999-07-17|1997-01-28 Regulatory subunit of acetolactate synthase; acetolactate synthase catalyzes the first step of branched-chain amino acid biosynthesis; enhances activity of the Ilv2p catalytic subunit, localizes to mitochondria -S000032134 CDS YCL009C 3 105548 104619 C 2006-01-12 1999-07-17|1997-01-28 -S000000514 ORF Verified YCL008C STP22 ubiquitin-binding ESCRT-I subunit protein STP22|AGS1|VPL15|VPS23 chromosome 3 L000003975|S000029031|L000000064 3 106853 105696 C 2006-01-12 2004-02-18|2000-09-13|1997-01-28 Component of the ESCRT-I complex; ESCRT-I is involved in ubiquitin-dependent sorting of proteins into the endosome; prevents polyubiquitination of the arrestin-related protein Rim8p, thereby directing its monoubiquitination by Rsp5p; homologous to the mouse and human Tsg101 tumor susceptibility gene; mutants exhibit a Class E Vps phenotype; -S000032022 CDS YCL008C 3 106853 105696 C 2006-01-12 2004-02-18|1997-01-28|2000-09-13 -S000028508 ORF Verified YCL005W-A VMA9 H(+)-transporting V0 sector ATPase subunit e|LDB10|CWH36 chromosome 3 3 107023 107417 W 2006-01-12 2003-07-29 Vacuolar H+ ATPase subunit e of the V-ATPase V0 subcomplex; essential for vacuolar acidification; interacts with the V-ATPase assembly factor Vma21p in the ER; involved in V0 biogenesis -S000030218 CDS YCL005W-A 3 107023 107033 W 2006-01-12 2003-07-29 -S000030219 CDS YCL005W-A 3 107111 107191 W 2006-01-12 2003-07-29 -S000030220 CDS YCL005W-A 3 107288 107417 W 2006-01-12 2003-07-29 -S000030221 intron YCL005W-A 3 107034 107110 W 2006-01-12 2003-07-29 -S000030222 intron YCL005W-A 3 107192 107287 W 2006-01-12 2003-07-29 -S000000513 ORF Dubious YCL007C CWH36 chromosome 3 L000002918 3 107366 106974 C 2006-01-12 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps verified ORF YCL005W-A; mutations in YCL007C were thought to confer sensitivity to calcofluor white, but this phenotype was later shown to be due to the defect in YCL005W-A -S000031856 CDS YCL007C 3 107366 106974 C 2006-01-12 1997-01-28 -S000006503 snoRNA_gene snR43 SNR43 chromosome 3 L000003410 3 107712 107504 C 2006-01-12 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U966 and of 5.8S rRNA at position 73 -S000030615 noncoding_exon snR43 3 107712 107504 C 2006-01-12 2000-05-19 -S000000511 ORF Verified YCL005W LDB16 chromosome 3 3 108021 108791 W 2006-01-12 2000-09-13|1997-01-28 Protein involved in lipid droplet (LD) assembly; forms a complex with Sei1p at ER-LD contact sites, stabilizing contact sites; ensures that LDs bud from the ER towards the cytosolic side of the membrane; null mutants have decreased net negative cell surface charge and localized accumulation of phosphatidic acid (PA) marker proteins; GFP-fusion protein expression is induced in response to MMS; null mutant can be complemented by the human seipin, BSCL2 -S000030833 CDS YCL005W 3 108021 108791 W 2006-01-12 2000-09-13|1997-01-28 -S000028484 ARS ARS307 ARS307 chromosome 3 3 108727 109060 2014-11-18 2003-03-31|2014-11-18 Autonomously Replicating Sequence on Chromosome III -S000030169 ARS_consensus_sequence ARS307 3 108970 108960 C 2006-01-12 2003-03-31 -S000000510 ORF Verified YCL004W PGS1 CDP-diacylglycerol--glycerol-3-phosphate 3-phosphatidyltransferase|YCL003W|PEL1 chromosome 3 L000001372 3 109105 110670 W 2006-01-12 2000-02-10|1997-01-28 Phosphatidylglycerolphosphate synthase; catalyzes the synthesis of phosphatidylglycerolphosphate from CDP-diacylglycerol and sn-glycerol 3-phosphate in the first committed and rate-limiting step of cardiolipin biosynthesis -S000030745 CDS YCL004W 3 109105 110670 W 2006-01-12 2000-02-10|1997-01-28 -S000000508 ORF Uncharacterized YCL002C chromosome 3 3 111675 110808 C 2011-02-03 2003-09-27|1997-01-28|2000-09-13|2011-02-03 Putative protein of unknown function; YCL002C is not an essential gene -S000037735 CDS YCL002C 3 111557 110808 C 2011-02-03 2003-09-27|1997-01-28|2000-09-13|2011-02-03 -S000037734 CDS YCL002C 3 111675 111634 C 2011-02-03 2003-09-27 -S000037736 intron YCL002C 3 111633 111558 C 2011-02-03 2003-09-27 -S000000507 ORF Verified YCL001W RER1 protein retrieval receptor chromosome 3 L000001613 3 111916 112482 W 2011-02-03 1999-07-17|1997-01-28 Protein involved in retention of membrane proteins; including Sec12p, in the ER; localized to Golgi; functions as a retrieval receptor in returning membrane proteins to the ER -S000037714 CDS YCL001W 3 111916 112482 W 2011-02-03 1999-07-17|1997-01-28 -S000007221 ORF Uncharacterized YCL001W-A chromosome 3 3 113080 113541 W 2011-02-03 1999-07-17 Putative protein of unknown function; YCL001W-A gene has similarity to DOM34 and is present in a region duplicated between chromosomes XIV and III -S000034577 CDS YCL001W-A 3 113080 113541 W 2011-02-03 1999-07-17 -S000007596 ORF Uncharacterized YCL001W-B chromosome 3 3 113770 114024 W 2011-02-03 2001-02-26 Putative protein of unknown function; present in a region duplicated between chromosomes XIV and III; YCL001W-B has a paralog, DOM34, that arose from the whole genome duplication -S000037142 CDS YCL001W-B 3 113770 114024 W 2011-02-03 2001-02-26 -S000028485 ARS ARS308 ARS308 chromosome 3 3 114321 114939 2011-02-03 2003-03-31 Autonomously Replicating Sequence on Chromosome III -S000006465 centromere CEN3 CEN3 chromosome 3 L000000296 3 114385 114501 W 0 2011-02-03 2000-05-19 Chromosome III centromere -S000077263 centromere_DNA_Element_I CEN3 3 114385 114394 W 2011-02-03 2004-10-04 -S000077264 centromere_DNA_Element_II CEN3 3 114395 114476 W 2011-02-03 2004-10-04 -S000077265 centromere_DNA_Element_III CEN3 3 114477 114501 W 2011-02-03 2004-10-04 -S000000594 ORF Uncharacterized YCR001W chromosome 3 3 115685 115999 W 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR001W is not an essential gene -S000035168 CDS YCR001W 3 115685 115999 W 2011-02-03 1997-01-28 -S000000595 ORF Verified YCR002C CDC10 septin CDC10 chromosome 3 L000000250 3 118348 117380 C -.75 2011-02-03 1997-01-28 Component of the septin ring, required for cytokinesis; septins are GTP-binding proteins that assemble into rod-like hetero-oligomers that can associate to form filaments; septin rings at the mother-bud neck act as scaffolds for recruiting cell division factors and as barriers to prevent diffusion of specific proteins between mother and daughter cells; N-terminus interacts with phosphatidylinositol-4,5-bisphosphate; protein abundance increases under DNA damage stress -S000035178 CDS YCR002C 3 118348 117380 C 2011-02-03 1997-01-28 -S000000596 ORF Verified YCR003W MRPL32 mitochondrial 54S ribosomal protein YmL32|YmL32 chromosome 3 L000001169 3 118620 119171 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; protein abundance increases in response to DNA replication stress -S000036143 CDS YCR003W 3 118620 119171 W 2011-02-03 1997-01-28 -S000000597 ORF Verified YCR004C YCP4 flavodoxin-like fold family protein chromosome 3 L000004160 3 120318 119575 C 2011-02-03 1997-01-28 Protein of unknown function; has sequence and structural similarity to flavodoxins; predicted to be palmitoylated; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000036195 CDS YCR004C 3 120318 119575 C 2011-02-03 1997-01-28 -S000000598 ORF Verified YCR005C CIT2 citrate (Si)-synthase CIT2 chromosome 3 L000000342 3 122328 120946 C 2011-02-03 2000-09-13|1997-01-28 Citrate synthase, peroxisomal isozyme involved in glyoxylate cycle; catalyzes condensation of acetyl coenzyme A and oxaloacetate to form citrate; expression is controlled by Rtg1p and Rtg2p transcription factors; SCF-Ucc1 regulates level of Cit2p to maintain citrate homeostasis; oxaloacetate-dependent positive feedback loop inhibits Cit2p ubiquitination; CIT2 has a paralog, CIT1, that arose from the whole genome duplication -S000031674 CDS YCR005C 3 122328 120946 C 2011-02-03 2000-09-13|1997-01-28 -S000000599 ORF Uncharacterized YCR006C chromosome 3 3 123003 122530 C 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR006C is not an essential gene -S000031816 CDS YCR006C 3 123003 122530 C 2011-02-03 1997-01-28 -S000006678 tRNA_gene tP(AGG)C SUF2 chromosome 3 L000002150|L000003759 3 123648 123577 C 2 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in proline codons -S000033260 noncoding_exon tP(AGG)C 3 123648 123577 C 2011-02-03 2000-05-19 -S000006832 long_terminal_repeat YCRCdelta6 chromosome 3 3 124465 124134 C 2011-02-03 2000-05-19|2007-04-02 Ty1 LTR -S000000600 ORF Uncharacterized YCR007C DUP240 family protein chromosome 3 3 126730 126011 C 2011-02-03 1997-01-28 Putative integral membrane protein; member of DUP240 gene family; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole; YCR007C is not an essential gene -S000031932 CDS YCR007C 3 126730 126011 C 2011-02-03 1997-01-28 -S000006668 tRNA_gene tN(GUU)C chromosome 3 L000003752 3 127716 127789 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000030674 noncoding_exon tN(GUU)C 3 127716 127789 W 2011-02-03 2000-05-19 -S000000601 ORF Verified YCR008W SAT4 serine/threonine protein kinase SAT4|HAL4 chromosome 3 L000004136 3 128470 130281 W 2011-02-03 1997-01-28 Ser/Thr protein kinase involved in salt tolerance; funtions in regulation of Trk1p-Trk2p potassium transporter; overexpression affects the Fe-S and lipoamide containing proteins in the mitochondrion; required for lipoylation of Lat1p, Kgd2p and Gcv3p; partially redundant with Hal5p; has similarity to Npr1p; localizes to the cytoplasm and mitochondrion -S000037489 CDS YCR008W 3 128470 130281 W 2011-02-03 1997-01-28 -S000000602 ORF Verified YCR009C RVS161 amphiphysin-like protein RVS161|SPE161|FUS7|END6 chromosome 3 L000001788 3 131542 130745 C 1 2011-02-03 1997-01-28 Amphiphysin-like lipid raft protein; N-BAR domain protein that interacts with Rvs167p and regulates polarization of the actin cytoskeleton, endocytosis, cell polarity, cell fusion and viability following starvation or osmotic stress -S000037521 CDS YCR009C 3 131542 130745 C 2011-02-03 1997-01-28 -S000028486 ARS ARS309 ARS309 chromosome 3 3 132043 132120 2014-11-18 2003-03-31|2014-11-18 Autonomously Replicating Sequence on Chromosome III -S000030172 ARS_consensus_sequence ARS309 3 132046 132056 W 2011-02-03 2003-03-31 -S000000603 ORF Verified YCR010C ADY2 ATO1 chromosome 3 3 133124 132273 C 2011-02-03 1997-01-28 Acetate transporter required for normal sporulation; phosphorylated in mitochondria; ADY2 has a paralog, ATO2, that arose from the whole genome duplication -S000037136 CDS YCR010C 3 133124 132273 C 2011-02-03 1997-01-28 -S000000604 ORF Verified YCR011C ADP1 putative ATP-dependent permease ADP1 chromosome 3 L000000049 3 136873 133724 C 1 2011-02-03 2000-09-13|1997-01-28 Putative ATP-dependent permease of the ABC transporter family -S000037210 CDS YCR011C 3 136873 133724 C 2011-02-03 2000-09-13|1997-01-28 -S000000605 ORF Verified YCR012W PGK1 phosphoglycerate kinase chromosome 3 L000001411 3 137746 138996 W 2 2011-02-03 2000-09-13|1997-01-28 3-phosphoglycerate kinase; catalyzes transfer of high-energy phosphoryl groups from the acyl phosphate of 1,3-bisphosphoglycerate to ADP to produce ATP; key enzyme in glycolysis and gluconeogenesis -S000037349 CDS YCR012W 3 137746 138996 W 2011-02-03 2000-09-13|1997-01-28 -S000000606 ORF Dubious YCR013C chromosome 3 3 139049 138402 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription of both YCR013C and the overlapping essential gene PGK1 is reduced in a gcr1 null mutant -S000037371 CDS YCR013C 3 139049 138402 C 2011-02-03 1997-01-28 -S000000607 ORF Verified YCR014C POL4 DNA-directed DNA polymerase IV|POLX chromosome 3 L000001462 3 140933 139185 C 2011-02-03 2000-09-13|1997-01-28 DNA polymerase IV; undergoes pair-wise interactions with Dnl4p-Lif1p and Rad27p to mediate repair of DNA double-strand breaks by non-homologous end joining (NHEJ); homologous to mammalian DNA polymerase beta -S000029998 CDS YCR014C 3 140933 139185 C 2011-02-03 2000-09-13|1997-01-28 -S000000608 ORF Verified YCR015C CTO1 chromosome 3 3 142170 141217 C 2011-02-03 2000-09-13|1997-01-28 Protein required for cold tolerance; involved in phosphate uptake; YCR015C is not an essential gene -S000030089 CDS YCR015C 3 142170 141217 C 2011-02-03 2000-09-13|1997-01-28 -S000007298 snoRNA_gene snR33 SNR33 chromosome 3 L000001971 3 142546 142364 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U1042 -S000036761 noncoding_exon snR33 3 142546 142364 C 2011-02-03 2000-05-19 -S000006575 tRNA_gene tG(GCC)C SUF16 chromosome 3 L000002163|L000003758 3 142771 142701 C 3 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis;can mutate to suppress +1 frameshift mutations in glycine codons -S000037891 noncoding_exon tG(GCC)C 3 142771 142701 C 2011-02-03 2000-05-19 -S000006833 long_terminal_repeat YCRCdelta7 chromosome 3 3 143080 142758 C 2011-02-03 2000-05-19|2007-04-02 Ty1 LTR -S000000609 ORF Uncharacterized YCR016W chromosome 3 3 143634 144506 W 2011-02-03 2000-09-13|1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus and nucleus; predicted to be involved in ribosome biogenesis -S000030347 CDS YCR016W 3 143634 144506 W 2011-02-03 2000-09-13|1997-01-28 -S000000610 ORF Verified YCR017C CWH43 chromosome 3 3 147634 144773 C 2011-02-03 2000-09-13|1997-01-28 GPI lipid remodelase; responsible for introducing ceramides into GPI anchors having a C26:0 fatty acid in sn-2 of the glycerol moiety; can also use lyso-GPI protein anchors and various base resistant lipids as substrates; contains 14-16 transmembrane segments and several putative glycosylation and phosphorylation sites; null mutation is synthetically lethal with pkc1 deletion -S000030381 CDS YCR017C 3 147634 144773 C 2011-02-03 2000-09-13|1997-01-28 -S000000611 ORF Verified YCR018C SRD1 chromosome 3 L000002054 3 148903 148238 C 9 2011-02-03 2000-09-13|1997-01-28 Protein involved in the processing of pre-rRNA to mature rRNA; contains a C2/C2 zinc finger motif; srd1 mutation suppresses defects caused by the rrp1-1 mutation -S000033700 CDS YCR018C 3 148903 148238 C 2011-02-03 2000-09-13|1997-01-28 -S000006835 long_terminal_repeat YCRWdelta8 chromosome 3 3 149482 149809 W 2011-02-03 2000-05-19 Ty1 LTR -S000006658 tRNA_gene tM(CAU)C chromosome 3 L000003753 3 149920 149991 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), predicted by tRNAscan-SE analysis -S000034498 noncoding_exon tM(CAU)C 3 149920 149991 W 2011-02-03 2000-05-19 -S000006836 long_terminal_repeat YCRWdelta9 chromosome 3 3 150220 150551 W 2011-02-03 2000-05-19 Ty1 LTR -S000007429 long_terminal_repeat YCRCtau1 chromosome 3 3 151055 150695 C 2011-02-03 2000-05-19|2008-03-05 Ty4 LTR -S000006615 tRNA_gene tK(CUU)C chromosome 3 L000003757 3 151356 151284 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000035985 noncoding_exon tK(CUU)C 3 151356 151284 C 2011-02-03 2000-05-19 -S000006837 long_terminal_repeat YCRWdelta10 chromosome 3 3 151521 151851 W 2011-02-03 2000-05-19 Ty1 LTR -S000007230 ORF Dubious YCR018C-A chromosome 3 3 151862 151608 C 2011-02-03 1999-07-17 Putative protein of unknown function; encoded opposite a Ty1 LTR -S000036351 CDS YCR018C-A 3 151862 151608 C 2011-02-03 1999-07-17 -S000000612 ORF Verified YCR019W MAK32 chromosome 3 L000000999 3 152837 153928 W 2011-02-03 1997-01-28 Protein necessary for stability of L-A dsRNA-containing particles -S000033899 CDS YCR019W 3 152837 153928 W 2011-02-03 1997-01-28 -S000000613 ORF Verified YCR020C PET18 HIT2 chromosome 3 L000001390 3 154659 154012 C 17 2011-02-03 1997-01-28 Protein of unknown function; has weak similarity to proteins involved in thiamin metabolism; expression is induced in the absence of thiamin -S000033420 CDS YCR020C 3 154659 154012 C 2011-02-03 1997-01-28 -S000000614 ORF Verified YCR020C-A MAK31 NAA38|SMX1|LSM9 chromosome 3 L000000998 3 155096 154830 C 2011-02-03 1997-01-28 Non-catalytic subunit of N-terminal acetyltransferase of the NatC type; required for replication of dsRNA virus; member of the Sm protein family -S000031333 CDS YCR020C-A 3 155096 154830 C 2011-02-03 1997-01-28 -S000006439 ORF Verified YCR020W-B HTL1 chromosome 3 L000004545 3 155320 155556 W 2011-02-03 1999-07-17 Component of the RSC chromatin remodeling complex; RSC functions in transcriptional regulation and elongation, chromosome stability, and establishing sister chromatid cohesion; involved in telomere maintenance -S000033349 CDS YCR020W-B 3 155320 155556 W 2011-02-03 1999-07-17 -S000000615 ORF Verified YCR021C HSP30 YRO1 chromosome 3 L000000818 3 157107 156109 C 2011-02-03 1997-01-28 Negative regulator of the H(+)-ATPase Pma1p; stress-responsive protein; hydrophobic plasma membrane localized; induced by heat shock, ethanol treatment, weak organic acid, glucose limitation, and entry into stationary phase -S000033481 CDS YCR021C 3 157107 156109 C 2011-02-03 1997-01-28 -S000000616 ORF Uncharacterized YCR022C chromosome 3 3 157765 157421 C 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR022C is not an essential gene -S000033548 CDS YCR022C 3 157765 157421 C 2011-02-03 1997-01-28 -S000000617 ORF Verified YCR023C chromosome 3 3 160373 158538 C 2011-02-03 2000-09-13|1997-01-28 Vacuolar membrane protein of unknown function; member of the multidrug resistance family; YCR023C is not an essential gene -S000033605 CDS YCR023C 3 160373 158538 C 2011-02-03 2000-09-13|1997-01-28 -S000000618 ORF Verified YCR024C SLM5 asparagine--tRNA ligase SLM5 chromosome 3 3 162222 160744 C 2011-02-03 2000-09-13|1997-01-28 Mitochondrial asparaginyl-tRNA synthetase -S000034549 CDS YCR024C 3 162222 160744 C 2011-02-03 2000-09-13|1997-01-28 -S000028818 ORF Uncharacterized YCR024C-B chromosome 3 3 162865 162599 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000033627 CDS YCR024C-B 3 162865 162599 C 2011-02-03 2003-07-29 -S000000619 ORF Verified YCR024C-A PMP1 proteolipid ATPase chromosome 3 L000001453 3 163067 162945 C 2011-02-03 1997-01-28 Regulatory subunit for the plasma membrane H(+)-ATPase Pma1p; small single-membrane span proteolipid; forms unique helix and positively charged cytoplasmic domain that is able to specifically segregate phosphatidylserines; PMP1 has a paralog, PMP2, that arose from the whole genome duplication -S000030035 CDS YCR024C-A 3 163067 162945 C 2011-02-03 1997-01-28 -S000000620 ORF Dubious YCR025C chromosome 3 3 163856 163446 C 2011-02-03 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YCR025C is not an essential gene -S000034636 CDS YCR025C 3 163856 163446 C 2011-02-03 2000-09-13|1997-01-28 -S000000621 ORF Verified YCR026C NPP1 nucleotide diphosphatase/phosphodiesterase NPP1 chromosome 3 3 166339 164111 C 2011-02-03 2000-09-13|1997-01-28 Nucleotide pyrophosphatase/phosphodiesterase; mediates extracellular nucleotide phosphate hydrolysis along with Npp2p and Pho5p; activity and expression enhanced during conditions of phosphate starvation; involved in spore wall assembly; NPP1 has a paralog, NPP2, that arose from the whole genome duplication, and an npp1 npp2 double mutant exhibits reduced dityrosine fluorescence relative to the single mutants -S000034766 CDS YCR026C 3 166339 164111 C 2011-02-03 2000-09-13|1997-01-28 -S000028487 ARS ARS310 ARS310 chromosome 3 3 166503 167348 2011-02-03 2003-03-31 Compound autonomously replicating sequence on Chromosome III -S000030176 ARS_consensus_sequence ARS310 3 166663 166673 W 2011-02-03 2003-03-31 -S000030177 ARS_consensus_sequence ARS310 3 166710 166700 C 2011-02-03 2003-03-31 -S000030178 ARS_consensus_sequence ARS310 3 166766 166756 C 2011-02-03 2003-03-31 -S000000622 ORF Verified YCR027C RHB1 putative GTPase RHB1|RSG1 chromosome 3 S000007419 3 167999 167370 C 2011-02-03 2000-09-13|1997-01-28 Putative Rheb-related GTPase; involved in regulating canavanine resistance and arginine uptake; member of the Ras superfamily of G-proteins -S000035733 CDS YCR027C 3 167999 167370 C 2011-02-03 2000-09-13|1997-01-28 -S000006692 tRNA_gene tQ(UUG)C chromosome 3 L000003756 3 168372 168301 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000031663 noncoding_exon tQ(UUG)C 3 168372 168301 C 2011-02-03 2000-05-19 -S000006838 long_terminal_repeat YCRWdelta11 chromosome 3 3 169573 169888 W 2011-02-03 2000-05-19 Ty1 LTR -S000000623 ORF Verified YCR028C FEN2 chromosome 3 L000004079 3 172424 170886 C 2011-02-03 2000-09-13|1997-01-28 Plasma membrane H+-pantothenate symporter; confers sensitivity to the antifungal agent fenpropimorph; relocalizes from vacuole to cytoplasm upon DNA replication stress -S000035840 CDS YCR028C 3 172424 170886 C 2011-02-03 2000-09-13|1997-01-28 -S000007222 ORF Verified YCR028C-A RIM1 chromosome 3 L000001640 3 173440 172950 C 2011-02-03 2000-09-13|1999-07-17 ssDNA-binding protein essential for mitochondrial genome maintenance; involved in mitochondrial DNA replication; stimulates utilization by Mip1p DNA polymerase of RNA primers synthesized by Rpo41p -S000030988 CDS YCR028C-A 3 173115 172950 C 2011-02-03 2000-09-13|1999-07-17 -S000030987 CDS YCR028C-A 3 173440 173199 C 2011-02-03 2000-09-13|1999-07-17 -S000030989 intron YCR028C-A 3 173198 173116 C 2011-02-03 2000-09-13|1999-07-17 -S000000626 ORF Verified YCR030C SYP1 YCR029C-A chromosome 3 3 176438 173826 C 2011-02-03 2000-09-13|1997-01-28|1999-07-17 Negative regulator of WASP-Arp23 complex; involved in endocytic site formation; directly inhibits Las17p stimulation of Arp23 complex-mediated actin assembly in vitro; may regulate assembly and disassembly of the septin ring; colocalizes and interacts with septin subunits; potential role in actin cytoskeletal organization -S000036846 CDS YCR030C 3 176438 173826 C 2011-02-03 2000-09-13|1999-07-17|1997-01-28 -S000006456 snoRNA_gene snR65 SNR65 chromosome 3 L000004534 3 177183 177282 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2347 -S000030850 noncoding_exon snR65 3 177183 177282 W 2011-02-03 2000-05-19 -S000000627 ORF Verified YCR031C RPS14A uS11|ribosomal 40S subunit protein S14A|S11|rp59A|S14A|RPL59|CRY1 chromosome 3 L000000423 3 178220 177500 C 26 2011-02-03 2000-09-13|1997-01-28 Protein component of the small (40S) ribosomal subunit; required for ribosome assembly and 20S pre-rRNA processing; mutations confer cryptopleurine resistance; homologous to mammalian ribosomal protein S14 and bacterial S11; RPS14A has a paralog, RPS14B, that arose from the whole genome duplication -S000037573 CDS YCR031C 3 177906 177500 C 2011-02-03 2000-09-13|1997-01-28 -S000037572 CDS YCR031C 3 178220 178214 C 2011-02-03 2000-09-13|1997-01-28 -S000037574 intron YCR031C 3 178213 177907 C 2011-02-03 2000-09-13|1997-01-28 -S000007314 snoRNA_gene snR189 SNR189 chromosome 3 L000001976 3 178798 178610 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2735 and small subunit (SSU) rRNA at position U466 -S000030325 noncoding_exon snR189 3 178798 178610 C 2011-02-03 2000-05-19 -S000000628 ORF Verified YCR032W BPH1 chromosome 3 L000003507 3 179520 186023 W 2011-02-03 2000-09-13|1997-01-28 Protein homologous to Chediak-Higashi syndrome and Beige proteins; both of which are implicated in disease syndromes in human and mouse, respectively, due to defective lysosomal trafficking; mutant phenotype and genetic interactions suggest a role in protein sorting -S000037675 CDS YCR032W 3 179520 186023 W 2011-02-03 2000-09-13|1997-01-28 -S000000629 ORF Verified YCR033W SNT1 chromosome 3 3 186489 190169 W 2011-02-03 2000-09-13|1997-01-28 Subunit of the Set3C deacetylase complex; interacts directly with the Set3C subunit, Sif2p; putative DNA-binding protein; mutant has increased aneuploidy tolerance; relocalizes to the cytosol in response to hypoxia -S000037732 CDS YCR033W 3 186489 190169 W 2011-02-03 2000-09-13|1997-01-28 -S000000630 ORF Verified YCR034W ELO2 fatty acid elongase ELO2|FEN1|VBM2|GNS1 chromosome 3 L000003126|L000000608 3 190592 191635 W 24 2011-02-03 1997-01-28 Fatty acid elongase, involved in sphingolipid biosynthesis; acts on fatty acids of up to 24 carbons in length; mutations have regulatory effects on 1,3-beta-glucan synthase, vacuolar ATPase, and the secretory pathway; ELO2 has a paralog, ELO1, that arose from the whole genome duplication; lethality of the elo2 elo3 double null mutation is functionally complemented by human ELOVL1 and weakly complemented by human ELOVL3 or ELOV7 -S000037781 CDS YCR034W 3 190592 191635 W 2011-02-03 1997-01-28 -S000000631 ORF Verified YCR035C RRP43 exosome non-catalytic core subunit RRP43 chromosome 3 L000003552 3 193018 191834 C 2011-02-03 2000-09-13|1997-01-28 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp43p (OIP2, EXOSC8); protein abundance increases in response to DNA replication stress -S000030620 CDS YCR035C 3 193018 191834 C 2011-02-03 2000-09-13|1997-01-28 -S000000632 ORF Verified YCR036W RBK1 putative ribokinase chromosome 3 L000001587 3 193297 194298 W 29 2011-02-03 2000-09-13|1997-01-28 Putative ribokinase -S000030780 CDS YCR036W 3 193297 194298 W 2011-02-03 2000-09-13|1997-01-28 -S000028488 ARS ARS313 ARS313 ARSIII-194 chromosome 3 3 194308 194367 2014-11-18 2003-03-31|2014-11-18|2006-09-06 Autonomously Replicating Sequence on Chromosome III -S000000633 ORF Verified YCR037C PHO87 SPX domain-containing inorganic phosphate transporter chromosome 3 L000002740 3 197185 194414 C 2011-02-03 2000-09-13|1997-01-28 Low-affinity inorganic phosphate (Pi) transporter; acts upstream of Pho81p in regulation of the PHO pathway; expression is independent of Pi concentration and Pho4p activity; contains 12 membrane-spanning segments; PHO87 has a paralog, PHO90, that arose from the whole genome duplication -S000030810 CDS YCR037C 3 197185 194414 C 2011-02-03 2000-09-13|1997-01-28 -S000028489 ARS ARS314 ARS314 ARSIII-198 chromosome 3 3 197460 197598 2014-11-18 2003-03-31|2014-11-18|2006-09-06 Autonomously Replicating Sequence on Chromosome III; active in <10% of cell cycles -S000178056 ARS_consensus_sequence ARS314 3 197552 197536 C 2014-11-18 2014-11-18 -S000029699 mating_type_region MATALPHA MATALPHA MAT chromosome 3 L000001031 3 198671 201177 W 30 2011-02-03 2007-12-10 Mating type locus; note that the systematic sequence in SGD contains MATalpha sequences -S000124947 W_region MATALPHA 3 198671 199400 W 2011-02-03 2007-12-10 -S000124948 X_region MATALPHA 3 199401 200103 W 2011-02-03 2007-12-10 -S000124949 Y_region MATALPHA 3 200104 200850 W 2011-02-03 2007-12-10 -S000124950 Z1_region MATALPHA 3 200851 201089 W 2011-02-03 2007-12-10 -S000124951 Z2_region MATALPHA 3 201090 201177 W 2011-02-03 2007-12-10 -S000007597 ORF Dubious YCR038W-A chromosome 3 3 199293 199418 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene BUD5/YCR038C; identified by homology with hemiascomycetous yeast species -S000037143 CDS YCR038W-A 3 199293 199418 W 2011-02-03 2001-02-26 -S000000634 ORF Verified YCR038C BUD5 Ras family guanine nucleotide exchange factor BUD5 chromosome 3 L000000202 3 199549 197621 C 30 2011-02-03 2000-09-13|1997-01-28 GTP/GDP exchange factor for Rsr1p (Bud1p); required for both axial and bipolar budding patterns; mutants exhibit random budding in all cell types -S000031792 CDS YCR038C 3 199549 197621 C 2011-02-03 2000-09-13|1997-01-28 -S000000635 ORF Verified YCR039C MATALPHA2 homeodomain mating type protein alpha2|ALPHA2 chromosome 3 L000002973 3 200178 199546 C 2011-02-03 1997-01-28 Homeobox-domain protein; with Mcm1p, represses a-specific genes in haploids; acts with A1p to repress transcription of haploid-specific genes in diploids; one of two genes encoded by the MATalpha mating type cassette -S000031946 CDS YCR039C 3 200178 199546 C 2011-02-03 1997-01-28 -S000000636 ORF Verified YCR040W MATALPHA1 transcriptional co-activator mating type protein alpha|ALPHA1 chromosome 3 L000002972 3 200442 200969 W 2011-02-03 1997-01-28 Transcriptional co-activator that regulates mating-type-specific genes; targets the transcription factor Mcm1p to the promoters of alpha-specific genes; one of two genes encoded by the MATalpha mating type cassette -S000032771 CDS YCR040W 3 200442 200969 W 2011-02-03 1997-01-28 -S000000637 ORF Verified YCR041W chromosome 3 3 200911 201243 W 2011-02-03 1997-01-28 Protein of unknown function; overexpression suppresses the high-frequency loss of mini-chromosomes, probably by increasing the rate of proper chromosome segregation; translated gene product of YCR041W, but not its transcript, is responsible for suppression; suppression ability of YCR041W is completely dependent on silencing protein Sir4p -S000032864 CDS YCR041W 3 200911 201243 W 2011-02-03 1997-01-28 -S000000638 ORF Verified YCR042C TAF2 TafII150|TSM1|TAF150 chromosome 3 L000002367 3 205397 201174 C 31 2011-02-03 1997-01-28 TFIID subunit (150 kDa); involved in RNA polymerase II transcription initiation -S000032896 CDS YCR042C 3 205397 201174 C 2011-02-03 1997-01-28 -S000000639 ORF Uncharacterized YCR043C chromosome 3 3 206644 206261 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the Golgi apparatus; YCR043C is not an essential gene -S000033005 CDS YCR043C 3 206644 206261 C 2011-02-03 1997-01-28 -S000000640 ORF Verified YCR044C PER1 COS16 chromosome 3 3 207950 206877 C 2011-02-03 1997-01-28 Protein of the endoplasmic reticulum; required for GPI-phospholipase A2 activity that remodels the GPI anchor as a prerequisite for association of GPI-anchored proteins with lipid rafts; functionally complemented by human ortholog PERLD1 -S000033673 CDS YCR044C 3 207950 206877 C 2011-02-03 1997-01-28 -S000028607 ORF Dubious YCR045W-A chromosome 3 3 208751 209101 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with YCR045C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031418 CDS YCR045W-A 3 208751 209101 W 2011-02-03 2003-07-29 -S000000641 ORF Verified YCR045C RRT12 OSW3 chromosome 3 3 209610 208135 C 2011-02-03 1997-01-28 Probable subtilisin-family protease; role in formation of the dityrosine layer of spore walls; localizes to the spore wall and also the nuclear envelope and ER region in mature spores -S000033761 CDS YCR045C 3 209610 208135 C 2011-02-03 1997-01-28 -S000000642 ORF Verified YCR046C IMG1 mitochondrial 54S ribosomal protein IMG1 chromosome 3 L000004445 3 210423 209914 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; required for respiration and for maintenance of the mitochondrial genome -S000033858 CDS YCR046C 3 210423 209914 C 2011-02-03 1997-01-28 -S000028608 ORF Dubious YCR047W-A chromosome 3 3 211301 211507 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with YCR047C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031420 CDS YCR047W-A 3 211301 211507 W 2011-02-03 2003-07-29 -S000000643 ORF Verified YCR047C BUD23 18S rRNA (guanine1575-N7)-methyltransferase chromosome 3 3 211545 210718 C 2011-02-03 1997-01-28 Methyltransferase that methylates residue G1575 of 18S rRNA; required for rRNA processing and nuclear export of 40S ribosomal subunits independently of methylation activity; diploid mutant displays random budding pattern; functional homolog of human WBSCR22 -S000034011 CDS YCR047C 3 211545 210718 C 2011-02-03 1997-01-28 -S000000644 ORF Verified YCR048W ARE1 sterol acyltransferase|SAT2 chromosome 3 L000003221|L000002768 3 211929 213761 W 2011-02-03 1997-01-28 Acyl-CoA:sterol acyltransferase; endoplasmic reticulum enzyme that contributes the major sterol esterification activity in the absence of oxygen; ARE1 has a paralog, ARE2, that arose from the whole genome duplication -S000034969 CDS YCR048W 3 211929 213761 W 2011-02-03 1997-01-28 -S000000645 ORF Dubious YCR049C chromosome 3 3 212317 211871 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035033 CDS YCR049C 3 212317 211871 C 2011-02-03 1997-01-28 -S000000646 ORF Uncharacterized YCR050C chromosome 3 3 213772 213464 C 2011-02-03 1997-01-28 Non-essential protein of unknown function; deletion mutant is synthetically sick or lethal with alpha-synuclein -S000036029 CDS YCR050C 3 213772 213464 C 2011-02-03 1997-01-28 -S000000647 ORF Uncharacterized YCR051W chromosome 3 3 214071 214739 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; contains ankyrin (Ank) repeats; YCR051W is not an essential gene -S000036913 CDS YCR051W 3 214071 214739 W 2011-02-03 1997-01-28 -S000000648 ORF Verified YCR052W RSC6 chromosome 3 L000003151 3 214994 216445 W 2011-02-03 1997-01-28 Component of the RSC chromatin remodeling complex; essential for mitotic growth; RSC6 has a paralog, SNF12, that arose from the whole genome duplication -S000036966 CDS YCR052W 3 214994 216445 W 2011-02-03 1997-01-28 -S000000649 ORF Verified YCR053W THR4 threonine synthase THR4 chromosome 3 L000002300 3 216697 218241 W 51 2011-02-03 1997-01-28 Threonine synthase; conserved protein that catalyzes formation of threonine from O-phosphohomoserine; expression is regulated by the GCN4-mediated general amino acid control pathway -S000037048 CDS YCR053W 3 216697 218241 W 2011-02-03 1997-01-28 -S000000650 ORF Verified YCR054C CTR86 chromosome 3 L000004071 3 220067 218376 C 2011-02-03 1997-01-28 Essential protein of unknown function; with orthologs in Ashbya gossypii and Candida albicans; similar to human ATXN10, mutations in which cause spinocerebellar ataxia type 10; codon usage corresponds to that observed for yeast genes expressed at low levels; relative distribution to the nucleus increases upon DNA replication stress -S000037070 CDS YCR054C 3 220067 218376 C 2011-02-03 1997-01-28 -S000000653 ORF Verified YCR057C PWP2 snoRNA-binding rRNA-processing protein PWP2|UTP1|YCR058C|YCR055C chromosome 3 L000001540 3 223228 220457 C 2011-02-03 2000-09-13|1997-01-28 Conserved 90S pre-ribosomal component; essential for proper endonucleolytic cleavage of the 35 S rRNA precursor at A0, A1, and A2 sites; contains eight WD-repeats; PWP2 deletion leads to defects in cell cycle and bud morphogenesis -S000029966 CDS YCR057C 3 223228 220457 C 2011-02-03 2000-09-13|1997-01-28 -S000000655 ORF Verified YCR059C YIH1 chromosome 3 3 224230 223454 C 2011-02-03 1997-01-28 Negative regulator of eIF2 kinase Gcn2p; competes with Gcn2p for binding to Gcn1p; may contribute to regulation of translation in response to starvation via regulation of Gcn2p; binds to monomeric actin and to ribosomes and polyribosomes; ortholog of mammalian IMPACT -S000031068 CDS YCR059C 3 224230 223454 C 2011-02-03 1997-01-28 -S000000656 ORF Verified YCR060W TAH1 chromosome 3 3 224399 224734 W 2011-02-03 1997-01-28 Component of conserved R2TP complex (Rvb1-Rvb2-Tah1-Pih1); R2TP complex interacts with Hsp90 (Hsp82p and Hsc82p) to mediate assembly of large protein complexes such as box C/D snoRNPs and RNA polymerase II; contains a single TPR domain with at least two TPR motifs; plays a role in determining prion variants -S000032111 CDS YCR060W 3 224399 224734 W 2011-02-03 1997-01-28 -S000028490 ARS ARS315 ARS315 ARSIII-225 chromosome 3 3 224816 225061 2011-02-03 2003-03-31|2006-09-06 Highly-active autonomously replicating sequence; initiates replication in ~90% of cell cycles -S000178057 ARS_consensus_sequence ARS315 3 224853 224869 W 2014-11-18 2014-11-18 -S000000657 ORF Uncharacterized YCR061W YCR062W chromosome 3 3 225563 227458 W 2011-02-03 2000-09-14|1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000032157 CDS YCR061W 3 225563 227458 W 2011-02-03 2000-09-14|1997-01-28 -S000006730 tRNA_gene tS(CGA)C SUP61 chromosome 3 L000002215|L000003754 3 227942 228042 W 68 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; i6A37 modification is catalyzed by Mod5p; can mutate to suppress amber or ochre nonsense mutations; suppressor mutant alleles are recessive lethal and can only be maintained when an additional wild-type copy of the gene is present, because SUP61 encodes the only tRNA species that can decode UCG codons -S000029830 intron tS(CGA)C 3 227979 227997 W 2011-02-03 2000-05-19 -S000029828 noncoding_exon tS(CGA)C 3 227942 227978 W 2011-02-03 2000-05-19 -S000029829 noncoding_exon tS(CGA)C 3 227998 228042 W 2011-02-03 2000-05-19 -S000000659 ORF Verified YCR063W BUD31 U2 snRNP complex subunit BUD31|CWC14 chromosome 3 3 228318 228791 W 2011-02-03 1997-01-28 Component of the SF3b subcomplex of the U2 snRNP; increases efficiency of first and second step pre-mRNA splicing; diploid mutants display a random budding pattern instead of the wild-type bipolar pattern; facilitates passage through G1/S Start, but is not required for G2/M transition or exit from mitosis -S000033121 CDS YCR063W 3 228318 228791 W 2011-02-03 1997-01-28 -S000000660 ORF Dubious YCR064C chromosome 3 3 228505 228095 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene BUD31 -S000033148 CDS YCR064C 3 228505 228095 C 2011-02-03 1997-01-28 -S000000661 ORF Verified YCR065W HCM1 chromosome 3 L000000757 3 229310 231004 W 2011-02-03 2000-09-13|1997-01-28 Forkhead transcription factor; drives S-phase activation of genes involved in chromosome segregation, spindle dynamics, budding; also activates genes involved in respiration, use of alternative energy sources (like proline), NAD synthesis, oxidative stress resistance; key factor in early adaptation to nutrient deficiency and diauxic shift; suppressor of calmodulin mutants with specific SPB assembly defects; ortholog of C. elegans lifespan regulator PHA-4 -S000033238 CDS YCR065W 3 229310 231004 W 2011-02-03 2000-09-13|1997-01-28 -S000000662 ORF Verified YCR066W RAD18 E3 ubiquitin-protein ligase RAD18 chromosome 3 L000001567 3 231500 232963 W 67 2011-02-03 1997-01-28 E3 ubiquitin ligase; forms heterodimer with Rad6p to monoubiquitinate PCNA-K164; heterodimer binds single-stranded DNA and has single-stranded DNA dependent ATPase activity; required for postreplication repair; SUMO-targeted ubiquitin ligase (STUbl) that contains a SUMO-interacting motif (SIM) which stimulates its ubiquitin ligase activity towards the sumoylated form of PCNA -S000033283 CDS YCR066W 3 231500 232963 W 2011-02-03 1997-01-28 -S000000663 ORF Verified YCR067C SED4 chromosome 3 L000001860 3 236322 233125 C 2011-02-03 1997-01-28 Integral ER membrane protein that stimulates Sar1p GTPase activity; involved in COPII vesicle budding through disassociation of coat proteins from membranes onto liposomes; binds Sec16p; SED4 has a paralog, SEC12, that arose from the whole genome duplication -S000033324 CDS YCR067C 3 236322 233125 C 2011-02-03 1997-01-28 -S000000664 ORF Verified YCR068W ATG15 triglyceride lipase ATG15|CVT17|AUT5 chromosome 3 L000004767|L000004751 3 237214 238776 W 2011-02-03 2000-09-13|1997-01-28 Phospholipase; preferentially hydrolyses phosphatidylserine, with minor activity against cardiolipin and phosphatidylethanolamine; required for lysis of autophagic and CVT bodies; targeted to intravacuolar vesicles during autophagy via the multivesicular body (MVB) pathway; required for the maintenance of lipid droplet quantity after the diauxic shift; regulates lipolysis; expression regulated by Yap1p during autophagy -S000034292 CDS YCR068W 3 237214 238776 W 2011-02-03 2000-09-13|1997-01-28 -S000000665 ORF Verified YCR069W CPR4 peptidylprolyl isomerase family protein CPR4|SCC3|YCR070W|CYP4 chromosome 3 L000001804 3 239055 240011 W 2011-02-03 1997-01-28 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; has a potential role in the secretory pathway; CPR4 has a paralog, CPR8, that arose from the whole genome duplication -S000034404 CDS YCR069W 3 239055 240011 W 2011-02-03 1997-01-28 -S000000667 ORF Verified YCR071C IMG2 mitochondrial 54S ribosomal protein IMG2 chromosome 3 L000004446 3 240543 240103 C 2011-02-03 2000-09-13|1997-01-28 Mitochondrial ribosomal protein of the large subunit; conserved in metazoa, with similarity to human mitochondrial ribosomal protein MRPL49 -S000036422 CDS YCR071C 3 240543 240103 C 2011-02-03 2000-09-13|1997-01-28 -S000000668 ORF Verified YCR072C RSA4 chromosome 3 3 242352 240805 C 2011-02-03 2000-09-13|1997-01-28 WD-repeat protein involved in ribosome biogenesis; may interact with ribosomes; required for maturation and efficient intra-nuclear transport or pre-60S ribosomal subunits, localizes to the nucleolus -S000036487 CDS YCR072C 3 242352 240805 C 2011-02-03 2000-09-13|1997-01-28 -S000000669 ORF Verified YCR073C SSK22 mitogen-activated protein kinase kinase kinase SSK22 chromosome 3 L000002827 3 246583 242588 C 2011-02-03 2000-09-13|1997-01-28 MAP kinase kinase kinase of HOG1 mitogen-activated signaling pathway; functionally redundant with Ssk2p; interacts with and is activated by Ssk1p; phosphorylates Pbs2p; SSK22 has a paralog, SSK2, that arose from the whole genome duplication -S000036585 CDS YCR073C 3 246583 242588 C 2011-02-03 2000-09-13|1997-01-28 -S000000718 ORF Verified YCR073W-A SOL2 YCRX13W chromosome 3 L000003116 3 246963 247910 W 2011-02-03 2000-09-13|1997-01-28 Protein with a possible role in tRNA export; shows similarity to 6-phosphogluconolactonase non-catalytic domains but does not exhibit this enzymatic activity; homologous to Sol3p and Sol4p; SOL2 has a paralog, SOL1, that arose from the whole genome duplication -S000032484 CDS YCR073W-A 3 246963 247910 W 2011-02-03 2000-09-13|1997-01-28 -S000000671 ORF Verified YCR075C ERS1 cystinosin-like protein ERS1 chromosome 3 L000000582 3 248815 248033 C 2011-02-03 1997-01-28 Protein involved in cystine transport; localizes to the vacuole, plasma membrane and endosome; similarity to human cystinosin, a H(+)-driven transporter involved in L-cystine export from lysosomes and implicated in the disease cystinosis; contains seven transmembrane domains; mutation is functionally complemented by human CTNS -S000037388 CDS YCR075C 3 248815 248033 C 2011-02-03 1997-01-28 -S000028519 ORF Verified YCR075W-A EGO2 chromosome 3 3 248975 249202 W 2011-02-03 2003-07-29 Component of the EGO and GSE complexes; identified by homology to Ashbya gossypii; YCR075W-A has a paralog, YNR034W-A, that arose from the whole genome duplication -S000030296 CDS YCR075W-A 3 248975 249202 W 2011-02-03 2003-07-29 -S000000672 ORF Verified YCR076C FUB1 chromosome 3 3 250045 249293 C 2011-02-03 1997-01-28 Proteasome-binding protein; interacts physically with multiple subunits of the 20S proteasome and genetically with genes encoding 20S core particle and 19S regulatory particle subunits; exhibits boundary activity which blocks the propagation of heterochromatic silencing; contains a PI31 proteasome regulator domain and sequence similarity with human PSMF1, a proteasome inhibitor; not an essential gene -S000037531 CDS YCR076C 3 250045 249293 C 2011-02-03 1997-01-28 -S000000673 ORF Verified YCR077C PAT1 MRT1 chromosome 3 L000001183|L000003214 3 252628 250238 C 2011-02-03 2000-09-13|1997-01-28|2011-02-03 Deadenylation-dependent mRNA-decapping factor; also required for faithful chromosome transmission, maintenance of rDNA locus stability, and protection of mRNA 3'-UTRs from trimming; associated with topoisomerase II; binds to mRNAs under glucose starvation, most often in the 3' UTR; functionally linked to Pab1p; forms cytoplasmic foci upon DNA replication stress; phosphorylation by PKA inhibits P body foci formation -S000030274 CDS YCR077C 3 252628 250238 C 2011-02-03 2000-09-13|1997-01-28|2011-02-03 -S000002133 ORF Verified YCR079W PTC6 type 2C protein phosphatase PTC6|PPP2|AUP1 chromosome 3 3 252845 254173 W 2011-02-03 2000-09-13|1997-01-28 Mitochondrial type 2C protein phosphatase (PP2C); has similarity to mammalian PP1Ks; involved in mitophagy; null mutant is sensitive to rapamycin and has decreased phosphorylation of the Pda1 subunit of pyruvate dehydrogenase -S000031401 CDS YCR079W 3 252845 254173 W 2011-02-03 2000-09-13|1997-01-28 -S000000677 ORF Verified YCR081W SRB8 MED12|YCR080W|SSN5|NUT6|GIG1 chromosome 3 L000003007 3 254371 258654 W 2011-02-03 2000-09-13|1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; involved in glucose repression -S000031712 CDS YCR081W 3 254371 258654 W 2011-02-03 2000-09-13|1997-01-28 -S000028609 ORF Dubious YCR081C-A chromosome 3 3 258651 258415 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with SRB8/YCR081W; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031422 CDS YCR081C-A 3 258651 258415 C 2011-02-03 2003-07-29 -S000000678 ORF Verified YCR082W AHC2 chromosome 3 3 258883 259269 W 2011-02-03 1997-01-28 Component of the ADA histone acetyltransferase complex; Ahc2p and Ahc1p are unique to the ADA complex and not shared with the related SAGA and SLIK complexes; may tether Ahc1p to the complex -S000031866 CDS YCR082W 3 258883 259269 W 2011-02-03 1997-01-28 -S000000679 ORF Verified YCR083W TRX3 chromosome 3 3 259578 259961 W 2011-02-03 1997-01-28 Mitochondrial thioredoxin; highly conserved oxidoreductase required to maintain the redox homeostasis of the cell, forms the mitochondrial thioredoxin system with Trr2p, redox state is maintained by both Trr2p and Glr1p -S000031961 CDS YCR083W 3 259578 259961 W 2011-02-03 1997-01-28 -S000000680 ORF Verified YCR084C TUP1 chromatin-silencing transcriptional regulator TUP1|UMR7|SFL2|ROX4|FLK1|CYC9|CRT4|AMM1|AER2|AAR1 chromosome 3 L000002391 3 262452 260311 C 77 2011-02-03 1997-01-28 General repressor of transcription; forms complex with Cyc8p, involved in the establishment of repressive chromatin structure through interactions with histones H3 and H4, appears to enhance expression of some genes -S000032798 CDS YCR084C 3 262452 260311 C 2011-02-03 1997-01-28 -S000000681 ORF Uncharacterized YCR085W chromosome 3 3 262916 263269 W 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR085W is not an essential gene -S000032982 CDS YCR085W 3 262916 263269 W 2011-02-03 1997-01-28 -S000000682 ORF Verified YCR086W CSM1 chromosome 3 S000007653 3 263392 263964 W 2011-02-03 1997-01-28 Nucleolar protein that mediates homolog segregation during meiosis I; forms a complex with Lrs4p and then Mam1p at kinetochores; required for condensin recruitment to the replication fork barrier site and rDNA repeat segregation -S000033051 CDS YCR086W 3 263392 263964 W 2011-02-03 1997-01-28 -S000000683 ORF Dubious YCR087W chromosome 3 3 263976 264491 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized gene YCR087C-A; YCR087W is not an essential gene -S000033786 CDS YCR087W 3 263976 264491 W 2011-02-03 1997-01-28 -S000007223 ORF Uncharacterized YCR087C-A LUG1 chromosome 3 3 264467 264006 C 2011-02-03 1999-07-17 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; YCR087C-A is not an essential gene -S000034092 CDS YCR087C-A 3 264467 264006 C 2011-02-03 1999-07-17 -S000000684 ORF Verified YCR088W ABP1 chromosome 3 L000000013 3 265068 266846 W 80 2011-02-03 1997-01-28 Actin-binding protein of the cortical actin cytoskeleton; important for activation of the Arp2/3 complex that plays a key role actin in cytoskeleton organization; inhibits barbed-end actin filament elongation; phosphorylation within its Proline-Rich Regio, mediated by Cdc28p and Pho85p, protects Abp1p from proteolysis mediated by its own PEST sequences; mammalian homolog of HIP-55 (hematopoietic progenitor kinase 1 [HPK1]-interacting protein of 55 kDa) -S000033904 CDS YCR088W 3 265068 266846 W 2011-02-03 1997-01-28 -S000000685 ORF Verified YCR089W FIG2 chromosome 3 L000003312 3 267434 272263 W 2011-02-03 2000-09-13|1997-01-28 Cell wall adhesin, expressed specifically during mating; may be involved in maintenance of cell wall integrity during mating; FIG2 has a paralog, AGA1, that arose from the whole genome duplication -S000034060 CDS YCR089W 3 267434 272263 W 2011-02-03 2000-09-13|1997-01-28 -S000028491 ARS ARS316 ARS316 ARSIII-273 chromosome 3 3 272852 273095 2011-02-03 2003-03-31|2006-09-06 Inefficient autonomously replicating sequence; active in ~25% of cell cycles -S000178058 ARS_consensus_sequence ARS316 3 273024 273008 C 2014-11-18 2014-11-18 -S000000686 ORF Uncharacterized YCR090C chromosome 3 3 272863 272315 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YCR090C is not an essential gene -S000036138 CDS YCR090C 3 272863 272315 C 2011-02-03 1997-01-28 -S000000687 ORF Verified YCR091W KIN82 putative serine/threonine protein kinase KIN82|FPK2 chromosome 3 L000000906 3 274404 276566 W 2011-02-03 2000-09-13|1997-01-28|2011-02-03 Putative serine/threonine protein kinase; implicated in the regulation of phospholipid asymmetry through the activation of phospholipid translocases (flippases); involved in the phosphorylation of upstream inhibitory kinase Ypk1p along with Fpk1p; has a redundant role in the cellular response to mating pheromone; KIN82 has a paralog, FPK1, that arose from the whole genome duplication -S000036298 CDS YCR091W 3 274404 276566 W 2011-02-03 2000-09-13|1997-01-28|2011-02-03 -S000000688 ORF Verified YCR092C MSH3 mismatch repair protein MSH3 chromosome 3 L000001191 3 279820 276764 C 2011-02-03 2007-09-06|1997-01-28 Mismatch repair protein; forms dimers with Msh2p that mediate repair of insertion or deletion mutations and removal of nonhomologous DNA ends, contains a PCNA (Pol30p) binding motif required for genome stability -S000036361 CDS YCR092C 3 279820 276764 C 2011-02-03 1997-01-28|2007-09-06 -S000000689 ORF Verified YCR093W CDC39 CCR4-NOT core subunit CDC39|SMD6|ROS1|NOT1 chromosome 3 L000000274 3 280117 286443 W 91 2011-02-03 2000-09-13|1997-01-28 Subunit of the CCR4-NOT1 core complex; this complex has multiple roles in the regulation of mRNA levels including regulation of transcription and destabilization of mRNA by deadenylation; basal transcription factor that increases initiation and elongation; activates the ATPase activity of Dhh1p, resulting in processing body disassembly -S000037049 CDS YCR093W 3 280117 286443 W 2011-02-03 2000-09-13|1997-01-28 -S000000690 ORF Verified YCR094W CDC50 aminophospholipid translocase regulatory protein CDC50 chromosome 3 L000004326 3 286762 287937 W 2011-02-03 1997-01-28 Endosomal protein that interacts with phospholipid flippase Drs2p; interaction with Cdc50p is essential for Drs2p catalytic activity; mutations affect cell polarity and polarized growth; similar to Lem3p; CDC50 has a paralog, YNR048W, that arose from the whole genome duplication -S000037156 CDS YCR094W 3 286762 287937 W 2011-02-03 1997-01-28 -S000000691 ORF Uncharacterized YCR095C OCA4 chromosome 3 3 289258 288170 C 2011-02-03 1997-01-28 Cytoplasmic protein required for replication of Brome mosaic virus; S. cerevisiae is a model system for studying replication of positive-strand RNA viruses in their natural hosts -S000037199 CDS YCR095C 3 289258 288170 C 2011-02-03 1997-01-28 -S000029724 ORF Uncharacterized YCR095W-A chromosome 3 3 289639 289797 W 2011-02-03 2004-08-27 Putative protein of unknown function -S000036860 CDS YCR095W-A 3 289639 289797 W 2011-02-03 2004-08-27 -S000006839 long_terminal_repeat YCRWdelta12 chromosome 3 3 291373 291712 W 2011-02-03 2000-05-19 Ty1 LTR -S000006841 long_terminal_repeat YCRWomega3 chromosome 3 3 291922 292167 W 2011-02-03 2000-05-19 Ty5 LTR -S000029655 silent_mating_type_cassette_array silenced_gene HMR HMR chromosome 3 L000000792 3 292388 295034 W 94 2011-02-03 2007-12-10 Mating-type cassette - right; unexpressed complete copy of the mating-type genes, silenced by the Sir2 histone deacetylase and its associated SIR1, SIR3 and SIR4 proteins; mating-type switching involves replacement of the Ya or Yalpha sequences present at the MAT locus with either the a or alpha genes located at one of the HM loci in a process stimulated by the HO endonuclease; sequence replacement occurs by gene conversion, leaving the donor unaltered -S000124952 X_region HMR 3 293032 293736 W 2011-02-03 2007-12-10 -S000124953 Y_region HMR 3 293737 294378 W 2011-02-03 2007-12-10 -S000124954 Z1_region HMR 3 294379 294617 W 2011-02-03 2007-12-10 -S000028492 ARS ARS317 ARS317 HMR-E ARS chromosome 3 3 292638 292694 2014-11-18 2003-03-31|2014-11-18 ARS that fires extremely inefficiently and late during S phase; fires late and inefficiently compared to other origins in the genome; active in only a small fraction of cell cycles -S000121225 ARS_consensus_sequence ARS317 3 292684 292674 C 2011-02-03 2007-03-06 -S000000692 ORF Verified|silenced_gene YCR096C HMRA2 homeodomain mating type protein a2|A2 chromosome 3 3 293538 293179 C 2011-02-03 1997-01-28 Silenced copy of a2 at HMR; similarity to Alpha2p; required along with a1p for inhibiting expression of the HO endonuclease in a/alpha HO/HO diploid cells with an active mating-type interconversion system -S000037309 CDS YCR096C 3 293538 293179 C 2011-02-03 1997-01-28 -S000000694 ORF Verified|silenced_gene YCR097W HMRA1 YCR097WB chromosome 3 S000007657 3 293835 294321 W 2011-02-03 1997-01-28 Silenced copy of a1 at HMR; homeobox corepressor that interacts with Alpha2p to repress haploid-specific gene transcription in diploid cells -S000030021 CDS YCR097W 3 293835 293939 W 2011-02-03 1997-01-28 -S000030022 CDS YCR097W 3 293994 294239 W 2011-02-03 1997-01-28 -S000030023 CDS YCR097W 3 294292 294321 W 2011-02-03 1997-01-28 -S000030024 intron YCR097W 3 293940 293993 W 2011-02-03 1997-01-28 -S000030025 intron YCR097W 3 294240 294291 W 2011-02-03 1997-01-28 -S000007632 ORF Dubious YCR097W-A chromosome 3 3 294439 294705 W 2011-02-03 2000-07-12 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by homology to a hemiascomycetous yeast protein -S000036353 CDS YCR097W-A 3 294439 294705 W 2011-02-03 2000-07-12 -S000028493 ARS ARS318 ARS318 HMR-I ARS chromosome 3 3 294820 294901 2014-11-18 2003-03-31|2014-11-18 ARS that becomes active if the nearby ARS317/HMR-E silencer is deleted; active in only a small fraction of cell cycles -S000030213 ARS_consensus_sequence ARS318 3 294824 294834 W 2011-02-03 2003-03-31|2009-02-19 -S000006840 long_terminal_repeat YCRWdelta13 chromosome 3 3 295003 295330 W 2011-02-03 2000-05-19 Ty1 LTR -S000006738 tRNA_gene tT(AGU)C chromosome 3 L000003755 3 295484 295556 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000032149 noncoding_exon tT(AGU)C 3 295484 295556 W 2011-02-03 2000-05-19 -S000006834 long_terminal_repeat YCRCdelta14 chromosome 3 3 296190 295958 C 2011-02-03 2000-05-19|2007-04-02 Ty1 LTR -S000000695 ORF Verified YCR098C GIT1 chromosome 3 L000003211 3 298605 297049 C 2011-02-03 1997-01-28 Plasma membrane permease; mediates uptake of glycerophosphoinositol and glycerophosphocholine as sources of the nutrients inositol and phosphate; expression and transport rate are regulated by phosphate and inositol availability -S000030063 CDS YCR098C 3 298605 297049 C 2011-02-03 1997-01-28 -S000000696 ORF Uncharacterized YCR099C chromosome 3 3 301299 300832 C 2011-02-03 1997-01-28 Putative protein of unknown function -S000031088 CDS YCR099C 3 301299 300832 C 2011-02-03 1997-01-28 -S000000697 ORF Uncharacterized YCR100C chromosome 3 3 302221 301271 C 2011-02-03 1997-01-28 Putative protein of unknown function -S000036663 CDS YCR100C 3 302221 301271 C 2011-02-03 1997-01-28 -S000000698 ORF Uncharacterized YCR101C chromosome 3 3 303030 302482 C 2011-02-03 1997-01-28 Putative protein of unknown function; localizes to the membrane fraction; YCR101C is not an essential gene -S000036721 CDS YCR101C 3 303030 302482 C 2011-02-03 1997-01-28 -S000000699 ORF Uncharacterized YCR102C chromosome 3 3 305467 304361 C 2011-02-03 1997-01-28 Putative protein of unknown function; involved in copper metabolism; similar to C. carbonum toxD gene; member of the quinone oxidoreductase family -S000036781 CDS YCR102C 3 305467 304361 C 2011-02-03 1997-01-28 -S000007231 ORF Dubious YCR102W-A chromosome 3 3 306735 306932 W 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037829 CDS YCR102W-A 3 306735 306932 W 2011-02-03 1999-07-17 -S000000701 ORF Verified YCR104W PAU3 seripauperin PAU3 chromosome 3 L000002739 3 307801 308175 W 2011-02-03 1997-01-28 Member of the seripauperin multigene family; encoded mainly in subtelomeric region; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme -S000037613 CDS YCR104W 3 307801 308175 W 2011-02-03 1997-01-28 -S000000702 ORF Verified YCR105W ADH7 NADP-dependent alcohol dehydrogenase|ADHVII chromosome 3 3 309070 310155 W 2011-02-03 1997-01-28 NADPH-dependent medium chain alcohol dehydrogenase; has broad substrate specificity; member of the cinnamyl family of alcohol dehydrogenases; may be involved in fusel alcohol synthesis or in aldehyde tolerance -S000037676 CDS YCR105W 3 309070 310155 W 2011-02-03 1997-01-28 -S000000703 ORF Verified YCR106W RDS1 chromosome 3 3 310958 313456 W 2011-02-03 1997-01-28 Putative zinc cluster transcription factor; involved in conferring resistance to cycloheximide -S000037733 CDS YCR106W 3 310958 313456 W 2011-02-03 1997-01-28 -S000000704 ORF Verified YCR107W AAD3 putative aryl-alcohol dehydrogenase chromosome 3 L000004636 3 313890 314981 W 2011-02-03 2000-09-13|1997-01-28 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; AAD3 has a paralog, AAD15, that arose from a segmental duplication; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family -S000037782 CDS YCR107W 3 313890 314981 W 2011-02-03 2000-09-13|1997-01-28 -S000028944 telomere TEL03R chromosome 3 3 315783 316620 W 102 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome III; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028945 telomeric_repeat TEL03R 3 316522 316620 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome III -S000028946 X_element TEL03R 3 315783 316239 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome III; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YCR108C -S000028947 X_element_combinatorial_repeat TEL03R 3 316240 316521 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr III; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000028494 ARS ARS319 ARS319 chromosome 3 3 315807 315879 2014-11-18 2003-03-31|2014-11-18 Highly-active subtelomeric autonomously replicating sequence; initiates replication in ~90% of cell cycles -S000030215 ARS_consensus_sequence ARS319 3 315821 315831 W 2011-02-03 2003-03-31 -S000028536 ORF Uncharacterized YCR108C chromosome 3 3 316188 315997 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031145 CDS YCR108C 3 316188 315997 C 2011-02-03 2003-07-29 -S000121226 ARS ARS400 ARSIV-1 chromosome 4 4 137 1392 2007-03-06 2007-03-06 Autonomously Replicating Sequence -S000178059 ARS_consensus_sequence ARS400 4 869 853 C 2014-11-18 2014-11-18 -S000028875 telomere TEL04L chromosome 4 4 904 1 C -153 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome IV; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats -S000028876 telomeric_repeat TEL04L 4 154 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome IV -S000028877 X_element TEL04L 4 904 435 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome IV; spans 469 bp and contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028878 X_element_combinatorial_repeat TEL04L 4 434 155 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr IV; spans 279 bp and contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000002407 ORF Verified YDL248W COS7 chromosome 4 L000004065 4 1802 2953 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000036145 CDS YDL248W 4 1802 2953 W 1996-07-31 1996-07-31 -S000007602 ORF Dubious YDL247W-A chromosome 4 4 3762 3836 W 2001-02-26 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by sequence comparison with hemiascomycetous yeast species -S000037148 CDS YDL247W-A 4 3762 3836 W 2001-02-26 2001-02-26 -S000002406 ORF Verified YDL247W MPH2 alpha-glucoside permease chromosome 4 4 5985 7814 W 1996-07-31 1996-07-31 Alpha-glucoside permease; transports maltose, maltotriose, alpha-methylglucoside, and turanose; almost identical to Mph3p; encoded in a subtelomeric position in a region likely to have undergone duplication -S000035265 CDS YDL247W 4 5985 7814 W 1996-07-31 1996-07-31 -S000002405 ORF Verified YDL246C SOR2 L-iditol 2-dehydrogenase SOR2 chromosome 4 4 9756 8683 C 1996-07-31 1996-07-31 Sorbitol dehydrogenase; protein sequence is 99% identical to the Sor1p sorbitol dehydrogenase -S000035109 CDS YDL246C 4 9756 8683 C 1996-07-31 1996-07-31 -S000002404 ORF Verified YDL245C HXT15 HLT2|hexose transporter HXT15 chromosome 4 L000002986 4 13360 11657 C 1996-07-31 1996-07-31 Putative transmembrane polyol transporter; supports growth on and uptake of mannitol, sorbitol and xylitol with moderate affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; similarity to hexose transporters; expression is induced by low levels of glucose and repressed by high levels of glucose -S000035017 CDS YDL245C 4 13360 11657 C 1996-07-31 1996-07-31 -S000118427 ARS ARS403 ARSIV-16 chromosome 4 4 15493 15739 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178060 ARS_consensus_sequence ARS403 4 15682 15666 C 2014-11-18 2014-11-18 -S000002403 ORF Verified YDL244W THI13 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 4 S000007414 4 16204 17226 W 1996-07-31 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP -S000034919 CDS YDL244W 4 16204 17226 W 1996-07-31 1996-07-31 -S000002402 ORF Verified YDL243C AAD4 putative aryl-alcohol dehydrogenase chromosome 4 L000004637 4 18566 17577 C 1996-07-31 1996-07-31 Putative aryl-alcohol dehydrogenase; involved in oxidative stress response; similar to P. chrysosporium aryl-alcohol dehydrogenase; expression induced in cells treated with the mycotoxin patulin; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family -S000032895 CDS YDL243C 4 18566 17577 C 1996-07-31 1996-07-31 -S000002401 ORF Dubious YDL242W chromosome 4 4 18959 19312 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032853 CDS YDL242W 4 18959 19312 W 1996-07-31 1996-07-31 -S000002400 ORF Uncharacterized YDL241W chromosome 4 4 20635 21006 W 1996-07-31 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YDL241W is not an essential gene -S000032761 CDS YDL241W 4 20635 21006 W 1996-07-31 1996-07-31 -S000007601 ORF Dubious YDL240C-A chromosome 4 4 22608 22471 C 2001-02-26 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by sequence comparison with hemiascomycetous yeast species -S000037147 CDS YDL240C-A 4 22608 22471 C 2001-02-26 2001-02-26 -S000002399 ORF Verified YDL240W LRG1 chromosome 4 L000000953 4 22823 25876 W 1996-07-31 1996-07-31|2011-02-03 GTPase-activating protein (GAP); contains Rho1p-specific GAP activity, interacting with activated forms of Rho1p; functions along with Sac7p as a negative regulator of the Pkc1p-mediated cell wall integrity signaling pathway; negative regulator of cell wall 1,3-beta-glucan biosynthesis; required for efficient cell fusion; contains a RhoGAP domain and three Lin-11-Isl1-Mec-3 (LIM) domains -S000032681 CDS YDL240W 4 22823 25876 W 1996-07-31 1996-07-31|2011-02-03 -S000002398 ORF Verified YDL239C ADY3 chromosome 4 4 28775 26403 C 1996-07-31 1996-07-31|2011-02-03 Protein required for spore wall formation; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane during meiosis II; mediates assembly of the LEP complex, formation of the ring-like structure via interaction with spindle pole body components and prospore membrane maturation; potentially phosphorylated by Cdc28p; ADY3 has a paralog, CNM67, that arose from the whole -S000032048 CDS YDL239C 4 28775 26403 C 1996-07-31 1996-07-31|2011-02-03 -S000002397 ORF Verified YDL238C GUD1 guanine deaminase chromosome 4 4 30454 28985 C 1996-07-31 1996-07-31 Guanine deaminase; a catabolic enzyme of the guanine salvage pathway producing xanthine and ammonia from guanine; activity is low in exponentially-growing cultures but expression is increased in post-diauxic and stationary-phase cultures -S000031892 CDS YDL238C 4 30454 28985 C 1996-07-31 1996-07-31 -S000002396 ORF Verified YDL237W AIM6 LRC1 chromosome 4 4 30657 31829 W 1996-07-31 1996-07-31|2011-02-03 Protein of unknown function; required for respiratory growth; YDL237W is not an essential gene -S000031783 CDS YDL237W 4 30657 31829 W 1996-07-31 1996-07-31|2011-02-03 -S000002395 ORF Verified YDL236W PHO13 4-nitrophenylphosphatase chromosome 4 L000001425 4 32296 33234 W 1996-07-31 1996-07-31 Conserved phosphatase acting as a metabolite repair enzyme; shows specific dephosphorylating activity on two side-products of central carbohydrate metabolism, 2-phosphoglycolate and 4-phosphoerythronate; alkaline phosphatase specific for p-nitrophenyl phosphate; also has protein phosphatase activity; human ortholog PGP shows similar substrate specificity, deletion causes similar metabolite accumulation phenotypes, suggesting conserved role in eliminating glycolytic byproducts -S000030827 CDS YDL236W 4 32296 33234 W 1996-07-31 1996-07-31 -S000002394 ORF Verified YDL235C YPD1 chromosome 4 L000003285 4 33918 33415 C 1996-07-31 1996-07-31 Osmotic stress-responsive phosphorelay intermediate sensor protein; phosphorylated by the plasma membrane sensor Sln1p in response to osmotic stress and then in turn phosphorylates the response regulators Ssk1p in the cytosol and Skn7p in the nucleus -S000030691 CDS YDL235C 4 33918 33415 C 1996-07-31 1996-07-31 -S000002393 ORF Verified YDL234C GYP7 chromosome 4 L000003067 4 36477 34237 C 2011-02-03 1996-07-31 GTPase-activating protein for yeast Rab family members; members include Ypt7p (most effective), Ypt1p, Ypt31p, and Ypt32p (in vitro); involved in vesicle mediated protein trafficking; contains a PH-like domain -S000036775 CDS YDL234C 4 36477 34237 C 2011-02-03 1996-07-31 -S000002392 ORF Uncharacterized YDL233W MFG1 chromosome 4 4 36797 38173 W 2011-02-03 1996-07-31 Regulator of filamentous growth; interacts with FLO11 promoter and regulates FLO11 expression; binds to transcription factors Flo8p and Mss11p; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; YDL233W is not an essential gene -S000036757 CDS YDL233W 4 36797 38173 W 2011-02-03 1996-07-31 -S000002391 ORF Verified YDL232W OST4 olichyl-diphosphooligosaccharide--protein glycotransferase OST4 chromosome 4 L000003180 4 38487 38597 W 2011-02-03 1996-07-31 Subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes protein asparagine-linked glycosylation; type I membrane protein required for incorporation of Ost3p or Ost6p into the OST complex -S000036662 CDS YDL232W 4 38487 38597 W 2011-02-03 1996-07-31 -S000002390 ORF Verified YDL231C BRE4 chromosome 4 4 42244 38867 C 2011-02-03 1996-07-31 Zinc finger protein containing five transmembrane domains; null mutant exhibits strongly fragmented vacuoles and sensitivity to brefeldin A, a drug which is known to affect intracellular transport -S000036514 CDS YDL231C 4 42244 38867 C 2011-02-03 1996-07-31 -S000002389 ORF Verified YDL230W PTP1 tyrosine protein phosphatase PTP1 chromosome 4 L000001525 4 42700 43707 W 2011-02-03 1996-07-31 Phosphotyrosine-specific protein phosphatase; dephosphorylates a broad range of substrates in vivo, including Fpr3p; localized to the cytoplasm and the mitochondria; proposed to be a negative regulator of filamentation -S000036498 CDS YDL230W 4 42700 43707 W 2011-02-03 1996-07-31 -S000002388 ORF Verified YDL229W SSB1 Hsp70 family ATPase SSB1|YG101 chromosome 4 L000002073|L000002508 4 44065 45906 W -129 2011-02-03 1996-07-31 Cytoplasmic ATPase that is a ribosome-associated molecular chaperone; functions with J-protein partner Zuo1p; may be involved in folding of newly-made polypeptide chains; member of the HSP70 family; interacts with phosphatase subunit Reg1p; SSB1 has a paralog, SSB2, that arose from the whole genome duplication -S000035996 CDS YDL229W 4 44065 45906 W 2011-02-03 1996-07-31 -S000002387 ORF Dubious YDL228C chromosome 4 4 45918 45277 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene SSB1 -S000035797 CDS YDL228C 4 45918 45277 C 2011-02-03 1996-07-31 -S000114787 ARS ARS404 ARS404 HO ARS chromosome 4 4 46185 46237 2014-11-18 2014-11-18|2006-04-10 Autonomously Replicating Sequence -S000121227 ARS_consensus_sequence ARS404 4 46230 46214 C 2014-11-18 2014-11-18|2007-03-06 -S000002386 ORF Verified YDL227C HO chromosome 4 L000000796 4 48031 46271 C -130 2011-02-03 1996-07-31 Site-specific endonuclease; required for gene conversion at the MAT locus (homothallic switching) through the generation of a ds DNA break; expression restricted to mother cells in late G1 as controlled by Swi4p-Swi6p, Swi5p, and Ash1p -S000035713 CDS YDL227C 4 48031 46271 C 2011-02-03 1996-07-31 -S000002385 ORF Verified YDL226C GCS1 chromosome 4 L000000693 4 52173 51115 C 2011-02-03 1996-07-31 ADP-ribosylation factor GTPase activating protein (ARF GAP); involved in ER-Golgi transport; required for prospore membrane formation; regulates phospholipase Spo14p; shares functional similarity with Glo3p; GCS1 has a paralog, SPS18, that arose from the whole genome duplication -S000035648 CDS YDL226C 4 52173 51115 C 2011-02-03 1996-07-31 -S000002384 ORF Verified YDL225W SHS1 septin SHS1|SEP7 chromosome 4 4 52445 54100 W 2011-02-03 1996-07-31 Component of the septin ring that is required for cytokinesis; present at the ends of rod-like septin hetero-oligomers; C-terminal extension is important for recruitment of Bni5p to the mother-bud neck, which in turn is required for Myo1p recruitment and cytokinesis; undergoes sumoylation and phosphorylation during mitosis; protein abundance increases in response to DNA replication stress -S000035638 CDS YDL225W 4 52445 54100 W 2011-02-03 1996-07-31 -S000002383 ORF Verified YDL224C WHI4 chromosome 4 L000004493 4 56346 54397 C 2011-02-03 1996-07-31 Putative RNA binding protein; regulates the cell size requirement for passage through Start and commitment to cell division; WHI4 has a paralog, WHI3, that arose from the whole genome duplication -S000034657 CDS YDL224C 4 56346 54397 C 2011-02-03 1996-07-31 -S000002382 ORF Verified YDL223C HBT1 chromosome 4 S000007655 4 60405 57265 C 2011-02-03 1996-07-31 Shmoo tip protein, substrate of Hub1p ubiquitin-like protein; mutants are defective for mating projection formation, thereby implicating Hbt1p in polarized cell morphogenesis; HBT1 has a paralog, YNL195C, that arose from the whole genome duplication -S000034598 CDS YDL223C 4 60405 57265 C 2011-02-03 1996-07-31 -S000002381 ORF Verified YDL222C FMP45 chromosome 4 4 61801 60872 C 2011-02-03 1996-07-31 Integral membrane protein localized to mitochondria; required for sporulation and maintaining sphingolipid content; similar to SUR7; FMP45 has a paralog, YNL194C, that arose from the whole genome duplication -S000034458 CDS YDL222C 4 61801 60872 C 2011-02-03 1996-07-31 -S000002380 ORF Dubious YDL221W chromosome 4 4 62011 62562 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the 3' end of essential gene CDC13 -S000034428 CDS YDL221W 4 62011 62562 W 2011-02-03 1996-07-31 -S000002379 ORF Verified YDL220C CDC13 telomere-binding protein CDC13|EST4 chromosome 4 L000000253 4 65018 62244 C -122 2011-02-03 1996-07-31 Single stranded DNA-binding protein found at TG1-3 telomere G-tails; key roles in regulation of telomerase, telomere end protection, conventional telomere replication; regulates telomere replication through recruitment of specific sub-complexes, essential function is telomere capping; forms homodimer via N-terminus; disruption of dimerization leads to short telomeres; autophagy and proteasome are involved in Cdc13p degradation; differentially phosphorylated through cell cycle -S000032343 CDS YDL220C 4 65018 62244 C 2011-02-03 1996-07-31 -S000002378 ORF Verified YDL219W DTD1 D-tyrosyl-tRNA(Tyr) deacylase chromosome 4 4 65242 65765 W 2011-02-03 1996-07-31 D-Tyr-tRNA(Tyr) deacylase; functions in protein translation, may affect nonsense suppression via alteration of the protein synthesis machinery; ubiquitous among eukaryotes -S000032532 CDS YDL219W 4 65242 65306 W 2011-02-03 1996-07-31 -S000032533 CDS YDL219W 4 65378 65765 W 2011-02-03 1996-07-31 -S000032534 intron YDL219W 4 65307 65377 W 2011-02-03 1996-07-31 -S000002377 ORF Uncharacterized YDL218W chromosome 4 4 66493 67446 W 2011-02-03 1996-07-31 Putative protein of unknown function; YDL218W transcription is regulated by Azf1p and induced by starvation and aerobic conditions; expression also induced in cells treated with the mycotoxin patulin -S000031549 CDS YDL218W 4 66493 67446 W 2011-02-03 1996-07-31 -S000002376 ORF Verified YDL217C TIM22 translocation channel protein TIM22 chromosome 4 L000004157 4 68606 67983 C 2011-02-03 1996-07-31 Essential core component of the mitochondrial TIM22 complex; involved in insertion of polytopic proteins into the inner membrane; forms the channel through which proteins are imported -S000031465 CDS YDL217C 4 68606 67983 C 2011-02-03 1996-07-31 -S000002375 ORF Verified YDL216C RRI1 COP9 signalosome catalytic subunit RRI1|JAB1|CSN5 chromosome 4 S000007574 4 70319 68997 C 2011-02-03 1996-07-31|2006-04-13 Catalytic subunit of the COP9 signalosome (CSN) complex; acts as an isopeptidase in cleaving the ubiquitin-like protein Nedd8 from SCF ubiquitin ligases; metalloendopeptidase involved in the adaptation to pheromone signaling; involved in modulation of genes controlling amino acid and lipid metabolism, and ergosterol biosynthesis -S000031346 CDS YDL216C 4 70319 68997 C 2011-02-03 1996-07-31|2006-04-13 -S000002374 ORF Verified YDL215C GDH2 glutamate dehydrogenase (NAD(+))|GDHB|GDH-B chromosome 4 L000000697 4 73918 70640 C 2011-02-03 1996-07-31 NAD(+)-dependent glutamate dehydrogenase; degrades glutamate to ammonia and alpha-ketoglutarate; expression sensitive to nitrogen catabolite repression and intracellular ammonia levels; genetically interacts with GDH3 by suppressing stress-induced apoptosis -S000031302 CDS YDL215C 4 73918 70640 C 2011-02-03 1996-07-31 -S000002373 ORF Verified YDL214C PRR2 serine/threonine protein kinase PRR2 chromosome 4 4 76545 74446 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; inhibits pheromone induced signalling downstream of MAPK, possibly at the level of the Ste12p transcription factor; mutant has increased aneuploidy tolerance; PRR2 has a paralog, NPR1, that arose from the whole genome duplication -S000030339 CDS YDL214C 4 76545 74446 C 2011-02-03 1996-07-31 -S000002372 ORF Verified YDL213C NOP6 chromosome 4 4 77966 77289 C 2011-02-03 1996-07-31 rRNA-binding protein required for 40S ribosomal subunit biogenesis; contains an RNA recognition motif (RRM); hydrophilin essential to overcome the stress of the desiccation-rehydration process; NOP6 may be a fungal-specific gene as no homologs have been yet identified in higher eukaryotes -S000030227 CDS YDL213C 4 77966 77289 C 2011-02-03 1996-07-31 -S000002371 ORF Verified YDL212W SHR3 APF1 chromosome 4 L000001885 4 78426 79058 W 2011-02-03 1996-07-31 Endoplasmic reticulum packaging chaperone; required for incorporation of amino acid permeases into COPII coated vesicles for transport to the cell surface -S000030170 CDS YDL212W 4 78426 79058 W 2011-02-03 1996-07-31 -S000002370 ORF Uncharacterized YDL211C chromosome 4 4 80412 79294 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; YDL211C has a paralog, TDA7, that arose from the whole genome duplication -S000036399 CDS YDL211C 4 80412 79294 C 2011-02-03 1996-07-31 -S000006576 tRNA_gene tG(GCC)D1 chromosome 4 L000003761 4 83548 83618 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000031690 noncoding_exon tG(GCC)D1 4 83548 83618 W 2011-02-03 2000-05-19 -S000002369 ORF Verified YDL210W UGA4 chromosome 4 L000002424 4 84270 85985 W 2011-02-03 1996-07-31 GABA (gamma-aminobutyrate) permease; serves as a GABA transport protein involved in the utilization of GABA as a nitrogen source; catalyzes the transport of putrescine and delta-aminolevulinic acid (ALA); localized to the vacuolar membrane -S000036357 CDS YDL210W 4 84270 85985 W 2011-02-03 1996-07-31 -S000118428 ARS ARS405 ARSIV-86 chromosome 4 4 85945 86176 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178061 ARS_consensus_sequence ARS405 4 86125 86109 C 2014-11-18 2014-11-18 -S000002368 ORF Verified YDL209C CWC2 NTC40 chromosome 4 4 87226 86207 C 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; binds directly to U6 snRNA; similar to S. pombe Cwf2 -S000036574 CDS YDL209C 4 87226 86207 C 2011-02-03 1996-07-31 -S000002367 ORF Verified YDL208W NHP2 snoRNA-binding protein NHP2 chromosome 4 L000001243 4 87512 87982 W 2011-02-03 1996-07-31|2005-11-22 Protein related to mammalian high mobility group (HMG) proteins; nuclear protein; essential for function of H/ACA-type snoRNPs, which are involved in 18S rRNA processing -S000036516 CDS YDL208W 4 87512 87982 W 2011-02-03 1996-07-31|2005-11-22 -S000002366 ORF Verified YDL207W GLE1 nucleoporin GLE1|NLE2|BRR3|RSS1 chromosome 4 L000003399|L000001255|S000029324 4 88248 89864 W 2011-02-03 1996-07-31 Cytoplasmic nucleoporin required for polyadenylated mRNA export; contains a nuclear export signal; when bound to inositol hexakisphosphate (IP6), functions as an activator for the Dbp5p ATPase activity at the nuclear pore complex during mRNA export; mediates translation initiation; required for efficient translation termination -S000036457 CDS YDL207W 4 88248 89864 W 2011-02-03 1996-07-31 -S000002365 ORF Uncharacterized YDL206W chromosome 4 4 90176 92464 W 2011-02-03 1996-07-31 Putative protein of unknown function; YDL206W is not an essential protein -S000035556 CDS YDL206W 4 90176 92464 W 2011-02-03 1996-07-31 -S000002364 ORF Verified YDL205C HEM3 hydroxymethylbilane synthase|OLE2 chromosome 4 L000000762 4 93745 92762 C 2011-02-03 1996-07-31 Porphobilinogen deaminase; catalyzes the conversion of 4-porphobilinogen to hydroxymethylbilane, the third step in heme biosynthesis; localizes to the cytoplasm and nucleus; expression is regulated by Hap2p-Hap3p, but not by levels of heme; human homolog HMBS can complement yeast mutant and allow growth of haploid null after sporulation of a heterozygous diploid -S000035448 CDS YDL205C 4 93745 92762 C 2011-02-03 1996-07-31 -S000002363 ORF Verified YDL204W RTN2 chromosome 4 4 94605 95786 W 2011-02-03 1996-07-31 Reticulon protein; involved in nuclear pore assembly and maintenance of tubular ER morphology; promotes membrane curvature; regulates the ER asymmetry-induced inheritance block during ER stress; role in ER-derived peroxisomal biogenesis; interacts with Sec6p, Yip3p, and Sbh1p; less abundant than RTN1; member of RTNLA (reticulon-like A) subfamily; protein increases in abundance and relocalizes to plasma membrane upon DNA replication stress -S000035441 CDS YDL204W 4 94605 95786 W 2011-02-03 1996-07-31 -S000002362 ORF Verified YDL203C ACK1 chromosome 4 4 97953 96082 C 2011-02-03 1996-07-31 Protein that functions in the cell wall integrity pathway; functions upstream of Pkc1p; GFP-fusion protein expression is induced in response to the DNA-damaging agent MMS; non-tagged Ack1p is detected in purified mitochondria -S000035331 CDS YDL203C 4 97953 96082 C 2011-02-03 1996-07-31 -S000002361 ORF Verified YDL202W MRPL11 mitochondrial 54S ribosomal protein YmL11|YmL11 chromosome 4 L000002686 4 98475 99224 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; localizes to vacuole in response to H2O2 -S000035301 CDS YDL202W 4 98475 99224 W 2011-02-03 1996-07-31 -S000002360 ORF Verified YDL201W TRM8 tRNA (guanine46-N7)-methyltransferase chromosome 4 4 99561 100421 W 2011-02-03 1996-07-31 Noncatalytic subunit of a tRNA methyltransferase complex; Trm8p and Trm82p comprise an enzyme that catalyzes a methyl-transfer from S-adenosyl-l-methionine to the N(7) atom of guanine at position 46 in tRNA; Trm8 lacks catalytic activity if not bound to Trm82p -S000034332 CDS YDL201W 4 99561 100421 W 2011-02-03 1996-07-31 -S000002359 ORF Verified YDL200C MGT1 methylated-DNA--protein-cysteine methyltransferase|MGMT chromosome 4 L000001106 4 101067 100501 C 2011-02-03 1996-07-31|2006-04-13 DNA repair methyltransferase (6-O-methylguanine-DNA methylase); involved in protection against DNA alkylation damage -S000034219 CDS YDL200C 4 101067 100501 C 2011-02-03 1996-07-31|2006-04-13 -S000002358 ORF Uncharacterized YDL199C chromosome 4 4 103353 101290 C 2011-02-03 1996-07-31 Putative transporter; member of the sugar porter family -S000035760 CDS YDL199C 4 103353 101290 C 2011-02-03 1996-07-31 -S000002357 ORF Verified YDL198C GGC1 SHM1|YHM1 chromosome 4 L000001881 4 104551 103649 C 2011-02-03 1996-07-31 Mitochondrial GTP/GDP transporter; essential for mitochondrial genome maintenance; has a role in mitochondrial iron transport; member of the mitochondrial carrier family -S000035649 CDS YDL198C 4 104551 103649 C 2011-02-03 1996-07-31 -S000002356 ORF Verified YDL197C ASF2 chromosome 4 L000000127 4 106494 104917 C -109.03 2011-02-03 1996-07-31 Anti-silencing protein; causes derepression of silent loci when overexpressed -S000034644 CDS YDL197C 4 106494 104917 C 2011-02-03 1996-07-31 -S000002355 ORF Dubious YDL196W chromosome 4 4 106741 107070 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame is located in promoter region of essential gene SEC31 -S000034607 CDS YDL196W 4 106741 107070 W 2011-02-03 1996-07-31 -S000002354 ORF Verified YDL195W SEC31 WEB1 chromosome 4 L000002484 4 107208 111029 W 2011-02-03 1996-07-31|2011-02-03 Component of the Sec13p-Sec31p complex of the COPII vesicle coat; COPII coat is required for vesicle formation in ER to Golgi transport; mutant has increased aneuploidy tolerance -S000034506 CDS YDL195W 4 107208 111029 W 2011-02-03 1996-07-31|2011-02-03 -S000002353 ORF Verified YDL194W SNF3 glucose sensor chromosome 4 L000001946 4 111580 114234 W -104 2011-02-03 1996-07-31 Plasma membrane low glucose sensor, regulates glucose transport; high affinity sensor that contains 12 predicted transmembrane segments and a long C-terminal tail required for induction of hexose transporters; also senses fructose and mannose; SNF3 has a paralog, RGT2, that arose from the whole genome duplication -S000033579 CDS YDL194W 4 111580 114234 W 2011-02-03 1996-07-31 -S000002352 ORF Verified YDL193W NUS1 ditrans,polycis-polyprenyl diphosphate synthase chromosome 4 4 114672 115799 W 2011-02-03 1996-07-31 Forms dehydrodolichyl diphosphate syntase complex with RER2 or SRT1; tet-repressible mutant shows accumulation of hypoglycosylated forms of CPY, suggesting that Nus1p may be involved in protein trafficking; mutations in human homolog NUS1 have been implicated in congenital scoliosis, neurological impairment, refractory epilepsy, hearing deficit, and visual impairment; human cis-prenyltransferase complex complements yeast null mutant -S000033540 CDS YDL193W 4 114672 115799 W 2011-02-03 1996-07-31 -S000002351 ORF Verified YDL192W ARF1 Arf family GTPase ARF1 chromosome 4 L000000104 4 116321 116866 W -91 2011-02-03 1996-07-31 ADP-ribosylation factor; GTPase of the Ras superfamily involved in regulation of coated vesicle formation in intracellular trafficking within the Golgi; ARF1 has a paralog, ARF2, that arose from the whole genome duplication; arf1 arf2 double null mutation is complemented by human ARF1, ARF4, ARF5, or ARF6 -S000033475 CDS YDL192W 4 116321 116866 W 2011-02-03 1996-07-31 -S000002350 ORF Verified YDL191W RPL35A uL29|ribosomal 60S subunit protein L35A|L35A|L29|SOS1 chromosome 4 L000001985 4 117664 118517 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L35A; homologous to mammalian ribosomal protein L35 and bacterial L29; RPL35A has a paralog, RPL35B, that arose from the whole genome duplication -S000033395 CDS YDL191W 4 117664 117666 W 2011-02-03 1996-07-31 -S000033396 CDS YDL191W 4 118158 118517 W 2011-02-03 1996-07-31 -S000033397 intron YDL191W 4 117667 118157 W 2011-02-03 1996-07-31 -S000002349 ORF Verified YDL190C UFD2 ubiquitin-ubiquitin ligase UFD2 chromosome 4 L000002788 4 121592 118707 C 2011-02-03 1996-07-31|2011-02-03 Ubiquitin chain assembly factor (E4); cooperates with a ubiquitin-activating enzyme (E1), a ubiquitin-conjugating enzyme (E2), and a ubiquitin protein ligase (E3) to conjugate ubiquitin to substrates; also functions as an E3 -S000032665 CDS YDL190C 4 121592 118707 C 2011-02-03 1996-07-31|2011-02-03 -S000002348 ORF Verified YDL189W RBS1 chromosome 4 4 122216 123589 W 2011-02-03 2000-07-22|1996-07-31 Protein involved in assembly of the RNA polymerase III (Pol III) complex; high copy suppressor of Pol III assembly mutation and psk1 psk2 mutations that confer temperature-sensitivity for galactose utilization; physically interacts with Pol III; proposed to bind single-stranded nucleic acids via its R3H domain -S000033663 CDS YDL189W 4 122216 123589 W 2011-02-03 2000-07-22|1996-07-31 -S000122396 five_prime_UTR_intron YDL189W 4 122078 122176 W 2011-02-03 2007-04-27 -S000118429 ARS ARS406 ARSIV-124 chromosome 4 4 123617 123901 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178062 ARS_consensus_sequence ARS406 4 123795 123779 C 2014-11-18 2014-11-18 -S000002347 ORF Verified YDL188C PPH22 phosphoprotein phosphatase 2A catalytic subunit PPH22|PPH2 chromosome 4 L000001473 4 124998 123865 C -102 2011-02-03 1996-07-31 Catalytic subunit of protein phosphatase 2A (PP2A); functionally redundant with Pph21p; methylated at C terminus; forms alternate complexes with several regulatory subunits; involved in signal transduction and regulation of mitosis; protein abundance increases in response to DNA replication stress; dephosphorylates Tel1p/Mec1p-phosphorylated Cdc13p to promote telomerase release from telomeres at G2/M; PPH22 has a paralog, PPH21, that arose from the whole genome duplication -S000030301 CDS YDL188C 4 124998 123865 C 2011-02-03 1996-07-31 -S000002345 ORF Uncharacterized YDL186W chromosome 4 4 125616 126449 W 2011-02-03 1996-07-31 Putative protein of unknown function; YDL186W is not an essential gene -S000030062 CDS YDL186W 4 125616 126449 W 2011-02-03 1996-07-31 -S000002346 ORF Dubious YDL187C chromosome 4 4 125838 125509 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030099 CDS YDL187C 4 125838 125509 C 2011-02-03 1996-07-31 -S000002344 ORF Verified YDL185W VMA1 H(+)-transporting V1 sector ATPase subunit A|TFP1|CLS8 chromosome 4 L000002289 4 126787 130002 W -101.43 2011-02-03 1996-07-31 Subunit A of the V1 peripheral membrane domain of V-ATPase; protein precursor undergoes self-catalyzed splicing to yield the extein Tfp1p and the intein Vde (PI-SceI), which is a site-specific endonuclease; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits; involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner -S000029978 CDS YDL185W 4 126787 130002 W 2011-02-03 1996-07-31 -S000029636 intein_encoding_region YDL185W S000007537 4 127636 129000 W 2014-11-18 2014-11-18 Vma1p derived endonuclease; a 50 kDa intein derived from the self-splicing of amino acid residues 284-738 of the VMA1 primary translation product; has endonuclease activity and cleaves at the VMA1 gene to stimulate gene conversion during meiosis -S000007600 ORF Dubious YDL185C-A chromosome 4 4 126835 126608 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YDL185W; identified by homology with hemiascomycetous yeast species -S000037146 CDS YDL185C-A 4 126835 126608 C 2011-02-03 2001-02-26 -S000002343 ORF Verified YDL184C RPL41A eL41|ribosomal 60S subunit protein L41A|L41e|YL41|L47A|L41A|RPL47A chromosome 4 L000001738 4 130484 130407 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L41A; comprises only 25 amino acids; rpl41a rpl41b double null mutant is viable; homologous to mammalian ribosomal protein L41, no bacterial homolog; RPL41A has a paralog, RPL41B, that arose from the whole genome duplication -S000037317 CDS YDL184C 4 130484 130407 C 2011-02-03 1996-07-31 -S000002342 ORF Verified YDL183C MKR1 chromosome 4 4 131833 130871 C 2011-02-03 1996-07-31 Protein that may form an active mitochondrial KHE system; mitochondrial inner-membrane protein; non-essential gene; KHE system stands for K+/H+ exchanger system -S000037236 CDS YDL183C 4 131833 130871 C 2011-02-03 1996-07-31 -S000002341 ORF Verified YDL182W LYS20 homocitrate synthase LYS20 chromosome 4 L000004103 4 133437 134723 W 2011-02-03 1996-07-31 Homocitrate synthase isozyme and functions in DNA repair; catalyzes the condensation of acetyl-CoA and alpha-ketoglutarate to form homocitrate, which is the first step in the lysine biosynthesis pathway; LYS20 has a paralog, LYS21, that arose from the whole genome duplication -S000037198 CDS YDL182W 4 133437 134723 W 2011-02-03 1996-07-31 -S000002340 ORF Verified YDL181W INH1 ATPase inhibitor chromosome 4 L000000866 4 135179 135436 W 2011-02-03 1996-07-31 Protein that inhibits ATP hydrolysis by the F1F0-ATP synthase; inhibitory function is enhanced by stabilizing proteins Stf1p and Stf2p; has a calmodulin-binding motif and binds calmodulin in vitro; INH1 has a paralog, STF1, that arose from the whole genome duplication -S000037121 CDS YDL181W 4 135179 135436 W 2011-02-03 1996-07-31 -S000002339 ORF Uncharacterized YDL180W chromosome 4 4 135896 137539 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole -S000036445 CDS YDL180W 4 135896 137539 W 2011-02-03 1996-07-31 -S000002338 ORF Verified YDL179W PCL9 chromosome 4 L000004041 4 138291 139205 W 2011-02-03 1996-07-31 Cyclin; forms a functional kinase complex with Pho85p cyclin-dependent kinase (Cdk), expressed in late M/early G1 phase, activated by Swi5p; PCL9 has a paralog, PCL2, that arose from the whole genome duplication -S000032032 CDS YDL179W 4 138291 139205 W 2011-02-03 1996-07-31 -S000002337 ORF Verified YDL178W DLD2 D-lactate dehydrogenase|AIP2 chromosome 4 L000000070 4 139522 141114 W 2011-02-03 1996-07-31 D-2-hydroxyglutarate dehydrogenase, and minor D-lactate dehydrogenase; mitochondrial matrix protein that oxidizes D-2-hydroxyglutarate (D-2HG), an oncometabolite, to alpha-ketoglutarate with a minor role in lactate catabolism; located in the mitochondrial matrix -S000031886 CDS YDL178W 4 139522 141114 W 2011-02-03 1996-07-31 -S000002336 ORF Uncharacterized YDL177C chromosome 4 4 141721 141209 C 2011-02-03 1996-07-31 Putative protein of unknown function; similar to the mouse IMPACT gene; YDL177C is not an essential gene -S000031688 CDS YDL177C 4 141721 141209 C 2011-02-03 1996-07-31 -S000002335 ORF Verified YDL176W chromosome 4 4 142097 144223 W 2011-02-03 1996-07-31 Protein of unknown function; predicted by computational methods to be involved in fructose-1,6-bisphosphatase (Fbp1p) degradation; interacts with components of the GID complex; YDL176W is not an essential gene -S000036245 CDS YDL176W 4 142097 144223 W 2011-02-03 1996-07-31 -S000002334 ORF Verified YDL175C AIR2 TRAMP complex RNA-binding subunit chromosome 4 4 145518 144484 C 2011-02-03 1996-07-31 RNA-binding subunit of the TRAMP nuclear RNA surveillance complex; involved in nuclear RNA processing and degradation; involved in TRAMP complex assembly as a bridge between Mtr4p and Trf4p; stimulates the poly(A) polymerase activity of Pap2p in vitro; has 5 zinc knuckle motifs; AIR2 has a paralog, AIR1, that arose from the whole genome duplication; Air2p and Air1p have nonredundant roles in regulation of substrate specificity of the exosome -S000036095 CDS YDL175C 4 145518 144484 C 2011-02-03 1996-07-31 -S000002333 ORF Verified YDL174C DLD1 D-lactate dehydrogenase chromosome 4 L000000508 4 147589 145826 C 2011-02-03 1996-07-31 Major mitochondrial D-lactate dehydrogenase; oxidizes D-lactate to pyruvate, transcription is heme-dependent, repressed by glucose, and derepressed in ethanol or lactate; located in the mitochondrial inner membrane -S000035215 CDS YDL174C 4 147589 145826 C 2011-02-03 1996-07-31 -S000002332 ORF Verified YDL173W PAR32 chromosome 4 4 148191 149078 W 2011-02-03 1996-07-31 Protein of unknown function; hyperphosphorylated upon rapamycin treatment in a Tap42p-dependent manner; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; PAR32 is not an essential gene -S000035172 CDS YDL173W 4 148191 149078 W 2011-02-03 1996-07-31 -S000002331 ORF Dubious YDL172C chromosome 4 4 149086 148607 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035016 CDS YDL172C 4 149086 148607 C 2011-02-03 1996-07-31 -S000002330 ORF Verified YDL171C GLT1 glutamate synthase (NADH) chromosome 4 L000003333 4 155640 149203 C 2011-02-03 1996-07-31 NAD(+)-dependent glutamate synthase (GOGAT); synthesizes glutamate from glutamine and alpha-ketoglutarate; with Gln1p, forms the secondary pathway for glutamate biosynthesis from ammonia; expression regulated by nitrogen source; assembles into filaments as cells approach stationary phase and under cytosolic acidification and starvation conditions -S000034863 CDS YDL171C 4 155640 149203 C 2011-02-03 1996-07-31 -S000002329 ORF Verified YDL170W UGA3 chromosome 4 L000002423 4 156318 157904 W 2011-02-03 1996-07-31 Transcriptional activator for GABA-dependent induction of GABA genes; binds to DNA elements found in the promoters of target genes and increases their expression in the presence of GABA (gamma-aminobutyrate); zinc finger transcription factor of the Zn(2)-Cys(6) binuclear cluster domain type; localized to the nucleus; examples of GABA genes include UGA1, UGA2, and UGA4 -S000034829 CDS YDL170W 4 156318 157904 W 2011-02-03 1996-07-31 -S000002328 ORF Verified YDL169C UGX2 chromosome 4 L000002851 4 158735 158064 C 2011-02-03 1996-07-31 Protein of unknown function; transcript accumulates in response to any combination of stress conditions -S000033142 CDS YDL169C 4 158735 158064 C 2011-02-03 1996-07-31 -S000002327 ORF Verified YDL168W SFA1 bifunctional alcohol dehydrogenase/S-(hydroxymethyl)glutathione dehydrogenase|ADH5 chromosome 4 L000001868 4 159604 160764 W 2011-02-03 1996-07-31 Bifunctional alcohol dehydrogenase and formaldehyde dehydrogenase; formaldehyde dehydrogenase activity is glutathione-dependent; functions in formaldehyde detoxification and formation of long chain and complex alcohols, regulated by Hog1p-Sko1p; protein abundance increases in response to DNA replication stress -S000033096 CDS YDL168W 4 159604 160764 W 2011-02-03 1996-07-31 -S000002326 ORF Verified YDL167C NRP1 chromosome 4 L000000121 4 163154 160995 C 2011-02-03 1996-07-31 Putative RNA binding protein of unknown function; localizes to stress granules induced by glucose deprivation; predicted to be involved in ribosome biogenesis -S000032963 CDS YDL167C 4 163154 160995 C 2011-02-03 1996-07-31 -S000002325 ORF Verified YDL166C FAP7 nucleoside-triphosphatase chromosome 4 4 164042 163449 C 2011-02-03 1996-07-31 Essential NTPase required for small ribosome subunit synthesis; mediates processing of the 20S pre-rRNA at site D in the cytoplasm but associates only transiently with 43S preribosomes via Rps14p; complex with Rps14 is conserved between humans, yeast, and arches; may be the endonuclease for site D; depletion leads to accumulation of pre-40S ribosomes in 80S-like ribosomes; human TAF9 functionally complements the lethality of the null mutation -S000032043 CDS YDL166C 4 164042 163449 C 2011-02-03 1996-07-31 -S000002324 ORF Verified YDL165W CDC36 CCR4-NOT core subunit CDC36|NOT2|DNA19 chromosome 4 L000000272 4 164290 164865 W -80 2011-02-03 1996-07-31 Component of the CCR4-NOT core complex, involved in mRNA decapping; this complex has multiple roles in regulating mRNA levels including regulation of transcription and destabilizing mRNAs through deadenylation; basal transcription factor -S000031977 CDS YDL165W 4 164290 164865 W 2011-02-03 1996-07-31 -S000002322 ORF Dubious YDL163W chromosome 4 4 166956 167258 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CDC9/YDL164C encoding DNA ligase -S000030824 CDS YDL163W 4 166956 167258 W 2011-02-03 1996-07-31 -S000002323 ORF Verified YDL164C CDC9 DNA ligase (ATP) CDC9|MMS8 chromosome 4 L000000249 4 167254 164987 C -78 2011-02-03 1996-07-31 DNA ligase I found in nucleus and mitochondria; essential enzyme that joins Okazaki fragments during DNA replication; also acts in ribonucleotide excision repair, base excision repair, and recombination; DNA ligase I mutants trigger ubiquitination of PCNA at K107, facilitating Rad59p-mediated bypass of unligated Okazaki fragments; human homolog LIG1 can complement yeast cdc9 temperature-sensitive mutant at restrictive temperature -S000030891 CDS YDL164C 4 167254 164987 C 2011-02-03 1996-07-31 -S000002320 ORF Verified YDL161W ENT1 epsin chromosome 4 4 167714 169078 W 2011-02-03 1996-07-31 Epsin-like protein involved in endocytosis and actin patch assembly; functionally redundant with Ent2p; binds clathrin via a clathrin-binding domain motif at C-terminus; relocalizes from bud neck to cytoplasm upon DNA replication stress; ENT1 has a paralog, ENT2, that arose from the whole genome duplication -S000030611 CDS YDL161W 4 167714 169078 W 2011-02-03 1996-07-31 -S000002321 ORF Dubious YDL162C chromosome 4 4 167715 167359 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ENT1/YDL161W, a verified gene involved in endocytosis and actin cortical patch assembly -S000030690 CDS YDL162C 4 167715 167359 C 2011-02-03 1996-07-31 -S000028520 ORF Verified YDL160C-A MHF2 chromosome 4 4 169608 169366 C 2011-02-03 2003-07-29 Component of the heterotetrameric MHF histone-fold complex; in humans the MHF complex interacts with both DNA and Mph1p ortholog FANCM to stabilize and remodel blocked replication forks and repair damaged DNA; mhf2 srs2 double mutants are MMS hypersensitive; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-X, also known as MHF2 -S000030315 CDS YDL160C-A 4 169608 169366 C 2011-02-03 2003-07-29 -S000002319 ORF Verified YDL160C DHH1 DExD/H-box ATP-dependent RNA helicase DHH1 chromosome 4 L000000504 4 171930 170410 C 2011-02-03 1996-07-31 Cytoplasmic DEAD-box helicase, stimulates mRNA decapping; coordinates distinct steps in mRNA function and decay, interacting with both decapping and deadenylase complexes; role in translational repression, mRNA decay, and possibly mRNA export; interacts and cooperates with Ngr1p to promote specific mRNA decay; ATP- and RNA-bound form promotes processing body (PB) assembly, while ATPase stimulation by Not1p promotes PB disassembly; forms cytoplasmic foci on replication stress -S000036698 CDS YDL160C 4 171930 170410 C 2011-02-03 1996-07-31 -S000007599 ORF Uncharacterized YDL159W-A YDL159W-B chromosome 4 4 172182 172313 W 2011-02-03 2001-02-26 Putative protein of unknown function; identified by sequence comparison with hemiascomycetous yeast species -S000037145 CDS YDL159W-A 4 172182 172313 W 2011-02-03 2001-02-26 -S000002318 ORF Verified YDL159W STE7 mitogen-activated protein kinase kinase STE7 chromosome 4 L000002117 4 172481 174028 W -76 2011-02-03 1996-07-31 Signal transducing MAP kinase kinase; involved in pheromone response where it phosphorylates Fus3p; involved in the pseudohyphal/invasive growth pathway where it phosphorylates of Kss1p; phosphorylated by Ste11p; degraded by ubiquitin pathway -S000036970 CDS YDL159W 4 172481 174028 W 2011-02-03 1996-07-31 -S000028612 ORF Dubious YDL159C-B YDL159C-A chromosome 4 4 173232 173056 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031444 CDS YDL159C-B 4 173232 173056 C 2011-02-03 2003-07-29 -S000002317 ORF Dubious YDL158C chromosome 4 4 174174 173866 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036885 CDS YDL158C 4 174174 173866 C 2011-02-03 1996-07-31 -S000002316 ORF Uncharacterized YDL157C chromosome 4 4 174588 174232 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000036806 CDS YDL157C 4 174588 174232 C 2011-02-03 1996-07-31 -S000002315 ORF Verified YDL156W CMR1 chromosome 4 4 174918 176486 W 2011-02-03 1996-07-31 Nuclear protein with a role in protein quality control; localizes to the intranuclear quality control compartment (INQ) in response to proteasome inhibition or DNA replication stress; INQ likely sequesters proteins involved in DNA metabolism for degradation or re-folding; DNA-binding protein with preference for UV-damaged DNA; contains three WD domains (WD-40 repeat); human ortholog WDR76 also exhibits perinuclear localization under similar stress conditions -S000035992 CDS YDL156W 4 174918 176486 W 2011-02-03 1996-07-31 -S000002314 ORF Verified YDL155W CLB3 B-type cyclin CLB3 chromosome 4 L000000351 4 176773 178056 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the G2/M transition; may be involved in DNA replication and spindle assembly; accumulates during S phase and G2, then targeted for ubiquitin-mediated degradation; relative distribution to the nucleus increases upon DNA replication stress; CLB3 has a paralog, CLB4, that arose from the whole genome duplication -S000035864 CDS YDL155W 4 176773 178056 W 2011-02-03 1996-07-31 -S000002313 ORF Verified YDL154W MSH5 MutS family protein MSH5 chromosome 4 L000002573 4 178334 181039 W 2011-02-03 1996-07-31 Protein of the MutS family; forms a dimer with Msh4p that facilitates crossovers between homologs during meiosis; msh5-Y823H mutation confers tolerance to DNA alkylating agents; homologs present in C. elegans and humans -S000035754 CDS YDL154W 4 178334 181039 W 2011-02-03 1996-07-31 -S000002311 ORF Dubious YDL152W chromosome 4 4 182822 183187 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SAS10/YDL153C, a component of the small ribosomal subunit processosome -S000034761 CDS YDL152W 4 182822 183187 W 2011-02-03 1996-07-31 -S000002312 ORF Verified YDL153C SAS10 rRNA-processing protein SAS10|UTP3 chromosome 4 L000003317 4 183018 181186 C 2011-02-03 1996-07-31 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit; disrupts silencing when overproduced; mutant has increased aneuploidy tolerance; essential gene -S000035646 CDS YDL153C 4 183018 181186 C 2011-02-03 1996-07-31 -S000002309 ORF Verified YDL150W RPC53 DNA-directed RNA polymerase III subunit C53|C53|RPC4 chromosome 4 L000001691 4 183343 184611 W -70 2011-02-03 1996-07-31 RNA polymerase III subunit C53 -S000034634 CDS YDL150W 4 183343 184611 W 2011-02-03 1996-07-31 -S000002310 ORF Dubious YDL151C BUD30 chromosome 4 S000007648 4 183899 183318 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 96% of ORF overlaps the verified gene RPC53; diploid mutant displays a weak budding pattern phenotype in a systematic assay -S000034639 CDS YDL151C 4 183899 183318 C 2011-02-03 1996-07-31 -S000002308 ORF Verified YDL149W ATG9 autophagy protein ATG9|CVT6|APG9|CVT7|AUT9 chromosome 4 L000004759|L000004753|L000004758|S000029131 4 184925 187918 W 2011-02-03 1996-07-31 Transmembrane protein involved in forming Cvt and autophagic vesicles; cycles between the phagophore assembly site (PAS) and other cytosolic punctate structures, not found in autophagosomes; may be involved in membrane delivery to the PAS -S000032870 CDS YDL149W 4 184925 187918 W 2011-02-03 1996-07-31 -S000002307 ORF Verified YDL148C NOP14 snoRNA-binding rRNA-processing protein NOP14|UTP2 chromosome 4 4 190586 188154 C 2011-02-03 1996-07-31 Nucleolar protein; forms a complex with Noc4p that mediates maturation and nuclear export of 40S ribosomal subunits; also present in the small subunit processome complex, which is required for processing of pre-18S rRNA -S000032714 CDS YDL148C 4 190586 188154 C 2011-02-03 1996-07-31 -S000002306 ORF Verified YDL147W RPN5 proteasome regulatory particle lid subunit RPN5|NAS5 chromosome 4 L000004451|L000004305 4 190924 192261 W 2011-02-03 1996-07-31 Subunit of the CSN and 26S proteasome lid complexes; similar to mammalian p55 subunit and to another S. cerevisiae regulatory subunit, Rpn7p; Rpn5p is an essential protein; the COP9 signalosome is also known as the CSN -S000032657 CDS YDL147W 4 190924 192261 W 2011-02-03 1996-07-31 -S000002305 ORF Verified YDL146W LDB17 chromosome 4 4 192750 194225 W 2011-02-03 1996-07-31 Protein involved in the regulation of endocytosis; transiently recruited to actin cortical patches in a SLA1-dependent manner after late coat component assembly; GFP-fusion protein localizes to the periphery, cytoplasm, bud, and bud neck -S000032526 CDS YDL146W 4 192750 194225 W 2011-02-03 1996-07-31 -S000002304 ORF Verified YDL145C COP1 coatomer subunit alpha|SOO1|RET1|SEC33 chromosome 4 L000002603 4 198176 194571 C 2011-02-03 1996-07-31 Alpha subunit of COPI vesicle coatomer complex; complex surrounds transport vesicles in the early secretory pathway -S000031516 CDS YDL145C 4 198176 194571 C 2011-02-03 1996-07-31 -S000002303 ORF Verified YDL144C chromosome 4 4 199732 198662 C 2011-02-03 2003-09-22|1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YDL144C is not an essential gene; protein abundance increases in response to DNA replication stress -S000031463 CDS YDL144C 4 199732 198662 C 2011-02-03 2003-09-22|1996-07-31 -S000002302 ORF Verified YDL143W CCT4 chaperonin-containing T-complex subunit CCT4|ANC2|TCP4 chromosome 4 L000000087 4 199996 201582 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo -S000031415 CDS YDL143W 4 199996 201582 W 2011-02-03 1996-07-31 -S000002301 ORF Verified YDL142C CRD1 cardiolipin synthase|CLS1 chromosome 4 L000003358 4 202570 201719 C 2011-02-03 1996-07-31 Cardiolipin synthase; produces cardiolipin, which is a phospholipid of the mitochondrial inner membrane that is required for normal mitochondrial membrane potential and function and for correct integration of membrane-multispanning proteins into the mitochondrial outer membrane; required to maintain tubular mitochondrial morphology and functions in mitochondrial fusion; also required for normal vacuolar ion homeostasis -S000030494 CDS YDL142C 4 202570 201719 C 2011-02-03 1996-07-31 -S000002300 ORF Verified YDL141W BPL1 biotin--[acetyl-CoA-carboxylase] ligase BPL1|ACC2 chromosome 4 L000002771 4 203039 205111 W 2011-02-03 1996-07-31 Biotin:apoprotein ligase; covalently modifies proteins with the addition of biotin, required for acetyl-CoA carboxylase (Acc1p) holoenzyme formation; comparative analysis suggests that a mitochondrially targeted form may result from translation starting at a non-canonical codon upstream of the annotated start codon; human homolog HLCS can complement yeast BPL1 mutant -S000030458 CDS YDL141W 4 203039 205111 W 2011-02-03 1996-07-31 -S000002299 ORF Verified YDL140C RPO21 DNA-directed RNA polymerase II core subunit RPO21|B220|SUA8|RPB220|RPB1 chromosome 4 L000001744 4 210561 205360 C -68 2011-02-03 1996-07-31 RNA polymerase II largest subunit B220; part of central core; phosphorylation of C-terminal heptapeptide repeat domain regulates association with transcription and splicing factors; similar to bacterial beta-prime -S000030216 CDS YDL140C 4 210561 205360 C 2011-02-03 1996-07-31 -S000002298 ORF Verified YDL139C SCM3 chromosome 4 L000003281 4 212046 211375 C 2011-02-03 2003-09-22|1996-07-31 Nonhistone component of centromeric chromatin; binds to histone H3 variant, Cse4p, and recruits it to centromeres; involved in the assembly and maintenance of Cse4-H4 at centromeres; required for kinetochore assembly and G2/M progression; may protect Cse4p from ubiquitination; homolog of mammalian HJURP -S000037514 CDS YDL139C 4 212046 211375 C 2011-02-03 2003-09-22|1996-07-31 -S000118430 ARS ARS409 ARSIV-213 chromosome 4 4 212519 212618 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178063 ARS_consensus_sequence ARS409 4 212594 212578 C 2014-11-18 2014-11-18 -S000002297 ORF Verified YDL138W RGT2 glucose sensor chromosome 4 L000003268 4 213351 215642 W 2011-02-03 1996-07-31 Plasma membrane high glucose sensor that regulates glucose transport; low affinity sesnor that contains 12 predicted transmembrane segments and a long C-terminal tail required for hexose transporter induction; phosphorylation of the tail by Yck1p/Yck2p facilitates binding to the HXT co-repressors, Mth1p and Std1p; RGT2 has a paralog, SNF3, that arose from the whole genome duplication -S000037451 CDS YDL138W 4 213351 215642 W 2011-02-03 1996-07-31 -S000002296 ORF Verified YDL137W ARF2 Arf family GTPase ARF2 chromosome 4 L000000105|L000000060 4 216529 217074 W -64 1996-07-31 1996-07-31 ADP-ribosylation factor; GTPase of the Ras superfamily involved in regulation of coated formation vesicles in intracellular trafficking within the Golgi; ARF2 has a paralog, ARF1, that arose from the whole genome duplication; arf1 arf2 double null mutation is complemented by human ARF1, ARF4, ARF5, or ARF6 -S000036736 CDS YDL137W 4 216529 217074 W 1996-07-31 1996-07-31 -S000122094 five_prime_UTR_intron YDL137W 4 216158 216489 W 2007-04-04 2007-04-04 -S000002295 ORF Verified YDL136W RPL35B uL29|ribosomal 60S subunit protein L35B|L35B|L29|SOS2 chromosome 4 L000001986 4 217600 218367 W 1996-07-31 1996-07-31 Ribosomal 60S subunit protein L35B; homologous to mammalian ribosomal protein L35 and bacterial L29; RPL35B has a paralog, RPL35A, that arose from the whole genome duplication -S000036637 CDS YDL136W 4 217600 217602 W 1996-07-31 1996-07-31 -S000036638 CDS YDL136W 4 218008 218367 W 1996-07-31 1996-07-31 -S000036639 intron YDL136W 4 217603 218007 W 1996-07-31 1996-07-31 -S000002294 ORF Verified YDL135C RDI1 chromosome 4 L000002743 4 219288 218680 C 1996-07-31 1996-07-31 Rho GDP dissociation inhibitor; involved in the localization and regulation of Cdc42p and Rho1p; protein abundance increases in response to DNA replication stress -S000036486 CDS YDL135C 4 219288 218680 C 1996-07-31 1996-07-31 -S000002292 ORF Verified YDL134C PPH21 phosphoprotein phosphatase 2A catalytic subunit PPH21 chromosome 4 L000001472 4 220771 219662 C -66 1996-07-31 1996-07-31 Catalytic subunit of protein phosphatase 2A (PP2A); functionally redundant with Pph22p; methylated at C terminus; forms alternate complexes with several regulatory subunits; involved in signal transduction and regulation of mitosis; forms nuclear foci upon DNA replication stress; PPH21 has a paralog, PPH22, that arose from the whole genome duplication -S000035565 CDS YDL134C 4 220771 219662 C 1996-07-31 1996-07-31 -S000002293 ORF Verified YDL133C-A RPL41B eL41|ribosomal 60S subunit protein L41B|L41e|YL41|L47B|L41B|YDL134C-A|RPL47B chromosome 4 L000001739 4 221801 221724 C 1999-07-17 1999-07-17 Ribosomal 60S subunit protein L41B; comprises only 25 amino acids; rpl41a rpl41b double null mutant is viable; homologous to mammalian ribosomal protein L41, no bacterial homolog; RPL41B has a paralog, RPL41A, that arose from the whole genome duplication -S000030753 CDS YDL133C-A 4 221801 221724 C 1999-07-17 1999-07-17 -S000002291 ORF Verified YDL133W SRF1 chromosome 4 4 222427 223740 W 1996-07-31 1996-07-31 Regulator of phospholipase D (Spo14p); interacts with Spo14p and regulates its catalytic activity; capable of buffering the toxicity of C16:0 platelet activating factor, a lipid that accumulates intraneuronally in Alzheimer's patients -S000035552 CDS YDL133W 4 222427 223740 W 1996-07-31 1996-07-31 -S000002290 ORF Verified YDL132W CDC53 cullin CDC53 chromosome 4 L000000281 4 224304 226751 W -81 1996-07-31 1996-07-31 Cullin; structural protein of SCF complexes (which also contain Skp1p, Cdc34p, Hrt1p and an F-box protein) involved in ubiquitination; SCF promotes the G1-S transition by targeting G1 cyclins and the Cln-CDK inhibitor Sic1p for degradation; human homolog CUL1 can complement yeast cdc53 null mutant -S000035487 CDS YDL132W 4 224304 226751 W 1996-07-31 1996-07-31 -S000002289 ORF Verified YDL131W LYS21 homocitrate synthase LYS21 chromosome 4 L000004259 4 227393 228715 W 1996-07-31 1996-07-31 Homocitrate synthase isozyme; catalyzes the condensation of acetyl-CoA and alpha-ketoglutarate to form homocitrate, which is the first step in the lysine biosynthesis pathway; LYS21 has a paralog, LYS20, that arose from the whole genome duplication -S000035437 CDS YDL131W 4 227393 228715 W 1996-07-31 1996-07-31 -S000007232 ORF Verified YDL130W-A STF1 ATPase-binding protein|AIS2 chromosome 4 L000002126 4 229171 229431 W 1999-07-17 1999-07-17 Protein involved in regulation of the mitochondrial F1F0-ATP synthase; Stf1p and Stf2p act as stabilizing factors that enhance inhibitory action of the Inh1p protein; protein abundance increases in response to DNA replication stress; STF1 has a paralog, INH1, that arose from the whole genome duplication -S000033965 CDS YDL130W-A 4 229171 229431 W 1999-07-17 1999-07-17 -S000002288 ORF Verified YDL130W RPP1B ribosomal protein P1B|YP1beta|P1B|L44'|Ax|RPLA3|RPL44' chromosome 4 L000003298|L000001734 4 229906 230527 W 1996-07-31 1996-07-31 Ribosomal protein P1 beta; component of the ribosomal stalk, which is involved in interaction of translational elongation factors with ribosome; free (non-ribosomal) P1 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; accumulation is regulated by phosphorylation and interaction with the P2 stalk component -S000035361 CDS YDL130W 4 229906 230019 W 1996-07-31 1996-07-31 -S000035362 CDS YDL130W 4 230321 230527 W 1996-07-31 1996-07-31 -S000035363 intron YDL130W 4 230020 230320 W 1996-07-31 1996-07-31 -S000002287 ORF Verified YDL129W chromosome 4 4 231024 231899 W 1996-07-31 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; YDL129W is not an essential gene; relative distribution to the nucleus increases upon DNA replication stress -S000034421 CDS YDL129W 4 231024 231899 W 1996-07-31 1996-07-31 -S000002286 ORF Verified YDL128W VCX1 MNR1|HUM1 chromosome 4 L000002990 4 232652 233887 W 1996-07-31 1996-07-31 Vacuolar membrane antiporter with Ca2+/H+ and K+/H+ exchange activity; involved in control of cytosolic Ca2+ and K+ concentrations; has similarity to sodium/calcium exchangers, including the bovine Na+/Ca2+,K+ antiporter -S000034358 CDS YDL128W 4 232652 233887 W 1996-07-31 1996-07-31 -S000002285 ORF Verified YDL127W PCL2 cyclin PCL2|CLN4 chromosome 4 L000002784 4 234927 235853 W 2004-02-11 2004-02-11|1996-07-31 Cyclin, interacts with cyclin-dependent kinase Pho85p; member of the Pcl1,2-like subfamily, involved in the regulation of polarized growth and morphogenesis and progression through the cell cycle; localizes to sites of polarized cell growth; PCL2 has a paralog, PCL9, that arose from the whole genome duplication -S000033442 CDS YDL127W 4 234927 235853 W 2004-02-11 2004-02-11|1996-07-31 -S000178064 ARS ARS409.5 chromosome 4 4 235937 236185 2014-11-18 2014-11-18 Strong autonomously replicating sequence -S000002284 ORF Verified YDL126C CDC48 AAA family ATPase CDC48 chromosome 4 L000000280 4 238664 236157 C 2004-02-11 1996-07-31 AAA ATPase; subunit of polyUb-selective segregase complex involved in ERAD, INM-associated degradation (INMAD), mitotic spindle disassembly, macroautophagy, PMN, ribosome-associated degradation, ribophagy, homotypic ER membrane fusion, SCF complex disassembly, cell wall integrity during heat stress, and telomerase regulation; mobilizes membrane-anchored transcription factors by regulated Ub/proteasome-dependent processing (RUP); human ortholog VCP complements a cdc48 mutant -S000033307 CDS YDL126C 4 238664 236157 C 2004-02-11 1996-07-31 -S000002283 ORF Verified YDL125C HNT1 adenosine 5'-monophosphoramidase chromosome 4 L000003334 4 239606 239019 C 2004-02-11 1996-07-31 Adenosine 5'-monophosphoramidase; interacts physically and genetically with Kin28p, a CDK and TFIIK subunit, and genetically with CAK1; member of histidine triad (HIT) superfamily of nucleotide-binding proteins; protein abundance increases in response to DNA replication stress; human homolog HINT1 can complement yeast hnt1 mutant -S000033248 CDS YDL125C 4 239398 239019 C 2004-02-11 1996-07-31 -S000033247 CDS YDL125C 4 239606 239510 C 2004-02-11 1996-07-31 -S000033249 intron YDL125C 4 239509 239399 C 2004-02-11 1996-07-31 -S000002282 ORF Verified YDL124W aldo-keto reductase superfamily protein chromosome 4 4 240259 241197 W 2004-02-11 1996-07-31 NADPH-dependent alpha-keto amide reductase; reduces aromatic alpha-keto amides, aliphatic alpha-keto esters, and aromatic alpha-keto esters; member of the aldo-keto reductase (AKR) family; protein abundance increases in response to DNA replication stress -S000033228 CDS YDL124W 4 240259 241197 W 2004-02-11 1996-07-31 -S000002281 ORF Verified YDL123W SNA4 chromosome 4 4 241418 241840 W 2004-02-11 1996-07-31 Protein of unknown function; localized to the vacuolar outer membrane; predicted to be palmitoylated -S000032369 CDS YDL123W 4 241418 241840 W 2004-02-11 1996-07-31 -S000002280 ORF Verified YDL122W UBP1 ubiquitin-specific protease UBP1 chromosome 4 L000002415 4 242552 244981 W 2004-02-11 1996-07-31 Ubiquitin-specific protease; removes ubiquitin from ubiquitinated proteins; cleaves at the C terminus of ubiquitin fusions irrespective of their size; capable of cleaving polyubiquitin chains -S000032268 CDS YDL122W 4 242552 244981 W 2004-02-11 1996-07-31 -S000002279 ORF Uncharacterized YDL121C chromosome 4 4 245582 245133 C 2004-02-11 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YDL121C is not an essential protein -S000031235 CDS YDL121C 4 245582 245133 C 2004-02-11 1996-07-31 -S000002278 ORF Verified YDL120W YFH1 ferroxidase chromosome 4 L000003525 4 245923 246447 W 2004-02-11 1996-07-31 Mitochondrial matrix iron chaperone; oxidizes and stores iron; interacts with Isu1p to promote Fe-S cluster assembly; mutation results in multiple Fe/S-dependent enzyme deficiencies; human frataxin homolog FXN is mutated in Friedrich's ataxia; human FTL gene can complement yeast yfh1 null mutant -S000031221 CDS YDL120W 4 245923 246447 W 2004-02-11 1996-07-31 -S000002276 ORF Dubious YDL118W chromosome 4 4 247302 247682 W 2004-02-11 1996-07-31 Dubious open reading frame, unlikely to encode a protein; overlaps almost completely with YDL119C; mutations that would affect both YDL118W and YDL119C confer defective telomere maintenance and are synthetically sick or lethal with alpha-synuclein -S000030066 CDS YDL118W 4 247302 247682 W 2004-02-11 1996-07-31 -S000002277 ORF Verified YDL119C HEM25 chromosome 4 4 247612 246689 C 2004-02-11 1996-07-31 Mitochondrial glycine transporter; required for the transport of glycine into mitochondria for initiation of heme biosynthesis, with YMC1 acting as a secondary transporter; homolog of human SLC25A38, a mitochondrial glycine transporter associated with nonsyndromic autosomal recessive congenital sideroblastic anemia; human SLC25A38 can complement the heme deficiency associated with the null mutant; GFP-fusion protein is induced in response to the DNA-damaging agent MMS -S000030189 CDS YDL119C 4 247612 246689 C 2004-02-11 1996-07-31 -S000002275 ORF Verified YDL117W CYK3 chromosome 4 4 248581 251238 W 2004-02-11 1996-07-31 SH3-domain protein located in the bud neck and cytokinetic actin ring; relocalizes from bud neck to nucleus upon DNA replication stress; activates the chitin synthase activity of Chs2p during cytokinesis; suppressor of growth and cytokinesis defects of chs2 phospho-mutants -S000029965 CDS YDL117W 4 248581 251238 W 2004-02-11 1996-07-31 -S000002274 ORF Verified YDL116W NUP84 chromosome 4 L000003137 4 251566 253746 W 2004-02-11 1996-07-31 Subunit of the Nup84p subcomplex of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport and NPC biogenesis; also plays roles in several processes that may require localization of genes or chromosomes at the nuclear periphery, including double-strand break repair, transcription and chromatin silencing; homologous to human NUP107 -S000029859 CDS YDL116W 4 251566 253746 W 2004-02-11 1996-07-31 -S000118431 ARS ARS410 ARSIV-254 chromosome 4 4 253791 254039 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178065 ARS_consensus_sequence ARS410 4 253948 253932 C 2014-11-18 2014-11-18 -S000007598 ORF Dubious YDL114W-A chromosome 4 4 254935 255048 W 2004-02-11 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified based on homology to hemiascomycetous yeasts -S000037144 CDS YDL114W-A 4 254935 255048 W 2004-02-11 2001-02-26 -S000002273 ORF Verified YDL115C IWR1 chromosome 4 4 255126 253995 C 2007-07-10 2004-02-23|2007-07-10|1996-07-31|2004-01-23 RNA polymerase II transport factor, conserved from yeast to humans; also has a role in transporting RNA polymerase III into the nucleus; interacts with most of the RNAP II subunits; nucleo-cytoplasmic shuttling protein; deletion causes hypersensitivity to K1 killer toxin; protein increases in abundance and relocalizes from nucleus to cytoplasm upon DNA replication stress -S000123279 CDS YDL115C 4 254974 253995 C 2007-07-10 2007-07-10 -S000037159 CDS YDL115C 4 255126 255045 C 2007-07-10 2004-02-23|2007-07-10|1996-07-31|2004-01-23 -S000123278 intron YDL115C 4 255044 254975 C 2007-07-10 2007-07-10 -S000002272 ORF Uncharacterized YDL114W short-chain dehydrogenase/reductase chromosome 4 4 255604 256530 W 2004-02-11 1996-07-31 Putative short-chain dehydrogenase/reductase; YDL114W is not an essential gene -S000037093 CDS YDL114W 4 255604 256530 W 2004-02-11 1996-07-31 -S000130171 ARS ARS411 chromosome 4 4 256530 256633 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000002271 ORF Verified YDL113C ATG20 CVT20|SNX42 chromosome 4 4 258555 256633 C 2004-02-11 1996-07-31 Sorting nexin family member; required for the cytoplasm-to-vacuole targeting (Cvt) pathway and for endosomal sorting; has a Phox homology domain that binds phosphatidylinositol-3-phosphate; interacts with Snx4p; potential Cdc28p substrate -S000036989 CDS YDL113C 4 258555 256633 C 2004-02-11 1996-07-31 -S000002270 ORF Verified YDL112W TRM3 tRNA (guanosine(18)-2'-O)-methyltransferase chromosome 4 L000004920 4 258915 263225 W 2004-02-11 1996-07-31 2'-O-ribose methyltransferase; catalyzes the ribose methylation of the guanosine nucleotide at position 18 of tRNAs -S000036371 CDS YDL112W 4 258915 263225 W 2004-02-11 1996-07-31 -S000002269 ORF Verified YDL111C RRP42 exosome non-catalytic core subunit RRP42 chromosome 4 L000003551 4 264110 263313 C 2004-02-11 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp42p (EXOSC7) -S000036214 CDS YDL111C 4 264110 263313 C 2004-02-11 1996-07-31 -S000002268 ORF Verified YDL110C TMA17 ADC17 chromosome 4 S000154294 4 264964 264512 C 2004-02-11 1996-07-31 ATPase dedicated chaperone that adapts proteasome assembly to stress; Tma17p is induced upon stress; interacts with Rpt6p to assist its pairing to Rpt3p and early steps in proteasome biogenesis; associates with ribosomes; heterozygous deletion demonstrated increases in chromosome instability in a rad9 deletion background; protein abundance is decreased upon intracellular iron depletion -S000036093 CDS YDL110C 4 264964 264512 C 2004-02-11 1996-07-31 -S000002267 ORF Uncharacterized YDL109C putative lipase chromosome 4 4 267201 265258 C 2004-02-11 1996-07-31 Putative lipase; involved in lipid metabolism; not an essential gene; YDL109C has a paralog, ROG1, that arose from the whole genome duplication -S000033934 CDS YDL109C 4 267201 265258 C 2004-02-11 1996-07-31 -S000002266 ORF Verified YDL108W KIN28 TFIIH complex serine/threonine-protein kinase subunit KIN28 chromosome 4 L000000905 4 267698 268699 W 2004-02-11 1996-07-31 Serine/threonine protein kinase, subunit of transcription factor TFIIH; involved in transcription initiation at RNA polymerase II promoters; phosphorylates Ser5 residue of the PolII C-terminal domain (CTD) at gene promoters; relocalizes to the cytosol in response to hypoxia -S000033868 CDS YDL108W 4 267698 267725 W 2004-02-11 1996-07-31 -S000033869 CDS YDL108W 4 267807 268699 W 2004-02-11 1996-07-31 -S000033870 intron YDL108W 4 267726 267806 W 2004-02-11 1996-07-31 -S000002265 ORF Verified YDL107W MSS2 chromosome 4 L000001202 4 268921 269976 W 2004-02-11 1996-07-31 Peripherally bound inner membrane protein of the mitochondrial matrix; involved in membrane insertion of C-terminus of Cox2p, interacts genetically and physically with Cox18p -S000033109 CDS YDL107W 4 268921 269976 W 2004-02-11 1996-07-31 -S000002264 ORF Verified YDL106C PHO2 phoB|GRF10|BAS2 chromosome 4 L000000728 4 271901 270222 C -58.01 2004-02-11 1996-07-31 Homeobox transcription factor; regulatory targets include genes involved in phosphate metabolism; binds cooperatively with Pho4p to the PHO5 promoter; phosphorylation of Pho2p facilitates interaction with Pho4p; relocalizes to the cytosol in response to hypoxia -S000032983 CDS YDL106C 4 271901 270222 C 2004-02-11 1996-07-31 -S000002263 ORF Verified YDL105W NSE4 Smc5-Smc6 complex subunit NSE4|QRI2 chromosome 4 L000002653 4 272389 273597 W 2004-02-11 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair -S000032948 CDS YDL105W 4 272389 273597 W 2004-02-11 1996-07-31 -S000002262 ORF Verified YDL104C QRI7 putative N(6)-L-threonylcarbamoyladenine synthase chromosome 4 L000002654 4 274876 273653 C 2004-02-11 1996-07-31 Protein involved in threonylcarbamoyl adenosine biosynthesis; Sua5p and Qri7p are necessary and sufficient for RNA t6A modification in vitro; highly conserved mitochondrial protein; essential for t6A modification of mitochondrial tRNAs that decode ANN codons; similar to Kae1p and E. coli YgjD, both of which are also required for tRNA t6A modification; when directed to the cytoplasm, complements the essential function of Kae1p in the KEOPS complex -S000031963 CDS YDL104C 4 274876 273653 C 2004-02-11 1996-07-31 -S000002261 ORF Verified YDL103C QRI1 UDP-N-acetylglucosamine diphosphorylase|UAP1 chromosome 4 L000002652 4 276581 275148 C 2004-02-11 1996-07-31 UDP-N-acetylglucosamine pyrophosphorylase; catalyzes the formation of UDP-N-acetylglucosamine (UDP-GlcNAc), which is important in cell wall biosynthesis, protein N-glycosylation, and GPI anchor biosynthesis; protein abundance increases in response to DNA replication stress -S000031867 CDS YDL103C 4 276581 275148 C 2004-02-11 1996-07-31 -S000002260 ORF Verified YDL102W POL3 DNA-directed DNA polymerase delta POL3|CDC2|TEX1|HPR6 chromosome 4 L000000242 4 276872 280165 W -55 2004-02-11 1996-07-31|2011-02-03 Catalytic subunit of DNA polymerase delta; required for chromosomal DNA replication during mitosis and meiosis, intragenic recombination, repair of double strand DNA breaks, and DNA replication during nucleotide excision repair (NER) -S000031813 CDS YDL102W 4 276872 280165 W 2004-02-11 1996-07-31|2011-02-03 -S000002259 ORF Verified YDL101C DUN1 serine/threonine protein kinase DUN1 chromosome 4 L000000531 4 281848 280307 C 2004-02-11 1996-07-31 Cell-cycle checkpoint S/T protein kinase; required for transient G2/M arrest after DNA damage, damage-induced transcription, and nuclear-to-cytoplasmic redistribution of Rnr2p-Rnr4p after genotoxic stress and iron deprivation; phosphorylates repair protein Rad55p, transcriptional repressor Sml1p, superoxide dismutase, and ribonucleotide reductase inhibitors Crt1p and Dif1p; functions in the Mec1p pathway to regulate dNTP pools and telomere length; postreplicative repair role -S000031605 CDS YDL101C 4 281848 280307 C 2004-02-11 1996-07-31 -S000002258 ORF Verified YDL100C GET3 guanine nucleotide exchange factor GET3|ARR4 chromosome 4 4 283176 282112 C 2004-02-11 1996-07-31 Guanine nucleotide exchange factor for Gpa1p; amplifies G protein signaling; functions as a chaperone under ATP-depleted oxidative stress conditions; subunit of GET complex, involved in ATP dependent Golgi to ER trafficking and insertion of tail-anchored (TA) proteins into ER membrane under non-stress conditions; binds as dimer to transmembrane domain (TMD) cargo, shielding TMDs from aqueous solvent; protein abundance increases under DNA replication stress -S000030758 CDS YDL100C 4 283176 282112 C 2004-02-11 1996-07-31 -S000002257 ORF Verified YDL099W BUG1 chromosome 4 4 283419 284444 W 2004-02-11 1996-07-31 Cis-golgi localized protein involved in ER to Golgi transport; forms a complex with the mammalian GRASP65 homolog, Grh1p; mutants are compromised for the fusion of ER-derived vesicles with Golgi membranes -S000034178 CDS YDL099W 4 283419 284444 W 2004-02-11 1996-07-31 -S000002256 ORF Verified YDL098C SNU23 U4/U6-U5 snRNP complex subunit SNU23 chromosome 4 4 285165 284581 C 2004-02-11 1996-07-31 Component of the U4/U6.U5 snRNP complex; involved in mRNA splicing via spliceosome -S000034033 CDS YDL098C 4 285165 284581 C 2004-02-11 1996-07-31 -S000002255 ORF Verified YDL097C RPN6 proteasome regulatory particle lid subunit RPN6|NAS4 chromosome 4 L000004306 4 286695 285391 C 2004-02-11 1996-07-31 Essential, non-ATPase regulatory subunit of the 26S proteasome lid; required for the assembly and activity of the 26S proteasome; the human homolog (S9 protein) partially rescues Rpn6p depletion; protein abundance increases in response to DNA replication stress -S000033908 CDS YDL097C 4 286695 285391 C 2004-02-11 1996-07-31 -S000002253 ORF Verified YDL095W PMT1 dolichyl-phosphate-mannose-protein mannosyltransferase PMT1 chromosome 4 L000001458 4 287059 289512 W 2004-02-11 1996-07-31 Protein O-mannosyltransferase of the ER membrane; transfers mannose from dolichyl phosphate-D-mannose to protein serine and threonine residues; 1 of 7 related proteins involved in O-glycosylation which is essential for cell wall rigidity; involved in ER quality control; amino terminus faces cytoplasm, carboxyl terminus faces ER lumen -S000033095 CDS YDL095W 4 287059 289512 W 2004-02-11 1996-07-31 -S000002254 ORF Dubious YDL096C OPI6 chromosome 4 4 287324 286998 C 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene PMT1/YDL095W; YDL096C is not essential -S000033140 CDS YDL096C 4 287324 286998 C 2004-02-11 1996-07-31 -S000002251 ORF Verified YDL093W PMT5 putative dolichyl-phosphate-mannose-protein mannosyltransferase PMT5 chromosome 4 L000003164 4 289909 292140 W 2004-02-11 1996-07-31 Protein O-mannosyltransferase; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; acts in a complex with Pmt3p, can instead interact with Pmt2p in some conditions; target for new antifungals -S000032094 CDS YDL093W 4 289909 292140 W 2004-02-11 1996-07-31 -S000002252 ORF Dubious YDL094C chromosome 4 4 290081 289572 C 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verfied gene PMT5/YDL093W; YDL094C is not essential -S000032962 CDS YDL094C 4 290081 289572 C 2004-02-11 1996-07-31 -S000002250 ORF Verified YDL092W SRP14 RNA-binding signal recognition particle subunit SRP14 chromosome 4 L000002061 4 292781 293221 W 2004-02-11 1996-07-31 Signal recognition particle (SRP) subunit; interacts with the RNA component of SRP to form the Alu domain, which is the region of SRP responsible for arrest of nascent chain elongation during membrane targeting; homolog of mammalian SRP14 -S000031975 CDS YDL092W 4 292781 293221 W 2004-02-11 1996-07-31 -S000002249 ORF Verified YDL091C UBX3 chromosome 4 4 294759 293392 C 2004-02-11 1996-07-31 Clathrin-coated vesicle component, regulator of endocytosis; copurifies with the DSC ubiquitin ligase complex; UBX (ubiquitin regulatory X) domain-containing protein that interacts with Cdc48p; required for efficient clathrin-mediated endocytosis; ortholog of fission yeast Ucp10 -S000030889 CDS YDL091C 4 294759 293392 C 2004-02-11 1996-07-31 -S000002248 ORF Verified YDL090C RAM1 protein farnesyltransferase|STE16|SGP2|SCG2|FUS8|DPR1 chromosome 4 L000001579 4 296329 295034 C -33 2004-02-11 1996-07-31 Beta subunit of the CAAX farnesyltransferase (FTase); this complex prenylates the a-factor mating pheromone and Ras proteins; required for the membrane localization of Ras proteins and a-factor; homolog of the mammalian FTase beta subunit -S000030792 CDS YDL090C 4 296329 295034 C 2004-02-11 1996-07-31 -S000002247 ORF Verified YDL089W NUR1 chromosome 4 4 296820 298274 W 2004-02-11 1996-07-31 Protein involved in regulation of mitotic exit; dephosphorylation target of Cdc14p in anaphase, which promotes timely rDNA segregation and allows mitotic progression; interacts with Csm1p, Lrs4p; required for rDNA repeat stability; null mutant causes increase in unequal sister-chromatid exchange; GFP-fusion protein localizes to the nuclear periphery, possible Cdc28p substrate -S000037902 CDS YDL089W 4 296820 298274 W 2004-02-11 1996-07-31 -S000002246 ORF Verified YDL088C ASM4 FG-nucleoporin ASM4|NUP59 chromosome 4 L000002642 4 300003 298417 C 2004-02-11 1996-07-31 FG-nucleoporin component of central core of nuclear pore complex (NPC); contributes directly to nucleocytoplasmic transport; induces membrane tubulation, which may contribute to nuclear pore assembly; ASM4 has a paralog, NUP53, that arose from the whole genome duplication -S000037765 CDS YDL088C 4 300003 298417 C 2004-02-11 1996-07-31 -S000002245 ORF Verified YDL087C LUC7 EPE1|EXM2 chromosome 4 L000003348 4 300999 300214 C 2004-02-11 1996-07-31 Essential protein associated with the U1 snRNP complex; splicing factor involved in recognition of 5' splice site; contains two zinc finger motifs; N-terminal zinc finger binds pre-mRNA; relocalizes to the cytosol in response to hypoxia -S000037703 CDS YDL087C 4 300999 300214 C 2004-02-11 1996-07-31 -S000002244 ORF Uncharacterized YDL086W carboxymethylenebutenolidase chromosome 4 4 301413 302234 W 2004-02-11 1996-07-31 Putative carboxymethylenebutenolidase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YDL086W is not an essential gene -S000036968 CDS YDL086W 4 301413 302234 W 2004-02-11 1996-07-31 -S000028611 ORF Dubious YDL086C-A chromosome 4 4 302089 301655 C 2004-02-11 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps uncharacterized ORF YDL086W; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031442 CDS YDL086C-A 4 302089 301655 C 2004-02-11 2003-07-29 -S000007588 ORF Uncharacterized YDL085C-A chromosome 4 4 302670 302464 C 2004-02-11 2001-01-30 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus -S000037099 CDS YDL085C-A 4 302670 302464 C 2004-02-11 2001-01-30 -S000002243 ORF Verified YDL085W NDE2 NADH-ubiquinone reductase (H(+)-translocating) NDE2|NDH2 chromosome 4 4 303211 304848 W 2004-02-11 1996-07-31 Mitochondrial external NADH dehydrogenase; catalyzes the oxidation of cytosolic NADH; Nde1p and Nde2p are involved in providing the cytosolic NADH to the mitochondrial respiratory chain; NDE2 has a paralog, NDE1, that arose from the whole genome duplication -S000036900 CDS YDL085W 4 303211 304848 W 2004-02-11 1996-07-31 -S000002242 ORF Verified YDL084W SUB2 ATP-dependent RNA helicase SUB2 chromosome 4 L000004574 4 305237 306577 W 2004-02-11 1996-07-31 Component of the TREX complex required for nuclear mRNA export; member of the DEAD-box RNA helicase superfamily and is involved in early and late steps of spliceosome assembly; homolog of the human splicing factor hUAP56; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000036856 CDS YDL084W 4 305237 306577 W 2004-02-11 1996-07-31 -S000002241 ORF Verified YDL083C RPS16B uS9|ribosomal 40S subunit protein S16B|S9|rp61R|S16B chromosome 4 L000004478 4 307789 306926 C 2004-02-11 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S16 and bacterial S9; RPS16B has a paralog, RPS16A, that arose from the whole genome duplication -S000035913 CDS YDL083C 4 307333 306926 C 2004-02-11 1996-07-31 -S000035912 CDS YDL083C 4 307789 307766 C 2004-02-11 1996-07-31 -S000035914 intron YDL083C 4 307765 307334 C 2004-02-11 1996-07-31 -S000002240 ORF Verified YDL082W RPL13A eL13|ribosomal 60S subunit protein L13A|L13e|L13A chromosome 4 L000004454 4 308424 309388 W 2004-02-11 1996-07-31 Ribosomal 60S subunit protein L13A; not essential for viability; homologous to mammalian ribosomal protein L13, no bacterial homolog; RPL13A has a paralog, RPL13B, that arose from the whole genome duplication -S000035860 CDS YDL082W 4 308424 308427 W 2004-02-11 1996-07-31 -S000035861 CDS YDL082W 4 308793 309388 W 2004-02-11 1996-07-31 -S000035862 intron YDL082W 4 308428 308792 W 2004-02-11 1996-07-31 -S000002239 ORF Verified YDL081C RPP1A P1A|ribosomal protein P1A|RPLA1 chromosome 4 L000002627 4 310122 309802 C 2004-02-11 1996-07-31 Ribosomal stalk protein P1 alpha; involved in the interaction between translational elongation factors and the ribosome; free (non-ribosomal) P1 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; accumulation of P1 in the cytoplasm is regulated by phosphorylation and interaction with the P2 stalk component -S000035711 CDS YDL081C 4 310122 309802 C 2004-02-11 1996-07-31 -S000002238 ORF Verified YDL080C THI3 branched-chain-2-oxoacid decarboxylase THI3|KID1 chromosome 4 L000003499 4 312471 310642 C 2004-02-11 1996-07-31 Regulatory protein that binds Pdc2p and Thi2p transcription factors; activates thiamine biosynthesis transcription factors Pdc2p and Thi2p by binding to them, but releases and de-activates them upon binding to thiamine pyrophosphate (TPP), the end product of the pathway; has similarity to decarboxylases but enzymatic activity is not detected -S000035644 CDS YDL080C 4 312471 310642 C 2004-02-11 1996-07-31 -S000002237 ORF Verified YDL079C MRK1 putative serine/threonine protein kinase MRK1 chromosome 4 L000001151 4 314748 312951 C 2004-02-11 1996-07-31 Glycogen synthase kinase 3 (GSK-3) homolog; one of four GSK-3 homologs in S. cerevisiae that function to activate Msn2p-dependent transcription of stress responsive genes and that function in protein degradation; MRK1 has a paralog, RIM11, that arose from the whole genome duplication -S000033718 CDS YDL079C 4 314044 312951 C 2004-02-11 1996-07-31 -S000033717 CDS YDL079C 4 314748 314337 C 2004-02-11 1996-07-31 -S000033719 intron YDL079C 4 314336 314045 C 2004-02-11 1996-07-31 -S000002236 ORF Verified YDL078C MDH3 malate dehydrogenase MDH3 chromosome 4 L000001047 4 316388 315357 C 2004-02-11 1996-07-31 Peroxisomal malate dehydrogenase; catalyzes interconversion of malate and oxaloacetate; involved in the glyoxylate cycle -S000033624 CDS YDL078C 4 316388 315357 C 2004-02-11 1996-07-31 -S000130172 ARS ARS412 chromosome 4 4 316771 317230 2014-11-18 2014-11-18|2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000178066 ARS_consensus_sequence ARS412 4 316862 316878 W 2014-11-18 2014-11-18 -S000002235 ORF Verified YDL077C VAM6 VPS39|VPL22|VPL18|CVT4 chromosome 4 L000003935 4 320120 316971 C 2004-02-11 1996-07-31 Guanine nucleotide exchange factor for the GTPase Gtr1p; subunit of the HOPS endocytic tethering complex; vacuole membrane protein; functions as a Rab GTPase effector, interacting with both GTP- and GDP-bound conformations of Ypt7p; facilitates tethering and promotes membrane fusion events at the late endosome and vacuole; required for both membrane and protein trafficking; component of vacuole-mitochondrion contacts (vCLAMPs) important for lipid transfer between organelles -S000033526 CDS YDL077C 4 320120 316971 C 2004-02-11 1996-07-31 -S000002234 ORF Verified YDL076C RXT3 chromosome 4 4 321552 320668 C 2004-02-11 1996-07-31 Component of the Rpd3L histone deacetylase complex; involved in histone deacetylation; protein abundance increases in response to DNA replication stress -S000032814 CDS YDL076C 4 321552 320668 C 2004-02-11 1996-07-31 -S000002233 ORF Verified YDL075W RPL31A eL31|ribosomal 60S subunit protein L31A|L31e|YL28|L34A|L31A|RPL34 chromosome 4 L000003297|L000001727 4 322226 322988 W 2004-02-11 1996-07-31 Ribosomal 60S subunit protein L31A; associates with karyopherin Sxm1p; loss of both Rpl31p and Rpl39p confers lethality; homologous to mammalian ribosomal protein L31, no bacterial homolog; RPL31A has a paralog, RPL31B, that arose from the whole genome duplication -S000032744 CDS YDL075W 4 322226 322282 W 2004-02-11 1996-07-31 -S000032745 CDS YDL075W 4 322704 322988 W 2004-02-11 1996-07-31 -S000032746 intron YDL075W 4 322283 322703 W 2004-02-11 1996-07-31 -S000006454 snoRNA_gene snR63 SNR63 chromosome 4 L000004532 4 323471 323217 C 2004-02-11 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2256 -S000030842 noncoding_exon snR63 4 323471 323217 C 2004-02-11 2000-05-19 -S000002232 ORF Verified YDL074C BRE1 E3 ubiquitin-protein ligase BRE1 chromosome 4 4 326149 324047 C 2004-02-11 1996-07-31 E3 ubiquitin ligase; forms heterodimer with Rad6p to regulate K63 polyubiquitination in response to oxidative stress and to monoubiquinate histone H2B-K123, which is required for the subsequent methylation of histone H3-K4 and H3-K79; required for DSBR, transcription, silencing, and checkpoint control; interacts with RNA-binding protein Npl3p, linking histone ubiquitination to mRNA processing; Bre1p-dependent histone ubiquitination promotes pre-mRNA splicing -S000032572 CDS YDL074C 4 326149 324047 C 2004-02-11 1996-07-31 -S000002231 ORF Verified YDL073W AHK1 chromosome 4 4 326613 329567 W 2004-02-11 1996-07-31 Scaffold protein in the HKR1 sub-branch of the Hog1p-signaling pathway; physically interacts with the cytoplasmic domain of Hkr1p, and with Sho1p, Pbs2p, and Ste11p; prevents cross-talk signaling from Hkr1p of the osmotic stress MAPK cascade to the Kss1p MAPK cascade; non-essential gene -S000032520 CDS YDL073W 4 326613 329567 W 2004-02-11 1996-07-31 -S000118432 ARS ARS413 ARSIV-330 chromosome 4 4 329566 329814 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000178067 ARS_consensus_sequence ARS413 4 329671 329687 W 2014-11-18 2014-11-18 -S000002230 ORF Verified YDL072C YET3 chromosome 4 4 330447 329836 C 2004-02-11 1996-07-31 Protein of unknown function; YET3 null mutant decreases the level of secreted invertase; homolog of human BAP31 protein; protein abundance increases in response to DNA replication stress -S000031514 CDS YDL072C 4 330447 329836 C 2004-02-11 1996-07-31 -S000002228 ORF Verified YDL070W BDF2 chromosome 4 L000004431 4 331024 332940 W 2011-02-03 1996-07-31 Protein involved in transcription initiation; acts at TATA-containing promoters; associates with the basal transcription factor TFIID; contains two bromodomains; corresponds to the C-terminal region of mammalian TAF1; redundant with Bdf1p; protein abundance increases in response to DNA replication stress; BDF2 has a paralog, BDF1, that arose from the whole genome duplication -S000031410 CDS YDL070W 4 331024 332940 W 2011-02-03 1996-07-31 -S000002229 ORF Dubious YDL071C IRC1 chromosome 4 4 331040 330666 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF BDF2/YDL070W -S000031459 CDS YDL071C 4 331040 330666 C 2011-02-03 1996-07-31 -S000002226 ORF Dubious YDL068W chromosome 4 4 333500 333829 W 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030510 CDS YDL068W 4 333500 333829 W 2004-02-11 1996-07-31 -S000002227 ORF Verified YDL069C CBS1 chromosome 4 L000000230 4 333810 333121 C 2004-02-11 2003-09-22|1996-07-31 Mitochondrial translational activator of the COB mRNA; membrane protein that interacts with translating ribosomes, acts on the COB mRNA 5'-untranslated leader -S000030553 CDS YDL069C 4 333810 333121 C 2004-02-11 2003-09-22|1996-07-31 -S000002225 ORF Verified YDL067C COX9 cytochrome c oxidase subunit VIIa chromosome 4 L000000393 4 334396 334217 C 2004-02-11 1996-07-31 Subunit VIIa of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain -S000037632 CDS YDL067C 4 334396 334217 C 2004-02-11 1996-07-31 -S000002224 ORF Verified YDL066W IDP1 isocitrate dehydrogenase (NADP(+)) IDP1 chromosome 4 L000000852 4 334835 336121 W 2004-02-11 1996-07-31 Mitochondrial NADP-specific isocitrate dehydrogenase; catalyzes the oxidation of isocitrate to alpha-ketoglutarate; not required for mitochondrial respiration and may function to divert alpha-ketoglutarate to biosynthetic processes -S000037594 CDS YDL066W 4 334835 336121 W 2004-02-11 1996-07-31 -S000002223 ORF Verified YDL065C PEX19 PAS12 chromosome 4 L000003965 4 337277 336249 C 2006-04-12 1996-07-31|2006-04-12 Chaperone and import receptor for newly-synthesized class I PMPs; binds peroxisomal membrane proteins (PMPs) in the cytoplasm and delivers them to the peroxisome for subsequent insertion into the peroxisomal membrane; interacts with Myo2p and contributes to peroxisome partitioning -S000037387 CDS YDL065C 4 337277 336249 C 2006-04-12 1996-07-31|2006-04-12 -S000002222 ORF Verified YDL064W UBC9 E2 SUMO-conjugating protein UBC9 chromosome 4 L000002636 4 337487 338070 W 2004-02-11 1996-07-31 SUMO-conjugating enzyme involved in the Smt3p conjugation pathway; nuclear protein required for S- and M-phase cyclin degradation and mitotic control; involved in proteolysis mediated by the anaphase-promoting complex cyclosome (APCC) -S000036730 CDS YDL064W 4 337487 337524 W 2004-02-11 1996-07-31 -S000036731 CDS YDL064W 4 337635 338070 W 2004-02-11 1996-07-31 -S000036732 intron YDL064W 4 337525 337634 W 2004-02-11 1996-07-31 -S000002220 ORF Dubious YDL062W chromosome 4 4 339857 340282 W 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YDL063C; YDL062W is not essential -S000036515 CDS YDL062W 4 339857 340282 W 2004-02-11 1996-07-31 -S000002221 ORF Verified YDL063C SYO1 chromosome 4 4 340134 338272 C 2004-02-11 1996-07-31 Transport adaptor or symportin; facilitates synchronized nuclear coimport of the two 5S-rRNA binding proteins Rpl5p and Rpl11p; binds to nascent Rpl5p during translation; required for biogenesis of the large ribosomal subunit; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus -S000036559 CDS YDL063C 4 340134 338272 C 2004-02-11 1996-07-31 -S000002219 ORF Verified YDL061C RPS29B uS14|ribosomal 40S subunit protein S29B|S14|YS29|S36B|S29B|YS29B chromosome 4 L000002550 4 340798 340628 C 2004-02-11 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S29 and bacterial S14; RPS29B has a paralog, RPS29A, that arose from the whole genome duplication -S000035564 CDS YDL061C 4 340798 340628 C 2004-02-11 1996-07-31 -S000122093 five_prime_UTR_intron YDL061C 4 341219 340811 C 2007-04-04 2007-04-04 -S000002218 ORF Verified YDL060W TSR1 chromosome 4 4 341619 343985 W 2004-02-11 1996-07-31 Protein required for processing of 20S pre-rRNA in the cytoplasm; associates with pre-40S ribosomal particles; inhibits the premature association of 60S subunits with assembling 40S subunits in the cytoplasm; similar to Bms1p; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000035549 CDS YDL060W 4 341619 343985 W 2004-02-11 1996-07-31 -S000002217 ORF Verified YDL059C RAD59 chromosome 4 L000003987 4 344953 344237 C 2004-02-11 1996-07-31 Protein involved DNA double-strand break repair; repairs breaks in DNA during vegetative growth via recombination and single-strand annealing; anneals complementary single-stranded DNA; forms nuclear foci upon DNA replication stress; required for loading of Rad52p to DSBs; regulates replication fork progression in DNA ligase I-deficient cells; paralog of Rad52p -S000035590 CDS YDL059C 4 344953 344237 C 2004-02-11 1996-07-31 -S000002216 ORF Verified YDL058W USO1 INT1 chromosome 4 L000002446 4 345665 351037 W 2004-02-11 1996-07-31 Essential protein involved in vesicle-mediated ER to Golgi transport; binds membranes and functions during vesicle docking to the Golgi; required for assembly of the ER-to-Golgi SNARE complex -S000035550 CDS YDL058W 4 345665 351037 W 2004-02-11 1996-07-31 -S000002215 ORF Uncharacterized YDL057W chromosome 4 4 351434 352420 W 2004-02-11 1996-07-31 Putative protein of unknown function; YDL057W is not an essential gene -S000034554 CDS YDL057W 4 351434 352420 W 2004-02-11 1996-07-31 -S000002214 ORF Verified YDL056W MBP1 transcription factor MBP1 chromosome 4 L000001032 4 352877 355378 W 2004-02-11 1996-07-31 Transcription factor; involved in regulation of cell cycle progression from G1 to S phase, forms a complex with Swi6p that binds to MluI cell cycle box regulatory element in promoters of DNA synthesis genes -S000034419 CDS YDL056W 4 352877 355378 W 2004-02-11 1996-07-31 -S000002213 ORF Verified YDL055C PSA1 mannose-1-phosphate guanylyltransferase|SRB1|VIG9|MPG1 chromosome 4 L000002625|L000002860|L000002049 4 356759 355674 C 2004-02-11 1996-07-31 GDP-mannose pyrophosphorylase (mannose-1-phosphate guanyltransferase); synthesizes GDP-mannose from GTP and mannose-1-phosphate in cell wall biosynthesis; required for normal cell wall structure -S000034293 CDS YDL055C 4 356759 355674 C 2004-02-11 1996-07-31 -S000006629 tRNA_gene tK(UUU)D chromosome 4 L000003762|S000007415 4 359577 359672 W 2004-02-11 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034182 intron tK(UUU)D 4 359614 359636 W 2004-02-11 2000-05-19 -S000034180 noncoding_exon tK(UUU)D 4 359577 359613 W 2004-02-11 2000-05-19 -S000034181 noncoding_exon tK(UUU)D 4 359637 359672 W 2004-02-11 2000-05-19 -S000002212 ORF Verified YDL054C MCH1 chromosome 4 4 361285 359825 C 2004-02-11 1996-07-31 Protein with similarity to mammalian monocarboxylate permeases; monocarboxylate permeases are involved in transport of monocarboxylic acids across the plasma membrane but mutant is not deficient in monocarboxylate transport -S000033372 CDS YDL054C 4 361285 359825 C 2004-02-11 1996-07-31 -S000002211 ORF Verified YDL053C PBP4 chromosome 4 4 362256 361699 C 2004-02-11 1996-07-31 Pbp1p binding protein; interacts strongly with Pab1p-binding protein 1 (Pbp1p) in the yeast two-hybrid system; also interacts with Lsm12p in a copurification assay; relative distribution to the nucleus increases upon DNA replication stress -S000033305 CDS YDL053C 4 362256 361699 C 2004-02-11 1996-07-31 -S000002210 ORF Verified YDL052C SLC1 1-acylglycerol-3-phosphate O-acyltransferase SLC1 chromosome 4 L000001914 4 363583 362672 C 2004-02-11 1996-07-31 1-acyl-sn-glycerol-3-phosphate acyltransferase; catalyzes the acylation of lysophosphatidic acid to form phosphatidic acid, a key intermediate in lipid metabolism; enzymatic activity detected in lipid particles and microsomes -S000033244 CDS YDL052C 4 363583 362672 C 2004-02-11 1996-07-31 -S000002209 ORF Verified YDL051W LHP1 YLA1|LAH1 chromosome 4 L000002518 4 363952 364779 W 2004-02-11 1996-07-31 RNA binding protein required for maturation of tRNA and U6 snRNA; acts as a molecular chaperone for RNAs transcribed by polymerase III; homologous to human La (SS-B) autoantigen -S000033227 CDS YDL051W 4 363952 364779 W 2004-02-11 1996-07-31 -S000002208 ORF Dubious YDL050C chromosome 4 4 364817 364446 C 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032313 CDS YDL050C 4 364817 364446 C 2004-02-11 1996-07-31 -S000002207 ORF Verified YDL049C KNH1 chromosome 4 L000002837 4 365874 365068 C 2004-02-11 1996-07-31 Protein with similarity to Kre9p; Kre9p is involved in cell wall beta 1,6-glucan synthesis; overproduction suppresses growth defects of a kre9 null mutant; required for propionic acid resistance -S000031388 CDS YDL049C 4 365874 365068 C 2004-02-11 1996-07-31 -S000002206 ORF Verified YDL048C STP4 chromosome 4 L000003372 4 368211 366739 C 2004-02-11 1999-02-09|1996-07-31 Protein containing a Kruppel-type zinc-finger domain; similar to Stp1p, Stp2p; predicted transcription factor; relative distribution to the nucleus increases upon DNA replication stress; STP4 has a paralog, STP3, that arose from the whole genome duplication -S000031282 CDS YDL048C 4 368211 366739 C 2004-02-11 1999-02-09|1996-07-31 -S000002205 ORF Verified YDL047W SIT4 type 2A-related serine/threonine-protein phosphatase SIT4|PPH1 chromosome 4 L000001901 4 369771 370706 W 2011-02-03 1996-07-31 Ceramide-activated, type 2A-related serine-threonine phosphatase; functions in G1/S transition of mitotic cycle; controls lifespan, mitochondrial function, cell cycle progression by regulating HXK2 phosphorylation; regulator of COPII coat dephosphorylation; required for ER to Golgi traffic; interacts with Hrr25p kinase; cytoplasmic and nuclear protein that modulates functions mediated by Pkc1p including cell wall and actin cytoskeleton organization; similar to human PP6 -S000031218 CDS YDL047W 4 369771 370706 W 2011-02-03 1996-07-31 -S000002204 ORF Verified YDL046W NPC2 sterol transporter chromosome 4 S000028462 4 371240 371761 W 2011-02-03 1996-07-31 Sterol transport protein and functional homolog of human NPC2/He1; human NPC2 is a cholesterol-binding protein whose deficiency causes Niemann-Pick type C2 disease involving retention of cholesterol in lysosomes; yeast NPC2 can complement mutations in human NPC2 -S000031100 CDS YDL046W 4 371240 371761 W 2011-02-03 1996-07-31 -S000006430 ORF Verified YDL045W-A MRP10 mitochondrial 37S ribosomal protein YmS-T|YmS-T chromosome 4 L000003390 4 372248 372535 W 2011-02-03 1999-07-17 Mitochondrial ribosomal protein of the small subunit; contains twin cysteine-x9-cysteine motifs; oxidized by Mia40p during import into mitochondria -S000032810 CDS YDL045W-A 4 372248 372535 W 2011-02-03 1999-07-17 -S000002203 ORF Verified YDL045C FAD1 FMN adenylyltransferase chromosome 4 L000000598 4 373608 372688 C 2011-02-03 1996-07-31 Flavin adenine dinucleotide (FAD) synthetase; performs the second step in synthesis of FAD from riboflavin; mutation is functionally complemented by human FLAD1 -S000030018 CDS YDL045C 4 373608 372688 C 2011-02-03 1996-07-31 -S000002202 ORF Verified YDL044C MTF2 NAM1 chromosome 4 L000001212 4 375289 373967 C -17.93 2011-02-03 1996-07-31 Mitochondrial protein that interacts with mitochondrial RNA polymerase; interacts with an N-terminal region of mitochondrial RNA polymerase (Rpo41p) and couples RNA processing and translation to transcription -S000029908 CDS YDL044C 4 375289 373967 C 2011-02-03 1996-07-31 -S000002201 ORF Verified YDL043C PRP11 RNA11 chromosome 4 L000001502 4 376480 375680 C -17.13 2011-02-03 1996-07-31 Subunit of the SF3a splicing factor complex; required for spliceosome assembly -S000037237 CDS YDL043C 4 376480 375680 C 2011-02-03 1996-07-31 -S000002199 ORF Dubious YDL041W chromosome 4 4 378102 378455 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SIR2/YDL042C -S000037091 CDS YDL041W 4 378102 378455 W 2011-02-03 1996-07-31 -S000002200 ORF Verified YDL042C SIR2 NAD-dependent histone deacetylase SIR2|MAR1 chromosome 4 L000001895 4 378445 376757 C -16.03 2011-02-03 1996-07-31 Conserved NAD+ dependent histone deacetylase of the Sirtuin family; deacetylation targets are primarily nuclear proteins; required for telomere hypercluster formation in quiescent yeast cells; involved in regulation of lifespan; plays roles in silencing at HML, HMR, telomeres, and rDNA; negatively regulates initiation of DNA replication; functions as regulator of autophagy like mammalian homolog SIRT1, and also of mitophagy -S000037155 CDS YDL042C 4 378445 376757 C 2011-02-03 1996-07-31 -S000002198 ORF Verified YDL040C NAT1 peptide alpha-N-acetyltransferase complex A subunit NAT1|NAA15|AAA1 chromosome 4 L000000002 4 381438 378874 C -14.93 2011-02-03 1996-07-31 Subunit of protein N-terminal acetyltransferase NatA; NatA comprised of Nat1p, Ard1p, and Nat5p; N-terminally acetylates many proteins to influence multiple processes such as cell cycle progression, heat-shock resistance, mating, sporulation, telomeric silencing and early stages of mitophagy; orthologous to human NAA15; expression of both human NAA10 and NAA15 functionally complements ard1 nat1 double mutant although single mutations are not complemented by their orthologs -S000036986 CDS YDL040C 4 381438 378874 C 2011-02-03 1996-07-31 -S000002197 ORF Verified YDL039C PRM7 pheromone-regulated protein PRM7|YDL038C chromosome 4 4 384081 381985 C 2011-02-03 1996-07-31|2008-06-05 Pheromone-regulated protein; predicted to have one transmembrane segment; promoter contains Gcn4p binding elements; in W303 strain one continuous open reading frame comprising of YDL037C, the intergenic region and YDL039C encodes the IMI1 -S000035141 CDS YDL039C 4 384081 381985 C 2011-02-03 1996-07-31|2008-06-05 -S000002195 ORF Verified YDL037C BSC1 chromosome 4 4 385587 384601 C 2011-02-03 1996-07-31 Protein of unconfirmed function; similar to cell surface flocculin Flo11p; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; in W303 strain one continuous open reading frame comprising of YDL037C, the intergenic region and YDL039C encodes the gene IMI1 -S000034059 CDS YDL037C 4 385587 384601 C 2011-02-03 1996-07-31 -S000002194 ORF Verified YDL036C PUS9 pseudouridine synthase PUS9 chromosome 4 4 388901 387513 C 2011-02-03 1996-07-31 Mitochondrial tRNA:pseudouridine synthase; catalyzes the formation of pseudouridine at position 32 in mitochondrial tRNAs; contains an N-terminal mitochondrial targeting sequence; PUS9 has a paralog, RIB2, that arose from the whole genome duplication -S000033903 CDS YDL036C 4 388901 387513 C 2011-02-03 1996-07-31 -S000002192 ORF Dubious YDL034W chromosome 4 4 391783 392127 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps with verified gene GPR1/YDL035C; YDL034W is not an essential gene -S000033108 CDS YDL034W 4 391783 392127 W 2011-02-03 1996-07-31 -S000002193 ORF Verified YDL035C GPR1 chromosome 4 L000004298 4 392057 389172 C 2011-02-03 1996-07-31 Plasma membrane G protein coupled receptor (GPCR); interacts with the heterotrimeric G protein alpha subunit, Gpa2p, and with Plc1p; sensor that integrates nutritional signals with the modulation of cell fate via PKA and cAMP synthesis -S000033783 CDS YDL035C 4 392057 389172 C 2011-02-03 1996-07-31 -S000002190 ORF Dubious YDL032W chromosome 4 4 393690 394001 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene SLM3/YDL033C; YDL032W is not an essential gene -S000032947 CDS YDL032W 4 393690 394001 W 2011-02-03 1996-07-31 -S000002191 ORF Verified YDL033C SLM3 tRNA-5-taurinomethyluridine 2-sulfurtransferase|MTU1|MTO2 chromosome 4 4 393912 392659 C 2011-02-03 1996-07-31 tRNA-specific 2-thiouridylase; responsible for 2-thiolation of the wobble base of mitochondrial tRNAs; human homolog TRMU is implicated in myoclonus epilepsy associated with ragged red fibers (MERRF), and can complement yeast null mutant -S000032981 CDS YDL033C 4 393912 392659 C 2011-02-03 1996-07-31 -S000002189 ORF Verified YDL031W DBP10 putative ATP-dependent RNA helicase DBP10 chromosome 4 L000004557 4 394217 397204 W 2011-02-03 1996-07-31|2011-02-03 Putative ATP-dependent RNA helicase of the DEAD-box protein family; constituent of 66S pre-ribosomal particles; essential protein involved in ribosome biogenesis -S000032837 CDS YDL031W 4 394217 397204 W 2011-02-03 1996-07-31|2011-02-03 -S000002188 ORF Verified YDL030W PRP9 SF3a splicing factor complex subunit PRP9 chromosome 4 L000001501 4 397537 399129 W 2011-02-03 1996-07-31 Subunit of the SF3a splicing factor complex; required for spliceosome assembly; acts after the formation of the U1 snRNP-pre-mRNA complex -S000031920 CDS YDL030W 4 397537 399129 W 2011-02-03 1996-07-31 -S000002187 ORF Verified YDL029W ARP2 actin-related protein 2|ACT2 chromosome 4 L000000026 4 399340 400638 W 2011-02-03 1996-07-31 Essential component of the Arp2/3 complex; Arp2/3 is a highly conserved actin nucleation center required for the motility and integrity of actin patches; involved in endocytosis and membrane growth and polarity; required for efficient Golgi-to-ER trafficking in COPI mutants -S000032598 CDS YDL029W 4 399340 399361 W 2011-02-03 1996-07-31 -S000032599 CDS YDL029W 4 399485 400638 W 2011-02-03 1996-07-31 -S000032600 intron YDL029W 4 399362 399484 W 2011-02-03 1996-07-31 -S000002186 ORF Verified YDL028C MPS1 serine/threonine/tyrosine protein kinase MPS1|PAC8|RPK1 chromosome 4 L000001698 4 403291 400997 C 2011-02-03 1996-07-31|2011-02-03 Dual-specificity kinase; autophosphorylation required for function; required for spindle pole body (SPB) duplication and spindle checkpoint function; contributes to bi-orientation by promoting formation of force-generating kinetochore-microtubule attachments in meiosis I; substrates include SPB proteins Spc42p, Spc110p, and Spc98p, mitotic exit network protein Mob1p, kinetochore protein Cnn1p, and checkpoint protein Mad1p; substrate of APCC(Cdh1); similar to human Mps1p -S000031526 CDS YDL028C 4 403291 400997 C 2011-02-03 1996-07-31|2011-02-03 -S000002184 ORF Dubious YDL026W chromosome 4 4 404749 405060 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031360 CDS YDL026W 4 404749 405060 W 2011-02-03 1996-07-31 -S000002185 ORF Uncharacterized YDL027C MRX9 chromosome 4 4 404957 403695 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YDL027C is not an essential gene -S000031399 CDS YDL027C 4 404957 403695 C 2011-02-03 1996-07-31 -S000028610 ORF Dubious YDL025W-A chromosome 4 4 405410 405514 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the ORF YDL025C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031440 CDS YDL025W-A 4 405410 405514 W 2011-02-03 2003-07-29 -S000002183 ORF Verified YDL025C RTK1 putative serine/threonine protein kinase RTK1 chromosome 4 4 407206 405344 C 2011-02-03 1996-07-31 Putative protein kinase, potentially phosphorylated by Cdc28p; interacts with ribosome biogenesis factors, Cka2, Gus1 and Arc1; protein abundance increases in response to DNA replication stress -S000030352 CDS YDL025C 4 407206 405344 C 2011-02-03 1996-07-31 -S000118433 ARS ARS414 ARSIV-408 chromosome 4 4 408075 408316 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000002182 ORF Verified YDL024C DIA3 putative acid phosphatase DIA3 chromosome 4 4 409857 408451 C 2011-02-03 1996-07-31 Protein of unknown function; involved in invasive and pseudohyphal growth -S000030155 CDS YDL024C 4 409857 408451 C 2011-02-03 1996-07-31 -S000028537 ORF Uncharacterized YDL022C-A chromosome 4 4 410056 409808 C 2011-02-03 2003-07-29 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cytosol; partially overlaps the verified gene DIA3; identified by fungal homology and RT-PCR; mRNA identified as translated by ribosome profiling data -S000031146 CDS YDL022C-A 4 410056 409808 C 2011-02-03 2003-07-29 -S000006510 tRNA_gene tA(AGC)D chromosome 4 L000003763 4 410379 410451 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032254 noncoding_exon tA(AGC)D 4 410379 410451 W 2011-02-03 2000-05-19 -S000002180 ORF Verified YDL022W GPD1 glycerol-3-phosphate dehydrogenase (NAD(+)) GPD1|OSR5|OSG1|HOR1|DAR1 chromosome 4 L000000722 4 411825 413000 W 2011-02-03 1996-07-31 NAD-dependent glycerol-3-phosphate dehydrogenase; key enzyme of glycerol synthesis, essential for growth under osmotic stress; expression regulated by high-osmolarity glycerol response pathway; protein abundance increases in response to DNA replication stress; constitutively inactivated via phosphorylation by the protein kinases Ypk1p and Ypk2p, dephosphorylation increases catalytic activity; forms a heterodimer with Pnc1p to facilitate its peroxisomal import -S000037411 CDS YDL022W 4 411825 413000 W 2011-02-03 1996-07-31 -S000002181 ORF Dubious YDL023C SRF4 chromosome 4 4 412081 411761 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in other Saccharomyces species; overlaps the verified gene GPD1; deletion confers sensitivity to GSAO; deletion in cyr1 mutant results in loss of stress resistance -S000037466 CDS YDL023C 4 412081 411761 C 2011-02-03 1996-07-31 -S000002179 ORF Verified YDL021W GPM2 phosphoglycerate mutase family protein GPM2 chromosome 4 L000003294 4 413953 414888 W 2011-02-03 1996-07-31 Homolog of Gpm1p phosphoglycerate mutase; converts 3-phosphoglycerate to 2-phosphoglycerate in glycolysis; may be non-functional; GPM2 has a paralog, GPM3, that arose from the whole genome duplication -S000037296 CDS YDL021W 4 413953 414888 W 2011-02-03 1996-07-31 -S000002178 ORF Verified YDL020C RPN4 stress-regulated transcription factor RPN4|UFD5|SON1 chromosome 4 L000001984 4 416708 415113 C 2011-02-03 1996-07-31 Transcription factor that stimulates expression of proteasome genes; Rpn4p levels are in turn regulated by the 26S proteasome in a negative feedback control mechanism; RPN4 is transcriptionally regulated by various stress responses; relative distribution to the nucleus increases upon DNA replication stress -S000036564 CDS YDL020C 4 416708 415113 C 2011-02-03 1996-07-31 -S000002177 ORF Verified YDL019C OSH2 oxysterol-binding protein related protein OSH2 chromosome 4 4 421514 417663 C 2011-02-03 1996-07-31 Member of an oxysterol-binding protein family with seven members; in S. cerevisiae, family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; contains FFAT motif; interacts with ER anchor Scs2p at patches at the plasma membrane and at the nuclear envelope; regulated by sterol binding; OSH2 has a paralog, SWH1, that arose from the whole genome duplication -S000035539 CDS YDL019C 4 421514 417663 C 2011-02-03 1996-07-31 -S000002176 ORF Verified YDL018C ERP3 chromosome 4 L000004680 4 423510 422833 C 2011-02-03 1996-07-31 Protein with similarity to Emp24p and Erv25p; member of the p24 family involved in ER to Golgi transport -S000035452 CDS YDL018C 4 423510 422833 C 2011-02-03 1996-07-31 -S000002175 ORF Verified YDL017W CDC7 serine/threonine protein kinase CDC7|SAS1|LSD6 chromosome 4 L000000247 4 424209 425732 W -1 2011-02-03 1996-07-31 DDK (Dbf4-dependent kinase) catalytic subunit; required for origin firing and replication fork progression in mitotic S phase through phosphorylation of Mcm2-7p complexes and Cdc45p; kinase activity correlates with cyclical DBF4 expression; required for pre-meiotic DNA replication, meiotic DSB formation, recruitment of monopolin complex to kinetochores during meiosis I, regulation of meiosis-specific Ndt80p; mutation complemented by human CDC7 and DBF4 co-expression -S000035373 CDS YDL017W 4 424209 425732 W 2011-02-03 1996-07-31 -S000002174 ORF Dubious YDL016C chromosome 4 4 425872 425570 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CDC7/YDL153C, the catalytic subunit of a complex that regulates DNA replication -S000034291 CDS YDL016C 4 425872 425570 C 2011-02-03 1996-07-31 -S000002173 ORF Verified YDL015C TSC13 trans-2-enoyl-CoA reductase (NADPH) TSC13 chromosome 4 4 426934 426002 C 2011-02-03 1996-07-31 Enoyl reductase; catalyzes last step in each cycle of very long chain fatty acid elongation; localizes to ER, highly enriched in a structure marking nuclear-vacuolar junctions; coimmunoprecipitates with elongases Elo2p and Elo3p; protein increases in abundance and relative distribution to ER foci increases upon DNA replication stress; human homolog TECR implicated in nonsyndromic mental retardation, can complement yeast mutant -S000034157 CDS YDL015C 4 426934 426002 C 2011-02-03 1996-07-31 -S000002172 ORF Verified YDL014W NOP1 rRNA methyltransferase NOP1|LOT3 chromosome 4 L000001260 4 427364 428347 W -1.93 2011-02-03 1996-07-31 Histone glutamine methyltransferase, modifies H2A at Q105 in nucleolus; component of the small subunit processome complex, which is required for processing of pre-18S rRNA; ortholog of mammalian fibrillarin; inviability of the null mutant is functionally complemented by human FBL -S000034123 CDS YDL014W 4 427364 428347 W 2011-02-03 1996-07-31 -S000002171 ORF Verified YDL013W SLX5 SUMO-targeted ubiquitin ligase complex subunit SLX5|ULS2|HEX3 chromosome 4 L000000768 4 429067 430926 W -1.69 2011-02-03 1996-07-31 Subunit of the Slx5-Slx8 SUMO-targeted Ub ligase (STUbL) complex; role in Ub-mediated degradation of histone variant Cse4p preventing mislocalization to euchromatin; role in proteolysis of spindle positioning protein Kar9p, and DNA repair proteins Rad52p and Rad57p; forms SUMO-dependent nuclear foci, including DNA repair centers; contains a RING domain and two SIM motifs; associates with the centromere; required for maintenance of genome integrity like human ortholog RNF4 -S000033268 CDS YDL013W 4 429067 430926 W 2011-02-03 1996-07-31 -S000002170 ORF Verified YDL012C chromosome 4 4 431517 431108 C 2011-02-03 1996-07-31 Tail-anchored plasma membrane protein with a conserved CYSTM module; possibly involved in response to stress; may contribute to non-homologous end-joining (NHEJ) based on ydl012c htz1 double null phenotype; YDL012C has a paralog, YBR016W, that arose from the whole genome duplication -S000033170 CDS YDL012C 4 431386 431108 C 2011-02-03 1996-07-31 -S000033169 CDS YDL012C 4 431517 431473 C 2011-02-03 1996-07-31 -S000033171 intron YDL012C 4 431472 431387 C 2011-02-03 1996-07-31 -S000002168 ORF Verified YDL010W GRX6 glutathione-disulfide reductase GRX6 chromosome 4 4 432330 433025 W 2011-02-03 1996-07-31 Cis-golgi localized monothiol glutaredoxin, binds Fe-S cluster; more similar in activity to dithiol than other monothiol glutaredoxins; involved in the oxidative stress response; GRX6 has a paralog, GRX7, that arose from the whole genome duplication -S000032278 CDS YDL010W 4 432330 433025 W 2011-02-03 1996-07-31 -S000002169 ORF Dubious YDL011C chromosome 4 4 432631 432308 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized ORF YDL010W -S000032316 CDS YDL011C 4 432631 432308 C 2011-02-03 1996-07-31 -S000002167 ORF Uncharacterized YDL009C chromosome 4 4 433248 432925 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data; SWAT-GFP and mCherry fusion proteins localize to the cytosol; partially overlaps the verified ORF YDL010W; YDL009C is not an essential gene -S000032265 CDS YDL009C 4 433248 432925 C 2011-02-03 1996-07-31 -S000002166 ORF Verified YDL008W APC11 anaphase promoting complex subunit 11 chromosome 4 L000004322 4 433497 433994 W 2011-02-03 1996-07-31 Catalytic core subunit, Anaphase-Promoting Complex/Cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; contains a RING-H2 domain that is required for activity -S000032227 CDS YDL008W 4 433497 433994 W 2011-02-03 1996-07-31 -S000006739 tRNA_gene tT(AGU)D chromosome 4 L000003788 4 434336 434264 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000032153 noncoding_exon tT(AGU)D 4 434336 434264 C 2011-02-03 2000-05-19 -S000006842 long_terminal_repeat YDLCdelta1 chromosome 4 4 434739 434423 C 2011-02-03 2000-05-19 Ty1 LTR -S000130173 ARS ARS415 chromosome 4 4 434971 435320 2014-11-18 2014-11-18|2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000113557 ORF Uncharacterized YDL007C-A chromosome 4 4 436824 436567 C 2011-02-03 2005-11-17 Putative protein of unknown function -S000113558 CDS YDL007C-A 4 436824 436567 C 2011-02-03 2005-11-17 -S000006843 long_terminal_repeat YDLWtau1 chromosome 4 4 437149 437518 W 2011-02-03 2000-05-19 Ty4 LTR -S000006721 tRNA_gene tS(AGA)D1 chromosome 4 L000003764 4 437772 437853 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000031630 noncoding_exon tS(AGA)D1 4 437772 437853 W 2011-02-03 2000-05-19 -S000002165 ORF Verified YDL007W RPT2 proteasome regulatory particle base subunit RPT2|YTA5|YHS4 chromosome 4 L000002559 4 438047 439360 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; required for normal peptide hydrolysis by the core 20S particle; N-myristoylation of Rpt2p at Gly2 is involved in regulating the proper intracellular distribution of proteasome activity by controlling the nuclear localization of the 26S proteasome -S000031210 CDS YDL007W 4 438047 439360 W 2011-02-03 1996-07-31 -S000002164 ORF Verified YDL006W PTC1 type 2C protein phosphatase PTC1|TPD1|KCS2|CWH47 chromosome 4 L000000890|L000001523 4 439909 440754 W 2011-02-03 1996-07-31 Type 2C protein phosphatase (PP2C); dephosphorylates Hog1p, inactivating osmosensing MAPK cascade; involved in Fus3p activation during pheromone response; deletion affects precursor tRNA splicing, mitochondrial inheritance, and sporulation -S000031084 CDS YDL006W 4 439909 440754 W 2011-02-03 1996-07-31 -S000002163 ORF Verified YDL005C MED2 chromosome 4 L000003914 4 442309 441014 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; relocalizes to the cytosol in response to hypoxia -S000030042 CDS YDL005C 4 442309 441014 C 2011-02-03 1996-07-31 -S000002162 ORF Verified YDL004W ATP16 F1F0 ATP synthase subunit delta chromosome 4 L000000150 4 443029 443511 W 2011-02-03 1996-07-31 Delta subunit of the central stalk of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated -S000030001 CDS YDL004W 4 443029 443511 W 2011-02-03 1996-07-31 -S000002161 ORF Verified YDL003W MCD1 kleisin alpha|SCC1|RHC21|PDS3 chromosome 4 L000002676 4 444683 446383 W 2011-02-03 1996-07-31 Essential alpha-kleisin subunit of the cohesin complex; required for sister chromatid cohesion in mitosis and meiosis; apoptosis induces cleavage and translocation of a C-terminal fragment to mitochondria; expression peaks in S phase -S000029870 CDS YDL003W 4 444683 446383 W 2011-02-03 1996-07-31 -S000002160 ORF Verified YDL002C NHP10 HMO2 chromosome 4 L000002765 4 447578 446967 C 2011-02-03 1996-07-31 Non-essential INO80 chromatin remodeling complex subunit; preferentially binds DNA ends, protecting them from exonucleatic cleavage; deletion affects telomere maintenance via recombination; related to mammalian high mobility group proteins -S000037122 CDS YDL002C 4 447578 446967 C 2011-02-03 1996-07-31 -S000002159 ORF Verified YDL001W RMD1 chromosome 4 4 447984 449276 W 2011-02-03 1996-07-31 Cytoplasmic protein required for sporulation -S000037078 CDS YDL001W 4 447984 449276 W 2011-02-03 1996-07-31 -S000006466 centromere CEN4 CEN4 chromosome 4 L000000297 4 449711 449821 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome IV centromere -S000077266 centromere_DNA_Element_I CEN4 4 449711 449720 W 2011-02-03 2004-10-04 -S000077267 centromere_DNA_Element_II CEN4 4 449721 449796 W 2011-02-03 2004-10-04 -S000077268 centromere_DNA_Element_III CEN4 4 449797 449821 W 2011-02-03 2004-10-04 -S000002408 ORF Verified YDR001C NTH1 alpha,alpha-trehalase NTH1 chromosome 4 L000001280 4 452475 450220 C 2011-02-03 1996-07-31 Neutral trehalase, degrades trehalose; required for thermotolerance and may mediate resistance to other cellular stresses; phosphorylated and activated by Cdc28p at the G1/S phase transition to coordinately regulate carbohydrate metabolism and the cell cycle; inhibited by Dcs1p; NTH1 has a paralog, NTH2, that arose from the whole genome duplication -S000033545 CDS YDR001C 4 452475 450220 C 2011-02-03 1996-07-31 -S000002409 ORF Verified YDR002W YRB1 Ran GTPase-binding protein YRB1|STP52|SFO1|HTN1|CST20 chromosome 4 L000001871|S000029527|L000002134 4 453045 453650 W 2011-02-03 1996-07-31 Ran GTPase binding protein; involved in nuclear protein import and RNA export, ubiquitin-mediated protein degradation during the cell cycle; shuttles between the nucleus and cytoplasm; is essential; homolog of human RanBP1 -S000034475 CDS YDR002W 4 453045 453650 W 2011-02-03 1996-07-31 -S000002410 ORF Verified YDR003W RCR2 SSH5 chromosome 4 S000029511|L000002952 4 454122 454754 W 2011-02-03 1996-07-31 Vacuolar protein; presumably functions within the endosomal-vacuolar trafficking pathway, affecting events that determine whether plasma membrane proteins are degraded or routed to the plasma membrane; RCR2 has a paralog, RCR1, that arose from the whole genome duplication -S000034587 CDS YDR003W 4 454122 454754 W 2011-02-03 1996-07-31 -S000028819 ORF Uncharacterized YDR003W-A chromosome 4 4 454782 454904 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000033630 CDS YDR003W-A 4 454782 454904 W 2011-02-03 2003-07-29 -S000002411 ORF Verified YDR004W RAD57 putative DNA-dependent ATPase RAD57 chromosome 4 L000001577 4 455201 456583 W 2 2011-02-03 1996-07-31 Protein that stimulates strand exchange; stimulates strand exchange by stabilizing the binding of Rad51p to single-stranded DNA; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; forms heterodimer with Rad55p -S000034681 CDS YDR004W 4 455201 456583 W 2011-02-03 1996-07-31 -S000002412 ORF Verified YDR005C MAF1 RNA polymerase III-inhibiting protein MAF1 chromosome 4 L000002614 4 458103 456836 C 2011-02-03 1996-07-31 Highly conserved negative regulator of RNA polymerase III; involved in tRNA processing and stability; inhibits tRNA degradation via rapid tRNA decay (RTD) pathway; binds N-terminal domain of Rpc160p subunit of Pol III to prevent closed-complex formation; regulated by phosphorylation mediated by TORC1, protein kinase A, Sch9p, casein kinase 2; localizes to cytoplasm during vegetative growth and translocates to nucleus and nucleolus under stress conditions -S000034763 CDS YDR005C 4 458017 456836 C 2011-02-03 1996-07-31 -S000034762 CDS YDR005C 4 458103 458098 C 2011-02-03 1996-07-31 -S000034764 intron YDR005C 4 458097 458018 C 2011-02-03 1996-07-31 -S000002413 ORF Verified YDR006C SOK1 chromosome 4 L000001983 4 461247 458542 C 2011-02-03 1996-07-31 Protein of unknown function; overexpression suppresses the growth defect of mutants lacking protein kinase A activity; involved in cAMP-mediated signaling; localized to the nucleus; similar to the mouse testis-specific protein PBS13 -S000035723 CDS YDR006C 4 461247 458542 C 2011-02-03 1996-07-31 -S000002414 ORF Verified YDR007W TRP1 phosphoribosylanthranilate isomerase TRP1 chromosome 4 L000002352 4 461842 462516 W 1 2011-02-03 2004-02-11|1996-07-31 Phosphoribosylanthranilate isomerase; catalyzes the third step in tryptophan biosynthesis; in 2004, the sequence of TRP1 from strain S228C was updated by changing the previously annotated internal STOP (TAA) to serine (TCA); enhances vegetative growth at low and high temperatures when used as an auxotrophic marker in strains such as W303 -S000035920 CDS YDR007W 4 461842 462516 W 2011-02-03 2004-02-11|1996-07-31 -S000029652 ARS ARS416 ARS1 chromosome 4 S000007454 4 462567 462622 2014-11-18 2014-11-18|2006-04-10 Early-firing autonomously replicating sequence; highly efficient chromosomal replicator active in nearly every cell cycle -S000121228 ARS_consensus_sequence ARS416 4 462606 462596 C 2011-02-03 2007-03-06 -S000002415 ORF Dubious YDR008C chromosome 4 4 462602 462252 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps TRP1/YDR007W on opposite strand -S000035999 CDS YDR008C 4 462602 462252 C 2011-02-03 1996-07-31 -S000002416 ORF Verified YDR009W GAL3 transcriptional regulator GAL3 chromosome 4 L000000660 4 463434 464996 W 1 2011-02-03 1996-07-31 Transcriptional regulator; involved in activation of the GAL genes in response to galactose; forms a complex with Gal80p to relieve Gal80p inhibition of Gal4p; binds galactose and ATP but does not have galactokinase activity; GAL3 has a paralog, GAL1, that arose from the whole genome duplication -S000037895 CDS YDR009W 4 463434 464996 W 2011-02-03 1996-07-31 -S000002417 ORF Dubious YDR010C chromosome 4 4 465383 465051 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037562 CDS YDR010C 4 465383 465051 C 2011-02-03 1996-07-31 -S000002418 ORF Verified YDR011W SNQ2 ATP-binding cassette transporter SNQ2 chromosome 4 L000001957 4 465919 470424 W 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; multidrug transporter involved in multidrug resistance and resistance to singlet oxygen species -S000037672 CDS YDR011W 4 465919 470424 W 2011-02-03 1996-07-31 -S000002419 ORF Verified YDR012W RPL4B uL4|ribosomal 60S subunit protein L4B|L4|rp2|YL2|L4B|L2B chromosome 4 L000001702 4 471853 472941 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L4B; homologous to mammalian ribosomal protein L4 and bacterial L4; RPL4B has a paralog, RPL4A, that arose from the whole genome duplication -S000037729 CDS YDR012W 4 471853 472941 W 2011-02-03 1996-07-31 -S000002420 ORF Verified YDR013W PSF1 DNA replication protein PSF1|CDC101 chromosome 4 4 473157 473783 W 2011-02-03 1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery -S000037779 CDS YDR013W 4 473157 473783 W 2011-02-03 1996-07-31 -S000002421 ORF Verified YDR014W RAD61 WPL1 chromosome 4 4 474046 475989 W 2011-02-03 1996-07-31 Subunit of a complex that inhibits sister chromatid cohesion; also negatively regulates chromosome condensation; inhibited by Eco1p-acetylated cohesin subunits Smc3p and Mcd1p; binds Smc3p ATPase head of cohesin; related to the human Wapl protein that controls the association of cohesin with chromatin -S000030660 CDS YDR014W 4 474046 475989 W 2011-02-03 1996-07-31 -S000113613 ORF Verified YDR014W-A HED1 chromosome 4 4 477797 478285 W 2011-02-03 2006-04-14 Meiosis-specific protein; down-regulates Rad51p-mediated mitotic recombination when the meiotic recombination machinery is impaired; promotes synapsis and required for the normal morphogenesis of synaptonemal complex; prevents the recruitment of Rad54p to site-specific DNA double-strand breaks in vivo; early meiotic gene, transcribed specifically during meiotic prophase -S000114898 CDS YDR014W-A 4 477797 478285 W 2011-02-03 2006-04-14 -S000002422 ORF Dubious YDR015C chromosome 4 4 478199 477960 C 2011-02-03 1996-07-31|2006-04-13 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene HED1/YDR014W-A -S000030702 CDS YDR015C 4 478199 477960 C 2011-02-03 1996-07-31|2006-04-13 -S000002423 ORF Verified YDR016C DAD1 chromosome 4 4 478758 478474 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis -S000030807 CDS YDR016C 4 478758 478474 C 2011-02-03 1996-07-31 -S000002424 ORF Verified YDR017C KCS1 inositol polyphosphate kinase KCS1 chromosome 4 L000000889 4 482267 479115 C 2011-02-03 1996-07-31 Inositol hexakisphosphate and inositol heptakisphosphate kinase; generation of high energy inositol pyrophosphates by Kcs1p is required for many processes such as vacuolar biogenesis, stress response, RNA polymerase I-mediated rRNA transcription and telomere maintenance; inositol hexakisphosphate is also known as IP6; inositol heptakisphosphate is also known as IP7 -S000031751 CDS YDR017C 4 482267 479115 C 2011-02-03 1996-07-31 -S000002425 ORF Uncharacterized YDR018C putative acyltransferase chromosome 4 4 483860 482670 C 2011-02-03 1996-07-31 Probable membrane protein with three predicted transmembrane domains; similar to C. elegans F55A11.5 and maize 1-acyl-glycerol-3-phosphate acyltransferase; YDR018C has a paralog, CST26, that arose from the whole genome duplication -S000031907 CDS YDR018C 4 483860 482670 C 2011-02-03 1996-07-31 -S000118434 ARS ARS417 ARSIV-484 chromosome 4 4 484006 484059 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178068 ARS_consensus_sequence ARS417 4 484035 484019 C 2014-11-18 2014-11-18 -S000002426 ORF Verified YDR019C GCV1 glycine decarboxylase subunit T|GSD1 chromosome 4 L000002736 4 485365 484163 C 2011-02-03 1996-07-31 T subunit of the mitochondrial glycine decarboxylase complex; glycine decarboxylase is required for the catabolism of glycine to 5,10-methylene-THF; expression is regulated by levels of levels of 5,10-methylene-THF in the cytoplasm -S000032068 CDS YDR019C 4 485365 484163 C 2011-02-03 1996-07-31 -S000002427 ORF Uncharacterized YDR020C DAS2 putative uridine kinase DAS2|RRT3 chromosome 4 4 486444 485746 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; weak similarity with uridine kinases and with phosphoribokinases -S000032817 CDS YDR020C 4 486444 485746 C 2011-02-03 1996-07-31 -S000002428 ORF Verified YDR021W FAL1 ATP-dependent RNA helicase FAL1 chromosome 4 L000003480 4 486804 488003 W 2011-02-03 1996-07-31 Nucleolar protein required for maturation of 18S rRNA; member of the eIF4A subfamily of DEAD-box ATP-dependent RNA helicases; 18S rRNA biogenesis defect of the null mutant is functionally complemented by human EIF4A3 -S000032973 CDS YDR021W 4 486804 488003 W 2011-02-03 1996-07-31 -S000002429 ORF Verified YDR022C ATG31 CIS1 chromosome 4 L000003475 4 488662 488072 C 2011-02-03 1996-07-31 Autophagy-specific protein required for autophagosome formation; forms a complex with Atg17p and Atg29p that localizes other proteins to the pre-autophagosomal structure; constitutively phosphorylated, and phosphorylation of residue S174 is required for function; high-copy suppressor of CIK1 deletion -S000033002 CDS YDR022C 4 488662 488072 C 2011-02-03 1996-07-31 -S000006770 tRNA_gene tV(UAC)D chromosome 4 L000003787 4 488870 488797 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000036290 noncoding_exon tV(UAC)D 4 488870 488797 C 2011-02-03 2000-05-19 -S000002430 ORF Verified YDR023W SES1 serine--tRNA ligase SES1|SerRS chromosome 4 L000001867 4 489508 490896 W 2011-02-03 1996-07-31 Cytosolic seryl-tRNA synthetase; class II aminoacyl-tRNA synthetase that aminoacylates tRNA(Ser), displays tRNA-dependent amino acid recognition which enhances discrimination of the serine substrate, interacts with peroxin Pex21p -S000033710 CDS YDR023W 4 489508 490896 W 2011-02-03 1996-07-31 -S000002431 ORF Dubious YDR024W FYV1 chromosome 4 4 491017 491502 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; mutation decreases survival upon exposure to K1 killer toxin -S000033822 CDS YDR024W 4 491017 491502 W 2011-02-03 1996-07-31 -S000002432 ORF Verified YDR025W RPS11A uS17|ribosomal 40S subunit protein S11A|S17|rp41A|YS12|S18A|S11A chromosome 4 L000001757 4 491515 492324 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S11 and bacterial S17; N-terminally propionylated in vivo; RPS11A has a paralog, RPS11B, that arose from the whole genome duplication -S000033919 CDS YDR025W 4 491515 491559 W 2011-02-03 1996-07-31 -S000033920 CDS YDR025W 4 491899 492324 W 2011-02-03 1996-07-31 -S000033921 intron YDR025W 4 491560 491898 W 2011-02-03 1996-07-31 -S000002433 ORF Verified YDR026C NSI1 YTT1 chromosome 4 4 494268 492556 C 2011-02-03 1996-07-31 RNA polymerase I termination factor; binds to rDNA terminator element, required for efficient Pol I termination; required for rDNA silencing at NTS1; facilities association of Sir2p with NTS1, contributes to rDNA stability and cell longevity; interacts physically with Fob1p and RENT subunits, Sir2p and Net1p; may interact with ribosomes, based on co-purification experiments; Myb-like DNA-binding protein; NSI1 has a paralog, REB1, that arose from the whole genome duplication -S000033977 CDS YDR026C 4 494268 492556 C 2011-02-03 1996-07-31 -S000002434 ORF Verified YDR027C VPS54 TCS3|CGP1|LUV1 chromosome 4 L000004648 4 497318 494649 C 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; potentially phosphorylated by Cdc28p; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p -S000034876 CDS YDR027C 4 497318 494649 C 2011-02-03 1996-07-31 -S000002435 ORF Verified YDR028C REG1 protein phosphatase regulator REG1|SRN1|SPP43|PZF240|HEX2 chromosome 4 L000001609 4 500879 497835 C 2.79 2011-02-03 1996-07-31 Regulatory subunit of type 1 protein phosphatase Glc7p; involved in negative regulation of glucose-repressible genes; involved in regulation of the nucleocytoplasmic shuttling of Hxk2p; REG1 has a paralog, REG2, that arose from the whole genome duplication -S000035027 CDS YDR028C 4 500879 497835 C 2011-02-03 1996-07-31 -S000002436 ORF Uncharacterized YDR029W chromosome 4 4 501100 501414 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR029W is not an essential gene -S000035276 CDS YDR029W 4 501100 501414 W 2011-02-03 1996-07-31 -S000002437 ORF Verified YDR030C RAD28 chromosome 4 L000004123 4 503273 501753 C 2011-02-03 1996-07-31 Protein involved in DNA repair; related to the human CSA protein that is involved in transcription-coupled repair nucleotide excision repair -S000036180 CDS YDR030C 4 503273 501753 C 2011-02-03 1996-07-31 -S000002438 ORF Verified YDR031W MIX14 MIC14 chromosome 4 4 503498 503863 W 2011-02-03 2004-07-22|1996-07-31 Mitochondrial intermembrane space protein of unknown function; required for normal oxygen consumption; contains twin cysteine-x9-cysteine motifs; protein abundance increases in response to DNA replication stress -S000036965 CDS YDR031W 4 503498 503863 W 2011-02-03 2004-07-22|1996-07-31 -S000002439 ORF Verified YDR032C PST2 flavodoxin-like fold family protein chromosome 4 4 504695 504099 C 2011-02-03 1996-07-31 Protein with similarity to a family of flavodoxin-like proteins; induced by oxidative stress in a Yap1p dependent manner; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress; PST2 has a paralog, RFS1, that arose from the whole genome duplication -S000036988 CDS YDR032C 4 504695 504099 C 2011-02-03 1996-07-31 -S000119069 ARS ARS450 ARSIV-506|ARS417.5 chromosome 4 4 505343 505584 2011-02-03 2006-10-05 Autonomously Replicating Sequence -S000002440 ORF Verified YDR033W MRH1 chromosome 4 4 508147 509109 W 2011-02-03 1996-07-31 Protein that localizes primarily to the plasma membrane; also found at the nuclear envelope; long-lived protein that is asymmetrically retained in the plasma membrane of mother cells; the authentic, non-tagged protein is detected in mitochondria in a phosphorylated state; null mutation confers sensitivity to acetic acid -S000037115 CDS YDR033W 4 508147 509109 W 2011-02-03 1996-07-31 -S000002441 ORF Verified YDR034C LYS14 chromosome 4 L000000971 4 512109 509737 C 8 2011-02-03 1996-07-31 Transcriptional activator involved in regulating lysine biosynthesis; involved in the regulation of genes of the lysine biosynthesis pathway; requires 2-aminoadipate semialdehyde as co-inducer -S000037166 CDS YDR034C 4 512109 509737 C 2011-02-03 1996-07-31 -S000006844 long_terminal_repeat YDRCdelta2 chromosome 4 4 513258 512986 C 2011-02-03 2000-05-19 Ty1 LTR -S000006845 long_terminal_repeat YDRCdelta3 chromosome 4 4 513590 513259 C 2011-02-03 2000-05-19 Ty1 LTR -S000006846 long_terminal_repeat YDRCdelta4 chromosome 4 4 514020 513692 C 2011-02-03 2000-05-19 Ty2 LTR -S000007345 transposable_element_gene YDR034C-D gag-pol fusion protein chromosome 4 4 519356 514043 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000035118 CDS YDR034C-D 4 518062 514043 C 2011-02-03 1999-07-17 -S000035117 CDS YDR034C-D 4 519356 518064 C 2011-02-03 1999-07-17 -S000035119 plus_1_translational_frameshift YDR034C-D 4 518063 518063 C 2011-02-03 1999-07-17 -S000007344 transposable_element_gene YDR034C-C gag protein chromosome 4 4 519356 518040 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035078 CDS YDR034C-C 4 519356 518040 C 2011-02-03 1999-07-17 -S000006862 LTR_retrotransposon YDRCTy2-1 Ty2 chromosome 4 4 519647 513692 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006847 long_terminal_repeat YDRCdelta5 chromosome 4 4 519647 519316 C 2011-02-03 2000-05-19 Ty2 LTR -S000006649 tRNA_gene tL(UAA)D chromosome 4 L000003765 4 519743 519826 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000037383 noncoding_exon tL(UAA)D 4 519743 519826 W 2011-02-03 2000-05-19 -S000006848 long_terminal_repeat YDRCdelta6a chromosome 4 4 520475 520173 C 2011-02-03 2000-05-19 Ty1 LTR -S000006863 long_terminal_repeat YDRWdelta7 chromosome 4 4 520477 520805 W 2011-02-03 2000-05-19 Ty1 LTR -S000007233 ORF Uncharacterized YDR034C-A chromosome 4 4 520692 520516 C 2011-02-03 1999-07-17 Putative protein of unknown function; contained within the solo Ty1 LTR element YDRWdelta7 -S000035073 CDS YDR034C-A 4 520692 520516 C 2011-02-03 1999-07-17 -S000006849 long_terminal_repeat YDRCdelta6b chromosome 4 4 520833 520806 C 2011-02-03 2000-05-19 Ty1 LTR -S000006693 tRNA_gene tQ(UUG)D1 chromosome 4 L000003766 4 520972 521043 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034805 noncoding_exon tQ(UUG)D1 4 520972 521043 W 2011-02-03 2000-05-19 -S000007234 ORF Uncharacterized YDR034W-B chromosome 4 4 521314 521469 W 2011-02-03 1999-07-17 Predicted tail-anchored plasma membrane protein; contains conserved CYSTM module; related proteins in other organisms may be involved in response to stress; N- and C-terminal fusion proteins localize to the cell periphery; YDR034W-B has a paralog, YBR056W-A, that arose from the whole genome duplication -S000030044 CDS YDR034W-B 4 521314 521469 W 2011-02-03 1999-07-17 -S000002442 ORF Verified YDR035W ARO3 3-deoxy-7-phosphoheptulonate synthase ARO3 chromosome 4 L000000118 4 521816 522928 W 2011-02-03 1996-07-31 3-deoxy-D-arabino-heptulosonate-7-phosphate (DAHP) synthase; catalyzes the first step in aromatic amino acid biosynthesis and is feedback-inhibited by phenylalanine or high concentration of tyrosine or tryptophan -S000029906 CDS YDR035W 4 521816 522928 W 2011-02-03 1996-07-31 -S000002443 ORF Verified YDR036C EHD3 MRP5 chromosome 4 4 524713 523211 C 2011-02-03 1996-07-31 3-hydroxyisobutyryl-CoA hydrolase; member of a family of enoyl-CoA hydratase/isomerases; non-tagged protein is detected in highly purified mitochondria in high-throughput studies; phosphorylated; mutation affects fluid-phase endocytosis -S000029947 CDS YDR036C 4 524713 523211 C 2011-02-03 1996-07-31 -S000002444 ORF Verified YDR037W KRS1 lysine--tRNA ligase KRS1|GCD5 chromosome 4 L000000673|L000000919 4 525440 527215 W 2011-02-03 1996-07-31 Lysyl-tRNA synthetase -S000031019 CDS YDR037W 4 525440 527215 W 2011-02-03 1996-07-31 -S000002445 ORF Verified YDR038C ENA5 putative Na(+)-exporting P-type ATPase ENA5 chromosome 4 L000003293 4 530697 527422 C 2011-02-03 1996-07-31 Protein with similarity to P-type ATPase sodium pumps; member of the Na+ efflux ATPase family -S000031057 CDS YDR038C 4 530697 527422 C 2011-02-03 1996-07-31 -S000002446 ORF Verified YDR039C ENA2 Na(+)-exporting P-type ATPase ENA2 chromosome 4 L000000556 4 534582 531307 C 2011-02-03 1996-07-31 P-type ATPase sodium pump; involved in Na+ efflux to allow salt tolerance; likely not involved in Li+ efflux -S000031179 CDS YDR039C 4 534582 531307 C 2011-02-03 1996-07-31 -S000002447 ORF Verified YDR040C ENA1 Na(+)/Li(+)-exporting P-type ATPase ENA1|PMR2|HOR6 chromosome 4 L000001456 4 538467 535192 C 15 2011-02-03 1996-07-31 P-type ATPase sodium pump; involved in Na+ and Li+ efflux to allow salt tolerance -S000032116 CDS YDR040C 4 538467 535192 C 2011-02-03 1996-07-31 -S000002448 ORF Verified YDR041W RSM10 mitochondrial 37S ribosomal protein RSM10 chromosome 4 4 539803 540414 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S10 ribosomal protein; essential for viability, unlike most other mitoribosomal proteins -S000032233 CDS YDR041W 4 539803 540414 W 2011-02-03 1996-07-31 -S000002449 ORF Uncharacterized YDR042C chromosome 4 4 541203 540601 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression is increased in ssu72-ts69 mutant -S000032269 CDS YDR042C 4 541203 540601 C 2011-02-03 1996-07-31 -S000006507 snoRNA_gene snR47 SNR47 chromosome 4 L000003414 4 541700 541602 C 2011-02-03 2000-05-19|2007-04-04 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2220 and small subunit (SSU) rRNA at position A619 -S000030649 noncoding_exon snR47 4 541700 541602 C 2011-02-03 2000-05-19|2007-04-04 -S000002450 ORF Verified YDR043C NRG1 transcriptional regulator NRG1 chromosome 4 L000004598 4 543369 542674 C 2011-02-03 1996-07-31 Transcriptional repressor; recruits the Cyc8p-Tup1p complex to promoters; mediates glucose repression and negatively regulates a variety of processes including filamentous growth and alkaline pH response; activated in stochastic pulses of nuclear localization in response to low glucose -S000033143 CDS YDR043C 4 543369 542674 C 2011-02-03 1996-07-31 -S000002451 ORF Verified YDR044W HEM13 coproporphyrinogen oxidase chromosome 4 L000000765 4 546642 547628 W 2011-02-03 1996-07-31 Coproporphyrinogen III oxidase; oxygen-requiring enzyme that catalyzes sixth step in heme biosynthetic pathway; transcription is repressed by oxygen and heme (via Rox1p and Hap1p); human homolog CPOX can complement yeast mutant and allow growth of haploid null after sporulation of a heterozygous diploid -S000033232 CDS YDR044W 4 546642 547628 W 2011-02-03 1996-07-31 -S000002452 ORF Verified YDR045C RPC11 DNA-directed RNA polymerase III core subunit RPC11|C11 chromosome 4 L000004954 4 548310 547978 C 2011-02-03 1996-07-31 RNA polymerase III subunit C11; mediates pol III RNA cleavage activity and is important for termination of transcription; homologous to TFIIS -S000033256 CDS YDR045C 4 548310 547978 C 2011-02-03 1996-07-31 -S000002453 ORF Verified YDR046C BAP3 amino acid transporter BAP3|PAP1 chromosome 4 L000004277 4 550576 548762 C 2011-02-03 1996-07-31 Amino acid permease; involved in uptake of cysteine, leucine, isoleucine and valine; BAP3 has a paralog, BAP2, that arose from the whole genome duplication -S000033308 CDS YDR046C 4 550576 548762 C 2011-02-03 1996-07-31 -S000002454 ORF Verified YDR047W HEM12 uroporphyrinogen decarboxylase HEM12|HEM6 chromosome 4 L000000764 4 551860 552948 W 2011-02-03 1996-07-31 Uroporphyrinogen decarboxylase; catalyzes the fifth step in the heme biosynthetic pathway; localizes to both the cytoplasm and nucleus; a hem12 mutant has phenotypes similar to patients with porphyria cutanea tarda -S000034271 CDS YDR047W 4 551860 552948 W 2011-02-03 1996-07-31 -S000002456 ORF Verified YDR049W VMS1 chromosome 4 4 553254 555152 W 2011-02-03 1996-07-31 Component of a Cdc48p-complex involved in protein quality control; exhibits cytosolic and ER-membrane localization, with Cdc48p, during normal growth, and contributes to ER-associated degradation (ERAD) of specific substrates at a step after their ubiquitination; forms a mitochondrially-associated complex with Cdc48p and Npl4p under oxidative stress that is required for ubiquitin-mediated mitochondria-associated protein degradation (MAD); conserved in C. elegans and humans -S000035432 CDS YDR049W 4 553254 555152 W 2011-02-03 1996-07-31 -S000002455 ORF Dubious YDR048C chromosome 4 4 553398 553084 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF VMS1/YDR049W -S000034352 CDS YDR048C 4 553398 553084 C 2011-02-03 1996-07-31 -S000118435 ARS ARS418 ARSIV-555 chromosome 4 4 555240 555404 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000002457 ORF Verified YDR050C TPI1 triose-phosphate isomerase TPI1 chromosome 4 L000002326 4 556472 555726 C 2011-02-03 1996-07-31 Triose phosphate isomerase, abundant glycolytic enzyme; mRNA half-life is regulated by iron availability; transcription is controlled by activators Reb1p, Gcr1p, and Rap1p through binding sites in the 5' non-coding region; inhibition of Tpi1p activity by PEP (phosphoenolpyruvate) stimulates redox metabolism in respiring cells; E104D mutation in human homolog TPI1 causes a rare autosomal disease; human TPI1 can complement yeast null mutant -S000036419 CDS YDR050C 4 556472 555726 C 2011-02-03 1996-07-31 -S000002458 ORF Verified YDR051C DET1 acid phosphatase DET1 chromosome 4 4 558060 557056 C 2011-02-03 1996-07-31 Acid phosphatase; involved in the non-vesicular transport of sterols in both directions between the endoplasmic reticulum and plasma membrane; deletion confers sensitivity to nickel -S000036483 CDS YDR051C 4 558060 557056 C 2011-02-03 1996-07-31 -S000002460 ORF Dubious YDR053W chromosome 4 4 560249 560644 W 2011-02-03 1996-07-31 Putative protein of unknown function; open reading frame overlaps 5' end of essential DBF4 gene encoding the regulatory subunit of the Cdc7p-Dbf4p kinase complex -S000037331 CDS YDR053W 4 560249 560644 W 2011-02-03 1996-07-31 -S000002459 ORF Verified YDR052C DBF4 protein serine/threonine kinase activating protein DBF4|DNA52|LSD7 chromosome 4 L000000488|S000029149|L000000513 4 560625 558511 C 2011-02-03 1996-07-31 Regulatory subunit of Cdc7p-Dbf4p kinase complex; required for Cdc7p kinase activity and initiation of DNA replication; phosphorylates the Mcm2-7 family of proteins; cell cycle regulated; relative distribution to the nucleus increases upon DNA replication stress; co-expression of human CDC7 and DBF4 complements single cdc7 or dbf4 null mutations or the cdc7 dbf4 double null mutation -S000036579 CDS YDR052C 4 560625 558511 C 2011-02-03 1996-07-31 -S000002461 ORF Verified YDR054C CDC34 SCF E2 ubiquitin-protein ligase catalytic subunit CDC34|UBC3|DNA6 chromosome 4 L000000271 4 562327 561440 C 37 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme (E2); catalytic subunit of SCF ubiquitin-protein ligase complex (together with Skp1p, Rbx1p, Cdc53p, and an F-box protein) that regulates cell cycle progression by targeting key substrates for degradation; protein abundance increases in response to DNA replication stress; human CDC34 functionally complements the thermosensitivity of the cdc34-2 mutant -S000037377 CDS YDR054C 4 562327 561440 C 2011-02-03 1996-07-31 -S000002462 ORF Verified YDR055W PST1 HPF2 chromosome 4 L000004850 4 563527 564861 W 2011-02-03 1996-07-31 Cell wall protein that contains a putative GPI-attachment site; secreted by regenerating protoplasts; up-regulated by activation of the cell integrity pathway, as mediated by Rlm1p; upregulated by cell wall damage via disruption of FKS1; PST1 has a paralog, ECM33, that arose from the whole genome duplication -S000030148 CDS YDR055W 4 563527 564861 W 2011-02-03 1996-07-31 -S000002463 ORF Uncharacterized YDR056C EMC10 chromosome 4 4 565640 565023 C 2011-02-03 1996-07-31 Putative protein of unknown function; subunit of evolutionarily conserved EMC (Endoplasmic Reticulum Membrane Complex) implicated in ERAD (ER-associated degradation) and proper assembly of multi-pass transmembrane (TM) proteins; EMC acts in yeast as an ER-mitochondria tether that interacts with outer membrane protein Tom5p of TOM (Translocase of the Mitochondrial Outer Membrane) complex; YDR056C is not an essential protein -S000030254 CDS YDR056C 4 565640 565023 C 2011-02-03 1996-07-31 -S000002464 ORF Verified YDR057W YOS9 chromosome 4 4 565927 567555 W 2011-02-03 1996-07-31 ER quality-control lectin; integral subunit of the HRD ligase; participates in efficient ER retention of misfolded proteins by recognizing them and delivering them to Hrd1p; binds to glycans with terminal alpha-1,6 linked mannose on misfolded N-glycosylated proteins and participates in targeting proteins to ERAD; member of the OS-9 protein family -S000030476 CDS YDR057W 4 565927 567555 W 2011-02-03 1996-07-31 -S000118436 ARS ARS419 ARSIV-568 chromosome 4 4 567610 567685 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178069 ARS_consensus_sequence ARS419 4 567677 567661 C 2014-11-18 2014-11-18 -S000002465 ORF Verified YDR058C TGL2 triglyceride lipase chromosome 4 L000003248 4 568703 567723 C 2011-02-03 1996-07-31 Triacylglycerol lipase that is localized to the mitochondria; has lipolytic activity towards triacylglycerols and diacylglycerols when expressed in E. coli -S000030539 CDS YDR058C 4 568703 567723 C 2011-02-03 1996-07-31 -S000006709 tRNA_gene tR(UCU)D chromosome 4 L000003767 4 568882 568953 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000037839 noncoding_exon tR(UCU)D 4 568882 568953 W 2011-02-03 2000-05-19 -S000006531 tRNA_gene tD(GUC)D chromosome 4 L000003768 4 568964 569035 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000037680 noncoding_exon tD(GUC)D 4 568964 569035 W 2011-02-03 2000-05-19 -S000002466 ORF Verified YDR059C UBC5 E2 ubiquitin-conjugating protein UBC5 chromosome 4 L000002408 4 569770 569234 C 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme; mediates selective degradation of short-lived, abnormal, or excess proteins, including histone H3; central component of the cellular stress response; expression is heat inducible; protein abundance increases in response to DNA replication stress; UBC5 has a paralog, UBC4, that arose from the whole genome duplication -S000031454 CDS YDR059C 4 569633 569234 C 2011-02-03 1996-07-31 -S000031453 CDS YDR059C 4 569770 569724 C 2011-02-03 1996-07-31 -S000031455 intron YDR059C 4 569723 569634 C 2011-02-03 1996-07-31 -S000002467 ORF Verified YDR060W MAK21 RNA-binding ribosome biosynthesis protein MAK21|NOC1 chromosome 4 L000000993 4 570649 573726 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; required for large (60S) ribosomal subunit biogenesis; acts as part of a Mak21p-Noc2p-Rrp5p module that associates with nascent pre-rRNA during transcription and has a role in bigenesis of the large ribosomal subunit; involved in nuclear export of pre-ribosomes; required for maintenance of dsRNA virus; homolog of human CAATT-binding protein -S000031685 CDS YDR060W 4 570649 573726 W 2011-02-03 1996-07-31 -S000002468 ORF Uncharacterized YDR061W chromosome 4 4 574164 575783 W 2011-02-03 1996-07-31 Protein with similarity to ABC transporter family members; lacks predicted membrane-spanning regions; transcriptionally activated by Yrm1p along with genes involved in multidrug resistance -S000031826 CDS YDR061W 4 574164 575783 W 2011-02-03 1996-07-31 -S000002469 ORF Verified YDR062W LCB2 serine C-palmitoyltransferase LCB2|TSC1|SCS1 chromosome 4 L000001819 4 576474 578159 W 2011-02-03 1996-07-31 Component of serine palmitoyltransferase; responsible along with Lcb1p for the first committed step in sphingolipid synthesis, which is the condensation of serine with palmitoyl-CoA to form 3-ketosphinganine -S000031954 CDS YDR062W 4 576474 578159 W 2011-02-03 1996-07-31 -S000002470 ORF Verified YDR063W AIM7 GMF1|GMF chromosome 4 4 578663 579112 W 2011-02-03 1996-07-31 Protein that interacts with Arp2/3 complex; interacts with Arp2/3 complex to stimulate actin filament debranching and inhibit actin nucleation; has similarity to Cof1p and also to human glia maturation factor (GMF); null mutant displays elevated mitochondrial genome loss -S000032842 CDS YDR063W 4 578663 579112 W 2011-02-03 1996-07-31 -S000002471 ORF Verified YDR064W RPS13 uS15|ribosomal 40S subunit protein S13|YS15|S27a|S15|S13|RPS13C|RPS13B chromosome 4 L000002900|L000002655 4 579458 580452 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S13 and bacterial S15 -S000032956 CDS YDR064W 4 579458 579478 W 2011-02-03 1996-07-31 -S000032957 CDS YDR064W 4 580018 580452 W 2011-02-03 1996-07-31 -S000032958 intron YDR064W 4 579479 580017 W 2011-02-03 1996-07-31 -S000002472 ORF Verified YDR065W RRG1 chromosome 4 4 580687 581784 W 2011-02-03 1996-07-31 Protein of unknown function; required for vacuolar acidification and mitochondrial genome maintenance; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033047 CDS YDR065W 4 580687 581784 W 2011-02-03 1996-07-31 -S000002473 ORF Verified YDR066C RTR2 putative protein-serine/threonine phosphatase chromosome 4 4 582498 581908 C 2011-02-03 1996-07-31 Protein of unknown function; exhibits genetic interactions with Rtr1p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YDR066C is not an essential gene; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress; RTR2 has a paralog, RTR1, that arose from the whole genome duplication -S000033084 CDS YDR066C 4 582498 581908 C 2011-02-03 1996-07-31 -S000002474 ORF Uncharacterized YDR067C OCA6 protein-tyrosine-phosphatase chromosome 4 4 583465 582791 C 2011-02-03 1996-07-31 Cytoplasmic protein required for replication of Brome mosaic virus; S. cerevisiae is a model system for studying positive-strand RNA virus replication; null mutation confers sensitivity to tunicamycin and DTT -S000033843 CDS YDR067C 4 583465 582791 C 2011-02-03 1996-07-31 -S000002475 ORF Verified YDR068W DOS2 chromosome 4 L000000518 4 583713 584645 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000034055 CDS YDR068W 4 583713 584645 W 2011-02-03 1996-07-31 -S000002476 ORF Verified YDR069C DOA4 ubiquitin-specific protease DOA4|UBP4|SSV7|NPI2|MUT4|DOS1 chromosome 4 L000000514 4 587719 584939 C 2011-02-03 1996-07-31 Ubiquitin hydrolase; deubiquitinates intralumenal vesicle (ILVs) cargo proteins; required for recycling ubiquitin from proteasome-bound ubiquitinated intermediates, acts at the late endosome/prevacuolar compartment to recover ubiquitin from ubiquitinated membrane proteins destined for the vacuole; DOA4 has a paralog, UBP5, that arose from the whole genome duplication -S000034891 CDS YDR069C 4 587719 584939 C 2011-02-03 1996-07-31 -S000002477 ORF Verified YDR070C FMP16 chromosome 4 4 588379 588098 C 2011-02-03 1996-07-31 Protein of unknown function; may be involved in responding to conditions of stress; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress -S000036234 CDS YDR070C 4 588379 588098 C 2011-02-03 1996-07-31 -S000002478 ORF Verified YDR071C PAA1 polyamine acetyltransferase chromosome 4 4 589402 588827 C 2011-02-03 1996-07-31 Polyamine acetyltransferase; acetylates polyamines (e.g. putrescine, spermidine, spermine) and also aralkylamines (e.g. tryptamine, phenylethylamine); may be involved in transcription and/or DNA replication -S000036334 CDS YDR071C 4 589402 588827 C 2011-02-03 1996-07-31 -S000002479 ORF Verified YDR072C IPT1 MIC2|inositolphosphotransferase|KTI6|SYR4 chromosome 4 L000004226|L000003534|S000029294 4 591344 589761 C 2011-02-03 1996-07-31 Inositolphosphotransferase; involved in synthesis of mannose-(inositol-P)2-ceramide (M(IP)2C), the most abundant sphingolipid; can mutate to resistance to the antifungals syringomycin E and DmAMP1 and to K. lactis zymocin -S000037011 CDS YDR072C 4 591344 589761 C 2011-02-03 1996-07-31 -S000002480 ORF Verified YDR073W SNF11 chromosome 4 L000003167 4 592439 592948 W 2011-02-03 1996-07-31 Subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; interacts with a highly conserved 40-residue sequence of Snf2p; relocates to the cytosol under hypoxic conditions -S000037137 CDS YDR073W 4 592439 592948 W 2011-02-03 1996-07-31 -S000002481 ORF Verified YDR074W TPS2 trehalose-phosphatase TPS2|PFK3|HOG2 chromosome 4 L000002331 4 593893 596583 W 2011-02-03 1996-07-31 Phosphatase subunit of the trehalose-6-P synthase/phosphatase complex; involved in synthesis of the storage carbohydrate trehalose; expression is induced by stress conditions and repressed by the Ras-cAMP pathway; protein abundance increases in response to DNA replication stress -S000037233 CDS YDR074W 4 593893 596583 W 2011-02-03 1996-07-31 -S000002482 ORF Verified YDR075W PPH3 phosphoprotein phosphatase PP4 catalytic subunit PPH3 chromosome 4 L000001471 4 597156 598082 W 53 2011-02-03 1996-07-31 Catalytic subunit of protein phosphatase PP4 complex; Pph3p and Psy2p form active complex, Psy4p may provide substrate specificity; regulates recovery from the DNA damage checkpoint, the gene conversion- and single-strand annealing-mediated pathways of meiotic double-strand break repair and efficient Non-Homologous End-Joining (NHEJ) pathway; involved in activation of Gln3p to alleviate nitrogen catabolite repression; Pph3p and Psy2p localize to foci on meiotic chromosomes -S000029904 CDS YDR075W 4 597156 598082 W 2011-02-03 1996-07-31 -S000002483 ORF Verified YDR076W RAD55 putative DNA-dependent ATPase RAD55 chromosome 4 L000001575 4 598468 599688 W 53 2011-02-03 1996-07-31 Protein that stimulates strand exchange; stimulates strand exchange by stabilizing the binding of Rad51p to single-stranded DNA; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; forms heterodimer with Rad57p -S000030010 CDS YDR076W 4 598468 599688 W 2011-02-03 1996-07-31 -S000002484 ORF Verified YDR077W SED1 chromosome 4 L000001859 4 600793 601809 W 2011-02-03 1996-07-31 Major stress-induced structural GPI-cell wall glycoprotein; associates with translating ribosomes, possible role in mitochondrial genome maintenance; ORF contains two distinct variable minisatellites; SED1 has a paralog, SPI1, that arose from the whole genome duplication -S000030135 CDS YDR077W 4 600793 601809 W 2011-02-03 1996-07-31 -S000002485 ORF Verified YDR078C SHU2 chromosome 4 4 602869 602198 C 2011-02-03 1996-07-31 Component of Shu complex (aka PCSS complex); Shu complex also includes Psy3, Csm2, Shu1, and promotes error-free DNA repair, Shu complex mediates inhibition of Srs2p function; promotes formation of Rad51p filaments; important for both mitotic and meiotic homologous recombination, and contains a conserved SWIM domain that is necessary for both -S000030241 CDS YDR078C 4 602869 602198 C 2011-02-03 1996-07-31 -S000002486 ORF Verified YDR079W PET100 chromosome 4 L000003521 4 603064 603399 W 2011-02-03 1996-07-31 Chaperone that facilitates the assembly of cytochrome c oxidase; integral to the mitochondrial inner membrane; interacts with a subcomplex of subunits VII, VIIa, and VIII (Cox7p, Cox9p, and Cox8p) but not with the holoenzyme -S000031263 CDS YDR079W 4 603064 603399 W 2011-02-03 1996-07-31 -S000007603 ORF Verified YDR079C-A TFB5 TFIIH complex subunit TFB5 chromosome 4 4 603811 603593 C 2011-02-03 2001-02-26 Component of RNA polymerase II general transcription factor TFIIH; involved in transcription initiation and in nucleotide-excision repair; relocalizes to the cytosol in response to hypoxia; homolog of Chlamydomonas reinhardtii REX1-S protein involved in DNA repair -S000037149 CDS YDR079C-A 4 603811 603593 C 2011-02-03 2001-02-26 -S000002487 ORF Verified YDR080W VPS41 VPL20|VAM2|SVL2|FET2|CVT8 chromosome 4 L000003512|L000004234 4 604008 606986 W 2011-02-03 1996-07-31 Subunit of the HOPS endocytic tethering complex; vacuole membrane protein that functions as a Rab GTPase effector, interacting specifically with the GTP-bound conformation of Ypt7p, facilitating tethering, docking and promoting membrane fusion events at the late endosome and vacuole; required for both membrane and protein trafficking; Yck3p-mediated phosphorylation regulates the organization of vacuolar fusion sites -S000032217 CDS YDR080W 4 604008 606986 W 2011-02-03 1996-07-31 -S000002488 ORF Verified YDR081C PDC2 chromosome 4 L000001355 4 610081 607304 C 50 2011-02-03 1996-07-31 Transcription factor for thiamine-regulated genes; required for expression of the two isoforms of pyruvate decarboxylase (PDC1 and PDC5) along with thiamine biosynthetic genes; binds a DNA sequence in the PDC5 promoter; mutant fails to grow on 2% glucose and thus is scored as inviable under standard conditions -S000032243 CDS YDR081C 4 610081 607304 C 2011-02-03 1996-07-31 -S000002489 ORF Verified YDR082W STN1 chromosome 4 L000003921 4 610441 611925 W 2011-02-03 1996-07-31 Telomere end-binding and capping protein; plays a key role with Pol12p in linking telomerase action with completion of lagging strand synthesis, and in a regulatory step required for telomere capping; similar to human Stn1 -S000032408 CDS YDR082W 4 610441 611925 W 2011-02-03 1996-07-31 -S000002490 ORF Verified YDR083W RRP8 25S rRNA (adenine645-N1)-methyltransferase chromosome 4 4 612073 613251 W 2011-02-03 2003-09-22|2006-01-19|1996-07-31 Nucleolar S-adenosylmethionine-dependent rRNA methyltransferase; methylates adenine (m1A) of the large subunit (LSU) rRNA at position 645; involved in pre-rRNA cleavage at site A2; mutation is synthetically lethal with a gar1 mutation; deletion disrupts telomere maintenance by influencing the expression of neighboring gene STN1 -S000033239 CDS YDR083W 4 612073 613251 W 2011-02-03 2003-09-22|2006-01-19|1996-07-31 -S000002491 ORF Verified YDR084C TVP23 chromosome 4 4 614004 613405 C 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000033277 CDS YDR084C 4 614004 613405 C 2011-02-03 1996-07-31 -S000002492 ORF Verified YDR085C AFR1 chromosome 4 L000000059 4 616150 614288 C 47.97 2011-02-03 1996-07-31 Protein required for pheromone-induced projection (shmoo) formation; regulates septin architecture during mating; has an RVXF motif that mediates targeting of Glc7p to mating projections; interacts with Cdc12p; AFR1 has a paralog, YER158C, that arose from the whole genome duplication -S000033345 CDS YDR085C 4 616150 614288 C 2011-02-03 1996-07-31 -S000002493 ORF Verified YDR086C SSS1 translocon subunit SSS1 chromosome 4 L000002092 4 617170 616928 C 2011-02-03 1996-07-31 Subunit of the Sec61p translocation complex (Sec61p-Sss1p-Sbh1p); this complex forms a channel for passage of secretory proteins through the endoplasmic reticulum membrane, and of the Ssh1p complex (Ssh1p-Sbh2p-Sss1p); interacts with Ost4p and Wbp1p -S000033427 CDS YDR086C 4 617170 616928 C 2011-02-03 1996-07-31 -S000002494 ORF Verified YDR087C RRP1 chromosome 4 L000001774 4 618306 617470 C 2011-02-03 1996-07-31 Essential evolutionarily conserved nucleolar protein; necessary for biogenesis of 60S ribosomal subunits and for processing of pre-rRNAs to mature rRNA; associated with several distinct 66S pre-ribosomal particles -S000034333 CDS YDR087C 4 618306 617470 C 2011-02-03 1996-07-31 -S000002495 ORF Verified YDR088C SLU7 mRNA splicing protein SLU7|SLT17 chromosome 4 L000001922 4 619645 618497 C 2011-02-03 1996-07-31 RNA splicing factor; required for ATP-independent portion of 2nd catalytic step of spliceosomal RNA splicing; interacts with Prp18p; contains zinc knuckle domain -S000034412 CDS YDR088C 4 619645 618497 C 2011-02-03 1996-07-31 -S000006700 tRNA_gene tR(ACG)D chromosome 4 L000003786 4 620041 619969 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030369 noncoding_exon tR(ACG)D 4 620041 619969 C 2011-02-03 2000-05-19 -S000002496 ORF Verified YDR089W VTC5 chromosome 4 4 622112 624721 W 2011-02-03 1996-07-31 Novel subunit of the vacuolar transporter chaperone complex; vacuolar transmembrane protein that regulates biosynthesis of polyphosphate; deletion reduces and overexpression increases polyP accumulation; SPX domain (Syg1, Pho81, Xpr1)-containing protein involved in phosphate homeostasis; relocalizes from vacuole to cytoplasm upon DNA replication stress -S000035491 CDS YDR089W 4 622112 624721 W 2011-02-03 1996-07-31 -S000002497 ORF Uncharacterized YDR090C chromosome 4 4 625998 625066 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000035405 CDS YDR090C 4 625998 625066 C 2011-02-03 1996-07-31 -S000002498 ORF Verified YDR091C RLI1 Fe-S cluster-binding ribosome biosynthesis protein chromosome 4 4 628534 626708 C 2011-02-03 1996-07-31 Essential Fe-S protein; required for ribosome biogenesis, translation initiation/termination; facilitates binding of multifactor complex (MFC) of initiation factors to small ribosomal subunit; Dom34-Hbs1 complex and Rli1p work in dissociating inactive ribosomes, thereby facilitating translation restart; forms complex with Lto1p and Yae1p; dependency on ROS-labile FeS clusters, activity in nuclear ribosomal-subunit export impaired by mild oxidative stress -S000035466 CDS YDR091C 4 628534 626708 C 2011-02-03 1996-07-31 -S000130174 ARS ARS420 chromosome 4 4 628938 629582 2014-11-18 2014-11-18|2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000002499 ORF Verified YDR092W UBC13 E2 ubiquitin-conjugating protein UBC13 chromosome 4 L000003387 4 629876 630605 W 2011-02-03 1996-07-31 E2 ubiquitin-conjugating enzyme; involved in the error-free DNA postreplication repair pathway; interacts with Mms2p to assemble ubiquitin chains at the Ub Lys-63 residue; DNA damage triggers redistribution from the cytoplasm to the nucleus -S000035560 CDS YDR092W 4 629876 629905 W 2011-02-03 1996-07-31 -S000035561 CDS YDR092W 4 630174 630605 W 2011-02-03 1996-07-31 -S000035562 intron YDR092W 4 629906 630173 W 2011-02-03 1996-07-31 -S000002500 ORF Verified YDR093W DNF2 aminophospholipid-translocating P4-type ATPase DNF2 chromosome 4 4 631282 636120 W 2011-02-03 1996-07-31 Aminophospholipid translocase (flippase); type 4 P-type ATPase; involved in phospholipid translocation, contributing to endocytosis, protein transport, and cellular polarization; localizes primarily to the plasma membrane; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone; DNF2 has a paralog, DNF1, that arose from the whole genome duplication -S000036482 CDS YDR093W 4 631282 636120 W 2011-02-03 1996-07-31 -S000002501 ORF Dubious YDR094W chromosome 4 4 635840 636175 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF DNF2/YDR093W -S000036554 CDS YDR094W 4 635840 636175 W 2011-02-03 1996-07-31 -S000002502 ORF Dubious YDR095C chromosome 4 4 636527 636117 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036605 CDS YDR095C 4 636527 636117 C 2011-02-03 1996-07-31 -S000002503 ORF Verified YDR096W GIS1 histone demethylase GIS1 chromosome 4 L000003351 4 637139 639823 W 2011-02-03 1996-07-31 Histone demethylase and transcription factor; regulates genes during nutrient limitation; activity modulated by proteasome-mediated proteolysis; has JmjC and JmjN domain in N-terminus that interact, promoting stability and proper transcriptional activity; contains two transactivating domains downstream of Jmj domains and a C-terminal DNA binding domain; relocalizes to the cytosol in response to hypoxia; GIS1 has a paralog, RPH1, that arose from the whole genome duplication -S000037381 CDS YDR096W 4 637139 639823 W 2011-02-03 1996-07-31 -S000118437 ARS ARS421 ARSIV-640 chromosome 4 4 640006 640072 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178070 ARS_consensus_sequence ARS421 4 640062 640046 C 2014-11-18 2014-11-18 -S000002504 ORF Verified YDR097C MSH6 PMS6|mismatch repair ATPase MSH6|PMS3 chromosome 4 L000003135|L000004503|S000029377 4 643837 640109 C 2011-02-03 1996-07-31 Protein required for mismatch repair in mitosis and meiosis; forms a complex with Msh2p to repair both single-base & insertion-deletion mispairs; also involved in interstrand cross-link repair; potentially phosphorylated by Cdc28p -S000037420 CDS YDR097C 4 643837 640109 C 2011-02-03 1996-07-31 -S000002505 ORF Verified YDR098C GRX3 monothiol glutaredoxin GRX3 chromosome 4 S000007444 4 644930 644178 C 2014-11-18 1996-07-31|2014-11-18 Glutathione-dependent oxidoreductase; hydroperoxide and superoxide-radical responsive; monothiol glutaredoxin subfamily member along with Grx4p and Grx5p; protects cells from oxidative damage; with Grx4p, binds to Aft1p in iron-replete conditions, promoting its dissociation from promoters; evidence exists indicating that the translation start site is not Met1 as currently annotated, but rather Met36; GRX3 has a paralog, GRX4, that arose from the whole genome duplication -S000037543 CDS YDR098C 4 644930 644178 C 2014-11-18 1996-07-31|2014-11-18 -S000006694 tRNA_gene tQ(UUG)D2 chromosome 4 L000003785 4 645224 645153 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034810 noncoding_exon tQ(UUG)D2 4 645224 645153 C 2011-02-03 2000-05-19 -S000006850 long_terminal_repeat YDRCdelta7 chromosome 4 4 645835 645502 C 2011-02-03 2000-05-19 Ty1 LTR -S000007391 transposable_element_gene YDR098C-B gag-pol fusion protein chromosome 4 4 651126 645858 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032257 CDS YDR098C-B 4 649820 645858 C 2011-02-03 1999-07-17 -S000032256 CDS YDR098C-B 4 651126 649822 C 2011-02-03 1999-07-17 -S000032258 plus_1_translational_frameshift YDR098C-B 4 649821 649821 C 2011-02-03 1999-07-17 -S000007390 transposable_element_gene YDR098C-A gag protein chromosome 4 4 651126 649804 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000032236 CDS YDR098C-A 4 651126 649804 C 2011-02-03 1999-07-17 -S000006859 LTR_retrotransposon YDRCTy1-1 Ty1 chromosome 4 4 651419 645502 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006851 long_terminal_repeat YDRCdelta8 chromosome 4 4 651419 651086 C 2011-02-03 2000-05-19 Ty1 LTR -S000006855 long_terminal_repeat YDRCsigma1 chromosome 4 4 651503 651420 C 2011-02-03 2000-05-19 Ty3 LTR -S000006852 long_terminal_repeat YDRCdelta9 chromosome 4 4 651980 651682 C 2011-02-03 2000-05-19 Ty1 LTR -S000002506 ORF Verified YDR099W BMH2 14-3-3 family protein BMH2|SCD3 chromosome 4 L000000186 4 653607 654428 W 63 2011-02-03 1996-07-31 14-3-3 protein, minor isoform; controls proteome at post-transcriptional level, binds proteins and DNA, involved in regulation of many processes including exocytosis, vesicle transport, Ras/MAPK signaling, and rapamycin-sensitive signaling; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; abundance relative to Bmh1p increases during sporulation -S000030398 CDS YDR099W 4 653607 654428 W 2011-02-03 1996-07-31 -S000122095 five_prime_UTR_intron YDR099W 4 652781 653523 W 2011-02-03 2007-04-04 -S000002507 ORF Verified YDR100W TVP15 chromosome 4 4 655013 655444 W 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p -S000035845 CDS YDR100W 4 655013 655444 W 2011-02-03 1996-07-31 -S000002508 ORF Verified YDR101C ARX1 putative hydrolase chromosome 4 4 657467 655686 C 2011-02-03 1996-07-31 Nuclear export factor for the ribosomal pre-60S subunit; shuttling factor which directly binds FG rich nucleoporins and facilities translocation through the nuclear pore complex; interacts directly with Alb1p; responsible for Tif6p recycling defects in the absence of Rei1; associated with the ribosomal export complex -S000035887 CDS YDR101C 4 657467 655686 C 2011-02-03 1996-07-31 -S000002509 ORF Uncharacterized YDR102C chromosome 4 4 657980 657648 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR102C is not an essential gene; homozygous diploid deletion strain exhibits high budding index -S000036020 CDS YDR102C 4 657980 657648 C 2011-02-03 1996-07-31 -S000002510 ORF Verified YDR103W STE5 NUL3|HMD3 chromosome 4 L000002115 4 658350 661103 W 63 2011-02-03 1996-07-31 Pheromone-responsive MAPK scaffold protein; couples activation of the G-protein-coupled pheromone receptor to MAPK activation; intramolecular interaction of PH and VWA domains blocks activation of assembled signaling cascade components (Ste11p, Ste7p and Fus3p) under basal conditions; Gbeta-gamma (Ste4p-Ste18p)-dependent docking at the plasma membrane and binding of PI(4,5)P2 by the PH domain relieves autoinhibition, resulting in pheromone-dependent pathway activation -S000036909 CDS YDR103W 4 658350 661103 W 2011-02-03 1996-07-31 -S000002511 ORF Verified YDR104C SPO71 chromosome 4 4 664910 661173 C 2011-02-03 1996-07-31 Meiosis-specific protein required for prospore membrane morphogenesis; localizes to the prospore membrane (PSM) during sporulation; required for PSM elongation and closure; genetically antagonistic to SPO1; recruits Vps13p to the PSM during sporulation; interacts and functions cooperatively with Spo73p; mutants have defects in the PSM, aberrant spore wall formation and reduced PtdIns-phosphate pools in the PSM; contains three PH-like domains -S000036931 CDS YDR104C 4 664910 661173 C 2011-02-03 1996-07-31 -S000002512 ORF Verified YDR105C TMS1 chromosome 4 4 666770 665349 C 2011-02-03 1996-07-31 Vacuolar membrane protein of unknown function; is conserved in mammals; predicted to contain eleven transmembrane helices; interacts with Pdr5p, a protein involved in multidrug resistance -S000036992 CDS YDR105C 4 666770 665349 C 2011-02-03 1996-07-31 -S000002513 ORF Verified YDR106W ARP10 chromosome 4 L000003439 4 667004 667858 W 2011-02-03 1996-07-31 Component of the dynactin complex; localized to the pointed end of the Arp1p filament; may regulate membrane association of the complex -S000037120 CDS YDR106W 4 667004 667858 W 2011-02-03 1996-07-31 -S000006601 tRNA_gene tI(AAU)D chromosome 4 L000003784 4 668080 668007 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000030399 noncoding_exon tI(AAU)D 4 668080 668007 C 2011-02-03 2000-05-19 -S000006856 long_terminal_repeat YDRWsigma2 YDRCsigma2 chromosome 4 4 668096 668436 W 2011-02-03 2000-05-19|2007-04-02 Ty3 LTR -S000006864 long_terminal_repeat YDRWdelta10 chromosome 4 4 668543 668784 W 2011-02-03 2000-05-19 Ty1 LTR -S000002514 ORF Verified YDR107C TMN2 chromosome 4 4 671034 669016 C 2011-02-03 1996-07-31 Protein with a role in cellular adhesion and filamentous growth; similar to Tmn3p; member of the evolutionarily conserved Transmembrane Nine family of proteins with nine membrane-spanning segments; TMN2 has a paralog, EMP70, that arose from the whole genome duplication -S000037823 CDS YDR107C 4 671034 669016 C 2011-02-03 1996-07-31 -S000002515 ORF Verified YDR108W TRS85 GSG1|MUM1 chromosome 4 L000002779|S000029315|L000002585 4 671269 673365 W 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex III; TRAPPIII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating endosome-Golgi traffic and required for membrane expansion during autophagy and the CVT pathway; directs Ypt1p to the PAS; late post-replication meiotic role -S000029911 CDS YDR108W 4 671269 673365 W 2011-02-03 1996-07-31 -S000002516 ORF Uncharacterized YDR109C putative phosphotransferase chromosome 4 4 675667 673520 C 2011-02-03 1996-07-31 Putative kinase -S000029962 CDS YDR109C 4 675667 673520 C 2011-02-03 1996-07-31 -S000002517 ORF Verified YDR110W FOB1 replication fork barrier binding protein FOB1|HRM1 chromosome 4 L000003959 4 676102 677802 W 2011-02-03 1996-07-31 Nucleolar protein that binds the rDNA replication fork barrier site; required for replication fork blocking, recombinational hotspot activity, condensin recruitment to replication fork barrier (RFB), and rDNA repeat segregation; related to retroviral integrases -S000031039 CDS YDR110W 4 676102 677802 W 2011-02-03 1996-07-31 -S000002519 ORF Dubious YDR112W IRC2 chromosome 4 4 679544 679852 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ALT2/YDR111C; null mutant displays increased levels of spontaneous Rad52p foci -S000032093 CDS YDR112W 4 679544 679852 W 2011-02-03 1996-07-31 -S000002518 ORF Uncharacterized YDR111C ALT2 alanine transaminase ALT2 chromosome 4 4 679764 678241 C 2011-02-03 1996-07-31 Catalytically inactive alanine transaminase; expression is repressed in the presence of alanine and repression is mediated by Nrg1p; ALT2 has a paralog, ALT1, that arose from the whole genome duplication -S000031067 CDS YDR111C 4 679764 678241 C 2011-02-03 1996-07-31 -S000002520 ORF Verified YDR113C PDS1 securin chromosome 4 L000001368 4 681617 680496 C 2011-02-03 1996-07-31 Securin; inhibits anaphase by binding separin Esp1p; blocks cyclin destruction and mitotic exit, essential for meiotic progression and mitotic cell cycle arrest; localization is cell-cycle dependent and regulated by Cdc28p phosphorylation -S000032118 CDS YDR113C 4 681617 680496 C 2011-02-03 1996-07-31 -S000002522 ORF Verified YDR115W MRX14 putative mitochondrial 54S ribosomal protein chromosome 4 4 682175 682492 W 2011-02-03 1996-07-31 Putative mitochondrial ribosomal protein of the large subunit; similar to E. coli L34 ribosomal protein; required for respiratory growth, as are most mitochondrial ribosomal proteins; protein increases in abundance and relocalizes to the plasma membrane upon DNA replication stress -S000032311 CDS YDR115W 4 682175 682492 W 2011-02-03 1996-07-31 -S000002521 ORF Uncharacterized YDR114C chromosome 4 4 682226 681924 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant exhibits poor growth at elevated pH and calcium -S000032200 CDS YDR114C 4 682226 681924 C 2011-02-03 1996-07-31 -S000002523 ORF Verified YDR116C MRPL1 mitochondrial 54S ribosomal protein MRPL1 chromosome 4 4 683581 682724 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000033144 CDS YDR116C 4 683581 682724 C 2011-02-03 1996-07-31 -S000002524 ORF Verified YDR117C TMA64 RBF64 chromosome 4 4 685643 683946 C 2011-02-03 1996-07-31 Protein of unknown function that associates with ribosomes; has a putative RNA binding domain; in mammals the corresponding protein, eIF2D, has been shown to possess translation initiation factor activity -S000033197 CDS YDR117C 4 685643 683946 C 2011-02-03 1996-07-31 -S000002525 ORF Verified YDR118W APC4 anaphase promoting complex subunit 4 chromosome 4 L000004319 4 685882 687840 W 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the platform domain of the APC/C, based on structural analysis; relative distribution to the nucleus increases upon DNA replication stress -S000033282 CDS YDR118W 4 685882 687840 W 2011-02-03 1996-07-31 -S000028820 ORF Dubious YDR118W-A chromosome 4 4 687768 687884 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified using a combination of expression profiling and mass spectrometry -S000033639 CDS YDR118W-A 4 687768 687884 W 2011-02-03 2003-07-29 -S000002526 ORF Uncharacterized YDR119W VBA4 chromosome 4 4 688227 690533 W 2011-02-03 1996-07-31 Protein of unknown function; proposed role as a basic amino acid permease based on phylogeny; GFP-fusion protein localizes to vacuolar membrane; physical interaction with Atg27p suggests a possible role in autophagy; non-essential gene -S000034153 CDS YDR119W 4 688227 690533 W 2011-02-03 1996-07-31 -S000113555 ORF Verified YDR119W-A COX26 chromosome 4 4 691014 691214 W 2011-02-03 2005-11-16 Stabilizes or regulates formation of respiratory chain supercomplexes composed of Complex III (ubiquinol-cytochrome c reductase) and Complex IV (cytochrome c oxidase) -S000113556 CDS YDR119W-A 4 691014 691214 W 2011-02-03 2005-11-16 -S000002527 ORF Verified YDR120C TRM1 tRNA (guanine26-N2)-dimethyltransferase chromosome 4 L000002337 4 693261 691549 C 2011-02-03 1996-07-31 tRNA methyltransferase; two forms of protein are made by alternative translation starts; localizes to both nucleus and mitochondrion to produce modified base N2,N2-dimethylguanosine in tRNAs in both compartments; nuclear Trm1p is evenly distributed around inner nuclear membrane in WT, but mislocalizes as puncta near ER-nucleus junctions in spindle pole body (SPB) mutants; both Trm1p inner nuclear membrane targeting and maintenance depend upon SPB -S000035345 CDS YDR120C 4 693261 691549 C 2011-02-03 1996-07-31 -S000002528 ORF Verified YDR121W DPB4 DNA polymerase epsilon noncatalytic subunit chromosome 4 S000007463 4 693585 694175 W 2011-02-03 1996-07-31 Subunit of DNA pol epsilon and of ISW2 chromatin accessibility complex; involved in both chromosomal DNA replication and inheritance of telomeric silencing; stabilizes the interaction of Pol epsilon with primer-template DNA, positively affecting the processivity of the polymerase and exonuclease activities of Pol epsilon; interacts with extranucleosomal DNA and acts as anchor point for ISW2 complex that retains its position on DNA during nucleosome mobilization -S000035456 CDS YDR121W 4 693585 694175 W 2011-02-03 1996-07-31 -S000002529 ORF Verified YDR122W KIN1 serine/threonine protein kinase KIN1 chromosome 4 L000000901 4 694700 697894 W 2011-02-03 1996-07-31 Serine/threonine protein kinase involved in regulation of exocytosis; localizes to the cytoplasmic face of the plasma membrane; KIN1 has a paralog, KIN2, that arose from the whole genome duplication -S000036387 CDS YDR122W 4 694700 697894 W 2011-02-03 1996-07-31 -S000002530 ORF Verified YDR123C INO2 SCS1|DIE1 chromosome 4 L000000868|L000002801 4 699468 698554 C 2011-02-03 1996-07-31 Transcription factor; component of the heteromeric Ino2p/Ino4p basic helix-loop-helix transcription activator that binds inositol/choline-responsive elements (ICREs), required for derepression of phospholipid biosynthetic genes in response to inositol depletion; involved in diauxic shift -S000036420 CDS YDR123C 4 699468 698554 C 2011-02-03 1996-07-31 -S000002531 ORF Uncharacterized YDR124W chromosome 4 4 700315 701289 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; expression is strongly induced by alpha factor -S000036553 CDS YDR124W 4 700315 701289 W 2011-02-03 1996-07-31 -S000002532 ORF Verified YDR125C ECM18 alpha/beta hydrolase family protein chromosome 4 L000003893 4 702758 701397 C 2011-02-03 1996-07-31 Protein of unknown function; ECM18 has a paralog, ICT1, that arose from the whole genome duplication -S000036581 CDS YDR125C 4 702758 701397 C 2011-02-03 1996-07-31 -S000114834 ARS ARS422 ARS422 ARSIV-703|ARO1 ARS chromosome 4 4 702887 703132 2011-02-03 2006-09-08|2006-04-12 Autonomously Replicating Sequence -S000178071 ARS_consensus_sequence ARS422 4 702924 702940 W 2014-11-18 2014-11-18 -S000002533 ORF Verified YDR126W SWF1 palmitoyltransferase SWF1|PSL10 chromosome 4 4 703234 704244 W 2011-02-03 1996-07-31 Palmitoyltransferase that acts on transmembrane proteins; including the SNAREs Snc1p, Syn8p, Tlg1p and likely all SNAREs; contains an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain; may have a role in vacuole fusion -S000037340 CDS YDR126W 4 703234 704244 W 2011-02-03 1996-07-31 -S000002534 ORF Verified YDR127W ARO1 pentafunctional protein ARO1p chromosome 4 L000000116 4 704484 709250 W 81 2011-02-03 1996-07-31 Pentafunctional arom protein; catalyzes steps 2 through 6 in the biosynthesis of chorismate, which is a precursor to aromatic amino acids -S000037463 CDS YDR127W 4 704484 709250 W 2011-02-03 1996-07-31 -S000002535 ORF Verified YDR128W MTC5 SEA3 chromosome 4 4 709549 712995 W 2011-02-03 1996-07-31 Subunit of SEACAT, a subcomplex of the SEA complex; Mtc1p, along with Rtc1p and Sea4p, redundantly inhibit the TORC1 inhibitory role of the Iml1p/SEACIT (Iml1p-Npr2p-Npr3p) subcomplex, a GAP for GTPase Gtr1p (EGOC subunit) in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; relative distribution to the vacuolar membrane decreases upon DNA replication stress -S000030151 CDS YDR128W 4 709549 712995 W 2011-02-03 1996-07-31 -S000002536 ORF Verified YDR129C SAC6 fimbrin|ABP67 chromosome 4 L000001793 4 715379 713340 C 84 2011-02-03 1996-07-31 Fimbrin, actin-bundling protein; cooperates with Scp1p in organization and maintenance of the actin cytoskeleton; phosphorylated by Cdc28p/Clb2p in metaphase on T103, to regulate conformation, and modulate actin filament binding affinity and actin cable dynamics; relocalizes from the plasma membrane to the cytoplasm upon DNA replication stress; human homologs PLS3 and LCP1 implicated in spinocerebellar ataxia type 2 (SCA2) can each complement yeast null mutant -S000030258 CDS YDR129C 4 715247 713340 C 2011-02-03 1996-07-31 -S000030257 CDS YDR129C 4 715379 715359 C 2011-02-03 1996-07-31 -S000030259 intron YDR129C 4 715358 715248 C 2011-02-03 1996-07-31 -S000002537 ORF Verified YDR130C FIN1 chromosome 4 4 716622 715747 C 2011-02-03 1996-07-31 Spindle pole body-related intermediate filament protein; forms cell cycle-specific filaments between spindle pole bodies in dividing cells; localizes to poles and microtubules of spindle during anaphase and contributes to spindle stability; involved in Glc7p localization and regulation; relative distribution to the nucleus increases upon DNA replication stress -S000030642 CDS YDR130C 4 716622 715747 C 2011-02-03 1996-07-31 -S000002538 ORF Verified YDR131C chromosome 4 4 718460 716790 C 2011-02-03 1996-07-31 F-box protein subunit of SCF ubiquitin ligase complex; substrate-specific adaptor subunit that recruits substrates to a core ubiquitination complex -S000030724 CDS YDR131C 4 718460 716790 C 2011-02-03 1996-07-31 -S000002539 ORF Verified YDR132C chromosome 4 4 720303 718816 C 2011-02-03 1996-07-31 Protein of unknown function; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; YDR132C has a paralog, YLR108C, that arose from the whole genome duplication -S000031561 CDS YDR132C 4 720303 718816 C 2011-02-03 1996-07-31 -S000002540 ORF Dubious YDR133C chromosome 4 4 721297 720962 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps YDR134C -S000031648 CDS YDR133C 4 721297 720962 C 2011-02-03 1996-07-31 -S000002541 blocked_reading_frame YDR134C chromosome 4 4 721481 721071 C 2011-02-03 1996-07-31 Cell wall protein; YDR134C has a paralog, CCW12, that arose from the whole genome duplication; S. cerevisiae genome reference strain S288C contains an internal in-frame stop at codon 67, which in other strains encodes glutamine -S000031764 CDS YDR134C 4 721481 721071 C 2011-02-03 1996-07-31 -S000002542 ORF Verified YDR135C YCF1 ATP-binding cassette glutathione S-conjugate transporter YCF1 chromosome 4 L000002499 4 727551 723004 C 2011-02-03 1996-07-31 Vacuolar glutathione S-conjugate transporter; ABC-C transporter of the ATP-binding cassette family; required for vacuole fusion; forms stable complexes with vacuole fusion machinery; regulates Vam7p recruitment to vacuoles; role in detoxifying metals (Cd, Hg, As); transports GSSG that is not immediately reduced in cytosol to vacuole; transports unconjugated bilirubin, selenodigluthatione, oxidized glutathione; similar to human cystic fibrosis protein CFTR -S000031914 CDS YDR135C 4 727551 723004 C 2011-02-03 1996-07-31 -S000002544 ORF Verified YDR137W RGP1 chromosome 4 L000001628 4 728259 730250 W 82 2011-02-03 1996-07-31 Subunit of a Golgi membrane exchange factor (Ric1p-Rgp1p); this complex catalyzes nucleotide exchange on Ypt6p -S000032960 CDS YDR137W 4 728259 730250 W 2011-02-03 1996-07-31 -S000002543 ORF Dubious YDR136C VPS61 chromosome 4 4 728283 727711 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 4% of ORF overlaps the verified gene RGP1; deletion causes a vacuolar protein sorting defect -S000032795 CDS YDR136C 4 728283 727711 C 2011-02-03 1996-07-31 -S000002545 ORF Verified YDR138W HPR1 TRF1 chromosome 4 L000000808 4 730578 732836 W 82 2011-02-03 1996-07-31 Subunit of THO/TREX complexes; this complex couple transcription elongation with mitotic recombination and with mRNA metabolism and export, subunit of an RNA Pol II complex; regulates lifespan; involved in telomere maintenance; similar to Top1p -S000033050 CDS YDR138W 4 730578 732836 W 2011-02-03 1996-07-31 -S000002546 ORF Verified YDR139C RUB1 NEDD8 family protein RUB1 chromosome 4 L000003330|L000004485 4 733924 733618 C 2011-02-03 2000-12-01|1996-07-31 Ubiquitin-like protein with similarity to mammalian NEDD8; conjugation (neddylation) substrates include the cullins Cdc53p, Rtt101p, and Cul3p; activated by Ula1p and Uba3p (E1 enzyme pair); conjugation mediated by Ubc12p (E2 enzyme) -S000033098 CDS YDR139C 4 733702 733618 C 2011-02-03 2000-12-01|1996-07-31 -S000033097 CDS YDR139C 4 733924 733776 C 2011-02-03 2000-12-01|1996-07-31 -S000033099 intron YDR139C 4 733775 733703 C 2011-02-03 2000-12-01|1996-07-31 -S000002547 ORF Verified YDR140W MTQ2 S-adenosylmethionine-dependent methyltransferase chromosome 4 4 734138 734803 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent methyltransferase; subunit of complex with Trm112p that methylates translation release factor Sup45p (eRF1) in the ternary complex eRF1-eRF3-GTP; similar to E.coli PrmC; member of the seven beta-strand family -S000036021 CDS YDR140W 4 734138 734803 W 2011-02-03 1996-07-31 -S000002548 ORF Verified YDR141C DOP1 chromosome 4 4 739997 734901 C 2011-02-03 1996-07-31 Golgi-localized, leucine-zipper domain containing protein; involved in endosome to Golgi transport, organization of the ER, establishing cell polarity, and morphogenesis; detected in highly purified mitochondria in high-throughput studies -S000036047 CDS YDR141C 4 739997 734901 C 2011-02-03 1996-07-31 -S000002549 ORF Verified YDR142C PEX7 PEB1|PAS7 chromosome 4 L000001340 4 741600 740473 C 2011-02-03 1996-07-31 Peroxisomal signal receptor for peroxisomal matrix proteins; recognizes the N-terminal nonapeptide signal (PTS2); WD repeat protein; defects in human homolog cause lethal rhizomelic chondrodysplasia punctata (RCDP) -S000036136 CDS YDR142C 4 741600 740473 C 2011-02-03 1996-07-31 -S000002550 ORF Verified YDR143C SAN1 ubiquitin-protein ligase SAN1 chromosome 4 L000001800 4 743874 742042 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase; involved in proteasome-dependent degradation of aberrant nuclear proteins; targets substrates with regions of exposed hydrophobicity containing 5 or more contiguous hydrophobic residues; contains intrinsically disordered regions that contribute to substrate recognition; prefers a window of exposed hydrophobicity that causes a particular level of protein insolubility, suggesting that San1p evolved to target highly aggregation-prone proteins -S000036257 CDS YDR143C 4 743874 742042 C 2011-02-03 1996-07-31 -S000002551 ORF Verified YDR144C MKC7 aspartyl protease|YPS2 chromosome 4 L000003069 4 746101 744311 C 2011-02-03 1996-07-31 GPI-anchored aspartyl protease; member of the yapsin family of proteases involved in cell wall growth and maintenance; shares functions with Yap3p and Kex2p; MKC7 has a paralog, YPS1, that arose from the whole genome duplication -S000036336 CDS YDR144C 4 746101 744311 C 2011-02-03 1996-07-31 -S000002552 ORF Verified YDR145W TAF12 TafII61|TafII68|TAF68|TAF61 chromosome 4 L000003462 4 746738 748357 W 2011-02-03 1996-07-31 Subunit (61/68 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification, similar to histone H2A; overexpression of the human ortholog, TAF12, an oncogene involved in the formation of choroid plexus carcinomas, results in dosage chromosomal instability (dCIN) in a human cell line similar to the dCIN observed in yeast overexpressors -S000037046 CDS YDR145W 4 746738 748357 W 2011-02-03 1996-07-31 -S000119070 ARS ARS451 ARSIV-748|ARS422.5 chromosome 4 4 748392 748637 2011-02-03 2006-10-05 Autonomously Replicating Sequence -S000178072 ARS_consensus_sequence ARS451 4 748456 748472 W 2014-11-18 2014-11-18 -S000002553 ORF Verified YDR146C SWI5 DNA-binding transcription factor SWI5 chromosome 4 L000002253 4 750742 748613 C 2011-02-03 1996-07-31 Transcription factor that recruits Mediator and Swi/Snf complexes; activates transcription of genes expressed at the M/G1 phase boundary and in G1 phase; required for expression of the HO gene controlling mating type switching; localization to nucleus occurs during G1 and appears to be regulated by phosphorylation by Cdc28p kinase; SWI5 has a paralog, ACE2, that arose from the whole genome duplication -S000037075 CDS YDR146C 4 750742 748613 C 2011-02-03 1996-07-31 -S000002554 ORF Verified YDR147W EKI1 bifunctional choline kinase/ethanolamine kinase EKI1 chromosome 4 L000004610 4 751631 753235 W 2011-02-03 1996-07-31 Ethanolamine kinase; primarily responsible for phosphatidylethanolamine synthesis via the CDP-ethanolamine pathway; exhibits some choline kinase activity, thus contributing to phosphatidylcholine synthesis via the CDP-choline pathway; EKI1 has a paralog, CKI1, that arose from the whole genome duplication -S000037235 CDS YDR147W 4 751631 753235 W 2011-02-03 1996-07-31 -S000118438 ARS ARS423 ARSIV-753 chromosome 4 4 753242 753386 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178073 ARS_consensus_sequence ARS423 4 753333 753317 C 2014-11-18 2014-11-18 -S000002555 ORF Verified YDR148C KGD2 alpha-ketoglutarate dehydrogenase KGD2 chromosome 4 L000000898 4 755066 753675 C 2011-02-03 1996-07-31 Dihydrolipoyl transsuccinylase; component of the mitochondrial alpha-ketoglutarate dehydrogenase complex, which catalyzes the oxidative decarboxylation of alpha-ketoglutarate to succinyl-CoA in the TCA cycle; phosphorylated -S000037302 CDS YDR148C 4 755066 753675 C 2011-02-03 1996-07-31 -S000002557 ORF Verified YDR150W NUM1 PAC12 chromosome 4 L000001287 4 755628 763874 W 2011-02-03 1996-07-31 Protein required for nuclear migration; component of the mitochondria-ER-cortex-ancor (MECA); required for the association of mitochondria with the cell cortex and for accurate distribution of mitochondrial network; interacts with Mdm36p to link the ER and mitochondria at the cortex; localizes to the mother cell cortex and the bud tip; may mediate interactions of dynein and cytoplasmic microtubules with the cell cortex -S000031071 CDS YDR150W 4 755628 763874 W 2011-02-03 1996-07-31 -S000002556 ORF Dubious YDR149C chromosome 4 4 756262 755555 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene NUM1/YDR150W; null mutation blocks anaerobic growth -S000029951 CDS YDR149C 4 756262 755555 C 2011-02-03 1996-07-31 -S000002558 ORF Verified YDR151C CTH1 putative mRNA-binding protein CTH1 chromosome 4 L000002772 4 765155 764178 C 2011-02-03 1996-07-31 Member of the CCCH zinc finger family; similar to mammalian Tis11 protein, which activates transcription and also has a role in mRNA degradation; may function with Tis11p in iron homeostasis; CTH1 has a paralog, TIS11, that arose from the whole genome duplication -S000031106 CDS YDR151C 4 765155 764178 C 2011-02-03 1996-07-31 -S000002559 ORF Verified YDR152W GIR2 chromosome 4 4 765706 766503 W 2011-02-03 1996-07-31 Highly-acidic RWD domain-containing cytoplasmic protein; forms a highly conserved complex with Rbg2p that is responsible for efficient cell growth under amino acid starvation and binds translational activator Gcn1p in dose-dependent manner according to stress level; associates with translating ribosomes; intrinsically unstructured protein whose stability is enhanced upon binding Rbg2p -S000031232 CDS YDR152W 4 765706 766503 W 2011-02-03 1996-07-31 -S000002560 ORF Verified YDR153C ENT5 chromosome 4 4 767971 766736 C 2011-02-03 1996-07-31 Protein containing an N-terminal epsin-like domain; involved in clathrin recruitment and traffic between the Golgi and endosomes; associates with the clathrin adaptor Gga2p, clathrin adaptor complex AP-1, and clathrin -S000032164 CDS YDR153C 4 767971 766736 C 2011-02-03 1996-07-31 -S000002561 ORF Dubious YDR154C chromosome 4 4 768753 768403 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant exhibits synthetic phenotype with alpha-synuclein -S000032245 CDS YDR154C 4 768753 768403 C 2011-02-03 1996-07-31 -S000002562 ORF Verified YDR155C CPR1 peptidylprolyl isomerase CPR1|CPH1|CYP1 chromosome 4 L000002663 4 769000 768512 C 2011-02-03 1996-07-31 Cytoplasmic peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; binds the drug cyclosporin A; N-terminally propionylated in vivo; protein abundance increases in response to DNA replication stress -S000032345 CDS YDR155C 4 769000 768512 C 2011-02-03 1996-07-31 -S000002563 ORF Verified YDR156W RPA14 DNA-directed RNA polymerase I subunit RPA14|A14 chromosome 4 L000002883 4 769525 769938 W 2011-02-03 1996-07-31 RNA polymerase I subunit A14 -S000033241 CDS YDR156W 4 769525 769938 W 2011-02-03 1996-07-31 -S000002564 ORF Dubious YDR157W chromosome 4 4 769931 770332 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033302 CDS YDR157W 4 769931 770332 W 2011-02-03 1996-07-31 -S000002565 ORF Verified YDR158W HOM2 aspartate-semialdehyde dehydrogenase|THR2 chromosome 4 L000000799 4 770357 771454 W 92 2011-02-03 1996-07-31 Aspartic beta semi-aldehyde dehydrogenase; catalyzes the second step in the common pathway for methionine and threonine biosynthesis; expression regulated by Gcn4p and the general control of amino acid synthesis -S000033370 CDS YDR158W 4 770357 771454 W 2011-02-03 1996-07-31 -S000002566 ORF Verified YDR159W SAC3 LEP1 chromosome 4 L000001792 4 771877 775782 W 92 2011-02-03 1996-07-31 mRNA export factor; required for biogenesis of the small ribosomal subunit; component of TREX-2 complex (Sac3p-Thp1p-Sus1p-Cdc31p) involved in transcription elongation and mRNA export from the nucleus; involved in post-transcriptional tethering of active genes to the nuclear periphery and to non-nascent mRNP; similar to the human germinal center-associated nuclear protein (GANP) -S000034282 CDS YDR159W 4 771877 775782 W 2011-02-03 1996-07-31 -S000002567 ORF Verified YDR160W SSY1 RAA1|SHR10 chromosome 4 L000004190|L000003184|S000029399|L000001553 4 776163 778721 W 92 2011-02-03 1996-07-31 Component of the SPS plasma membrane amino acid sensor system; senses external amino acid concentration and transmits intracellular signals that result in regulation of expression of amino acid permease genes; other members are Ssy1p, Ptr3p, and Ssy5p -S000034346 CDS YDR160W 4 776163 778721 W 2011-02-03 1996-07-31 -S000002568 ORF Verified YDR161W ACL4 chromosome 4 L000004169 4 779043 780206 W 2011-02-03 1996-07-31 Specific assembly chaperone for ribosomal protein Rpl4p; binds to an evolutionarily conserved surface extension of nascent Rpl4p and chaperones Rpl4p until its assembly into the pre-ribosome; transcriptionally co-regulated with rRNA and ribosome biosynthesis genes -S000035308 CDS YDR161W 4 779043 780206 W 2011-02-03 1996-07-31 -S000002569 ORF Verified YDR162C NBP2 chromosome 4 L000002861 4 781100 780390 C 2011-02-03 1996-07-31 Protein involved in the HOG (high osmolarity glycerol) pathway; negatively regulates Hog1p by recruitment of phosphatase Ptc1p the Pbs2p-Hog1p complex; interacts with Bck1p and down regulates the cell wall integrity pathway; found in the nucleus and cytoplasm, contains an SH3 domain and a Ptc1p binding domain (PBM) -S000035337 CDS YDR162C 4 781100 780390 C 2011-02-03 1996-07-31 -S000002570 ORF Verified YDR163W CWC15 U2-type spliceosomal complex subunit CWC15 chromosome 4 4 781423 781950 W 2011-02-03 1996-07-31 Non-essential protein involved in pre-mRNA splicing; component of a complex containing Cef1p; has similarity to S. pombe Cwf15p -S000035446 CDS YDR163W 4 781423 781950 W 2011-02-03 1996-07-31 -S000002571 ORF Verified YDR164C SEC1 chromosome 4 L000001827 4 784215 782041 C 94.77 2011-02-03 1996-07-31 Sm-like protein involved in docking and fusion of exocytic vesicles; binds to assembled SNARE complexes at the membrane and stimulates membrane fusion; localization to sites of secretion (bud neck and bud tip) is dependent on SNARE function; interacts directly with essential exocyst subunit Sec6p -S000035467 CDS YDR164C 4 784215 782041 C 2011-02-03 1996-07-31 -S000002572 ORF Verified YDR165W TRM82 chromosome 4 4 784871 786205 W 2011-02-03 1996-07-31 Catalytic subunit of a tRNA methyltransferase complex; Trm8p and Trm82p comprise an enzyme that catalyzes a methyl-transfer from S-adenosyl-l-methionine to the N(7) atom of guanine at position 46 in tRNA; Trm8 lacks catalytic activity if not bound to Trm82p; relocalizes to the cytosol in response to hypoxia; mutation in human ortholog WDR4 causes microcephalic primordial dwarfism -S000035563 CDS YDR165W 4 784871 786205 W 2011-02-03 1996-07-31 -S000002573 ORF Verified YDR166C SEC5 exocyst subunit SEC5 chromosome 4 L000001831 4 789221 786306 C 95 2011-02-03 1996-07-31 Essential 107kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion; involved in assembly of the exocyst complex; required with Sec3p for ER inheritance where it promotes anchoring of the cortical ER at the bud tip -S000035593 CDS YDR166C 4 789221 786306 C 2011-02-03 1996-07-31 -S000002574 ORF Verified YDR167W TAF10 TafII25|TAF25|TAF23 chromosome 4 L000003460 4 789449 790069 W 2011-02-03 1996-07-31 Subunit (145 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification -S000036558 CDS YDR167W 4 789449 790069 W 2011-02-03 1996-07-31 -S000002575 ORF Verified YDR168W CDC37 SMO1 chromosome 4 L000000273 4 790328 791848 W 95 2011-02-03 1996-07-31 Essential Hsp90p co-chaperone; necessary for passage through the START phase of the cell cycle; stabilizes protein kinase nascent chains and participates along with Hsp90p in their folding -S000036673 CDS YDR168W 4 790328 791848 W 2011-02-03 1996-07-31 -S000002576 ORF Verified YDR169C STB3 chromosome 4 L000002109 4 793889 792348 C 2011-02-03 1996-07-31 Ribosomal RNA processing element (RRPE)-binding protein; involved in the glucose-induced transition from quiescence to growth; restricted to nucleus in quiescent cells, released into cytoplasm after glucose repletion; binds Sin3p; relative distribution to the nucleus increases upon DNA replication stress -S000036712 CDS YDR169C 4 793889 792348 C 2011-02-03 1996-07-31 -S000028538 ORF Uncharacterized YDR169C-A chromosome 4 4 794723 794574 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031147 CDS YDR169C-A 4 794723 794574 C 2011-02-03 2003-07-29 -S000002577 ORF Verified YDR170C SEC7 Arf family guanine nucleotide exchange factor SEC7 chromosome 4 L000001833 4 802222 796193 C 96 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for ADP ribosylation factors; involved in proliferation of the Golgi, intra-Golgi transport and ER-to-Golgi transport; found in the cytoplasm and on Golgi-associated coated vesicles -S000036405 CDS YDR170C 4 802222 796193 C 2011-02-03 1996-07-31 -S000006695 tRNA_gene tQ(UUG)D3 chromosome 4 L000003783 4 802802 802731 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034813 noncoding_exon tQ(UUG)D3 4 802802 802731 C 2011-02-03 2000-05-19 -S000006865 long_terminal_repeat YDRWdelta11 chromosome 4 4 802905 803235 W 2011-02-03 2000-05-19 Ty1 LTR -S000007227 transposable_element_gene YDR170W-A gag protein chromosome 4 4 803195 804517 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag; YDR170W-A is part of a mutant retrotransposon; distribution in the cytoplasm becomes irregular rather than punctate upon DNA replication stress -S000036096 CDS YDR170W-A 4 803195 804517 W 2011-02-03 1999-07-17 -S000118439 ARS ARS425 ARSIV-806 chromosome 4 4 806052 806277 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178074 ARS_consensus_sequence ARS425 4 806099 806115 W 2014-11-18 2014-11-18 -S000002578 ORF Verified YDR171W HSP42 heat shock protein HSP42 chromosome 4 L000003095 4 806621 807748 W 2011-02-03 1996-07-31 Small heat shock protein (sHSP) with chaperone activity; forms barrel-shaped oligomers that suppress unfolded protein aggregation; involved in cytoskeleton reorganization after heat shock; protein abundance increases and forms cytoplasmic foci in response to DNA replication stress -S000030208 CDS YDR171W 4 806621 807748 W 2011-02-03 1996-07-31 -S000002579 ORF Verified YDR172W SUP35 translation termination factor GTPase eRF3|eRF3|[PSI(+)]|[PSI]|SUP36|SUP2|SUF12|SAL3|PNM2|GST1 chromosome 4 L000002200 4 808324 810381 W 142.87 2011-02-03 1996-07-31 Translation termination factor eRF3; has a role in mRNA deadenylation and decay; altered protein conformation creates the [PSI(+)] prion that modifies cellular fitness, alters translational fidelity by affecting reading frame selection, and results in a nonsense suppressor phenotype; many stress-response genes are repressed in the presence of [PSI(+)] -S000030332 CDS YDR172W 4 808324 810381 W 2011-02-03 1996-07-31 -S000002580 ORF Verified YDR173C ARG82 inositol polyphosphate multikinase|ARGRIII|IPK2|ARGR3 chromosome 4 L000002727 4 811632 810565 C 95 2011-02-03 1996-07-31 Inositol polyphosphate multikinase (IPMK); sequentially phosphorylates Ins(1,4,5)P3 to form Ins(1,3,4,5,6)P5; also has diphosphoinositol polyphosphate synthase activity; regulates arginine-, phosphate-, and nitrogen-responsive genes -S000030416 CDS YDR173C 4 811632 810565 C 2011-02-03 1996-07-31 -S000002581 ORF Verified YDR174W HMO1 HSM2 chromosome 4 L000003234 4 812110 812850 W 2011-02-03 1996-07-31 Chromatin associated high mobility group (HMG) family member; involved in compacting, bending, bridging and looping DNA; rDNA-binding component that regulates transcription from RNA polymerase I promoters; regulates start site selection of ribosomal protein genes via RNA polymerase II promoters; role in genome maintenance; associates with a 5'-3' DNA helicase and Fpr1p, a prolyl isomerase; relocalizes to the cytosol in response to hypoxia -S000031344 CDS YDR174W 4 812110 812850 W 2011-02-03 1996-07-31 -S000002582 ORF Verified YDR175C RSM24 mitochondrial 37S ribosomal protein RSM24 chromosome 4 4 814152 813193 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000031376 CDS YDR175C 4 814152 813193 C 2011-02-03 1996-07-31 -S000002583 ORF Verified YDR176W NGG1 histone acetyltransferase NGG1|SWI7|ADA3 chromosome 4 L000001241 4 814452 816560 W 2011-02-03 1996-07-31 Subunit of chromatin modifying histone acetyltransferase complexes; member of the ADA complex, the SAGA complex, and the SLIK complex; transcriptional regulator involved in glucose repression of Gal4p-regulated genes -S000031512 CDS YDR176W 4 814452 816560 W 2011-02-03 1996-07-31 -S000002584 ORF Verified YDR177W UBC1 E2 ubiquitin-conjugating protein UBC1 chromosome 4 L000002406 4 816878 817525 W 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme; key E2 partner with Ubc4p for the anaphase-promoting complex (APC); mediates selective degradation of short-lived and abnormal proteins; plays a role in vesicle biogenesis and ER-associated protein degradation (ERAD); component of the cellular stress response; protein abundance increases in response to DNA replication stress key E2 partner with Ubc4p for the anaphase-promoting complex (APC) -S000031590 CDS YDR177W 4 816878 817525 W 2011-02-03 1996-07-31 -S000002585 ORF Verified YDR178W SDH4 succinate dehydrogenase membrane anchor subunit SDH4|ACN18 chromosome 4 L000001826 4 817950 818495 W 2011-02-03 1996-07-31 Membrane anchor subunit of succinate dehydrogenase (SDH); involved in coupling the oxidation of succinate to the transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; has similarity to human SDH subunit D (SDHD), which is implicated in paraganglioma -S000032569 CDS YDR178W 4 817950 818495 W 2011-02-03 1996-07-31 -S000002586 ORF Verified YDR179C CSN9 chromosome 4 S000007578 4 819196 818708 C 2011-02-03 1996-07-31 Subunit of the Cop9 signalosome; Cop9 signalosome is required for deneddylation, or removal of the ubiquitin-like protein Rub1p from Cdc53p (cullin); involved in adaptation to pheromone signaling -S000032647 CDS YDR179C 4 819196 818708 C 2011-02-03 1996-07-31 -S000002587 ORF Verified YDR179W-A NVJ3 chromosome 4 4 819433 820824 W 2011-02-03 2004-07-21|1996-07-31 Protein with a potential role in tethering ER and vacuoles; localizes to nucleus-vacuole junctions in an Mdm1p-dependent manner; contains a lipid-binding PXA domain -S000037444 CDS YDR179W-A 4 819433 820824 W 2011-02-03 2004-07-21|1996-07-31 -S000002588 ORF Verified YDR180W SCC2 cohesin-loading factor complex subunit SCC2 chromosome 4 L000004262 4 821295 825776 W 2011-02-03 1996-07-31 Subunit of cohesin loading factor (Scc2p-Scc4p); a complex required for loading of cohesin complexes onto chromosomes; involved in establishing sister chromatid cohesion during DSB repair via histone H2AX; promotes gene expression program that supports translational fidelity; evolutionarily-conserved adherin; relocalizes to cytosol in response to hypoxia; human disorder Cornelia de Lange syndrome is caused by mutations in NIPBL, the human ortholog of SCC2 -S000034456 CDS YDR180W 4 821295 825776 W 2011-02-03 1996-07-31 -S000002589 ORF Verified YDR181C SAS4 chromosome 4 L000004214 4 827355 825910 C 2011-02-03 1996-07-31 Subunit of the SAS complex (Sas2p, Sas4p, Sas5p); acetylates free histones and nucleosomes and regulates transcriptional silencing; required for the HAT activity of Sas2p -S000034496 CDS YDR181C 4 827355 825910 C 2011-02-03 1996-07-31 -S000002590 ORF Verified YDR182W CDC1 putative lipid phosphatase CDC1|ESP2|DSR1|DSC1 chromosome 4 L000000241 4 827582 829057 W 2011-02-03 1996-07-31 Putative mannose-ethanolamine phosphate phosphodiesterase; involved in GPI-anchor remodeling prior to the attachment of cell wall proteins to beta 1,3-glucan, removing ethanolamine phosphate from the first mannose of GPI anchors; mutants display elevated Ca2+-dependent signaling resulting in secondary actin polarization and Golgi inheritance defects; enzyme is Mn2+-dependent; mutants have cell division cycle defect and fragile cell walls -S000034637 CDS YDR182W 4 827582 829057 W 2011-02-03 1996-07-31 -S000028539 ORF Uncharacterized YDR182W-A chromosome 4 4 829151 829354 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031148 CDS YDR182W-A 4 829151 829354 W 2011-02-03 2003-07-29 -S000002591 ORF Verified YDR183W PLP1 chromosome 4 L000003424 4 829585 830277 W 2011-02-03 1996-07-31 Protein that interacts with CCT (chaperonin containing TCP-1) complex; has a role in actin and tubulin folding; has weak similarity to phosducins, which are G-protein regulators -S000034709 CDS YDR183W 4 829585 830277 W 2011-02-03 1996-07-31 -S000028540 ORF Dubious YDR183C-A chromosome 4 4 830654 830397 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR -S000031190 CDS YDR183C-A 4 830654 830397 C 2011-02-03 2003-07-29 -S000002592 ORF Verified YDR184C ATC1 LIC4 chromosome 4 L000004405 4 831513 830629 C 2011-02-03 1996-07-31 Nuclear protein; possibly involved in regulation of cation stress responses and/or in the establishment of bipolar budding pattern; relative distribution to the nucleus decreases upon DNA replication stress -S000034749 CDS YDR184C 4 831513 830629 C 2011-02-03 1996-07-31 -S000002593 ORF Verified YDR185C UPS3 GEP2 chromosome 4 4 832473 831934 C 2011-02-03 1996-07-31 Mitochondrial protein of unknown function; similar to Ups1p and Ups2p which are involved in regulation of mitochondrial cardiolipin and phosphatidylethanolamine levels; null is viable but interacts synthetically with ups1 and ups2 mutations; UPS3 has a paralog, UPS2, that arose from the whole genome duplication -S000035675 CDS YDR185C 4 832473 831934 C 2011-02-03 1996-07-31 -S000002594 ORF Verified YDR186C SND1 chromosome 4 4 835492 832859 C 2011-02-03 1996-07-31 Protein involved in SRP-independent targeting of substrates to the ER; component of an alternative ER targeting pathway that has partial functional redundancy with the GET pathway; preference for substrates with downstream transmembrane domains; interacts with Env10p/Snd2p and Pho88p/Snd3p; can compensate for loss of SRP; may interact with ribosomes, based on co-purification experiments; GFP-fusion protein localizes to the cytoplasm -S000035744 CDS YDR186C 4 835492 832859 C 2011-02-03 1996-07-31 -S000002596 ORF Verified YDR188W CCT6 chaperonin-containing T-complex subunit CCT6|TCP20|TCP6|HTR3 chromosome 4 L000002271 4 836421 838061 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, essential protein that is required for the assembly of actin and tubulins in vivo; contains an ATP-binding motif -S000036804 CDS YDR188W 4 836421 838061 W 2011-02-03 1996-07-31 -S000002595 ORF Dubious YDR187C chromosome 4 4 836746 836228 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified, essential ORF CCT6/YDR188W -S000035828 CDS YDR187C 4 836746 836228 C 2011-02-03 1996-07-31 -S000002597 ORF Verified YDR189W SLY1 syntaxin-binding protein chromosome 4 L000001923 4 838392 840392 W 2011-02-03 1996-07-31 Hydrophilic protein involved in ER/Golgi vesicle trafficking; SM (Sec1/Munc-18) family protein that binds the tSNARE Sed5p and stimulates its assembly into a trans-SNARE membrane-protein complex -S000036882 CDS YDR189W 4 838392 840392 W 2011-02-03 1996-07-31 -S000002598 ORF Verified YDR190C RVB1 RuvB family ATP-dependent DNA helicase pontin|TIP49|TIH1|TIP49A chromosome 4 S000007843 4 841995 840604 C 2011-02-03 1996-07-31 ATP-dependent DNA helicase, also known as pontin; member of the AAA+ and RuvB-like protein families; similar to Rvb2p; conserved component of multiple complexes including the INO80 complex, the Swr1 complex, and the R2TP complex (Rvb1-Rvb2-Tah1-Pih1); involved in multiple processes such as chromatin remodeling, box C/D snoRNP assembly, and RNA polymerase II assembly -S000036562 CDS YDR190C 4 841995 840604 C 2011-02-03 1996-07-31 -S000002599 ORF Verified YDR191W HST4 NAD-dependent histone deacetylase HST4 chromosome 4 L000003043 4 842337 843449 W 2011-02-03 1996-07-31 NAD(+)-dependent protein deacetylase; deacetylation targets are primarily mitochondrial proteins; involved along with Hst3p in silencing at telomeres, cell cycle progression, radiation resistance, genomic stability and short-chain fatty acid metabolism; accumulates in mitochondria in response to biotin starvation and may link biotin metabolism with energy homeostasis; member of the Sir2 family and may be the functional equivalent of human SIRT3 -S000036688 CDS YDR191W 4 842337 843449 W 2011-02-03 1996-07-31 -S000002601 ORF Dubious YDR193W chromosome 4 4 844554 844952 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030657 CDS YDR193W 4 844554 844952 W 2011-02-03 1996-07-31 -S000002600 ORF Verified YDR192C NUP42 FG-nucleoporin NUP42|UIP1|RIP1 chromosome 4 L000002940 4 844861 843569 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; also part of the nuclear pore complex (NPC) cytoplasmic filaments; contributes directly to nucleocytoplasmic transport and maintenance of the NPC permeability barrier and is involved in gene tethering at the nuclear periphery; interacts with Gle1p -S000036723 CDS YDR192C 4 844861 843569 C 2011-02-03 1996-07-31 -S000002602 ORF Verified YDR194C MSS116 ATP-dependent RNA helicase chromosome 4 L000001206 4 847946 845952 C 2011-02-03 1996-07-31 Mitochondrial transcription elongation factor; DEAD-box protein; required for efficient splicing of mitochondrial Group I and II introns; non-polar RNA helicase that also facilities strand annealing; promotes RNA folding by stabilizing an early assembly intermediate -S000030696 CDS YDR194C 4 847946 845952 C 2011-02-03 1996-07-31 -S000028541 ORF Uncharacterized YDR194W-A chromosome 4 4 848071 848223 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031191 CDS YDR194W-A 4 848071 848223 W 2011-02-03 2003-07-29 -S000002603 ORF Verified YDR195W REF2 RNA-processing protein REF2 chromosome 4 L000002661 4 848599 850200 W 2011-02-03 1996-07-31 RNA-binding protein; involved in the cleavage step of mRNA 3'-end formation prior to polyadenylation, and in snoRNA maturation; part of holo-CPF subcomplex APT, which associates with 3'-ends of snoRNA- and mRNA-encoding genes; putative regulatory subunit of type 1 protein phosphatase Glc7p, required for actomyosin ring formation, and for timely dephosphorylation and release of Bnr1p from the division site; relocalizes to the cytosol in response to hypoxia -S000030881 CDS YDR195W 4 848599 850200 W 2011-02-03 1996-07-31 -S000002604 ORF Verified YDR196C CAB5 putative dephospho-CoA kinase chromosome 4 4 850999 850274 C 2011-02-03 1996-07-31 Subunit of the CoA-Synthesizing Protein Complex (CoA-SPC); subunits of this complex are: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p; probable dephospho-CoA kinase (DPCK) that catalyzes the last step in coenzyme A biosynthesis; null mutant lethality is complemented by human homolog DCAKD and by E. coli coaE (encoding DPCK); detected in purified mitochondria in high-throughput studies; also localized to lipid droplets -S000031739 CDS YDR196C 4 850999 850274 C 2011-02-03 1996-07-31 -S000002605 ORF Verified YDR197W CBS2 CBP7 chromosome 4 L000000231 4 851228 852397 W 2011-02-03 1996-07-31 Mitochondrial translational activator of the COB mRNA; interacts with translating ribosomes, acts on the COB mRNA 5'-untranslated leader -S000032020 CDS YDR197W 4 851228 852397 W 2011-02-03 1996-07-31 -S000002606 ORF Verified YDR198C RKM2 protein-lysine N-methyltransferase chromosome 4 4 853972 852533 C 2011-02-03 1996-07-31 Ribosomal protein lysine methyltransferase; responsible for trimethylation of the lysine residue at position 3 of Rpl12Ap and Rpl12Bp -S000032059 CDS YDR198C 4 853972 852533 C 2011-02-03 1996-07-31 -S000002607 ORF Dubious YDR199W chromosome 4 4 854175 854540 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene VPS64/YDR200C; computationally predicted to have thiol-disulfide oxidoreductase activity -S000033057 CDS YDR199W 4 854175 854540 W 2011-02-03 1996-07-31 -S000002608 ORF Verified YDR200C VPS64 FAR9 chromosome 4 4 856093 854279 C 2011-02-03 1996-07-31 Protein required for cytoplasm to vacuole targeting of proteins; forms a complex with Far3p and Far7p to Far11p involved in recovery from pheromone-induced cell cycle arrest; mutant has increased aneuploidy tolerance; VPS64 has a paralog, FAR10, that arose from the whole genome duplication -S000037661 CDS YDR200C 4 856093 854279 C 2011-02-03 1996-07-31 -S000002609 ORF Verified YDR201W SPC19 chromosome 4 L000004693 4 856317 856814 W 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; also localized to nuclear side of spindle pole body -S000030528 CDS YDR201W 4 856317 856814 W 2011-02-03 1996-07-31 -S000002611 ORF Dubious YDR203W chromosome 4 4 857682 857999 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF RAV2/YDR202C -S000030685 CDS YDR203W 4 857682 857999 W 2011-02-03 1996-07-31 -S000002610 ORF Verified YDR202C RAV2 chromosome 4 4 857953 856898 C 2011-02-03 1996-07-31 Subunit of RAVE complex (Rav1p, Rav2p, Skp1p); the RAVE complex associates with the V1 domain of the vacuolar membrane (H+)-ATPase (V-ATPase) and promotes assembly and reassembly of the holoenzyme -S000030555 CDS YDR202C 4 857953 856898 C 2011-02-03 1996-07-31 -S000002612 ORF Verified YDR204W COQ4 ubiquinone biosynthesis protein COQ4 chromosome 4 L000003957 4 858137 859144 W 2011-02-03 1996-07-31 Protein with a role in ubiquinone (Coenzyme Q) biosynthesis; possibly functioning in stabilization of Coq7p; located on matrix face of mitochondrial inner membrane; component of a mitochondrial ubiquinone-synthesizing complex; human homolog COQ4 can complement yeast coq4 null mutant -S000030757 CDS YDR204W 4 858137 859144 W 2011-02-03 1996-07-31 -S000002613 ORF Verified YDR205W MSC2 metal cation transporter MSC2 chromosome 4 4 859346 861520 W 2011-02-03 2003-09-22|1996-07-31 Endoplasmic reticulum zinc transporter; part of a heterodimeric transporter with Zrg17p that transfers zinc from the cytosol to the ER lumen; member of the cation diffusion facilitator family of efflux pumps; localizes to ER and nucleus; mutations affect the cellular distribution of zinc and also confer defects in meiotic recombination between homologous chromatids -S000031604 CDS YDR205W 4 859346 861520 W 2011-02-03 2003-09-22|1996-07-31 -S000002614 ORF Verified YDR206W EBS1 chromosome 4 L000004629 4 862054 864708 W 2011-02-03 1996-07-31 Protein involved in translation inhibition and nonsense-mediated decay; interacts with cap binding protein Cdc33p and with Nam7p; localizes to P-bodies upon glucose starvation; mRNA abundance regulated by mRNA decay factors; EBS1 has a paralog, EST1, that arose from the whole genome duplication -S000031711 CDS YDR206W 4 862054 864708 W 2011-02-03 1996-07-31 -S000002615 ORF Verified YDR207C UME6 DNA-binding transcriptional regulator UME6|RIM16|NIM2|CAR80 chromosome 4 L000002426 4 867522 865012 C 2011-02-03 1996-07-31 Rpd3L histone deacetylase complex subunit; key transcriptional regulator of early meiotic genes; involved in chromatin remodeling and transcriptional repression via DNA looping; binds URS1 upstream regulatory sequence, represses transcription by recruiting conserved histone deacetylase Rpd3p (through co-repressor Sin3p) and chromatin-remodeling factor Isw2p; couples metabolic responses to nutritional cues with initiation and progression of meiosis, forms compl -S000031768 CDS YDR207C 4 867522 865012 C 2011-02-03 1996-07-31 -S000002616 ORF Verified YDR208W MSS4 1-phosphatidylinositol-4-phosphate 5-kinase chromosome 4 L000001203 4 868224 870563 W 2011-02-03 1996-07-31 Phosphatidylinositol-4-phosphate 5-kinase; involved in actin cytoskeleton organization and cell morphogenesis; multicopy suppressor of stt4 mutation -S000031959 CDS YDR208W 4 868224 870563 W 2011-02-03 1996-07-31 -S000002618 ORF Uncharacterized YDR210W chromosome 4 4 871074 871301 W 2011-02-03 1996-07-31 Predicted tail-anchored plasma membrane protein; contains a conserved CYSTM module; related proteins in other organisms may be involved in response to stress; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery -S000034858 CDS YDR210W 4 871074 871301 W 2011-02-03 1996-07-31 -S000002617 ORF Uncharacterized YDR209C chromosome 4 4 871449 871036 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR209C is not an essential gene; partially overlaps uncharacterized gene YDR210W -S000032797 CDS YDR209C 4 871449 871036 C 2011-02-03 1996-07-31 -S000006867 long_terminal_repeat YDRWdelta13 chromosome 4 4 871821 872152 W 2011-02-03 2000-05-19 Ty1 LTR -S000006884 LTR_retrotransposon YDRWTy2-2 Ty2 chromosome 4 4 871821 877779 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007392 transposable_element_gene YDR210W-A gag protein chromosome 4 4 872112 873428 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000029817 CDS YDR210W-A 4 872112 873428 W 2011-02-03 1999-07-17 -S000007393 transposable_element_gene YDR210W-B gag-pol fusion protein chromosome 4 4 872112 877425 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000029819 CDS YDR210W-B 4 872112 873404 W 2011-02-03 1999-07-17 -S000029820 CDS YDR210W-B 4 873406 877425 W 2011-02-03 1999-07-17 -S000029821 plus_1_translational_frameshift YDR210W-B 4 873405 873405 W 2011-02-03 1999-07-17 -S000006868 long_terminal_repeat YDRWdelta14 chromosome 4 4 877448 877779 W 2011-02-03 2000-05-19 Ty1 LTR -S000007410 transposable_element_gene YDR210C-D gag-pol fusion protein|YDR210W-D chromosome 4 4 883927 878659 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000029824 CDS YDR210C-D 4 882621 878659 C 2011-02-03 1999-07-17 -S000029823 CDS YDR210C-D 4 883927 882623 C 2011-02-03 1999-07-17 -S000029825 plus_1_translational_frameshift YDR210C-D 4 882622 882622 C 2011-02-03 1999-07-17 -S000007409 transposable_element_gene YDR210C-C gag protein|YDR210W-C chromosome 4 4 883927 882605 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000029822 CDS YDR210C-C 4 883927 882605 C 2011-02-03 1999-07-17 -S000006860 LTR_retrotransposon YDRCTy1-2 Ty1 chromosome 4 4 884220 878303 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006613 tRNA_gene tI(UAU)D chromosome 4 L000003769 4 884361 884493 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000035113 intron tI(UAU)D 4 884398 884457 W 2011-02-03 2000-05-19 -S000035111 noncoding_exon tI(UAU)D 4 884361 884397 W 2011-02-03 2000-05-19 -S000035112 noncoding_exon tI(UAU)D 4 884458 884493 W 2011-02-03 2000-05-19 -S000002619 ORF Verified YDR211W GCD6 translation initiation factor eIF2B catalytic subunit epsilon chromosome 4 L000000674 4 884727 886865 W 2011-02-03 1996-07-31 Catalytic epsilon subunit of the translation initiation factor eIF2B; eIF2B is the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression; forms cytoplasmic foci upon DNA replication stress -S000034999 CDS YDR211W 4 884727 886865 W 2011-02-03 1996-07-31 -S000002620 ORF Verified YDR212W TCP1 chaperonin-containing T-complex alpha subunit TCP1|CCT1 chromosome 4 L000002267 4 887232 888911 W 127 2011-02-03 1996-07-31 Alpha subunit of chaperonin-containing T-complex; complex mediates protein folding in the cytosol; involved in actin cytoskeleton maintenance; overexpression in neurons suppresses formation of pathogenic conformations of huntingtin protein -S000035134 CDS YDR212W 4 887232 888911 W 2011-02-03 1996-07-31 -S000002621 ORF Verified YDR213W UPC2 MOX4 chromosome 4 4 889751 892492 W 2011-02-03 1996-07-31 Sterol regulatory element binding protein; induces sterol biosynthetic genes, upon sterol depletion; acts as a sterol sensor, binding ergosterol in sterol rich conditions; relocates from intracellular membranes to perinuclear foci upon sterol depletion; redundant activator of filamentation with ECM22, up-regulating the expression of filamentous growth genes; contains a Zn[2]-Cys[6] binuclear cluster; UPC2 has a paralog, ECM22, that arose from the whole genome duplication -S000036022 CDS YDR213W 4 889751 892492 W 2011-02-03 1996-07-31 -S000002622 ORF Verified YDR214W AHA1 chromosome 4 4 892875 893927 W 2011-02-03 1996-07-31 Co-chaperone that binds Hsp82p and activates its ATPase activity; plays a role in determining prion variants; similar to Hch1p; expression is regulated by stresses such as heat shock; protein abundance increases in response to DNA replication stress -S000036092 CDS YDR214W 4 892875 893927 W 2011-02-03 1996-07-31 -S000002623 ORF Dubious YDR215C chromosome 4 4 894502 894089 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant displays elevated sensitivity to expression of a mutant huntingtin fragment or of alpha-synuclein -S000036137 CDS YDR215C 4 894502 894089 C 2011-02-03 1996-07-31|2011-02-03 -S000002624 ORF Verified YDR216W ADR1 DNA-binding transcription factor ADR1 chromosome 4 L000000050 4 895035 899006 W 125 2011-02-03 1996-07-31 Carbon source-responsive zinc-finger transcription factor; required for transcription of the glucose-repressed gene ADH2, of peroxisomal protein genes, and of genes required for ethanol, glycerol, and fatty acid utilization -S000036296 CDS YDR216W 4 895035 899006 W 2011-02-03 1996-07-31 -S000130175 ARS ARS427 chromosome 4 4 899051 899596 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000002625 ORF Verified YDR217C RAD9 chromatin-binding protein RAD9 chromosome 4 L000001562 4 903480 899551 C 126 2011-02-03 1996-07-31 DNA damage-dependent checkpoint protein; required for cell-cycle arrest in G1/S, intra-S, and G2/M, plays a role in postreplication repair (PRR) pathway; transmits checkpoint signal by activating Rad53p and Chk1p; hyperphosphorylated by Mec1p and Tel1p; multiple cyclin dependent kinase consensus sites and the C-terminal BRCT domain contribute to DNA damage checkpoint activation; Rad9p Chk1 Activating Domain (CAD) is phosphorylated at multiple sites by Cdc28p/Clb2p -S000036338 CDS YDR217C 4 903480 899551 C 2011-02-03 1996-07-31 -S000002626 ORF Verified YDR218C SPR28 septin SPR28 chromosome 4 L000004150 4 905052 903781 C 2011-02-03 1996-07-31 Sporulation-specific homolog of the CDC3/10/11/12 family of genes; meiotic septin expressed at high levels during meiotic divisions and ascospore formation; the yeast CDC3/10/11/12 family is a family of bud neck microfilament genes -S000037012 CDS YDR218C 4 905052 903781 C 2011-02-03 1996-07-31 -S000002627 ORF Verified YDR219C MFB1 chromosome 4 4 906852 905455 C 2011-02-03 1996-07-31 Mitochondria-associated F-box protein; involved in maintenance of normal mitochondrial morphology; interacts with Skp1p through the F-box motif; preferentially localizes to the mother cell during budding -S000037083 CDS YDR219C 4 906852 905455 C 2011-02-03 1996-07-31 -S000002628 ORF Dubious YDR220C chromosome 4 4 907293 907000 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant exhibits synthetic phenotype with alpha-synuclein -S000037911 CDS YDR220C 4 907293 907000 C 2011-02-03 1996-07-31 -S000002629 ORF Verified YDR221W GTB1 chromosome 4 4 907330 909438 W 2011-02-03 1996-07-31 Glucosidase II beta subunit, forms a complex with alpha subunit Rot2p; involved in removal of two glucose residues from N-linked glycans during glycoprotein biogenesis in the ER; relocalizes from ER to cytoplasm upon DNA replication stress -S000029995 CDS YDR221W 4 907330 909438 W 2011-02-03 1996-07-31 -S000002630 ORF Uncharacterized YDR222W chromosome 4 4 910054 911301 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; YDR222W has a paralog, YLR225C, that arose from the whole genome duplication -S000030976 CDS YDR222W 4 910054 911301 W 2011-02-03 1996-07-31 -S000002631 ORF Verified YDR223W CRF1 chromosome 4 4 912099 913502 W 2011-02-03 1996-07-31 Transcriptional corepressor; involved in repression of ribosomal protein (RP) gene transcription via the TOR signaling pathway which promotes accumulation of Crf1p in the nucleus; role in repression of RP genes varies by strain; CRF1 has a paralog, IFH1, that arose from the whole genome duplication -S000031073 CDS YDR223W 4 912099 913502 W 2011-02-03 1996-07-31 -S000118440 ARS ARS428 ARSIV-914 chromosome 4 4 913790 914038 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178075 ARS_consensus_sequence ARS428 4 913856 913872 W 2014-11-18 2014-11-18 -S000002632 ORF Verified YDR224C HTB1 histone H2B|SPT12 chromosome 4 L000000829 4 914712 914317 C 132 2011-02-03 1996-07-31 Histone H2B; core histone protein required for chromatin assembly and chromosome function; nearly identical to HTB2; Rad6p-Bre1p-Lge1p mediated ubiquitination regulates reassembly after DNA replication, transcriptional activation, meiotic DSB formation and H3 methylation -S000031108 CDS YDR224C 4 914712 914317 C 2011-02-03 1996-07-31 -S000002633 ORF Verified YDR225W HTA1 histone H2A|SPT11|H2A1 chromosome 4 L000000827 4 915530 915928 W 132 2011-02-03 1996-07-31 Histone H2A; core histone protein required for chromatin assembly and chromosome function; one of two nearly identical subtypes (see also HTA2); DNA damage-dependent phosphorylation by Mec1p facilitates DNA repair; acetylated by Nat4p; N-terminally propionylated in vivo -S000031234 CDS YDR225W 4 915530 915928 W 2011-02-03 1996-07-31 -S000002634 ORF Verified YDR226W ADK1 adenylate kinase ADK1|AKY2|AKY1 chromosome 4 L000000046 4 916486 917154 W 133 2011-02-03 1996-07-31 Adenylate kinase, required for purine metabolism; localized to the cytoplasm and the mitochondria; lacks cleavable signal sequence; protein abundance increases in response to DNA replication stress; mutations affecting Adk1p catalytic activity deregulate expression of phosphate utilization genes PHO5 and PHO84; human homolog AK1 can complement yeast adk1 mutant -S000032219 CDS YDR226W 4 916486 917154 W 2011-02-03 1996-07-31 -S000002635 ORF Verified YDR227W SIR4 chromatin-silencing protein SIR4|UTH2|STE9|ASD1 chromosome 4 L000001897 4 917571 921647 W 128 2011-02-03 1996-07-31 SIR protein involved in assembly of silent chromatin domains; silent information regulator (SIR) along with SIR2 and SIR3; involved in assembly of silent chromatin domains at telomeres and the silent mating-type loci; some alleles of SIR4 prolong lifespan; required for telomere hypercluster formation in quiescent yeast cells -S000032314 CDS YDR227W 4 917571 921647 W 2011-02-03 1996-07-31 -S000118441 ARS ARS429 ARSIV-922 chromosome 4 4 921692 921939 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178076 ARS_consensus_sequence ARS429 4 921736 921752 W 2014-11-18 2014-11-18 -S000002636 ORF Verified YDR228C PCF11 chromosome 4 L000004116 4 923806 921926 C 2011-02-03 1996-07-31 mRNA 3' end processing factor; essential component of cleavage and polyadenylation factor IA (CF IA), involved in pre-mRNA 3' end processing and in transcription termination; binds C-terminal domain of largest subunit of RNA pol II (Rpo21p); required for gene looping; relocalizes to the cytosol in response to hypoxia -S000032352 CDS YDR228C 4 923806 921926 C 2011-02-03 1996-07-31 -S000002637 ORF Verified YDR229W IVY1 chromosome 4 4 924785 926146 W 2011-02-03 1996-07-31 Phospholipid-binding protein that interacts with both Ypt7p and Vps33p; may partially counteract the action of Vps33p and vice versa, localizes to the rim of the vacuole as cells approach stationary phase -S000033246 CDS YDR229W 4 924785 926146 W 2011-02-03 1996-07-31 -S000002638 ORF Dubious YDR230W chromosome 4 4 926223 926570 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene COX20/YDR231C -S000034096 CDS YDR230W 4 926223 926570 W 2011-02-03 1996-07-31 -S000002639 ORF Verified YDR231C COX20 chromosome 4 S000007474 4 926910 926293 C 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; required for proteolytic processing of Cox2p and its assembly into cytochrome c oxidase -S000034128 CDS YDR231C 4 926910 926293 C 2011-02-03 1996-07-31 -S000002640 ORF Verified YDR232W HEM1 5-aminolevulinate synthase|OLE3|CYD1 chromosome 4 L000000760 4 927452 929098 W 2011-02-03 1996-07-31 5-aminolevulinate synthase; catalyzes the first step in the heme biosynthetic pathway; an N-terminal signal sequence is required for localization to the mitochondrial matrix; expression is regulated by Hap2p-Hap3p; has a pyridoxal phosphate cofactor whose insertion is mediated by Mcx1p -S000034287 CDS YDR232W 4 927452 929098 W 2011-02-03 1996-07-31 -S000002641 ORF Verified YDR233C RTN1 chromosome 4 4 930357 929470 C 2011-02-03 1996-07-31 Reticulon protein; involved in nuclear pore assembly and maintenance of tubular ER morphology; promotes membrane curvature; regulates the ER asymmetry-induced inheritance block during ER stress; role in ER-derived peroxisomal biogenesis; increases tubular ER when overexpressed; mutants have reduced phosphatidylserine transfer between the ER and mitochondria; interacts with exocyst subunit Sec6p, Yip3p, and Sbh1p; member of the RTNLA subfamily -S000034311 CDS YDR233C 4 930357 929470 C 2011-02-03 1996-07-31 -S000002642 ORF Verified YDR234W LYS4 homoaconitate hydratase LYS4|LYS3 chromosome 4 L000000966 4 931129 933210 W 145.87 2011-02-03 1996-07-31 Homoaconitase; catalyzes the conversion of homocitrate to homoisocitrate, which is a step in the lysine biosynthesis pathway -S000035310 CDS YDR234W 4 931129 933210 W 2011-02-03 1996-07-31 -S000002643 ORF Verified YDR235W PRP42 mRNA splicing protein PRP42|SNU65|MUD16 chromosome 4 L000003969 4 933504 935138 W 2011-02-03 1996-07-31 U1 snRNP protein involved in splicing; required for U1 snRNP biogenesis; contains multiple tetriatricopeptide repeats -S000035386 CDS YDR235W 4 933504 935138 W 2011-02-03 1996-07-31 -S000002644 ORF Verified YDR236C FMN1 riboflavin kinase chromosome 4 4 935892 935236 C 2011-02-03 1996-07-31 Riboflavin kinase, produces riboflavin monophosphate (FMN); FMN is a necessary cofactor for many enzymes; predominantly localizes to the microsomal fraction and also found in the mitochondrial inner membrane; human RFK functionally complements the lethality of the null mutation -S000035407 CDS YDR236C 4 935892 935236 C 2011-02-03 1996-07-31 -S000002645 ORF Verified YDR237W MRPL7 mitochondrial 54S ribosomal protein YmL7/YmL5|YmL7|YmL5 chromosome 4 L000002684 4 936615 937493 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; MRPL7 produces both YmL5 and YmL7, which are two different modified forms of the same protein -S000035502 CDS YDR237W 4 936615 937493 W 2011-02-03 1996-07-31 -S000002646 ORF Verified YDR238C SEC26 coatomer subunit beta chromosome 4 L000001847 4 940816 937895 C 2011-02-03 1996-07-31 Essential beta-coat protein of the COPI coatomer; involved in ER-to-Golgi protein trafficking and maintenance of normal ER morphology; shares 43% sequence identity with mammalian beta-coat protein (beta-COP) -S000035532 CDS YDR238C 4 940816 937895 C 2011-02-03 1996-07-31 -S000002647 ORF Verified YDR239C chromosome 4 4 943420 941057 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments -S000035595 CDS YDR239C 4 943420 941057 C 2011-02-03 1996-07-31 -S000002649 ORF Dubious YDR241W BUD26 chromosome 4 4 945151 945438 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 1% of ORF overlaps the verified gene SNU56; diploid mutant displays a weak budding pattern phenotype in a systematic assay -S000036282 CDS YDR241W 4 945151 945438 W 2011-02-03 1996-07-31 -S000002648 ORF Verified YDR240C SNU56 MUD10 chromosome 4 L000004362 4 945152 943674 C 2011-02-03 1996-07-31 Component of U1 snRNP required for mRNA splicing via spliceosome; yeast specific, no metazoan counterpart; interacts with mRNA in commitment complex -S000036072 CDS YDR240C 4 945152 943674 C 2011-02-03 1996-07-31 -S000006866 long_terminal_repeat YDRWdelta12 chromosome 4 4 945351 945673 W 2011-02-03 2000-05-19 Ty1 LTR -S000006857 long_terminal_repeat YDRCsigma3 chromosome 4 4 946295 945955 C 2011-02-03 2000-05-19 Ty3 LTR -S000006778 tRNA_gene tY(GUA)D SUP2 chromosome 4 L000003770 4 946312 946400 W 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000034661 intron tY(GUA)D 4 946351 946364 W 2011-02-03 2000-05-19 -S000034659 noncoding_exon tY(GUA)D 4 946312 946350 W 2011-02-03 2000-05-19 -S000034660 noncoding_exon tY(GUA)D 4 946365 946400 W 2011-02-03 2000-05-19 -S000002650 ORF Verified YDR242W AMD2 putative amidase chromosome 4 L000000083 4 946807 948456 W 2011-02-03 1996-07-31 Putative amidase -S000036363 CDS YDR242W 4 946807 948456 W 2011-02-03 1996-07-31 -S000002651 ORF Verified YDR243C PRP28 mRNA splicing protein PRP28 chromosome 4 L000001509 4 950284 948518 C 144.27 2011-02-03 1996-07-31 RNA binding protein; involved in RNA isomerization at the 5' splice site and for exchange of U6 for U1 snRNA at the 5' splice site; similar to the RNA helicases of the DEAD-box family -S000036406 CDS YDR243C 4 950284 948518 C 2011-02-03 1996-07-31 -S000002652 ORF Verified YDR244W PEX5 PAS10 chromosome 4 L000001342 4 950563 952401 W 2011-02-03 1996-07-31 Peroxisomal membrane signal receptor for peroxisomal matrix proteins; receptor for the C-terminal tripeptide signal sequence (PTS1) of peroxisomal matrix proteins; required for peroxisomal matrix protein import; also proposed to have PTS1-receptor independent functions -S000030212 CDS YDR244W 4 950563 952401 W 2011-02-03 1996-07-31 -S000002653 ORF Verified YDR245W MNN10 alpha-1,6-mannosyltransferase|REC41|SLC2|BED1 chromosome 4 L000002793|L000002853 4 952800 953981 W 2011-02-03 1996-07-31 Subunit of a Golgi mannosyltransferase complex; complex mediates elongation of the polysaccharide mannan backbone; membrane protein of the mannosyltransferase family; other members of the complex are Anp1p, Mnn9p, Mnn11p, and Hoc1p -S000030334 CDS YDR245W 4 952800 953981 W 2011-02-03 1996-07-31 -S000002654 ORF Verified YDR246W TRS23 TRAPP subunit TRS23 chromosome 4 S000007432 4 954288 954947 W 2011-02-03 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); human homolog is TRAPPC4 -S000030489 CDS YDR246W 4 954288 954947 W 2011-02-03 1996-07-31 -S000028542 ORF Uncharacterized YDR246W-A chromosome 4 4 955133 955333 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031192 CDS YDR246W-A 4 955133 955333 W 2011-02-03 2003-07-29 -S000002655 ORF Verified YDR247W VHS1 putative serine/threonine protein kinase VHS1 chromosome 4 4 956013 957398 W 2011-02-03 1996-07-31 Cytoplasmic serine/threonine protein kinase; identified as a high-copy suppressor of the synthetic lethality of a sis2 sit4 double mutant, suggesting a role in G1/S phase progression; VHS1 has a paralog, SKS1, that arose from the whole genome duplication -S000031345 CDS YDR247W 4 956013 957398 W 2011-02-03 1996-07-31 -S000002656 ORF Uncharacterized YDR248C gluconokinase chromosome 4 4 958339 957758 C 2011-02-03 1996-07-31 Putative gluconokinase; sequence similarity to bacterial and human gluconokinase; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; upregulated by deletion of the RNAP-II associated factor, PAF1 -S000031382 CDS YDR248C 4 958339 957758 C 2011-02-03 1996-07-31 -S000002657 ORF Uncharacterized YDR249C chromosome 4 4 959802 958681 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000031491 CDS YDR249C 4 959802 958681 C 2011-02-03 1996-07-31 -S000002658 ORF Dubious YDR250C chromosome 4 4 960361 960086 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031286 CDS YDR250C 4 960361 960086 C 2011-02-03 1996-07-31 -S000002659 ORF Verified YDR251W PAM1 chromosome 4 L000001334 4 960614 963106 W 2011-02-03 1996-07-31 Essential protein of unknown function; exhibits variable expression during colony morphogenesis; overexpression permits survival without protein phosphatase 2A, inhibits growth, and induces a filamentous phenotype; PAM1 has a paralog, SVL3, that arose from the whole genome duplication -S000032340 CDS YDR251W 4 960614 963106 W 2011-02-03 1996-07-31 -S000002660 ORF Verified YDR252W BTT1 CCR4-NOT core subunit BTT1 chromosome 4 L000000195 4 963412 963861 W 2011-02-03 1996-07-31 Heterotrimeric nascent polypeptide-associated complex beta3 subunit; complex binds ribosomes via its beta-subunits in close proximity to nascent polypeptides; interacts with Caf130p of the CCR4-NOT complex; similar to human BTF3; BTT1 has a paralog, EGD1, that arose from the whole genome duplication -S000032433 CDS YDR252W 4 963412 963861 W 2011-02-03 1996-07-31 -S000002661 ORF Verified YDR253C MET32 chromosome 4 L000003470 4 964565 963990 C 2011-02-03 1996-07-31 Zinc-finger DNA-binding transcription factor; involved in transcriptional regulation of the methionine biosynthetic genes; targets strong transcriptional activator Met4p to promoters of sulfur metabolic genes; feedforward loop exists in the regulation of genes controlled by Met4p and Met32p; lack of such a loop for MET31 may account for the differential actions of Met32p and Met31p; MET32 has a paralog, MET31, that arose from the whole genome duplication -S000032479 CDS YDR253C 4 964565 963990 C 2011-02-03 1996-07-31 -S000002662 ORF Verified YDR254W CHL4 MCM17|CTF17 chromosome 4 L000000321 4 965113 966489 W 2011-02-03 1996-07-31 Outer kinetochore protein required for chromosome stability; involved in new kinetochore assembly and sister chromatid cohesion; forms a stable complex with Iml3p; peripheral component of the Ctf19 kinetochore complex that interacts with Ctf19p, Ctf3p, and Mif2p; required for the spindle assembly checkpoint; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-N and fission yeast mis15 -S000034580 CDS YDR254W 4 965113 966489 W 2011-02-03 1996-07-31 -S000002663 ORF Verified YDR255C RMD5 ubiquitin-protein ligase RMD5|GID2 chromosome 4 4 967822 966557 C 2011-02-03 1996-07-31 Component of GID Complex that confers ubiquitin ligase (U3) activity; necessary for polyubiquitination and degradation of the gluconeogenic enzyme fructose-1,6-bisphosphatase; forms dimer with Fyv10p that is then recruited to GID Complex by Gid8p; also required for sporulation; conserved protein that has a degenerate RING finger domain -S000034601 CDS YDR255C 4 967822 966557 C 2011-02-03 1996-07-31 -S000002664 ORF Verified YDR256C CTA1 catalase A chromosome 4 L000000428 4 969680 968133 C 2011-02-03 1996-07-31 Catalase A; breaks down hydrogen peroxide in the peroxisomal matrix formed by acyl-CoA oxidase (Pox1p) during fatty acid beta-oxidation -S000034671 CDS YDR256C 4 969680 968133 C 2011-02-03 1996-07-31 -S000002665 ORF Verified YDR257C RKM4 ribosomal lysine N-methyltransferase|SET7|RMS1 chromosome 4 L000003277 4 971474 969990 C 2011-02-03 1996-07-31 Ribosomal lysine methyltransferase; specific for monomethylation of Rpl42ap and Rpl42bp (lysine 55); nuclear SET-domain containing protein -S000034751 CDS YDR257C 4 971474 969990 C 2011-02-03 1996-07-31 -S000002666 ORF Verified YDR258C HSP78 chaperone ATPase HSP78 chromosome 4 L000000821 4 974243 971808 C 2011-02-03 1996-07-31 Oligomeric mitochondrial matrix chaperone; cooperates with Ssc1p in mitochondrial thermotolerance after heat shock; able to prevent the aggregation of misfolded proteins as well as resolubilize protein aggregates -S000035676 CDS YDR258C 4 974243 971808 C 2011-02-03 1996-07-31 -S000002667 ORF Verified YDR259C YAP6 HAL7 chromosome 4 L000004344 4 975782 974631 C 2011-02-03 1996-07-31 Basic leucine zipper (bZIP) transcription factor; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; overexpression increases sodium and lithium tolerance; computational analysis suggests a role in regulation of expression of genes involved in carbohydrate metabolism; YAP6 has a paralog, CIN5, that arose from the whole genome duplication -S000035746 CDS YDR259C 4 975782 974631 C 2011-02-03 1996-07-31 -S000002668 ORF Verified YDR260C SWM1 APC13 chromosome 4 L000004027 4 977229 976717 C 2011-02-03 1996-07-31 Subunit of the anaphase-promoting complex (APC); APC is an E3 ubiquitin ligase that regulates the metaphase-anaphase transition and exit from mitosis; required for activation of the daughter-specific gene expression and spore wall maturation -S000035460 CDS YDR260C 4 977229 976717 C 2011-02-03 1996-07-31 -S000002669 ORF Verified YDR261C EXG2 glucan exo-1,3-beta-glucosidase chromosome 4 L000000593 4 979209 977521 C 162 2011-02-03 1996-07-31 Exo-1,3-beta-glucanase; involved in cell wall beta-glucan assembly; may be anchored to the plasma membrane via a glycosylphosphatidylinositol (GPI) anchor -S000035548 CDS YDR261C 4 979209 977521 C 2011-02-03 1996-07-31 -S000006722 tRNA_gene tS(AGA)D2 chromosome 4 L000003774 4 981055 980974 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000031633 noncoding_exon tS(AGA)D2 4 981055 980974 C 2011-02-03 2000-05-19 -S000006869 long_terminal_repeat YDRWdelta19 chromosome 4 4 981171 981502 W 2011-02-03 2000-05-19 Ty1 LTR -S000006885 LTR_retrotransposon YDRWTy2-3 Ty2 chromosome 4 4 981171 987125 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007396 transposable_element_gene YDR261W-A gag protein chromosome 4 4 981462 982778 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034032 CDS YDR261W-A 4 981462 982778 W 2011-02-03 1999-07-17 -S000007397 transposable_element_gene YDR261W-B gag-pol fusion protein chromosome 4 4 981462 986775 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034034 CDS YDR261W-B 4 981462 982754 W 2011-02-03 1999-07-17 -S000034035 CDS YDR261W-B 4 982756 986775 W 2011-02-03 1999-07-17 -S000034036 plus_1_translational_frameshift YDR261W-B 4 982755 982755 W 2011-02-03 1999-07-17 -S000006870 long_terminal_repeat YDRWdelta20 chromosome 4 4 986794 987125 W 2011-02-03 2000-05-19 Ty1 LTR -S000006853 long_terminal_repeat YDRCdelta21 chromosome 4 4 987483 987150 C 2011-02-03 2000-05-19 Ty1 LTR -S000007395 transposable_element_gene YDR261C-D gag-pol fusion protein chromosome 4 4 992349 987534 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; Gag processing produces capsid proteins, Pol is cleaved to produce protease, reverse transcriptase and integrase activities; in YDRCTy1-3 TYB is mutant and probably non-functional -S000032325 CDS YDR261C-D 4 991043 987534 C 2011-02-03 1999-07-17 -S000032324 CDS YDR261C-D 4 992349 991045 C 2011-02-03 1999-07-17 -S000032326 plus_1_translational_frameshift YDR261C-D 4 991044 991044 C 2011-02-03 1999-07-17 -S000007394 transposable_element_gene YDR261C-C gag protein chromosome 4 4 992349 991027 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; Gag processing produces capsid proteins; in YDRCTy1-3 TYB is mutant and probably non-functional -S000031433 CDS YDR261C-C 4 992349 991027 C 2011-02-03 1999-07-17 -S000006861 LTR_retrotransposon YDRCTy1-3 Ty1 chromosome 4 4 992642 987150 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C -S000006854 long_terminal_repeat YDRCdelta22 chromosome 4 4 992642 992309 C 2011-02-03 2000-05-19 Ty1 LTR -S000006880 long_terminal_repeat YDRCsigma4 YDRWsigma4 chromosome 4 4 992815 992740 C 2011-02-03 2000-05-19|2007-04-02 Ty3 LTR -S000006577 tRNA_gene tG(GCC)D2 chromosome 4 L000003771 4 992832 992902 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000031716 noncoding_exon tG(GCC)D2 4 992832 992902 W 2011-02-03 2000-05-19 -S000002670 ORF Uncharacterized YDR262W chromosome 4 4 993134 993952 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole and is induced in response to the DNA-damaging agent MMS; gene expression increases in response to Zymoliase treatment -S000036503 CDS YDR262W 4 993134 993952 W 2011-02-03 1996-07-31 -S000002671 ORF Verified YDR263C DIN7 exodeoxyribonuclease DIN7|DIN3 chromosome 4 L000003086 4 995534 994242 C 2011-02-03 1996-07-31 Mitochondrial nuclease functioning in DNA repair and replication; modulates the stability of the mitochondrial genome, induced by exposure to mutagens, also induced during meiosis at a time nearly coincident with commitment to recombination; DIN7 has a paralog, EXO1, that arose from the whole genome duplication -S000036563 CDS YDR263C 4 995534 994242 C 2011-02-03 1996-07-31 -S000002672 ORF Verified YDR264C AKR1 palmitoyltransferase AKR1 chromosome 4 L000000072 4 998323 996029 C 2011-02-03 1996-07-31 Palmitoyl transferase involved in protein palmitoylation; acts as a negative regulator of pheromone response pathway; required for endocytosis of pheromone receptors; involved in cell shape control; contains ankyrin repeats; AKR1 has a paralog, AKR2, that arose from the whole genome duplication; any of several human homologs encoding DHHC-type zinc fingers (ZDHHC) can complement temperature sensitivity of yeast akr1 null mutant -S000036629 CDS YDR264C 4 998323 996029 C 2011-02-03 1996-07-31 -S000002673 ORF Verified YDR265W PEX10 ubiquitin-protein ligase peroxin 10|PAS4 chromosome 4 L000003961 4 998864 999877 W 2011-02-03 1996-07-31 Peroxisomal membrane E3 ubiquitin ligase; required for for Ubc4p-dependent Pex5p ubiquitination and peroxisomal matrix protein import; contains zinc-binding RING domain; mutations in human homolog cause various peroxisomal disorders -S000036772 CDS YDR265W 4 998864 999877 W 2011-02-03 1996-07-31 -S000002674 ORF Verified YDR266C HEL2 E3 ubiquitin-protein ligase HEL2 chromosome 4 4 1002023 1000104 C 2011-02-03 1996-07-31 RING finger ubiquitin ligase (E3); involved in ubiquitination and degradation of excess histones; interacts with Ubc4p and Rad53p; null mutant sensitive to hydroxyurea (HU); green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; computational analysis suggests a role as a transcription factor -S000030572 CDS YDR266C 4 1002023 1000104 C 2011-02-03 1996-07-31 -S000002675 ORF Verified YDR267C CIA1 iron-sulfur cluster assembly protein CIA1 chromosome 4 4 1003502 1002510 C 2011-02-03 1996-07-31 Component of cytosolic iron-sulfur protein assembly (CIA) machinery; acts at late step of Fe-S cluster assembly; forms CIA targeting complex with Cia2p and Met18p that directs Fe-S cluster incorporation into subset of proteins involved in methionine biosynthesis, DNA replication and repair, transcription, telomere maintenance; contains WD40 repeats; human homolog CIAO1 can complement yeast cia1 null mutant -S000030699 CDS YDR267C 4 1003502 1002510 C 2011-02-03 1996-07-31 -S000002676 ORF Verified YDR268W MSW1 tryptophan--tRNA ligase MSW1 chromosome 4 L000001209 4 1004004 1005143 W 2011-02-03 1996-07-31 Mitochondrial tryptophanyl-tRNA synthetase -S000030885 CDS YDR268W 4 1004004 1005143 W 2011-02-03 1996-07-31 -S000002678 ORF Verified YDR270W CCC2 Cu(2+)-transporting P-type ATPase CCC2 chromosome 4 L000000235 4 1005675 1008689 W 2011-02-03 1996-07-31 Cu(+2)-transporting P-type ATPase; required for export of copper from the cytosol into an extracytosolic compartment; similar to human proteins involved in Menkes and Wilsons diseases; protein abundance increases in response to DNA replication stress; affects TBSV model (+)RNA virus replication by regulating copper metabolism; human homologs ATP7A and ATP7B both complement yeast null mutant -S000031624 CDS YDR270W 4 1005675 1008689 W 2011-02-03 1996-07-31 -S000002677 ORF Dubious YDR269C chromosome 4 4 1005988 1005665 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031741 CDS YDR269C 4 1005988 1005665 C 2011-02-03 1996-07-31 -S000002679 ORF Dubious YDR271C chromosome 4 4 1008766 1008395 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CCC2/YDR270W -S000031691 CDS YDR271C 4 1008766 1008395 C 2011-02-03 1996-07-31 -S000002680 ORF Verified YDR272W GLO2 hydroxyacylglutathione hydrolase GLO2 chromosome 4 L000003488 4 1009010 1009834 W 2011-02-03 1996-07-31 Cytoplasmic glyoxalase II; catalyzes the hydrolysis of S-D-lactoylglutathione into glutathione and D-lactate; GLO2 has a paralog, GLO4, that arose from the whole genome duplication -S000032699 CDS YDR272W 4 1009010 1009834 W 2011-02-03 1996-07-31 -S000002681 ORF Verified YDR273W DON1 chromosome 4 4 1010176 1011273 W 2011-02-03 1996-07-31 Meiosis-specific component of the spindle pole body; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane (PSM) during meiosis II; required for PSM growth and closure; DON1 has a paralog, CUE5, that arose from the whole genome -S000032778 CDS YDR273W 4 1010176 1011273 W 2011-02-03 1996-07-31 -S000002682 ORF Uncharacterized YDR274C chromosome 4 4 1011960 1011589 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR274C is not an essential gene -S000032843 CDS YDR274C 4 1011960 1011589 C 2011-02-03 1996-07-31 -S000002683 ORF Verified YDR275W BSC2 chromosome 4 4 1012252 1012959 W 2011-02-03 1996-07-31 Protein of unknown function; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; null mutant displays increased translation rate and increased readthrough of premature stop codons; BSC2 has a paralog, IRC23, that arose from the whole genome duplication -S000034861 CDS YDR275W 4 1012252 1012959 W 2011-02-03 1996-07-31 -S000002684 ORF Verified YDR276C PMP3 SNA1 chromosome 4 4 1013643 1013476 C 2011-02-03 1996-07-31 Small plasma membrane protein; confers resistance to amphotericin B and is a potential target of this common antifungal drug; related to a family of plant polypeptides that are overexpressed under high salt concentration or low temperature; not essential for viability; deletion causes hyperpolarization of the plasma membrane potential -S000034908 CDS YDR276C 4 1013643 1013476 C 2011-02-03 1996-07-31 -S000002685 ORF Verified YDR277C MTH1 HTR1|DGT1|BPC1 chromosome 4 L000001213|L000000831 4 1015702 1014401 C 2011-02-03 1996-07-31 Negative regulator of the glucose-sensing signal transduction pathway; required for repression of transcription by Rgt1p; interacts with Rgt1p and the Snf3p and Rgt2p glucose sensors; phosphorylated by Yck1p, triggering Mth1p degradation; MTH1 has a paralog, STD1, that arose from the whole genome duplication -S000035061 CDS YDR277C 4 1015702 1014401 C 2011-02-03 1996-07-31 -S000118442 ARS ARS430 ARSIV-1017 chromosome 4 4 1016670 1016911 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178077 ARS_consensus_sequence ARS430 4 1016846 1016830 C 2014-11-18 2014-11-18 -S000006546 tRNA_gene tE(CUC)D chromosome 4 L000003781 4 1017278 1017207 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis -S000031893 noncoding_exon tE(CUC)D 4 1017278 1017207 C 2011-02-03 2000-05-19 -S000002686 ORF Uncharacterized YDR278C chromosome 4 4 1017318 1017001 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR278C is not an essential gene -S000035163 CDS YDR278C 4 1017318 1017001 C 2011-02-03 1996-07-31 -S000002687 ORF Verified YDR279W RNH202 Rnh2B chromosome 4 4 1019368 1020420 W 2011-02-03 1996-07-31 Ribonuclease H2 subunit; required for RNase H2 activity; role in ribonucleotide excision repair; related to human AGS2 that causes Aicardi-Goutieres syndrome -S000036060 CDS YDR279W 4 1019368 1020420 W 2011-02-03 1996-07-31 -S000002688 ORF Verified YDR280W RRP45 exosome non-catalytic core subunit RRP45 chromosome 4 L000004578 4 1020747 1021664 W 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp45p (PM/SCL-75, EXOSC9); protein abundance increases in response to DNA replication stress -S000035087 CDS YDR280W 4 1020747 1021664 W 2011-02-03 1996-07-31 -S000002689 ORF Verified YDR281C PHM6 chromosome 4 S000007515 4 1022321 1022007 C 2011-02-03 1996-07-31 Protein of unknown function; expression is regulated by phosphate levels -S000035153 CDS YDR281C 4 1022321 1022007 C 2011-02-03 1996-07-31 -S000006881 long_terminal_repeat YDRWsigma5 chromosome 4 4 1023137 1023477 W 2011-02-03 2000-05-19 Ty3 LTR -S000002690 ORF Verified YDR282C MRX10 chromosome 4 4 1024755 1023511 C 2011-02-03 1996-07-31 Mitochondrial inner membrane protein of unknown function; associates with mitochondrial ribosome; localizes to the inner membrane with the C terminus facing the intermembrane space; ortholog of human RMND1, mutation in which is implicated in infantile encephaloneuromyopathy and defective mitochondrial translation -S000035316 CDS YDR282C 4 1024755 1023511 C 2011-02-03 1996-07-31 -S000002691 ORF Verified YDR283C GCN2 serine/threonine-protein kinase GCN2|AAS102|NDR2|AAS1 chromosome 4 L000000681 4 1030049 1025070 C 173 2011-02-03 1996-07-31 Protein kinase; phosphorylates the alpha-subunit of translation initiation factor eIF2 (Sui2p) in response to starvation; activated by uncharged tRNAs and the Gcn1p-Gcn20p complex; contributes to DNA damage checkpoint control -S000036262 CDS YDR283C 4 1030049 1025070 C 2011-02-03 1996-07-31 -S000002692 ORF Verified YDR284C DPP1 bifunctional diacylglycerol diphosphate phosphatase/phosphatidate phosphatase|ZRG1 chromosome 4 L000003582 4 1031419 1030550 C 2011-02-03 1996-07-31 Diacylglycerol pyrophosphate (DGPP) phosphatase; zinc-regulated vacuolar membrane-associated lipid phosphatase, dephosphorylates DGPP to phosphatidate (PA) and Pi, then PA to diacylglycerol; involved in lipid signaling and cell metabolism -S000036340 CDS YDR284C 4 1031419 1030550 C 2011-02-03 1996-07-31 -S000002693 ORF Verified YDR285W ZIP1 chromosome 4 L000002568 4 1032436 1035063 W 2011-02-03 1996-07-31 Transverse filament protein of the synaptonemal complex; required for normal levels of meiotic recombination and pairing between homologous chromosome during meiosis; required for meiotic recombination between non-allelc sites; potential Cdc28p substrate -S000036473 CDS YDR285W 4 1032436 1035063 W 2011-02-03 1996-07-31 -S000002694 ORF Uncharacterized YDR286C chromosome 4 4 1035575 1035231 C 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to have thiol-disulfide oxidoreductase active site -S000037085 CDS YDR286C 4 1035575 1035231 C 2011-02-03 1996-07-31 -S000002695 ORF Verified YDR287W INM2 inositol monophosphate 1-phosphatase INM2 chromosome 4 4 1035995 1036873 W 2011-02-03 1996-07-31 Inositol monophosphatase; involved in biosynthesis of inositol; enzymatic activity requires magnesium ions and is inhibited by lithium and sodium ions; inm1 inm2 double mutant lacks inositol auxotrophy -S000037232 CDS YDR287W 4 1035995 1036873 W 2011-02-03 1996-07-31 -S000002696 ORF Verified YDR288W NSE3 Smc5-Smc6 complex subunit NSE3 chromosome 4 4 1037195 1038106 W 2011-02-03 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; protein abundance increases in response to DNA replication stress -S000037315 CDS YDR288W 4 1037195 1038106 W 2011-02-03 1996-07-31 -S000002698 ORF Dubious YDR290W SWS1 chromosome 4 4 1039370 1039699 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RTT103 -S000031324 CDS YDR290W 4 1039370 1039699 W 2011-02-03 1996-07-31 -S000002697 ORF Verified YDR289C RTT103 chromosome 4 4 1039509 1038280 C 2011-02-03 1996-07-31 Protein involved in transcription termination by RNA polymerase II; interacts with exonuclease Rat1p and Rai1p; has an RPR domain (carboxy-terminal domain interacting domain); also involved in regulation of Ty1 transposition -S000037346 CDS YDR289C 4 1039509 1038280 C 2011-02-03 1996-07-31 -S000002699 ORF Verified YDR291W HRQ1 ATP-dependent 3'-5' DNA helicase chromosome 4 4 1039728 1042961 W 2011-02-03 1996-07-31 3'-5' DNA helicase that has DNA strand annealing activity; helicase activity is stimulated by fork structure and 3'-tail length of substrates; acts with Rad4p in nucleotide-excision repair; belongs to the widely conserved RecQ family of proteins which are involved in maintaining genomic integrity; similar to the human RecQ4p implicated in Rothmund-Thomson syndrome (RTS) -S000032334 CDS YDR291W 4 1039728 1042961 W 2011-02-03 1996-07-31 -S000002700 ORF Verified YDR292C SRP101 Signal recognition particle receptor subunit alpha chromosome 4 L000002067 4 1045011 1043146 C 2011-02-03 1996-07-31 Signal recognition particle (SRP) receptor alpha subunit; contain GTPase domains; involved in SRP-dependent protein targeting; interacts with the beta subunit, Srp102p -S000032412 CDS YDR292C 4 1045011 1043146 C 2011-02-03 1996-07-31 -S000002701 ORF Verified YDR293C SSD1 mRNA-binding translational repressor SSD1|SRK1|RLT1|MCS1|CLA1 chromosome 4 L000002077 4 1049392 1045640 C 176 2011-02-03 1996-07-31 Translational repressor with a role in polar growth and wall integrity; regulated by Cbk1p phosphorylation to effect bud-specific translational control and localization of specific mRNAs; interacts with TOR pathway components; contains a functional N-terminal nuclear localization sequence and nucleocytoplasmic shuttling appears to be critical to Ssd1p function -S000032503 CDS YDR293C 4 1049392 1045640 C 2011-02-03 1996-07-31 -S000002702 ORF Verified YDR294C DPL1 sphinganine-1-phosphate aldolase DPL1|BST1 chromosome 4 L000004296 4 1052228 1050459 C 2011-02-03 1996-07-31 Dihydrosphingosine phosphate lyase; regulates intracellular levels of sphingolipid long-chain base phosphates (LCBPs), degrades phosphorylated long chain bases, prefers C16 dihydrosphingosine-l-phosphate as a substrate -S000032617 CDS YDR294C 4 1052228 1050459 C 2011-02-03 1996-07-31 -S000002703 ORF Verified YDR295C HDA2 PLO2 chromosome 4 4 1054647 1052623 C 2011-02-03 1996-07-31 Subunit of the HDA1 histone deacetylase complex; possibly tetrameric trichostatin A-sensitive class II histone deacetylase complex contains Hda1p homodimer and an Hda2p-Hda3p heterodimer; involved in telomere maintenance; relocalizes to the cytosol in response to hypoxia -S000033335 CDS YDR295C 4 1054647 1052623 C 2011-02-03 1996-07-31 -S000002704 ORF Verified YDR296W MHR1 XTC1 chromosome 4 L000004333 4 1055212 1055892 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; also involved in homologous recombination in mitochondria; required for recombination-dependent mtDNA partitioning; involved in stimulation of mitochondrial DNA replication in response to oxidative stress -S000033421 CDS YDR296W 4 1055212 1055892 W 2011-02-03 1996-07-31 -S000002705 ORF Verified YDR297W SUR2 sphingosine hydroxylase|SYR2 chromosome 4 L000002244|L000002259 4 1056551 1057600 W 2011-02-03 1996-07-31 Sphinganine C4-hydroxylase; catalyses the conversion of sphinganine to phytosphingosine in sphingolipid biosyntheis -S000033508 CDS YDR297W 4 1056551 1057600 W 2011-02-03 1996-07-31 -S000118443 ARS ARS431 ARSIV-1058 chromosome 4 4 1057841 1057951 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178078 ARS_consensus_sequence ARS431 4 1057887 1057903 W 2014-11-18 2014-11-18 -S000002706 ORF Verified YDR298C ATP5 F1F0 ATP synthase subunit 5|OSC1 chromosome 4 L000000145 4 1058814 1058176 C 2011-02-03 1996-07-31 Subunit 5 of the stator stalk of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; homologous to bovine subunit OSCP (oligomycin sensitivity-conferring protein); phosphorylated -S000033515 CDS YDR298C 4 1058814 1058176 C 2011-02-03 1996-07-31 -S000002707 ORF Verified YDR299W BFR2 rRNA-processing protein BFR2 chromosome 4 L000004432 4 1059627 1061231 W 2011-02-03 1996-07-31 Component of the SSU and 90S preribosomes; involved in pre-18S rRNA processing; binds to U3 snoRNA and Mpp10p; multicopy suppressor of sensitivity to Brefeldin A; expression is induced during lag phase and also by cold shock -S000033609 CDS YDR299W 4 1059627 1061231 W 2011-02-03 1996-07-31 -S000002708 ORF Verified YDR300C PRO1 glutamate 5-kinase chromosome 4 L000001491 4 1062791 1061505 C 187 2011-02-03 1996-07-31 Gamma-glutamyl kinase; catalyzes the first step in proline biosynthesis; required for nitrogen starvation-induced ribophagy but not for nonselective autophagy; PRO1 has a paralog, YHR033W, that arose from the whole genome duplication -S000030896 CDS YDR300C 4 1062791 1061505 C 2011-02-03 1996-07-31 -S000002709 ORF Verified YDR301W CFT1 YHH1 chromosome 4 L000003600 4 1063352 1067425 W 2011-02-03 1996-07-31 RNA-binding subunit of the mRNA cleavage and polyadenylation factor; involved in poly(A) site recognition and required for both pre-mRNA cleavage and polyadenylation, 51% sequence similarity with mammalian AAUAA-binding subunit of CPSF -S000031983 CDS YDR301W 4 1063352 1067425 W 2011-02-03 1996-07-31 -S000002710 ORF Verified YDR302W GPI11 mannose-ethanolamine phosphotransferase GPI11 chromosome 4 4 1067731 1068390 W 2011-02-03 1996-07-31 ER membrane protein involved in a late step of GPI anchor assembly; involved in the addition of phosphoethanolamine to the multiply mannosylated glycosylphosphatidylinositol (GPI) intermediate; human PIG-Fp is a functional homolog -S000032108 CDS YDR302W 4 1067731 1068390 W 2011-02-03 1996-07-31 -S000002711 ORF Verified YDR303C RSC3 chromosome 4 4 1071386 1068729 C 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; essential gene required for maintenance of proper ploidy and regulation of ribosomal protein genes and the cell wall/stress response; RSC3 has a paralog, RSC30, that arose from the whole genome duplication -S000032135 CDS YDR303C 4 1071386 1068729 C 2011-02-03 1996-07-31 -S000002712 ORF Verified YDR304C CPR5 peptidylprolyl isomerase family protein CPR5|CYP5 chromosome 4 L000000466 4 1072557 1071880 C 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin) of the ER; catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; transcriptionally induced in response to unfolded proteins in the ER; CPR5 has a paralog, CPR2, that arose from the whole genome duplication -S000034130 CDS YDR304C 4 1072557 1071880 C 2011-02-03 1996-07-31 -S000002713 ORF Verified YDR305C HNT2 bis(5'-adenosyl)-triphosphatase|APH1 chromosome 4 L000003335 4 1073488 1072746 C 2011-02-03 1996-07-31 Dinucleoside triphosphate hydrolase; has similarity to the tumor suppressor FHIT and belongs to the histidine triad (HIT) superfamily of nucleotide-binding proteins -S000034247 CDS YDR305C 4 1073312 1072746 C 2011-02-03 1996-07-31 -S000034246 CDS YDR305C 4 1073488 1073402 C 2011-02-03 1996-07-31 -S000034248 intron YDR305C 4 1073401 1073313 C 2011-02-03 1996-07-31 -S000002714 ORF Verified YDR306C chromosome 4 4 1075171 1073735 C 2011-02-03 1996-07-31 F-box protein of unknown function; interacts with Sgt1p via a Leucine-Rich Repeat (LRR) domain -S000034313 CDS YDR306C 4 1075171 1073735 C 2011-02-03 1996-07-31 -S000006767 tRNA_gene tV(CAC)D chromosome 4 L000003780 4 1075544 1075472 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000030586 noncoding_exon tV(CAC)D 4 1075544 1075472 C 2011-02-03 2000-05-19 -S000002715 ORF Uncharacterized YDR307W PMT7 putative dolichyl-phosphate-mannose--protein mannosyltransferase chromosome 4 S000029378|L000004021|L000004010 4 1075865 1077853 W 2011-02-03 1996-07-31 Putative protein mannosyltransferase similar to Pmt1p; has a potential role in protein O-glycosylation -S000035324 CDS YDR307W 4 1075865 1077853 W 2011-02-03 1996-07-31 -S000002716 ORF Verified YDR308C SRB7 SSX1|MED21 chromosome 4 L000002754|S000029514|L000002097 4 1078449 1078027 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; target of the global repressor Tup1p -S000035339 CDS YDR308C 4 1078449 1078027 C 2011-02-03 1996-07-31 -S000002717 ORF Verified YDR309C GIC2 chromosome 4 L000003314 4 1080199 1079048 C 2011-02-03 1996-07-31 Redundant rho-like GTPase Cdc42p effector; involved in initiation of budding and cellular polarization; interacts with Cdc42p via the Cdc42/Rac-interactive binding (CRIB) domain and with PI(4,5)P2 via a polybasic region; GIC2 has a paralog, GIC1, that arose from the whole genome duplication -S000035408 CDS YDR309C 4 1080199 1079048 C 2011-02-03 1996-07-31 -S000002718 ORF Verified YDR310C SUM1 chromosome 4 L000003008 4 1084316 1081128 C 2011-02-03 1996-07-31 Transcriptional repressor that regulates middle-sporulation genes; required for mitotic repression of middle sporulation-specific genes; also acts as general replication initiation factor; involved in telomere maintenance, chromatin silencing; regulated by pachytene checkpoint -S000034868 CDS YDR310C 4 1084316 1081128 C 2011-02-03 1996-07-31 -S000002719 ORF Verified YDR311W TFB1 TFIIH/NER complex subunit TFB1 chromosome 4 L000002284 4 1085065 1086993 W 2011-02-03 1996-07-31 Subunit of TFIIH and nucleotide excision repair factor 3 complexes; required for nucleotide excision repair, target for transcriptional activators; relocalizes to the cytosol in response to hypoxia -S000035123 CDS YDR311W 4 1085065 1086993 W 2011-02-03 1996-07-31 -S000002720 ORF Verified YDR312W SSF2 rRNA-binding ribosome biosynthesis protein chromosome 4 L000002081 4 1087581 1088942 W 2011-02-03 1996-07-31 Protein required for ribosomal large subunit maturation; functionally redundant with Ssf1p; member of the Brix family; SSF2 has a paralog, SSF1, that arose from the whole genome duplication -S000035275 CDS YDR312W 4 1087581 1088942 W 2011-02-03 1996-07-31 -S000002721 ORF Verified YDR313C PIB1 phosphatidylinositol-3-phosphate-binding ubiquitin-protein ligase chromosome 4 L000004635 4 1090079 1089219 C 2011-02-03 1996-07-31 RING-type ubiquitin ligase of the endosomal and vacuolar membranes; binds phosphatidylinositol(3)-phosphate; contains a FYVE finger domain -S000036080 CDS YDR313C 4 1090079 1089219 C 2011-02-03 1996-07-31 -S000002722 ORF Verified YDR314C RAD34 chromosome 4 4 1092511 1090433 C 2011-02-03 1996-07-31 Protein involved in nucleotide excision repair (NER); homologous to RAD4 -S000036213 CDS YDR314C 4 1092511 1090433 C 2011-02-03 1996-07-31 -S000002723 ORF Verified YDR315C IPK1 inositol pentakisphosphate 2-kinase|GSL1 chromosome 4 L000003564 4 1093586 1092741 C 2011-02-03 1996-07-31 Inositol 1,3,4,5,6-pentakisphosphate 2-kinase; nuclear protein required for synthesis of 1,2,3,4,5,6-hexakisphosphate (phytate), which is integral to cell function; has 2 motifs conserved in other fungi; ipk1 gle1 double mutant is inviable; human IPPK can complement ipk1 null mutant -S000036321 CDS YDR315C 4 1093586 1092741 C 2011-02-03 1996-07-31 -S000002724 ORF Verified YDR316W OMS1 putative RNA methyltransferase chromosome 4 4 1093763 1095178 W 2011-02-03 1996-07-31 Protein integral to the mitochondrial membrane; has a conserved methyltransferase motif and is predicted to be an RNA methyltransferase; multicopy suppressor of respiratory defects caused by OXA1 mutations -S000030079 CDS YDR316W 4 1093763 1095178 W 2011-02-03 1996-07-31 -S000006563 tRNA_gene tF(GAA)D chromosome 4 L000003779 4 1095461 1095370 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035376 intron tF(GAA)D 4 1095424 1095406 C 2011-02-03 2000-05-19 -S000035375 noncoding_exon tF(GAA)D 4 1095405 1095370 C 2011-02-03 2000-05-19 -S000035374 noncoding_exon tF(GAA)D 4 1095461 1095425 C 2011-02-03 2000-05-19 -S000006871 long_terminal_repeat YDRWdelta23 chromosome 4 4 1095767 1096104 W 2011-02-03 2000-05-19 Ty1 LTR -S000006882 LTR_retrotransposon YDRWTy1-4 Ty1 chromosome 4 4 1095767 1101692 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007398 transposable_element_gene YDR316W-A gag protein chromosome 4 4 1096064 1097386 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034439 CDS YDR316W-A 4 1096064 1097386 W 2011-02-03 1999-07-17 -S000007399 transposable_element_gene YDR316W-B gag-pol fusion protein chromosome 4 4 1096064 1101332 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034443 CDS YDR316W-B 4 1096064 1097368 W 2011-02-03 1999-07-17 -S000034444 CDS YDR316W-B 4 1097370 1101332 W 2011-02-03 1999-07-17 -S000034445 plus_1_translational_frameshift YDR316W-B 4 1097369 1097369 W 2011-02-03 1999-07-17 -S000006872 long_terminal_repeat YDRWdelta24 chromosome 4 4 1101355 1101692 W 2011-02-03 2000-05-19 Ty1 LTR -S000002725 ORF Verified YDR317W HIM1 chromosome 4 S000029210|L000000774 4 1102184 1103428 W 275 2011-02-03 1996-07-31 Protein of unknown function involved in DNA repair -S000030217 CDS YDR317W 4 1102184 1103428 W 2011-02-03 1996-07-31 -S000002726 ORF Verified YDR318W MCM21 CTF5 chromosome 4 L000003998 4 1103758 1104947 W 2011-02-03 2003-09-27|1996-07-31 Component of the kinetochore sub-complex COMA; COMA (Ctf19p, Okp1p, Mcm21p, Ame1p) bridges kinetochore subunits in contact with centromeric DNA with subunits bound to microtubules during kinetochore assembly; involved in minichromosome maintenance; modified by sumoylation; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-O and fission yeast mal2 -S000030336 CDS YDR318W 4 1103758 1103809 W 2011-02-03 2003-09-27|1996-07-31 -S000030337 CDS YDR318W 4 1103893 1104947 W 2011-02-03 2003-09-27 -S000030338 intron YDR318W 4 1103810 1103892 W 2011-02-03 2003-09-27 -S000002727 ORF Uncharacterized YDR319C YFT2 FIT2A chromosome 4 4 1105827 1105003 C 2011-02-03 1996-07-31 Protein required for normal ER membrane biosynthesis; member of the highly conserved FIT family of proteins involved in triglyceride droplet biosynthesis and homologous to human FIT2; interacts with Sst2p and Hsp82p in high-throughput two-hybrid screens -S000030447 CDS YDR319C 4 1105827 1105003 C 2011-02-03 1996-07-31 -S000002728 ORF Verified YDR320C SWA2 BUD24|AUX1 chromosome 4 4 1108101 1106095 C 2011-02-03 1996-07-31 Auxilin-like protein involved in vesicular transport; clathrin-binding protein required for uncoating of clathrin-coated vesicles -S000030945 CDS YDR320C 4 1108101 1106095 C 2011-02-03 1996-07-31 -S000028821 ORF Dubious YDR320W-B chromosome 4 4 1108484 1108621 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene DAD4/YDR320C-A -S000033640 CDS YDR320W-B 4 1108484 1108621 W 2011-02-03 2003-07-29 -S000007604 ORF Verified YDR320C-A DAD4 HSK2 chromosome 4 4 1108498 1108280 C 2011-02-03 2001-02-26 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis -S000037150 CDS YDR320C-A 4 1108498 1108280 C 2011-02-03 2001-02-26 -S000002729 ORF Verified YDR321W ASP1 asparaginase ASP1 chromosome 4 L000000129 4 1108702 1109847 W 190 2011-02-03 1996-07-31 Cytosolic L-asparaginase, involved in asparagine catabolism; catalyzes hydrolysis of L-asparagine to aspartic acid and ammonia; important enzyme for the treatment of acute lymphoblastic leukemia; has low glutaminase activity and dependence; synthesized constitutively -S000031109 CDS YDR321W 4 1108702 1109847 W 2011-02-03 1996-07-31 -S000119071 ARS ARS452 ARSIV-1110|ARS431.5 chromosome 4 4 1109964 1110204 2011-02-03 2006-10-05 Autonomously Replicating Sequence -S000002730 ORF Verified YDR322W MRPL35 mitochondrial 54S ribosomal protein YmL35|YmL35 chromosome 4 L000002694 4 1110589 1111692 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000031250 CDS YDR322W 4 1110589 1111692 W 2011-02-03 1996-07-31 -S000007255 ORF Verified YDR322C-A TIM11 F1F0 ATP synthase subunit e|ATP21 chromosome 4 L000004719 4 1112293 1112003 C 2011-02-03 1999-07-17 Subunit e of mitochondrial F1F0-ATPase; ATPase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; essential for the dimeric and oligomeric state of ATP synthase, which in turn determines the shape of inner membrane cristae -S000035372 CDS YDR322C-A 4 1112293 1112003 C 2011-02-03 1999-07-17 -S000002731 ORF Verified YDR323C PEP7 VPT19|VPS19|VPL21|VAC1 chromosome 4 L000001377 4 1114027 1112480 C 192 2011-02-03 1996-07-31 Adaptor protein involved in vesicle-mediated vacuolar protein sorting; multivalent adaptor protein; facilitates vesicle-mediated vacuolar protein sorting by ensuring high-fidelity vesicle docking and fusion, which are essential for targeting of vesicles to the endosome; required for vacuole inheritance -S000031288 CDS YDR323C 4 1114027 1112480 C 2011-02-03 1996-07-31 -S000002732 ORF Verified YDR324C UTP4 chromosome 4 4 1116763 1114433 C 2011-02-03 1996-07-31 Subunit of U3-containing 90S preribosome and SSU processome complexes; involved in production of 18S rRNA and assembly of small ribosomal subunit; member of t-Utp subcomplex involved with transcription of 35S rRNA transcript; Small Subunit processome is also known as SSU processome -S000032287 CDS YDR324C 4 1116763 1114433 C 2011-02-03 1996-07-31 -S000002733 ORF Verified YDR325W YCG1 condensin subunit YCG1|YCS5|TIE1 chromosome 4 S000007469 4 1117126 1120233 W 2011-02-03 2002-12-17|1996-07-31 Subunit of the condensin complex; required for establishment and maintenance of chromosome condensation, chromosome segregation and chromatin binding by the complex; required for tRNA genes clustering at the nucleolus; required for replication slow zone breakage following Mec1p inactivation; transcription is cell cycle regulated, peaking in mitosis and declining in G1; protein is constitutively degraded by the proteasome; rate limiting for condensin recruitment to chromatin -S000032437 CDS YDR325W 4 1117126 1120233 W 2011-02-03 2002-12-17|1996-07-31 -S000002734 ORF Verified YDR326C YSP2 LAM2|LTC4 chromosome 4 4 1124925 1120609 C 2011-02-03 1996-07-31 Sterol-binding protein; has a probable role in retrograde transport of sterols from the plasma membrane to the ER; contains two StART-like domains that bind sterols and a GRAM domain; co-localizes to puncta in the cortical ER with Sip3p; one of six StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes -S000032495 CDS YDR326C 4 1124925 1120609 C 2011-02-03 1996-07-31 -S000002735 ORF Dubious YDR327W chromosome 4 4 1125302 1125628 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SKP1 -S000034595 CDS YDR327W 4 1125302 1125628 W 2011-02-03 1996-07-31 -S000002736 ORF Verified YDR328C SKP1 SCF ubiquitin ligase subunit SKP1|CBF3D|MGO1 chromosome 4 L000001910 4 1126018 1125434 C 2011-02-03 1996-07-31 Evolutionarily conserved kinetochore protein; part of multiple protein complexes, including the SCF ubiquitin ligase complex, the CBF3 complex that binds centromeric DNA, and the RAVE complex that regulates assembly of the V-ATPase; protein abundance increases in response to DNA replication stress -S000034604 CDS YDR328C 4 1126018 1125434 C 2011-02-03 1996-07-31 -S000002737 ORF Verified YDR329C PEX3 PAS3 chromosome 4 L000001339 4 1127595 1126270 C 2011-02-03 1996-07-31 Peroxisomal membrane protein (PMP); required for proper localization and stability of PMPs; anchors peroxisome retention factor Inp1p at the peroxisomal membrane; interacts with Pex19p -S000034672 CDS YDR329C 4 1127595 1126270 C 2011-02-03 1996-07-31 -S000002738 ORF Verified YDR330W UBX5 chromosome 4 4 1127872 1129374 W 2011-02-03 1996-07-31 UBX domain-containing protein that interacts with Cdc48p; ubiquitin regulatory X is also known as UBX -S000034262 CDS YDR330W 4 1127872 1129374 W 2011-02-03 1996-07-31 -S000002739 ORF Verified YDR331W GPI8 GPI-anchor transamidase chromosome 4 L000004086 4 1129588 1130823 W 2011-02-03 1996-07-31 ER membrane glycoprotein subunit of the GPI transamidase complex; adds glycosylphosphatidylinositol (GPI) anchors to newly synthesized proteins; human PIG-K protein is a functional homolog -S000034385 CDS YDR331W 4 1129588 1130823 W 2011-02-03 1996-07-31 -S000002740 ORF Verified YDR332W IRC3 double-stranded DNA-dependent ATPase chromosome 4 4 1131001 1133070 W 2011-02-03 1996-07-31 Double-stranded DNA-dependent helicase of the DExH/D-box family; required for maintenance of the mitochondrial (mt) genome; null mutant accumulates double-stranded breaks in mt DNA; localizes to the mt matrix -S000035410 CDS YDR332W 4 1131001 1133070 W 2011-02-03 1996-07-31 -S000002741 ORF Verified YDR333C RQC1 chromosome 4 4 1135431 1133260 C 2011-02-03 1996-07-31 Component of the ribosome quality control complex (RQC); RQC (Rqc1p-Rkr1p-Tae2p-Cdc48p-Npl4p-Ufd1p) is a ribosome-bound complex required for the degradation of polypeptides arising from stalled translation; required along with Rkr1p for recruitment of the Cdc48p-Npl4p-Ufd1p AAA ATPase complex to the RQC -S000035465 CDS YDR333C 4 1135431 1133260 C 2011-02-03 1996-07-31 -S000002742 ORF Verified YDR334W SWR1 chromatin-remodeling protein SWR1 chromosome 4 S000007447 4 1135932 1140476 W 2011-02-03 1996-07-31 Swi2/Snf2-related ATPase; structural component of the SWR1 complex, which exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; relocalizes to the cytosol in response to hypoxia; chronological aging factor that mediates lifespan extension by dietary restriction -S000035602 CDS YDR334W 4 1135932 1140476 W 2011-02-03 1996-07-31 -S000002743 ORF Verified YDR335W MSN5 karyopherin MSN5|STE21|KAP142 chromosome 4 L000002124|L000003212 4 1141168 1144842 W 196 2011-02-03 1996-07-31 Karyopherin; involved in nuclear import and export of proteins, including import of replication protein A and export of Far1p and transcription factors Swi5p, Swi6p, Msn2p, and Pho4p; required for re-export of mature tRNAs after their retrograde import from the cytoplasm; exportin-5 homolog -S000036506 CDS YDR335W 4 1141168 1144842 W 2011-02-03 1996-07-31 -S000002744 ORF Uncharacterized YDR336W MRX8 chromosome 4 4 1145092 1146036 W 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; sumoylated under stress conditions in a genome wide study; YDR336W is not an essential gene -S000036602 CDS YDR336W 4 1145092 1146036 W 2011-02-03 1996-07-31 -S000002745 ORF Verified YDR337W MRPS28 mitochondrial 37S ribosomal protein MRPS28 chromosome 4 L000001176 4 1146319 1147179 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000036695 CDS YDR337W 4 1146319 1147179 W 2011-02-03 1996-07-31 -S000002746 ORF Uncharacterized YDR338C chromosome 4 4 1149466 1147379 C 2011-02-03 1996-07-31 Putative protein of unknown function; member of the multi-drug and toxin extrusion (MATE) family of the multidrug/oligosaccharidyl-lipid/polysaccharide (MOP) exporter superfamily -S000036729 CDS YDR338C 4 1149466 1147379 C 2011-02-03 1996-07-31 -S000002747 ORF Verified YDR339C FCF1 rRNA-processing protein FCF1|UTP24 chromosome 4 4 1150520 1149951 C 2011-02-03 1996-07-31 Putative PINc domain nuclease; required for early cleavages of 35S pre-rRNA and maturation of 18S rRNA; component of the SSU (small subunit) processome involved in 40S ribosomal subunit biogenesis; copurifies with Faf1p -S000030573 CDS YDR339C 4 1150520 1149951 C 2011-02-03 1996-07-31 -S000002748 ORF Dubious YDR340W chromosome 4 4 1150881 1151183 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000030471 CDS YDR340W 4 1150881 1151183 W 2011-02-03 1996-07-31 -S000006777 tRNA_gene tX(XXX)D chromosome 4 L000003778 4 1150941 1150842 C 2011-02-03 2000-05-19 tRNA of undetermined specificity, predicted by tRNAscan-SE analysis; very similar to serine tRNAs -S000032726 noncoding_exon tX(XXX)D 4 1150941 1150842 C 2011-02-03 2000-05-19 -S000006873 long_terminal_repeat YDRWdelta25 chromosome 4 4 1151039 1151368 W 2011-02-03 2000-05-19 Ty1 LTR -S000002749 ORF Verified YDR341C arginine--tRNA ligase|ArgRS|RRS1 chromosome 4 4 1153626 1151803 C 2011-02-03 1996-07-31 Arginyl-tRNA synthetase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YDR341C has a paralog, MSR1, that arose from the whole genome duplication -S000030508 CDS YDR341C 4 1153626 1151803 C 2011-02-03 1996-07-31 -S000002750 ORF Verified YDR342C HXT7 hexose transporter HXT7 chromosome 4 L000000841 4 1155928 1154216 C 2011-02-03 1996-07-31 High-affinity glucose transporter; member of the major facilitator superfamily, nearly identical to Hxt6p, expressed at high basal levels relative to other HXTs, expression repressed by high glucose levels; HXT7 has a paralog, HXT4, that arose from the whole genome duplication -S000031436 CDS YDR342C 4 1155928 1154216 C 2011-02-03 1996-07-31 -S000118444 ARS ARS432 ARSIV-1159 chromosome 4 4 1159262 1159510 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119074 ARS_consensus_sequence ARS432 4 1159461 1159447 C 2011-02-03 2006-10-05 -S000002751 ORF Verified YDR343C HXT6 hexose transporter HXT6 chromosome 4 L000000840 4 1161320 1159608 C 2011-02-03 1996-07-31 High-affinity glucose transporter; member of the major facilitator superfamily, nearly identical to Hxt7p, expressed at high basal levels relative to other HXTs, repression of expression by high glucose requires SNF3; HXT6 has a paralog, HXT1, that arose from the whole genome duplication -S000031535 CDS YDR343C 4 1161320 1159608 C 2011-02-03 1996-07-31 -S000002752 ORF Dubious YDR344C chromosome 4 4 1162449 1162006 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031692 CDS YDR344C 4 1162449 1162006 C 2011-02-03 1996-07-31 -S000002753 ORF Verified YDR345C HXT3 hexose transporter HXT3 chromosome 4 L000000837 4 1164660 1162957 C 209.07 2011-02-03 1996-07-31 Low affinity glucose transporter of the major facilitator superfamily; expression is induced in low or high glucose conditions; HXT3 has a paralog, HXT5, that arose from the whole genome duplication -S000032671 CDS YDR345C 4 1164660 1162957 C 2011-02-03 1996-07-31 -S000119072 ARS ARS453 ARSIV-1166|ARS432.5 chromosome 4 4 1166067 1166212 2014-11-18 2014-11-18|2006-10-05 Autonomously Replicating Sequence -S000119073 ARS_consensus_sequence ARS453 4 1166181 1166167 C 2011-02-03 2006-10-05 -S000002754 ORF Verified YDR346C SVF1 SGI1 chromosome 4 4 1168659 1167214 C 2011-02-03 1996-07-31 Protein with a potential role in cell survival pathways; required for the diauxic growth shift; expression in mammalian cells increases survival under conditions inducing apoptosis; mutant has increased aneuploidy tolerance -S000032732 CDS YDR346C 4 1168659 1167214 C 2011-02-03 1996-07-31 -S000002755 ORF Verified YDR347W MRP1 mitochondrial 37S ribosomal protein MRP1 chromosome 4 L000001152 4 1169178 1170143 W 204.07 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; MRP1 exhibits genetic interactions with PET122, encoding a COX3-specific translational activator, and with PET123, encoding a small subunit mitochondrial ribosomal protein -S000032890 CDS YDR347W 4 1169178 1170143 W 2011-02-03 1996-07-31 -S000002756 ORF Verified YDR348C PAL1 chromosome 4 4 1171825 1170326 C 2011-02-03 1996-07-31 Protein of unknown function thought to be involved in endocytosis; physically interacts with Ede1p and is found at endocytic sites at cell periphery during early stages of endocytosis; green fluorescent protein (GFP)-fusion protein localizes to bud neck; potential Cdc28p substrate; similar to S. pombe Pal1 protein; relocalizes from bud neck to cytoplasm upon DNA replication stress; PAL1 has a paralog, YHR097C, that arose from the whole genome duplication -S000034824 CDS YDR348C 4 1171825 1170326 C 2011-02-03 1996-07-31 -S000002757 ORF Verified YDR349C YPS7 putative aspartic endopeptidase chromosome 4 L000004384 4 1174176 1172386 C 2011-02-03 1996-07-31 Putative GPI-anchored aspartic protease; member of the yapsin family of proteases involved in cell wall growth and maintenance; located in the cytoplasm and endoplasmic reticulum -S000034909 CDS YDR349C 4 1174176 1172386 C 2011-02-03 1996-07-31 -S000006874 long_terminal_repeat YDRWdelta26 chromosome 4 4 1175316 1175647 W 2011-02-03 2000-05-19 Ty1 LTR -S000006858 long_terminal_repeat YDRCsigma6 chromosome 4 4 1175812 1175134 C 2011-02-03 2000-05-19 Ty3 LTR -S000006659 tRNA_gene tM(CAU)D EMT1 chromosome 4 L000000551|L000003772 4 1175829 1175901 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis -S000034501 noncoding_exon tM(CAU)D 4 1175829 1175901 W 2011-02-03 2000-05-19 -S000002758 ORF Verified YDR350C ATP22 TCM10 chromosome 4 L000002912 4 1178174 1176120 C 2011-02-03 1996-07-31|2011-02-03 Specific translational activator for the mitochondrial ATP6 mRNA; Atp6p encodes a subunit of F1F0 ATP synthase; localized to the mitochondrial inner membrane -S000033802 CDS YDR350C 4 1178174 1176120 C 2011-02-03 1996-07-31|2011-02-03 -S000002759 ORF Verified YDR351W SBE2 chromosome 4 L000002745 4 1178666 1181260 W 2011-02-03 1996-07-31 Protein required for bud growth; involved in transport of cell wall components from the Golgi to the cell surface; SBE2 has a paralog, SBE22, that arose from the whole genome duplication -S000034051 CDS YDR351W 4 1178666 1181260 W 2011-02-03 1996-07-31 -S000002760 ORF Verified YDR352W YPQ2 chromosome 4 4 1181801 1182754 W 2011-02-03 1996-07-31 Putative vacuolar membrane transporter for cationic amino acids; likely contributes to amino acid homeostasis by exporting cationic amino acids from the vacuole; member of the PQ-loop family, with seven transmembrane domains; mutant phenotype is functionally complemented by rat PQLC2 vacuolar transporter -S000034941 CDS YDR352W 4 1181801 1182754 W 2011-02-03 1996-07-31 -S000002761 ORF Verified YDR353W TRR1 thioredoxin-disulfide reductase TRR1 chromosome 4 L000003953 4 1183299 1184258 W 2011-02-03 1996-07-31 Cytoplasmic thioredoxin reductase; key regulatory enzyme that determines the redox state of the thioredoxin system, which acts as a disulfide reductase system and protects cells against both oxidative and reductive stress; protein abundance increases in response to DNA replication stress; TRR1 has a paralog, TRR2, that arose from the whole genome duplication -S000035089 CDS YDR353W 4 1183299 1184258 W 2011-02-03 1996-07-31 -S000002762 ORF Verified YDR354W TRP4 anthranilate phosphoribosyltransferase chromosome 4 L000002355 4 1184747 1185889 W 209 2011-02-03 1996-07-31 Anthranilate phosphoribosyl transferase; transferase of the tryptophan biosynthetic pathway; catalyzes the phosphoribosylation of anthranilate; subject to the general control system of amino acid biosynthesis -S000035242 CDS YDR354W 4 1184747 1185889 W 2011-02-03 1996-07-31 -S000028613 ORF Dubious YDR354C-A chromosome 4 4 1185282 1185139 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps TRP4; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031447 CDS YDR354C-A 4 1185282 1185139 C 2011-02-03 2003-07-29 -S000002764 ORF Verified YDR356W SPC110 NUF1|XCM1 chromosome 4 L000001285 4 1186107 1188941 W 2011-02-03 1996-07-31 Inner plaque spindle pole body (SPB) component; ortholog of human kendrin; gamma-tubulin small complex (gamma-TuSC) receptor that interacts with Spc98p to recruit the complex to the nuclear side of the SPB, connecting nuclear microtubules to the SPB; promotes gamma-TuSC assembly and oligomerization to initiate microtubule nucleation; interacts with Tub4p-complex and calmodulin; phosphorylated by Mps1p in cell cycle-dependent manner -S000036297 CDS YDR356W 4 1186107 1188941 W 2011-02-03 1996-07-31 -S000002763 ORF Dubious YDR355C chromosome 4 4 1186369 1186067 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified essential ORF SPC110/YDR356W -S000035318 CDS YDR355C 4 1186369 1186067 C 2011-02-03 1996-07-31 -S000002765 ORF Verified YDR357C CNL1 BLC1 chromosome 4 4 1189567 1189199 C 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Msb3p; null mutant is sensitive to drug inducing secretion of vacuolar cargo; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000036341 CDS YDR357C 4 1189567 1189199 C 2011-02-03 1996-07-31 -S000002766 ORF Verified YDR358W GGA1 ubiquitin-binding protein chromosome 4 S000007493 4 1190059 1191732 W 2011-02-03 1996-07-31 Golgi-localized protein with homology to gamma-adaptin; interacts with and regulates Arf1p and Arf2p in a GTP-dependent manner in order to facilitate traffic through the late Golgi; GGA1 has a paralog, GGA2, that arose from the whole genome duplication -S000036474 CDS YDR358W 4 1190059 1191732 W 2011-02-03 1996-07-31 -S000002768 ORF Dubious YDR360W OPI7 chromosome 4 4 1194598 1195032 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene VID21/YDR359C -S000030092 CDS YDR360W 4 1194598 1195032 W 2011-02-03 1996-07-31|2011-02-03 -S000002767 ORF Verified YDR359C EAF1 VID21 chromosome 4 4 1194884 1191936 C 2011-02-03 2004-02-06|1996-07-31 Component of the NuA4 histone acetyltransferase complex; acts as a platform for assembly of NuA4 subunits into the native complex; required for initiation of pre-meiotic DNA replication, likely due to its requirement for expression of IME1 -S000037088 CDS YDR359C 4 1194884 1191936 C 2011-02-03 2004-02-06|1996-07-31 -S000002769 ORF Verified YDR361C BCP1 protein-transporting protein BCP1 chromosome 4 4 1196263 1195412 C 2011-02-03 1996-07-31 Essential protein involved in nuclear export of Mss4p; Mss4p is a lipid kinase that generates phosphatidylinositol 4,5-biphosphate and plays a role in actin cytoskeleton organization and vesicular transport -S000030230 CDS YDR361C 4 1196263 1195412 C 2011-02-03 1996-07-31 -S000002770 ORF Verified YDR362C TFC6 transcription factor TFIIIC subunit TFC6|tau 91 chromosome 4 L000004492 4 1198697 1196679 C 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of RNA polymerase III transcription initiation factor complex (TFIIIC); part of TFIIIC TauB domain that binds BoxB promoter sites of tRNA and other genes; cooperates with Tfc3p in DNA binding; human homolog is TFIIIC-110 -S000031159 CDS YDR362C 4 1198697 1196679 C 2011-02-03 1996-07-31 -S000077077 matrix_attachment_site ETC6 ETC6 chromosome 4 4 1198885 1198907 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; remains predominantly localized to the nuclear periphery throughout cell cycle; located between divergently transcribed genes TFC6 and ESC2 -S000002771 ORF Verified YDR363W ESC2 chromosome 4 L000004423 4 1199183 1200553 W 2011-02-03 1996-07-31 Sumo-like domain protein; prevents accumulation of toxic intermediates during replication-associated recombinational repair; roles in silencing, lifespan, chromatid cohesion and the intra-S-phase DNA damage checkpoint; RENi family member -S000031326 CDS YDR363W 4 1199183 1200553 W 2011-02-03 1996-07-31 -S000006616 tRNA_gene tK(CUU)D1 chromosome 4 L000003773 4 1201750 1201822 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000035877 noncoding_exon tK(CUU)D1 4 1201750 1201822 W 2011-02-03 2000-05-19 -S000007235 ORF Verified YDR363W-A SEM1 proteasome regulatory particle lid subunit SEM1|HOD1|DSS1 chromosome 4 L000003539|L000004647 4 1202128 1202397 W 2011-02-03 1999-07-17 19S proteasome regulatory particle lid subcomplex component; role in Ub-dependent proteolysis and proteasome stability; involved in TREX-2 mediated mRNA export, and in the prevention of transcription-associated genome instability; ubiquitinated by Nedd4-like E3-ligase, Rsp5p; human ortholog DSS1, a BRCA1 binding protein implicated in cancer, complements the yeast null; drives trinucleotide repeat expansion; protein abundance increases in response to DNA replication stress -S000037294 CDS YDR363W-A 4 1202128 1202397 W 2011-02-03 1999-07-17 -S000002772 ORF Verified YDR364C CDC40 SLU4|SLT15|PRP17 chromosome 4 L000000275|L000001921 4 1204210 1202843 C 211 2011-02-03 1996-07-31 Pre-mRNA splicing factor; important for catalytic step II of pre-mRNA splicing and plays a role in cell cycle progression, particularly at the G1/S phase transition; required for DNA synthesis during mitosis and meiosis; has WD repeats; thermosensitivity of the cdc40 null mutant is functionally complemented by a chimeric construct containing the N-terminal 156 amino acids of yeast Cdc40p fused to the C-terminal two thirds (297 amino acids) of human CDC40 -S000031393 CDS YDR364C 4 1204210 1202843 C 2011-02-03 1996-07-31 -S000002773 ORF Verified YDR365C ESF1 chromosome 4 4 1206383 1204497 C 2011-02-03 1996-07-31 Nucleolar protein involved in pre-rRNA processing; depletion causes severely decreased 18S rRNA levels -S000032429 CDS YDR365C 4 1206383 1204497 C 2011-02-03 1996-07-31 -S000006875 long_terminal_repeat YDRWdelta27 chromosome 4 4 1206704 1207037 W 2011-02-03 2000-05-19 Ty1 LTR -S000006883 LTR_retrotransposon YDRWTy1-5 Ty1 chromosome 4 4 1206704 1212621 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007400 transposable_element_gene YDR365W-A gag protein chromosome 4 4 1206997 1208319 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000032504 CDS YDR365W-A 4 1206997 1208319 W 2011-02-03 1999-07-17 -S000007401 transposable_element_gene YDR365W-B gag-pol fusion protein chromosome 4 S000029012 4 1206997 1212265 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032510 CDS YDR365W-B 4 1206997 1208301 W 2011-02-03 1999-07-17 -S000032511 CDS YDR365W-B 4 1208303 1212265 W 2011-02-03 1999-07-17 -S000032512 plus_1_translational_frameshift YDR365W-B 4 1208302 1208302 W 2011-02-03 1999-07-17 -S000006876 long_terminal_repeat YDRWdelta28 chromosome 4 4 1212288 1212621 W 2011-02-03 2000-05-19 Ty1 LTR -S000002774 ORF Uncharacterized YDR366C chromosome 4 4 1212836 1212438 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000032506 CDS YDR366C 4 1212836 1212438 C 2011-02-03 1996-07-31 -S000002775 ORF Verified YDR367W KEI1 chromosome 4 4 1212848 1213614 W 2011-02-03 1996-07-31 Component of inositol phosphorylceramide (IPC) synthase; forms a complex with Aur1p and regulates its activity; required for IPC synthase complex localization to the Golgi; post-translationally processed by Kex2p; KEI1 is an essential gene -S000032662 CDS YDR367W 4 1212848 1212877 W 2011-02-03 1996-07-31 -S000032663 CDS YDR367W 4 1212979 1213614 W 2011-02-03 1996-07-31 -S000032664 intron YDR367W 4 1212878 1212978 W 2011-02-03 1996-07-31 -S000002776 ORF Verified YDR368W YPR1 trifunctional aldehyde reductase/carbonyl reductase (NADPH)/glucose 1-dehydrogenase (NADP(+)) YPR1 chromosome 4 L000003084 4 1213904 1214842 W 2011-02-03 1996-07-31 NADPH-dependent aldo-keto reductase; reduces multiple substrates including 2-methylbutyraldehyde and D,L-glyceraldehyde, expression is induced by osmotic and oxidative stress; functionally redundant with other aldo-keto reductases; protein abundance increases in response to DNA replication stress; YPR1 has a paralog, GCY1, that arose from the whole genome duplication; human homolog AKR1B1 can complement yeast null mutant -S000033354 CDS YDR368W 4 1213904 1214842 W 2011-02-03 1996-07-31 -S000002777 ORF Verified YDR369C XRS2 chromosome 4 L000002489 4 1217580 1215016 C 211 2011-02-03 1996-07-31 Protein required for DNA repair; component of the Mre11 complex, which is involved in double strand breaks, meiotic recombination, telomere maintenance, and checkpoint signaling -S000033386 CDS YDR369C 4 1217580 1215016 C 2011-02-03 1996-07-31 -S000002778 ORF Verified YDR370C DXO1 chromosome 4 4 1219110 1217782 C 2011-02-03 1996-07-31 mRNA 5'-end-capping quality-control protein; has distributive, 5'-3' exoRNase activity; similar to Rai1p; -S000034314 CDS YDR370C 4 1219110 1217782 C 2011-02-03 1996-07-31 -S000002779 ORF Uncharacterized YDR371W CTS2 putative chitinase chromosome 4 4 1219413 1220948 W 2011-02-03 1996-07-31 Putative chitinase; functionally complements A. gossypii cts2 mutant sporulation defect -S000034441 CDS YDR371W 4 1219413 1220948 W 2011-02-03 1996-07-31 -S000028822 ORF Dubious YDR371C-A chromosome 4 4 1219613 1219509 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene CTS2/YDR371W; identified by expression profiling and mass spectrometry -S000033641 CDS YDR371C-A 4 1219613 1219509 C 2011-02-03 2003-07-29 -S000002780 ORF Verified YDR372C VPS74 MNN3|API1 chromosome 4 4 1222149 1221112 C 2011-02-03 1996-07-31 Golgi phosphatidylinositol-4-kinase effector and PtdIns4P sensor; interacts with the cytosolic domains of cis and medial glycosyltransferases, and in the PtdIns4P-bound state mediates the targeting of these enzymes to the Golgi; interacts with the catalytic domain of Sac1p, the major cellular PtdIns4P phosphatase, to direct dephosphosphorylation of the Golgi pool of PtdIns4P; tetramerization required for function; ortholog of human GOLPH3/GPP34/GMx33 -S000034509 CDS YDR372C 4 1222149 1221112 C 2011-02-03 1996-07-31 -S000002781 ORF Verified YDR373W FRQ1 frequenin chromosome 4 4 1222759 1223331 W 2011-02-03 1996-07-31 N-myristoylated calcium-binding protein; may have a role in intracellular signaling through its regulation of the phosphatidylinositol 4-kinase Pik1p; member of the recoverin/frequenin branch of the EF-hand superfamily; human NCS1 functionally complements the heat sensitivity of a frq1 ts mutant -S000035570 CDS YDR373W 4 1222759 1223331 W 2011-02-03 1996-07-31 -S000002782 ORF Verified YDR374C PHO92 mRNA-binding phosphate metabolism regulator chromosome 4 4 1224394 1223474 C 2011-02-03 1996-07-31 Posttranscriptional regulator of phosphate metabolism; facilitates PHO4 mRNA degradation by interacting with Pop2p; regulates PHO4 mRNA stability by binding to PHO4's 3'UTR in a phosphate-dependent manner; contains highly conserved YTH (YT521-B Homology) domain that exhibits RNA-binding activity; human homolog YTHDF2 can complement yeast null mutant -S000035608 CDS YDR374C 4 1224394 1223474 C 2011-02-03 1996-07-31 -S000113553 ORF Verified YDR374W-A WIP1 chromosome 4 4 1224757 1225026 W 2011-02-03 2005-11-16 Kinetochore localized protein of unknown function; interacts with Cnn1p (CENP-T); orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-W and fission yeast new1 -S000113554 CDS YDR374W-A 4 1224757 1225026 W 2011-02-03 2005-11-16 -S000002783 ORF Verified YDR375C BCS1 bifunctional AAA family ATPase chaperone/translocase BCS1 chromosome 4 L000000164 4 1226536 1225166 C 2011-02-03 1996-07-31 Protein translocase and chaperone required for Complex III assembly; member of the AAA ATPase family; forms a homo-oligomeric complex in the mitochondrial inner membrane that translocates the C-terminal domain of Rip1p from the matrix across the inner membrane and delivers it to an assembly intermediate of respiratory Complex III; also required for assembly of the Qcr10p subunit; mutation is functionally complemented by human homolog BCS1L, linked to neonatal diseases -S000035698 CDS YDR375C 4 1226536 1225166 C 2011-02-03 1996-07-31 -S000002784 ORF Verified YDR376W ARH1 NADPH-adrenodoxin reductase chromosome 4 L000002799 4 1226822 1228303 W 2011-02-03 1996-07-31 Oxidoreductase of the mitochondrial inner membrane; involved in cytoplasmic and mitochondrial iron homeostasis and required for activity of Fe-S cluster-containing enzymes; one of the few mitochondrial proteins essential for viability -S000036678 CDS YDR376W 4 1226822 1228303 W 2011-02-03 1996-07-31 -S000002785 ORF Verified YDR377W ATP17 F1F0 ATP synthase subunit f chromosome 4 L000003415 4 1228611 1228916 W 2011-02-03 1996-07-31 Subunit f of the F0 sector of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis -S000036737 CDS YDR377W 4 1228611 1228916 W 2011-02-03 1996-07-31 -S000002786 ORF Verified YDR378C LSM6 U4/U6-U5 snRNP complex subunit LSM6 chromosome 4 L000004685 4 1229609 1229349 C 2011-02-03 1996-07-31|2005-11-22 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA -S000036760 CDS YDR378C 4 1229609 1229349 C 2011-02-03 1996-07-31|2005-11-22 -S000002787 ORF Verified YDR379W RGA2 chromosome 4 L000004022 4 1230167 1233196 W 2011-02-03 1996-07-31 GTPase-activating protein for polarity-establishment protein Cdc42p; implicated in control of septin organization, pheromone response, and haploid invasive growth; regulated by Pho85p and Cdc28p; RGA2 has a paralog, RGA1, that arose from the whole genome duplication -S000036849 CDS YDR379W 4 1230167 1233196 W 2011-02-03 1996-07-31 -S000007605 ORF Verified YDR379C-A SDH6 chromosome 4 4 1233517 1233278 C 2011-02-03 2001-02-26 Mitochondrial protein involved in assembly of succinate dehydrogenase; has a role in maturation of the Sdh2p subunit; member of the LYR protein family; mutations in human ortholog SDHAF1 are associated with infantile leukoencephalopathy -S000037182 CDS YDR379C-A 4 1233517 1233278 C 2011-02-03 2001-02-26 -S000002788 ORF Verified YDR380W ARO10 phenylpyruvate decarboxylase ARO10 chromosome 4 4 1234218 1236125 W 2011-02-03 1996-07-31 Phenylpyruvate decarboxylase; catalyzes decarboxylation of phenylpyruvate to phenylacetaldehyde, which is the first specific step in the Ehrlich pathway; involved in protein N-terminal Met and Ala catabolism -S000037478 CDS YDR380W 4 1234218 1236125 W 2011-02-03 1996-07-31 -S000002789 ORF Verified YDR381W YRA1 RNA-binding protein YRA1|SHE11 chromosome 4 L000002959|L000002873 4 1236558 1238004 W 2011-02-03 1999-07-17|1996-07-31 Nuclear polyadenylated RNA-binding protein; required for export of poly(A)+ mRNA from the nucleus; proposed to couple mRNA export with 3' end processing via its interactions with Mex67p and Pcf11p; interacts with DBP2; inhibits the helicase activity of Dbp2; functionally redundant with Yra2p, another REF family member -S000037615 CDS YDR381W 4 1236558 1236842 W 2011-02-03 1999-07-17|1996-07-31 -S000037616 CDS YDR381W 4 1237609 1238004 W 2011-02-03 1999-07-17 -S000037617 intron YDR381W 4 1236843 1237608 W 2011-02-03 1999-07-17 -S000007650 ORF Verified YDR381C-A chromosome 4 4 1238850 1238312 C 2011-02-03 2004-01-26|2001-03-30 Protein of unknown function; localized to the mitochondrial outer membrane -S000037338 CDS YDR381C-A 4 1238630 1238312 C 2011-02-03 2004-01-26|2001-03-30 -S000037337 CDS YDR381C-A 4 1238850 1238825 C 2011-02-03 2004-01-26|2001-03-30 -S000037339 intron YDR381C-A 4 1238824 1238631 C 2011-02-03 2004-01-26|2001-03-30 -S000002790 ORF Verified YDR382W RPP2B ribosomal protein P2B|YP2beta|P2B|L45|YPA1|RPL45 chromosome 4 L000001736 4 1239492 1239824 W 2011-02-03 1996-07-31 Ribosomal protein P2 beta; a component of the ribosomal stalk, which is involved in the interaction between translational elongation factors and the ribosome; free (non-ribosomal) P2 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; regulates the accumulation of P1 (Rpp1Ap and Rpp1Bp) in the cytoplasm -S000030372 CDS YDR382W 4 1239492 1239824 W 2011-02-03 1996-07-31 -S000002791 ORF Verified YDR383C NKP1 chromosome 4 4 1240676 1239960 C 2011-02-03 2003-09-22|1996-07-31 Central kinetochore protein and subunit of the Ctf19 complex; mutants have elevated rates of chromosome loss; orthologous to fission yeast kinetochore protein fta4 -S000030450 CDS YDR383C 4 1240676 1239960 C 2011-02-03 2003-09-22|1996-07-31 -S000118445 ARS ARS433 ARSIV-1241 chromosome 4 4 1240882 1241110 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178079 ARS_consensus_sequence ARS433 4 1240919 1240935 W 2014-11-18 2014-11-18 -S000002792 ORF Verified YDR384C ATO3 putative ammonium permease ATO3 chromosome 4 4 1242031 1241204 C 2011-02-03 1996-07-31 Plasma membrane protein, putative ammonium transporter; regulation pattern suggests a possible role in export of ammonia from the cell; phosphorylated in mitochondria; member of the TC 9.B.33 YaaH family of putative transporters -S000030592 CDS YDR384C 4 1242031 1241204 C 2011-02-03 1996-07-31 -S000002793 ORF Verified YDR385W EFT2 elongation factor 2 chromosome 4 L000000544 4 1243230 1245758 W 2011-02-03 1996-07-31 Elongation factor 2 (EF-2), also encoded by EFT1; catalyzes ribosomal translocation during protein synthesis; contains diphthamide, the unique posttranslationally modified histidine residue specifically ADP-ribosylated by diphtheria toxin; EFT2 has a paralog, EFT1, that arose from the whole genome duplication -S000030719 CDS YDR385W 4 1243230 1245758 W 2011-02-03 1996-07-31 -S000002794 ORF Verified YDR386W MUS81 SLX3 chromosome 4 L000004650 4 1246084 1247982 W 2011-02-03 1996-07-31 Subunit of structure-specific Mms4p-Mus81p endonuclease; cleaves branched DNA; involved in DNA repair, replication fork stability, and joint molecule formation/resolution during meiotic recombination; promotes template switching during break-induced replication (BIR), causing non-reciprocal translocations (NRTs); helix-hairpin-helix protein; phosphorylation of non-catalytic subunit Mms4p by Cdc28p and Cdcp during mitotic cell cycle activates function of Mms4p-Mus81p -S000031582 CDS YDR386W 4 1246084 1247982 W 2011-02-03 1996-07-31 -S000002795 ORF Uncharacterized YDR387C CIN10 chromosome 4 4 1249821 1248154 C 2011-02-03 1996-07-31 Putative transporter; member of the sugar porter family; non-essential gene; overexpression results in elevated colony sectoring, an indicator of chromosomal instability -S000031627 CDS YDR387C 4 1249821 1248154 C 2011-02-03 1996-07-31 -S000002796 ORF Verified YDR388W RVS167 amphiphysin chromosome 4 L000001789 4 1250186 1251634 W 2011-02-03 1996-07-31 Calmodulin-binding actin-associated protein; roles in endocytic membrane tabulation and constriction, and exocytosis; N-BAR domain protein that interacts with Rvs161p to regulate actin cytoskeleton, endocytosis, and viability following starvation or osmotic stress; recruited to bud tips by Gyl1p and Gyp5p during polarized growth; homolog of mammalian amphiphysin -S000031800 CDS YDR388W 4 1250186 1251634 W 2011-02-03 1996-07-31 -S000002797 ORF Verified YDR389W SAC7 chromosome 4 L000001794 4 1252537 1254501 W 220 2011-02-03 1996-07-31 GTPase activating protein (GAP) for Rho1p; regulator of a Tor2p-mediated, Rho1p GTPase switch that controls organization of the actin cytoskeleton; negative regulator of the RHO1-PKC1-MAPK cell integrity (CWI) and membrane fluidity homeostasis signaling pathways; potential Cdc28p substrate; SAC7 has a paralog, BAG7, that arose from the whole genome duplication -S000031909 CDS YDR389W 4 1252537 1254501 W 2011-02-03 1996-07-31 -S000002798 ORF Verified YDR390C UBA2 E1 ubiquitin-activating protein UBA2|UAL1 chromosome 4 L000002404 4 1256847 1254937 C 2011-02-03 1996-07-31 Subunit of heterodimeric nuclear SUMO activating enzyme E1 with Aos1p; activates Smt3p (SUMO) before its conjugation to proteins (sumoylation), which may play a role in protein targeting; essential for viability -S000032721 CDS YDR390C 4 1256847 1254937 C 2011-02-03 1996-07-31 -S000006572 tRNA_gene tG(CCC)D SUF3 chromosome 4 L000002151|L000003777 4 1257079 1257008 C 232 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000032332 noncoding_exon tG(CCC)D 4 1257079 1257008 C 2011-02-03 2000-05-19 -S000002799 ORF Uncharacterized YDR391C chromosome 4 4 1258056 1257358 C 2011-02-03 1996-07-31 Putative protein of unknown function; possibly involved in zinc homeostasis; Bdf1p-dependent transcription induced by salt stress; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000032830 CDS YDR391C 4 1258056 1257358 C 2011-02-03 1996-07-31 -S000002800 ORF Verified YDR392W SPT3 transcriptional regulator SPT3 chromosome 4 L000002029 4 1258696 1259709 W 2011-02-03 1996-07-31 Subunit of the SAGA and SAGA-like transcriptional regulatory complexes; interacts with Spt15p to activate transcription of some RNA polymerase II-dependent genes, also functions to inhibit transcription at some promoters; relocalizes to the cytosol in response to hypoxia -S000033594 CDS YDR392W 4 1258696 1259709 W 2011-02-03 1996-07-31 -S000002801 ORF Verified YDR393W SHE9 MDM33 chromosome 4 L000002871 4 1259901 1261271 W 2011-02-03 1996-07-31 Protein required for normal mitochondrial morphology; mitochondrial inner membrane protein; may be involved in fission of the inner membrane; forms a homo-oligomeric complex -S000033681 CDS YDR393W 4 1259901 1261271 W 2011-02-03 1996-07-31 -S000002802 ORF Verified YDR394W RPT3 proteasome regulatory particle base subunit RPT3|YTA2|YNT1 chromosome 4 L000002556|L000002537 4 1261681 1262967 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; substrate of N-acetyltransferase B -S000033819 CDS YDR394W 4 1261681 1262967 W 2011-02-03 1996-07-31 -S000002803 ORF Verified YDR395W SXM1 KAP108 chromosome 4 L000003508 4 1263324 1266158 W 2011-02-03 1996-07-31 Nuclear transport factor (karyopherin); involved in protein transport between the cytoplasm and nucleoplasm; similar to Nmd5p, Cse1p, Lph2p, and the human cellular apoptosis susceptibility protein, CAS1 -S000034692 CDS YDR395W 4 1263324 1266158 W 2011-02-03 1996-07-31 -S000002804 ORF Dubious YDR396W chromosome 4 4 1266295 1266795 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; extensively overlaps essential NCB2 gene encoding the beta subunit of the NC2 dimeric histone-fold complex -S000034845 CDS YDR396W 4 1266295 1266795 W 2011-02-03 1996-07-31 -S000002805 ORF Verified YDR397C NCB2 negative cofactor 2 transcription regulator complex subunit NCB2|YDR1 chromosome 4 L000003241 4 1266898 1266366 C 2011-02-03 1996-07-31 Subunit of a heterodimeric NC2 transcription regulator complex; complex binds to TBP and can repress transcription by preventing preinitiation complex assembly or stimulate activated transcription; homologous to human NC2beta; complex also includes Bur6p -S000034923 CDS YDR397C 4 1266769 1266366 C 2011-02-03 1996-07-31 -S000034922 CDS YDR397C 4 1266898 1266862 C 2011-02-03 1996-07-31 -S000034924 intron YDR397C 4 1266861 1266770 C 2011-02-03 1996-07-31 -S000002806 ORF Verified YDR398W UTP5 chromosome 4 4 1267471 1269402 W 2011-02-03 1996-07-31 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit -S000035902 CDS YDR398W 4 1267471 1269402 W 2011-02-03 1996-07-31 -S000002807 ORF Verified YDR399W HPT1 hypoxanthine phosphoribosyltransferase|HGPRTase|HPRT|BRA6 chromosome 4 L000004313 4 1270068 1270733 W 2011-02-03 1996-07-31 Dimeric hypoxanthine-guanine phosphoribosyltransferase; catalyzes the transfer of the phosphoribosyl portion of 5-phosphoribosyl-alpha-1-pyrophosphate to a purine base (either guanine or hypoxanthine) to form pyrophosphate and a purine nucleotide (either guanosine monophosphate or inosine monophosphate); mutations in the human homolog HPRT1 can cause Lesch-Nyhan syndrome and Kelley-Seegmiller syndrome -S000036067 CDS YDR399W 4 1270068 1270733 W 2011-02-03 1996-07-31 -S000002808 ORF Verified YDR400W URH1 trifunctional uridine nucleosidase/nicotinamide riboside hydrolase/nicotinic acid riboside hydrolase chromosome 4 S000007492 4 1271063 1272085 W 2011-02-03 2003-09-22|1996-07-31 Uridine nucleosidase (uridine-cytidine N-ribohydrolase); cleaves N-glycosidic bonds in nucleosides; involved in the pyrimidine salvage and nicotinamide riboside salvage pathways -S000033224 CDS YDR400W 4 1271063 1272085 W 2011-02-03 2003-09-22|1996-07-31 -S000002809 ORF Dubious YDR401W chromosome 4 4 1272223 1272786 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033274 CDS YDR401W 4 1272223 1272786 W 2011-02-03 1996-07-31 -S000002810 ORF Verified YDR402C DIT2 putative cytochrome P450|CYP56 chromosome 4 L000000507 4 1273703 1272234 C 2011-02-03 1996-07-31 N-formyltyrosine oxidase; sporulation-specific microsomal enzyme involved in the production of N,N-bisformyl dityrosine required for spore wall maturation, homologous to cytochrome P-450s; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000033300 CDS YDR402C 4 1273703 1272234 C 2011-02-03 1996-07-31 -S000002811 ORF Verified YDR403W DIT1 chromosome 4 L000000506 4 1274602 1276212 W 2011-02-03 1996-07-31 Sporulation-specific enzyme required for spore wall maturation; involved in the production of a soluble LL-dityrosine-containing precursor of the spore wall; transcripts accumulate at the time of prospore enclosure -S000034267 CDS YDR403W 4 1274602 1276212 W 2011-02-03 1996-07-31 -S000118446 ARS ARS434 ARSIV-1276 chromosome 4 4 1276225 1276452 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000002812 ORF Verified YDR404C RPB7 DNA-directed RNA polymerase II subunit RPB7|B16 chromosome 4 L000001681 4 1277169 1276654 C 2011-02-03 1996-07-31 RNA polymerase II subunit B16; forms dissociable heterodimer with Rpb4p; Rpb4/7 dissociates from RNAPII as Ser2 CTD phosphorylation increases; Rpb4/7 regulates cellular lifespan via mRNA decay process; involved in recruitment of 3'-end processing factors to transcribing RNA polymerase II complex, export of mRNA to cytoplasm under stress conditions; also involved in translation initiation -S000034321 CDS YDR404C 4 1277169 1276654 C 2011-02-03 1996-07-31 -S000002813 ORF Verified YDR405W MRP20 mitochondrial 54S ribosomal protein YmL41|YmL41|MRPL41 chromosome 4 L000001158 4 1277646 1278437 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000035411 CDS YDR405W 4 1277646 1278437 W 2011-02-03 1996-07-31 -S000002814 ORF Verified YDR406W PDR15 ATP-binding cassette multidrug transporter PDR15 chromosome 4 L000002909 4 1279210 1283799 W 2011-02-03 1996-07-31 Plasma membrane ATP binding cassette (ABC) transporter; multidrug transporter and general stress response factor implicated in cellular detoxification; regulated by Pdr1p, Pdr3p and Pdr8p; promoter contains a PDR responsive element; PDR15 has a paralog, PDR5, that arose from the whole genome duplication -S000035511 CDS YDR406W 4 1279210 1283799 W 2011-02-03 1996-07-31 -S000028543 ORF Dubious YDR406W-A YDR406C-A chromosome 4 4 1283799 1284044 W 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR -S000031193 CDS YDR406W-A 4 1283799 1284044 W 2011-02-03 2003-07-29 -S000002815 ORF Verified YDR407C TRS120 chromosome 4 S000007435 4 1287938 1284069 C 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic -S000035551 CDS YDR407C 4 1287938 1284069 C 2011-02-03 1996-07-31 -S000002816 ORF Verified YDR408C ADE8 phosphoribosylglycinamide formyltransferase chromosome 4 L000000037 4 1288859 1288215 C 256 2011-02-03 1996-07-31 Phosphoribosyl-glycinamide transformylase; catalyzes a step in the 'de novo' purine nucleotide biosynthetic pathway -S000035623 CDS YDR408C 4 1288859 1288215 C 2011-02-03 1996-07-31 -S000077072 matrix_attachment_site ETC1 ETC1 chromosome 4 4 1289041 1289063 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; located between divergently transcribed genes ADE8 and SIZ1 -S000002817 ORF Verified YDR409W SIZ1 SUMO ligase SIZ1|ULL1 chromosome 4 S000007589 4 1289406 1292120 W 2011-02-03 1996-07-31 SUMO E3 ligase; promotes attachment of small ubiquitin-related modifier sumo (Smt3p) to primarily cytoplasmic proteins; regulates Rsp5p ubiquitin ligase activity and is in turn itself regulated by Rsp5p; required for sumoylation of septins and histone H3 variant Cse4p, a prerequisite for STUbL-mediated Ub-dependent degradation; localizes to the septin ring; acts as an adapter between E2, Ubc9p and substrates; tends to compensate for survival of DNA damage in absence of Nfi1p -S000036616 CDS YDR409W 4 1289406 1292120 W 2011-02-03 1996-07-31 -S000002818 ORF Verified YDR410C STE14 protein-S-isoprenylcysteine carboxyl O-methyltransferase chromosome 4 L000002121 4 1293091 1292372 C 259.47 2011-02-03 1996-07-31 Farnesyl cysteine-carboxyl methyltransferase; mediates the carboxyl methylation step during C-terminal CAAX motif processing of a-factor and RAS proteins in the endoplasmic reticulum, localizes to the ER membrane -S000037364 CDS YDR410C 4 1293091 1292372 C 2011-02-03 1996-07-31 -S000002819 ORF Verified YDR411C DFM1 chromosome 4 4 1294394 1293369 C 2011-02-03 1996-07-31 Endoplasmic reticulum (ER) localized protein; involved in ER-associated protein degradation (ERAD), ER stress, and homeostasis; interacts with components of ERAD-L and ERAD-C and Cdc48p; derlin-like family member similar to Der1p -S000037501 CDS YDR411C 4 1294394 1293369 C 2011-02-03 1996-07-31 -S000002820 ORF Verified YDR412W RRP17 chromosome 4 4 1294693 1295400 W 2011-02-03 1996-07-31 Component of the pre-60S pre-ribosomal particle; required for cell viability under standard (aerobic) conditions but not under anaerobic conditions; exonuclease required for 5' end processing of pre-60S ribosomal RNA -S000030317 CDS YDR412W 4 1294693 1295400 W 2011-02-03 1996-07-31 -S000002821 ORF Dubious YDR413C chromosome 4 4 1295411 1294836 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the essential uncharacterized ORF YDR412W that is implicated in rRNA processing -S000030389 CDS YDR413C 4 1295411 1294836 C 2011-02-03 1996-07-31 -S000002822 ORF Verified YDR414C ERD1 LDB2 chromosome 4 L000000566|L000004741 4 1296686 1295598 C 2011-02-03 1996-07-31|2011-02-03 Predicted membrane protein required for lumenal ER protein retention; mutants secrete the endogenous ER protein, BiP (Kar2p) -S000030512 CDS YDR414C 4 1296686 1295598 C 2011-02-03 1996-07-31|2011-02-03 -S000002823 ORF Uncharacterized YDR415C putative aminopeptidase chromosome 4 4 1298161 1297037 C 2011-02-03 1996-07-31 Putative aminopeptidase; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to the vacuole -S000031437 CDS YDR415C 4 1298161 1297037 C 2011-02-03 1996-07-31 -S000002824 ORF Verified YDR416W SYF1 mRNA splicing protein SYF1|NTC90 chromosome 4 L000004195 4 1298432 1301011 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); that contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; null mutant has splicing defect and arrests in G2/M; relocalizes to the cytosol in response to hypoxia; homologs in human and C. elegans -S000031649 CDS YDR416W 4 1298432 1301011 W 2011-02-03 1996-07-31 -S000002826 ORF Verified YDR418W RPL12B uL11|ribosomal 60S subunit protein L12B|L11|YL23|L15B|L12B chromosome 4 L000001711 4 1301616 1302113 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L12B; rpl12a rpl12b double mutant exhibits slow growth and slow translation; homologous to mammalian ribosomal protein L12 and bacterial L11; RPL12B has a paralog, RPL12A, that arose from the whole genome duplication -S000032701 CDS YDR418W 4 1301616 1302113 W 2011-02-03 1996-07-31 -S000002825 ORF Dubious YDR417C chromosome 4 4 1301926 1301555 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RPL12B/YDR418W -S000031695 CDS YDR417C 4 1301926 1301555 C 2011-02-03 1996-07-31 -S000118447 ARS ARS435 ARSIV-1303 chromosome 4 4 1302689 1302768 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000002827 ORF Verified YDR419W RAD30 DNA-directed DNA polymerase eta|DBH1 chromosome 4 L000003523 4 1303174 1305072 W 2011-02-03 1996-07-31 DNA polymerase eta; involved in translesion synthesis during post-replication repair; catalyzes the synthesis of DNA opposite cyclobutane pyrimidine dimers and other lesions; involved in formation of post-replicative damage-induced genome-wide cohesion; may also have a role in protection against mitochondrial mutagenesis; mutations in human pol eta are responsible for XPV -S000032806 CDS YDR419W 4 1303174 1305072 W 2011-02-03 1996-07-31 -S000006723 tRNA_gene tS(AGA)D3 chromosome 4 L000003782 4 1305630 1305712 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000031657 noncoding_exon tS(AGA)D3 4 1305630 1305712 W 2011-02-03 2000-05-19 -S000130176 ARS ARS436 chromosome 4 4 1305757 1306312 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000002828 ORF Verified YDR420W HKR1 chromosome 4 L000000788 4 1306267 1311675 W 2011-02-03 1996-07-31 Mucin family member that functions as an osmosensor in the HOG pathway; large, highly glycosylated protein that functions redundantly with Msb2p in Sho1p-mediated osmostresss induction of the HOG signaling pathway; cytoplasmic domain interacts with Ahk1p a scaffold protein that prevents cross talk with the Kss1p MAPK of the filamentous growth pathway; mutant displays defects in beta-1,3 glucan synthesis and bud site selection -S000032953 CDS YDR420W 4 1306267 1311675 W 2011-02-03 1996-07-31 -S000002829 ORF Verified YDR421W ARO80 chromosome 4 4 1312040 1314892 W 2011-02-03 1996-07-31 Zinc finger transcriptional activator of the Zn2Cys6 family; activates transcription of aromatic amino acid catabolic genes in the presence of aromatic amino acids -S000033023 CDS YDR421W 4 1312040 1314892 W 2011-02-03 1996-07-31 -S000002830 ORF Verified YDR422C SIP1 chromosome 4 L000001890 4 1317773 1315326 C 2011-02-03 1996-07-31|2006-04-12 Alternate beta-subunit of the Snf1p kinase complex; may confer substrate specificity; vacuolar protein containing KIS (Kinase-Interacting Sequence) and ASC (Association with Snf1 kinase Complex) domains involved in protein interactions -S000033079 CDS YDR422C 4 1317773 1315326 C 2011-02-03 1996-07-31|2006-04-12 -S000002831 ORF Verified YDR423C CAD1 YAP2 chromosome 4 L000000206 4 1319275 1318046 C 271 2011-02-03 1996-07-31 AP-1-like basic leucine zipper (bZIP) transcriptional activator; involved in stress responses, iron metabolism, and pleiotropic drug resistance; controls a set of genes involved in stabilizing proteins; binds consensus sequence TTACTAA; CAD1 has a paralog, YAP1, that arose from the whole genome duplication -S000033829 CDS YDR423C 4 1319275 1318046 C 2011-02-03 1996-07-31 -S000002832 ORF Verified YDR424C DYN2 dynein light chain|SLC1 chromosome 4 L000003064 4 1319841 1319387 C 2011-02-03 1996-07-31 Cytoplasmic light chain dynein, microtubule motor protein; required for intracellular transport and cell division; involved in mitotic spindle positioning; forms complex with dynein intermediate chain Pac11p that promotes Dyn1p homodimerization, potentiates motor processivity; Dyn2p-Pac11p complex important for interaction of dynein motor complex with dynactin complex; acts as molecular glue to dimerize, stabilize Nup82-Nsp1-Nup159 complex module of cytoplasmic pore filaments -S000033950 CDS YDR424C 4 1319617 1319387 C 2011-02-03 1996-07-31 -S000033949 CDS YDR424C 4 1319720 1319698 C 2011-02-03 1996-07-31 -S000033948 CDS YDR424C 4 1319841 1319817 C 2011-02-03 1996-07-31 -S000033952 intron YDR424C 4 1319697 1319618 C 2011-02-03 1996-07-31 -S000033951 intron YDR424C 4 1319816 1319721 C 2011-02-03 1996-07-31 -S000002833 ORF Verified YDR425W SNX41 chromosome 4 4 1320064 1321941 W 2011-02-03 1996-07-31 Sorting nexin; involved in the retrieval of late-Golgi SNAREs from the post-Golgi endosome to the trans-Golgi network; interacts with Snx4p -S000034950 CDS YDR425W 4 1320064 1321941 W 2011-02-03 1996-07-31 -S000002834 ORF Dubious YDR426C chromosome 4 4 1322006 1321629 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SNX41 -S000035012 CDS YDR426C 4 1322006 1321629 C 2011-02-03 1996-07-31 -S000002835 ORF Verified YDR427W RPN9 proteasome regulatory particle lid subunit RPN9|NAS7 chromosome 4 L000004309 4 1322205 1323386 W 2011-02-03 1996-07-31 Non-ATPase regulatory subunit of the 26S proteasome; similar to putative proteasomal subunits in other species; null mutant is temperature sensitive and exhibits cell cycle and proteasome assembly defects; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia -S000035280 CDS YDR427W 4 1322205 1323386 W 2011-02-03 1996-07-31 -S000002836 ORF Verified YDR428C BNA7 arylformamidase chromosome 4 4 1324239 1323454 C 2011-02-03 1996-07-31 Formylkynurenine formamidase; involved in the de novo biosynthesis of NAD from tryptophan via kynurenine -S000035320 CDS YDR428C 4 1324239 1323454 C 2011-02-03 1996-07-31 -S000002837 ORF Verified YDR429C TIF35 translation initiation factor eIF3 core subunit g chromosome 4 L000004253 4 1325301 1324477 C 2011-02-03 1996-07-31 eIF3g subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; is essential for translation; stimulates resumption of ribosomal scanning during translation reinitiation; eIF3 is also involved in programmed stop codon readthrough -S000036266 CDS YDR429C 4 1325301 1324477 C 2011-02-03 1996-07-31 -S000002839 ORF Dubious YDR431W chromosome 4 4 1328390 1328701 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029889 CDS YDR431W 4 1328390 1328701 W 2011-02-03 1996-07-31 -S000002838 ORF Verified YDR430C CYM1 MOP112 chromosome 4 4 1328470 1325501 C 2011-02-03 1996-07-31 Lysine-specific metalloprotease of the pitrilysin family; metalloprotease of the intermembrane space; degrades proteins and presequence peptides cleaved from imported proteins; required for normal mitochondrial morphology -S000037179 CDS YDR430C 4 1328470 1325501 C 2011-02-03 1996-07-31 -S000002840 ORF Verified YDR432W NPL3 mRNA-binding protein NPL3|NAB1|NOP3|MTS1|MTR13 chromosome 4 L000001270 4 1328783 1330027 W 2011-02-03 1996-07-31 RNA-binding protein; promotes elongation, regulates termination, and carries poly(A) mRNA from nucleus to cytoplasm; represses translation initiation by binding eIF4G; required for pre-mRNA splicing; interacts with E3 ubiquitin ligase Bre1p, linking histone ubiquitination to mRNA processing; may have role in telomere maintenance; dissociation from mRNAs promoted by Mtr10p; phosphorylated by Sky1p in cytoplasm; protein abundance increases in response to DNA replication stress -S000029988 CDS YDR432W 4 1328783 1330027 W 2011-02-03 1996-07-31 -S000002841 ORF Dubious YDR433W KRE22 chromosome 4 4 1329600 1330040 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030126 CDS YDR433W 4 1329600 1330040 W 2011-02-03 1996-07-31 -S000002842 ORF Verified YDR434W GPI17 GPI-anchor transamidase GPI17 chromosome 4 4 1331237 1332841 W 2011-02-03 1996-07-31 Transmembrane protein; subunit of the glycosylphosphatidylinositol transamidase complex that adds GPIs to newly synthesized proteins; human PIG-S homolog -S000031125 CDS YDR434W 4 1331237 1332841 W 2011-02-03 1996-07-31 -S000002843 ORF Verified YDR435C PPM1 leucine carboxy methyltransferase chromosome 4 4 1333969 1332983 C 2011-02-03 1996-07-31 Carboxyl methyltransferase; methylates the C terminus of the protein phosphatase 2A catalytic subunit (Pph21p or Pph22p), which is important for complex formation with regulatory subunits; required for methionine to inhibit autophagy and promote growth -S000031177 CDS YDR435C 4 1333969 1332983 C 2011-02-03 1996-07-31 -S000002844 ORF Verified YDR436W PPZ2 salt homeostasis regulator chromosome 4 L000001479 4 1334821 1336953 W 2011-02-03 1996-07-31 Serine/threonine protein phosphatase Z, isoform of Ppz1p; involved in regulation of potassium transport, which affects osmotic stability, cell cycle progression, and halotolerance -S000031349 CDS YDR436W 4 1334821 1336953 W 2011-02-03 1996-07-31 -S000002845 ORF Verified YDR437W GPI19 phosphatidylinositol N-acetylglucosaminyltransferase GPI19 chromosome 4 4 1337352 1337774 W 2011-02-03 1996-07-31 Subunit of GPI-GlcNAc transferase involved in synthesis of GlcNAc-PI; N-acetylglucosaminyl phosphatidylinositol (GlcNAc-PI) is the first intermediate in glycosylphosphatidylinositol (GPI) anchor synthesis; shares similarity with mammalian PIG-P -S000032347 CDS YDR437W 4 1337352 1337774 W 2011-02-03 1996-07-31 -S000002846 ORF Verified YDR438W THI74 chromosome 4 4 1338274 1339386 W 2011-02-03 1996-07-31 Mitochondrial transporter repressible by thiamine; THI74 has a paralog, YML018C, that arose from the whole genome duplication; shows sequence homology to human gene SLC35F3, a thiamine transporter implicated in hypertension -S000032476 CDS YDR438W 4 1338274 1339386 W 2011-02-03 1996-07-31 -S000002847 ORF Verified YDR439W LRS4 chromosome 4 L000004395 4 1339676 1340719 W 2011-02-03 1996-07-31 Nucleolar protein that forms a complex with Csm1p; and then Mam1p at kinetochores during meiosis I to mediate accurate homolog segregation; required for condensin recruitment to the replication fork barrier site and rDNA repeat segregation -S000032575 CDS YDR439W 4 1339676 1340719 W 2011-02-03 1996-07-31 -S000002848 ORF Verified YDR440W DOT1 histone methyltransferase DOT1|KMT4|PCH1 chromosome 4 L000004390|L000004273 4 1342493 1344241 W 2011-02-03 1996-07-31 Nucleosomal histone H3-Lys79 methylase; methylation is required for telomeric silencing, meiotic checkpoint control, and DNA damage response -S000033292 CDS YDR440W 4 1342493 1344241 W 2011-02-03 1996-07-31 -S000002849 ORF Verified YDR441C APT2 adenine phosphoribosyltransferase APT2 chromosome 4 L000000102 4 1345062 1344517 C 2011-02-03 1996-07-31 Potential adenine phosphoribosyltransferase; encodes a protein with similarity to adenine phosphoribosyltransferase, but artificially expressed protein exhibits no enzymatic activity; APT2 has a paralog, APT1, that arose from the whole genome duplication -S000033331 CDS YDR441C 4 1345062 1344517 C 2011-02-03 1996-07-31 -S000002850 ORF Dubious YDR442W chromosome 4 4 1345647 1346039 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034272 CDS YDR442W 4 1345647 1346039 W 2011-02-03 1996-07-31 -S000002851 ORF Verified YDR443C SSN2 SSX5|MED13|RYE3|UME2|SRB9|SCA1|NUT8 chromosome 4 L000001803|L000002088|S000029518|L000002101 4 1349938 1345676 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for stable association of Srb10p-Srb11p kinase; essential for transcriptional regulation -S000034322 CDS YDR443C 4 1349938 1345676 C 2011-02-03 1996-07-31 -S000002852 ORF Uncharacterized YDR444W putative hydrolase chromosome 4 4 1350290 1352353 W 2011-02-03 1996-07-31 Putative hydrolase acting on ester bonds -S000034446 CDS YDR444W 4 1350290 1352353 W 2011-02-03 1996-07-31 -S000006617 tRNA_gene tK(CUU)D2 chromosome 4 L000003776 4 1352538 1352466 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000035878 noncoding_exon tK(CUU)D2 4 1352538 1352466 C 2011-02-03 2000-05-19 -S000002853 ORF Dubious YDR445C chromosome 4 4 1352589 1352182 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034512 CDS YDR445C 4 1352589 1352182 C 2011-02-03 1996-07-31 -S000006877 long_terminal_repeat YDRWdelta29 chromosome 4 4 1352644 1352975 W 2011-02-03 2000-05-19 Ty1 LTR -S000006878 long_terminal_repeat YDRWdelta30 chromosome 4 4 1352976 1353226 W 2011-02-03 2000-05-19 Ty1 LTR -S000002854 ORF Verified YDR446W ECM11 chromosome 4 L000003886 4 1353725 1354633 W 2011-02-03 1996-07-31 Meiosis-specific protein; component of the Synaptonemal Complex (SC) along with Gmc2p; required for efficient crossover formation and for the efficient loading of the SC transverse filament protein, Zip1p; is SUMOlytaed in a Gmc2p manner, and SUMOylation is required for its function in meiosis; GFP fusion protein is present in discrete clusters in the nucleus throughout mitosis; may be involved in maintaining chromatin structure -S000035576 CDS YDR446W 4 1353725 1354633 W 2011-02-03 1996-07-31 -S000002855 ORF Verified YDR447C RPS17B eS17|ribosomal 40S subunit protein S17B|S17e|rp51B|S17B|RPL51B|RP51B chromosome 4 L000001670|L000001741 4 1355553 1354829 C 2011-02-03 1996-07-31 Ribosomal protein 51 (rp51) of the small (40s) subunit; homologous to mammalian ribosomal protein S17, no bacterial homolog; RPS17B has a paralog, RPS17A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000035611 CDS YDR447C 4 1355236 1354829 C 2011-02-03 1996-07-31 -S000035610 CDS YDR447C 4 1355553 1355551 C 2011-02-03 1996-07-31 -S000035612 intron YDR447C 4 1355550 1355237 C 2011-02-03 1996-07-31 -S000002856 ORF Verified YDR448W ADA2 chromatin-binding transcription regulator ADA2|SWI8 chromosome 4 L000000029 4 1356065 1357369 W 2011-02-03 1996-07-31 Transcription coactivator; component of the ADA and SAGA transcriptional adaptor/HAT (histone acetyltransferase) complexes -S000035771 CDS YDR448W 4 1356065 1357369 W 2011-02-03 1996-07-31 -S000002857 ORF Verified YDR449C UTP6 snoRNA-binding rRNA-processing protein UTP6 chromosome 4 4 1358902 1357580 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA -S000036633 CDS YDR449C 4 1358902 1357580 C 2011-02-03 1996-07-31 -S000002858 ORF Verified YDR450W RPS18A uS13|ribosomal 40S subunit protein S18A|S18A|S13 chromosome 4 L000004480 4 1359923 1360798 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S18 and bacterial S13; RPS18A has a paralog, RPS18B, that arose from the whole genome duplication; protein increases in abundance and relocalizes from cytoplasm to nuclear foci upon DNA replication stress -S000036543 CDS YDR450W 4 1359923 1359969 W 2011-02-03 1996-07-31 -S000036544 CDS YDR450W 4 1360405 1360798 W 2011-02-03 1996-07-31 -S000036545 intron YDR450W 4 1359970 1360404 W 2011-02-03 1996-07-31 -S000002859 ORF Verified YDR451C YHP1 chromosome 4 4 1362181 1361120 C 2011-02-03 1996-07-31 Homeobox transcriptional repressor; binds Mcm1p and early cell cycle box (ECB) elements of cell cycle regulated genes, thereby restricting ECB-mediated transcription to the M/G1 interval; YHP1 has a paralog, YOX1, that arose from the whole genome duplication -S000036584 CDS YDR451C 4 1362181 1361120 C 2011-02-03 1996-07-31 -S000002860 ORF Verified YDR452W PPN1 endopolyphosphatase|PHM5 chromosome 4 S000007514 4 1362878 1364902 W 2011-02-03 1996-07-31 Dual endo- and exopolyphosphatase with a role in phosphate metabolism; acts as both an endopolyphosphatase cleaving long chains of polyphosphate distributively to generate shorter polymer chains and as an exopolyphosphatase catalyzing the hydrolysis of terminal phosphate from polyphosphate; localizes to the vacuole, nucleus and cytosol; functions as a homodimer; relocalizes from vacuole to cytoplasm upon DNA replication stress -S000036745 CDS YDR452W 4 1362878 1364902 W 2011-02-03 1996-07-31 -S000002861 ORF Verified YDR453C TSA2 thioredoxin peroxidase TSA2|cTPxII chromosome 4 4 1365662 1365072 C 2011-02-03 1996-07-31 Stress inducible cytoplasmic thioredoxin peroxidase; cooperates with Tsa1p in the removal of reactive oxygen, nitrogen and sulfur species using thioredoxin as hydrogen donor; deletion enhances the mutator phenotype of tsa1 mutants; protein abundance increases in response to DNA replication stress; TSA2 has a paralog, TSA1, that arose from the whole genome duplication -S000037410 CDS YDR453C 4 1365662 1365072 C 2011-02-03 1996-07-31 -S000002862 ORF Verified YDR454C GUK1 BRA3|guanylate kinase|PUR5 chromosome 4 L000000745 4 1366827 1366264 C 2011-02-03 1996-07-31 Guanylate kinase; converts GMP to GDP; required for growth and mannose outer chain elongation of cell wall N-linked glycoproteins -S000037538 CDS YDR454C 4 1366827 1366264 C 2011-02-03 1996-07-31 -S000002864 ORF Verified YDR456W NHX1 bifunctional K:H/Na:H antiporter NHX1|VPL27|NHA2|VPS44 chromosome 4 L000004336 4 1367485 1369386 W 2011-02-03 1996-07-31 Na+/H+ and K+/H+ exchanger; required for intracellular sequestration of Na+ and K+; located in the vacuole and late endosome compartments; required for osmotolerance to acute hypertonic shock and for vacuolar fusion; ortholog of human NHE9, which is linked to autism -S000030521 CDS YDR456W 4 1367485 1369386 W 2011-02-03 1996-07-31 -S000002863 ORF Dubious YDR455C chromosome 4 4 1367681 1367373 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YDR456W -S000037654 CDS YDR455C 4 1367681 1367373 C 2011-02-03 1996-07-31 -S000002865 ORF Verified YDR457W TOM1 E3 ubiquitin-protein ligase TOM1 chromosome 4 L000002983 4 1369790 1379596 W 2011-02-03 1996-07-31 E3 ubiquitin ligase of the hect-domain class; has a role in mRNA export from the nucleus and may regulate transcriptional coactivators; involved in degradation of excess histones; interacts with Dia2p and is required for Dia2p degradation; required to target Cdc6p for ubiquitin-mediated destruction during G1 phase -S000030634 CDS YDR457W 4 1369790 1379596 W 2011-02-03 1996-07-31 -S000130177 ARS ARS439 chromosome 4 4 1379641 1380100 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000002866 ORF Verified YDR458C HEH2 chromosome 4 4 1382046 1380055 C 2011-02-03 1996-07-31 Inner nuclear membrane (INM) protein; contains helix-extension-helix (HEH) motif, nuclear localization signal sequence; targeting to the INM requires the Srp1p-Kap95p karyopherins and the Ran cycle; HEH2 has a paralog, SRC1, that arose from the whole genome duplication -S000030675 CDS YDR458C 4 1382046 1380055 C 2011-02-03 1996-07-31 -S000002867 ORF Verified YDR459C PFA5 palmitoyltransferase PFA5 chromosome 4 4 1383443 1382319 C 2011-02-03 1996-07-31 Palmitoyltransferase with autoacylation activity; likely functions in pathway(s) outside Ras; member of a family of putative palmitoyltransferases containing an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain -S000031546 CDS YDR459C 4 1383443 1382319 C 2011-02-03 1996-07-31 -S000002868 ORF Verified YDR460W TFB3 TFIIH/NER complex subunit TFB3|RIG2 chromosome 4 L000003496 4 1383811 1384776 W 2011-02-03 1996-07-31 Subunit of TFIIH and nucleotide excision repair factor 3 complexes; involved in transcription initiation, required for nucleotide excision repair; ring finger protein similar to mammalian CAK and TFIIH subunit -S000031579 CDS YDR460W 4 1383811 1384776 W 2011-02-03 1996-07-31 -S000002869 ORF Verified YDR461W MFA1 mating pheromone a chromosome 4 L000001096 4 1385176 1385286 W 280.27 2011-02-03 1996-07-31 Mating pheromone a-factor; made by a cells; interacts with alpha cells to induce cell cycle arrest and other responses leading to mating; biogenesis involves C-terminal modification, N-terminal proteolysis, and export; also encoded by MFA2 -S000032540 CDS YDR461W 4 1385176 1385286 W 2011-02-03 1996-07-31 -S000087209 ORF Uncharacterized YDR461C-A chromosome 4 4 1385766 1385524 C 2011-02-03 2005-11-15 Putative protein of unknown function -S000087210 CDS YDR461C-A 4 1385766 1385524 C 2011-02-03 2005-11-15 -S000002870 ORF Verified YDR462W MRPL28 mitochondrial 54S ribosomal protein YmL28|YmL28 chromosome 4 L000002691 4 1386073 1386516 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; protein abundance increases in response to DNA replication stress -S000032692 CDS YDR462W 4 1386073 1386516 W 2011-02-03 1996-07-31 -S000002871 ORF Verified YDR463W STP1 SSY2|BAP1 chromosome 4 L000002132 4 1386816 1388375 W 298 2011-02-03 2003-09-22|1996-07-31 Transcription factor; contains a N-terminal regulatory motif (RI) that acts as a cytoplasmic retention determinant and as an Asi dependent degron in the nucleus; undergoes proteolytic processing by SPS (Ssy1p-Ptr3p-Ssy5p)-sensor component Ssy5p in response to extracellular amino acids; activates transcription of amino acid permease genes and may have a role in tRNA processing; STP1 has a paralog, STP2, that arose from the whole genome duplication -S000032755 CDS YDR463W 4 1386816 1388375 W 2011-02-03 2003-09-22|1996-07-31 -S000002872 ORF Verified YDR464W SPP41 chromosome 4 L000002019 4 1388872 1393179 W 297 2011-02-03 1996-07-31 Protein of unknown function; involved in negative regulation of expression of spliceosome components PRP4 and PRP3; relocalizes to the cytosol in response to hypoxia -S000033502 CDS YDR464W 4 1388872 1393179 W 2011-02-03 1996-07-31 -S000028614 ORF Dubious YDR464C-A chromosome 4 4 1392680 1392492 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031450 CDS YDR464C-A 4 1392680 1392492 C 2011-02-03 2003-07-29 -S000002873 ORF Verified YDR465C RMT2 protein-arginine N5-methyltransferase chromosome 4 L000004724 4 1394574 1393336 C 2011-02-03 1996-07-31 Arginine N5 methyltransferase; methylates ribosomal protein Rpl12 (L12) on Arg67; relative distribution to the nucleus increases upon DNA replication stress -S000033538 CDS YDR465C 4 1394574 1393336 C 2011-02-03 1996-07-31 -S000002874 ORF Verified YDR466W PKH3 protein kinase PKH3 chromosome 4 4 1395121 1397817 W 2011-02-03 1996-07-31 Protein kinase with similarity to mammalian PDK1 and yeast Pkh1p/Phk2p; yeast Pkh1p and Pkh2p are two redundant upstream activators of Pkc1p; identified as a multicopy suppressor of a pkh1 pkh2 double mutant -S000033694 CDS YDR466W 4 1395121 1397817 W 2011-02-03 1996-07-31 -S000002875 ORF Dubious YDR467C chromosome 4 4 1397909 1397583 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033742 CDS YDR467C 4 1397909 1397583 C 2011-02-03 1996-07-31 -S000002876 ORF Verified YDR468C TLG1 chromosome 4 L000004227 4 1398700 1398026 C 2011-02-03 1996-07-31 Essential t-SNARE that mediates fusion of vesicles with the late Golgi; forms a complex with Tlg2p and Vti1p; mediates fusion of endosome-derived vesicles with the late Golgi; binds the docking complex VFT (Vps fifty-three) through interaction with Vps51p -S000034625 CDS YDR468C 4 1398700 1398026 C 2011-02-03 1996-07-31 -S000002877 ORF Verified YDR469W SDC1 SAF19|CPS25 chromosome 4 4 1399015 1399542 W 2011-02-03 1996-07-31 Subunit of the COMPASS (Set1C) complex; COMPASS methylates lysine 4 of histone H3 and is required in chromatin silencing at telomeres; contains a Dpy-30 domain that mediates interaction with Bre2p; similar to C. elegans and human DPY-30 -S000034852 CDS YDR469W 4 1399015 1399542 W 2011-02-03 1996-07-31 -S000002878 ORF Verified YDR470C UGO1 chromosome 4 4 1401214 1399706 C 2011-02-03 2000-04-06|1996-07-31|2011-02-03 Outer membrane component of the mitochondrial fusion machinery; binds to Fzo1p and Mgm1p to link these two GTPases during mitochondrial fusion; involved in fusion of both the outer and inner membranes; facilitates dimerization of Fzo1p during fusion; import into the outer membrane is mediated by Tom70p and Mim1p; has similarity to carrier proteins but likely not a transporter; similar to human SLC25A46 implicated in optic atroprophy spectrum disorder -S000035822 CDS YDR470C 4 1401214 1399706 C 2011-02-03 2000-04-06|1996-07-31|2011-02-03 -S000002879 ORF Verified YDR471W RPL27B eL27|ribosomal 60S subunit protein L27B|L27e|L27B chromosome 4 L000002898 4 1401770 1402564 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L27B; homologous to mammalian ribosomal protein L27, no bacterial homolog; RPL27B has a paralog, RPL27A, that arose from the whole genome duplication -S000036787 CDS YDR471W 4 1401770 1401800 W 2011-02-03 1996-07-31 -S000036788 CDS YDR471W 4 1402185 1402564 W 2011-02-03 1996-07-31 -S000036789 intron YDR471W 4 1401801 1402184 W 2011-02-03 1996-07-31 -S000006498 snoRNA_gene snR13 SNR13 chromosome 4 L000002849 4 1402919 1403042 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions A2280 and A2281 -S000036591 noncoding_exon snR13 4 1402919 1403042 W 2011-02-03 2000-05-19 -S000002880 ORF Verified YDR472W TRS31 TRAPP subunit TRS31 chromosome 4 S000007433 4 1403322 1404173 W 2011-02-03 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII) -S000036864 CDS YDR472W 4 1403322 1404173 W 2011-02-03 1996-07-31 -S000118448 ARS ARS440 ARSIV-1404 chromosome 4 4 1404290 1404524 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178080 ARS_consensus_sequence ARS440 4 1404322 1404338 W 2014-11-18 2014-11-18 -S000002881 ORF Verified YDR473C PRP3 U4/U6-U5 snRNP complex subunit PRP3|RNA3 chromosome 4 L000001496 4 1405854 1404445 C 300 2011-02-03 1996-07-31 Splicing factor; component of the U4/U6-U5 snRNP complex -S000036886 CDS YDR473C 4 1405854 1404445 C 2011-02-03 1996-07-31 -S000002883 ORF Verified YDR475C JIP4 YDR474C chromosome 4 4 1410094 1407464 C 2011-02-03 2003-09-30|1996-07-31 Protein of unknown function; previously annotated as two separate ORFs, YDR474C and YDR475C, which were merged as a result of corrections to the systematic reference sequence; JIP4 has a paralog, YOR019W, that arose from the whole genome duplication -S000037707 CDS YDR475C 4 1410094 1407464 C 2011-02-03 2003-09-30|1996-07-31 -S000002884 ORF Uncharacterized YDR476C chromosome 4 4 1411127 1410453 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YDR476C is not an essential gene -S000037771 CDS YDR476C 4 1411127 1410453 C 2011-02-03 1996-07-31 -S000002885 ORF Verified YDR477W SNF1 AMP-activated serine/threonine-protein kinase catalytic subunit SNF1|PAS14|HAF3|GLC2|CCR1|CAT1 chromosome 4 L000001944 4 1412373 1414274 W 304 2011-02-03 1996-07-31 AMP-activated S/T protein kinase; forms a complex with Snf4p and members of the Sip1p/Sip2p/Gal83p family; required for transcription of glucose-repressed genes, thermotolerance, sporulation, and peroxisome biogenesis; regulates nucleocytoplasmic shuttling of Hxk2p; regulates filamentous growth and acts as a non-canonical GEF, activating Arf3p during invasive growth; SUMOylation by Mms21p inhibits its function and targets Snf1p for destruction via the Slx5-Slx8 Ub ligase -S000029842 CDS YDR477W 4 1412373 1414274 W 2011-02-03 1996-07-31 -S000002886 ORF Verified YDR478W SNM1 chromosome 4 L000002825 4 1414575 1415171 W 2011-02-03 1996-07-31 Ribonuclease MRP complex subunit; ribonuclease (RNase) MRP cleaves pre-rRNA and has a role in cell cycle-regulated degradation of daughter cell-specific mRNAs; binds to the NME1 RNA subunit of RNase MRP -S000030848 CDS YDR478W 4 1414575 1415171 W 2011-02-03 1996-07-31 -S000002887 ORF Verified YDR479C PEX29 chromosome 4 4 1416874 1415210 C 2011-02-03 1996-07-31 ER-resident protein involved in peroxisomal biogenesis; ER-localized protein that associates with peroxisomes; interacts with Pex30p and reticulons Rtn1p and Yop1p to regulate peroxisome biogenesis from the ER; role in peroxisomal-destined vesicular flow from the ER; regulates peroxisomal size, number and distribution; Pex28p and Pex29p may act at steps upstream of those mediated by Pex30p, Pex31p, and Pex32p; forms ER foci upon DNA replication stress -S000030901 CDS YDR479C 4 1416874 1415210 C 2011-02-03 1996-07-31 -S000002888 ORF Verified YDR480W DIG2 RST2 chromosome 4 L000003123 4 1417399 1418370 W 2011-02-03 1996-07-31 MAP kinase-responsive inhibitor of the Ste12p transcription factor; involved in the regulation of mating-specific genes and the invasive growth pathway; related regulators Dig1p and Dig2p bind to Ste12p; DIG2 has a paralog, DIG1, that arose from the whole genome duplication -S000032009 CDS YDR480W 4 1417399 1418370 W 2011-02-03 1996-07-31 -S000002889 ORF Verified YDR481C PHO8 alkaline phosphatase PHO8|phoH chromosome 4 L000001422 4 1420250 1418550 C 306 2011-02-03 1996-07-31 Repressible vacuolar alkaline phosphatase; regulated by levels of Pi and by Pho4p, Pho9p, Pho80p, Pho81p and Pho85p; dephosphorylates phosphotyrosyl peptides; contributes to NAD+ metabolism by producing nicotinamide riboside from NMN -S000032056 CDS YDR481C 4 1420250 1418550 C 2011-02-03 1996-07-31 -S000002890 ORF Verified YDR482C CWC21 U2-type spliceosomal complex subunit CWC21 chromosome 4 4 1420838 1420431 C 2011-02-03 1996-07-31 Protein involved in RNA splicing by the spliceosome; component of a complex containing Cef1p; interacts genetically with ISY1 and BUD13; may bind RNA; has similarity to S. pombe Cwf21p -S000032970 CDS YDR482C 4 1420838 1420431 C 2011-02-03 1996-07-31 -S000002891 ORF Verified YDR483W KRE2 alpha-1,2-mannosyltransferase KRE2|MNT1 chromosome 4 L000000913 4 1421157 1422485 W 306 2011-02-03 1996-07-31 Alpha1,2-mannosyltransferase of the Golgi; involved in protein mannosylation; KRE2 has a paralog, KTR6, that arose from the whole genome duplication -S000033119 CDS YDR483W 4 1421157 1422485 W 2011-02-03 1996-07-31 -S000002892 ORF Verified YDR484W VPS52 SAC2 chromosome 4 L000001791 4 1422763 1424688 W 314 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; involved in localization of actin and chitin; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p -S000033198 CDS YDR484W 4 1422763 1424688 W 2011-02-03 1996-07-31 -S000002893 ORF Verified YDR485C VPS72 SWC2 chromosome 4 4 1427207 1424820 C 2011-02-03 2003-09-22|1996-07-31 Htz1p-binding component of the SWR1 complex; exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; may function as a lock that prevents removal of H2AZ from nucleosomes; required for vacuolar protein sorting -S000033955 CDS YDR485C 4 1427207 1424820 C 2011-02-03 2003-09-22|1996-07-31 -S000002894 ORF Verified YDR486C VPS60 CHM5|MOS10 chromosome 4 4 1428120 1427431 C 2011-02-03 2003-09-22|1996-07-31 Protein involved in late endosome to vacuole transport; cytoplasmic and vacuolar membrane protein; required for normal filament maturation during pseudohyphal growth; may function in targeting cargo proteins for degradation; interacts with Vta1p -S000034065 CDS YDR486C 4 1428120 1427431 C 2011-02-03 2003-09-22|1996-07-31 -S000002895 ORF Verified YDR487C RIB3 3,4-dihydroxy-2-butanone-4-phosphate synthase RIB3 chromosome 4 L000001635 4 1428980 1428354 C 2011-02-03 1996-07-31 3,4-dihydroxy-2-butanone-4-phosphate synthase (DHBP synthase); required for riboflavin biosynthesis from ribulose-5-phosphate, also has an unrelated function in mitochondrial respiration -S000034158 CDS YDR487C 4 1428980 1428354 C 2011-02-03 1996-07-31 -S000002896 ORF Verified YDR488C PAC11 dynein intermediate chain chromosome 4 L000001330 4 1430789 1429188 C 2011-02-03 1996-07-31 Dynein intermediate chain, microtubule motor protein; required for intracellular transport and cell division; acts in cytoplasmic dynein pathway; forms complex with dynein light chain Dyn2p that promotes Dyn1p homodimerization and potentiates motor processivity; Dyn2p-Pac11p complex is also important for interaction of dynein motor complex with dynactin complex; forms cortical cytoplasmic microtubule capture site with Num1p; essential in the absence of CIN8 -S000035100 CDS YDR488C 4 1430789 1429188 C 2011-02-03 1996-07-31 -S000002897 ORF Verified YDR489W SLD5 DNA replication protein SLD5|CDC105 chromosome 4 4 1431012 1431896 W 2011-02-03 1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery -S000035299 CDS YDR489W 4 1431012 1431896 W 2011-02-03 1996-07-31 -S000002898 ORF Verified YDR490C PKH1 serine/threonine protein kinase PKH1 chromosome 4 L000004616 4 1434268 1431968 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; involved in sphingolipid-mediated signaling pathway that controls endocytosis; activates Ypk1p and Ykr2p, components of signaling cascade required for maintenance of cell wall integrity; contains a PH-like domain; redundant with Pkh2p; PKH1 has a paralog, PKH2, that arose from the whole genome duplication -S000036098 CDS YDR490C 4 1434268 1431968 C 2011-02-03 1996-07-31 -S000002900 ORF Verified YDR492W IZH1 PAQR-type receptor chromosome 4 4 1434924 1435874 W 2011-02-03 1996-07-31 Membrane protein involved in zinc ion homeostasis; member of the four-protein IZH family; transcription is regulated directly by Zap1p, expression induced by zinc deficiency and fatty acids; deletion increases sensitivity to elevated zinc; IZH1 has a paralog, IZH4, that arose from the whole genome duplication -S000031780 CDS YDR492W 4 1434924 1435874 W 2011-02-03 1996-07-31 -S000002899 ORF Dubious YDR491C chromosome 4 4 1434991 1434500 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036239 CDS YDR491C 4 1434991 1434500 C 2011-02-03 1996-07-31 -S000002901 ORF Verified YDR493W MZM1 AIM8|FMP36 chromosome 4 4 1436217 1436588 W 2011-02-03 1996-07-31 Protein required for assembly of the cytochrome bc(1) complex; acts as a chaperone for Rip1p and facilitates its insertion into the complex at a late stage of assembly; localized to the mitochondrial matrix; null mutant exhibits a respiratory growth defect and reduced mitochondrial zinc levels, which is characteristic of mutations affecting bc(1) complex assembly; member of the LYR protein family; human LYRM7 is a functional ortholog -S000031922 CDS YDR493W 4 1436217 1436588 W 2011-02-03 1996-07-31 -S000002902 ORF Verified YDR494W RSM28 mitochondrial 37S ribosomal protein RSM28 chromosome 4 4 1436930 1438015 W 2011-02-03 2002-12-17|1996-07-31 Mitochondrial ribosomal protein of the small subunit; genetic interactions suggest a possible role in promoting translation initiation -S000037424 CDS YDR494W 4 1436930 1438015 W 2011-02-03 2002-12-17|1996-07-31 -S000002903 ORF Verified YDR495C VPS3 CORVET complex subunit VPS3|VPT17|VPL3|PEP6 chromosome 4 L000002469 4 1441150 1438115 C 2011-02-03 1996-07-31 Component of CORVET membrane tethering complex; cytoplasmic protein required for the sorting and processing of soluble vacuolar proteins, acidification of the vacuolar lumen, and assembly of the vacuolar H+-ATPase -S000037459 CDS YDR495C 4 1441150 1438115 C 2011-02-03 1996-07-31 -S000002904 ORF Verified YDR496C PUF6 chromosome 4 4 1443403 1441433 C 2011-02-03 1996-07-31 Pumilio-homology domain protein; binds the 3' UTR of ASH1 mRNA and represses its translation, resulting in proper asymmetric localization of ASH1 mRNA; required at post-transcriptional step for efficient retrotransposition; absence results in decreased Ty1 Gag:GFP protein levels; co-sediments with the 60S ribosomal subunit and is required for its biogenesis -S000037553 CDS YDR496C 4 1443403 1441433 C 2011-02-03 1996-07-31 -S000002905 ORF Verified YDR497C ITR1 myo-inositol transporter ITR1 chromosome 4 L000000879 4 1445467 1443713 C 2011-02-03 1996-07-31 Myo-inositol transporter; member of the sugar transporter superfamily; expression is repressed by inositol and choline via Opi1p and derepressed via Ino2p and Ino4p; relative distribution to the vacuole increases upon DNA replication stress; ITR1 has a paralog, ITR2, that arose from the whole genome duplication -S000037634 CDS YDR497C 4 1445467 1443713 C 2011-02-03 1996-07-31 -S000002906 ORF Verified YDR498C SEC20 chromosome 4 L000001843 4 1446994 1445843 C 2011-02-03 1996-07-31 Membrane glycoprotein v-SNARE; involved in retrograde transport from the Golgi to the endoplasmic reticulum (ER); required for N- and O-glycosylation in the Golgi but not in the ER and for efficient nuclear fusion during mating; mediates Sey1p-independent homotypic ER fusion; interacts with the Dsl1p complex through Tip20p -S000030424 CDS YDR498C 4 1446994 1445843 C 2011-02-03 1996-07-31 -S000002907 ORF Verified YDR499W LCD1 PIE1|DDC2 chromosome 4 4 1447830 1450073 W 2011-02-03 1996-07-31 Essential protein required for the DNA integrity checkpoint pathways; interacts physically with Mec1p; putative homolog of S. pombe Rad26 and human ATRIP; forms nuclear foci upon DNA replication stress -S000030564 CDS YDR499W 4 1447830 1450073 W 2011-02-03 1996-07-31 -S000002908 ORF Verified YDR500C RPL37B eL37|ribosomal 60S subunit protein L37B|L37e|YL35|L43|L37B chromosome 4 L000002899 4 1450853 1450198 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L37B; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; protein abundance increases in response to DNA replication stress; homologous to mammalian ribosomal protein L37, no bacterial homolog; RPL37B has a paralog, RPL37A, that arose from the whole genome duplication -S000036331 CDS YDR500C 4 1450457 1450198 C 2011-02-03 1996-07-31 -S000036330 CDS YDR500C 4 1450853 1450847 C 2011-02-03 1996-07-31 -S000036332 intron YDR500C 4 1450846 1450458 C 2011-02-03 1996-07-31 -S000002909 ORF Verified YDR501W PLM2 chromosome 4 S000007440 4 1451353 1452918 W 2011-02-03 1996-07-31 Putative transcription factor, contains Forkhead Associated domain; found associated with chromatin; target of SBF transcription factor; induced in response to DNA damaging agents and deletion of telomerase; PLM2 has a paralog, TOS4, that arose from the whole genome duplication -S000037037 CDS YDR501W 4 1451353 1452918 W 2011-02-03 1996-07-31 -S000002910 ORF Verified YDR502C SAM2 methionine adenosyltransferase SAM2|ETH2 chromosome 4 L000001799 4 1454464 1453310 C 2011-02-03 1996-07-31 S-adenosylmethionine synthetase; catalyzes transfer of the adenosyl group of ATP to the sulfur atom of methionine; comparative analysis suggests that a mitochondrially targeted form may result from translation starting at a non-canonical codon upstream of the annotated start codon -S000037058 CDS YDR502C 4 1454464 1453310 C 2011-02-03 1996-07-31 -S000130178 ARS ARS442 chromosome 4 4 1454509 1455087 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000002911 ORF Verified YDR503C LPP1 phosphatidate phosphatase LPP1 chromosome 4 L000004266 4 1455866 1455042 C 2011-02-03 1996-07-31 Lipid phosphate phosphatase; catalyzes Mg(2+)-independent dephosphorylation of phosphatidic acid (PA), lysophosphatidic acid, and diacylglycerol pyrophosphate; involved in control of the cellular levels of phosphatidylinositol and PA -S000037180 CDS YDR503C 4 1455866 1455042 C 2011-02-03 1996-07-31 -S000002912 ORF Verified YDR504C SPG3 chromosome 4 4 1456694 1456311 C 2011-02-03 1996-07-31 Protein required for high temperature survival during stationary phase; not required for growth on nonfermentable carbon sources; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000037274 CDS YDR504C 4 1456694 1456311 C 2011-02-03 1996-07-31 -S000002913 ORF Verified YDR505C PSP1 GIN5 chromosome 4 L000002881|L000002877 4 1459220 1456695 C 2011-02-03 1996-07-31|2011-02-03 Asn and gln rich protein of unknown function; high-copy suppressor of POL1 (DNA polymerase alpha) and partial suppressor of CDC2 (polymerase delta) and CDC6 (pre-RC loading factor) mutations; overexpression results in growth inhibition; PSP1 has a paralog, YLR177W, that arose from the whole genome duplication -S000029936 CDS YDR505C 4 1459220 1456695 C 2011-02-03 1996-07-31|2011-02-03 -S000002914 ORF Verified YDR506C GMC1 putative oxidoreductase chromosome 4 4 1461554 1459728 C 2011-02-03 1996-07-31 Protein involved in meiotic progression; mutants are delayed in meiotic nuclear division and are defective in synaptonemal complex assembly; possible membrane-localized protein; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000030050 CDS YDR506C 4 1461554 1459728 C 2011-02-03 1996-07-31 -S000006638 tRNA_gene tL(CAA)D chromosome 4 L000003775 4 1461829 1461715 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000033776 intron tL(CAA)D 4 1461791 1461759 C 2011-02-03 2000-05-19 -S000033775 noncoding_exon tL(CAA)D 4 1461758 1461715 C 2011-02-03 2000-05-19 -S000033774 noncoding_exon tL(CAA)D 4 1461829 1461792 C 2011-02-03 2000-05-19 -S000118449 ARS ARS443 ARSIV-1462 chromosome 4 4 1461862 1462173 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000002915 ORF Verified YDR507C GIN4 protein kinase GIN4|ERC47 chromosome 4 L000002876 4 1465786 1462358 C 2011-02-03 1996-07-31 Protein kinase involved in bud growth and assembly of the septin ring; proposed to have kinase-dependent and kinase-independent activities; undergoes autophosphorylation; similar to Hsl1p; GIN4 has a paralog, KCC4, that arose from the whole genome duplication -S000030234 CDS YDR507C 4 1465786 1462358 C 2011-02-03 1996-07-31 -S000002917 ORF Dubious YDR509W chromosome 4 4 1468226 1468573 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031352 CDS YDR509W 4 1468226 1468573 W 2011-02-03 1996-07-31 -S000002916 ORF Verified YDR508C GNP1 glutamine permease GNP1 chromosome 4 L000002806 4 1468444 1466453 C 2011-02-03 1996-07-31 High-affinity glutamine permease; also transports Leu, Ser, Thr, Cys, Met and Asn; expression is fully dependent on Grr1p and modulated by the Ssy1p-Ptr3p-Ssy5p (SPS) sensor of extracellular amino acids; GNP1 has a paralog, AGP1, that arose from the whole genome duplication -S000031178 CDS YDR508C 4 1468444 1466453 C 2011-02-03 1996-07-31 -S000002918 ORF Verified YDR510W SMT3 SUMO family protein SMT3 chromosome 4 L000001938 4 1469400 1469705 W 2011-02-03 1996-07-31 Ubiquitin-like protein of the SUMO family; conjugated to lysine residues of target proteins; associates with transcriptionally active genes; regulates chromatid cohesion, chromosome segregation, APC-mediated proteolysis, DNA replication and septin ring dynamics; human homolog SUMO1 can complement yeast null mutant -S000032284 CDS YDR510W 4 1469400 1469705 W 2011-02-03 1996-07-31 -S000028615 ORF Dubious YDR510C-A chromosome 4 4 1469811 1469695 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031452 CDS YDR510C-A 4 1469811 1469695 C 2011-02-03 2003-07-29 -S000002919 ORF Verified YDR511W SDH7 ACN9 chromosome 4 4 1470017 1470418 W 2011-02-03 1996-07-31 Mitochondrial protein involved in assembly of succinate dehydrogenase; has a role in maturation of the Sdh2p subunit; localized to the mitochondrial intermembrane space; required for acetate utilization and gluconeogenesis; mutation in Drosophila ortholog SDHAF3 causes reduced succinate dehydrogenase activity and neuronal and muscular dysfunction; member of the LYR protein family -S000032384 CDS YDR511W 4 1470017 1470418 W 2011-02-03 1996-07-31 -S000002921 ORF Verified YDR513W GRX2 dithiol glutaredoxin GRX2|TTR1 chromosome 4 L000000510|L000002386 4 1471017 1471448 W 2011-02-03 1996-07-31 Cytoplasmic glutaredoxin; thioltransferase, glutathione-dependent disulfide oxidoreductase involved in maintaining redox state of target proteins, also exhibits glutathione peroxidase activity, expression induced in response to stress; GRX2 has two in-frame start codons resulting in a shorter isoform that is retained in the cytosol and a longer form translocated to the mitochondrial matrix; GRX2 has a paralog, GRX1, that arose from the whole genome duplication -S000033294 CDS YDR513W 4 1471017 1471448 W 2011-02-03 1996-07-31 -S000002920 ORF Verified YDR512C EMI1 chromosome 4 4 1471063 1470500 C 2011-02-03 1996-07-31 Non-essential protein of unknown function; required for transcriptional induction of the early meiotic-specific transcription factor IME1, also required for sporulation; contains twin cysteine-x9-cysteine motifs; deletion affects mitochondrial morphology -S000032449 CDS YDR512C 4 1471063 1470500 C 2011-02-03 1996-07-31 -S000002922 ORF Verified YDR514C chromosome 4 4 1472999 1471548 C 2011-02-03 1996-07-31 Protein of unknown function that localizes to mitochondria; overexpression affects endocytic protein trafficking; YDR514C has a paralog, GFD2, that arose from the whole genome duplication -S000033333 CDS YDR514C 4 1472999 1471548 C 2011-02-03 1996-07-31 -S000002923 ORF Verified YDR515W SLF1 SRO99 chromosome 4 L000004191|L000002894 4 1473429 1474772 W 2011-02-03 1996-07-31 RNA binding protein that associates with polysomes; may be involved in regulating mRNA translation; involved in the copper-dependent mineralization of copper sulfide complexes on cell surface in cells cultured in copper salts; SLF1 has a paralog, SRO9, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000034278 CDS YDR515W 4 1473429 1474772 W 2011-02-03 1996-07-31 -S000002924 ORF Verified YDR516C EMI2 putative glucokinase chromosome 4 4 1476476 1474974 C 2011-02-03 1996-07-31 Non-essential protein of unknown function; required for transcriptional induction of the early meiotic-specific transcription factor IME1; required for sporulation; expression regulated by glucose-repression transcription factors Mig1/2p; EMI2 has a paralog, GLK1, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000034325 CDS YDR516C 4 1476476 1474974 C 2011-02-03 1996-07-31 -S000002925 ORF Verified YDR517W GRH1 chromosome 4 4 1477239 1478357 W 2011-02-03 1996-07-31 Acetylated cis-Golgi protein, involved in ER to Golgi transport; homolog of human GRASP65; forms a complex with the coiled-coil protein Bug1p; mutants are compromised for the fusion of ER-derived vesicles with Golgi membranes; protein abundance increases in response to DNA replication stress -S000034449 CDS YDR517W 4 1477239 1478357 W 2011-02-03 1996-07-31 -S000002926 ORF Verified YDR518W EUG1 protein disulfide isomerase EUG1 chromosome 4 L000000589 4 1478608 1480161 W 2011-02-03 1996-07-31 Protein disulfide isomerase of the endoplasmic reticulum lumen; EUG1 has a paralog, PDI1, that arose from the whole genome duplication; function overlaps with that of Pdi1p; may interact with nascent polypeptides in the ER -S000034562 CDS YDR518W 4 1478608 1480161 W 2011-02-03 1996-07-31 -S000002927 ORF Verified YDR519W FPR2 peptidylprolyl isomerase family protein FPR2|FKB2 chromosome 4 L000000613 4 1480425 1480832 W 2011-02-03 1996-07-31 Membrane-bound peptidyl-prolyl cis-trans isomerase (PPIase); binds to the drugs FK506 and rapamycin; expression pattern suggests possible involvement in ER protein trafficking; relocalizes from nucleus to vacuole upon DNA replication stress; mutation is functionally complemented by human FKBP2 -S000035584 CDS YDR519W 4 1480425 1480832 W 2011-02-03 1996-07-31 -S000002929 ORF Dubious YDR521W chromosome 4 4 1483141 1483476 W 2011-02-03 1996-07-31 Dubious ORF that overlaps YDR520C; mutant increases expression of PIS1 and RPL3 in glycerol -S000035558 CDS YDR521W 4 1483141 1483476 W 2011-02-03 1996-07-31 -S000002928 ORF Uncharacterized YDR520C URC2 RRT4 chromosome 4 S000122335 4 1483403 1481085 C 2011-02-03 1996-07-31 Putative Zn(II)2Cys6 motif containing transcription factor; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; similar to S. kluyveri Urc2p involved in uracil catabolism -S000035462 CDS YDR520C 4 1483403 1481085 C 2011-02-03 1996-07-31 -S000002930 ORF Verified YDR522C SPS2 chromosome 4 L000002025 4 1485303 1483795 C 2011-02-03 1996-07-31 Protein expressed during sporulation; SPS2 has a paralog, SPS22, that arose from the whole genome duplication; redundant with Sps22p for organization of the beta-glucan layer of the spore wall; S. pombe ortholog is a spore wall component -S000035591 CDS YDR522C 4 1485303 1483795 C 2011-02-03 1996-07-31 -S000118450 ARS ARS446 ARSIV-1487 chromosome 4 4 1486918 1487161 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178081 ARS_consensus_sequence ARS446 4 1487092 1487076 C 2014-11-18 2014-11-18 -S000002931 ORF Verified YDR523C SPS1 putative serine/threonine protein kinase SPS1 chromosome 4 L000002024 4 1487038 1485566 C 2011-02-03 1996-07-31 Putative protein serine/threonine kinase; localizes to the nucleus and cytoplasm; required for efficient spore packaging, prospore membrane development and closure and localization of enzymes involved in spore wall synthesis; interacts with and required for Ssp1p phosphorylation and turnover; member of the GCKIII subfamily of STE20 kinases; multiply phosphorylated on S/T residues; interacts with 14-3-3 proteins, Bmh1p and Bmh2p; expressed at the end of meiosis -S000036490 CDS YDR523C 4 1487038 1485566 C 2011-02-03 1996-07-31 -S000002932 ORF Verified YDR524C AGE1 SAT1 chromosome 4 S000007502 4 1488990 1487542 C 2011-02-03 1996-07-31 ADP-ribosylation factor (ARF) GTPase activating protein (GAP) effector; involved in the secretory and endocytic pathways; contains C2C2H2 cysteine/histidine motif -S000036586 CDS YDR524C 4 1488990 1487542 C 2011-02-03 1996-07-31 -S000028740 ORF Uncharacterized YDR524W-C YDR524W-A chromosome 4 4 1489403 1489492 W 2011-02-03 2003-07-29 Putative protein of unknown function; small ORF identified by SAGE; deletion strains are moderately sensitive to the radiomimetic drug bleomycin -S000033410 CDS YDR524W-C 4 1489403 1489492 W 2011-02-03 2003-07-29 -S000028739 ORF Uncharacterized YDR524C-B chromosome 4 4 1489798 1489598 C 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YDR524C-B has a paralog, YCL048W-A, that arose from the whole genome duplication -S000033383 CDS YDR524C-B 4 1489798 1489598 C 2011-02-03 2003-07-29 -S000002933 ORF Dubious YDR525W API2 chromosome 4 4 1489905 1490234 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 26% of ORF overlaps the dubious ORF YDR524C-A; insertion mutation in a cdc34-2 mutant background causes altered bud morphology -S000036746 CDS YDR525W 4 1489905 1490234 W 2011-02-03 1996-07-31 -S000028616 ORF Dubious YDR524C-A YDR524C-C chromosome 4 4 1489990 1489871 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031456 CDS YDR524C-A 4 1489990 1489871 C 2011-02-03 2003-07-29 -S000007236 ORF Verified YDR525W-A SNA2 chromosome 4 4 1490596 1490835 W 2011-02-03 1999-07-17 Protein of unknown function; has similarity to Pmp3p, which is involved in cation transport; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern -S000036177 CDS YDR525W-A 4 1490596 1490835 W 2011-02-03 1999-07-17 -S000002935 ORF Verified YDR527W RBA50 chromosome 4 4 1491094 1492413 W 2011-02-03 1996-07-31|2011-02-03 Protein involved in transcription; interacts with RNA polymerase II subunits Rpb2p, Rpb3, and Rpb11p; has similarity to human RPAP1 -S000037626 CDS YDR527W 4 1491094 1492413 W 2011-02-03 1996-07-31|2011-02-03 -S000002934 ORF Dubious YDR526C chromosome 4 4 1491545 1491075 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037413 CDS YDR526C 4 1491545 1491075 C 2011-02-03 1996-07-31 -S000028466 snoRNA_gene snR84 SNR84 RUF1 chromosome 4 4 1493026 1492477 C 2011-02-03 2003-03-05 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2266; overexpression confers resistance to baking-associated stress -S000030073 noncoding_exon snR84 4 1493026 1492477 C 2011-02-03 2003-03-05 -S000002936 ORF Verified YDR528W HLR1 chromosome 4 4 1494586 1495857 W 2011-02-03 1996-07-31 Protein involved in regulation of cell wall composition and integrity; also involved in cell wall response to osmotic stress; overproduction suppresses a lysis sensitive PKC mutation; HLR1 has a paralog, LRE1, that arose from the whole genome duplication -S000030394 CDS YDR528W 4 1494586 1495857 W 2011-02-03 1996-07-31 -S000002937 ORF Verified YDR529C QCR7 ubiquinol--cytochrome-c reductase subunit 7|UCR7|CRO1|COR4 chromosome 4 L000001547 4 1496548 1496165 C 2011-02-03 1996-07-31 Subunit 7 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; oriented facing the mitochondrial matrix; N-terminus appears to play a role in complex assembly -S000030475 CDS YDR529C 4 1496548 1496165 C 2011-02-03 1996-07-31 -S000002938 ORF Verified YDR530C APA2 bifunctional AP-4-A phosphorylase/ADP sulfurylase chromosome 4 L000000091 4 1497768 1496791 C 2011-02-03 1996-07-31 Diadenosine 5',5'''-P1,P4-tetraphosphate phosphorylase II; AP4A phosphorylase involved in catabolism of bis(5'-nucleosidyl) tetraphosphates; APA2 has a paralog, APA1, that arose from the whole genome duplication -S000031311 CDS YDR530C 4 1497768 1496791 C 2011-02-03 1996-07-31 -S000002939 ORF Verified YDR531W CAB1 pantothenate kinase chromosome 4 4 1498232 1499335 W 2011-02-03 1996-07-31 Pantothenate kinase, ATP:D-pantothenate 4'-phosphotransferase; catalyzes the first committed step in the universal biosynthetic pathway for synthesis of coenzyme A (CoA); transcriptionally regulated by Upc2p via a sterol response element -S000031423 CDS YDR531W 4 1498232 1499335 W 2011-02-03 1996-07-31 -S000002940 ORF Verified YDR532C KRE28 chromosome 4 4 1500553 1499396 C 2011-02-03 1996-07-31 Subunit of a kinetochore-microtubule binding complex; complex bridges centromeric heterochromatin and kinetochore MAPs and motors; required for sister chromatid bi-orientation and kinetochore binding of SAC components; complex also includes Spc105p; modified by sumoylation -S000031481 CDS YDR532C 4 1500553 1499396 C 2011-02-03 1996-07-31 -S000002941 ORF Verified YDR533C HSP31 glutathione-independent methylglyoxalase chromosome 4 4 1502160 1501447 C 2011-02-03 1996-07-31 Methylglyoxalase that converts methylglyoxal to D-lactate; involved in oxidative stress resistance, diauxic shift, and stationary phase survival; has similarity to E. coli Hsp31 and C. albicans Glx3p; member of the DJ-1/ThiJ/PfpI superfamily, which includes human DJ-1 involved in Parkinson's disease and cancer; exists as a dimer and contains a putative metal-binding site; protein abundance increases in response to DNA replication stress -S000031524 CDS YDR533C 4 1502160 1501447 C 2011-02-03 1996-07-31 -S000002942 ORF Verified YDR534C FIT1 chromosome 4 4 1504900 1503314 C 2011-02-03 1996-07-31 Mannoprotein that is incorporated into the cell wall; incorporated via a glycosylphosphatidylinositol (GPI) anchor; involved in the retention of siderophore-iron in the cell wall -S000031631 CDS YDR534C 4 1504900 1503314 C 2011-02-03 1996-07-31 -S000002943 ORF Dubious YDR535C chromosome 4 4 1507362 1506606 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YDR535C is not an essential gene -S000032613 CDS YDR535C 4 1507058 1506606 C 2011-02-03 1996-07-31 -S000032612 CDS YDR535C 4 1507362 1507315 C 2011-02-03 1996-07-31 -S000032614 intron YDR535C 4 1507314 1507059 C 2011-02-03 1996-07-31 -S000002944 ORF Verified YDR536W STL1 glucose-inactivated glycerol proton symporter STL1 chromosome 4 L000002130 4 1508005 1509714 W 2011-02-03 1996-07-31 Glycerol proton symporter of the plasma membrane; subject to glucose-induced inactivation, strongly but transiently induced when cells are subjected to osmotic shock -S000032772 CDS YDR536W 4 1508005 1509714 W 2011-02-03 1996-07-31 -S000002946 ORF Verified YDR538W PAD1 phenylacrylic acid decarboxylase PAD1|POF1 chromosome 4 L000001331 4 1510902 1511630 W 2011-02-03 1996-07-31 Phenylacrylic acid decarboxylase; confers resistance to cinnamic acid, decarboxylates aromatic carboxylic acids to the corresponding vinyl derivatives; also has mRNA binding activity; homolog of E. coli UbiX; co-overproduction of Pad1p and Fdc1p greatly increases cinnamic acid decarboxylase activity -S000033597 CDS YDR538W 4 1510902 1511630 W 2011-02-03 1996-07-31 -S000002945 ORF Dubious YDR537C chromosome 4 4 1511461 1510856 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF PAD1/YDR538W -S000032834 CDS YDR537C 4 1511461 1510856 C 2011-02-03 1996-07-31 -S000002947 ORF Verified YDR539W FDC1 putative phenylacrylic acid decarboxylase FDC1 chromosome 4 4 1512094 1513605 W 2011-02-03 1996-07-31 Ferulic acid decarboxylase, also active on p-coumaric acid; essential for decarboxylation of aromatic carboxylic acids to corresponding vinyl derivatives; co-overproduction of Pad1p and Fdc1p greatly increases cinnamic acid decarboxylase activity; structure implicates Glu285 as the general base in the nonoxidative decarboxylation reaction catalyzed by Fdc1p; homolog of E. coli UbiD; GFP-fusion protein localizes to cytoplasm -S000033698 CDS YDR539W 4 1512094 1513605 W 2011-02-03 1996-07-31 -S000002948 ORF Verified YDR540C IRC4 chromosome 4 4 1517675 1517136 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays increased levels of spontaneous Rad52p foci; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus -S000034746 CDS YDR540C 4 1517675 1517136 C 2011-02-03 1996-07-31 -S000006879 long_terminal_repeat YDRWdelta31 chromosome 4 4 1518484 1518807 W 2011-02-03 2000-05-19 Ty1 LTR -S000002949 ORF Verified YDR541C carbonyl reductase (NADPH-dependent) chromosome 4 4 1520698 1519664 C 2011-02-03 1996-07-31|2011-02-03 Aldehyde reductase; substrates include both aromatic and aliphatic aldehydes; uses NADPH as cofactor; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000035672 CDS YDR541C 4 1520698 1519664 C 2011-02-03 1996-07-31|2011-02-03 -S000002950 ORF Verified YDR542W PAU10 seripauperin PAU10 chromosome 4 4 1523249 1523611 W 2011-02-03 1996-07-31 Protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to the vacuole; member of the seripauperin multigene family encoded mainly in subtelomeric regions -S000035788 CDS YDR542W 4 1523249 1523611 W 2011-02-03 1996-07-31 -S000028948 telomere TEL04R chromosome 4 4 1524625 1531933 W 321 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome IV; composed of an X element core sequence, X element combinatorial repeats, a short stretch of telomeric repeats, and a long Y' element -S000028949 telomeric_repeat TEL04R 4 1525371 1525466 W 2011-02-03 2003-09-09 Internal telomeric repeats on the right arm of Chromosome IV -S000028950 X_element TEL04R 4 1524625 1525089 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome IV; spans 464 bp and contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YDR543C -S000028951 X_element_combinatorial_repeat TEL04R 4 1525090 1525370 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr IV; spans 280 bp and contains repeats of the D, C, B and A types, Tbf1p binding sites, and ORF YDR544C; formerly called SubTelomeric Repeats -S000028952 Y_prime_element TEL04R 4 1525467 1531933 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome IV; contains an ARS consensus sequence, a region of 36-bp repeats, and ORFs YRF1-1/YDR545W and YDR545C-A -S000002951 ORF Dubious YDR543C chromosome 4 4 1524933 1524634 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035825 CDS YDR543C 4 1524933 1524634 C 2011-02-03 1996-07-31 -S000002952 ORF Dubious YDR544C chromosome 4 4 1525523 1525095 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035945 CDS YDR544C 4 1525523 1525095 C 2011-02-03 1996-07-31 -S000002953 ORF Verified YDR545W YRF1-1 Y' element ATP-dependent helicase protein 1 copy 1|YRF1 chromosome 4 L000004879 4 1526321 1531711 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p -S000036865 CDS YDR545W 4 1526321 1531711 W 2011-02-03 1996-07-31 -S000028617 ORF Dubious YDR545C-A chromosome 4 4 1531342 1530863 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF YRF1-1/YDR545W -S000031458 CDS YDR545C-A 4 1531342 1530863 C 2011-02-03 2003-07-29 -S000028621 ORF Dubious YEL077W-A chromosome 5 5 630 1112 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031470 CDS YEL077W-A 5 630 1112 W 2003-07-29 2003-07-29 -S000006409 ORF Uncharacterized YEL077C Y' element ATP-dependent helicase chromosome 5 5 4097 264 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element -S000034008 CDS YEL077C 5 4097 264 C 1996-07-31 1996-07-31 -S000077377 ARS ARS502 chromosome 5 5 4097 4185 2004-10-19 2004-10-19 Autonomously Replicating Sequence -S000002956 ORF Dubious YEL075W-A YEL076W-C chromosome 5 5 4870 5481 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031130 CDS YEL075W-A 5 4870 5481 W 1996-07-31 1996-07-31 -S000002955 ORF Uncharacterized YEL076C-A chromosome 5 5 5114 4185 C 1996-07-31 1996-07-31 Putative protein of unknown function -S000036122 CDS YEL076C-A 5 4322 4185 C 1996-07-31 1996-07-31 -S000036121 CDS YEL076C-A 5 5114 4602 C 1996-07-31 1996-07-31 -S000036123 intron YEL076C-A 5 4601 4323 C 1996-07-31 1996-07-31 -S000000802 ORF Uncharacterized YEL076C chromosome 5 5 5114 4464 C 1996-07-31 1996-07-31 Putative protein of unknown function -S000033207 CDS YEL076C 5 5114 4464 C 1996-07-31 1996-07-31 -S000000801 ORF Uncharacterized YEL075C chromosome 5 5 5713 5345 C 1996-07-31 1996-07-31 Putative protein of unknown function -S000033136 CDS YEL075C 5 5713 5345 C 1996-07-31 1996-07-31 -S000000800 ORF Dubious YEL074W chromosome 5 5 6126 6464 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; large scale expression analysis showed an increase in mRNA accumulation in strains mutant for exosome components -S000033091 CDS YEL074W 5 6126 6464 W 1996-07-31 1996-07-31 -S000077378 ARS ARS503 chromosome 5 5 6378 6453 2014-11-18 2004-10-19|2014-11-18 Autonomously Replicating Sequence -S000028879 telomere TEL05L chromosome 5 5 6473 1 C -52 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome V; annotated components include an X element core sequence and a long Y' element; TEL05L does have telomeric repeats (TEL05L-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly -S000028880 X_element TEL05L 5 6473 6279 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome V; contains an ARS consensus sequence and spans ORF YEL074W -S000028881 Y_prime_element TEL05L 5 6278 1 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome V; contains an ARS consensus sequence, a region of 36-bp repeats, and six ORFs (YEL075C, YEL076C, YEL076C-A, YEL077C, YEL075W-A, YEL077W-A) -S000000799 ORF Uncharacterized YEL073C chromosome 5 5 7553 7230 C 1996-07-31 1996-07-31 Putative protein of unknown function; located adjacent to ARS503 and the telomere on the left arm of chromosome V; regulated by inositol/choline -S000032128 CDS YEL073C 5 7553 7230 C 1996-07-31 1996-07-31 -S000077379 ARS ARS504 chromosome 5 5 8786 10019 2004-10-19 2004-10-19|2011-02-03 Autonomously Replicating Sequence -S000000798 ORF Verified YEL072W RMD6 chromosome 5 5 13720 14415 W 1996-07-31 1996-07-31 Protein required for sporulation -S000032092 CDS YEL072W 5 13720 14415 W 1996-07-31 1996-07-31 -S000000797 ORF Verified YEL071W DLD3 D-lactate dehydrogenase chromosome 5 5 16355 17845 W 1996-07-31 1996-07-31 2-hydroxyglutarate transhydrogenase, and minor D-lactate dehydrogenase; converts D-2-hydroxyglutarate (D-2HG), an oncometabolite, to alpha-ketoglutarate in the presence of FAD, with concomitant reduction of pyruvate to D-lactate; minor lactate dehydrogenase activity; component of the retrograde regulon that consists of genes whose expression are stimulated by damage to mitochondria and reduced in cells grown with glutamate as the sole nitrogen source; located in the cytoplasm -S000031974 CDS YEL071W 5 16355 17845 W 1996-07-31 1996-07-31 -S000000796 ORF Verified YEL070W DSF1 MAN1|mannitol dehydrogenase DSF1 chromosome 5 5 19589 21097 W 1996-07-31 1996-07-31 Mannitol dehydrogenase; deletion suppresses mutation of mpt5; DSF1 has a paralog, MAN2, that arose from a segmental duplication -S000031743 CDS YEL070W 5 19589 21097 W 1996-07-31 1996-07-31 -S000000795 ORF Verified YEL069C HXT13 HLT1|hexose transporter HXT13 chromosome 5 L000002640 5 23231 21537 C 1996-07-31 1996-07-31 Putative transmembrane polyol transporter; supports growth on and uptake of mannitol and sorbitol with moderate affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; induced by non-fermentable carbon sources; induced in low glucose, repressed in high glucose; HXT13 has a paralog, HXT17, that arose from a segmental duplication -S000030787 CDS YEL069C 5 23231 21537 C 1996-07-31 1996-07-31 -S000000794 ORF Uncharacterized YEL068C chromosome 5 5 25978 25646 C 1996-07-31 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; SWAT-GFP and seamless-GFP fusion proteins localize to the endoplasmic reticulum and mCherry fusion protein localizes to the vacuole -S000037857 CDS YEL068C 5 25978 25646 C 1996-07-31 1996-07-31 -S000000792 ORF Verified YEL066W HPA3 D-amino-acid N-acetyltransferase chromosome 5 L000004380 5 26667 27206 W 1996-07-31 1996-07-31 D-Amino acid N-acetyltransferase that detoxifies D-amino acids; catalyzes N-acetylation of D-amino acids through ordered bi-bi mechanism in which acetyl-CoA is first substrate bound and CoA is last product liberated; acetylates histones and polyamines, also autoacetylates -S000037723 CDS YEL066W 5 26667 27206 W 1996-07-31 1996-07-31 -S000000793 ORF Uncharacterized YEL067C chromosome 5 5 26776 26189 C 1996-07-31 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000037750 CDS YEL067C 5 26776 26189 C 1996-07-31 1996-07-31 -S000000791 ORF Verified YEL065W SIT1 siderophore transporter|ARN3 chromosome 5 5 27657 29543 W 1996-07-31 1996-07-31 Ferrioxamine B transporter; member of the ARN family of transporters that specifically recognize siderophore-iron chelates; transcription is induced during iron deprivation and diauxic shift; potentially phosphorylated by Cdc28p -S000036964 CDS YEL065W 5 27657 29543 W 1996-07-31 1996-07-31 -S000000790 ORF Verified YEL064C AVT2 chromosome 5 5 31239 29797 C 1996-07-31 1996-07-31 Putative transporter; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters -S000036881 CDS YEL064C 5 31239 29797 C 1996-07-31 1996-07-31 -S000000789 ORF Verified YEL063C CAN1 arginine permease CAN1 chromosome 5 L000000213 5 33466 31694 C -50 1996-07-31 1996-07-31 Plasma membrane arginine permease; requires phosphatidyl ethanolamine (PE) for localization, exclusively associated with lipid rafts; mutation confers canavanine resistance; CAN1 has a paralog, ALP1, that arose from the whole genome duplication -S000036793 CDS YEL063C 5 33466 31694 C 1996-07-31 1996-07-31 -S000000788 ORF Verified YEL062W NPR2 nitrogen permease regulating protein NPR2 chromosome 5 L000001274 5 34407 36254 W 2003-09-22 2003-09-22|1996-07-31 Subunit of the Iml1p/SEACIT complex; SEACIT (Iml1p-Npr2p-Npr3p) is a subcomplex of the SEA complex, a coatomer-related complex that associates dynamically with the vacuole; Npr2p may have a structural or regulatory role, supporting Iml1p function as a GAP for the Rag family GTPase Gtr1p, and resulting in inhibition of TORC1 signaling in response to amino acid deprivation; SEACIT is required for non-nitrogen-starvation-induced autophagy; homolog of human tumor suppressor NPRL2 -S000035991 CDS YEL062W 5 34407 36254 W 2003-09-22 2003-09-22|1996-07-31 -S000000787 ORF Verified YEL061C CIN8 kinesin motor protein CIN8|SDS15|KSL2 chromosome 5 L000000340 5 39537 36535 C 2003-09-22 2003-09-22|1996-07-31 Kinesin motor protein; involved in mitotic spindle assembly and chromosome segregation -S000035795 CDS YEL061C 5 39537 36535 C 2003-09-22 2003-09-22|1996-07-31 -S000000786 ORF Verified YEL060C PRB1 proteinase B|CVT1 chromosome 5 L000001480 5 41953 40046 C -48 1996-07-31 1996-07-31 Vacuolar proteinase B (yscB) with H3 N-terminal endopeptidase activity; serine protease of the subtilisin family; involved in protein degradation in the vacuole and required for full protein degradation during sporulation; activity inhibited by Pbi2p; protein abundance increases in response to DNA replication stress; PRB1 has a paralog, YSP3, that arose from the whole genome duplication -S000035710 CDS YEL060C 5 41953 40046 C 1996-07-31 1996-07-31 -S000002954 ORF Verified YEL059C-A SOM1 chromosome 5 L000003993 5 42624 42400 C 1996-07-31 1996-07-31 Subunit of the mitochondrial inner membrane peptidase (IMP); IMP is required for maturation of mitochondrial proteins of the intermembrane space; Som1p facilitates cleavage of a subset of substrates; contains twin cysteine-x9-cysteine motifs -S000035802 CDS YEL059C-A 5 42624 42400 C 1996-07-31 1996-07-31 -S000000785 ORF Dubious YEL059W HHY1 ENV6 chromosome 5 5 42652 42960 W 1996-07-31 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; mutant is hypersensitive to hygromycin B indicative of defects in vacuolar trafficking -S000034663 CDS YEL059W 5 42652 42960 W 1996-07-31 1996-07-31 -S000000784 ORF Verified YEL058W PCM1 phosphoacetylglucosamine mutase PCM1|AGM1 chromosome 5 L000001351 5 43252 44925 W 1996-07-31 1996-07-31 Essential N-acetylglucosamine-phosphate mutase; converts GlcNAc-6-P to GlcNAc-1-P, which is a precursor for the biosynthesis of chitin and for the formation of N-glycosylated mannoproteins and glycosylphosphatidylinositol anchors -S000033785 CDS YEL058W 5 43252 44925 W 1996-07-31 1996-07-31 -S000000783 ORF Verified YEL057C SDD1 chromosome 5 5 45721 45020 C 1996-07-31 1996-07-31 Protein of unknown function; overproduction suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P; may have a role in telomere maintenance; target of UME6 regulation -S000033614 CDS YEL057C 5 45721 45020 C 1996-07-31 1996-07-31 -S000000782 ORF Verified YEL056W HAT2 chromosome 5 L000003400 5 47168 48373 W 1996-07-31 1996-07-31 Subunit of the Hat1p-Hat2p histone acetyltransferase complex; required for high affinity binding of the complex to free histone H4, thereby enhancing Hat1p activity; similar to human RbAp46 and 48; has a role in telomeric silencing -S000033568 CDS YEL056W 5 47168 48373 W 1996-07-31 1996-07-31 -S000000781 ORF Verified YEL055C POL5 DNA-directed DNA polymerase chromosome 5 L000004119 5 51539 48471 C 1996-07-31 1996-07-31 DNA Polymerase phi; has sequence similarity to the human MybBP1A and weak sequence similarity to B-type DNA polymerases, not required for chromosomal DNA replication; required for the synthesis of rRNA -S000032784 CDS YEL055C 5 51539 48471 C 1996-07-31 1996-07-31 -S000081374 snoRNA_gene snR80 SNR80 chromosome 5 5 52320 52150 C 2005-11-29 2005-11-29 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U776 and small subunit (SSU) rRNA at position U759 -S000113618 noncoding_exon snR80 5 52320 52150 C 2005-11-29 2005-11-29 -S000028744 ORF Dubious YEL053W-A chromosome 5 5 52908 53255 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene RPL12A/YEL054C -S000033414 CDS YEL053W-A 5 52908 53255 W 2003-07-29 2003-07-29 -S000000780 ORF Verified YEL054C RPL12A uL11|ribosomal 60S subunit protein L12A|L11|YL23|L15A|L12A chromosome 5 L000001712 5 53218 52721 C 1996-07-31 1996-07-31 Ribosomal 60S subunit protein L12A; rpl12a rpl12b double mutant exhibits slow growth and slow translation; homologous to mammalian ribosomal protein L12 and bacterial L11; RPL12A has a paralog, RPL12B, that arose from the whole genome duplication -S000032694 CDS YEL054C 5 53218 52721 C 1996-07-31 1996-07-31 -S000000779 ORF Verified YEL053C MAK10 NAA35 chromosome 5 L000000983 5 56102 53901 C -43 1996-07-31 1996-07-31 Non-catalytic subunit of the NatC N-terminal acetyltransferase; required for replication of dsRNA virus; expression is glucose-repressible; human NatC ortholog, Naa35, requires co-expression of the human catalytic subunit, Naa30, to functionally complement the null allele -S000032563 CDS YEL053C 5 56102 53901 C 1996-07-31 1996-07-31 -S000000778 ORF Verified YEL052W AFG1 chromosome 5 L000000055 5 56571 58100 W 1996-07-31 1996-07-31 Protein that may act as a chaperone for cytochrome c oxidase subunits; conserved protein; may act as a chaperone in the degradation of misfolded or unassembled cytochrome c oxidase subunits; localized to matrix face of the mitochondrial inner membrane; member of the AAA family but lacks a protease domain -S000031642 CDS YEL052W 5 56571 58100 W 1996-07-31 1996-07-31 -S000000777 ORF Verified YEL051W VMA8 H(+)-transporting V1 sector ATPase subunit D chromosome 5 L000002463 5 58378 59148 W 1996-07-31 1996-07-31 Subunit D of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; plays a role in the coupling of proton transport and ATP hydrolysis; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits -S000031545 CDS YEL051W 5 58378 59148 W 1996-07-31 1996-07-31 -S000077380 ARS ARS507 ARSV-59 chromosome 5 5 59338 59477 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000178082 ARS_consensus_sequence ARS507 5 59470 59454 C 2014-11-18 2014-11-18 -S000028545 ORF Dubious YEL050W-A chromosome 5 5 59549 59740 W 2003-07-29 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR -S000031195 CDS YEL050W-A 5 59549 59740 W 2003-07-29 2003-07-29 -S000000776 ORF Verified YEL050C RML2 mitochondrial 54S ribosomal protein RML2 chromosome 5 L000004131 5 60851 59670 C 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the large subunit (L2); has similarity to E. coli L2 ribosomal protein; mutant allele (fat21) causes inability to utilize oleate, and induce oleic acid oxidation; may interfere with activity of the Adr1p transcription factor -S000031449 CDS YEL050C 5 60851 59670 C 1996-07-31 1996-07-31 -S000006458 snoRNA_gene snR67 SNR67 chromosome 5 L000004536 5 61352 61433 W 2000-05-19 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions G2619 and U2724 -S000030853 noncoding_exon snR67 5 61352 61433 W 2000-05-19 2000-05-19 -S000006444 snoRNA_gene snR53 SNR53 chromosome 5 L000004522 5 61699 61789 W 2000-05-19 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A796 -S000030737 noncoding_exon snR53 5 61699 61789 W 2000-05-19 2000-05-19 -S000006578 tRNA_gene tG(GCC)E chromosome 5 L000003808 5 61960 61890 C 2000-05-19 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000037897 noncoding_exon tG(GCC)E 5 61960 61890 C 2000-05-19 2000-05-19 -S000006889 long_terminal_repeat YELWdelta1 chromosome 5 5 62081 62756 W 2000-05-19 2000-05-19 Ty1 LTR -S000006890 long_terminal_repeat YELWdelta2 chromosome 5 5 62142 62474 W 2000-05-19 2000-05-19 Ty1 LTR -S000000775 ORF Verified YEL049W PAU2 seripauperin PAU2 chromosome 5 L000002738 5 63728 64090 W 1996-07-31 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric region; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme -S000030708 CDS YEL049W 5 63728 64090 W 1996-07-31 1996-07-31 -S000000774 ORF Verified YEL048C TCA17 chromosome 5 5 65167 64709 C 1996-07-31 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic; promotes association of TRAPPII-specific subunits with the TRAPP core complex; sedlin related; human Sedlin mutations cause SEDT, a skeletal disorder -S000030547 CDS YEL048C 5 65167 64709 C 1996-07-31 1996-07-31 -S000000773 ORF Verified YEL047C FRD1 fumarate reductase|FRDS1 chromosome 5 5 66797 65385 C 1996-07-31 1996-07-31 Soluble fumarate reductase; required with isoenzyme Osm1p for anaerobic growth; may interact with ribosomes, based on co-purification experiments; authentic, non-tagged protein is detected in purified mitochondria in high-throughput studies; similar to Arxula adeninovorans fumarate reductase; protein abundance increases in response to DNA replication stress; FRD1 has a paralog, OSM1, that arose from the whole genome duplication -S000030396 CDS YEL047C 5 66797 65385 C 1996-07-31 1996-07-31 -S000000772 ORF Verified YEL046C GLY1 threonine aldolase GLY1 chromosome 5 L000000718 5 68792 67629 C 1996-07-31 1996-07-31 Threonine aldolase; catalyzes the cleavage of L-allo-threonine and L-threonine to glycine; involved in glycine biosynthesis -S000037630 CDS YEL046C 5 68792 67629 C 1996-07-31 1996-07-31 -S000000771 ORF Dubious YEL045C chromosome 5 5 69265 68840 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion gives MMS sensitivity, growth defect under alkaline conditions, less than optimal growth upon citric acid stress -S000037503 CDS YEL045C 5 69265 68840 C 1996-07-31 1996-07-31 -S000000770 ORF Verified YEL044W IES6 chromosome 5 5 69757 70257 W 1996-07-31 1996-07-31 Component of the INO80 chromatin remodeling complex; critical for INO80 function; involved in regulation of chromosome segregation and maintenance of normal centromeric chromatin structure; human ortholog INO80C is a member of the human INO80 complex; implicated in DNA repair based on genetic interactions with RAD52 epistasis genes -S000037449 CDS YEL044W 5 69757 70257 W 1996-07-31 1996-07-31 -S000000769 ORF Verified YEL043W chromosome 5 5 70478 73348 W 1996-07-31 1996-07-31 Predicted cytoskeleton protein involved in intracellular signaling; based on quantitative analysis of protein-protein interaction maps; may interact with ribosomes, based on co-purification studies; contains fibronectin type III domain fold -S000036714 CDS YEL043W 5 70478 73348 W 1996-07-31 1996-07-31 -S000000768 ORF Verified YEL042W GDA1 guanosine diphosphatase chromosome 5 L000000695 5 73771 75327 W 1996-07-31 1996-07-31 Guanosine diphosphatase located in the Golgi; involved in the transport of GDP-mannose into the Golgi lumen, converting GDP to GMP after mannose is transferred to substrates; null mutants are defective in sporulation and pre-meiotic S phase entry; orthologous to human ENTPD6, a meiosis-associated non-obstructive azoospermia (NOA) related gene identified in GWAS studies -S000036632 CDS YEL042W 5 73771 75327 W 1996-07-31 1996-07-31 -S000000767 ORF Verified YEL041W YEF1 NADH/NAD(+) kinase chromosome 5 5 75944 77431 W 1996-07-31 1996-07-31 ATP-NADH kinase; phosphorylates both NAD and NADH; homooctameric structure consisting of 60-kDa subunits; similar to Pos5p; overexpression complements certain pos5 phenotypes; YEF1 has a paralog, UTR1, that arose from the whole genome duplication -S000036511 CDS YEL041W 5 75944 77431 W 1996-07-31 1996-07-31 -S000000766 ORF Verified YEL040W UTR2 CRH2 chromosome 5 L000002448 5 78053 79456 W 1996-07-31 1996-07-31 Chitin transglycosylase; functions in the transfer of chitin to beta(1-6) and beta(1-3) glucans in the cell wall; similar to and functionally redundant with Crh1; glycosylphosphatidylinositol (GPI)-anchored protein localized to bud neck -S000036453 CDS YEL040W 5 78053 79456 W 1996-07-31 1996-07-31 -S000000765 ORF Verified YEL039C CYC7 cytochrome c isoform 2 chromosome 5 L000000451 5 79977 79636 C -27 1996-07-31 1996-07-31 Cytochrome c isoform 2, expressed under hypoxic conditions; also known as iso-2-cytochrome c; electron carrier of the mitochondrial intermembrane space that transfers electrons from ubiquinone-cytochrome c oxidoreductase to cytochrome c oxidase during cellular respiration; protein abundance increases in response to DNA replication stress; CYC7 has a paralog, CYC1, that arose from the whole genome duplication -S000035665 CDS YEL039C 5 79977 79636 C 1996-07-31 1996-07-31 -S000000764 ORF Verified YEL038W UTR4 putative acireductone synthase UTR4 chromosome 5 L000002449 5 80462 81145 W 2006-05-09 1996-07-31|2006-05-09 Protein with sequence similarity to acireductone synthases; involved in methionine salvage; found in both the cytoplasm and nucleus -S000035624 CDS YEL038W 5 80462 81145 W 2006-05-09 1996-07-31|2006-05-09 -S000000763 ORF Verified YEL037C RAD23 chromosome 5 L000001568 5 82603 81407 C -26 1996-07-31 1996-07-31 Protein with ubiquitin-like N terminus; subunit of Nuclear Excision Repair Factor 2 (NEF2) with Rad4p that binds damaged DNA; enhances protein deglycosylation activity of Png1p; also involved, with Rad4p, in ubiquitylated protein turnover; Rad4p-Rad23p heterodimer binds to promoters of DNA damage response genes to repress their transcription in the absence of DNA damage -S000035488 CDS YEL037C 5 82603 81407 C 1996-07-31 1996-07-31 -S000000762 ORF Verified YEL036C ANP1 MNN8|GEM3 chromosome 5 L000000089 5 84552 83050 C -26 1996-07-31 1996-07-31 Subunit of the alpha-1,6 mannosyltransferase complex; type II membrane protein; has a role in retention of glycosyltransferases in the Golgi; involved in osmotic sensitivity and resistance to aminonitrophenyl propanediol -S000034468 CDS YEL036C 5 84552 83050 C 1996-07-31 1996-07-31 -S000000761 ORF Uncharacterized YEL035C UTR5 chromosome 5 L000002450 5 85545 85045 C 1996-07-31 1996-07-31 Protein of unknown function; transcription may be regulated by Gcr1p; essential for growth under standard (aerobic) conditions but not under anaerobic conditions -S000034388 CDS YEL035C 5 85545 85045 C 1996-07-31 1996-07-31 -S000000760 ORF Verified YEL034W HYP2 translation elongation factor eIF-5A|eIF-5A|eIF5A|TIF51A chromosome 5 L000000847|L000002307 5 85676 86149 W 1996-07-31 1996-07-31 Translation elongation factor eIF-5A; required for translation of proteins containing polyproline stretches, including Bni1p, and this leads to a requirement for mating projection formation; structural homolog of bacterial EF-P; undergoes an essential hypusination modification; HYP2 has a paralog, ANB1, that arose from the whole genome duplication; human EIF5A complements the inviability of the yeast hyp2 anb1 double null mutant -S000034356 CDS YEL034W 5 85676 86149 W 1996-07-31 1996-07-31 -S000000759 ORF Uncharacterized YEL033W MTC7 chromosome 5 5 86179 86598 W 1996-07-31 1996-07-31 Protein of unknown function; predicted metabolic role based on network analysis derived from ChIP experiments, a large-scale deletion study and localization of transcription factor binding sites; null mutant is sensitive to temperature oscillation in a cdc13-1 mutant -S000033441 CDS YEL033W 5 86179 86598 W 1996-07-31 1996-07-31 -S000028743 ORF Dubious YEL034C-A chromosome 5 5 86215 85613 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps HYP2/YEL034W, a verified gene that encodes eiF-5A -S000033413 CDS YEL034C-A 5 86215 85613 C 2003-07-29 2003-07-29 -S000006724 tRNA_gene tS(AGA)E chromosome 5 L000003789 5 86604 86685 W 2000-05-19 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032362 noncoding_exon tS(AGA)E 5 86604 86685 W 2000-05-19 2000-05-19 -S000000758 ORF Verified YEL032W MCM3 MCM DNA helicase complex subunit MCM3 chromosome 5 L000001039 5 86937 89852 W -24 1996-07-31 1996-07-31 Protein involved in DNA replication; component of the Mcm2-7 hexameric helicase complex that binds chromatin as a part of the pre-replicative complex -S000033351 CDS YEL032W 5 86937 89852 W 1996-07-31 1996-07-31 -S000028620 ORF Dubious YEL032C-A chromosome 5 5 87201 87040 C 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031469 CDS YEL032C-A 5 87201 87040 C 2003-07-29 2003-07-29 -S000000757 ORF Verified YEL031W SPF1 ion-transporting P-type ATPase SPF1|PER9|PIO1|COD1 chromosome 5 L000003454 5 90258 93905 W 1996-07-31 1996-07-31 P-type ATPase, ion transporter of the ER membrane; required to maintain normal lipid composition of intracellular compartments and proper targeting of mitochondrial outer membrane tail-anchored proteins; involved in ER function and Ca2+ homeostasis; required for regulating Hmg2p degradation; confers sensitivity to a killer toxin (SMKT) produced by Pichia farinosa KK1 -S000033284 CDS YEL031W 5 90258 93905 W 1996-07-31 1996-07-31 -S000077381 ARS ARS508 ARSV-94 chromosome 5 5 93978 94218 2006-09-07 2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000178083 ARS_consensus_sequence ARS508 5 94055 94071 W 2014-11-18 2014-11-18 -S000000756 ORF Verified YEL030W ECM10 Hsp70 family ATPase ECM10|SSC3 chromosome 5 L000003885 5 94644 96578 W 1996-07-31 1996-07-31 Heat shock protein of the Hsp70 family; localized in mitochondrial nucleoids, plays a role in protein translocation, interacts with Mge1p in an ATP-dependent manner; overexpression induces extensive mitochondrial DNA aggregations; ECM10 has a paralog, SSC1, that arose from the whole genome duplication -S000033225 CDS YEL030W 5 94644 96578 W 1996-07-31 1996-07-31 -S000028619 ORF Dubious YEL030C-A chromosome 5 5 94897 94583 C 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031462 CDS YEL030C-A 5 94897 94583 C 2003-07-29 2003-07-29 -S000000755 ORF Verified YEL029C BUD16 putative pyridoxal kinase BUD16 chromosome 5 5 97796 96858 C 1996-07-31 1996-07-31 Putative pyridoxal kinase; a key enzyme involved in pyridoxal 5'-phosphate synthesis, the active form of vitamin B6; required for genome integrity; involved in bud-site selection; similarity to yeast BUD17 and human pyridoxal kinase (PDXK) -S000032366 CDS YEL029C 5 97796 96858 C 1996-07-31 1996-07-31 -S000000754 ORF Uncharacterized YEL028W chromosome 5 5 98668 99129 W 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YEL028C is not an essential gene -S000031432 CDS YEL028W 5 98668 99129 W 1996-07-31 1996-07-31 -S000006886 long_terminal_repeat YELCdelta3 chromosome 5 5 99664 99490 C 2000-05-19 2000-05-19 Ty1 LTR -S000006660 tRNA_gene tM(CAU)E IMT4 chromosome 5 L000003790 5 100133 100204 W 2000-05-19 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation -S000034533 noncoding_exon tM(CAU)E 5 100133 100204 W 2000-05-19 2000-05-19 -S000000753 ORF Verified YEL027W VMA3 H(+)-transporting V0 sector ATPase subunit c|CUP5|GEF2|CLS7 chromosome 5 L000000441 5 100769 101251 W -18 1996-07-31 1996-07-31 Proteolipid subunit c of the V0 domain of vacuolar H(+)-ATPase; dicyclohexylcarbodiimide binding subunit; required for vacuolar acidification and important for copper and iron metal ion homeostasis -S000031319 CDS YEL027W 5 100769 101251 W 1996-07-31 1996-07-31 -S000000752 ORF Verified YEL026W SNU13 RNA binding protein SNU13 chromosome 5 5 101943 102323 W 1996-07-31 1996-07-31 RNA binding protein; part of U3 snoRNP involved in rRNA processing, part of U4/U6-U5 tri-snRNP involved in mRNA splicing, similar to human 15.5K protein -S000031209 CDS YEL026W 5 101943 102323 W 1996-07-31 1996-07-31 -S000000751 ORF Uncharacterized YEL025C SRI1 chromosome 5 5 106147 102581 C 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000030133 CDS YEL025C 5 106147 102581 C 1996-07-31 1996-07-31 -S000000750 ORF Verified YEL024W RIP1 ubiquinol--cytochrome-c reductase catalytic subunit RIP1 chromosome 5 L000001643 5 107260 107907 W 1996-07-31 1996-07-31 Ubiquinol-cytochrome-c reductase; a Rieske iron-sulfur protein of the mitochondrial cytochrome bc1 complex; transfers electrons from ubiquinol to cytochrome c1 during respiration; during import, Rip1p is first imported into the mitochondrial matrix where it is processed, acquires its Fe-S cluster, and is folded, then is translocated into the inner membrane by the action of a homo-oligomer of Bcs1p, and finally is delivered by Bcs1p to Complex III for assembly -S000030065 CDS YEL024W 5 107260 107907 W 1996-07-31 1996-07-31 -S000000749 ORF Uncharacterized YEL023C chromosome 5 5 110552 108504 C 1996-07-31 1996-07-31 Putative protein of unknown function; expression is increased greatly during sporulation; YEL023C is not an essential gene -S000029902 CDS YEL023C 5 110552 108504 C 1996-07-31 1996-07-31 -S000000748 ORF Verified YEL022W GEA2 Arf family guanine nucleotide exchange factor GEA2 chromosome 5 L000004717 5 111421 115800 W 1996-07-31 1996-07-31 Guanine nucleotide exchange factor for ADP ribosylation factors (ARFs); involved in vesicular transport between the Golgi and ER, Golgi organization, and actin cytoskeleton organization; GEA2 has a paralog, GEA1, that arose from the whole genome duplication -S000037316 CDS YEL022W 5 111421 115800 W 1996-07-31 1996-07-31 -S000000747 ORF Verified YEL021W URA3 orotidine-5'-phosphate decarboxylase chromosome 5 L000002432 5 116167 116970 W -7 1996-07-31 1996-07-31 Orotidine-5'-phosphate (OMP) decarboxylase; catalyzes the sixth enzymatic step in the de novo biosynthesis of pyrimidines, converting OMP into uridine monophosphate (UMP); converts 5-FOA into 5-fluorouracil, a toxic compound -S000037201 CDS YEL021W 5 116167 116970 W 1996-07-31 1996-07-31 -S000007256 ORF Verified YEL020W-A TIM9 protein transporter TIM9 chromosome 5 L000004718 5 117211 117474 W 1999-07-17 1999-07-17 Essential protein of the mitochondrial intermembrane space; forms a complex with Tim10p (TIM10 complex) that delivers hydrophobic proteins to the TIM22 complex for insertion into the inner membrane -S000034788 CDS YEL020W-A 5 117211 117474 W 1999-07-17 1999-07-17 -S000028544 ORF Dubious YEL020C-B chromosome 5 5 117380 117183 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene YEL020W-A; identified by fungal homology and RT-PCR -S000031194 CDS YEL020C-B 5 117380 117183 C 2003-07-29 2003-07-29 -S000006490 ncRNA_gene RPR1 RPR1 chromosome 5 L000001748 5 118035 117667 C -6 2000-05-19 2000-05-19 RNA component of nuclear RNase P; nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; may be responsible for recognition of substrate tRNAs -S000032263 noncoding_exon RPR1 5 118035 117667 C 2000-05-19 2000-05-19 -S000006888 long_terminal_repeat YELCtau1 chromosome 5 5 118551 118230 C 2000-05-19 2000-05-19 Ty4 LTR -S000000746 ORF Verified YEL020C PXP1 putative indolepyruvate decarboxylase family protein chromosome 5 5 120299 118617 C 1996-07-31 1996-07-31 Peroxisomal matrix protein; well-conserved in fungi; contains tripartite homology domain of thiamine pyrophosphate (TPP) enzymes; targeted to peroxisomes by Pex5p; contains low sequence identity with Pdc1p; mRNA identified as translated by ribosome profiling data -S000037043 CDS YEL020C 5 120299 118617 C 1996-07-31 1996-07-31 -S000000745 ORF Verified YEL019C MMS21 SUMO ligase MMS21|PSO10|NSE2 chromosome 5 L000001125 5 121301 120498 C 1996-07-31 1996-07-31 Highly conserved SUMO E3 ligase subunit of SMC5-SMC6 complex; required for anchoring dsDNA breaks to the nuclear periphery; SMC5-SMC6 plays a key role in removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; required for efficient sister chromatid cohesion; mutants are sensitive to MMS, show increased spontaneous mutation and mitotic recombination; SUMOylates and inhibits Snf1p function; supports nucleolar function -S000035285 CDS YEL019C 5 121301 120498 C 1996-07-31 1996-07-31 -S000000744 ORF Verified YEL018W EAF5 chromosome 5 5 121471 122310 W 1996-07-31 1996-07-31 Non-essential subunit of the NuA4 acetyltransferase complex; Esa1p-associated factor; relocalizes to the cytosol in response to hypoxia -S000035234 CDS YEL018W 5 121471 122310 W 1996-07-31 1996-07-31 -S000028742 ORF Dubious YEL018C-A chromosome 5 5 121988 121455 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF EAF5/YEL018W -S000033412 CDS YEL018C-A 5 121988 121455 C 2003-07-29 2003-07-29 -S000002103 ORF Verified YEL017C-A PMP2 proteolipid ATPase chromosome 5 L000001454 5 122929 122798 C 1996-07-31 1996-07-31 Proteolipid associated with plasma membrane H(+)-ATPase (Pma1p); regulates plasma membrane H(+)-ATPase activity; protein abundance increases in response to DNA replication stress; PMP2 has a paralog, PMP1, that arose from the whole genome duplication -S000035297 CDS YEL017C-A 5 122929 122798 C 1996-07-31 1996-07-31 -S000000743 ORF Verified YEL017W GTT3 chromosome 5 5 123657 124670 W 1996-07-31 1996-07-31 Protein of unknown function may be involved in glutathione metabolism; function suggested by computational analysis of large-scale protein-protein interaction data; N- and C-terminal fusion proteins localize to the cell periphery -S000035057 CDS YEL017W 5 123657 124670 W 1996-07-31 1996-07-31 -S000000742 ORF Verified YEL016C NPP2 nucleotide diphosphatase/phosphodiesterase NPP2 chromosome 5 5 126218 124737 C 1996-07-31 1996-07-31 Nucleotide pyrophosphatase/phosphodiesterase; mediates extracellular nucleotide phosphate hydrolysis along with Npp1p and Pho5p; activity and expression enhanced during conditions of phosphate starvation; involved in spore wall assembly; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; NPP2 has a paralog, NPP1, that arose from the whole genome duplication; npp1 npp2 double mutant exhibits reduced dityrosine fluorescence relative to single mutants -S000034054 CDS YEL016C 5 126218 124737 C 1996-07-31 1996-07-31 -S000000741 ORF Verified YEL015W EDC3 LSM16|DCP3 chromosome 5 5 126629 128284 W 1996-07-31 1996-07-31 Non-essential conserved protein with a role in mRNA decapping; specifically affects the function of the decapping enzyme Dcp1p; mediates decay of the RPS28B mRNA via binding to both Rps28Bp (or Rps28Ap) and the RPS28B mRNA; mediates decay of the YRA1 mRNA by a different, translation-independent mechanism; localizes to cytoplasmic mRNA processing bodies; forms cytoplasmic foci upon DNA replication stress -S000034021 CDS YEL015W 5 126629 128284 W 1996-07-31 1996-07-31 -S000000740 ORF Dubious YEL014C chromosome 5 5 128608 128303 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033749 CDS YEL014C 5 128608 128303 C 1996-07-31 1996-07-31 -S000000739 ORF Verified YEL013W VAC8 protein anchor VAC8|YEB3 chromosome 5 L000004028 5 128825 130561 W 1996-07-31 1996-07-31 Phosphorylated and palmitoylated vacuolar membrane protein; interacts with Atg13p, required for the cytoplasm-to-vacuole targeting (Cvt) pathway; interacts with Nvj1p to form nucleus-vacuole junctions -S000033107 CDS YEL013W 5 128825 130561 W 1996-07-31 1996-07-31 -S000006697 tRNA_gene tQ(UUG)E2 chromosome 5 L000003807 5 131153 131082 C 2000-05-19 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034949 noncoding_exon tQ(UUG)E2 5 131153 131082 C 2000-05-19 2000-05-19 -S000000738 ORF Verified YEL012W UBC8 E2 ubiquitin-conjugating protein UBC8|GID3 chromosome 5 L000002410 5 131772 132551 W 2000-12-01 2000-12-01|1996-07-31 Ubiquitin-conjugating enzyme that regulates gluconeogenesis; negatively regulates gluconeogenesis by mediating the glucose-induced ubiquitination of fructose-1,6-bisphosphatase (FBPase); cytoplasmic enzyme that catalyzes the ubiquitination of histones in vitro -S000033012 CDS YEL012W 5 131772 131776 W 2000-12-01 2000-12-01 -S000033013 CDS YEL012W 5 131900 132551 W 2000-12-01 2000-12-01|1996-07-31 -S000033014 intron YEL012W 5 131777 131899 W 2000-12-01 2000-12-01 -S000000737 ORF Verified YEL011W GLC3 1,4-alpha-glucan branching enzyme|GHA1 chromosome 5 L000000705 5 133120 135234 W -2 1996-07-31 1996-07-31 Glycogen branching enzyme, involved in glycogen accumulation; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress; glycogen accumulation defect of the null mutant is functionally complemented by human GBE1, which is associated with glycogen storage disease -S000032907 CDS YEL011W 5 133120 135234 W 1996-07-31 1996-07-31 -S000006618 tRNA_gene tK(CUU)E1 chromosome 5 L000003806 5 135497 135425 C 2000-05-19 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000037790 noncoding_exon tK(CUU)E1 5 135497 135425 C 2000-05-19 2000-05-19 -S000006887 long_terminal_repeat YELCdelta4 chromosome 5 5 135939 135612 C 2000-05-19 2000-05-19 Ty1 LTR -S000000736 ORF Dubious YEL010W chromosome 5 5 136279 136629 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032835 CDS YEL010W 5 136279 136629 W 1996-07-31 1996-07-31 -S000028741 ORF Dubious YEL009C-A chromosome 5 5 136778 136371 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YEL010W -S000033411 CDS YEL009C-A 5 136778 136371 C 2003-07-29 2003-07-29 -S000006891 long_terminal_repeat YELWdelta5 chromosome 5 5 137324 137639 W 2000-05-19 2000-05-19 Ty1 LTR -S000006892 long_terminal_repeat YELWdelta6 chromosome 5 5 138221 138553 W 2000-05-19 2000-05-19 Ty1 LTR -S000006710 tRNA_gene tR(UCU)E chromosome 5 L000003791 5 138666 138737 W 2000-05-19 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000037841 noncoding_exon tR(UCU)E 5 138666 138737 W 2000-05-19 2000-05-19 -S000000735 ORF Verified YEL009C GCN4 amino acid starvation-responsive transcription factor GCN4|AAS101|ARG9|AAS3 chromosome 5 L000000683 5 139763 138918 C -3 1996-07-31 1996-07-31 bZIP transcriptional activator of amino acid biosynthetic genes; activator responds to amino acid starvation; expression is tightly regulated at both the transcriptional and translational levels -S000032641 CDS YEL009C 5 139763 138918 C 1996-07-31 1996-07-31 -S000000734 ORF Uncharacterized YEL008W chromosome 5 5 140512 140892 W 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YEL008W is not an essential gene; predicted to be involved in metabolism -S000032595 CDS YEL008W 5 140512 140892 W 1996-07-31 1996-07-31 -S000028618 ORF Dubious YEL008C-A chromosome 5 5 140818 140726 C 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031461 CDS YEL008C-A 5 140818 140726 C 2003-07-29 2003-07-29 -S000000733 ORF Verified YEL007W MIT1 TOS9 chromosome 5 5 141892 143892 W 2011-02-03 1996-07-31 Transcriptional regulator of pseudohyphal growth; protein with sequence similarity to S. pombe gti1+ (gluconate transport inducer 1) and C. albicans Wor1 -S000031610 CDS YEL007W 5 141892 143892 W 2011-02-03 1996-07-31 -S000000732 ORF Verified YEL006W YEA6 NAD+ transporter|NDT2 chromosome 5 5 144327 145334 W 2011-02-03 1996-07-31 Putative mitochondrial NAD+ transporter; member of the mitochondrial carrier subfamily (see also YIA6); has putative human ortholog; YEA6 has a paralog, YIA6, that arose from the whole genome duplication -S000031480 CDS YEL006W 5 144327 145334 W 2011-02-03 1996-07-31 -S000077382 ARS ARS510 ARSV-146 chromosome 5 5 145678 145840 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000000731 ORF Verified YEL005C VAB2 VAB31 chromosome 5 5 146755 145907 C 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Vps21p-GFP; has potential role in vacuolar function, as suggested by its ability to bind Vac8p; likely member of; Vab2p-GFP-fusion localizes to cytoplasm in punctate pattern -S000030477 CDS YEL005C 5 146755 145907 C 2011-02-03 1996-07-31 -S000000730 ORF Verified YEL004W YEA4 chromosome 5 L000004419 5 146951 147979 W 2011-02-03 1996-07-31 Uridine diphosphate-N-acetylglucosamine (UDP-GlcNAc) transporter; required for cell wall chitin synthesis; localized to the ER -S000030440 CDS YEL004W 5 146951 147979 W 2011-02-03 1996-07-31 -S000000729 ORF Verified YEL003W GIM4 tubulin-binding prefolding complex subunit GIM4|PFD2 chromosome 5 L000004368 5 148176 148599 W 2011-02-03 1996-07-31|2007-07-09 Subunit of the heterohexameric cochaperone prefoldin complex; complex binds specifically to cytosolic chaperonin and transfers target proteins to it -S000030310 CDS YEL003W 5 148176 148194 W 2011-02-03 1996-07-31|2007-07-09 -S000123269 CDS YEL003W 5 148283 148599 W 2011-02-03 2007-07-09 -S000123268 intron YEL003W 5 148195 148282 W 2011-02-03 2007-07-09 -S000000728 ORF Verified YEL002C WBP1 dolichyl-diphosphooligosaccharide-protein glycotransferase chromosome 5 L000002483 5 150014 148722 C 2011-02-03 1996-07-31 Beta subunit of the oligosaccharyl transferase glycoprotein complex; required for N-linked glycosylation of proteins in the endoplasmic reticulum; human homolog DDOST can complement yeast growth defect during down-regulation of yeast gene -S000037446 CDS YEL002C 5 150014 148722 C 2011-02-03 1996-07-31 -S000000727 ORF Verified YEL001C IRC22 chromosome 5 5 150978 150301 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion localizes to the ER; YEL001C is non-essential; null mutant displays increased levels of spontaneous Rad52p foci -S000037333 CDS YEL001C 5 150978 150301 C 2011-02-03 1996-07-31 -S000006467 centromere CEN5 CEN5 chromosome 5 L000000298 5 151987 152104 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome V centromere -S000077269 centromere_DNA_Element_I CEN5 5 151987 151996 W 2011-02-03 2004-10-04 -S000077270 centromere_DNA_Element_II CEN5 5 151997 152079 W 2011-02-03 2004-10-04 -S000077271 centromere_DNA_Element_III CEN5 5 152080 152104 W 2011-02-03 2004-10-04 -S000000803 ORF Verified YER001W MNN1 alpha-1,3-mannosyltransferase MNN1 chromosome 5 L000001126 5 153520 155808 W 0 2011-02-03 1996-07-31 Alpha-1,3-mannosyltransferase; integral membrane glycoprotein of the Golgi complex, required for addition of alpha1,3-mannose linkages to N-linked and O-linked oligosaccharides, one of five S. cerevisiae proteins of the MNN1 family -S000033040 CDS YER001W 5 153520 155808 W 2011-02-03 1996-07-31 -S000000804 ORF Verified YER002W NOP16 chromosome 5 5 156803 157498 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; involved in 60S ribosomal subunit biogenesis -S000033709 CDS YER002W 5 156803 157498 W 2011-02-03 1996-07-31 -S000000805 ORF Verified YER003C PMI40 mannose-6-phosphate isomerase PMI40|PMI chromosome 5 L000001452 5 159118 157736 C 2011-02-03 1996-07-31 Mannose-6-phosphate isomerase; catalyzes the interconversion of fructose-6-P and mannose-6-P; required for early steps in protein mannosylation -S000033753 CDS YER003C 5 158994 157736 C 2011-02-03 1996-07-31 -S000033752 CDS YER003C 5 159118 159088 C 2011-02-03 1996-07-31 -S000033754 intron YER003C 5 159087 158995 C 2011-02-03 1996-07-31 -S000000806 ORF Verified YER004W FMP52 chromosome 5 5 159580 160275 W 2011-02-03 1996-07-31 Protein of unknown function; localized to the mitochondrial outer membrane; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000033918 CDS YER004W 5 159580 160275 W 2011-02-03 1996-07-31 -S000000807 ORF Verified YER005W YND1 apyrase|YEJ5|APY1 chromosome 5 S000007428 5 160550 162442 W 2011-02-03 1996-07-31 Apyrase with wide substrate specificity; helps prevent inhibition of glycosylation by hydrolyzing nucleoside tri- and diphosphates that inhibit glycotransferases; partially redundant with Gda1p; mediates adenovirus E4orf4-induced toxicity -S000034049 CDS YER005W 5 160550 162442 W 2011-02-03 1996-07-31 -S000000808 ORF Verified YER006W NUG1 RNA-binding GTPase NUG1 chromosome 5 5 162723 164285 W 2011-02-03 1996-07-31 GTPase that associates with nuclear 60S pre-ribosomes; required for export of 60S ribosomal subunits from the nucleus -S000034937 CDS YER006W 5 162723 164285 W 2011-02-03 1996-07-31 -S000000809 ORF Verified YER007W PAC2 chromosome 5 L000001329 5 164527 166083 W 2011-02-03 1996-07-31 Microtubule effector required for tubulin heterodimer formation; binds alpha-tubulin, required for normal microtubule function, null mutant exhibits cold-sensitive microtubules and sensitivity to benomyl -S000035125 CDS YER007W 5 164527 166083 W 2011-02-03 1996-07-31 -S000028745 ORF Dubious YER006C-A chromosome 5 5 164661 164344 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF PAC2/YER007W -S000033415 CDS YER006C-A 5 164661 164344 C 2011-02-03 2003-07-29 -S000002957 ORF Verified YER007C-A TMA20 RBF20 chromosome 5 5 166885 166237 C 2011-02-03 1996-07-31 Protein of unknown function that associates with ribosomes; has a putative RNA binding domain; interacts with Tma22p; null mutant exhibits translation defects; has homology to human oncogene MCT-1; protein abundance increases in response to DNA replication stress -S000032950 CDS YER007C-A 5 166771 166237 C 2011-02-03 1996-07-31 -S000032949 CDS YER007C-A 5 166885 166875 C 2011-02-03 1996-07-31 -S000032951 intron YER007C-A 5 166874 166772 C 2011-02-03 1996-07-31 -S000006499 snRNA_gene snR14 SNR14 U4 chromosome 5 L000001965 5 167586 167427 C 2011-02-03 2000-05-19 U4 spliceosomal RNA (U4 snRNA); interacts with U6 -S000036593 noncoding_exon snR14 5 167586 167427 C 2011-02-03 2000-05-19 -S000000810 ORF Verified YER008C SEC3 GTP-Rho binding exocyst subunit SEC3|PSL1 chromosome 5 L000001829|L000001520 5 171818 167808 C 3 2011-02-03 1996-07-31 Subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to sites of exocytosis prior to SNARE-mediated fusion; PtdIns[4,5]P2-binding protein that localizes to exocytic sites in a Rho1p-dependent, actin-independent manner, targeting and anchoring the exocyst to the plasma membrane with Exo70p; direct GTP Rho1p effector; required for ER inheritance; relocalizes away from bud neck upon DNA replication stress -S000035220 CDS YER008C 5 171818 167808 C 2011-02-03 1996-07-31 -S000000811 ORF Verified YER009W NTF2 Ran GTPase-binding protein NTF2 chromosome 5 L000002863 5 172115 172492 W 2011-02-03 1996-07-31 Nuclear envelope protein; interacts with GDP-bound Gsp1p and with proteins of the nuclear pore to transport Gsp1p into the nucleus where it is an essential player in nucleocytoplasmic transport -S000036204 CDS YER009W 5 172115 172492 W 2011-02-03 1996-07-31 -S000000812 ORF Verified YER010C bifunctional 4-hydroxy-4-methyl-2-oxoglutarate aldolase/oxaloacetate decarboxylase chromosome 5 5 173338 172634 C 2011-02-03 1996-07-31 Bifunctional HMG aldolase/oxaloacetate decarboxylase; requires divalent metal ions for activity; competitively inhibited by oxalate; forms a ring-shaped homotrimer; similar to members of the prokaryotic RraA family of class II (divalent metal ion dependent) pyruvate aldolases from the meta cleavage pathways of protocatechuate and gallate -S000036925 CDS YER010C 5 173338 172634 C 2011-02-03 1996-07-31 -S000077383 ARS ARS511 ARSV-174 chromosome 5 5 173700 173864 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000178084 ARS_consensus_sequence ARS511 5 173808 173792 C 2014-11-18 2014-11-18 -S000000813 ORF Verified YER011W TIR1 GPI-anchored mannoprotein|SRP1 chromosome 5 L000002059 5 175248 176012 W 2011-02-03 1996-07-31 Cell wall mannoprotein; expression is downregulated at acidic pH and induced by cold shock and anaerobiosis; abundance is increased in cells cultured without shaking; member of the Srp1p/Tip1p family of serine-alanine-rich proteins -S000037042 CDS YER011W 5 175248 176012 W 2011-02-03 1996-07-31 -S000006912 long_terminal_repeat YERWdelta7 chromosome 5 5 176705 176856 W 2011-02-03 2000-05-19 Ty1 LTR -S000006550 tRNA_gene tE(UUC)E1 chromosome 5 L000003792 5 177099 177170 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin -S000034436 noncoding_exon tE(UUC)E1 5 177099 177170 W 2011-02-03 2000-05-19 -S000000814 ORF Verified YER012W PRE1 proteasome core particle subunit beta 4 chromosome 5 L000001483 5 177835 178431 W 2011-02-03 1996-07-31 Beta 4 subunit of the 20S proteasome; localizes to the nucleus throughout the cell cycle -S000037113 CDS YER012W 5 177835 178431 W 2011-02-03 1996-07-31 -S000000815 ORF Verified YER013W PRP22 DEAH-box ATP-dependent RNA helicase PRP22 chromosome 5 L000001508 5 178841 182278 W 2011-02-03 1996-07-31 DEAH-box RNA-dependent ATPase/ATP-dependent RNA helicase; associates with lariat intermediates before the second catalytic step of splicing; mediates ATP-dependent mRNA release from the spliceosome and unwinds RNA duplexes; required for proofreading the exon ligation reaction -S000037868 CDS YER013W 5 178841 182278 W 2011-02-03 1996-07-31 -S000000816 ORF Verified YER014W HEM14 oxygen-dependent protoporphyrinogen oxidase chromosome 5 L000003353 5 182600 184219 W 2011-02-03 1996-07-31 Protoporphyrinogen oxidase; a mitochondrial enzyme that catalyzes the seventh step in the heme biosynthetic pathway, converting protoporphyrinogen IX to protoporphyrin IX; inhibited by diphenyl ether-type herbicides -S000029903 CDS YER014W 5 182600 184219 W 2011-02-03 1996-07-31 -S000000817 ORF Verified YER015W FAA2 medium-chain fatty acid-CoA ligase FAA2|FAM1 chromosome 5 L000000595|L000000599 5 184541 186775 W 2011-02-03 1996-07-31 Medium chain fatty acyl-CoA synthetase; activates imported fatty acids; accepts a wide range of fatty acid chain lengths with a preference for medium chains, C9:0-C13:0; localized to the peroxisome; comparative analysis suggests that a mitochondrially targeted form may result from translation starting at a non-canonical codon upstream of the annotated start codon -S000030015 CDS YER015W 5 184541 186775 W 2011-02-03 1996-07-31 -S000007590 ORF Verified YER014C-A BUD25 chromosome 5 5 184700 183731 C 2011-02-03 2001-02-14 Protein involved in bud-site selection; diploid mutants display a random budding pattern instead of the wild-type bipolar pattern -S000037101 CDS YER014C-A 5 184169 183731 C 2011-02-03 2001-02-14 -S000037100 CDS YER014C-A 5 184700 184678 C 2011-02-03 2001-02-14 -S000037102 intron YER014C-A 5 184677 184170 C 2011-02-03 2001-02-14 -S000000818 ORF Verified YER016W BIM1 microtubule-binding protein BIM1|EB1|YEB1 chromosome 5 L000003272 5 188277 189311 W 2011-02-03 1996-07-31 Microtubule plus end-tracking protein; together with Kar9p makes up the cortical microtubule capture site and delays the exit from mitosis when the spindle is oriented abnormally; homolog of human end binding protein 1 (EB1) -S000031017 CDS YER016W 5 188277 189311 W 2011-02-03 1996-07-31 -S000000819 ORF Verified YER017C AFG3 AAA family ATPase AFG3|YTA10 chromosome 5 L000002562|L000000057 5 191788 189503 C 2011-02-03 1996-07-31 Mitochondrial inner membrane m-AAA protease component; mediates degradation of misfolded or unassembled proteins; also required for correct assembly of mitochondrial enzyme complexes; involved in cytoplasmic mRNA translation and aging; expression of human homolog AFG3L2 can complement yeast yta12 afg3 double mutant -S000031051 CDS YER017C 5 191788 189503 C 2011-02-03 1996-07-31 -S000000820 ORF Verified YER018C SPC25 kinetochore-associated Ndc80 complex subunit SPC25 chromosome 5 L000004695 5 192624 191959 C 2011-02-03 1996-07-31 Component of the kinetochore-associated Ndc80 complex; involved in chromosome segregation, spindle checkpoint activity, and kinetochore clustering; evolutionarily conserved; other members include Ndc80p, Nuf2p, Spc24p, and Spc25p -S000031164 CDS YER018C 5 192624 191959 C 2011-02-03 1996-07-31 -S000000821 ORF Verified YER019W ISC1 inositol phosphosphingolipid phospholipase chromosome 5 5 192797 194230 W 2011-02-03 1996-07-31 Inositol phosphosphingolipid phospholipase C; mitochondrial membrane localized; hydrolyzes complex sphingolipids to produce ceramide; activates genes required for non-fermentable carbon source metabolism during diauxic shift; activated by phosphatidylserine, cardiolipin, and phosphatidylglycerol; mediates Na+ and Li+ halotolerance; ortholog of mammalian neutral sphingomyelinase type 2 -S000032239 CDS YER019W 5 192797 194230 W 2011-02-03 1996-07-31 -S000002127 ORF Verified YER019C-A SBH2 Arf family guanine nucleotide exchange factor SBH2|SEB2 chromosome 5 L000002847|L000004138 5 194539 194273 C 2011-02-03 1996-07-31 Ssh1p-Sss1p-Sbh2p complex component; involved in protein translocation into the endoplasmic reticulum; SBH2 has a paralog, SBH1, that arose from the whole genome duplication -S000032656 CDS YER019C-A 5 194539 194273 C 2011-02-03 1996-07-31 -S000000822 ORF Verified YER020W GPA2 guanine nucleotide-binding protein subunit alpha|SSP101 chromosome 5 L000000721 5 195168 196517 W 10 2011-02-03 1996-07-31 Nucleotide binding alpha subunit of the heterotrimeric G protein; interacts with the receptor Gpr1p, has signaling role in response to nutrients; required for the recruitment of Ras-GTP at the plasma membrane and in the nucleus -S000032231 CDS YER020W 5 195168 196517 W 2011-02-03 1996-07-31 -S000000823 ORF Verified YER021W RPN3 proteasome regulatory particle lid subunit RPN3|SUN2 chromosome 5 L000003109 5 196948 198519 W 2011-02-03 1996-07-31 Essential non-ATPase regulatory subunit of the 26S proteasome lid; similar to the p58 subunit of the human 26S proteasome; temperature-sensitive alleles cause metaphase arrest, suggesting a role for the proteasome in cell cycle control -S000032304 CDS YER021W 5 196948 198519 W 2011-02-03 1996-07-31 -S000000824 ORF Verified YER022W SRB4 MED17 chromosome 5 L000002051 5 198812 200875 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for basal RNA polymerase II transcription; homozygosity of the human MED17 L371P mutation is associated with infantile cerebral and cerebellar atrophy with poor myelination -S000033166 CDS YER022W 5 198812 200875 W 2011-02-03 1996-07-31 -S000000825 ORF Verified YER023W PRO3 pyrroline-5-carboxylate reductase|ORE2 chromosome 5 L000001493 5 201076 201936 W 23 2011-02-03 1996-07-31 Delta 1-pyrroline-5-carboxylate reductase; catalyzes the last step in proline biosynthesis -S000033229 CDS YER023W 5 201076 201936 W 2011-02-03 1996-07-31 -S000028622 ORF Dubious YER023C-A chromosome 5 5 201734 201522 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene PRO3; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031472 CDS YER023C-A 5 201734 201522 C 2011-02-03 2003-07-29 -S000000826 ORF Verified YER024W YAT2 carnitine O-acetyltransferase YAT2 chromosome 5 5 202192 204963 W 2011-02-03 1996-07-31 Carnitine acetyltransferase; has similarity to Yat1p, which is a carnitine acetyltransferase associated with the mitochondrial outer membrane -S000033278 CDS YER024W 5 202192 204963 W 2011-02-03 1996-07-31 -S000000827 ORF Verified YER025W GCD11 translation initiation factor eIF2 subunit gamma|SUI4 chromosome 5 L000000677 5 205251 206834 W 14 2011-02-03 1996-07-31 Gamma subunit of the translation initiation factor eIF2; involved in the identification of the start codon; binds GTP when forming the ternary complex with GTP and tRNAi-Met; mutations in human ortholog cause X-linked intellectual disability (XLID) -S000034151 CDS YER025W 5 205251 206834 W 2011-02-03 1996-07-31 -S000006593 tRNA_gene tH(GUG)E1 chromosome 5 L000003793 5 207357 207428 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000035209 noncoding_exon tH(GUG)E1 5 207357 207428 W 2011-02-03 2000-05-19 -S000000828 ORF Verified YER026C CHO1 CDP-diacylglycerol-serine O-phosphatidyltransferase|PSS1 chromosome 5 L000000327|L000001521 5 208474 207644 C 22 2011-02-03 1996-07-31 Phosphatidylserine synthase; functions in phospholipid biosynthesis; catalyzes the reaction CDP-diaclyglycerol + L-serine = CMP + L-1-phosphatidylserine, transcriptionally repressed by myo-inositol and choline -S000034205 CDS YER026C 5 208474 207644 C 2011-02-03 1996-07-31 -S000000829 ORF Verified YER027C GAL83 SPM1 chromosome 5 L000000666 5 210232 208979 C 11 2011-02-03 1996-07-31 One of three possible beta-subunits of the Snf1 kinase complex; allows nuclear localization of the Snf1 kinase complex in the presence of a nonfermentable carbon source; necessary and sufficient for phosphorylation of the Mig2p transcription factor in response to alkaline stress; functionally redundant with SIP1 and SIP2 for the phosphorylation of Mig1p in response to glucose deprivation; contains a glycogen-binding domain -S000034334 CDS YER027C 5 210232 208979 C 2011-02-03 1996-07-31 -S000000830 ORF Verified YER028C MIG3 chromosome 5 5 211876 210692 C 2011-02-03 1996-07-31 Transcriptional regulator; partially nonfunctional in S288C strains but has a major role in catabolite repression and ethanol response in some other strains; involved in response to toxic agents; phosphorylation by Snf1p or the Mec1p pathway inactivates Mig3p, allowing induction of damage response genesenvironment -S000035341 CDS YER028C 5 211876 210692 C 2011-02-03 1996-07-31 -S000077384 ARS ARS512 ARSV-212 chromosome 5 5 212383 212631 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000178085 ARS_consensus_sequence ARS512 5 212454 212470 W 2014-11-18 2014-11-18 -S000000831 ORF Verified YER029C SMB1 mRNA splicing protein SMB1|Sm B|SmB chromosome 5 L000004361 5 213177 212587 C 2011-02-03 1996-07-31 Core Sm protein Sm B; part of heteroheptameric complex (with Smd1p, Smd2p, Smd3p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm B and Sm B' -S000035476 CDS YER029C 5 213177 212587 C 2011-02-03 1996-07-31 -S000000832 ORF Verified YER030W CHZ1 chromosome 5 5 213437 213898 W 2011-02-03 1996-07-31|2005-11-29 Histone chaperone for Htz1p/H2A-H2B dimer; required for the stabilization of the Chz1p-Htz1-H2B complex; has overlapping function with Nap1p; null mutant displays weak sensitivity to MMS and benomyl; contains a highly conserved CHZ motif; protein abundance increases in response to DNA replication stress -S000036549 CDS YER030W 5 213437 213898 W 2011-02-03 1996-07-31|2005-11-29 -S000000833 ORF Verified YER031C YPT31 Rab family GTPase YPT31|YPT8 chromosome 5 L000002545 5 214747 214076 C 2011-02-03 1996-07-31 Rab family GTPase; involved in the exocytic pathway; mediates intra-Golgi traffic or the budding of post-Golgi vesicles from the trans-Golgi; YPT31 has a paralog, YPT32, that arose from the whole genome duplication; localizes to the transitional and late Golgi -S000036578 CDS YER031C 5 214747 214076 C 2011-02-03 1996-07-31 -S000000834 ORF Verified YER032W FIR1 PIP1 chromosome 5 L000003487 5 215063 217693 W 2011-02-03 2003-09-22|1996-07-31 Protein involved in 3' mRNA processing; interacts with Ref2p; APCC(Cdh1) substrate; potential Cdc28p substrate -S000037329 CDS YER032W 5 215063 217693 W 2011-02-03 2003-09-22|1996-07-31 -S000000835 ORF Verified YER033C ZRG8 chromosome 5 S000007518 5 221287 218057 C 2011-02-03 1996-07-31 Protein of unknown function; authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; GFP-fusion protein is localized to the cytoplasm; transcription induced under conditions of zinc deficiency -S000037376 CDS YER033C 5 221287 218057 C 2011-02-03 1996-07-31 -S000000836 ORF Verified YER034W chromosome 5 5 221846 222403 W 2011-02-03 1996-07-31 Protein of unknown function; non-essential gene; expression induced upon calcium shortage; protein abundance increases in response to DNA replication stress -S000030147 CDS YER034W 5 221846 222403 W 2011-02-03 1996-07-31 -S000000837 ORF Verified YER035W EDC2 chromosome 5 5 222639 223076 W 2011-02-03 1996-07-31 RNA-binding protein that directly activates mRNA decapping; binds mRNA substrate and enhances activity of decapping proteins Dcp1p and Dcp2p; has a role in translation during heat stress; protein increases in abundance and relocalizes to nucleolus and to nuclear foci upon DNA replication stress; EDC2 has a paralog, EDC1, that arose from the whole genome duplication -S000030324 CDS YER035W 5 222639 223076 W 2011-02-03 1996-07-31 -S000000838 ORF Verified YER036C ARB1 ATP-binding cassette family ATPase ARB1 chromosome 5 5 225199 223367 C 2011-02-03 1996-07-31 ATPase of the ATP-binding cassette (ABC) family; involved in 40S and 60S ribosome biogenesis, has similarity to Gcn20p; shuttles from nucleus to cytoplasm, physically interacts with Tif6p, Lsg1p; human homolog ABCF2 can complement yeast ARB1 mutant -S000030397 CDS YER036C 5 225199 223367 C 2011-02-03 1996-07-31 -S000000839 ORF Verified YER037W PHM8 bifunctional nucleotidase/lysophosphatidic acid phosphatase chromosome 5 5 225889 226854 W 2011-02-03 1996-07-31 Lysophosphatidic acid (LPA) phosphatase, nucleotidase; principle and physiological nucleotidase working on GMP, UMP and CMP; involved in LPA hydrolysis in response to phosphate starvation and ribose salvage pathway; phosphatase activity is soluble and Mg2+ dependent; expression is induced by low phosphate levels and by inactivation of Pho85p; repressed by Gcn4p under normal conditions; PHM8 has a paralog, SDT1, that arose from the whole genome duplication -S000031397 CDS YER037W 5 225889 226854 W 2011-02-03 1996-07-31 -S000000840 ORF Verified YER038C KRE29 Smc5-Smc6 complex subunit KRE29|NSE6 chromosome 5 5 228252 226858 C 2011-02-03 1996-07-31 Subunit of the SMC5-SMC6 complex; this complex is involved in removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; heterozygous mutant shows haploinsufficiency in K1 killer toxin resistance -S000031448 CDS YER038C 5 228252 226858 C 2011-02-03 1996-07-31 -S000028746 ORF Uncharacterized YER038W-A FMP49 chromosome 5 5 228451 228831 W 2011-02-03 2003-07-29 Mitochondrial protein of unknown function; almost completely overlaps ORF HVG1/YER039C -S000033416 CDS YER038W-A 5 228451 228831 W 2011-02-03 2003-07-29 -S000000841 ORF Verified YER039C HVG1 putative GDP-mannose transporter|YEM9 chromosome 5 L000003907 5 229205 228456 C 2011-02-03 1996-07-31 Protein of unknown function; HVG1 has a paralog, VRG4, that arose from the whole genome duplication -S000031567 CDS YER039C 5 229205 228456 C 2011-02-03 1996-07-31 -S000007226 ORF Uncharacterized YER039C-A chromosome 5 5 229481 229263 C 2011-02-03 1999-07-17 Putative protein of unknown function; YER039C-A is not an essential gene -S000030146 CDS YER039C-A 5 229481 229263 C 2011-02-03 1999-07-17 -S000000842 ORF Verified YER040W GLN3 nitrogen-responsive transcriptional regulator GLN3 chromosome 5 L000000710 5 229795 231987 W 38 2011-02-03 1996-07-31 Transcriptional activator of genes regulated by nitrogen catabolite repression; localization and activity regulated by quality of nitrogen source and Ure2p -S000031823 CDS YER040W 5 229795 231987 W 2011-02-03 1996-07-31 -S000000843 ORF Verified YER041W YEN1 crossover junction endodeoxyribonuclease chromosome 5 5 232461 234740 W 2011-02-03 1996-07-31|2011-02-03 Holliday junction resolvase; promotes template switching during break-induced replication (BIR), causing non-reciprocal translocations (NRTs); localization is cell-cycle dependent and regulated by Cdc28p phosphorylation; homolog of human GEN1; similar to S. cerevisiae endonuclease Rth1p -S000031953 CDS YER041W 5 232461 234740 W 2011-02-03 1996-07-31|2011-02-03 -S000000844 ORF Verified YER042W MXR1 peptide-methionine-S-sulfoxide reductase|msrA chromosome 5 L000004794 5 234937 235491 W 2011-02-03 1996-07-31 Methionine-S-sulfoxide reductase; involved in the response to oxidative stress; protects iron-sulfur clusters from oxidative inactivation along with MXR2; involved in the regulation of lifespan; reduced activity of human homolog implicated in Alzheimer disease -S000032841 CDS YER042W 5 234937 235491 W 2011-02-03 1996-07-31 -S000000845 ORF Verified YER043C SAH1 adenosylhomocysteinase chromosome 5 L000002989 5 237119 235770 C 2011-02-03 1996-07-31 S-adenosyl-L-homocysteine hydrolase; catabolizes S-adenosyl-L-homocysteine which is formed after donation of the activated methyl group of S-adenosyl-L-methionine (AdoMet) to an acceptor; regulates cellular lipid homoeostasis by regulating phosphatidylcholine(PC)synthesis and triacylglycerol (TG) levels -S000032879 CDS YER043C 5 237119 235770 C 2011-02-03 1996-07-31 -S000000846 ORF Verified YER044C ERG28 BUD18 chromosome 5 5 238016 237570 C 2011-02-03 1996-07-31 Endoplasmic reticulum membrane protein; may facilitate protein-protein interactions between the Erg26p dehydrogenase and the Erg27p 3-ketoreductase and/or tether these enzymes to the ER, also interacts with Erg6p -S000032987 CDS YER044C 5 238016 237570 C 2011-02-03 1996-07-31 -S000001954 ORF Verified YER044C-A MEI4 chromosome 5 L000001060 5 239774 238460 C 41 2011-02-03 1996-07-31 Meiosis-specific protein involved in forming DSBs; involved in double-strand break (DSBs) formation during meiotic recombination; required for chromosome synapsis and production of viable spores -S000032766 CDS YER044C-A 5 239623 238460 C 2011-02-03 1996-07-31 -S000032765 CDS YER044C-A 5 239774 239712 C 2011-02-03 1996-07-31 -S000032767 intron YER044C-A 5 239711 239624 C 2011-02-03 1996-07-31 -S000000847 ORF Verified YER045C ACA1 chromosome 5 5 241501 240032 C 2011-02-03 1996-07-31 ATF/CREB family basic leucine zipper (bZIP) transcription factor; binds as a homodimer to the ATF/CREB consensus sequence TGACGTCA; important for carbon source utilization; target genes include GRE2 and COS8; ACA1 has a paralog, CST6, that arose from the whole genome duplication -S000033081 CDS YER045C 5 241501 240032 C 2011-02-03 1996-07-31 -S000000848 ORF Verified YER046W SPO73 chromosome 5 5 243180 243611 W 2011-02-03 1996-07-31 Meiosis-specific protein required for prospore membrane morphogenesis; required for the proper shape of the prospore membrane (PSM) and for spore wall formation; functions cooperatively with SPO71 in PSM elongation; physically interacts with Spo71p; genetically antagonistic to SPO1, similar to SPO71; localizes to the PSM; required for spore wall formation during sporulation; dispensable for both nuclear divisions during meiosis; dysferlin domain-only protein -S000033892 CDS YER046W 5 243180 243611 W 2011-02-03 1996-07-31 -S000028747 ORF Dubious YER046W-A chromosome 5 5 243700 244029 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SAP1/YER047C -S000033417 CDS YER046W-A 5 243700 244029 W 2011-02-03 2003-07-29 -S000000849 ORF Verified YER047C SAP1 putative AAA family ATPase SAP1 chromosome 5 L000004134 5 246503 243810 C 2011-02-03 1996-07-31 Putative ATPase of the AAA family; interacts with the Sin1p transcriptional repressor in the two-hybrid system -S000033982 CDS YER047C 5 246503 243810 C 2011-02-03 1996-07-31 -S000000850 ORF Verified YER048C CAJ1 chromosome 5 L000000210 5 248157 246982 C 2011-02-03 1996-07-31 Nuclear type II J heat shock protein of the E. coli dnaJ family; contains a leucine zipper-like motif, binds to non-native substrates for presentation to Ssa3p, may function during protein translocation, assembly and disassembly -S000034089 CDS YER048C 5 248157 246982 C 2011-02-03 1996-07-31 -S000006893 long_terminal_repeat YERCdelta8 chromosome 5 5 249331 249109 C 2011-02-03 2000-05-19|2007-04-03 Ty1 LTR -S000006913 long_terminal_repeat YERWdelta9 chromosome 5 5 249445 249752 W 2011-02-03 2000-05-19 Ty1 LTR -S000006904 long_terminal_repeat YERCsigma1 chromosome 5 5 250270 249930 C 2011-02-03 2000-05-19 Ty3 LTR -S000006696 tRNA_gene tQ(UUG)E1 chromosome 5 L000003794 5 250286 250357 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034942 noncoding_exon tQ(UUG)E1 5 250286 250357 W 2011-02-03 2000-05-19 -S000007237 ORF Verified YER048W-A ISD11 chromosome 5 5 250718 251002 W 2011-02-03 1999-07-17 Cysteine desulfurase (Nfs1p) activator; essential for the formation of the persulfide intermediate at the desulfurase active site during pyridoxal phosphate-dependent desulfuration of cysteine; required for mitochondrial iron-sulfur cluster biosynthesis; exclusive to eukaryotes, implicated as eukaryotic supplement to the bacterium-derived Fe-S cluster (ISC) assembly apparatus; involved in regulation of iron metabolism; member of the LYR protein family -S000036074 CDS YER048W-A 5 250718 251002 W 2011-02-03 1999-07-17 -S000000851 ORF Verified YER049W TPA1 oxidative DNA demethylase chromosome 5 5 251728 253662 W 2011-02-03 1996-07-31 Fe(II)/2-oxoglutarate-dependent dioxygenase family member; catalyzes the repair of methyl-base lesions in both ss and dsDNA by oxidative demethylation; Poly(rA)-binding protein involved in mRNA poly(A) tail length and mRNA stability; role in translation termination efficiency; interacts with Sup45p (eRF1), Sup35p (eRF3) and Pab1p; similar to human prolyl 4-hydroxylase OGFOD1; binds Fe(II) and 2-oxoglutarate -S000035095 CDS YER049W 5 251728 253662 W 2011-02-03 1996-07-31 -S000000852 ORF Verified YER050C RSM18 mitochondrial 37S ribosomal protein RSM18 chromosome 5 5 254387 253971 C 2011-02-03 1996-07-31|2005-11-28 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S18 ribosomal protein -S000036333 CDS YER050C 5 254387 253971 C 2011-02-03 1996-07-31|2005-11-28 -S000000853 ORF Verified YER051W JHD1 [Histone H3]-lysine-36 demethylase|KDM2|JHDM1 chromosome 5 5 254656 256134 W 2011-02-03 1996-07-31 JmjC domain family histone demethylase specific for H3-K36; similar to proteins found in human, mouse, drosophila, X. laevis, C. elegans, and S. pombe -S000037038 CDS YER051W 5 254656 256134 W 2011-02-03 1996-07-31 -S000000854 ORF Verified YER052C HOM3 aspartate kinase|THR3|SIL4|BOR1 chromosome 5 L000000800 5 257958 256375 C 48 2011-02-03 1996-07-31 Aspartate kinase (L-aspartate 4-P-transferase); cytoplasmic enzyme that catalyzes the first step in the common pathway for methionine and threonine biosynthesis; expression regulated by Gcn4p and the general control of amino acid synthesis -S000037071 CDS YER052C 5 257958 256375 C 2011-02-03 1996-07-31 -S000077385 ARS ARS513 chromosome 5 5 257958 258737 2011-02-03 2004-10-19 Autonomously Replicating Sequence -S000000855 ORF Verified YER053C PIC2 Cu/Pi carrier chromosome 5 5 259639 258737 C 2011-02-03 1996-07-31 Mitochondrial copper and phosphate carrier; imports copper and inorganic phosphate into mitochondria; functionally redundant with Mir1p but less abundant than Mir1p under normal conditions; expression is induced at high temperature -S000037192 CDS YER053C 5 259639 258737 C 2011-02-03 1996-07-31 -S000007523 ORF Verified YER053C-A chromosome 5 5 261046 260933 C 2011-02-03 2000-07-14 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; protein abundance increases in response to DNA replication stress -S000037059 CDS YER053C-A 5 261046 260933 C 2011-02-03 2000-07-14 -S000000856 ORF Verified YER054C GIP2 chromosome 5 L000003093 5 263698 262052 C 2011-02-03 1996-07-31 Putative regulatory subunit of protein phosphatase Glc7p; involved in glycogen metabolism; contains a conserved motif (GVNK motif) that is also found in Gac1p, Pig1p, and Pig2p; GIP2 has a paralog, PIG2, that arose from the whole genome duplication -S000037276 CDS YER054C 5 263698 262052 C 2011-02-03 1996-07-31 -S000000857 ORF Verified YER055C HIS1 ATP phosphoribosyltransferase chromosome 5 L000000778 5 265785 264892 C 49 2011-02-03 1996-07-31 ATP phosphoribosyltransferase; a hexameric enzyme, catalyzes the first step in histidine biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts; transcription is regulated by general amino acid control -S000029938 CDS YER055C 5 265785 264892 C 2011-02-03 1996-07-31 -S000000858 ORF Verified YER056C FCY2 purine-cytosine permease|BRA7 chromosome 5 L000000607 5 268113 266512 C 49 2011-02-03 1996-07-31 Purine-cytosine permease; mediates purine (adenine, guanine, and hypoxanthine) and cytosine accumulation; relative distribution to the vacuole increases upon DNA replication stress -S000030053 CDS YER056C 5 268113 266512 C 2011-02-03 1996-07-31 -S000002135 ORF Verified YER056C-A RPL34A eL34|ribosomal 60S subunit protein L34A|L34e|L34A chromosome 5 L000004465 5 270185 269423 C 2011-02-03 2000-12-01|1996-07-31 Ribosomal 60S subunit protein L34A; homologous to mammalian ribosomal protein L34, no bacterial homolog; RPL34A has a paralog, RPL34B, that arose from the whole genome duplication -S000031749 CDS YER056C-A 5 269751 269423 C 2011-02-03 2000-12-01|1996-07-31 -S000031748 CDS YER056C-A 5 270185 270149 C 2011-02-03 2000-12-01|1996-07-31 -S000031750 intron YER056C-A 5 270148 269752 C 2011-02-03 2000-12-01|1996-07-31 -S000000859 ORF Verified YER057C HMF1 putative isoleucine biosynthesis protein HMF1|HIG1 chromosome 5 L000004440 5 271126 270737 C 2011-02-03 1996-07-31 Member of the p14.5 protein family; functionally complements Mmf1p function when targeted to mitochondria; heat shock inducible; high-dosage growth inhibitor; forms a homotrimer in vitro; HMF1 has a paralog, MMF1, that arose from the whole genome duplication -S000030235 CDS YER057C 5 271126 270737 C 2011-02-03 1996-07-31 -S000000860 ORF Verified YER058W PET117 chromosome 5 L000001396 5 271768 272091 W 2011-02-03 1996-07-31 Protein required for assembly of cytochrome c oxidase -S000031258 CDS YER058W 5 271768 272091 W 2011-02-03 1996-07-31 -S000000861 ORF Verified YER059W PCL6 chromosome 5 L000004038 5 272624 273886 W 2011-02-03 1996-07-31 Pho85p cyclin of the Pho80p subfamily; forms the major Glc8p kinase together with Pcl7p and Pho85p; involved in the control of glycogen storage by Pho85p; stabilized by Elongin C binding; PCL6 has a paralog, PCL7, that arose from the whole genome duplication -S000031353 CDS YER059W 5 272624 273886 W 2011-02-03 1996-07-31 -S000000862 ORF Verified YER060W FCY21 purine-cytosine permease chromosome 5 L000003373 5 274567 276153 W 2011-02-03 1996-07-31 Putative purine-cytosine permease; very similar to Fcy2p but cannot substitute for its function -S000032301 CDS YER060W 5 274567 276153 W 2011-02-03 1996-07-31 -S000178086 ARS ARS513.5 chromosome 5 5 276130 276528 2014-11-18 2014-11-18 Very weak autonomously replicating sequence -S000002958 ORF Verified YER060W-A FCY22 purine-cytosine permease chromosome 5 L000003374 5 276572 278164 W 2011-02-03 1999-07-17|1996-07-31 Putative purine-cytosine permease; very similar to Fcy2p but cannot substitute for its function -S000032822 CDS YER060W-A 5 276572 278164 W 2011-02-03 1999-07-17|1996-07-31 -S000178087 ARS ARS513.7 chromosome 5 5 278076 278357 2014-11-18 2014-11-18 Weak autonomously replicating sequence -S000178088 ARS_consensus_sequence ARS513.7 5 278177 278161 C 2014-11-18 2014-11-18 -S000000863 ORF Verified YER061C CEM1 fatty acid synthase CEM1 chromosome 5 L000000292 5 279626 278298 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial beta-keto-acyl synthase; possible role in fatty acid synthesis; required for mitochondrial respiration; human homolog OXSM can complement yeast cem1 null mutant -S000032319 CDS YER061C 5 279626 278298 C 2011-02-03 1996-07-31|2011-02-03 -S000000864 ORF Verified YER062C GPP2 HOR2|glycerol-1-phosphatase HOR2 chromosome 5 L000003979 5 280682 279930 C 2011-02-03 1996-07-31 DL-glycerol-3-phosphate phosphatase involved in glycerol biosynthesis; also known as glycerol-1-phosphatase; induced in response to hyperosmotic or oxidative stress, and during diauxic shift; GPP2 has a paralog, GPP1, that arose from the whole genome duplication -S000032451 CDS YER062C 5 280682 279930 C 2011-02-03 1996-07-31 -S000000865 ORF Verified YER063W THO1 chromosome 5 L000004712 5 281710 282366 W 2011-02-03 1996-07-31 Conserved nuclear RNA-binding protein; specifically binds to transcribed chromatin in a THO- and RNA-dependent manner, genetically interacts with shuttling hnRNP NAB2; overproduction suppresses transcriptional defect caused by hpr1 mutation -S000033296 CDS YER063W 5 281710 282366 W 2011-02-03 1996-07-31 -S000000866 ORF Verified YER064C VHR2 chromosome 5 5 284222 282705 C 2011-02-03 1996-07-31 Non-essential nuclear protein; null mutation has global effects on transcription; VHR2 has a paralog, VHR1, that arose from the whole genome duplication; relative distribution to the nucleus increases upon DNA replication stress -S000033339 CDS YER064C 5 284222 282705 C 2011-02-03 1996-07-31 -S000000867 ORF Verified YER065C ICL1 isocitrate lyase 1 chromosome 5 L000000848 5 286914 285241 C 2011-02-03 1996-07-31 Isocitrate lyase; catalyzes the formation of succinate and glyoxylate from isocitrate, a key reaction of the glyoxylate cycle; expression of ICL1 is induced by growth on ethanol and repressed by growth on glucose -S000033405 CDS YER065C 5 286914 285241 C 2011-02-03 1996-07-31 -S000077386 ARS ARS514 ARSV-288 chromosome 5 5 287552 287629 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000178089 ARS_consensus_sequence ARS514 5 287565 287581 W 2014-11-18 2014-11-18 -S000006894 long_terminal_repeat YERCdelta10 chromosome 5 5 288062 287745 C 2011-02-03 2000-05-19 Ty1 LTR -S000006734 tRNA_gene tS(UGA)E SUP19 SUP20 chromosome 5 L000002192|L000003805 5 288524 288443 C 50 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000034046 noncoding_exon tS(UGA)E 5 288524 288443 C 2011-02-03 2000-05-19 -S000000868 ORF Uncharacterized YER066W RRT13 chromosome 5 5 290242 290799 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with decreased levels of rDNA transcription -S000034374 CDS YER066W 5 290242 290799 W 2011-02-03 1996-07-31 -S000000869 ORF Verified YER067W RGI1 chromosome 5 5 292066 292551 W 2011-02-03 1996-07-31 Protein of unknown function; involved in energy metabolism under respiratory conditions; protein abundance is increased upon intracellular iron depletion or in response to DNA replication stress; RGI1 has a paralog, RGI2, that arose from the whole genome duplication -S000034452 CDS YER067W 5 292066 292551 W 2011-02-03 1996-07-31 -S000002959 ORF Dubious YER066C-A chromosome 5 5 292203 291703 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YER067W -S000035687 CDS YER066C-A 5 292203 291703 C 2011-02-03 1996-07-31 -S000028748 ORF Dubious YER067C-A chromosome 5 5 292563 292240 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF RGI1/YER067W -S000033418 CDS YER067C-A 5 292563 292240 C 2011-02-03 2003-07-29 -S000000870 ORF Verified YER068W MOT2 CCR4-NOT core ubiquitin-protein ligase subunit MOT2|SIG1|NOT4 chromosome 5 L000001887|L000001137 5 293050 294813 W 2011-02-03 1996-07-31 Ubiquitin-protein ligase subunit of the CCR4-NOT complex; with Ubc4p, ubiquitinates nascent polypeptide-associated complex subunits and histone demethyase Jhd2p; CCR4-NOT has roles in transcription regulation, mRNA degradation, and post-transcriptional modifications; regulates levels of DNA Polymerase-{alpha} to promote efficient and accurate DNA replication -S000035479 CDS YER068W 5 293050 294813 W 2011-02-03 1996-07-31 -S000000871 ORF Verified YER069W ARG5,6 argC|argB|bifunctional acetylglutamate kinase/N-acetyl-gamma-glutamyl-phosphate reductase chromosome 5 L000000110 5 295410 298001 W 55 2011-02-03 1996-07-31 Acetylglutamate kinase and N-acetyl-gamma-glutamyl-phosphate reductase; N-acetyl-L-glutamate kinase (NAGK) catalyzes the 2nd and N-acetyl-gamma-glutamyl-phosphate reductase (NAGSA), the 3rd step in arginine biosynthesis; synthesized as a precursor which is processed in the mitochondrion to yield mature NAGK and NAGSA; enzymes form a metabolon complex with Arg2p; NAGK C-terminal domain stabilizes the enzymes, slows catalysis and is involved in feed-back inhibition by arginine -S000035588 CDS YER069W 5 295410 298001 W 2011-02-03 1996-07-31 -S000028749 ORF Dubious YER068C-A chromosome 5 5 295732 295301 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF ARG5,6/YER069W -S000033419 CDS YER068C-A 5 295732 295301 C 2011-02-03 2003-07-29 -S000000872 ORF Verified YER070W RNR1 ribonucleotide-diphosphate reductase subunit RNR1|SDS12|RIR1|CRT7 chromosome 5 L000001655 5 298950 301616 W 2011-02-03 1996-07-31 Major isoform of large subunit of ribonucleotide-diphosphate reductase; the RNR complex catalyzes rate-limiting step in dNTP synthesis, regulated by DNA replication and DNA damage checkpoint pathways via localization of small subunits; relative distribution to the nucleus increases upon DNA replication stress; RNR1 has a paralog, RNR3, that arose from the whole genome duplication -S000035499 CDS YER070W 5 298950 301616 W 2011-02-03 1996-07-31 -S000000873 ORF Uncharacterized YER071C TDA2 chromosome 5 5 302327 301947 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; null mutant is sensitive to expression of the top1-T722A allele -S000035526 CDS YER071C 5 302327 301947 C 2011-02-03 1996-07-31 -S000000874 ORF Verified YER072W VTC1 PHM4|NRF1 chromosome 5 L000004689 5 302806 303195 W 2011-02-03 1996-07-31 Regulatory subunit of the vacuolar transporter chaperone (VTC) complex; VTC complex is involved in membrane trafficking, vacuolar polyphosphate accumulation, microautophagy and non-autophagic vacuolar fusion; also has mRNA binding activity; protein abundance increases in response to DNA replication stress -S000036469 CDS YER072W 5 302806 303195 W 2011-02-03 1996-07-31 -S000000875 ORF Verified YER073W ALD5 aldehyde dehydrogenase (NAD(P)(+)) ALD5 chromosome 5 L000004949 5 304030 305592 W 2011-02-03 1996-07-31|2011-02-03 Mitochondrial aldehyde dehydrogenase; involved in regulation or biosynthesis of electron transport chain components and acetate formation; activated by K+; utilizes NADP+ as the preferred coenzyme; constitutively expressed -S000036548 CDS YER073W 5 304030 305592 W 2011-02-03 1996-07-31|2011-02-03 -S000000876 ORF Verified YER074W RPS24A eS24|ribosomal 40S subunit protein S24A|S24e|S24A|RPS24EA chromosome 5 L000002710 5 306323 307196 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S24, no bacterial homolog; RPS24A has a paralog, RPS24B, that arose from the whole genome duplication -S000036669 CDS YER074W 5 306323 306325 W 2011-02-03 1996-07-31 -S000036670 CDS YER074W 5 306792 307196 W 2011-02-03 1996-07-31 -S000036671 intron YER074W 5 306326 306791 W 2011-02-03 1996-07-31 -S000007651 ORF Verified YER074W-A YOS1 chromosome 5 5 307653 308123 W 2011-02-03 2004-01-08|2001-06-29 Integral membrane protein required for ER to Golgi transport; localized to the Golgi, the ER, and COPII vesicles; interacts with Yip1p and Yif1p -S000037341 CDS YER074W-A 5 307653 307746 W 2011-02-03 2004-01-08|2001-06-29 -S000037342 CDS YER074W-A 5 307849 307956 W 2011-02-03 2004-01-08|2001-06-29 -S000037343 CDS YER074W-A 5 308068 308123 W 2011-02-03 2004-01-08|2001-06-29 -S000037344 intron YER074W-A 5 307747 307848 W 2011-02-03 2004-01-08|2001-06-29 -S000037345 intron YER074W-A 5 307957 308067 W 2011-02-03 2004-01-08|2001-06-29 -S000000877 ORF Verified YER075C PTP3 tyrosine protein phosphatase PTP3 chromosome 5 L000003996 5 311199 308413 C 2011-02-03 1996-07-31|2011-02-03 Phosphotyrosine-specific protein phosphatase; involved in the inactivation of mitogen-activated protein kinase (MAPK) during osmolarity sensing; dephosporylates Hog1p MAPK and regulates its localization; localized to the cytoplasm -S000036705 CDS YER075C 5 311199 308413 C 2011-02-03 1996-07-31|2011-02-03 -S000006522 tRNA_gene tA(UGC)E chromosome 5 L000003804 5 312095 312023 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine -S000034855 noncoding_exon tA(UGC)E 5 312095 312023 C 2011-02-03 2000-05-19 -S000006914 long_terminal_repeat YERWdelta11 chromosome 5 5 312274 312445 W 2011-02-03 2000-05-19 Ty1 LTR -S000028750 ORF Dubious YER076W-A chromosome 5 5 313390 313737 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YER076C -S000033444 CDS YER076W-A 5 313390 313737 W 2011-02-03 2003-07-29 -S000000878 ORF Uncharacterized YER076C chromosome 5 5 313498 312590 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; analysis of HA-tagged protein suggests a membrane localization -S000037415 CDS YER076C 5 313498 312590 C 2011-02-03 1996-07-31 -S000000879 ORF Uncharacterized YER077C MRX1 chromosome 5 5 316600 314534 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; null mutation results in a decrease in plasma membrane electron transport -S000037540 CDS YER077C 5 316600 314534 C 2011-02-03 1996-07-31 -S000077387 ARS ARS515 chromosome 5 5 316600 316807 2011-02-03 2004-10-19 Autonomously Replicating Sequence -S000000880 ORF Verified YER078C ICP55 aminopeptidase chromosome 5 5 318342 316807 C 2011-02-03 1996-07-31 Mitochondrial aminopeptidase; cleaves the N termini of at least 38 imported proteins after cleavage by the mitochondrial processing peptidase (MPP), thereby increasing their stability; member of the aminopeptidase P family -S000037656 CDS YER078C 5 318342 316807 C 2011-02-03 1996-07-31 -S000028546 ORF Uncharacterized YER078W-A chromosome 5 5 318646 318810 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031196 CDS YER078W-A 5 318646 318810 W 2011-02-03 2003-07-29 -S000000881 ORF Uncharacterized YER079W chromosome 5 5 318920 319552 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000030524 CDS YER079W 5 318920 319552 W 2011-02-03 1996-07-31 -S000000882 ORF Verified YER080W AIM9 FMP29 chromosome 5 5 319963 321846 W 2011-02-03 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays elevated frequency of mitochondrial genome loss -S000031341 CDS YER080W 5 319963 321846 W 2011-02-03 1996-07-31 -S000028751 ORF Dubious YER079C-A chromosome 5 5 320240 319902 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF AIM9/YER080W -S000033445 CDS YER079C-A 5 320240 319902 C 2011-02-03 2003-07-29 -S000029010 ncRNA_gene SRG1 SRG1 chromosome 5 5 322212 322762 W 2011-02-03 2003-10-29 Non-protein-coding RNA that regulates the transcription of SER3; expression of SRG1 RNA represses expression of its neighboring gene SER3 via a transcription-interference mechanism -S000035975 noncoding_exon SRG1 5 322212 322762 W 2011-02-03 2003-10-29 -S000000883 ORF Verified YER081W SER3 phosphoglycerate dehydrogenase SER3 chromosome 5 S000007457 5 322686 324095 W 2011-02-03 1996-07-31 3-phosphoglycerate dehydrogenase and alpha-ketoglutarate reductase; 3PG dehydrogenase that catalyzes the first step in serine and glycine biosynthesis; also functions as an alpha-ketoglutarate reductase, converting alpha-ketoglutarate to D-2-hydroxyglutarate (D-2HG); localizes to the cytoplasm; SER3 has a paralog, SER33, that arose from the whole genome duplication -S000031424 CDS YER081W 5 322686 324095 W 2011-02-03 1996-07-31 -S000000884 ORF Verified YER082C UTP7 KRE31 chromosome 5 5 325936 324272 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA -S000031483 CDS YER082C 5 325936 324272 C 2011-02-03 1996-07-31 -S000000885 ORF Verified YER083C GET2 GET complex subunit GET2|RMD7|HUR2 chromosome 5 5 327031 326174 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the GET complex; involved in insertion of proteins into the ER membrane; required for the retrieval of HDEL proteins from the Golgi to the ER in an ERD2 dependent fashion and for meiotic nuclear division -S000031538 CDS YER083C 5 327031 326174 C 2011-02-03 2003-09-22|1996-07-31 -S000000886 ORF Uncharacterized YER084W chromosome 5 5 327065 327451 W 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels -S000032559 CDS YER084W 5 327065 327451 W 2011-02-03 1996-07-31 -S000028752 ORF Dubious YER084W-A chromosome 5 5 327598 328110 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps uncharacterized ORF YER085C -S000033446 CDS YER084W-A 5 327598 328110 W 2011-02-03 2003-07-29 -S000000887 ORF Uncharacterized YER085C chromosome 5 5 328140 327619 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000032615 CDS YER085C 5 328140 327619 C 2011-02-03 1996-07-31 -S000000888 ORF Verified YER086W ILV1 threonine ammonia-lyase ILV1|ISO1 chromosome 5 L000000857 5 328477 330207 W 64 2011-02-03 1999-07-17|1996-07-31 Threonine deaminase, catalyzes first step in isoleucine biosynthesis; expression is under general amino acid control; ILV1 locus exhibits highly positioned nucleosomes whose organization is independent of known ILV1 regulation -S000032774 CDS YER086W 5 328477 330207 W 2011-02-03 1996-07-31 -S000000889 ORF Verified YER087W AIM10 putative proline--tRNA ligase AIM10 chromosome 5 5 330576 332306 W 2011-02-03 1996-07-31 Protein with similarity to tRNA synthetases; non-tagged protein is detected in purified mitochondria; null mutant is viable and displays elevated frequency of mitochondrial genome loss -S000033504 CDS YER087W 5 330576 332306 W 2011-02-03 1996-07-31 -S000028753 ORF Dubious YER087C-A chromosome 5 5 332368 331817 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF AIM10/YER087W -S000033447 CDS YER087C-A 5 332368 331817 C 2011-02-03 2003-07-29 -S000002128 ORF Verified YER087C-B SBH1 Arf family guanine nucleotide exchange factor SBH1|YER087C-A|SEB1 chromosome 5 L000002846|L000004137 5 332830 332582 C 2011-02-03 1996-07-31 Beta subunit of Sec61p ER translocation complex (Sec61p-Sss1p-Sbh1p); involved in protein translocation into the endoplasmic reticulum; interacts with the exocyst complex and also with Rtn1p; cotranslationally N-acetylated by NatA; SBH1 has a paralog, SBH2, that arose from the whole genome duplication -S000037045 CDS YER087C-B 5 332830 332582 C 2011-02-03 1996-07-31 -S000000890 ORF Verified YER088C DOT6 PBF2 chromosome 5 L000004393 5 335188 333176 C 2011-02-03 1996-07-31 Protein involved in rRNA and ribosome biogenesis; activated in stochastic pulses of nuclear localization; binds polymerase A and C motif; subunit of the RPD3L histone deacetylase complex; has chromatin specific SANT domain; involved in telomeric gene silencing and filamentation; relative distribution to the nucleus increases upon DNA replication stress -S000033553 CDS YER088C 5 335188 333176 C 2011-02-03 1996-07-31 -S000028623 ORF Dubious YER088W-B chromosome 5 5 335927 336073 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the ORF PTC2/YER089C; identified by gene-trapping, expression analysis, and homology searching -S000031475 CDS YER088W-B 5 335927 336073 W 2011-02-03 2003-07-29 -S000028754 ORF Dubious YER088C-A chromosome 5 5 336019 335696 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORFs PTC2/YER089C and YER088W-B -S000033448 CDS YER088C-A 5 336019 335696 C 2011-02-03 2003-07-29 -S000000891 ORF Verified YER089C PTC2 type 2C protein phosphatase PTC2 chromosome 5 L000003403 5 337340 335946 C 2011-02-03 1996-07-31 Type 2C protein phosphatase (PP2C); dephosphorylates Hog1p to limit maximal osmostress induced kinase activity; dephosphorylates Ire1p to downregulate the unfolded protein response; dephosphorylates Cdc28p; inactivates the DNA damage checkpoint; PTC2 has a paralog, PTC3, that arose from the whole genome duplication -S000033635 CDS YER089C 5 337340 335946 C 2011-02-03 1996-07-31 -S000000892 ORF Verified YER090W TRP2 anthranilate synthase TRP2 chromosome 5 L000002353 5 337949 339472 W 76 2011-02-03 1996-07-31 Anthranilate synthase; catalyzes the initial step of tryptophan biosynthesis, forms multifunctional hetero-oligomeric anthranilate synthase:indole-3-glycerol phosphate synthase enzyme complex with Trp3p -S000035640 CDS YER090W 5 337949 339472 W 2011-02-03 1996-07-31 -S000029725 ORF Dubious YER090C-A chromosome 5 5 338411 338322 C 2011-02-03 2004-08-27 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036876 CDS YER090C-A 5 338411 338322 C 2011-02-03 2004-08-27 -S000000893 ORF Verified YER091C MET6 5-methyltetrahydropteroyltriglutamate-homocysteine S-methyltransferase chromosome 5 L000001081 5 342167 339864 C 77 2011-02-03 1996-07-31 Cobalamin-independent methionine synthase; involved in methionine biosynthesis and regeneration; requires a minimum of two glutamates on the methyltetrahydrofolate substrate, similar to bacterial metE homologs -S000035673 CDS YER091C 5 342167 339864 C 2011-02-03 1996-07-31 -S000007238 ORF Dubious YER091C-A chromosome 5 5 342611 342390 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034939 CDS YER091C-A 5 342611 342390 C 2011-02-03 1999-07-17 -S000000894 ORF Verified YER092W IES5 chromosome 5 5 342855 343232 W 2011-02-03 1996-07-31 Non-essential INO80 chromatin remodeling complex subunit; deletion affects telomere maintenance via recombination -S000035789 CDS YER092W 5 342855 343232 W 2011-02-03 1996-07-31 -S000000895 ORF Verified YER093C TSC11 TORC2 complex subunit TSC11|AVO3 chromosome 5 5 347612 343320 C 2011-02-03 1996-07-31 Subunit of TORC2 (Tor2p-Lst8p-Avo1-Avo2-Tsc11p-Bit61p); TORC2 is a membrane-associated complex that regulates actin cytoskeletal dynamics during polarized growth and cell wall integrity; involved in sphingolipid metabolism; contains a RasGEFN domain -S000035826 CDS YER093C 5 347612 343320 C 2011-02-03 1996-07-31 -S000002960 ORF Verified YER093C-A AIM11 GEP8 chromosome 5 5 348400 347912 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant is viable but shows increased loss of mitochondrial genome and synthetic interaction with prohibitin (phb1); contains an intron; SWAT-GFP and mCherry fusion proteins localize to the mitochondria; YER093C-A has a paralog, YBL059W, that arose from the whole genome duplication -S000030866 CDS YER093C-A 5 348201 347912 C 2011-02-03 1996-07-31 -S000030865 CDS YER093C-A 5 348400 348277 C 2011-02-03 1996-07-31 -S000030867 intron YER093C-A 5 348276 348202 C 2011-02-03 1996-07-31 -S000000896 ORF Verified YER094C PUP3 proteasome core particle subunit beta 3|SCS32 chromosome 5 L000001532 5 349346 348729 C 2011-02-03 1996-07-31 Beta 3 subunit of the 20S proteasome; involved in ubiquitin-dependent catabolism; human homolog is subunit C10 -S000035946 CDS YER094C 5 349346 348729 C 2011-02-03 1996-07-31 -S000000897 ORF Verified YER095W RAD51 recombinase RAD51|MUT5 chromosome 5 L000001571 5 349980 351182 W 78 2011-02-03 1996-07-31 Strand exchange protein; forms a helical filament with DNA that searches for homology; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; homolog of Dmc1p and bacterial RecA protein -S000036878 CDS YER095W 5 349980 351182 W 2011-02-03 1996-07-31 -S000000898 ORF Verified YER096W SHC1 chromosome 5 L000001879 5 351698 353236 W 79.23 2011-02-03 1996-07-31 Sporulation-specific activator of Chs3p (chitin synthase III); required for the synthesis of the chitosan layer of ascospores; transcriptionally induced at alkaline pH; SHC1 has a paralog, SKT5, that arose from the whole genome duplication -S000036926 CDS YER096W 5 351698 353236 W 2011-02-03 1996-07-31 -S000006915 long_terminal_repeat YERWdelta12 chromosome 5 5 353399 353735 W 2011-02-03 2000-05-19 Ty1 LTR -S000077388 ARS ARS516 ARSV-354 chromosome 5 5 353578 353636 2014-11-18 2014-11-18|2004-10-19|2006-10-02 Autonomously Replicating Sequence -S000178090 ARS_consensus_sequence ARS516 5 353582 353598 W 2014-11-18 2014-11-18 -S000006916 long_terminal_repeat YERWdelta13 chromosome 5 5 354136 354850 W 2011-02-03 2000-05-19 Ty1 LTR -S000006908 long_terminal_repeat YERCtau2 chromosome 5 5 354730 354360 C 2011-02-03 2000-05-19 Ty4 LTR -S000006905 long_terminal_repeat YERCsigma2 chromosome 5 5 354917 354851 C 2011-02-03 2000-05-19 Ty3 LTR -S000006551 tRNA_gene tE(UUC)E2 chromosome 5 L000003795 5 354934 355005 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034437 noncoding_exon tE(UUC)E2 5 354934 355005 W 2011-02-03 2000-05-19 -S000000899 ORF Dubious YER097W chromosome 5 5 355140 355469 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036977 CDS YER097W 5 355140 355469 W 2011-02-03 1996-07-31 -S000000900 ORF Verified YER098W UBP9 putative ubiquitin-specific protease UBP9 chromosome 5 L000003170 5 355466 357730 W 2011-02-03 1996-07-31 Ubiquitin-specific protease that cleaves ubiquitin-protein fusions; UBP9 has a paralog, UBP13, that arose from the whole genome duplication -S000037747 CDS YER098W 5 355466 357730 W 2011-02-03 1996-07-31 -S000000901 ORF Verified YER099C PRS2 ribose phosphate diphosphokinase subunit PRS2 chromosome 5 L000001512 5 359061 358105 C 2011-02-03 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase, synthesizes PRPP; which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes; PRS2 has a paralog, PRS4, that arose from the whole genome duplication -S000037788 CDS YER099C 5 359061 358105 C 2011-02-03 1996-07-31 -S000000902 ORF Verified YER100W UBC6 E2 ubiquitin-conjugating protein UBC6|DOA2 chromosome 5 L000002409 5 359562 360314 W 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme involved in ERAD; located at the cytosolic side of the ER membrane; tail region contains a transmembrane segment at the C-terminus; substrate of the ubiquitin-proteasome pathway; ER-associated protein degradation is also known as ERAD -S000035454 CDS YER100W 5 359562 360314 W 2011-02-03 1996-07-31 -S000000903 ORF Verified YER101C AST2 chromosome 5 L000000134 5 361794 360502 C 2011-02-03 1996-07-31 Lipid raft associated protein; overexpression restores Pma1p localization to lipid rafts which is required for targeting of Pma1p to the plasma membrane; sometimes classified in the medium-chain dehydrogenase/reductases (MDRs) superfamily; AST2 has a paralog, AST1, that arose from the whole genome duplication -S000036309 CDS YER101C 5 361794 360502 C 2011-02-03 1996-07-31 -S000000904 ORF Verified YER102W RPS8B eS8|ribosomal 40S subunit protein S8B|S8e|rp19|YS9|S8B|S14B chromosome 5 L000001754 5 363100 363702 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S8, no bacterial homolog; RPS8B has a paralog, RPS8A, that arose from the whole genome duplication -S000036450 CDS YER102W 5 363100 363702 W 2011-02-03 1996-07-31 -S000122096 five_prime_UTR_intron YER102W 5 362733 363092 W 2011-02-03 2007-04-04 -S000000905 ORF Verified YER103W SSA4 Hsp70 family chaperone SSA4|YG107 chromosome 5 L000002072 5 364589 366517 W 2011-02-03 1996-07-31 Heat shock protein that is highly induced upon stress; plays a role in SRP-dependent cotranslational protein-membrane targeting and translocation; member of the HSP70 family; cytoplasmic protein that concentrates in nuclei upon starvation; SSA4 has a paralog, SSA3, that arose from the whole genome duplication -S000036552 CDS YER103W 5 364589 366517 W 2011-02-03 1996-07-31 -S000000906 ORF Verified YER104W RTT105 chromosome 5 S000007476 5 366802 367428 W 2011-02-03 1996-07-31 Protein with a role in regulation of Ty1 transposition -S000037250 CDS YER104W 5 366802 367428 W 2011-02-03 1996-07-31 -S000000907 ORF Verified YER105C NUP157 chromosome 5 L000003139 5 372013 367838 C 2011-02-03 1996-07-31 Subunit of the inner ring of the nuclear pore complex (NPC); contributes to NPC assembly and tethering of DNA to the nuclear periphery; both Nup170p and NUP157p are similar to human Nup155p; NUP157 has a paralog, NUP170, that arose from the whole genome duplication -S000037287 CDS YER105C 5 372013 367838 C 2011-02-03 1996-07-31 -S000000908 ORF Verified YER106W MAM1 chromosome 5 5 372326 373234 W 2011-02-03 1996-07-31 Monopolin; meiosis-specific kinetochore-associated protein involved in monopolar attachment of sister kinetochores to the meiotic spindle; subunit of monopolin, a complex that prevents biorientation of sister kinetochores to ensure homolog biorientation during meiosis I; regulates the conformation, enzyme kinetics and substrate specificity of the Dsn1p kinase, Hrr1p; expressed only during the first meiotic division -S000037445 CDS YER106W 5 372326 373234 W 2011-02-03 1996-07-31 -S000028755 ORF Dubious YER107W-A chromosome 5 5 374394 374714 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF GLE2/YER107C -S000033449 CDS YER107W-A 5 374394 374714 W 2011-02-03 2003-07-29 -S000000909 ORF Verified YER107C GLE2 RNA export factor GLE2|RAE1 chromosome 5 L000004084 5 374545 373448 C 2011-02-03 1996-07-31 RNA export factor associated with the nuclear pore complex (NPC); associates with NUP116p; required for polyadenylated RNA export but not for protein import; homologous to S. pombe Rae1p and human RAE1 -S000037509 CDS YER107C 5 374545 373448 C 2011-02-03 1996-07-31 -S000000911 blocked_reading_frame YER109C FLO8 transcription factor FLO8|STA10|YER108C|PHD5 chromosome 5 L000003202|S000000910|S000029523|L000004208 5 377614 375215 C 2011-02-03 1999-07-17|1996-07-31 Transcription factor; required for flocculation, diploid filamentous growth, and haploid invasive growth; forms a heterodimer with Mss1p that interacts with the Swi/Snf complex during transcriptional activation of FLO1, FLO11, and STA1; S. cerevisiae genome reference strain S288C contains an internal in-frame stop at codon 142, which in other strains encodes tryptophan -S000030400 CDS YER109C 5 377614 375215 C 2011-02-03 1999-07-17|1996-07-31 -S000000912 ORF Verified YER110C KAP123 YRB4 chromosome 5 L000003445|L000003466 5 382103 378762 C 2011-02-03 1996-07-31 Karyopherin beta; mediates nuclear import of ribosomal proteins prior to assembly into ribosomes and import of histones H3 and H4; localizes to the nuclear pore, nucleus, and cytoplasm; exhibits genetic interactions with RAI1 -S000030722 CDS YER110C 5 382103 378762 C 2011-02-03 1996-07-31 -S000000913 ORF Verified YER111C SWI4 SBF complex DNA-binding subunit SWI4|ART1 chromosome 5 L000000124|L000002252 5 385876 382595 C 2011-02-03 1996-07-31 DNA binding component of the SBF complex (Swi4p-Swi6p); a transcriptional activator that in concert with MBF (Mbp1-Swi6p) regulates late G1-specific transcription of targets including cyclins and genes required for DNA synthesis and repair; Slt2p-independent regulator of cold growth; acetylation at two sites, K1016 and K1066, regulates interaction with Swi6p -S000031559 CDS YER111C 5 385876 382595 C 2011-02-03 1996-07-31 -S000000914 ORF Verified YER112W LSM4 U6 snRNA complex subunit LSM4|USS1|SDB23 chromosome 5 L000002447 5 387232 387795 W 2011-02-03 1996-07-31 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; forms cytoplasmic foci upon DNA replication stress -S000031681 CDS YER112W 5 387232 387795 W 2011-02-03 1996-07-31 -S000000915 ORF Verified YER113C TMN3 chromosome 5 5 390052 387932 C 2011-02-03 1996-07-31 Protein with a role in cellular adhesion and filamentous growth; similar to Emp70p and Tmn2p; member of Transmembrane Nine family with 9 transmembrane segments; localizes to Golgi; induced by 8-methoxypsoralen plus UVA irradiation -S000031762 CDS YER113C 5 390052 387932 C 2011-02-03 1996-07-31 -S000000916 ORF Verified YER114C BOI2 BEB1 chromosome 5 L000000166|L000002916 5 393712 390590 C 2011-02-03 1996-07-31 Protein implicated in polar growth, functionally redundant with Boi1p; interacts with bud-emergence protein Bem1p; contains an SH3 (src homology 3) domain and a PH (pleckstrin homology) domain; BOI2 has a paralog, BOI1, that arose from the whole genome duplication -S000031880 CDS YER114C 5 393712 390590 C 2011-02-03 1996-07-31 -S000000917 ORF Verified YER115C SPR6 chromosome 5 L000002023 5 394867 394292 C 93 2011-02-03 1996-07-31 Protein of unknown function; expressed during sporulation; not required for sporulation, but gene exhibits genetic interactions with other genes required for sporulation -S000032791 CDS YER115C 5 394867 394292 C 2011-02-03 1996-07-31 -S000000918 ORF Verified YER116C SLX8 SUMO-targeted ubiquitin ligase complex subunit SLX8 chromosome 5 5 396172 395348 C 2011-02-03 1996-07-31 Subunit of Slx5-Slx8 SUMO-targeted ubiquitin ligase (STUbL) complex; role in proteolysis of spindle positioning protein Kar9, DNA repair proteins Rad52p and Rad57p; stimulated by SUMO-modified substrates; contains a C-terminal RING domain; forms nuclear foci upon DNA replication stress; required for maintenance of genome integrity like human ortholog RNF -S000032881 CDS YER116C 5 396172 395348 C 2011-02-03 1996-07-31 -S000000919 ORF Verified YER117W RPL23B uL14|ribosomal 60S subunit protein L23B|L14|YL32|L23B|L17aB chromosome 5 L000001717 5 396769 397653 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L23B; homologous to mammalian ribosomal protein L23 and bacterial L14; RPL23B has a paralog, RPL23A, that arose from the whole genome duplication -S000033044 CDS YER117W 5 396769 396810 W 2011-02-03 1996-07-31 -S000033045 CDS YER117W 5 397282 397653 W 2011-02-03 1996-07-31 -S000033046 intron YER117W 5 396811 397281 W 2011-02-03 1996-07-31 -S000000920 ORF Verified YER118C SHO1 osmosensor SHO1|SSU81 chromosome 5 L000002632|L000002823 5 399055 397952 C 2011-02-03 1996-07-31 Transmembrane osmosensor for filamentous growth and HOG pathways; involved in activation of the Cdc42p- and MAP kinase-dependent filamentous growth pathway and the high-osmolarity glycerol (HOG) response pathway; phosphorylated by Hog1p; interacts with Pbs2p, Msb2p, Hkr1p, and Ste11p -S000033082 CDS YER118C 5 399055 397952 C 2011-02-03 1996-07-31 -S000000921 ORF Verified YER119C AVT6 aspartate/glutamate transporter chromosome 5 5 400842 399496 C 2011-02-03 1996-07-31 Vacuolar aspartate and glutamate exporter; member of a family of seven genes (AVT1-7) related to vesicular GABA-glycine transporters; involved in compartmentalizing acidic amino acids in response to nitrogen starvation; AVT6 has a paralog, AVT5, that arose from the whole genome duplication -S000033839 CDS YER119C 5 400842 399496 C 2011-02-03 1996-07-31 -S000000922 ORF Verified YER120W SCS2 phosphatidylinositol-binding protein SCS2 chromosome 5 L000002629 5 401135 401869 W 2011-02-03 1996-07-31 Integral ER membrane protein, regulates phospholipid metabolism; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to plasma membrane (PM) and regulate PI4P levels by controlling access of Sac1p phosphatase to substrate PI4P in the PM; interacts with FFAT motifs in Opi1p, Swh1p, Osh2p, and Osh3p; involved in telomeric silencing; VAP homolog; SCS2 has a paralog, SCS22, that arose from the whole genome duplication -S000036090 CDS YER120W 5 401135 401869 W 2011-02-03 1996-07-31 -S000002961 ORF Dubious YER119C-A chromosome 5 5 401238 400867 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion mutation blocks replication of Brome mosaic virus in S. cerevisiae, but this is likely due to effects on the overlapping gene SCS2 -S000033092 CDS YER119C-A 5 401238 400867 C 2011-02-03 1996-07-31 -S000000923 ORF Uncharacterized YER121W chromosome 5 5 402375 402719 W 2011-02-03 1996-07-31 Putative protein of unknown function; may be involved in phosphatase regulation and/or generation of precursor metabolites and energy -S000036211 CDS YER121W 5 402375 402719 W 2011-02-03 1996-07-31 -S000000924 ORF Verified YER122C GLO3 ADP-ribosylation factor GTPase-activating protein chromosome 5 L000000713 5 404352 402871 C 2011-02-03 1996-07-31 ADP-ribosylation factor GTPase activating protein (ARF GAP); involved in ER-Golgi transport; shares functional similarity with Gcs1p -S000036231 CDS YER122C 5 404352 402871 C 2011-02-03 1996-07-31 -S000000925 ORF Verified YER123W YCK3 casein kinase YCK3|CKI3 chromosome 5 L000002915 5 404813 406387 W 2011-02-03 2000-03-16|1996-07-31 Palmitoylated vacuolar membrane-localized casein kinase I isoform; negatively regulates vacuole fusion during hypertonic stress via phosphorylation of Vps41p; shares essential functions with Hrr25p; regulates vesicle fusion in AP-3 pathway -S000036985 CDS YER123W 5 404813 406387 W 2011-02-03 2000-03-16|1996-07-31 -S000077389 ARS ARS517 ARSV-407 chromosome 5 5 406752 406953 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000000926 ORF Verified YER124C DSE1 chromosome 5 5 409063 407342 C 2011-02-03 1996-07-31 Daughter cell-specific protein; may regulate cross-talk between the mating and filamentation pathways; deletion affects cell separation after division and sensitivity to alpha-factor and drugs affecting the cell wall; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000037009 CDS YER124C 5 409063 407342 C 2011-02-03 1996-07-31 -S000000927 ORF Verified YER125W RSP5 NEDD4 family E3 ubiquitin-protein ligase|SMM1|UBY1|NPI1|MUT2|MDP1 chromosome 5 L000001054|L000001779|L000001220 5 410189 412618 W 2011-02-03 1996-07-31 NEDD4 family E3 ubiquitin ligase; regulates processes including: MVB sorting, the heat shock response, transcription, endocytosis and ribosome stability; ubiquitinates Sec23p, Sna3p, Ste4p, Nfi1p, Rpo21p and Sem1p; autoubiquitinates; deubiquitinated by Ubp2p; regulated by SUMO ligase Siz1p, in turn regulates Siz1p SUMO ligase activity; required for efficient Golgi-to-ER trafficking in COPI mutants; mutant tolerates aneuploidy; human homolog implicated in Liddle syndrome -S000037135 CDS YER125W 5 410189 412618 W 2011-02-03 1996-07-31 -S000000928 ORF Verified YER126C NSA2 rRNA-processing protein NSA2 chromosome 5 5 414179 413394 C 2011-02-03 1996-07-31 Protein constituent of 66S pre-ribosomal particles; contributes to processing of the 27S pre-rRNA; recruited by ribosomal proteins L17, L35, and L37 to assembling ribosomes after 27SB pre-rRNA is generated, immediately preceding removal of ITS2 -S000037193 CDS YER126C 5 414179 413394 C 2011-02-03 1996-07-31 -S000000929 ORF Verified YER127W LCP5 chromosome 5 L000004265 5 414481 415554 W 2011-02-03 1996-07-31 Essential protein involved in maturation of 18S rRNA; depletion leads to inhibited pre-rRNA processing and reduced polysome levels; localizes primarily to the nucleolus -S000029893 CDS YER127W 5 414481 415554 W 2011-02-03 1996-07-31 -S000000930 ORF Verified YER128W VFA1 chromosome 5 5 415859 416470 W 2011-02-03 1996-07-31 Protein that interacts with Vps4p and has a role in vacuolar sorting; stimulates the ATPase activity of Vps4; localizes to endosomes in a Vps4-dependent manner; overexpression causes canavanine sensitivity and confers a partial class D vacuole morphology -S000030007 CDS YER128W 5 415859 416470 W 2011-02-03 1996-07-31 -S000000931 ORF Verified YER129W SAK1 serine/threonine protein kinase SAK1|PAK1 chromosome 5 L000001333 5 417281 420709 W 2011-02-03 1996-07-31 Upstream serine/threonine kinase for the SNF1 complex; plays a role in pseudohyphal groth; partially redundant with Elm1p and Tos3p; members of this family have functional orthology with LKB1, a mammalian kinase associated with Peutz-Jeghers cancer-susceptibility syndrome; SAK1 has a paralog, TOS3, that arose from the whole genome duplication -S000030128 CDS YER129W 5 417281 420709 W 2011-02-03 1996-07-31 -S000000932 ORF Verified YER130C COM2 chromosome 5 5 422446 421115 C 2011-02-03 1996-07-31 Transcription factor that binds IME1 Upstream Activation Signal (UAS)ru; COM2 transcription is regulated by Haa1p, Sok2p and Zap1p transcriptional activators; may bind the IME1 promoter under all growth conditions to negatively regulate its transcription in the absence of a positive regulator that binds more effectively; repressor activity may depend on phosphorylation by PKA; C. albicans homolog (MNL1) plays a role in adaptation to stress -S000031102 CDS YER130C 5 422446 421115 C 2011-02-03 1996-07-31 -S000000933 ORF Verified YER131W RPS26B eS26|ribosomal 40S subunit protein S26B|S26e|S26B chromosome 5 L000001763 5 423952 424311 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S26, no bacterial homolog; RPS26B has a paralog, RPS26A, that arose from the whole genome duplication; human homolog can partially complement an RPS26A, RPS26B double null mutant; mutations in the human gene are associated with Diamond-Blackfan anemia -S000031231 CDS YER131W 5 423952 424311 W 2011-02-03 1996-07-31 -S000122097 five_prime_UTR_intron YER131W 5 423591 423951 W 2011-02-03 2007-04-04 -S000006493 snoRNA_gene snR4 SNR4 chromosome 5 L000001959 5 424698 424883 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA) but not shown to be active; no target site is predicted within the ribosomal RNAs -S000034305 noncoding_exon snR4 5 424698 424883 W 2011-02-03 2000-05-19 -S000000934 ORF Verified YER132C PMD1 chromosome 5 L000003968 5 430449 425188 C 2011-02-03 1996-07-31 Protein with an N-terminal kelch-like domain; putative negative regulator of early meiotic gene expression; required, with Mds3p, for growth under alkaline conditions; PMD1 has a paralog, MDS3, that arose from the whole genome duplication -S000032160 CDS YER132C 5 430449 425188 C 2011-02-03 1996-07-31 -S000006443 snoRNA_gene snR52 SNR52 chromosome 5 L000004521 5 431220 431129 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2921 and small subunit (SSU) rRNA at position A420 -S000030733 noncoding_exon snR52 5 431220 431129 C 2011-02-03 2000-05-19 -S000006895 long_terminal_repeat YERCdelta14 chromosome 5 5 431822 431490 C 2011-02-03 2000-05-19 Ty1 LTR -S000000935 ORF Verified YER133W GLC7 type 1 serine/threonine-protein phosphatase catalytic subunit GLC7|DIS2S1|PP1|DIS2|CID1 chromosome 5 L000000706 5 432495 433958 W 2011-02-03 1996-07-31 Type 1 S/T protein phosphatase (PP1) catalytic subunit; involved in glycogen metabolism, sporulation and mitotic progression; interacts with multiple regulatory subunits; regulates actomyosin ring formation; subunit of CPF; recruited to mating projections by Afr1p interaction; regulates nucleocytoplasmic shuttling of Hxk2p; import into the nucleus is inhibited during spindle assembly checkpoint arrest; involved in dephosphorylating Rps6a/b and Bnr1p -S000032307 CDS YER133W 5 432495 432671 W 2011-02-03 1996-07-31 -S000032308 CDS YER133W 5 433197 433958 W 2011-02-03 1996-07-31 -S000032309 intron YER133W 5 432672 433196 W 2011-02-03 1996-07-31 -S000006594 tRNA_gene tH(GUG)E2 chromosome 5 L000003803 5 434612 434541 C 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000035212 noncoding_exon tH(GUG)E2 5 434612 434541 C 2011-02-03 2000-05-19 -S000006906 long_terminal_repeat YERCsigma3 chromosome 5 5 434971 434631 C 2011-02-03 2000-05-19 Ty3 LTR -S000006896 long_terminal_repeat YERCdelta15 chromosome 5 5 435447 435128 C 2011-02-03 2000-05-19 Ty1 LTR -S000006619 tRNA_gene tK(CUU)E2 chromosome 5 L000003802 5 435824 435752 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000037795 noncoding_exon tK(CUU)E2 5 435824 435752 C 2011-02-03 2000-05-19 -S000006897 long_terminal_repeat YERCdelta16 chromosome 5 5 436277 435946 C 2011-02-03 2000-05-19 Ty1 LTR -S000006909 long_terminal_repeat YERCtau3 chromosome 5 5 436605 436279 C 2011-02-03 2000-05-19 Ty4 LTR -S000028756 ORF Dubious YER133W-A chromosome 5 5 437191 437532 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF YER134C -S000033450 CDS YER133W-A 5 437191 437532 W 2011-02-03 2003-07-29 -S000000936 ORF Verified YER134C Mg-dependent acid phosphatase|MDP-1 chromosome 5 5 437803 437267 C 2011-02-03 1996-07-31 Magnesium-dependent acid phosphatase; member of the haloacid dehalogenase superfamily; non-essential gene -S000032339 CDS YER134C 5 437803 437267 C 2011-02-03 1996-07-31 -S000000937 ORF Uncharacterized YER135C chromosome 5 5 438344 437952 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YER135C is not an essential gene -S000032452 CDS YER135C 5 438344 437952 C 2011-02-03 1996-07-31 -S000006753 tRNA_gene tV(AAC)E1 chromosome 5 L000003796 5 438700 438773 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000035942 noncoding_exon tV(AAC)E1 5 438700 438773 W 2011-02-03 2000-05-19 -S000077390 ARS ARS518 ARSV-439 chromosome 5 5 438934 439182 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence -S000178091 ARS_consensus_sequence ARS518 5 439102 439086 C 2014-11-18 2014-11-18 -S000000938 ORF Verified YER136W GDI1 SEC19 chromosome 5 L000000699 5 439616 440971 W 2011-02-03 1996-07-31 GDP dissociation inhibitor; regulates vesicle traffic in secretory pathways by regulating the dissociation of GDP from the Sec4/Ypt/rab family of GTP binding proteins -S000033298 CDS YER136W 5 439616 440971 W 2011-02-03 1996-07-31 -S000028757 ORF Dubious YER137W-A chromosome 5 5 441575 441880 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YER137C -S000033451 CDS YER137W-A 5 441575 441880 W 2011-02-03 2003-07-29 -S000000939 ORF Uncharacterized YER137C chromosome 5 5 441819 441373 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000033341 CDS YER137C 5 441819 441373 C 2011-02-03 1996-07-31 -S000006491 ncRNA_gene SCR1 SCR1 chromosome 5 L000001818 5 441987 442508 W 2011-02-03 2000-05-19|2004-10-08 RNA subunit of the Signal Recognition Particle (SRP) -S000034550 noncoding_exon SCR1 5 441987 442508 W 2011-02-03 2000-05-19|2004-10-08 -S000077391 ARS ARS519 chromosome 5 5 442416 442735 2011-02-03 2004-10-19 Autonomously Replicating Sequence -S000006917 long_terminal_repeat YERWdelta17 chromosome 5 5 442734 443072 W 2011-02-03 2000-05-19 Ty1 LTR -S000006602 tRNA_gene tI(AAU)E1 chromosome 5 L000003801 5 443275 443202 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000037353 noncoding_exon tI(AAU)E1 5 443275 443202 C 2011-02-03 2000-05-19 -S000006898 long_terminal_repeat YERCdelta19 chromosome 5 5 443733 443397 C 2011-02-03 2000-05-19 Ty1 LTR -S000006919 long_terminal_repeat YERWdelta21 chromosome 5 5 444834 445139 W 2011-02-03 2000-05-19 Ty1 LTR -S000000940 transposable_element_gene YER138C gag-pol fusion protein chromosome 5 5 449024 443756 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000033407 CDS YER138C 5 447721 443756 C 2011-02-03 1996-07-31 -S000033406 CDS YER138C 5 449024 447723 C 2011-02-03 1996-07-31 -S000033408 plus_1_translational_frameshift YER138C 5 447722 447722 C 2011-02-03 1996-07-31 -S000007402 transposable_element_gene YER137C-A gag protein chromosome 5 5 449024 447702 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000034807 CDS YER137C-A 5 449024 447702 C 2011-02-03 1999-07-17 -S000006910 LTR_retrotransposon YERCTy1-1 Ty1 chromosome 5 5 449320 443397 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006899 long_terminal_repeat YERCdelta20 chromosome 5 5 449320 448984 C 2011-02-03 2000-05-19 Ty1 LTR -S000007239 ORF Uncharacterized YER138W-A chromosome 5 5 449474 449578 W 2011-02-03 1999-07-17 Putative protein of unknown function; YER138W-A has a paralog, YBL107W-A, that arose from a single-locus duplication -S000030980 CDS YER138W-A 5 449474 449578 W 2011-02-03 1999-07-17 -S000000941 ORF Verified YER139C RTR1 RNA polymerase II subunit B1 CTD phosphatase RTR1 chromosome 5 5 451243 450563 C 2011-02-03 1996-07-31 CTD phosphatase; dephosphorylates S5-P in the C-terminal domain of Rpo21p; has a cysteine-rich motif required for function and conserved in eukaryotes; shuttles between the nucleus and cytoplasm; RTR1 has a paralog, RTR2, that arose from the whole genome duplication -S000034331 CDS YER139C 5 451243 450563 C 2011-02-03 1996-07-31 -S000000942 ORF Verified YER140W EMP65 chromosome 5 5 451565 453235 W 2011-02-03 1996-07-31 Integral membrane protein of the ER; forms an ER-membrane associated protein complex with Slp1p; identified along with SLP1 in a screen for mutants defective in the unfolded protein response (UPR); proposed to function in the folding of integral membrane proteins; interacts genetically with MPS3; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000035305 CDS YER140W 5 451565 453235 W 2011-02-03 1996-07-31 -S000000943 ORF Verified YER141W COX15 chromosome 5 L000002578 5 453459 454919 W 2011-02-03 1996-07-31 Protein required for the hydroxylation of heme O to form heme A; heme A is an essential prosthetic group for cytochrome c oxidase -S000035366 CDS YER141W 5 453459 454919 W 2011-02-03 1996-07-31 -S000000944 ORF Verified YER142C MAG1 MMS5 chromosome 5 L000000976 5 456036 455146 C 110 2011-02-03 1996-07-31 3-methyl-adenine DNA glycosylase; involved in protecting DNA against alkylating agents; initiates base excision repair by removing damaged bases to create abasic sites that are subsequently repaired; protein abundance increases in response to DNA replication stress -S000035403 CDS YER142C 5 456036 455146 C 2011-02-03 1996-07-31 -S000000945 ORF Verified YER143W DDI1 VSM1 chromosome 5 L000004257 5 456319 457605 W 2011-02-03 1996-07-31 DNA damage-inducible v-SNARE binding protein; role in suppression of protein secretion; may play a role in S-phase checkpoint control; has ubiquitin-associated (UBA), ubiquitin-like (UBL), and retroviral-like proteinase (RVP) domains -S000035500 CDS YER143W 5 456319 457605 W 2011-02-03 1996-07-31 -S000000946 ORF Verified YER144C UBP5 putative ubiquitin-specific protease UBP5 chromosome 5 L000002419 5 460223 457806 C 2011-02-03 1996-07-31 Putative ubiquitin-specific protease; concentrates at the bud neck; UBP5 has a paralog, DOA4, that arose from the whole genome duplication -S000035528 CDS YER144C 5 460223 457806 C 2011-02-03 1996-07-31 -S000000947 ORF Verified YER145C FTR1 high-affinity iron permease FTR1 chromosome 5 L000003066 5 461740 460526 C 2011-02-03 1996-07-31 High affinity iron permease; involved in the transport of iron across the plasma membrane; forms complex with Fet3p; expression is regulated by iron; protein abundance increases in response to DNA replication stress -S000035592 CDS YER145C 5 461740 460526 C 2011-02-03 1996-07-31 -S000000948 ORF Verified YER146W LSM5 RNA-binding protein LSM5 chromosome 5 L000004684 5 462585 462866 W 2011-02-03 1996-07-31 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA -S000036550 CDS YER146W 5 462585 462866 W 2011-02-03 1996-07-31 -S000028758 ORF Dubious YER145C-A chromosome 5 5 462823 462386 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF LSM5/YER146W -S000033452 CDS YER145C-A 5 462823 462386 C 2011-02-03 2003-07-29 -S000000949 ORF Verified YER147C SCC4 cohesin-loading factor complex subunit SCC4 chromosome 5 5 464842 462968 C 2011-02-03 1996-07-31 Subunit of cohesin loading factor (Scc2p-Scc4p); complex is required for the loading of cohesin complexes onto chromosomes; involved in establishing sister chromatid cohesion during double-strand break repair via phosphorylated histone H2AX -S000036587 CDS YER147C 5 464842 462968 C 2011-02-03 1996-07-31 -S000000950 ORF Verified YER148W SPT15 TATA-binding protein|TBP|TBP1|BTF1 chromosome 5 L000002037 5 465303 466025 W 110 2011-02-03 1996-07-31 TATA-binding protein (TBP); general transcription factor that interacts with other factors to form the preinitiation complex at promoters; essential for viability, highly conserved; yeast gene can complement mutations in human homolog TBP -S000037378 CDS YER148W 5 465303 466025 W 2011-02-03 1996-07-31 -S000028759 ORF Dubious YER147C-A chromosome 5 5 465613 465203 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SPT15/YER148W -S000033453 CDS YER147C-A 5 465613 465203 C 2011-02-03 2003-07-29 -S000028760 ORF Dubious YER148W-A chromosome 5 5 466185 466763 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF PEA2/YER149C -S000033464 CDS YER148W-A 5 466185 466763 W 2011-02-03 2003-07-29 -S000000951 ORF Verified YER149C PEA2 PPF2|DFG9 chromosome 5 L000003143 5 467470 466208 C 2011-02-03 1996-07-31 Coiled-coil 12S polarisome subunit; required for polarity establishment, apical bud growth, shmoo formation, filamentous differentiation; involved in Bni1p localization at sites of polarized growth, controlling polarized assembly of actin cables; role in apical growth affects diploid-specific bipolar bud site selection; retains Slt2p at bud tip to regulate ER inheritance; role in Ca2+ influx, cell fusion; S288C allele encoding Leu409 rather than Met linked with non-invasion -S000037418 CDS YER149C 5 467470 466208 C 2011-02-03 1996-07-31 -S000000952 ORF Verified YER150W SPI1 chromosome 5 L000004852 5 468370 468816 W 2011-02-03 1996-07-31 GPI-anchored cell wall protein involved in weak acid resistance; basal expression requires Msn2p/Msn4p; expression is induced under conditions of stress and during the diauxic shift; SPI1 has a paralog, SED1, that arose from the whole genome duplication -S000030182 CDS YER150W 5 468370 468816 W 2011-02-03 1996-07-31 -S000006754 tRNA_gene tV(AAC)E2 chromosome 5 L000003797 5 469457 469530 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000035943 noncoding_exon tV(AAC)E2 5 469457 469530 W 2011-02-03 2000-05-19 -S000000953 ORF Verified YER151C UBP3 mRNA-binding ubiquitin-specific protease UBP3|BLM3 chromosome 5 L000002417|S000086717 5 472424 469686 C 2011-02-03 1996-07-31 Ubiquitin-specific protease involved in transport and osmotic response; negatively regulates Ras/PKA signaling; interacts with Bre5p to coregulate anterograde, retrograde transport between ER and Golgi; involved in transcription elongation in response to osmostress through phosphorylation at Ser695 by Hog1p; inhibitor of gene silencing; role in ribophagy; cleaves ubiquitin fusions but not polyubiquitin; protein abundance increases in response to DNA replication stress -S000030288 CDS YER151C 5 472424 469686 C 2011-02-03 1996-07-31 -S000028761 ORF Dubious YER152W-A chromosome 5 5 473485 474051 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YER152C -S000033465 CDS YER152W-A 5 473485 474051 W 2011-02-03 2003-07-29 -S000000954 ORF Verified YER152C 2-aminoadipate transaminase chromosome 5 5 473988 472657 C 2011-02-03 1996-07-31 Protein with 2-aminoadipate transaminase activity; shares amino acid similarity with the aminotransferases Aro8p and Aro9p; YER152C is not an essential gene -S000030401 CDS YER152C 5 473988 472657 C 2011-02-03 1996-07-31 -S000000955 ORF Verified YER153C PET122 chromosome 5 L000001397 5 474805 474041 C 118 2011-02-03 1996-07-31 Mitochondrial translational activator specific for the COX3 mRNA; acts together with Pet54p and Pet494p; located in the mitochondrial inner membrane -S000031314 CDS YER153C 5 474805 474041 C 2011-02-03 1996-07-31 -S000000956 ORF Verified YER154W OXA1 membrane insertase OXA1|PET1402 chromosome 5 L000001318 5 475020 476228 W 112 2011-02-03 1996-07-31 Mitochondrial inner membrane insertase; mediates the insertion of both mitochondrial- and nuclear-encoded proteins from the matrix into the inner membrane; also has a role in insertion of carrier proteins into the inner membrane; acts as a voltage-gated ion channel, activated by substrate peptides; interacts with mitochondrial ribosomes; conserved from bacteria to animals -S000031446 CDS YER154W 5 475020 476228 W 2011-02-03 1996-07-31 -S000000957 ORF Verified YER155C BEM2 TSL1|SUP9|IPL2 chromosome 5 L000000168 5 482848 476345 C 119 2011-02-03 1996-07-31 Rho GTPase activating protein (RhoGAP); involved in the control of cytoskeleton organization and cellular morphogenesis; required for bud emergence; potential GAP for Rho4p -S000031485 CDS YER155C 5 482848 476345 C 2011-02-03 1996-07-31 -S000000958 ORF Uncharacterized YER156C chromosome 5 5 484341 483325 C 2011-02-03 1996-07-31 Putative protein of unknown function; interacts with Hsp82p and copurifies with Ipl1p; expression is copper responsive and downregulated in strains deleted for MAC1, a copper-responsive transcription factor; similarity to mammalian MYG1 -S000031540 CDS YER156C 5 484341 483325 C 2011-02-03 1996-07-31 -S000000959 ORF Verified YER157W COG3 Golgi transport complex subunit COG3|SEC34|GRD20 chromosome 5 L000004876 5 484788 487193 W 2011-02-03 1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000032561 CDS YER157W 5 484788 487193 W 2011-02-03 1996-07-31 -S000006552 tRNA_gene tE(UUC)E3 chromosome 5 L000003800 5 487402 487331 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin -S000034442 noncoding_exon tE(UUC)E3 5 487402 487331 C 2011-02-03 2000-05-19 -S000006920 long_terminal_repeat YERWdelta22 chromosome 5 5 487834 488165 W 2011-02-03 2000-05-19 Ty1 LTR -S000000960 ORF Uncharacterized YER158C chromosome 5 5 490578 488857 C 2011-02-03 1996-07-31 Protein of unknown function; potentially phosphorylated by Cdc28p; YER158C has a paralog, AFR1, that arose from the whole genome duplication -S000032616 CDS YER158C 5 490578 488857 C 2011-02-03 1996-07-31 -S000028624 ORF Dubious YER158W-A chromosome 5 5 491487 491702 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031478 CDS YER158W-A 5 491487 491702 W 2011-02-03 2003-07-29 -S000000961 ORF Verified YER159C BUR6 negative cofactor 2 transcription regulator complex subunit BUR6|NCB1 chromosome 5 L000003240 5 491958 491530 C 2011-02-03 1996-07-31 Subunit of a heterodimeric NC2 transcription regulator complex; complex binds to TBP and can repress transcription by preventing preinitiation complex assembly or stimulate activated transcription; homologous to human NC2alpha; complex also includes Ncb2p; bur6 ncb2 double mutation is functionally complemented by coexpression of human DRAP1 and DR1, although the single bur6 mutation is not complemented by its ortholog DRAP1 -S000032723 CDS YER159C 5 491958 491530 C 2011-02-03 1996-07-31 -S000006701 tRNA_gene tR(ACG)E chromosome 5 L000003799 5 492424 492352 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000030371 noncoding_exon tR(ACG)E 5 492424 492352 C 2011-02-03 2000-05-19 -S000006900 long_terminal_repeat YERCdelta23 chromosome 5 5 492833 492695 C 2011-02-03 2000-05-19 Ty1 LTR -S000000962 transposable_element_gene YER160C gag-pol fusion protein chromosome 5 5 498124 492856 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000034492 CDS YER160C 5 496821 492856 C 2011-02-03 1996-07-31 -S000034491 CDS YER160C 5 498124 496823 C 2011-02-03 1996-07-31 -S000034493 plus_1_translational_frameshift YER160C 5 496822 496822 C 2011-02-03 1996-07-31 -S000007403 transposable_element_gene YER159C-A gag protein chromosome 5 5 498124 496802 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000030149 CDS YER159C-A 5 498124 496802 C 2011-02-03 1999-07-17 -S000006911 LTR_retrotransposon YERCTy1-2 Ty1 chromosome 5 5 498421 492695 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006901 long_terminal_repeat YERCdelta24 chromosome 5 5 498421 498084 C 2011-02-03 2000-05-19 Ty1 LTR -S000077392 ARS ARS520 chromosome 5 5 498884 499182 2014-11-18 2004-10-19|2014-11-18 Autonomously Replicating Sequence -S000178092 ARS_consensus_sequence ARS520 5 498884 498900 W 2014-11-18 2014-11-18 -S000000963 ORF Verified YER161C SPT2 EXA1|SIN1 chromosome 5 L000002028 5 500348 499347 C 127 2011-02-03 1996-07-31 Protein involved in negative regulation of transcription; required for RNA polyadenylation; exhibits regulated interactions with both histones and SWI-SNF components; relocalizes to the cytosol in response to hypoxia; similar to mammalian HMG1 proteins -S000034600 CDS YER161C 5 500348 499347 C 2011-02-03 1996-07-31 -S000000964 ORF Verified YER162C RAD4 chromosome 5 L000001558 5 502894 500630 C 128 2011-02-03 1996-07-31|2011-02-03 Protein that recognizes and binds damaged DNA (with Rad23p) during NER; subunit of Nuclear Excision Repair Factor 2 (NEF2); also involved, with Rad23p, in turnover of ubiquitylated proteins; Rad4p-Rad23p heterodimer binds to promoters of DNA damage response genes to repress their transcription in the absence of DNA damage; NER stands for nucleotide excision repair -S000034668 CDS YER162C 5 502894 500630 C 2011-02-03 1996-07-31|2011-02-03 -S000000965 ORF Verified YER163C GCG1 gamma-glutamylcyclotransferase chromosome 5 5 503782 503084 C 2011-02-03 1996-07-31 Gamma-glutamyl cyclotransferase; cleaves the gamma-glutamyl bond of glutathione to yield 5-oxoproline and a Cys-Gly dipeptide; similar to mammalian pro-apoptotic protein ChaC1; expression of mouse ChaC1 in yeast increases apoptosis; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; periodically expressed during the metabolic cycle -S000034748 CDS YER163C 5 503782 503084 C 2011-02-03 1996-07-31 -S000000966 ORF Verified YER164W CHD1 chromatin-remodeling ATPase CHD1 chromosome 5 L000003467 5 505392 509798 W 2011-02-03 1996-07-31 Chromatin remodeler that regulates various aspects of transcription; acts in in conjunction with Isw1b to regulate chromatin structure and maintain chromatin integrity during transcription elongation by RNAP II by preventing trans-histone exchange over coding regions; contains a chromo domain, a helicase domain and a DNA-binding domain; component of both the SAGA and SLIK complexes -S000035707 CDS YER164W 5 505392 509798 W 2011-02-03 1996-07-31 -S000000967 ORF Verified YER165W PAB1 polyadenylate-binding protein chromosome 5 L000001327 5 510373 512106 W 2011-02-03 1996-07-31 Poly(A) binding protein; part of the 3'-end RNA-processing complex, mediates interactions between the 5' cap structure and the 3' mRNA poly(A) tail, involved in control of poly(A) tail length, interacts with translation factor eIF-4G; stimulates, but is not required for the deadenylation activity of the Pan2p-Pan3p poly(A)-ribonuclease complex -S000035793 CDS YER165W 5 510373 512106 W 2011-02-03 1996-07-31 -S000000968 ORF Verified YER166W DNF1 aminophospholipid-translocating P4-type ATPase DNF1 chromosome 5 5 512744 517459 W 2011-02-03 1996-07-31 Aminophospholipid translocase (flippase); type 4 P-type ATPase; involved in phospholipid translocation, contributing to endocytosis, protein transport, and cellular polarization; localizes primarily to the plasma membrane; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone; DNF1 has a paralog, DNF2, that arose from the whole genome duplication -S000035898 CDS YER166W 5 512744 517459 W 2011-02-03 1996-07-31 -S000028762 ORF Dubious YER165C-A chromosome 5 5 512983 512627 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene DNF1/YER166W -S000033466 CDS YER165C-A 5 512983 512627 C 2011-02-03 2003-07-29 -S000000969 ORF Verified YER167W BCK2 CTR7 chromosome 5 L000000163 5 518216 520771 W 2011-02-03 1996-07-31 Serine/threonine-rich protein involved in PKC1 signaling pathway; protein kinase C (PKC1) signaling pathway controls cell integrity; overproduction suppresses pkc1 mutations -S000036791 CDS YER167W 5 518216 520771 W 2011-02-03 1996-07-31 -S000077393 ARS ARS521 chromosome 5 5 520772 521030 2011-02-03 2004-10-19 Autonomously Replicating Sequence -S000000970 ORF Verified YER168C CCA1 tRNA adenylyltransferase|TNT1 chromosome 5 L000000232 5 522669 521029 C 2011-02-03 1996-07-31 ATP (CTP):tRNA-specific tRNA nucleotidyltransferase; different forms targeted to the nucleus, cytosol, and mitochondrion are generated via the use of multiple transcriptional and translational start sites; human homolog TRNT1 complements yeast null mutant -S000036817 CDS YER168C 5 522669 521029 C 2011-02-03 1996-07-31 -S000000971 ORF Verified YER169W RPH1 KDM4 chromosome 5 L000004504 5 523369 525759 W 2011-02-03 1996-07-31 JmjC domain-containing histone demethylase; targets tri- and dimethylated H3K36; associates with actively transcribed regions and promotes elongation; repressor of autophagy-related genes in nutrient-replete conditions; damage-responsive repressor of PHR1; phosphorylated by the Rad53p-dependent DNA damage checkpoint pathway and by a Rim1p-mediated event during starvation; target of stress-induced hormesis; RPH1 has a paralog, GIS1, that arose from the whole genome duplication -S000036928 CDS YER169W 5 523369 525759 W 2011-02-03 1996-07-31 -S000000972 ORF Verified YER170W ADK2 adenylate kinase ADK2|PAK3|AKY3 chromosome 5 L000000047 5 525974 526651 W 146 2011-02-03 1996-07-31 Mitochondrial adenylate kinase; catalyzes the reversible synthesis of GTP and AMP from GDP and ADP; may serve as a back-up for synthesizing GTP or ADP depending on metabolic conditions; 3' sequence of ADK2 varies with strain background -S000036684 CDS YER170W 5 525974 526651 W 2011-02-03 1996-07-31 -S000000973 ORF Verified YER171W RAD3 TFIIH/NER complex ATP-dependent 5'-3' DNA helicase subunit RAD3|REM1 chromosome 5 L000001557 5 527082 529418 W 146 2011-02-03 1996-07-31 5' to 3' DNA helicase; involved in nucleotide excision repair and transcription; subunit of RNA polII initiation factor TFIIH and of Nucleotide Excision Repair Factor 3 (NEF3); homolog of human XPD protein; mutant has aneuploidy tolerance; protein abundance increases in response to DNA replication stress -S000036770 CDS YER171W 5 527082 529418 W 2011-02-03 1996-07-31 -S000000974 ORF Verified YER172C BRR2 ATP-dependent RNA helicase BRR2|PRP44|SNU246|SLT22|RSS1 chromosome 5 L000003100|L000003283 5 536021 529530 C 2011-02-03 1996-07-31 RNA-dependent ATPase RNA helicase (DEIH box); required for disruption of U4/U6 base-pairing in native snRNPs to activate the spliceosome for catalysis; homologous to human U5-200kD -S000030569 CDS YER172C 5 536021 529530 C 2011-02-03 1996-07-31 -S000000975 ORF Verified YER173W RAD24 RS1 chromosome 5 L000001777 5 536300 538279 W 147 2011-02-03 1996-07-31 Checkpoint protein; involved in the activation of the DNA damage and meiotic pachytene checkpoints; subunit of a clamp loader that loads Rad17p-Mec3p-Ddc1p onto DNA; homolog of human and S. pombe Rad17 protein -S000030767 CDS YER173W 5 536300 538279 W 2011-02-03 1996-07-31 -S000028763 ORF Dubious YER172C-A chromosome 5 5 536655 536275 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF RAD24/YER173W -S000033467 CDS YER172C-A 5 536655 536275 C 2011-02-03 2003-07-29 -S000000976 ORF Verified YER174C GRX4 monothiol glutaredoxin GRX4 chromosome 5 S000007445 5 539168 538434 C 2011-02-03 1996-07-31 Glutathione-dependent oxidoreductase; hydroperoxide and superoxide-radical responsive; monothiol glutaredoxin subfamily member along with Grx3p and Grx5p; protects cells from oxidative damage; with Grx3p, binds to Aft1p in iron-replete conditions, promoting its dissociation from promoters; mutant has increased aneuploidy tolerance; transcription regulated by Yap5p; GRX4 has a paralog, GRX3, that arose from the whole genome duplication -S000030799 CDS YER174C 5 539168 538434 C 2011-02-03 1996-07-31 -S000000977 ORF Verified YER175C TMT1 TAM1 chromosome 5 5 540363 539464 C 2011-02-03 1996-07-31 Trans-aconitate methyltransferase; cytosolic enzyme that catalyzes the methyl esterification of 3-isopropylmalate, an intermediate of the leucine biosynthetic pathway, and trans-aconitate, which inhibits the citric acid cycle -S000031738 CDS YER175C 5 540363 539464 C 2011-02-03 1996-07-31 -S000028625 ORF Uncharacterized YER175W-A chromosome 5 5 540650 540814 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031479 CDS YER175W-A 5 540650 540814 W 2011-02-03 2003-07-29 -S000000978 ORF Verified YER176W ECM32 MTT1|HEL1 chromosome 5 L000003934 5 541690 545055 W 2011-02-03 1996-07-31 DNA dependent ATPase/DNA helicase; helicase belonging to the Dna2p- and Nam7p-like family of helicases that is involved in modulating translation termination; interacts with the translation termination factors, localized to polysomes -S000032015 CDS YER176W 5 541690 545055 W 2011-02-03 1996-07-31 -S000000979 ORF Verified YER177W BMH1 14-3-3 family protein BMH1|APR6 chromosome 5 L000000185 5 545611 546414 W 148 2011-02-03 1996-07-31 14-3-3 protein, major isoform; controls proteome at post-transcriptional level, binds proteins and DNA, involved in regulation of exocytosis, vesicle transport, Ras/MAPK and rapamycin-sensitive signaling, aggresome formation, spindle position checkpoint; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; antiapoptotic gene similar to human 14-3-3; BMH1 has a paralog, BMH2, that arose from whole genome duplication -S000032121 CDS YER177W 5 545611 546414 W 2011-02-03 1996-07-31 -S000000980 ORF Verified YER178W PDA1 pyruvate dehydrogenase (acetyl-transferring) subunit E1 alpha chromosome 5 L000001352 5 546817 548079 W 143 2011-02-03 2003-09-22|1996-07-31 E1 alpha subunit of the pyruvate dehydrogenase (PDH) complex; catalyzes the direct oxidative decarboxylation of pyruvate to acetyl-CoA; phosphorylated; regulated by glucose; PDH complex is concentrated in spots within the mitochondrial matrix, often near the ERMES complex and near peroxisomes -S000033032 CDS YER178W 5 546817 548079 W 2011-02-03 2003-09-22|1996-07-31 -S000000981 ORF Verified YER179W DMC1 recombinase DMC1|ISC2 chromosome 5 L000000509 5 548421 549517 W 2011-02-03 1996-07-31 Meiosis-specific recombinase required for double-strand break repair; also required for pairing between homologous chromosomes; required for the normal morphogenesis of synaptonemal complex; homolog of Rad51p and the bacterial RecA protein; binds ssDNA and dsDNA, forms helical filaments; stimulated by Rdh54p -S000033128 CDS YER179W 5 548421 548552 W 2011-02-03 1996-07-31 -S000033129 CDS YER179W 5 548645 549517 W 2011-02-03 1996-07-31 -S000033130 intron YER179W 5 548553 548644 W 2011-02-03 1996-07-31 -S000077394 ARS ARS522 ARSV-550|ARS501 chromosome 5 5 549566 549814 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence; active origin of replication near the right end of Chromosome V that is activated late in S phase, late activation appears to result from telomeric proximity -S000000982 ORF Verified YER180C ISC10 chromosome 5 L000000876 5 550527 549724 C 2011-02-03 1996-07-31 Protein required for sporulation; transcript is induced 7.5 hours after induction of meiosis, expected to play significant role in the formation of reproductive cells -S000032813 CDS YER180C 5 550527 549724 C 2011-02-03 1996-07-31 -S000028437 ORF Verified YER180C-A SLO1 chromosome 5 S000028475 5 551122 550865 C 2011-02-03 2003-03-07 Protein interacting with Arl3p; Arl3p is a GTPase of the Ras superfamily involved in vesicle-tethering at the Golgi; putative ortholog of human SCOCO -S000030116 CDS YER180C-A 5 551122 550865 C 2011-02-03 2003-03-07 -S000006603 tRNA_gene tI(AAU)E2 chromosome 5 L000003798 5 551358 551285 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000037354 noncoding_exon tI(AAU)E2 5 551358 551285 C 2011-02-03 2000-05-19 -S000006921 long_terminal_repeat YERWdelta25 chromosome 5 5 551442 551773 W 2011-02-03 2000-05-19 Ty1 LTR -S000000983 ORF Verified YER181C chromosome 5 5 551796 551473 C 2011-02-03 1996-07-31 Mitochondrial protein of unknown function; conserved among S. cerevisiae strains; extensively overlaps a Ty1 LTR; YER181C is not an essential gene -S000032942 CDS YER181C 5 551796 551473 C 2011-02-03 1996-07-31 -S000006902 long_terminal_repeat YERCdelta26 chromosome 5 5 552267 552040 C 2011-02-03 2000-05-19 Ty1 LTR -S000000984 ORF Uncharacterized YER182W FMP10 chromosome 5 5 552525 553259 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000034960 CDS YER182W 5 552525 553259 W 2011-02-03 1996-07-31 -S000000985 ORF Verified YER183C FAU1 5-formyltetrahydrofolate cyclo-ligase chromosome 5 5 553969 553334 C 2011-02-03 1996-07-31 5,10-methenyltetrahydrofolate synthetase; involved in folic acid biosynthesis -S000035021 CDS YER183C 5 553969 553334 C 2011-02-03 1996-07-31 -S000000986 ORF Verified YER184C TOG1 chromosome 5 5 558680 556296 C 2011-02-03 1996-07-31 Transcriptional activator of oleate genes; regulates genes involved in fatty acid utilization; zinc cluster protein; deletion confers sensitivity to Calcufluor white, and prevents growth on glycerol or lactate as sole carbon source -S000035120 CDS YER184C 5 558680 556296 C 2011-02-03 1996-07-31 -S000000987 ORF Verified YER185W PUG1 chromosome 5 5 559454 560365 W 2011-02-03 1996-07-31 Plasma membrane protein involved in protoprophyrin and heme transport; roles in the uptake of protoprophyrin IX and the efflux of heme; expression is induced under both low-heme and low-oxygen conditions; member of the fungal lipid-translocating exporter (LTE) family of proteins -S000036056 CDS YER185W 5 559454 560365 W 2011-02-03 1996-07-31 -S000000988 ORF Uncharacterized YER186C chromosome 5 5 562625 561705 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000036102 CDS YER186C 5 562625 561705 C 2011-02-03 1996-07-31 -S000006903 long_terminal_repeat YERComega1 chromosome 5 5 564024 563928 C 2011-02-03 2000-05-19 Ty5 LTR -S000000989 ORF Uncharacterized YER187W chromosome 5 5 566230 566655 W 2011-02-03 1996-07-31 Putative protein of unknown function; induced in respiratory-deficient cells -S000031676 CDS YER187W 5 566230 566655 W 2011-02-03 1996-07-31 -S000000990 ORF Dubious YER188W chromosome 5 5 568040 568759 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; large-scale analyses show mRNA expression increases under anaerobic conditions and two-hybrid interactions with Sst2p -S000031818 CDS YER188W 5 568040 568759 W 2011-02-03 1996-07-31 -S000006922 long_terminal_repeat YERWomega2 chromosome 5 5 568791 569024 W 2011-02-03 2000-05-19 Ty5 LTR -S000028953 telomere TEL05R chromosome 5 5 569599 576874 W 151 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome V; annotated components include an X element core sequence, X element combinatorial repeats, and a long Y' element; TEL05R does have telomeric repeats (TEL05R-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly -S000028954 X_element TEL05R 5 569599 570060 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome V; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YER188C-A -S000028955 X_element_combinatorial_repeat TEL05R 5 570061 570329 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr V; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; Formerly called SubTelomeric Repeats -S000028956 Y_prime_element TEL05R 5 570330 576874 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome V; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs (YRF1-2/YER190W, YER189W, YER190C-A, YER190C-B) -S000077395 ARS ARS523 chromosome 5 5 569618 569695 2014-11-18 2014-11-18|2004-10-19 Autonomously Replicating Sequence -S000178093 ARS_consensus_sequence ARS523 5 569629 569645 W 2014-11-18 2014-11-18 -S000028764 ORF Uncharacterized YER188C-A chromosome 5 5 569907 569608 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000033468 CDS YER188C-A 5 569907 569608 C 2011-02-03 2003-07-29 -S000000991 ORF Uncharacterized YER189W chromosome 5 5 571155 571523 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000031933 CDS YER189W 5 571155 571523 W 2011-02-03 1996-07-31 -S000000992 ORF Verified YER190W YRF1-2 Y' element ATP-dependent helicase protein 1 copy 2|YRF1 chromosome 5 5 571480 576525 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000036410 CDS YER190W 5 571480 576525 W 2011-02-03 1996-07-31 -S000028626 ORF Dubious YER190C-A chromosome 5 5 575379 574804 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF YRF1-2/YER190W; identified by gene-trapping, expression analysis, and homology -S000031482 CDS YER190C-A 5 575379 574804 C 2011-02-03 2003-07-29 -S000028627 ORF Uncharacterized YER190C-B chromosome 5 5 576162 575680 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031484 CDS YER190C-B 5 576162 575680 C 2011-02-03 2003-07-29 -S000001826 ORF Uncharacterized YFL068W chromosome 6 6 53 535 W 1996-07-31 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cytosol -S000030466 CDS YFL068W 6 53 535 W 1996-07-31 1996-07-31 -S000001827 ORF Uncharacterized YFL067W chromosome 6 6 836 1363 W 1996-07-31 1996-07-31 Protein of unknown function; down-regulated at low calcium levels; mCherry fusion protein localizes to the vacuole -S000037641 CDS YFL067W 6 836 1363 W 1996-07-31 1996-07-31 -S000001828 ORF Uncharacterized YFL066C Y' element ATP-dependent helicase chromosome 6 6 2615 1437 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element; induced by treatment with 8-methoxypsoralen and UVA irradiation; SWAT-GFP and mCherry fusion proteins localize to the nucleus -S000037520 CDS YFL066C 6 2615 1437 C 1996-07-31 1996-07-31 -S000001829 ORF Uncharacterized YFL065C chromosome 6 6 3338 3030 C 1996-07-31 1996-07-31 Putative protein of unknown function; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000037426 CDS YFL065C 6 3338 3030 C 1996-07-31 1996-07-31 -S000001830 ORF Uncharacterized YFL064C chromosome 6 6 3846 3322 C 1996-07-31 1996-07-31 Putative protein of unknown function -S000031930 CDS YFL064C 6 3846 3322 C 1996-07-31 1996-07-31 -S000001831 ORF Dubious YFL063W chromosome 6 6 5066 5521 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031881 CDS YFL063W 6 5066 5521 W 1996-07-31 1996-07-31 -S000029653 ARS ARS600 ARS600 ARS600.1|ARS120 chromosome 6 L000000123 6 5426 5529 2014-11-18 2014-11-18|2006-03-02 Subtelomeric Autonomously Replicating Sequence; originally published as ARS120 -S000114519 ARS_consensus_sequence ARS600 6 5492 5482 C 2006-03-02 2006-03-02 -S000028882 telomere TEL06L chromosome 6 6 5530 1 C -60 2003-09-09 2003-09-09|2011-02-03 Telomeric region on the left arm of Chromosome VI; composed of an X element core sequence, X element combinatorial repeats, a stretch of telomeric repeats, and a short Y' element -S000028883 telomeric_repeat TEL06L 6 4819 4685 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome VI -S000028884 X_element TEL06L 6 5530 5068 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome VI; contains an ARS consensus sequence, an Abf1p binding site consensus sequence and ORF YFL063W -S000028885 X_element_combinatorial_repeat TEL06L 6 5067 4820 C 2003-09-09 2003-09-09|2011-02-03 Telomeric X element combinatorial repeat on the left arm of Chr VI; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000028886 Y_prime_element TEL06L 6 4684 1 C 2003-09-09 2003-09-09 Telomeric short Y' element on the left arm of Chromosome VI; contains a region of 36-bp repeats and five ORFs (YFL064C, YFL065C, YFL066C, YFL067W, YFL068W) -S000001832 ORF Verified YFL062W COS4 chromosome 6 L000004062 6 6426 7565 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000031765 CDS YFL062W 6 6426 7565 W 1996-07-31 1996-07-31 -S000001833 ORF Verified YFL061W DDI2 cyanamide hydratase chromosome 6 6 9545 10222 W 1996-07-31 1996-07-31 Cyanamide hydratase that detoxifies cyanamide; member of the HD domain metalloprotein superfamily; expression is induced over 100-fold by cyanamide and by SN2-type DNA alkylating agents such as MMS and DMA; induction decreased in rad6 and rad18 mutants; gene and protein are identical to DDI3 and Ddi3p -S000036244 CDS YFL061W 6 9545 10222 W 1996-07-31 1996-07-31 -S000001834 ORF Verified YFL060C SNO3 putative pyridoxal 5'-phosphate synthase chromosome 6 L000003453 6 10969 10301 C 1996-07-31 1996-07-31 Protein of unknown function; nearly identical to Sno2p; expression is induced before the diauxic shift and also in the absence of thiamin -S000036055 CDS YFL060C 6 10969 10301 C 1996-07-31 1996-07-31 -S000001835 ORF Verified YFL059W SNZ3 pyridoxine biosynthesis protein SNZ3 chromosome 6 L000002577 6 11363 12259 W 1996-07-31 1996-07-31 Member of a stationary phase-induced gene family; expressed in the presence of galactose; transcription of SNZ3 is induced prior to diauxic shift, and also in the absence of thiamin in a Thi2p-dependent manner; forms a coregulated gene pair with SNO3 -S000035247 CDS YFL059W 6 11363 12259 W 1996-07-31 1996-07-31 -S000001836 ORF Verified YFL058W THI5 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 6 L000002850 6 12929 13951 W 1996-07-31 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP -S000035156 CDS YFL058W 6 12929 13951 W 1996-07-31 1996-07-31 -S000001838 pseudogene YFL056C AAD6 YFL057C chromosome 6 L000004638 6 15431 14305 C 2014-11-18 1996-07-31|2014-11-18 Putative aryl-alcohol dehydrogenase; involved in oxidative stress response; similar to P. chrysosporium aryl-alcohol dehydrogenase; ORFs AAD6/YFL056C and AAD16/YFL057C are displaced from one another by -1 frameshift; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family; expression induced in cells treated with the mycotoxin patulin -S000034007 CDS YFL056C 6 15431 14305 C 2014-11-18 1996-07-31|2014-11-18 -S000001839 ORF Verified YFL055W AGP3 chromosome 6 L000003948 6 17004 18680 W 1996-07-31 1996-07-31 Low-affinity amino acid permease; may act to supply the cell with amino acids as nitrogen source in nitrogen-poor conditions; transcription is induced under conditions of sulfur limitation; plays a role in regulating Ty1 transposition -S000033961 CDS YFL055W 6 17004 18680 W 1996-07-31 1996-07-31 -S000178094 ARS ARS600.4 chromosome 6 6 20702 20900 2014-11-18 2014-11-18 Strong autonomously replicating sequence -S000001840 ORF Uncharacterized YFL054C AQY3 chromosome 6 6 22787 20847 C 1996-07-31 1996-07-31 Putative channel-like protein; similar to Fps1p; mediates passive diffusion of glycerol in the presence of ethanol -S000033120 CDS YFL054C 6 22787 20847 C 1996-07-31 1996-07-31 -S000001841 ORF Verified YFL053W DAK2 dihydroxyacetone kinase chromosome 6 L000004204 6 23423 25198 W 1996-07-31 1996-07-31 Dihydroxyacetone kinase; required for detoxification of dihydroxyacetone (DHA); involved in stress adaptation -S000033090 CDS YFL053W 6 23423 25198 W 1996-07-31 1996-07-31 -S000001842 ORF Verified YFL052W ZNF1 DNA-binding domain containing protein|ROP1 chromosome 6 6 28232 29629 W 1996-07-31 1996-07-31 Zinc cluster transcription factor that regulates respiratory growth; binds to promoters of genes involved in respiration, gluconeogenesis, and the glyoxylate shunt; required for normal carbon source utilization and stress response -S000032997 CDS YFL052W 6 28232 29629 W 1996-07-31 1996-07-31 -S000001843 ORF Uncharacterized YFL051C chromosome 6 6 30540 30058 C 1996-07-31 1996-07-31 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the cell periphery while mCherry fusion protein localizes to both the cell periphery and vacuole; YFL051C is not an essential gene -S000032013 CDS YFL051C 6 30540 30058 C 1996-07-31 1996-07-31 -S000007633 ARS ARS601 ARS601 chromosome 6 6 32473 32995 2001-03-02 2001-03-02 Autonomously replicating sequence on Chromosome VI; overlaps ARS602, ARS601/ARS602 together appear to be activated during the second half of S phase in ~32% of cell cycles -S000121262 ARS_consensus_sequence ARS601 6 32708 32718 W 2007-03-08 2007-03-08 -S000007634 ARS ARS602 ARS602 chromosome 6 6 32667 33247 2001-03-02 2001-03-02 Autonomously replicating sequence on Chromosome VI; overlaps ARS601, ARS601/ARS602 together appear to be activated during the second half of S phase in ~32% of cell cycles -S000121263 ARS_consensus_sequence ARS602 6 32970 32960 C 2007-03-08 2007-03-08 -S000001844 ORF Verified YFL050C ALR2 putative Mg(2+) transporter ALR2 chromosome 6 L000002888 6 35848 33272 C 1996-07-31 1996-07-31 Probable Mg(2+) transporter; overexpression confers increased tolerance to Al(3+) and Ga(3+) ions; plays a role in regulating Ty1 transposition -S000031839 CDS YFL050C 6 35848 33272 C 1996-07-31 1996-07-31 -S000001845 ORF Verified YFL049W SWP82 chromosome 6 6 36803 38674 W 1996-07-31 1996-07-31 Member of the SWI/SNF chromatin remodeling complex; has an as yet unidentified role in the complex; has identifiable counterparts in closely related yeast species; abundantly expressed in many growth conditions; paralog of Npl6p; relocates to the cytosol under hypoxic conditions -S000030907 CDS YFL049W 6 36803 38674 W 1996-07-31 1996-07-31 -S000001846 ORF Verified YFL048C EMP47 chromosome 6 L000002804 6 40180 38843 C 1996-07-31 1996-07-31 Integral membrane component of ER-derived COPII-coated vesicles; functionS in ER to Golgi transport; EMP47 has a paralog, EMP46, that arose from the whole genome duplication -S000030785 CDS YFL048C 6 40180 38843 C 1996-07-31 1996-07-31 -S000001847 ORF Verified YFL047W RGD2 chromosome 6 6 40421 42565 W 1996-07-31 1996-07-31 GTPase-activating protein (RhoGAP) for Cdc42p and Rho5p; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000037893 CDS YFL047W 6 40421 42565 W 1996-07-31 1996-07-31 -S000001848 ORF Verified YFL046W FMP32 chromosome 6 6 42815 43438 W 1996-07-31 1996-07-31 Putative assembly factor for cytochrome c oxidase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; has similarity to human MCUR1/CCDC90A -S000037798 CDS YFL046W 6 42815 43438 W 1996-07-31 1996-07-31 -S000001849 ORF Verified YFL045C SEC53 phosphomannomutase SEC53|ALG4 chromosome 6 L000001849 6 44392 43628 C 1996-07-31 1996-07-31 Phosphomannomutase; involved in synthesis of GDP-mannose and dolichol-phosphate-mannose; required for folding and glycosylation of secretory proteins in the ER lumen -S000037699 CDS YFL045C 6 44392 43628 C 1996-07-31 1996-07-31 -S000001850 ORF Verified YFL044C OTU1 ubiquitin-specific protease OTU1|YOD1 chromosome 6 6 45560 44655 C 1996-07-31 1996-07-31 Deubiquitylation enzyme that binds to the chaperone-ATPase Cdc48p; may contribute to regulation of protein degradation by deubiquitylating substrates that have been ubiquitylated by Ufd2p; member of the Ovarian Tumor (OTU) family; protein abundance increases in response to DNA replication stress -S000036927 CDS YFL044C 6 45560 44655 C 1996-07-31 1996-07-31 -S000001852 ORF Verified YFL042C LAM5 LTC2|YFL043C chromosome 6 6 47744 45720 C 2001-05-29 2001-05-29|1996-07-31 Putative sterol transfer protein; one of six StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes; has both GRAM and StART-like (VASt) domains; localizes to membrane contact sites throughout the cell, including nucleus-vacuole junctions and ER-mitochondrial contact sites -S000036790 CDS YFL042C 6 47744 45720 C 2001-05-29 2001-05-29|1996-07-31 -S000028547 ORF Uncharacterized YFL041W-A chromosome 6 6 48734 48925 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031197 CDS YFL041W-A 6 48734 48925 W 2003-07-29 2003-07-29 -S000001853 ORF Verified YFL041W FET5 ferroxidase FET5 chromosome 6 L000002773 6 49139 51007 W 2001-05-29 1996-07-31 Multicopper oxidase; integral membrane protein with similarity to Fet3p; may have a role in iron transport -S000035986 CDS YFL041W 6 49139 51007 W 2001-05-29 1996-07-31 -S000001854 ORF Uncharacterized YFL040W chromosome 6 6 51350 52972 W 2001-05-29 1996-07-31 Putative transporter; member of the sugar porter family; YFL040W is not an essential gene; may have a role in intracellular sterol transport -S000035851 CDS YFL040W 6 51350 52972 W 2001-05-29 1996-07-31 -S000001855 ORF Verified YFL039C ACT1 actin|ABY1|END7 chromosome 6 L000000025 6 54696 53260 C -59 2011-02-03 1996-07-31|2011-02-03 Actin; structural protein involved in cell polarization, endocytosis, and other cytoskeletal functions -S000034732 CDS YFL039C 6 54377 53260 C 2001-05-29 1996-07-31 -S000034731 CDS YFL039C 6 54696 54687 C 2011-02-03 1996-07-31 -S000034733 intron YFL039C 6 54686 54378 C 2011-02-03 1996-07-31|2011-02-03 -S000001856 ORF Verified YFL038C YPT1 Rab family GTPase YPT1|YP2 chromosome 6 L000002543 6 55986 55366 C -59 2011-02-03 1996-07-31 Rab family GTPase; involved in the ER-to-Golgi step of the secretory pathway; complex formation with the Rab escort protein Mrs6p is required for prenylation of Ypt1p by type II protein geranylgeranyltransferase (Bet2p-Bet4p); binds to unspliced HAC1 mRNA; regulates the unfolded protein response (UPR) by promoting the decay of HAC1 RNA; localizes to the early Golgi, the transitional Golgi and ER membranes, pre-autophagosomal structures, and cytoplasmic vesicles -S000033828 CDS YFL038C 6 55986 55366 C 2011-02-03 1996-07-31 -S000001857 ORF Verified YFL037W TUB2 beta-tubulin|SHE8|ARM10 chromosome 6 L000002388 6 56336 57709 W -59 2011-02-03 1996-07-31 Beta-tubulin; associates with alpha-tubulin (Tub1p and Tub3p) to form tubulin dimer, which polymerizes to form microtubules; mutation in human ortholog is associated with congenital fibrosis of the extraocular muscles (CFEOM) with polymicrogyria -S000033779 CDS YFL037W 6 56336 57709 W 2011-02-03 1996-07-31 -S000130129 ncRNA_gene RUF21 RUF21 chromosome 6 6 58521 57815 C 2011-02-03 2009-05-04|2011-02-03 RNA of Unknown Function -S000130130 noncoding_exon RUF21 6 58521 57815 C 2011-02-03 2009-05-04|2011-02-03 -S000001858 ORF Verified YFL036W RPO41 DNA-directed RNA polymerase chromosome 6 L000001747 6 58782 62837 W 2011-02-03 1996-07-31 Mitochondrial RNA polymerase; single subunit enzyme similar to those of T3 and T7 bacteriophages; requires a specificity subunit encoded by MTF1 for promoter recognition; Mtf1p interacts with and stabilizes the Rpo41p-promoter complex, enhancing DNA bending and melting to facilitate pre-initiation open complex formation; Rpo41p also synthesizes RNA primers for mitochondrial DNA replication -S000033655 CDS YFL036W 6 58782 62837 W 2011-02-03 1996-07-31 -S000001859 ORF Verified YFL034C-B MOB2 YFL035C-A|YFL035C chromosome 6 L000003535|S000007658|S000002966 6 63993 63016 C 2011-02-03 1996-07-31 Activator of Cbk1p kinase; component of the RAM signaling network that regulates cellular polarity and morphogenesis; activation of Cbk1p facilitates the Ace2p-dependent daughter cell-specific transcription of genes involved in cell separation; similar to Mob1p -S000036508 CDS YFL034C-B 6 63859 63016 C 2011-02-03 1996-07-31 -S000036507 CDS YFL034C-B 6 63993 63974 C 2011-02-03 1996-07-31 -S000036509 intron YFL034C-B 6 63973 63860 C 2011-02-03 1996-07-31 -S000006436 ORF Verified YFL034C-A RPL22B eL22|ribosomal 60S subunit protein L22B|L22e|rp4|l1c|YL31|L22B|YFL035C-B chromosome 6 L000004513|S000002967 6 64932 64243 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L22A; required for translation of long 5' UTR of IME1 mRNA and meiotic entry; homologous to mammalian ribosomal protein L22, no bacterial homolog; RPL22B has a paralog, RPL22A, that arose from the whole genome duplication -S000036495 CDS YFL034C-A 6 64599 64243 C 2011-02-03 1996-07-31 -S000036494 CDS YFL034C-A 6 64932 64921 C 2011-02-03 1996-07-31 -S000036496 intron YFL034C-A 6 64920 64600 C 2011-02-03 1996-07-31 -S000001860 ORF Uncharacterized YFL034W MIL1 chromosome 6 6 65477 68698 W 2011-02-03 1996-07-31|2011-02-03 Predicted lipase; binds variant medium clathrin chain Apm2p and contributes to its membrane recruitment; putative integral membrane protein that interacts with Rpp0p component of ribosomal stalk -S000032866 CDS YFL034W 6 65477 68698 W 2011-02-03 1996-07-31|2011-02-03 -S000007635 ARS ARS603 ARS603 chromosome 6 6 68759 68861 2014-11-18 2001-03-02|2014-11-18 Highly-efficient autonomously replicating sequence on Chromosome VI; activated during the second half of S phase in ~67% of cell cycles -S000121268 ARS_consensus_sequence ARS603 6 68829 68839 W 2011-02-03 2007-03-08 -S000121269 ARS_consensus_sequence ARS603 6 68855 68845 C 2011-02-03 2007-03-08 -S000001861 ORF Verified YFL033C RIM15 protein kinase RIM15|TAK1 chromosome 6 L000003524|L000003204 6 74427 69115 C 2011-02-03 1996-07-31 Protein kinase involved in cell proliferation in response to nutrients; glucose-repressible; involved in signal transduction during cell proliferation in response to nutrients, specifically the establishment of stationary phase; identified as a regulator of IME2; phosphorylates Igo1p and Igo2p; substrate of Pho80p-Pho85p kinase -S000032693 CDS YFL033C 6 74427 69115 C 2011-02-03 1996-07-31 -S000001862 ORF Dubious YFL032W chromosome 6 6 74872 75192 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene HAC1/YFL031W; YFL032W is not an essential gene -S000032655 CDS YFL032W 6 74872 75192 W 2011-02-03 1996-07-31 -S000001863 ORF Verified YFL031W HAC1 transcription factor HAC1|IRE15|ERN4 chromosome 6 L000002611 6 75179 76147 W 2011-02-03 2001-05-29|1996-07-31 Basic leucine zipper (bZIP) transcription factor (ATF/CREB1 homolog); regulates the unfolded protein response, via UPRE binding, and membrane biogenesis; ER stress-induced splicing pathway facilitates efficient Hac1p synthesis; two functional forms of Hac1p are produced; translation initiation is repressed under non-stress conditions; protein abundance increases in response to DNA replication stress -S000031638 CDS YFL031W 6 75179 75839 W 2011-02-03 2001-05-29|1996-07-31 -S000031639 CDS YFL031W 6 76092 76147 W 2011-02-03 2001-05-29 -S000031640 intron YFL031W 6 75840 76091 W 2011-02-03 2001-05-29 -S000028629 ORF Dubious YFL031C-A YFL030C-A chromosome 6 6 76115 76014 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps HAC1/YFL031W; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000031489 CDS YFL031C-A 6 76115 76014 C 2011-02-03 2003-07-29 -S000001864 ORF Verified YFL030W AGX1 alanine--glyoxylate transaminase chromosome 6 6 76831 77988 W 2011-02-03 1996-07-31 Alanine:glyoxylate aminotransferase (AGT); catalyzes the synthesis of glycine from glyoxylate, which is one of three pathways for glycine biosynthesis in yeast; similar to mammalian and plant alanine:glyoxylate aminotransferases; human homolog AGXT complements yeast null mutant -S000031544 CDS YFL030W 6 76831 77988 W 2011-02-03 1996-07-31 -S000001865 ORF Verified YFL029C CAK1 cyclin-dependent protein kinase-activating kinase CAK1|CIV1 chromosome 6 L000003177 6 79161 78055 C 2011-02-03 1996-07-31 Cyclin-dependent kinase-activating kinase; required for passage through the cell cycle; phosphorylates and activates Cdc28p; nucleotide-binding pocket differs significantly from those of most other protein kinases -S000031499 CDS YFL029C 6 79161 78055 C 2011-02-03 1996-07-31 -S000001866 ORF Verified YFL028C CAF16 putative ATP-binding cassette family ATPase CAF16 chromosome 6 L000003418 6 80213 79344 C 2011-02-03 1996-07-31 Part of evolutionarily-conserved CCR4-NOT regulatory complex; contains single ABC-type ATPase domain but no transmembrane domain; interacts with several subunits of Mediator -S000030636 CDS YFL028C 6 80213 79344 C 2011-02-03 1996-07-31 -S000001867 ORF Verified YFL027C GYP8 chromosome 6 6 81912 80419 C 2011-02-03 1996-07-31 GTPase-activating protein for yeast Rab family members; Ypt1p is the preferred in vitro substrate but also acts on Sec4p, Ypt31p and Ypt32p; involved in the regulation of ER to Golgi vesicle transport -S000030523 CDS YFL027C 6 81912 80419 C 2011-02-03 1996-07-31 -S000001868 ORF Verified YFL026W STE2 alpha-factor pheromone receptor STE2 chromosome 6 L000002112 6 82580 83875 W -37 2011-02-03 1996-07-31|2011-02-03 Receptor for alpha-factor pheromone; seven transmembrane-domain GPCR that interacts with both pheromone and a heterotrimeric G protein to initiate the signaling response that leads to mating between haploid a and alpha cells -S000030488 CDS YFL026W 6 82580 83875 W 2011-02-03 1996-07-31|2011-02-03 -S000001869 ORF Verified YFL025C BST1 PER17 chromosome 6 L000004294 6 87234 84145 C 2011-02-03 1996-07-31 GPI inositol deacylase of the endoplasmic reticulum (ER); negatively regulates COPII vesicle formation; prevents production of vesicles with defective subunits; required for proper discrimination between resident ER proteins and Golgi-bound cargo molecules; functional ortholog of human PGAP1, mutation of which is associated with intellectual disability and encephalopathy -S000037627 CDS YFL025C 6 87234 84145 C 2011-02-03 1996-07-31 -S000001870 ORF Verified YFL024C EPL1 chromosome 6 L000004576 6 90345 87847 C 2011-02-03 1996-07-31 Subunit of NuA4, an essential histone H4/H2A acetyltransferase complex; conserved region at N-terminus is essential for interaction with the NPC (nucleosome core particle); required for autophagy; homologous to Drosophila Enhancer of Polycomb; coding sequence contains length polymorphisms in different strains -S000037484 CDS YFL024C 6 90345 87847 C 2011-02-03 1996-07-31 -S000001871 ORF Verified YFL023W BUD27 URI1 chromosome 6 S000007647 6 90986 93376 W 2011-02-03 1996-07-31 Unconventional prefoldin protein involved in translation initiation; required for correct assembly of RNAP I, II, and III in an Rpb5p-dependent manner; shuttles between nucleus and cytoplasm; mutants have inappropriate expression of nutrient sensitive genes due to translational derepression of Gcn4p transcription factor; diploid mutants show random budding; ortholog of human URI/RMP -S000037447 CDS YFL023W 6 90986 93376 W 2011-02-03 1996-07-31 -S000001872 ORF Verified YFL022C FRS2 phenylalanine--tRNA ligase subunit alpha chromosome 6 L000000630 6 95010 93499 C 2011-02-03 1996-07-31|2011-02-03 Alpha subunit of cytoplasmic phenylalanyl-tRNA synthetase; forms a tetramer with Frs1p to form active enzyme; evolutionarily distant from mitochondrial phenylalanyl-tRNA synthetase based on protein sequence, but substrate binding is similar -S000036666 CDS YFL022C 6 95010 93499 C 2011-02-03 1996-07-31|2011-02-03 -S000001873 ORF Verified YFL021W GAT1 MEP80|NIL1 chromosome 6 L000002835 6 95966 97498 W 2011-02-03 1996-07-31 Transcriptional activator of nitrogen catabolite repression genes; contains a GATA-1-type zinc finger DNA-binding motif; activity and localization regulated by nitrogen limitation and Ure2p; different translational starts produce two major and two minor isoforms that are differentially regulated and localized -S000036630 CDS YFL021W 6 95966 97498 W 2011-02-03 1996-07-31 -S000028766 ORF Dubious YFL021C-A chromosome 6 6 96615 95761 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF GAT1/YFL021W -S000033470 CDS YFL021C-A 6 96615 95761 C 2011-02-03 2003-07-29 -S000001874 ORF Verified YFL020C PAU5 seripauperin PAU5 chromosome 6 L000002815 6 99599 99231 C 2011-02-03 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; induced during alcoholic fermentation; induced by low temperature and also by anaerobic conditions; negatively regulated by oxygen and repressed by heme -S000036468 CDS YFL020C 6 99599 99231 C 2011-02-03 1996-07-31 -S000006924 long_terminal_repeat YFLWdelta1 chromosome 6 6 100581 100901 W 2011-02-03 2000-05-19 Ty1 LTR -S000001875 ORF Dubious YFL019C chromosome 6 6 100605 100252 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YFL019C is not an essential gene -S000035776 CDS YFL019C 6 100605 100252 C 2011-02-03 1996-07-31 -S000006681 tRNA_gene tP(UGG)F SUF9 chromosome 6 L000002157|L000003809 6 101376 101478 W -13 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in proline codons -S000035980 intron tP(UGG)F 6 101412 101442 W 2011-02-03 2000-05-19 -S000035978 noncoding_exon tP(UGG)F 6 101376 101411 W 2011-02-03 2000-05-19 -S000035979 noncoding_exon tP(UGG)F 6 101443 101478 W 2011-02-03 2000-05-19 -S000001876 ORF Verified YFL018C LPD1 dihydrolipoyl dehydrogenase|HPD1 chromosome 6 L000000951 6 103127 101628 C 2011-02-03 1996-07-31 Dihydrolipoamide dehydrogenase; the lipoamide dehydrogenase component (E3) of the pyruvate dehydrogenase and 2-oxoglutarate dehydrogenase multi-enzyme complexes; PDH complex is concentrated in spots within the mitochondrial matrix, often near the ERMES complex and near peroxisomes; LPD1 has a paralog, IRC15, that arose from the whole genome duplication -S000035657 CDS YFL018C 6 103127 101628 C 2011-02-03 1996-07-31 -S000002965 ORF Verified YFL017W-A SMX2 mRNA splicing protein SMX2|Sm G|SmG|YFL018W-A|SNP2 chromosome 6 L000001955 6 103699 103932 W 2011-02-03 1996-07-31 Core Sm protein Sm G; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Smd3p, Sme1p, and Smx3p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm G -S000037748 CDS YFL017W-A 6 103699 103932 W 2011-02-03 1996-07-31 -S000001877 ORF Verified YFL017C GNA1 glucosamine 6-phosphate N-acetyltransferase|PAT1 chromosome 6 L000004865 6 104462 103983 C 2011-02-03 1996-07-31 Glucosamine-6-phosphate acetyltransferase; evolutionarily conserved; required for multiple cell cycle events including passage through START, DNA synthesis, and mitosis; involved in UDP-N-acetylglucosamine synthesis, forms GlcNAc6P from AcCoA -S000035587 CDS YFL017C 6 104462 103983 C 2011-02-03 1996-07-31 -S000178095 ARS ARS603.1 chromosome 6 6 104463 104701 2014-11-18 2014-11-18 Very weak autonomously replicating sequence -S000001878 ORF Verified YFL016C MDJ1 chromosome 6 L000001048 6 106236 104701 C 2011-02-03 1996-07-31 Co-chaperone that stimulates HSP70 protein Ssc1p ATPase activity; involved in protein folding/refolding in the mitochodrial matrix; required for proteolysis of misfolded proteins; member of the HSP40 (DnaJ) family of chaperones -S000035478 CDS YFL016C 6 106236 104701 C 2011-02-03 1996-07-31 -S000028765 ORF Dubious YFL015W-A chromosome 6 6 106415 106732 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YFL015C -S000033469 CDS YFL015W-A 6 106415 106732 W 2011-02-03 2003-07-29 -S000001879 ORF Dubious YFL015C chromosome 6 6 106963 106469 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious ORF YFL015W-A; YFL015C is not an essential gene -S000034451 CDS YFL015C 6 106963 106469 C 2011-02-03 1996-07-31 -S000001880 ORF Verified YFL014W HSP12 lipid-binding protein HSP12|HOR5|GLP1 chromosome 6 L000000816 6 107256 107585 W 2011-02-03 1996-07-31 Plasma membrane protein involved in maintaining membrane organization; involved in maintaining organization during stress conditions; induced by heat shock, oxidative stress, osmostress, stationary phase, glucose depletion, oleate and alcohol; protein abundance increased in response to DNA replication stress and dietary restriction; regulated by the HOG and Ras-Pka pathways; required for dietary restriction-induced lifespan extension -S000034418 CDS YFL014W 6 107256 107585 W 2011-02-03 1996-07-31 -S000028628 ORF Dubious YFL013W-A chromosome 6 6 107799 108602 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps IES1/YFL013C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000031487 CDS YFL013W-A 6 107799 108602 W 2011-02-03 2003-07-29 -S000002964 ORF Dubious YFL012W-A YFL013W-A chromosome 6 6 109810 110184 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene IES1/YFL013C -S000029905 CDS YFL012W-A 6 109810 110184 W 2011-02-03 1996-07-31 -S000001881 ORF Verified YFL013C IES1 chromosome 6 6 109930 107852 C 2011-02-03 1996-07-31 Subunit of the INO80 chromatin remodeling complex; relocalizes to the cytosol in response to hypoxia -S000034280 CDS YFL013C 6 109930 107852 C 2011-02-03 1996-07-31 -S000001882 ORF Uncharacterized YFL012W chromosome 6 6 110647 111093 W 2011-02-03 1996-07-31 Putative protein of unknown function; transcribed during sporulation; null mutant exhibits increased resistance to rapamycin -S000033440 CDS YFL012W 6 110647 111093 W 2011-02-03 1996-07-31 -S000001883 ORF Verified YFL011W HXT10 hexose transporter HXT10 chromosome 6 L000000844 6 112345 113985 W 2011-02-03 1996-07-31 Putative hexose transporter; expressed at low levels and expression is repressed by glucose -S000033350 CDS YFL011W 6 112345 113985 W 2011-02-03 1996-07-31 -S000001955 ORF Verified YFL010W-A AUA1 YFL011W-A chromosome 6 L000000156 6 114990 115274 W 2011-02-03 1999-07-17 Protein required for the negative regulation by ammonia of Gap1p; Gap1p is a general amino acid permease -S000031553 CDS YFL010W-A 6 114990 115274 W 2011-02-03 1999-07-17 -S000001884 ORF Verified YFL010C WWM1 chromosome 6 6 115743 115108 C 2011-02-03 1996-07-31 WW domain containing protein of unknown function; binds to Mca1p, a caspase-related protease that regulates H2O2-induced apoptosis; overexpression causes G1 phase growth arrest and clonal death that is suppressed by overexpression of MCA1 -S000033237 CDS YFL010C 6 115743 115108 C 2011-02-03 1996-07-31 -S000001885 ORF Verified YFL009W CDC4 SCF ubiquitin ligase complex subunit CDC4 chromosome 6 L000000244 6 116145 118484 W -9 2011-02-03 1996-07-31 F-box protein required for both the G1/S and G2/M phase transitions; modular substrate specificity factor which associates with core SCF (Cdc53p, Skp1p and Hrt1p/Rbx1p) to form the SCFCdc4 complex; SCFCdc4 acts as a ubiquitin-protein ligase directing ubiquitination of cyclin-dependent kinase (CDK) phosphorylated substrates, such as: Sic1p, Far1p, Cdc6p, Clb6p, and Cln3p -S000032546 CDS YFL009W 6 116145 118484 W 2011-02-03 1996-07-31 -S000007645 ARS ARS603.5 ARS603.5 chromosome 6 6 118637 118957 2011-02-03 2001-03-15 Autonomously replicating sequence on Chromosome VI; activated early in S phase in ~50% of cell cycles -S000121270 ARS_consensus_sequence ARS603.5 6 118688 118678 C 2011-02-03 2007-03-08 -S000001886 ORF Verified YFL008W SMC1 cohesin subunit SMC1|CHL10 chromosome 6 L000001926 6 119429 123106 W -10 2011-02-03 1996-07-31 Subunit of the multiprotein cohesin complex; essential protein involved in chromosome segregation and in double-strand DNA break repair; SMC chromosomal ATPase family member, binds DNA with a preference for DNA with secondary structure -S000032447 CDS YFL008W 6 119429 123106 W 2011-02-03 1996-07-31 -S000001887 ORF Verified YFL007W BLM10 YFL006W chromosome 6 S000007437 6 123479 129910 W 2011-02-03 2003-09-26|1996-07-31 Proteasome activator; binds the core proteasome (CP) and stimulates proteasome-mediated protein degradation by inducing gate opening; required for sequestering CP into proteasome storage granule (PSG) during quiescent phase and for nuclear import of CP in proliferating cells; required for resistance to bleomycin, may be involved in protecting against oxidative damage; similar to mammalian PA200 -S000031431 CDS YFL007W 6 123479 129910 W 2011-02-03 2003-09-26|1996-07-31 -S000007636 ARS ARS604 ARS604 chromosome 6 6 127751 128071 2011-02-03 2001-03-02 Extremely inefficient ARS on Chromosome VI -S000121271 ARS_consensus_sequence ARS604 6 127869 127879 W 2011-02-03 2007-03-08 -S000001889 ORF Verified YFL005W SEC4 Rab family GTPase SEC4|SRO6 chromosome 6 L000001830 6 130334 130981 W -6 2011-02-03 1996-07-31 Rab family GTPase; essential for vesicle-mediated exocytic secretion and autophagy; associates with the exocyst component Sec15p and may regulate polarized delivery of transport vesicles to the exocyst at the plasma membrane -S000031208 CDS YFL005W 6 130334 130981 W 2011-02-03 1996-07-31 -S000130127 ncRNA_gene RUF20 RUF20 chromosome 6 6 131503 131061 C 2011-02-03 2009-05-04 RNA of Unknown Function -S000130128 noncoding_exon RUF20 6 131503 131061 C 2011-02-03 2009-05-04 -S000001890 ORF Verified YFL004W VTC2 vacuolar transporter chaperone|PHM1 chromosome 6 S000007511 6 131810 134296 W 2011-02-03 1996-07-31 Regulatory subunit of the vacuolar transporter chaperone (VTC) complex; involved in membrane trafficking, vacuolar polyphosphate accumulation, microautophagy and non-autophagic vacuolar fusion; VTC2 has a paralog, VTC3, that arose from the whole genome duplication -S000031094 CDS YFL004W 6 131810 134296 W 2011-02-03 1996-07-31 -S000007637 ARS ARS605 ARS605 chromosome 6 6 135985 136085 2011-02-03 2001-03-02 Autonomously replicating sequence on Chromosome VI; activated early in S phase in ~27% of cell cycles; inactive during premeiotic S phase -S000121274 ARS_consensus_sequence ARS605 6 136047 136037 C 2011-02-03 2007-03-08 -S000001891 ORF Verified YFL003C MSH4 MutS family protein MSH4 chromosome 6 L000001192 6 137157 134521 C 2011-02-03 1996-07-31 Protein involved in meiotic recombination; required for normal levels of crossing over, colocalizes with Zip2p to discrete foci on meiotic chromosomes, has homology to bacterial MutS protein -S000030006 CDS YFL003C 6 137157 134521 C 2011-02-03 1996-07-31 -S000006669 tRNA_gene tN(GUU)F chromosome 6 L000003818 6 137559 137486 C 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000030707 noncoding_exon tN(GUU)F 6 137559 137486 C 2011-02-03 2000-05-19 -S000006925 long_terminal_repeat YFLWdelta2 chromosome 6 6 137663 137912 W 2011-02-03 2000-05-19 Ty1 LTR -S000006926 long_terminal_repeat YFLWdelta3 chromosome 6 6 137913 138240 W 2011-02-03 2000-05-19 Ty2 LTR -S000006930 LTR_retrotransposon YFLWTy2-1 Ty2 chromosome 6 6 137913 143871 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007404 transposable_element_gene YFL002W-B gag protein chromosome 6 6 138204 139520 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000031732 CDS YFL002W-B 6 138204 139520 W 2011-02-03 1999-07-17 -S000002962 transposable_element_gene YFL002W-A gag-pol fusion protein chromosome 6 6 138204 143517 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000031719 CDS YFL002W-A 6 138204 139496 W 2011-02-03 1999-07-17 -S000031720 CDS YFL002W-A 6 139498 143517 W 2011-02-03 1999-07-17 -S000031721 plus_1_translational_frameshift YFL002W-A 6 139497 139497 W 2011-02-03 1999-07-17 -S000006927 long_terminal_repeat YFLWdelta4 chromosome 6 6 143540 143871 W 2011-02-03 2000-05-19 Ty2 LTR -S000006928 long_terminal_repeat YFLWdelta5 chromosome 6 6 143872 143947 W 2011-02-03 2000-05-19 Ty1 LTR -S000006929 long_terminal_repeat YFLWtau1 chromosome 6 6 144203 144523 W 2011-02-03 2000-05-19 Ty4 LTR -S000006923 long_terminal_repeat YFLCdelta6 chromosome 6 6 144822 144524 C 2011-02-03 2000-05-19 Ty1 LTR -S000001894 ORF Verified YFL002C SPB4 putative ATP-dependent RNA helicase SPB4 chromosome 6 L000001991 6 146934 145114 C 2011-02-03 1996-07-31 Putative ATP-dependent RNA helicase; nucleolar protein required for synthesis of 60S ribosomal subunits at a late step in the pathway; sediments with 66S pre-ribosomes in sucrose gradients -S000029891 CDS YFL002C 6 146934 145114 C 2011-02-03 1996-07-31 -S000001895 ORF Verified YFL001W DEG1 pseudouridine synthase DEG1|HRM3|PUS3 chromosome 6 L000000501 6 147131 148459 W -1 2011-02-03 1996-07-31 tRNA:pseudouridine synthase; introduces pseudouridines at position 38 or 39 in tRNA; also responsible for pseudouracil modification of some mRNAs; important for maintenance of translation efficiency and normal cell growth, localizes to both the nucleus and cytoplasm; non-essential for viability -S000037314 CDS YFL001W 6 147131 148459 W 2011-02-03 1996-07-31 -S000001896 centromere CEN6 CEN6 chromosome 6 L000000299 6 148510 148627 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome VI centromere -S000077272 centromere_DNA_Element_I CEN6 6 148510 148519 W 2011-02-03 2004-10-04 -S000077273 centromere_DNA_Element_II CEN6 6 148520 148602 W 2011-02-03 2004-10-04 -S000077274 centromere_DNA_Element_III CEN6 6 148603 148627 W 2011-02-03 2004-10-04 -S000001897 ORF Verified YFR001W LOC1 chromosome 6 6 149110 149724 W 2011-02-03 1996-07-31 Nuclear protein involved in asymmetric localization of ASH1 mRNA; binds double-stranded RNA in vitro; constituent of 66S pre-ribosomal particles; required at post-transcriptional step for efficient retrotransposition; absence results in decreased Ty1 Gag:GFP protein levels; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000033165 CDS YFR001W 6 149110 149724 W 2011-02-03 1996-07-31 -S000001898 ORF Verified YFR002W NIC96 linker nucleoporin NIC96 chromosome 6 L000001250 6 150016 152535 W 2011-02-03 1996-07-31 Linker nucleoporin component of the nuclear pore complex (NPC); also part of the NPC nuclear basket; contributes to nucleocytoplasmic transport and NPC biogenesis; forms stable associations with three FG-nucleoporins (Nsp1p, Nup57p, and Nup49p) -S000033226 CDS YFR002W 6 150016 152535 W 2011-02-03 1996-07-31 -S000001899 ORF Verified YFR003C YPI1 type 1 protein phosphatase-activating protein YPI1 chromosome 6 6 153124 152657 C 2011-02-03 1996-07-31 Regulatory subunit of the type I protein phosphatase (PP1) Glc7p; Glc7p participates in the regulation of a variety of metabolic processes including mitosis and glycogen metabolism; in vitro evidence suggests Ypi1p is an inhibitor of Glc7p while in vivo evidence suggests it is an activator; overproduction causes decreased cellular content of glycogen; partial depletion causes lithium sensitivity, while overproduction confers lithium-tolerance -S000033251 CDS YFR003C 6 153124 152657 C 2011-02-03 1996-07-31 -S000001900 ORF Verified YFR004W RPN11 proteasome regulatory particle lid subunit RPN11|MPR1 chromosome 6 L000002976|L000002965 6 153393 154313 W 2011-02-03 1996-07-31 Metalloprotease subunit of 19S regulatory particle; part of 26S proteasome lid; couples the deubiquitination and degradation of proteasome substrates; involved, independent of catalytic activity, in fission of mitochondria and peroxisomes; protein abundance increases in response to DNA replication stress -S000034135 CDS YFR004W 6 153393 154313 W 2011-02-03 1996-07-31 -S000001901 ORF Verified YFR005C SAD1 mRNA splicing protein SAD1 chromosome 6 L000001795 6 155873 154527 C 2011-02-03 1996-07-31 Conserved zinc-finger domain protein involved in pre-mRNA splicing; critical for splicing of nearly all intron-containing genes; required for assembly of U4 snRNA into the U4/U6 particle -S000034191 CDS YFR005C 6 155873 154527 C 2011-02-03 1996-07-31 -S000001902 ORF Uncharacterized YFR006W putative Xaa-Pro dipeptidase chromosome 6 6 156145 157752 W 2011-02-03 1996-07-31 Putative X-Pro aminopeptidase; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YFR006W is not an essential gene -S000034389 CDS YFR006W 6 156145 157752 W 2011-02-03 1996-07-31 -S000006564 tRNA_gene tF(GAA)F chromosome 6 L000003817 6 158007 157916 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035384 intron tF(GAA)F 6 157970 157952 C 2011-02-03 2000-05-19 -S000035383 noncoding_exon tF(GAA)F 6 157951 157916 C 2011-02-03 2000-05-19 -S000035382 noncoding_exon tF(GAA)F 6 158007 157971 C 2011-02-03 2000-05-19 -S000006933 long_terminal_repeat YFRWdelta7 chromosome 6 6 158376 158686 W 2011-02-03 2000-05-19 Ty1 LTR -S000001903 ORF Verified YFR007W YFH7 AIM12 chromosome 6 6 159299 160360 W 2011-02-03 1996-07-31 Putative kinase with similarity to the PRK/URK/PANK kinase subfamily; the PRK/URK/PANK subfamily of P-loop kinases is also known as phosphoribulokinase/uridine kinase/bacterial pantothenate kinase -S000035412 CDS YFR007W 6 159299 160360 W 2011-02-03 1996-07-31 -S000001904 ORF Verified YFR008W FAR7 chromosome 6 6 160535 161200 W 2011-02-03 1996-07-31 Protein involved in recovery from pheromone-induced cell cycle arrest; acts in a Far1p-independent pathway; interacts with Far3p, Far8p, Far9p, Far10p, and Far11p; protein abundance increases in response to DNA replication stress -S000035513 CDS YFR008W 6 160535 161200 W 2011-02-03 1996-07-31 -S000006931 long_terminal_repeat YFRCdelta8 chromosome 6 6 162135 161804 C 2011-02-03 2000-05-19 Ty1 LTR -S000006579 tRNA_gene tG(GCC)F1 SUF20 chromosome 6 L000002167|L000003810 6 162228 162298 W 6 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000031966 noncoding_exon tG(GCC)F1 6 162228 162298 W 2011-02-03 2000-05-19 -S000001905 ORF Verified YFR009W GCN20 putative AAA family ATPase GCN20 chromosome 6 L000000689 6 162488 164746 W 2011-02-03 1996-07-31 Positive regulator of the Gcn2p kinase activity; forms a complex with Gcn1p; proposed to stimulate Gcn2p activation by an uncharged tRNA -S000035605 CDS YFR009W 6 162488 164746 W 2011-02-03 1996-07-31 -S000028823 ORF Dubious YFR009W-A chromosome 6 6 163875 164132 W 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YFR009W; identified by expression profiling and mass spectrometry -S000033643 CDS YFR009W-A 6 163875 164132 W 2011-02-03 2003-08-07|2003-07-29 -S000001906 ORF Verified YFR010W UBP6 ubiquitin-specific protease UBP6 chromosome 6 L000004586 6 165067 166566 W 2011-02-03 1996-07-31 Ubiquitin-specific protease; situated in the base subcomplex of the 26S proteasome, releases free ubiquitin from branched polyubiquitin chains en bloc, rather than from the distal tip of the chain; negatively regulates degradation of ubiquitinated proteins by the proteasome; works in opposition to Hul5p polyubiquitin elongation activity; mutant has aneuploidy tolerance; human homolog UBP14 complements yeast null mutant -S000037248 CDS YFR010W 6 165067 166566 W 2011-02-03 1996-07-31 -S000028824 ORF Dubious YFR010W-A chromosome 6 6 166728 166916 W 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene YFR011C; identified by expression profiling and mass spectrometry -S000033645 CDS YFR010W-A 6 166728 166916 W 2011-02-03 2003-08-07|2003-07-29 -S000001907 ORF Verified YFR011C MIC19 AIM13|MCS19 chromosome 6 6 167258 166746 C 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; Mic19p is peripheral to the inner membrane and may connect Mic60p with the Mic10p-Mic12p-Mic27p subcomplex; both yeast and human Mic19p become oxidized, and oxidation may regulate MICOS -S000037259 CDS YFR011C 6 167258 166746 C 2011-02-03 1996-07-31 -S000006779 tRNA_gene tY(GUA)F1 SUP11 chromosome 6 L000003811|L000002188 6 167437 167525 W 4 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000030879 intron tY(GUA)F1 6 167476 167489 W 2011-02-03 2000-05-19 -S000030877 noncoding_exon tY(GUA)F1 6 167437 167475 W 2011-02-03 2000-05-19 -S000030878 noncoding_exon tY(GUA)F1 6 167490 167525 W 2011-02-03 2000-05-19 -S000007638 ARS ARS606 ARS606 chromosome 6 6 167547 167801 2014-11-18 2001-03-06|2014-11-18 Highly-efficient autonomously replicating sequence on Chromosome VI; activated early in S phase in ~74% of cell cycles; replication capacity dependent upon Sum1p -S000121275 ARS_consensus_sequence ARS606 6 167736 167726 C 2011-02-03 2007-03-08 -S000001908 ORF Verified YFR012W DCV1 chromosome 6 6 167888 168496 W 2011-02-03 1996-07-31 Protein of unknown function; deletion mutant shows strong genetic interaction with cdc28-as1 mutant in the presence of 1-NM-PP1; DCV1 has a paralog, YOL019W, that arose from the whole genome duplication -S000037437 CDS YFR012W 6 167888 168496 W 2011-02-03 1996-07-31 -S000007606 ORF Uncharacterized YFR012W-A chromosome 6 6 169224 169310 W 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology -S000037183 CDS YFR012W-A 6 169224 169310 W 2011-02-03 2001-02-26 -S000001909 ORF Verified YFR013W IOC3 chromosome 6 6 169922 172285 W 2011-02-03 1996-07-31 Subunit of the Isw1a complex; Isw1a has nucleosome-stimulated ATPase activity and represses transcription initiation by specific positioning of a promoter proximal dinucleosome; promotes nucleosome shifts in the 5 prime direction; IOC3 has a paralog, ESC8, that arose from the whole genome duplication -S000037546 CDS YFR013W 6 169922 172285 W 2011-02-03 1996-07-31 -S000001910 ORF Verified YFR014C CMK1 calmodulin-dependent protein kinase CMK1 chromosome 6 L000000366 6 173877 172537 C 2011-02-03 1996-07-31|2011-02-03 Calmodulin-dependent protein kinase; may play a role in stress response, many Ca++/calmodulin dependent phosphorylation substrates demonstrated in vitro, amino acid sequence similar to mammalian Cam Kinase II; CMK1 has a paralog, CMK2, that arose from the whole genome duplication -S000030207 CDS YFR014C 6 173877 172537 C 2011-02-03 1996-07-31|2011-02-03 -S000001911 ORF Verified YFR015C GSY1 glycogen (starch) synthase GSY1 chromosome 6 L000000739 6 176391 174265 C 2011-02-03 1996-07-31 Glycogen synthase; expression induced by glucose limitation, nitrogen starvation, environmental stress, and entry into stationary phase; GSY1 has a paralog, GSY2, that arose from the whole genome duplication; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000030390 CDS YFR015C 6 176391 174265 C 2011-02-03 1996-07-31 -S000001912 ORF Verified YFR016C chromosome 6 6 180743 177042 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and bud; interacts with Spa2p; YFR016C is not an essential gene -S000030514 CDS YFR016C 6 180743 177042 C 2011-02-03 1996-07-31 -S000006580 tRNA_gene tG(GCC)F2 chromosome 6 L000003816 6 181044 180974 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000031970 noncoding_exon tG(GCC)F2 6 181044 180974 C 2011-02-03 2000-05-19 -S000001913 ORF Verified YFR017C IGD1 chromosome 6 6 182861 182274 C 2011-02-03 1996-07-31 Cytoplasmic protein that inhibits Gdb1p glycogen debranching activity; required for normal intracellular accumulation of glycogen; phosphorylated in vivo; expression increases during wine fermentation; protein abundance increases in response to DNA replication stress; IGD1 has a paralog, YOL024W, that arose from the whole genome duplication -S000031438 CDS YFR017C 6 182861 182274 C 2011-02-03 1996-07-31 -S000001914 ORF Uncharacterized YFR018C chromosome 6 6 184222 183131 C 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP and seamless GFP fusion proteins localize to the endoplasmic reticulum and mCherry fusion protein localizes to the vacuole -S000031539 CDS YFR018C 6 184222 183131 C 2011-02-03 1996-07-31 -S000001915 ORF Verified YFR019W FAB1 1-phosphatidylinositol-3-phosphate 5-kinase|SVL7 chromosome 6 L000000597 6 184502 191338 W 2011-02-03 1996-07-31|2011-02-03 1-phosphatidylinositol-3-phosphate 5-kinase; vacuolar membrane kinase that generates phosphatidylinositol (3,5)P2, which is involved in vacuolar sorting and homeostasis -S000032628 CDS YFR019W 6 184502 191338 W 2011-02-03 1996-07-31|2011-02-03 -S000006731 tRNA_gene tS(GCU)F chromosome 6 L000003815 6 191613 191513 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000037442 intron tS(GCU)F 6 191576 191558 C 2011-02-03 2000-05-19 -S000037441 noncoding_exon tS(GCU)F 6 191557 191513 C 2011-02-03 2000-05-19 -S000037440 noncoding_exon tS(GCU)F 6 191613 191577 C 2011-02-03 2000-05-19 -S000006932 long_terminal_repeat YFRCdelta9 chromosome 6 6 191854 191685 C 2011-02-03 2000-05-19 Ty1 LTR -S000001916 ORF Verified YFR020W CSS2 chromosome 6 6 192737 193435 W 2011-02-03 1996-07-31 Protein of unknown function, secreted when constitutively expressed; SWAT-GFP fusion protein localizes to the endoplasmic reticulum (ER) and extracellular region, while mCherry fusion protein localizes to the ER and vacuole; mRNA identified as translated by ribosome profiling data; CSS2 is a non-essential gene -S000031952 CDS YFR020W 6 192737 193435 W 2011-02-03 1996-07-31 -S000001917 ORF Verified YFR021W ATG18 phosphoinositide binding protein ATG18|SVP1|AUT10|CVT18|NMR1 chromosome 6 6 194812 196314 W 2011-02-03 1996-07-31 Phosphoinositide binding protein; required for vesicle formation in autophagy and the cytoplasm-to-vacuole targeting (Cvt) pathway; binds both phosphatidylinositol (3,5)-bisphosphate and phosphatidylinositol 3-phosphate; WD-40 repeat protein; relocalizes from vacuole to cytoplasm upon DNA replication stress; has 4 mammalian homologs WIPI1, WIPI2, WIPI3 and WIPI4/WDR45; mutations in human WDR45 cause static encephalopathy of childhood with neurodegeneration in adulthood -S000032840 CDS YFR021W 6 194812 196314 W 2011-02-03 1996-07-31 -S000001918 ORF Verified YFR022W ROG3 ART7 chromosome 6 6 196833 199034 W 2011-02-03 1996-07-31 Alpha-arrestin involved in ubiquitin-dependent endocytosis; contributes to desensitization of agonist-occupied alpha-factor receptor Ste2p by Rsp5p-independent internalization; PPXY motif-mediated binding of the ubiquitin ligase Rsp5p is not required for adaptation; mutation suppresses the temperature sensitivity of an mck1 rim11 double mutant; SWAT-GFP and mCherry fusion proteins localize to the cytosol; ROG3 has a paralog, ROD1, that arose from the whole genome duplication -S000032952 CDS YFR022W 6 196833 199034 W 2011-02-03 1996-07-31 -S000007639 ARS ARS607 ARS607 chromosome 6 6 199395 199505 2011-02-03 2001-03-06 Highly-efficient autonomously replicating sequence on Chromosome VI; activated very early in S phase in >85% of cell cycles -S000121276 ARS_consensus_sequence ARS607 6 199416 199426 W 2011-02-03 2007-03-08 -S000130131 ncRNA_gene RUF22 RUF22 chromosome 6 6 199813 199299 C 2011-02-03 2009-05-04 RNA of Unknown Function; precise location of 3' end uncertain; RUF22 may be longer than currently annotated -S000130132 noncoding_exon RUF22 6 199813 199299 C 2011-02-03 2009-05-04 -S000001919 ORF Verified YFR023W PES4 chromosome 6 L000001381 6 199874 201709 W 2011-02-03 1996-07-31 Poly(A) binding protein, suppressor of DNA polymerase epsilon mutation; PES4 has a paralog, MIP6, that arose from the whole genome duplication -S000033022 CDS YFR023W 6 199874 201709 W 2011-02-03 1996-07-31 -S000002968 ORF Verified YFR024C-A LSB3 YFR024C chromosome 6 6 203433 201960 C 2011-02-03 1996-07-31|2008-06-02 Protein containing a C-terminal SH3 domain; binds Las17p, which is a homolog of human Wiskott-Aldrich Syndrome protein involved in actin patch assembly and actin polymerization; protein abundance increases in response to DNA replication stress; LSB3 has a paralog, YSC84, that arose from the whole genome duplication -S000035055 CDS YFR024C-A 6 203292 201960 C 2011-02-03 1996-07-31|2008-06-02 -S000035054 CDS YFR024C-A 6 203433 203387 C 2011-02-03 1996-07-31 -S000035056 intron YFR024C-A 6 203386 203293 C 2011-02-03 1996-07-31|2008-06-02 -S000001921 ORF Verified YFR025C HIS2 histidinol-phosphatase chromosome 6 L000000779 6 204750 203743 C 32 2011-02-03 1996-07-31 Histidinolphosphatase; catalyzes the eighth step in histidine biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts; transcription is regulated by general amino acid control -S000033826 CDS YFR025C 6 204750 203743 C 2011-02-03 1996-07-31 -S000006511 tRNA_gene tA(AGC)F chromosome 6 L000003814 6 204996 204924 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032277 noncoding_exon tA(AGC)F 6 204996 204924 C 2011-02-03 2000-05-19 -S000001922 ORF Verified YFR026C ULI1 chromosome 6 6 206257 205748 C 2011-02-03 1996-07-31 Protein of unknown function; involved in and induced by the endoplasmic reticulum unfolded protein response (UPR); SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000033947 CDS YFR026C 6 206257 205748 C 2011-02-03 1996-07-31 -S000006934 long_terminal_repeat YFRWdelta10 chromosome 6 6 206922 207138 W 2011-02-03 2000-05-19 Ty1 LTR -S000001923 ORF Verified YFR027W ECO1 CTF7 chromosome 6 L000004789 6 207452 208297 W 2011-02-03 1996-07-31 Acetyltransferase; required for establishment of sister chromatid cohesion; acetylates Mps3p to regulate nuclear organization; modifies Smc3p at replication forks and Mcd1p in response to dsDNA breaks; phosphorylated by three kinases (Cdc28p, Cdc7p, Mck1p) to generate pair of phosphates spaced precisely for recognition by ubiquitin ligase SCF-Cdc4; mutations in human homolog ESCO2 cause Roberts syndrome; relative distribution to nucleus increases upon DNA replication stress -S000034947 CDS YFR027W 6 207452 208297 W 2011-02-03 1996-07-31 -S000001924 ORF Verified YFR028C CDC14 phosphoprotein phosphatase CDC14|OAF3 chromosome 6 L000000254 6 210068 208413 C 36 2011-02-03 1996-07-31 Protein phosphatase required for mitotic exit; required for rDNA segregation, cytokinesis, meiosis I spindle disassembly, environmental stress response; held in nucleolus by Cdc55p in early meiosis, liberated by FEAR and Mitotic Exit Network in anaphase, enabling it to effect a decrease in CDK/B-cyclin activity and mitotic exit; sequestered in metaphase II, released upon entry into anaphase II; human homolog CDC14A can complement thermosensitivity of yeast cdc14-1 mutant -S000035011 CDS YFR028C 6 210068 208413 C 2011-02-03 1996-07-31 -S000006780 tRNA_gene tY(GUA)F2 SUP6 chromosome 6 L000003813|L000002185 6 210707 210619 C 38 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000030888 intron tY(GUA)F2 6 210668 210655 C 2011-02-03 2000-05-19 -S000030887 noncoding_exon tY(GUA)F2 6 210654 210619 C 2011-02-03 2000-05-19 -S000030886 noncoding_exon tY(GUA)F2 6 210707 210669 C 2011-02-03 2000-05-19 -S000001925 ORF Verified YFR029W PTR3 RAA2|SSY3 chromosome 6 L000003185|L000003493|S000029400|L000001554 6 210937 212973 W 46 2011-02-03 1996-07-31 Component of the SPS plasma membrane amino acid sensor system; senses external amino acid concentration and transmits intracellular signals that result in regulation of expression of amino acid permease genes; other members are Ssy1p, Ptr3p, and Ssy5p -S000035279 CDS YFR029W 6 210937 212973 W 2011-02-03 1996-07-31 -S000001926 ORF Verified YFR030W MET10 sulfite reductase subunit alpha chromosome 6 L000001084 6 213312 216419 W 41 2011-02-03 1996-07-31 Subunit alpha of assimilatory sulfite reductase; complex converts sulfite into sulfide -S000037036 CDS YFR030W 6 213312 216419 W 2011-02-03 1996-07-31 -S000007640 ARS ARS608 ARS608 chromosome 6 6 216357 216704 2011-02-03 2001-03-06 Extremely inefficient autonomously replicating sequence on Chr VI; activated early in S phase in <10% of cell cycles -S000121280 ARS_consensus_sequence ARS608 6 216484 216494 W 2011-02-03 2007-03-08 -S000001927 ORF Verified YFR031C SMC2 condensin subunit SMC2 chromosome 6 L000001927 6 220106 216594 C 2011-02-03 1996-07-31|2011-02-03 Subunit of the condensin complex; condensin reorganizes chromosomes during both mitosis and meiosis; essential SMC chromosomal ATPase family member that forms a subcomplex with Smc2p that has ATP-hydrolyzing and DNA-binding activity, but other condensin subunits are required for chromatin binding; required for clustering of tRNA genes at the nucleolus -S000037057 CDS YFR031C 6 220106 216594 C 2011-02-03 1996-07-31|2011-02-03 -S000002104 ORF Verified YFR031C-A RPL2A uL2|ribosomal 60S subunit protein L2A|L2|rp8|YL6|L5A|L2A|RPL5B chromosome 6 L000003147 6 221418 220507 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L2A; homologous to mammalian ribosomal protein L2 and bacterial L2; RPL2A has a paralog, RPL2B, that arose from the whole genome duplication -S000032329 CDS YFR031C-A 6 221267 220507 C 2011-02-03 1996-07-31 -S000032328 CDS YFR031C-A 6 221418 221415 C 2011-02-03 1996-07-31 -S000032330 intron YFR031C-A 6 221414 221268 C 2011-02-03 1996-07-31 -S000130133 ncRNA_gene RUF23 RUF23 chromosome 6 6 221714 221967 W 2011-02-03 2009-05-04 RNA of Unknown Function; precise location of 3' end uncertain; RUF23 may be longer than currently annotated -S000130134 noncoding_exon RUF23 6 221714 221967 W 2011-02-03 2009-05-04 -S000001928 ORF Uncharacterized YFR032C RRT5 chromosome 6 6 222959 222090 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; expressed at high levels during sporulation -S000037177 CDS YFR032C 6 222959 222090 C 2011-02-03 1996-07-31 -S000006437 ORF Verified YFR032C-A RPL29 eL29|ribosomal 60S subunit protein L29|L29e|YL43|L29 chromosome 6 L000004514 6 223437 223258 C 2011-02-03 1999-07-17 Ribosomal 60S subunit protein L29; not essential for translation, but required for proper joining of large and small ribosomal subunits and for normal translation rate; homologous to mammalian ribosomal protein L29, no bacterial homolog -S000034020 CDS YFR032C-A 6 223437 223258 C 2011-02-03 1999-07-17 -S000122098 five_prime_UTR_intron YFR032C-A 6 223771 223441 C 2011-02-03 2007-04-04 -S000028630 ORF Uncharacterized YFR032C-B chromosome 6 6 223973 223710 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032386 CDS YFR032C-B 6 223973 223710 C 2011-02-03 2003-07-29 -S000001929 ORF Verified YFR033C QCR6 ubiquinol--cytochrome-c reductase subunit 6|UCR6|COR3 chromosome 6 L000001546 6 224769 224326 C 2011-02-03 1996-07-31 Subunit 6 of the ubiquinol cytochrome-c reductase complex; the complex, also known as the cytochrome bc(1) complex or Complex III, is a component of the mitochondrial inner membrane electron transport chain; highly acidic protein; required for maturation of cytochrome c1; may be loosely associated with the complex since it is easily released into the intermembrane space -S000037271 CDS YFR033C 6 224769 224326 C 2011-02-03 1996-07-31 -S000001930 ORF Verified YFR034C PHO4 phosphate-sensing transcription factor PHO4|phoD chromosome 6 L000001420 6 225958 225020 C 47 2011-02-03 1996-07-31 Basic helix-loop-helix (bHLH) transcription factor of the myc-family; activates transcription cooperatively with Pho2p in response to phosphate limitation; binding to 'CACGTG' motif is regulated by chromatin restriction, competitive binding of Cbf1p to the same DNA binding motif and cooperation with Pho2p; function is regulated by phosphorylation at multiple sites and by phosphate availability -S000029931 CDS YFR034C 6 225958 225020 C 2011-02-03 1996-07-31 -S000028631 ORF Dubious YFR034W-A chromosome 6 6 226022 226309 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps YFR035C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching -S000032387 CDS YFR034W-A 6 226022 226309 W 2011-02-03 2003-07-29 -S000001931 ORF Uncharacterized YFR035C chromosome 6 6 226465 226121 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant exhibits synthetic phenotype with alpha-synuclein -S000030041 CDS YFR035C 6 226465 226121 C 2011-02-03 1996-07-31 -S000006620 tRNA_gene tK(CUU)F chromosome 6 L000003812 6 226760 226688 C 2011-02-03 2000-05-19|2011-02-03 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000036006 noncoding_exon tK(CUU)F 6 226760 226688 C 2011-02-03 2000-05-19|2011-02-03 -S000001932 ORF Verified YFR036W CDC26 anaphase promoting complex subunit CDC26|SCD26|HIT3 chromosome 6 L000000265|L000001809 6 226963 227337 W 52 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; relocalizes to the cytosol in response to hypoxia -S000031122 CDS YFR036W 6 226963 227337 W 2011-02-03 1996-07-31 -S000028767 ORF Dubious YFR036W-A chromosome 6 6 227451 228101 W 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF RSC8/YFR037C -S000033471 CDS YFR036W-A 6 227451 228101 W 2011-02-03 2003-08-07|2003-07-29 -S000001933 ORF Verified YFR037C RSC8 SWH3 chromosome 6 L000003458|L000003393 6 229186 227513 C 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; essential for viability and mitotic growth; homolog of SWI/SNF subunit Swi3p, but unlike Swi3p, does not activate transcription of reporters -S000031163 CDS YFR037C 6 229186 227513 C 2011-02-03 1996-07-31 -S000001934 ORF Verified YFR038W IRC5 putative ATPase chromosome 6 6 229380 231941 W 2011-02-03 2004-02-05|1996-07-31 Putative ATPase containing the DEAD/H helicase-related sequence motif; null mutant displays increased levels of spontaneous Rad52p foci; SWAT-GFP and mCherry fusion proteins localize to the nucleus -S000031348 CDS YFR038W 6 229380 231941 W 2011-02-03 2004-02-05|1996-07-31 -S000001935 ORF Verified YFR039C OSW7 chromosome 6 6 233544 232012 C 2011-02-03 1996-07-31 Protein involved in outer spore wall assembly; likely involved directly in dityrosine layer assembly; may be involved in response to high salt and changes in carbon source; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; deletion mutant has decreased spore survival in Drosophila feces; OSW7 has a paralog, SHE10, that arose from the whole genome duplication; paralogs are redundant for spore wall dityrosine assembly -S000031395 CDS YFR039C 6 233544 232012 C 2011-02-03 1996-07-31 -S000001936 ORF Verified YFR040W SAP155 chromosome 6 L000002598 6 234242 237250 W 2011-02-03 2003-09-26|1996-07-31|2011-02-03 Protein required for function of the Sit4p protein phosphatase; forms a complex with Sit4p; member of a family of similar proteins including Sap4p, Sap185p, and Sap190p; protein abundance increases in response to DNA replication stress; SAP155 has a paralog, SAP4, that arose from the whole genome duplication -S000032382 CDS YFR040W 6 234242 237250 W 2011-02-03 2003-09-26|1996-07-31|2011-02-03 -S000001937 ORF Verified YFR041C ERJ5 chromosome 6 6 238255 237368 C 2011-02-03 1996-07-31 Type I membrane protein with a J domain; required to preserve the folding capacity of the endoplasmic reticulum; loss of the non-essential ERJ5 gene leads to a constitutively induced unfolded protein response -S000032446 CDS YFR041C 6 238255 237368 C 2011-02-03 1996-07-31 -S000001938 ORF Verified YFR042W KEG1 chromosome 6 6 238458 239060 W 2011-02-03 1996-07-31 Integral membrane protein of the ER; physically interacts with Kre6p; has a role in the synthesis of beta-1,6-glucan in the cell wall; required for cell viability -S000033287 CDS YFR042W 6 238458 239060 W 2011-02-03 1996-07-31 -S000001939 ORF Verified YFR043C IRC6 chromosome 6 6 239827 239114 C 2011-02-03 1996-07-31 Clathrin coat accessory factor; involved in clathrin-mediated vesicle trafficking; may function to link the AP-1 clathrin adaptor complex with the Rab GTPase Ypt31p; has structural similarity to G-proteins; mouse homolog Aagab (p34) functionally complements irc6 null mutation; null mutant displays increased levels of spontaneous Rad52p foci -S000033328 CDS YFR043C 6 239827 239114 C 2011-02-03 1996-07-31 -S000001940 ORF Verified YFR044C DUG1 metallodipeptidase chromosome 6 6 241437 239992 C 2011-02-03 1996-07-31 Cys-Gly metallo-di-peptidase; forms a complex with Dug2p and Dug3p to degrade glutathione (GSH) and other peptides containing a gamma-glu-X bond in an alternative pathway to GSH degradation by gamma-glutamyl transpeptidase (Ecm38p); human homolog CNDP2 can complement yeast dug1 mutant -S000033403 CDS YFR044C 6 241437 239992 C 2011-02-03 1996-07-31 -S000001941 ORF Uncharacterized YFR045W chromosome 6 6 241998 242999 W 2011-02-03 2004-02-05|2007-04-04|1996-07-31 Putative mitochondrial transport protein; null mutant is viable, exhibits decreased levels of chitin and normal resistance to calcofluor white -S000122078 CDS YFR045W 6 241998 242009 W 2011-02-03 2007-04-04 -S000034370 CDS YFR045W 6 242082 242999 W 2011-02-03 2004-02-05|2007-04-04|1996-07-31 -S000122079 intron YFR045W 6 242010 242081 W 2011-02-03 2007-04-04 -S000001942 ORF Verified YFR046C CNN1 centromere-binding protein CNN1 chromosome 6 6 244159 243074 C 2011-02-03 1996-07-31 Kinetochore protein; associated with the essential kinetochore proteins Nnf1p and Spc24p; phosphorylated by Clb5-Cdk1, Mps1p, Ipl1p and to a lesser extent by Clb2-Cdk1; localizes to the lower region of the Ndc80 complex during anaphase and regulates KMN activity by inhibiting the Mtw1 and Spc105 complexes from binding to the Ndc80 complex; similar to metazoan CENP-T -S000034403 CDS YFR046C 6 244159 243074 C 2011-02-03 1996-07-31 -S000001943 ORF Verified YFR047C BNA6 nicotinate-nucleotide diphosphorylase (carboxylating)|QPT1 chromosome 6 6 245166 244279 C 2011-02-03 1996-07-31 Quinolinate phosphoribosyl transferase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p -S000034510 CDS YFR047C 6 245166 244279 C 2011-02-03 1996-07-31 -S000001944 ORF Verified YFR048W RMD8 chromosome 6 6 246146 248134 W 2011-02-03 1996-07-31 Cytosolic protein required for sporulation -S000035572 CDS YFR048W 6 246146 248134 W 2011-02-03 1996-07-31 -S000001945 ORF Verified YFR049W YMR31 KGD4|mitochondrial 37S ribosomal protein YMR31 chromosome 6 L000002726 6 248523 248894 W 2011-02-03 1996-07-31 Subunit of the mitochondrial alpha-ketoglutarate dehydrogenase; recruits E3 subunit (Lpd1p) to the E1-E2 (Kgd1p, Kgd2p) core; has similarity to human mitochondrial ribosomal protein MRP-S36 -S000035651 CDS YFR049W 6 248523 248894 W 2011-02-03 1996-07-31 -S000001946 ORF Verified YFR050C PRE4 proteasome core particle subunit beta 7 chromosome 6 L000001486 6 249866 249066 C 2011-02-03 1996-07-31 Beta 7 subunit of the 20S proteasome -S000035525 CDS YFR050C 6 249866 249066 C 2011-02-03 1996-07-31 -S000001947 ORF Verified YFR051C RET2 coatomer subunit delta chromosome 6 L000004127 6 251803 250163 C 2011-02-03 1996-07-31 Delta subunit of the coatomer complex (COPI); COPI coats Golgi-derived transport vesicles; involved in retrograde transport between Golgi and ER -S000035589 CDS YFR051C 6 251803 250163 C 2011-02-03 1996-07-31 -S000001948 ORF Verified YFR052W RPN12 proteasome regulatory particle lid subunit RPN12|NIN1 chromosome 6 L000001251 6 252505 253329 W 2011-02-03 1996-07-31 Subunit of the 19S regulatory particle of the 26S proteasome lid; synthetically lethal with RPT1, which is an ATPase component of the 19S regulatory particle; physically interacts with Nob1p and Rpn3p; protein abundance increases in response to DNA replication stress -S000036541 CDS YFR052W 6 252505 253329 W 2011-02-03 1996-07-31 -S000028768 ORF Dubious YFR052C-A chromosome 6 6 253734 253429 C 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF HXK1/YFR053C -S000033472 CDS YFR052C-A 6 253734 253429 C 2011-02-03 2003-08-07|2003-07-29 -S000001949 ORF Verified YFR053C HXK1 hexokinase 1 chromosome 6 L000000833 6 255049 253592 C 70 2011-02-03 1996-07-31 Hexokinase isoenzyme 1; a cytosolic protein that catalyzes phosphorylation of glucose during glucose metabolism; expression is highest during growth on non-glucose carbon sources; glucose-induced repression involves hexokinase Hxk2p; HXK1 has a paralog, HXK2, that arose from the whole genome duplication -S000036582 CDS YFR053C 6 255049 253592 C 2011-02-03 1996-07-31 -S000007641 ARS ARS609 ARS609 chromosome 6 6 256277 256431 2011-02-03 2001-03-06 Autonomously replicating sequence on Chromosome VI; activated very late in S phase in ~37% of cell cycles; this origin is specifically fired in the absence of RAD53 in the presence of hydroxyurea -S000121281 ARS_consensus_sequence ARS609 6 256385 256375 C 2011-02-03 2007-03-08 -S000001950 ORF Dubious YFR054C chromosome 6 6 259433 258855 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000036701 CDS YFR054C 6 259433 258855 C 2011-02-03 1996-07-31 -S000001952 ORF Verified YFR055W IRC7 cysteine-S-conjugate beta-lyase IRC7 chromosome 6 6 264204 265226 W 2011-02-03 1996-07-31 Beta-lyase involved in the production of thiols; null mutant displays increased levels of spontaneous Rad52p foci; expression induced by nitrogen limitation in a GLN3, GAT1-dependent manner and by copper levels in a Mac1-dependent manner -S000037482 CDS YFR055W 6 264204 265226 W 2011-02-03 1996-07-31 -S000001951 ORF Dubious YFR056C chromosome 6 6 264325 263957 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YFR055W -S000037536 CDS YFR056C 6 264325 263957 C 2011-02-03 1996-07-31 -S000001953 ORF Uncharacterized YFR057W chromosome 6 6 269061 269516 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000030392 CDS YFR057W 6 269061 269516 W 2011-02-03 1996-07-31 -S000121260 ARS ARS610 ARS610 ARSVI-270 chromosome 6 6 269417 270035 2011-02-03 2007-03-08 Autonomously Replicating Sequence -S000028957 telomere TEL06R chromosome 6 6 269731 270161 W 73 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome VI; composed of an X element core sequence and a short terminal stretch of telomeric repeats -S000028958 telomeric_repeat TEL06R 6 270113 270161 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome VI -S000028959 X_element TEL06R 6 269731 270112 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome VI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000029680 gene_group MAL1 MAL1 chromosome 7 L000001000 7 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL13 trans-acting MAL-activator, MAL11 maltose permease, and MAL12 maltase -S000028887 telomere TEL07L chromosome 7 7 781 1 C -172 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome VII; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028888 telomeric_repeat TEL07L 7 34 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome VII -S000028889 X_element TEL07L 7 781 318 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome VII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028890 X_element_combinatorial_repeat TEL07L 7 317 35 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr VII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000006948 long_terminal_repeat YGLWomega1 chromosome 7 7 838 1079 W 2000-05-19 2000-05-19 Ty5 LTR -S000003232 ORF Verified YGL263W COS12 chromosome 7 L000004069 7 2790 3932 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000031687 CDS YGL263W 7 2790 3932 W 1996-07-31 1996-07-31 -S000003231 ORF Uncharacterized YGL262W chromosome 7 7 5312 5839 W 1996-07-31 1996-07-31 Putative protein of unknown function; null mutant displays elevated sensitivity to expression of a mutant huntingtin fragment or of alpha-synuclein; YGL262W is not an essential gene -S000031603 CDS YGL262W 7 5312 5839 W 1996-07-31 1996-07-31 -S000003230 ORF Uncharacterized YGL261C PAU11 seripauperin PAU11 chromosome 7 7 6652 6290 C 1996-07-31 1996-07-31 Putative protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; mRNA expression appears to be regulated by SUT1 and UPC2 -S000030725 CDS YGL261C 7 6652 6290 C 1996-07-31 1996-07-31 -S000003229 ORF Uncharacterized YGL260W chromosome 7 7 6860 7090 W 1996-07-31 1996-07-31 Putative protein of unknown function; transcription is significantly increased in a NAP1 deletion background; deletion mutant has increased accumulation of nickel and selenium -S000030684 CDS YGL260W 7 6860 7090 W 1996-07-31 1996-07-31 -S000003228 ORF Uncharacterized YGL259W YPS5 chromosome 7 L000004385 7 8470 8967 W 1996-07-31 1996-07-31 Protein with similarity to GPI-anchored aspartic proteases; such proteases are Yap1p and Yap3p; mCherry fusion protein localizes to the vacuole -S000030354 CDS YGL259W 7 8470 8967 W 1996-07-31 1996-07-31 -S000007607 ORF Uncharacterized YGL258W-A chromosome 7 7 9162 9395 W 2001-02-26 2001-02-26 Putative protein of unknown function -S000037184 CDS YGL258W-A 7 9162 9395 W 2001-02-26 2001-02-26 -S000003227 ORF Verified YGL258W VEL1 chromosome 7 7 11110 11730 W 1996-07-31 1996-07-31 Protein of unknown function; highly induced in zinc-depleted conditions and has increased expression in NAP1 deletion mutants; VEL1 has a paralog, YOR387C, that arose from a single-locus duplication -S000030158 CDS YGL258W 7 11110 11730 W 1996-07-31 1996-07-31 -S000003226 ORF Verified YGL257C MNT2 alpha-1,3-mannosyltransferase MNT2 chromosome 7 S000007417 7 14157 12481 C 1996-07-31 1996-07-31 Mannosyltransferase; involved in adding the 4th and 5th mannose residues of O-linked glycans -S000037390 CDS YGL257C 7 14157 12481 C 1996-07-31 1996-07-31 -S000003225 ORF Verified YGL256W ADH4 alcohol dehydrogenase ADH4|ZRG5|NRC465 chromosome 7 L000000044 7 15159 16307 W -169 2008-06-02 1996-07-31|2008-06-02 Alcohol dehydrogenase isoenzyme type IV; dimeric enzyme demonstrated to be zinc-dependent despite sequence similarity to iron-activated alcohol dehydrogenases; transcription is induced in response to zinc deficiency -S000037356 CDS YGL256W 7 15159 16307 W 2008-06-02 1996-07-31|2008-06-02 -S000003224 ORF Verified YGL255W ZRT1 high-affinity Zn(2+) transporter ZRT1 chromosome 7 L000003260 7 20978 22108 W 1996-07-31 1996-07-31 High-affinity zinc transporter of the plasma membrane; responsible for the majority of zinc uptake; transcription is induced under low-zinc conditions by the Zap1p transcription factor -S000037251 CDS YGL255W 7 20978 22108 W 1996-07-31 1996-07-31 -S000003223 ORF Verified YGL254W FZF1 SUL1|RSU1|NRC299 chromosome 7 L000001781|L000000656 7 22304 23203 W 1996-07-31 1996-07-31 Transcription factor involved in sulfite metabolism; sole identified regulatory target is SSU1; overexpression suppresses sulfite-sensitivity of many unrelated mutants due to hyperactivation of SSU1, contains five zinc fingers; protein abundance increases in response to DNA replication stress -S000036566 CDS YGL254W 7 22304 23203 W 1996-07-31 1996-07-31 -S000003222 ORF Verified YGL253W HXK2 hexokinase 2|SCI2|HKB|HEX1 chromosome 7 L000000834 7 23935 25395 W -167 1996-07-31 1996-07-31 Hexokinase isoenzyme 2; phosphorylates glucose in cytosol; predominant hexokinase during growth on glucose; represses expression of HXK1, GLK1, induces expression of its own gene; antiapoptotic; phosphorylation/dephosphorylation at Ser14 by kinase Snf1p, phosphatase Glc7p-Reg1p regulates nucleocytoplasmic shuttling of Hxk2p; functions downstream of Sit4p in control of cell cycle, mitochondrial function, oxidative stress resistance, chronological lifespan; has paralog HXK1 -S000036456 CDS YGL253W 7 23935 25395 W 1996-07-31 1996-07-31 -S000003221 ORF Verified YGL252C RTG2 chromosome 7 L000001784 7 27484 25718 C 1996-07-31 1996-07-31 Sensor of mitochondrial dysfunction; regulates the subcellular location of Rtg1p and Rtg3p, transcriptional activators of the retrograde (RTG) and TOR pathways; Rtg2p is inhibited by the phosphorylated form of Mks1p -S000036310 CDS YGL252C 7 27484 25718 C 1996-07-31 1996-07-31 -S000003220 ORF Verified YGL251C HFM1 MER3 chromosome 7 L000002581 7 31636 27921 C 2000-07-14 2000-07-14|1996-07-31 Meiosis specific DNA helicase; involved in the conversion of double-stranded breaks to later recombination intermediates and in crossover control; catalyzes the unwinding of Holliday junctions; has ssDNA and dsDNA stimulated ATPase activity -S000035419 CDS YGL251C 7 31426 27921 C 2000-07-14 2000-07-14|1996-07-31 -S000035418 CDS YGL251C 7 31636 31579 C 2000-07-14 2000-07-14 -S000035420 intron YGL251C 7 31578 31427 C 2000-07-14 2000-07-14 -S000003219 ORF Verified YGL250W RMR1 chromosome 7 7 31910 32635 W 2003-09-22 2003-09-22|1996-07-31 Protein required for meiotic recombination and gene conversion; null mutant displays reduced PIS1 expression and growth defects on non-fermentable carbon sources and minimal media; GFP-fusion protein localizes to both cytoplasm and nucleus -S000035397 CDS YGL250W 7 31910 32635 W 2003-09-22 2003-09-22|1996-07-31 -S000003218 ORF Verified YGL249W ZIP2 chromosome 7 L000003536 7 33098 35212 W 1996-07-31 1996-07-31 Meiosis-specific protein; involved in normal synaptonemal complex formation and pairing between homologous chromosomes during meiosis; relocalizes from mitochondrion to cytoplasm upon DNA replication stress -S000034159 CDS YGL249W 7 33098 35212 W 1996-07-31 1996-07-31 -S000144910 ncRNA_gene RME3 RME3 SUT534 chromosome 7 7 35013 33109 C 2014-11-18 2014-11-18 Antisense transcript that represses the meiosis-specific ZIP2 gene; expressed in haploid cells under sporulation inducing conditions; regulates ZIP2 in a cis-dependent manner; RME3 is repressed by the MAT a1/alpha2 complex in diploid cells -S000178099 noncoding_exon RME3 7 35013 33109 C 2014-11-18 2014-11-18 -S000003217 ORF Verified YGL248W PDE1 3',5'-cyclic-nucleotide phosphodiesterase PDE1 chromosome 7 L000001358 7 35653 36762 W 1996-07-31 1996-07-31 Low-affinity cyclic AMP phosphodiesterase; controls glucose and intracellular acidification-induced cAMP signaling, target of the cAMP-protein kinase A (PKA) pathway; glucose induces transcription and inhibits translation -S000033288 CDS YGL248W 7 35653 36762 W 1996-07-31 1996-07-31 -S000003216 ORF Verified YGL247W BRR6 chromosome 7 7 36933 37526 W 1996-07-31 1996-07-31 Essential nuclear envelope integral membrane protein; interacts and functions with Apq12p and Brl1p in lipid homeostasis; mutants are defective in nuclear pore complex biogenesis, nuclear envelope morphology, mRNA nuclear export, and are sensitive to sterol biosynthesis inhibitors and membrane fluidizing agents; exhibits synthetic lethal genetic interactions with genes involved in lipid metabolism; homologous to Brl1p -S000033240 CDS YGL247W 7 36933 37526 W 1996-07-31 1996-07-31 -S000003215 ORF Verified YGL246C RAI1 decapping nuclease chromosome 7 S000007430 7 38780 37617 C 1996-07-31 1996-07-31 Nuclear protein with decapping endonuclease activity; targets mRNAs with unmethylated 7-methylguanosine cap structures and 5'-triphosphates; binds to and stabilizes the exoribonuclease Rat1p; required for pre-rRNA processing; relocalizes to the cytosol in response to hypoxia; homologous to human DOM3Z -S000033150 CDS YGL246C 7 38780 37617 C 1996-07-31 1996-07-31 -S000003214 ORF Verified YGL245W GUS1 glutamate--tRNA ligase GUS1|GluRS|GSN1 chromosome 7 7 39023 41149 W 2003-09-22 2003-09-22|1996-07-31 Glutamyl-tRNA synthetase (GluRS); forms a complex with methionyl-tRNA synthetase (Mes1p) and Arc1p; complex formation increases the catalytic efficiency of both tRNA synthetases and ensures their correct localization to the cytoplasm; protein abundance increases in response to DNA replication stress -S000033122 CDS YGL245W 7 39023 41149 W 2003-09-22 2003-09-22|1996-07-31 -S000003213 ORF Verified YGL244W RTF1 CSL3 chromosome 7 L000001782 7 41498 43174 W 1999-07-17 1999-07-17|1996-07-31 Subunit of RNAPII-associated chromatin remodeling Paf1 complex; regulates gene expression by directing cotranscriptional histone modification, influences transcription and chromatin structure through several independent functional domains; directly or indirectly regulates DNA-binding properties of Spt15p and relative activities of different TATA elements; involved in transcription elongation as demonstrated by the G-less-based run-on (GLRO) assay -S000032242 CDS YGL244W 7 41498 43174 W 1999-07-17 1999-07-17|1996-07-31 -S000003212 ORF Verified YGL243W TAD1 tRNA-specific adenosine deaminase chromosome 7 L000004621 7 43307 44509 W 1996-07-31 1996-07-31 tRNA-specific adenosine deaminase; deaminates adenosine-37 to inosine in tRNA-Ala -S000032159 CDS YGL243W 7 43307 44509 W 1996-07-31 1996-07-31 -S000003211 ORF Verified YGL242C chromosome 7 7 45197 44652 C 1996-07-31 1996-07-31 Protein of unknown function; N-terminally propionylated in vivo; deletion mutant is viable -S000032036 CDS YGL242C 7 45197 44652 C 1996-07-31 1996-07-31 -S000003210 ORF Verified YGL241W KAP114 chromosome 7 L000004867 7 45445 48459 W 1996-07-31 1996-07-31 Karyopherin, responsible for nuclear import of specific proteins; cargoes include Spt15p, Sua7p, histones H2A and H2B, and Nap1p; amino terminus shows similarity to those of other importins, particularly Cse1p; localization is primarily nuclear; function is regulated by sumoylation; protein abundance increases in response to DNA replication stress -S000032007 CDS YGL241W 7 45445 48459 W 1996-07-31 1996-07-31 -S000003209 ORF Verified YGL240W DOC1 anaphase promoting complex subunit DOC1|APC10 chromosome 7 L000004350 7 48613 49365 W 2003-09-22 2003-09-22|1996-07-31 Processivity factor; required for the ubiquitination activity of the anaphase promoting complex (APC), mediates the activity of the APC by contributing to substrate recognition; involved in cyclin proteolysis; contains a conserved DOC1 homology domain -S000031054 CDS YGL240W 7 48613 49365 W 2003-09-22 2003-09-22|1996-07-31 -S000003207 ORF Verified YGL238W CSE1 importin-alpha export receptor|KAP109 chromosome 7 L000000425 7 49552 52434 W 1996-07-31 1996-07-31 Nuclear envelope protein that acts as a recycling factor; mediates the nuclear export of Srp1p (importin alpha) back to the cytoplasm after its import substrates have been released into the nucleoplasm, thereby allowing the participation of Srp1p in multiple rounds of nuclear import; required for accurate chromosome segregation; homolog of metazoan CAS and human CSE1L, overexpression of which is implicated in cancer progression -S000029914 CDS YGL238W 7 49552 52434 W 1996-07-31 1996-07-31 -S000003208 ORF Dubious YGL239C chromosome 7 7 49745 49431 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene CSE1 -S000029968 CDS YGL239C 7 49745 49431 C 1996-07-31 1996-07-31 -S000003206 ORF Verified YGL237C HAP2 chromosome 7 L000000752 7 53528 52731 C -148 1996-07-31 1996-07-31 Subunit of the Hap2p/3p/4p/5p CCAAT-binding complex; complex is heme-activated and glucose-repressed; complex is a transcriptional activator and global regulator of respiratory gene expression; contains sequences sufficient for both complex assembly and DNA binding; respiratory defect of the null mutant is functionally complemented by human NFYA -S000037826 CDS YGL237C 7 53528 52731 C 1996-07-31 1996-07-31 -S000003204 ORF Uncharacterized YGL235W chromosome 7 7 55279 55815 W 2004-07-15 1996-07-31 Putative protein of unknown function; potential Cdc28p substrate; null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2 -S000037051 CDS YGL235W 7 55279 55815 W 2004-07-15 1996-07-31 -S000003205 ORF Verified YGL236C MTO1 tRNA modification protein MTO1|IPS1 chromosome 7 7 55796 53787 C 2004-07-15 2004-07-15|1996-07-31 Mitochondrial protein; forms heterodimer complex with Mss1p that performs 5-carboxymethylaminomethyl modification of the wobble uridine base in mitochondrial tRNAs; required for respiration in paromomycin-resistant 15S rRNA mutants; human homolog MTO1 can complement yeast null mutant -S000037073 CDS YGL236C 7 55796 53787 C 2004-07-15 2004-07-15|1996-07-31 -S000003203 ORF Verified YGL234W ADE5,7 bifunctional aminoimidazole ribotide synthase/glycinamide ribotide synthase chromosome 7 L000000035 7 56482 58890 W -152 2004-07-15 1996-07-31 Enzyme of the 'de novo' purine nucleotide biosynthetic pathway; contains aminoimidazole ribotide synthetase and glycinamide ribotide synthetase activities -S000036969 CDS YGL234W 7 56482 58890 W 2004-07-15 1996-07-31 -S000003202 ORF Verified YGL233W SEC15 Rab GTPase-binding exocyst subunit SEC15 chromosome 7 L000001840 7 59122 61854 W 2004-07-15 1996-07-31 Essential 113 kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis prior to SNARE-mediated fusion; interacts with and functions as a downstream effector of active, GTP-bound Sec4p, a Rab family GTPase -S000036914 CDS YGL233W 7 59122 61854 W 2004-07-15 1996-07-31 -S000003201 ORF Verified YGL232W TAN1 putative tRNA acetyltransferase chromosome 7 7 62075 63002 W 2004-07-15 1996-07-31 Putative tRNA acetyltransferase; RNA-binding protein required for the formation of the modified nucleoside N(4)-acetylcytidine in serine and leucine tRNAs but not required for the same modification in 18S rRNA; protein abundance increases in response to DNA replication stress -S000036130 CDS YGL232W 7 62075 62131 W 2004-07-15 1996-07-31 -S000036131 CDS YGL232W 7 62190 63002 W 2004-07-15 1996-07-31 -S000036132 intron YGL232W 7 62132 62189 W 2004-07-15 1996-07-31 -S000003200 ORF Verified YGL231C EMC4 chaperone EMC4 chromosome 7 7 63620 63048 C 2004-07-15 1996-07-31 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; homologous to worm ZK616.6/EMC-4 and fly CG11137; mutation is functionally complemented by human EMC4 -S000035888 CDS YGL231C 7 63620 63048 C 2004-07-15 1996-07-31 -S000003199 ORF Uncharacterized YGL230C chromosome 7 7 64215 63772 C 2004-07-15 1996-07-31 Putative protein of unknown function; non-essential gene -S000034975 CDS YGL230C 7 64215 63772 C 2004-07-15 1996-07-31 -S000118451 ARS ARS702 ARSVII-64 chromosome 7 7 64360 64464 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000119018 ARS_consensus_sequence ARS702 7 64458 64444 C 2006-10-03 2006-10-03 -S000003198 ORF Verified YGL229C SAP4 chromosome 7 L000003341 7 66959 64503 C 2004-07-15 1996-07-31 Protein required for function of the Sit4p protein phosphatase; member of a family of similar proteins that form complexes with Sit4p, including Sap155p, Sap185p, and Sap190p; SAP4 has a paralog, SAP155, that arose from the whole genome duplication -S000034012 CDS YGL229C 7 66959 64503 C 2004-07-15 1996-07-31 -S000003197 ORF Verified YGL228W SHE10 chromosome 7 L000002872 7 67598 69331 W 2004-07-15 1996-07-31 Protein involved in outer spore wall assembly; likely involved directly in dityrosine layer assembly; putative GPI-anchored protein; overexpression causes growth arrest;; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; SHE10 has a paralog, OSW7/YFR039C, that arose from the whole genome duplication; paralogs are redundant for spore wall dityrosine assembly -S000033924 CDS YGL228W 7 67598 69331 W 2004-07-15 1996-07-31 -S000003196 ORF Verified YGL227W VID30 glucose-induced degradation complex subunit VID30|GID1 chromosome 7 L000004008 7 69671 72547 W 2004-07-15 1996-07-31 Central component of GID Complex, involved in FBPase degradation; interacts strongly with Gid8p to serve as a scaffold for other GID Complex subunits; contains SPRY domain and 3 domains that are also found in Gid8p - LisH, CTLH, and CRA; required for association of Vid vesicles and actin patches in vacuole import and degradation pathway; shifts the balance of nitrogen metabolism toward glutamate production; localizes to the nucleus and the cytoplasm -S000033846 CDS YGL227W 7 69671 72547 W 2004-07-15 1996-07-31 -S000003194 ORF Verified YGL226C-A OST5 dolichyl-diphosphooligosaccharide--protein glycotransferase subunit chromosome 7 L000002944 7 73158 72749 C 2011-02-03 1996-07-31 Zeta subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins -S000037108 CDS YGL226C-A 7 72988 72749 C 2011-02-03 1996-07-31 -S000037107 CDS YGL226C-A 7 73158 73138 C 2011-02-03 1996-07-31 -S000037109 intron YGL226C-A 7 73137 72989 C 2011-02-03 1996-07-31 -S000003195 ORF Verified YGL226W MTC3 chromosome 7 7 73340 73711 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; mtc3 is synthetically sick with cdc13-1 -S000033716 CDS YGL226W 7 73340 73711 W 2011-02-03 1996-07-31 -S000006757 tRNA_gene tV(AAC)G3 chromosome 7 L000003854 7 73902 73829 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000036907 noncoding_exon tV(AAC)G3 7 73902 73829 C 2011-02-03 2000-05-19 -S000003193 ORF Verified YGL225W VRG4 GDP-mannose transporter|VIG4|LDB3|GOG5|VAN2 chromosome 7 L000000719 7 76894 77907 W 2011-02-03 1996-07-31 Golgi GDP-mannose transporter; regulates Golgi function and glycosylation in Golgi; VRG4 has a paralog, HVG1, that arose from the whole genome duplication -S000033042 CDS YGL225W 7 76894 77907 W 2011-02-03 1996-07-31 -S000003192 ORF Verified YGL224C SDT1 nucleotidase|SSM1 chromosome 7 L000003406 7 78857 78015 C 2011-02-03 1996-07-31 Pyrimidine nucleotidase; responsible for production of nicotinamide riboside and nicotinic acid riboside; overexpression suppresses the 6-AU sensitivity of transcription elongation factor S-II, as well as resistance to other pyrimidine derivatives; SDT1 has a paralog, PHM8, that arose from the whole genome duplication -S000032898 CDS YGL224C 7 78857 78015 C 2011-02-03 1996-07-31 -S000003191 ORF Verified YGL223C COG1 Golgi transport complex subunit COG1|SEC36|LDB11|COD3 chromosome 7 7 80365 79112 C 2011-02-03 1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000032824 CDS YGL223C 7 80365 79112 C 2011-02-03 1996-07-31 -S000003190 ORF Verified YGL222C EDC1 chromosome 7 7 81186 80659 C 2011-02-03 1996-07-31 RNA-binding protein that activates mRNA decapping directly; binds to mRNA substrate and enhances activity of decapping proteins Dcp1p and Dcp2p; has a role in translation during heat stress; protein becomes more abundant and forms cytoplasmic foci in response to DNA replication stress; EDC1 has a paralog, EDC2, that arose from the whole genome duplication -S000031900 CDS YGL222C 7 81186 80659 C 2011-02-03 1996-07-31 -S000003189 ORF Verified YGL221C NIF3 hypothetical protein chromosome 7 L000003316 7 82292 81426 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Listeria monocytogenes major sigma factor (rpoD gene product); the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000031759 CDS YGL221C 7 82292 81426 C 2011-02-03 1996-07-31 -S000003188 ORF Verified YGL220W BOL2 FRA2|AIM15 chromosome 7 7 82374 82736 W 2011-02-03 1996-07-31 Cytosolic protein involved in repression of iron regulon transcription; forms an iron-independent complex with Fra1p, Grx3p, and Grx4p; null mutant fails to repress the iron regulon and is sensitive to nickel; sequence similarity to human BOLA family member, BOLA2 -S000031708 CDS YGL220W 7 82374 82736 W 2011-02-03 1996-07-31 -S000003186 ORF Dubious YGL218W SRF1 chromosome 7 7 83650 84300 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 93% of ORF overlaps the verified gene MDM34; deletion in cyr1 mutant results in loss of stress resistance -S000030779 CDS YGL218W 7 83650 84300 W 2011-02-03 1996-07-31 -S000003187 ORF Verified YGL219C MDM34 ERMES complex subunit MDM34|MMM2 chromosome 7 7 84257 82878 C 2011-02-03 1996-07-31 Mitochondrial component of the ERMES complex; links the ER to mitochondria and may promote inter-organellar calcium and phospholipid exchange as well as coordinating mitochondrial DNA replication and growth; required for mitophagy; ERMES complex is often co-localized with peroxisomes and with concentrated areas of pyruvate dehydrogenase -S000030809 CDS YGL219C 7 84257 82878 C 2011-02-03 1996-07-31 -S000003184 ORF Verified YGL216W KIP3 tubulin-dependent ATPase KIP3 chromosome 7 L000003911 7 84885 87302 W 2011-02-03 1996-07-31 Kinesin-related antiparallel sliding motor protein; involved in mitotic spindle positioning; sliding activity promotes bipolar spindle assembly and maintenance of genome stability; inhibits spindle elongation, destabilizing late anaphase spindle microtubules that polymerize beyond the midzone -S000037780 CDS YGL216W 7 84885 87302 W 2011-02-03 1996-07-31 -S000003185 ORF Dubious YGL217C chromosome 7 7 85180 84839 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF KIP3/YGL216W -S000030618 CDS YGL217C 7 85180 84839 C 2011-02-03 1996-07-31 -S000003183 ORF Verified YGL215W CLG1 chromosome 7 L000000356 7 87981 89339 W 2011-02-03 1996-07-31 Cyclin-like protein that interacts with Pho85p; has sequence similarity to G1 cyclins PCL1 and PCL2 -S000037731 CDS YGL215W 7 87981 89339 W 2011-02-03 1996-07-31 -S000003182 ORF Dubious YGL214W chromosome 7 7 90010 90495 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion mutation phenotype is likely due to the overlapping verified ORF SKI8/YGL213C -S000037674 CDS YGL214W 7 90010 90495 W 2011-02-03 1996-07-31|2011-02-03 -S000003181 ORF Verified YGL213C SKI8 SKI complex subunit WD repeat protein SKI8|REC103 chromosome 7 L000001906 7 91247 90054 C -149 2011-02-03 1996-07-31 Ski complex component and WD-repeat protein; mediates 3'-5' RNA degradation by the cytoplasmic exosome; also required for meiotic double-strand break recombination; null mutants have superkiller phenotype -S000037570 CDS YGL213C 7 91247 90054 C 2011-02-03 1996-07-31 -S000003180 ORF Verified YGL212W VAM7 VPL24|VPS43 chromosome 7 L000002452 7 91432 92382 W 2011-02-03 1996-07-31 Vacuolar SNARE protein; functions with Vam3p in vacuolar protein trafficking; has an N-terminal PX domain (phosphoinositide-binding module) that binds PtdIns-3-P and mediates membrane binding; SNAP-25 homolog; protein abundance increases in response to DNA replication stress -S000036874 CDS YGL212W 7 91432 92382 W 2011-02-03 1996-07-31 -S000003179 ORF Verified YGL211W NCS6 TUC1|YGL210W-A chromosome 7 7 92512 93591 W 2011-02-03 2004-07-20|1996-07-31 Protein required for uridine thiolation of Gln, Lys, and Glu tRNAs; required for the thiolation of uridine at the wobble position of Gln, Lys, and Glu tRNAs; has a role in urmylation and in invasive and pseudohyphal growth; inhibits replication of Brome mosaic virus in S. cerevisiae -S000036823 CDS YGL211W 7 92512 93591 W 2011-02-03 2004-07-20|1996-07-31 -S000003178 ORF Verified YGL210W YPT32 Rab family GTPase YPT32 chromosome 7 L000002897 7 93792 94460 W 2011-02-03 1996-07-31 Rab family GTPase involved in the exocytic pathway; mediates intra-Golgi traffic or the budding of post-Golgi vesicles from the trans-Golgi; protein abundance increases in response to DNA replication stress; YPT32 has a paralog, YPT31, that arose from the whole genome duplication -S000036765 CDS YGL210W 7 93792 94460 W 2011-02-03 1996-07-31 -S000003177 ORF Verified YGL209W MIG2 MLZ1 chromosome 7 L000003254 7 95858 97006 W 2011-02-03 1996-07-31 Zinc finger transcriptional repressor; cooperates with Mig1p in glucose-induced gene repression; under low glucose conditions relocalizes to mitochondrion, where it interacts with Ups1p, antagonizes mitochondrial fission factor Dnm1p, indicative of a role in mitochondrial fusion or regulating morphology; regulates filamentous growth in response to glucose depletion; activated in stochastic pulses of nuclear localization in response to low glucose -S000035806 CDS YGL209W 7 95858 97006 W 2011-02-03 1996-07-31 -S000003176 ORF Verified YGL208W SIP2 SPM2 chromosome 7 L000001891|L000001998 7 97338 98585 W 2011-02-03 1996-07-31|2011-02-03 One of three beta subunits of the Snf1 kinase complex; involved in the response to glucose starvation; null mutants exhibit accelerated aging; N-myristoylprotein localized to the cytoplasm and the plasma membrane; SIP2 has a paralog, GAL83, that arose from the whole genome duplication -S000035685 CDS YGL208W 7 97338 98585 W 2011-02-03 1996-07-31|2011-02-03 -S000003175 ORF Verified YGL207W SPT16 chromatin-remodeling protein SPT16|SSF1|CDC68 chromosome 7 L000002038 7 98969 102076 W -134 2011-02-03 1996-07-31 Subunit of the heterodimeric FACT complex (Spt16p-Pob3p); FACT associates with chromatin via interaction with Nhp6Ap and Nhp6Bp, and reorganizes nucleosomes to facilitate access to DNA by RNA and DNA polymerases; specifically required for diauxic shift-induced H2B deposition onto rDNA genes; mutations cause reduced nucleosome occupancy over highly transcribed regions; coregulates transcription with Mot1p through preinitiation complex assembly and nucleosome organization -S000034683 CDS YGL207W 7 98969 102076 W 2011-02-03 1996-07-31 -S000003174 ORF Verified YGL206C CHC1 clathrin heavy chain|SWA5 chromosome 7 L000000317 7 107504 102543 C -133 2011-02-03 1996-07-31 Clathrin heavy chain; subunit of the major coat protein involved in intracellular protein transport and endocytosis; the clathrin triskelion is a trimeric molecule composed of three heavy chains that radiate from a vertex and three light chains which bind noncovalently near the vertex of the triskelion; the light chain (CLC1) is thought to regulate function -S000034547 CDS YGL206C 7 107504 102543 C 2011-02-03 1996-07-31 -S000003173 ORF Verified YGL205W POX1 acyl-CoA oxidase|FOX1 chromosome 7 L000001467 7 108158 110404 W 2011-02-03 1996-07-31 Fatty-acyl coenzyme A oxidase; involved in the fatty acid beta-oxidation pathway; localized to the peroxisomal matrix -S000034502 CDS YGL205W 7 108158 110404 W 2011-02-03 1996-07-31 -S000006595 tRNA_gene tH(GUG)G1 chromosome 7 L000003822 7 110696 110625 C 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000036197 noncoding_exon tH(GUG)G1 7 110696 110625 C 2011-02-03 2000-05-19 -S000006950 long_terminal_repeat YGLWtau1 chromosome 7 7 110855 111225 W 2011-02-03 2000-05-19 Ty4 LTR -S000006935 long_terminal_repeat YGLCdelta1 chromosome 7 7 111505 111226 C 2011-02-03 2000-05-19 Ty1 LTR -S000006940 long_terminal_repeat YGLWdelta2 chromosome 7 7 111506 111698 W 2011-02-03 2000-05-19 Ty1 LTR -S000003172 ORF Uncharacterized YGL204C chromosome 7 7 112005 111700 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000033547 CDS YGL204C 7 112005 111700 C 2011-02-03 1996-07-31 -S000118452 ARS ARS704 ARSVII-112 chromosome 7 7 112079 112317 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119019 ARS_consensus_sequence ARS704 7 112125 112139 W 2011-02-03 2006-10-03 -S000003171 ORF Verified YGL203C KEX1 serine-type carboxypeptidase chromosome 7 L000000895 7 114664 112475 C -131 2011-02-03 1996-07-31 Cell death protease essential for hypochlorite-induced apoptosis; involved in the processing of killer toxin and alpha factor precursor; cleaves Lys and Arg residues from the C-terminus of peptides and proteins -S000033480 CDS YGL203C 7 114664 112475 C 2011-02-03 1996-07-31 -S000006941 long_terminal_repeat YGLWdelta3 chromosome 7 7 114939 115269 W 2011-02-03 2000-05-19 Ty1 LTR -S000006630 tRNA_gene tK(UUU)G1 chromosome 7 L000003819 7 115488 115583 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000033672 intron tK(UUU)G1 7 115525 115547 W 2011-02-03 2000-05-19 -S000033670 noncoding_exon tK(UUU)G1 7 115488 115524 W 2011-02-03 2000-05-19 -S000033671 noncoding_exon tK(UUU)G1 7 115548 115583 W 2011-02-03 2000-05-19 -S000003170 ORF Verified YGL202W ARO8 bifunctional 2-aminoadipate transaminase/aromatic-amino-acid:2-oxoglutarate transaminase chromosome 7 L000003949 7 116059 117561 W 2011-02-03 1996-07-31 Aromatic aminotransferase I; expression is regulated by general control of amino acid biosynthesis -S000033459 CDS YGL202W 7 116059 117561 W 2011-02-03 1996-07-31 -S000114845 ARS ARS706 ARS706 ARO8 ARS chromosome 7 7 117561 117854 2011-02-03 2006-04-12 Autonomously Replicating Sequence -S000003169 ORF Verified YGL201C MCM6 MCM DNA helicase complex subunit MCM6 chromosome 7 L000004104 7 120907 117854 C 2011-02-03 2004-01-23|1996-07-31 Protein involved in DNA replication; component of the Mcm2-7 hexameric helicase complex that binds chromatin as a part of the pre-replicative complex; forms a subcomplex with Mcm4p and Mcm7p -S000033344 CDS YGL201C 7 120907 117854 C 2011-02-03 2004-01-23|1996-07-31 -S000006621 tRNA_gene tK(CUU)G1 chromosome 7 L000003820 7 122269 122341 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000029888 noncoding_exon tK(CUU)G1 7 122269 122341 W 2011-02-03 2000-05-19 -S000003168 ORF Verified YGL200C EMP24 BST2 chromosome 7 L000000549 7 123305 122694 C 2011-02-03 1996-07-31 Component of the p24 complex; role in misfolded protein quality control; binds to GPI anchor proteins and mediates their efficient transport from the ER to the Golgi; integral membrane protein that associates with endoplasmic reticulum-derived COPII-coated vesicles -S000032658 CDS YGL200C 7 123305 122694 C 2011-02-03 1996-07-31 -S000003166 ORF Verified YGL198W YIP4 chromosome 7 7 123591 124298 W 2011-02-03 2004-01-23|1996-07-31 Protein that interacts with Rab GTPases; localized to late Golgi vesicles; computational analysis of large-scale protein-protein interaction data suggests a possible role in vesicle-mediated transport -S000034057 CDS YGL198W 7 123591 124298 W 2011-02-03 2004-01-23|1996-07-31 -S000003167 ORF Dubious YGL199C chromosome 7 7 124042 123572 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YIP4/YGL198W -S000034896 CDS YGL199C 7 124042 123572 C 2011-02-03 1996-07-31 -S000003165 ORF Verified YGL197W MDS3 chromosome 7 L000003960 7 124698 129161 W 2011-02-03 1996-07-31|2011-02-03 Putative component of the TOR regulatory pathway; negative regulator of early meiotic gene expression; required, with Pmd1p, for growth under alkaline conditions; has an N-terminal kelch-like domain; MDS3 has a paralog, PMD1, that arose from the whole genome duplication -S000033900 CDS YGL197W 7 124698 129161 W 2011-02-03 1996-07-31|2011-02-03 -S000003164 ORF Verified YGL196W DSD1 D-serine ammonia-lyase DSD1 chromosome 7 7 129883 131169 W 2011-02-03 2004-07-19|1996-07-31 D-serine dehydratase (aka D-serine ammonia-lyase); converts D-serine to pyruvate and ammonia by a reaction dependent on pyridoxal 5'-phosphate and zinc; may play a role in D-serine detoxification; L-serine is not a substrate -S000033780 CDS YGL196W 7 129883 131169 W 2011-02-03 2004-07-19|1996-07-31 -S000003163 ORF Verified YGL195W GCN1 AAS103|NDR1 chromosome 7 L000000680 7 131525 139543 W 2011-02-03 1996-07-31 Positive regulator of the Gcn2p kinase activity; forms a complex with Gcn20p; proposed to stimulate Gcn2p activation by an uncharged tRNA -S000033049 CDS YGL195W 7 131525 139543 W 2011-02-03 1996-07-31 -S000087160 ORF Uncharacterized YGL194C-A chromosome 7 7 139961 139719 C 2011-02-03 2005-11-10 Putative protein of unknown function; identified based on comparisons of the genome sequences of six Saccharomyces species; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000087161 CDS YGL194C-A 7 139961 139719 C 2011-02-03 2005-11-10 -S000003162 ORF Verified YGL194C HOS2 histone deacetylase HOS2|RTL1 chromosome 7 L000004092|L000003448 7 141726 140368 C 2011-02-03 1996-07-31 Histone deacetylase and subunit of Set3 and Rpd3L complexes; required for gene activation via specific deacetylation of lysines in H3 and H4 histone tails; subunit of the Set3 complex, a meiotic-specific repressor of sporulation specific genes that contains deacetylase activity; co-localizes with Cmr1p in nuclear foci in response to DNA damage by MMS -S000032901 CDS YGL194C 7 141726 140368 C 2011-02-03 1996-07-31 -S000003161 ORF Uncharacterized YGL193C chromosome 7 7 142227 141916 C 2011-02-03 1996-07-31 Haploid-specific gene repressed by a1-alpha2; turned off in sir3 null strains, absence enhances the sensitivity of rad52-327 cells to campothecin almost 100-fold -S000032793 CDS YGL193C 7 142227 141916 C 2011-02-03 1996-07-31 -S000003160 ORF Verified YGL192W IME4 mRNA (N6-adenosine)-methyltransferase|SPO8 chromosome 7 L000000863|L000002001 7 142246 144048 W -130 2011-02-03 1996-07-31 mRNA N6-adenosine methyltransferase required for entry into meiosis; mediates N6-adenosine methylation of bulk mRNA during the induction of sporulation which includes the meiotic regulators IME1, IME2 and IME4 itself; repressed in haploids via production of antisense IME4 transcripts; transcribed in diploid cells where antisense transcription is repressed; orthologous to human METTL3 (MT-A70) -S000031956 CDS YGL192W 7 142246 144048 W 2011-02-03 1996-07-31 -S000144908 ncRNA_gene RME2 RME2 IME4-AS chromosome 7 7 144120 141898 C 2014-11-18 2014-11-18 Antisense transcript initiated from the 3' end of the IME4 locus; expressed in haploids and interferes with IME4 expression through a cis-acting mechanism; RME2 expression is repressed by the MAT a1/alpha2 repressor complex -S000178098 noncoding_exon RME2 7 144120 141898 C 2014-11-18 2014-11-18 -S000003159 ORF Verified YGL191W COX13 cytochrome c oxidase subunit VIa chromosome 7 L000000397 7 144808 145197 W 2011-02-03 1996-07-31 Subunit VIa of cytochrome c oxidase; present in a subclass of cytochrome c oxidase complexes that may have a role in mimimizing generation of reactive oxygen species; not essential for cytochrome c oxidase activity but may modulate activity in response to ATP; required for assembly of Rcf2p into cytochrome c oxidase - cytochrome bc1 supercomplexes -S000031830 CDS YGL191W 7 144808 145197 W 2011-02-03 1996-07-31 -S000003158 ORF Verified YGL190C CDC55 TMR4|protein phosphatase 2A regulatory subunit CDC55 chromosome 7 L000000282|S000029602|L000003191 7 147389 145809 C -125 2011-02-03 1996-07-31 Regulatory subunit B of protein phosphatase 2A (PP2A); Zds1p/2p-dependent localization to cytoplasm promotes mitotic entry; localization to nucleus prevents mitotic exit; required for correct nuclear division, chromosome segregation during achiasmate meiosis; maintains nucleolar sequestration of Cdc14p during early meiosis; limits formation of PP2A-Rts1p holocomplexes to ensure timely dissolution of sister chromosome cohesion; homolog of mammalian B55 -S000031647 CDS YGL190C 7 147389 145809 C 2011-02-03 1996-07-31 -S000003157 ORF Verified YGL189C RPS26A eS26|ribosomal 40S subunit protein S26A|S26e|S26A|RPS26 chromosome 7 L000003256|L000001762 7 148588 148229 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S26, no bacterial homolog; RPS26A has a paralog, RPS26B, that arose from the whole genome duplication; human homolog can partially complement an RPS26A, RPS26B double null mutant; mutations in the human gene are associated with Diamond-Blackfan anemia -S000031468 CDS YGL189C 7 148588 148229 C 2011-02-03 1996-07-31 -S000122100 five_prime_UTR_intron YGL189C 7 148966 148599 C 2011-02-03 2007-04-04 -S000028635 ORF Uncharacterized YGL188C-A chromosome 7 7 148964 148824 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000032391 CDS YGL188C-A 7 148964 148824 C 2011-02-03 2003-07-29 -S000003156 ORF Dubious YGL188C chromosome 7 7 149516 149343 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030546 CDS YGL188C 7 149516 149343 C 2011-02-03 1996-07-31 -S000003155 ORF Verified YGL187C COX4 cytochrome c oxidase subunit IV chromosome 7 L000000386 7 150171 149704 C 2011-02-03 1996-07-31 Subunit IV of cytochrome c oxidase; the terminal member of the mitochondrial inner membrane electron transport chain; precursor N-terminal 25 residues are cleaved during mitochondrial import; phosphorylated; spermidine enhances translation -S000030404 CDS YGL187C 7 150171 149704 C 2011-02-03 1996-07-31 -S000122089 five_prime_UTR_intron YGL187C 7 150525 150184 C 2011-02-03 2007-03-28 -S000003154 ORF Verified YGL186C TPN1 chromosome 7 7 152776 151037 C 2011-02-03 1996-07-31 Plasma membrane pyridoxine (vitamin B6) transporter; member of the purine-cytosine permease subfamily within the major facilitator superfamily; proton symporter with similarity to Fcy21p, Fcy2p, and Fcy22p -S000030268 CDS YGL186C 7 152776 151037 C 2011-02-03 1996-07-31 -S000003153 ORF Uncharacterized YGL185C putative hydroxyacid dehydrogenase chromosome 7 7 154306 153167 C 2011-02-03 1996-07-31 Putative protein with sequence similar to hydroxyacid dehydrogenases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000037513 CDS YGL185C 7 154306 153167 C 2011-02-03 1996-07-31 -S000003152 ORF Verified YGL184C STR3 cystathionine beta-lyase STR3 chromosome 7 7 156012 154615 C 2011-02-03 1996-07-31 Peroxisomal cystathionine beta-lyase; converts cystathionine into homocysteine; may be redox regulated by Gto1p; involved in the release of the aromatic thiol 3-mercaptohexanol during wine fermentation -S000037385 CDS YGL184C 7 156012 154615 C 2011-02-03 1996-07-31 -S000003151 ORF Verified YGL183C MND1 chromosome 7 7 157285 156543 C 2011-02-03 2003-01-07|1996-07-31 Protein required for recombination and meiotic nuclear division; forms a complex with Hop2p, which is involved in chromosome pairing and repair of meiotic double-strand breaks -S000037289 CDS YGL183C 7 157199 156543 C 2011-02-03 2003-01-07|1996-07-31 -S000037288 CDS YGL183C 7 157285 157283 C 2011-02-03 2003-01-07 -S000037290 intron YGL183C 7 157282 157200 C 2011-02-03 2003-01-07 -S000003150 ORF Dubious YGL182C chromosome 7 7 157596 157273 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MND1/YGL183C -S000036583 CDS YGL182C 7 157596 157273 C 2011-02-03 1996-07-31 -S000003149 ORF Verified YGL181W GTS1 LSR1|FHT1 chromosome 7 L000000743 7 157906 159096 W 2011-02-03 1996-07-31 Protein involved in Arf3p regulation and in transcription regulation; localizes to the nucleus and to endocytic patches; contains an N-terminal Zn-finger and ArfGAP homology domain, a C-terminal glutamine-rich region, and a UBA (ubiquitin associated) domain; gts1 mutations affect budding, cell size, heat tolerance, sporulation, life span, ultradian rhythms, endocytosis; expression oscillates in a pattern similar to metabolic oscillations -S000036556 CDS YGL181W 7 157906 159096 W 2011-02-03 1996-07-31 -S000003148 ORF Verified YGL180W ATG1 serine/threonine protein kinase ATG1|APG1|CVT10|AUT3 chromosome 7 L000003955|S000028502|L000004761 7 160065 162758 W 2011-02-03 1996-07-31 Protein serine/threonine kinase; required for vesicle formation in autophagy and the cytoplasm-to-vacuole targeting (Cvt) pathway; structurally required for phagophore assembly site formation; during autophagy forms a complex with Atg13p and Atg17p; essential for cell cycle progression from G2/M to G1 under nitrogen starvation -S000036454 CDS YGL180W 7 160065 162758 W 2011-02-03 1996-07-31 -S000118453 ARS ARS707 ARSVII-163 chromosome 7 7 163218 163318 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000119020 ARS_consensus_sequence ARS707 7 163236 163250 W 2011-02-03 2006-10-03 -S000003147 ORF Verified YGL179C TOS3 serine/threonine protein kinase TOS3 chromosome 7 7 165091 163409 C 2011-02-03 1996-07-31 Protein kinase; related to and functionally redundant with Elm1p and Sak1p for the phosphorylation and activation of Snf1p; functionally orthologous to LKB1, a mammalian kinase associated with Peutz-Jeghers cancer-susceptibility syndrome; TOS3 has a paralog, SAK1, that arose from the whole genome duplication -S000035343 CDS YGL179C 7 165091 163409 C 2011-02-03 1996-07-31 -S000003146 ORF Verified YGL178W MPT5 UTH4|PUF5|HTR1 chromosome 7 L000001146 7 167352 170571 W 2011-02-03 1996-07-31 mRNA-binding protein of the PUF family; binds to specific mRNAs, often in the 3' UTR; has broad specificity and binds to more than 1000 mRNAs (16% of the transcriptome); recruits the CCR4-NOT deadenylase complex to mRNAs along with Dhh1p and Dcp1p to promote deadenylation, decapping, and decay; also interacts with the Caf20p translational initiation repressor, affecting its mRNA target specificity -S000034396 CDS YGL178W 7 167352 167354 W 2011-02-03 1996-07-31 -S000034397 CDS YGL178W 7 167995 170571 W 2011-02-03 1996-07-31 -S000034398 intron YGL178W 7 167355 167994 W 2011-02-03 1996-07-31 -S000003145 ORF Dubious YGL177W chromosome 7 7 167559 167906 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034289 CDS YGL177W 7 167559 167906 W 2011-02-03 1996-07-31 -S000003144 ORF Uncharacterized YGL176C chromosome 7 7 173079 171415 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant is viable and has no detectable phenotype -S000033315 CDS YGL176C 7 173079 171415 C 2011-02-03 1996-07-31 -S000003143 ORF Verified YGL175C SAE2 ssDNA endodeoxyribonuclease SAE2|COM1 chromosome 7 L000002892 7 174322 173285 C 2011-02-03 1996-07-31 Endonuclease required for telomere elongation; required for telomeric 5' C-rich strand resection; involved in ds-break repair and processing hairpin DNA structures with the MRX complex; function requires sumoylation and phosphorylation; exists as inactive oligomers that are transiently released into smaller active units by phosphorylation; DNA damage triggers Sae2p removal, so active Sae2p is present only transiently; sequence and functional similarity with human CtIP/RBBP8 -S000033258 CDS YGL175C 7 174322 173285 C 2011-02-03 1996-07-31 -S000003142 ORF Verified YGL174W BUD13 CWC26 chromosome 7 7 174545 175345 W 2011-02-03 1996-07-31 Subunit of the RES complex; RES complex is required for nuclear pre-mRNA retention and splicing; involved in bud-site selection; diploid mutants display a unipolar budding pattern instead of the wild-type bipolar pattern due to a specific defect in MATa1 pre-mRNA splicing which leads to haploid gene expression in diploids -S000033236 CDS YGL174W 7 174545 175345 W 2011-02-03 1996-07-31 -S000003141 ORF Verified YGL173C XRN1 chromatin-binding exonuclease XRN1|KEM1|SKI1|SEP1|RAR5|DST2 chromosome 7 L000000891|L000001902 7 180113 175527 C -111 2011-02-03 1996-07-31 Evolutionarily-conserved 5'-3' exonuclease; component of cytoplasmic processing (P) bodies involved in mRNA decay; also enters the nucleus and positively regulates transcription initiation and elongation; plays a role in microtubule-mediated processes, filamentous growth, ribosomal RNA maturation, and telomere maintenance; activated by the scavenger decapping enzyme Dcs1p -S000033145 CDS YGL173C 7 180113 175527 C 2011-02-03 1996-07-31 -S000003140 ORF Verified YGL172W NUP49 FG-nucleoporin NUP49|NSP49 chromosome 7 L000001290 7 180700 182118 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier; found in stable complex with Nic96p and two other FG-nucleoproteins (Nsp1p and Nup57p) -S000032312 CDS YGL172W 7 180700 182118 W 2011-02-03 1996-07-31 -S000003139 ORF Verified YGL171W ROK1 RNA-dependent ATPase ROK1 chromosome 7 L000003005 7 182390 184084 W 2011-02-03 1996-07-31 RNA-dependent ATPase; involved in pre-rRNA processing at sites A0, A1, and A2, and in control of cell cycle progression; contains two upstream open reading frames (uORFs) in 5' untranslated region which regulate translation -S000032238 CDS YGL171W 7 182390 184084 W 2011-02-03 1996-07-31 -S000003138 ORF Verified YGL170C SPO74 chromosome 7 7 185394 184153 C 2011-02-03 1996-07-31 Component of the meiotic outer plaque of the spindle pole body; involved in modifying the meiotic outer plaque that is required prior to prospore membrane formation -S000032119 CDS YGL170C 7 185394 184153 C 2011-02-03 1996-07-31 -S000006622 tRNA_gene tK(CUU)G2 chromosome 7 L000003852 7 185786 185714 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000029890 noncoding_exon tK(CUU)G2 7 185786 185714 C 2011-02-03 2000-05-19 -S000003137 ORF Verified YGL169W SUA5 threonylcarbamoyladenylate synthase chromosome 7 L000002140 7 186059 187339 W -104.06 2011-02-03 1996-07-31 Protein involved in threonylcarbamoyl adenosine biosynthesis; Sua5p and Qri7p are necessary and sufficient for RNA t6A modification in vitro; null mutant lacks N6-threonylcarbamoyl adenosine (t6A) modification in the anticodon loop of ANN-decoding tRNA; member of conserved YrdC/Sua5 family; binds single-stranded telomeric DNA and null mutant has abnormal telomere length -S000031262 CDS YGL169W 7 186059 187339 W 2011-02-03 1996-07-31 -S000003136 ORF Verified YGL168W HUR1 chromosome 7 7 187464 187796 W 2011-02-03 1996-07-31 Protein of unknown function; reported null mutant phenotype of hydroxyurea sensitivity may be due to effects on overlapping PMR1 gene -S000031124 CDS YGL168W 7 187464 187796 W 2011-02-03 1996-07-31 -S000130163 ARS ARS709 chromosome 7 7 187464 187796 2011-02-03 2009-05-07 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000003135 ORF Verified YGL167C PMR1 Ca(2+)/Mn(2+)-transporting P-type ATPase PMR1|SSC1|LDB1|BSD1 chromosome 7 L000004740|L000001455 7 190468 187616 C -104 2011-02-03 1996-07-31 High affinity Ca2+/Mn2+ P-type ATPase; required for Ca2+ and Mn2+ transport into Golgi; involved in Ca2+ dependent protein sorting, processing; D53A mutant (Mn2+ transporting) is rapamycin sensitive, Q783A mutant (Ca2+ transporting) is rapamycin resistant; Mn2+ transport into Golgi lumen required for rapamycin sensitivity; mutations in human homolog ATP2C1 cause acantholytic skin condition Hailey-Hailey disease; human ATP2C1 can complement yeast null mutant -S000030956 CDS YGL167C 7 190468 187616 C 2011-02-03 1996-07-31 -S000003134 ORF Verified YGL166W CUP2 ACE1 chromosome 7 L000000439 7 191129 191806 W -101 2011-02-03 1996-07-31 Copper-binding transcription factor; activates transcription of the metallothionein genes CUP1-1 and CUP1-2 in response to elevated copper concentrations; required for regulation of copper genes in response to DNA-damaging reagents; CUP2 has a paralog, HAA1, that arose from the whole genome duplication -S000030040 CDS YGL166W 7 191129 191806 W 2011-02-03 1996-07-31 -S000003133 ORF Dubious YGL165C chromosome 7 7 191976 191398 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CUP2/YGL166W -S000029838 CDS YGL165C 7 191976 191398 C 2011-02-03 1996-07-31 -S000003132 ORF Verified YGL164C YRB30 chromosome 7 7 193300 191978 C 2011-02-03 1996-07-31 RanGTP-binding protein; inhibits RanGAP1 (Rna1p)-mediated GTP hydrolysis of RanGTP (Gsp1p); shares similarity to proteins in other fungi but not in higher eukaryotes -S000037824 CDS YGL164C 7 193300 191978 C 2011-02-03 1996-07-31 -S000003131 ORF Verified YGL163C RAD54 DNA-dependent ATPase RAD54|XRS1 chromosome 7 L000001574 7 196403 193707 C -111 2011-02-03 1996-07-31 DNA-dependent ATPase that stimulates strand exchange; modifies the topology of double-stranded DNA; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; member of the SWI/SNF family of DNA translocases; forms nuclear foci upon DNA replication stress -S000037069 CDS YGL163C 7 196403 193707 C 2011-02-03 1996-07-31 -S000003130 ORF Verified YGL162W SUT1 chromosome 7 L000003483 7 198138 199037 W 2011-02-03 1996-07-31 Zn(II)2Cys6 family transcription factor; positively regulates sterol uptake genes under anaerobic conditions; involved in hypoxic gene expression; represses filamentation-inducing genes during vegetative growth; positively regulates mating with SUT2 by repressing expression of genes that act as mating inhibitors; repressed by STE12; relocalizes from the nucleus to the cytoplasm upon DNA replication stress; SUT1 has a paralog, SUT2, that arose from the whole genome duplication -S000037047 CDS YGL162W 7 198138 199037 W 2011-02-03 1996-07-31 -S000003129 ORF Verified YGL161C YIP5 chromosome 7 7 200142 199210 C 2011-02-03 1996-07-31 Protein that interacts with Rab GTPases; localized to late Golgi vesicles; computational analysis of large-scale protein-protein interaction data suggests a possible role in vesicle-mediated transport -S000036937 CDS YGL161C 7 200142 199210 C 2011-02-03 1996-07-31 -S000003128 ORF Verified YGL160W AIM14 putative metalloreductase|YNO1 chromosome 7 7 200561 202273 W 2011-02-03 1996-07-31 NADPH oxidase localized to the perinuclear ER; produces superoxide from NADPH; overexpression causes MCA1 dependent apoptosis; likely involved in superoxide-mediated regulation of the actin cytoskeleton; member of a conserved superfamily of NADPH oxidases (NOX enzymes); has similarity to iron/copper reductases (FRE1-8), particularly Fre8p -S000036910 CDS YGL160W 7 200561 202273 W 2011-02-03 1996-07-31 -S000003127 ORF Uncharacterized YGL159W chromosome 7 7 202721 203833 W 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant has no detectable phenotype -S000036059 CDS YGL159W 7 202721 203833 W 2011-02-03 1996-07-31 -S000118454 ARS ARS710 ARSVII-204 chromosome 7 7 203914 204155 2011-02-03 2006-08-30|2011-02-03 Autonomously Replicating Sequence -S000119021 ARS_consensus_sequence ARS710 7 203972 203986 W 2011-02-03 2006-10-03 -S000006951 long_terminal_repeat YGLWtau2 chromosome 7 7 204982 205337 W 2011-02-03 2000-05-19 Ty4 LTR -S000006639 tRNA_gene tL(CAA)G1 chromosome 7 L000003821 7 205521 205634 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000034236 intron tL(CAA)G1 7 205559 205590 W 2011-02-03 2000-05-19 -S000034234 noncoding_exon tL(CAA)G1 7 205521 205558 W 2011-02-03 2000-05-19 -S000034235 noncoding_exon tL(CAA)G1 7 205591 205634 W 2011-02-03 2000-05-19 -S000003126 ORF Verified YGL158W RCK1 putative serine/threonine protein kinase RCK1 chromosome 7 L000001592 7 207033 208571 W 2011-02-03 1996-07-31 Protein kinase involved in oxidative stress response; promotes pseudohyphal growth via activation of Ubp3p phosphorylation; identified as suppressor of S. pombe cell cycle checkpoint mutations; RCK1 has a paralog, RCK2, that arose from the whole genome duplication -S000035130 CDS YGL158W 7 207033 208571 W 2011-02-03 1996-07-31 -S000003125 ORF Verified YGL157W ARI1 carbonyl reductase (NADPH-dependent) ARI1 chromosome 7 7 209006 210049 W 2011-02-03 1996-07-31 NADPH-dependent aldehyde reductase; utilizes aromatic and alophatic aldehyde substrates; member of the short-chain dehydrogenase/reductase superfamily -S000034964 CDS YGL157W 7 209006 210049 W 2011-02-03 1996-07-31 -S000003124 ORF Verified YGL156W AMS1 alpha-mannosidase chromosome 7 L000000084 7 210416 213667 W -98 2011-02-03 1996-07-31 Vacuolar alpha mannosidase; involved in free oligosaccharide (fOS) degradation; delivered to the vacuole in a novel pathway separate from the secretory pathway -S000034834 CDS YGL156W 7 210416 213667 W 2011-02-03 1996-07-31 -S000003123 ORF Verified YGL155W CDC43 protein geranylgeranyltransferase type I subunit CDC43|CAL1 chromosome 7 L000000277 7 214081 215211 W -99 2011-02-03 1996-07-31 Beta subunit of geranylgeranyltransferase type I; subunit of the Ram2p-Cdc43p heterodimer that catalyzes the geranylgeranylation of the cysteine residue in proteins containing a C-terminal CaaX sequence ending in Leu or Phe; has substrates important for morphogenesis -S000033923 CDS YGL155W 7 214081 215211 W 2011-02-03 1996-07-31 -S000003122 ORF Verified YGL154C LYS5 holo-[acyl-carrier-protein] synthase chromosome 7 L000000967 7 216096 215278 C -97 2011-02-03 1996-07-31 Phosphopantetheinyl transferase involved in lysine biosynthesis; converts inactive apo-form of Lys2p (alpha-aminoadipate reductase) into catalytically active holo-form by posttranslational addition of phosphopantetheine -S000033755 CDS YGL154C 7 216096 215278 C 2011-02-03 1996-07-31 -S000003121 ORF Verified YGL153W PEX14 chromosome 7 L000004118 7 216273 217298 W 2011-02-03 1996-07-31 Central component of the peroxisomal importomer complex; peroxisomal protein import machinery docking complex component; interacts with both PTS1 (Pex5p) and PTS2 (Pex7p) peroxisomal matrix protein signal recognition factors and membrane receptor Pex13p -S000033715 CDS YGL153W 7 216273 217298 W 2011-02-03 1996-07-31 -S000003120 ORF Dubious YGL152C chromosome 7 7 217369 216692 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF PEX14/YGL153W -S000033004 CDS YGL152C 7 217369 216692 C 2011-02-03 1996-07-31 -S000003119 ORF Verified YGL151W NUT1 SSX4|MED5 chromosome 7 L000003073|S000029517|L000002100 7 217524 220922 W 2011-02-03 1996-07-31 Component of the RNA polymerase II mediator complex; mediator is required for transcriptional activation and also has a role in basal transcription -S000032975 CDS YGL151W 7 217524 220922 W 2011-02-03 1996-07-31 -S000003117 ORF Uncharacterized YGL149W chromosome 7 7 225572 225877 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGL149W is not an essential gene -S000032110 CDS YGL149W 7 225572 225877 W 2011-02-03 1996-07-31 -S000003118 ORF Verified YGL150C INO80 chromatin-remodeling ATPase INO80 chromosome 7 L000004543 7 225573 221104 C 2011-02-03 1996-07-31 ATPase and nucleosome spacing factor; subunit of complex containing actin and actin-related proteins that has chromatin remodeling activity and 3' to 5' DNA helicase activity in vitro; promotes nucleosome shifts in the 3 prime direction; has a role in modulating stress gene transcription -S000032821 CDS YGL150C 7 225573 221104 C 2011-02-03 1996-07-31 -S000003116 ORF Verified YGL148W ARO2 bifunctional chorismate synthase/riboflavin reductase [NAD(P)H] ARO2 chromosome 7 L000000117 7 226399 227529 W -90 2011-02-03 1996-07-31 Bifunctional chorismate synthase and flavin reductase; catalyzes the conversion of 5-enolpyruvylshikimate 3-phosphate (EPSP) to form chorismate, which is a precursor to aromatic amino acids; protein abundance increases in response to DNA replication stress -S000031990 CDS YGL148W 7 226399 227529 W 2011-02-03 1996-07-31 -S000003115 ORF Verified YGL147C RPL9A uL6|ribosomal 60S subunit protein L9A|L6|rp24|YL11|L9A|L8A chromosome 7 L000001708 7 228329 227754 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L9A; homologous to mammalian ribosomal protein L9 and bacterial L6; RPL9A has a paralog, RPL9B, that arose from a single-locus duplication -S000031756 CDS YGL147C 7 228329 227754 C 2011-02-03 1996-07-31 -S000003114 ORF Uncharacterized YGL146C RRT6 chromosome 7 7 229686 228751 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; contains two putative transmembrane spans, but no significant homology to other known proteins -S000030808 CDS YGL146C 7 229686 228751 C 2011-02-03 1996-07-31 -S000003113 ORF Verified YGL145W TIP20 TIP1 chromosome 7 L000002756 7 230243 232348 W 2011-02-03 1996-07-31|2011-02-03 Peripheral membrane protein required for COPI vesicle fusion to the ER; mediates Sey1p-independent homotypic ER fusion; prohibits back-fusion of COPII vesicles with the ER; forms a tethering complex with Sec39p and Dsl1p that interacts with ER SNAREs Sec20p and Use1p -S000030778 CDS YGL145W 7 230243 232348 W 2011-02-03 1996-07-31|2011-02-03 -S000007642 ARS ARS701 ARS137 chromosome 7 7 231907 231981 2011-02-03 2001-03-06 ARS containing only an imperfect match to the core consensus sequence -S000003112 ORF Verified YGL144C ROG1 putative lipase ROG1 chromosome 7 7 234507 232450 C 2011-02-03 1996-07-31 Lipase with specificity for monoacylglycerol; preferred substrate is 1-oleoylglycerol; null mutation affects lipid droplet morphology and overexpression causes increased accumulation of reactive oxygen species -S000030591 CDS YGL144C 7 234507 232450 C 2011-02-03 1996-07-31 -S000003111 ORF Verified YGL143C MRF1 chromosome 7 L000001150 7 235958 234717 C 2011-02-03 1996-07-31 Mitochondrial translation release factor; involved in stop codon recognition and hydrolysis of the peptidyl-tRNA bond during mitochondrial translation; lack of MRF1 causes mitochondrial genome instability -S000037757 CDS YGL143C 7 235958 234717 C 2011-02-03 1996-07-31 -S000003110 ORF Verified YGL142C GPI10 putative glycosylphosphatidylinositol-alpha 1,2 mannosyltransferase chromosome 7 L000004297 7 238119 236269 C 2011-02-03 1996-07-31 Integral membrane protein involved in GPI anchor synthesis; putative alpha 1,2 mannosyltransferase required for addition of the third mannose onto the glycosylphosphatidylinositol (GPI) core structure; human PIG-Bp is a functional homolog -S000037696 CDS YGL142C 7 238119 236269 C 2011-02-03 1996-07-31 -S000003109 ORF Verified YGL141W HUL5 ubiquitin-ubiquitin ligase HUL5 chromosome 7 7 238353 241085 W 2011-02-03 1996-07-31 Multiubiquitin chain assembly factor (E4); proteasome processivity factor that elongates polyUb chains on substrates, opposing Ubp6p, a branched polyubiquitin protease; required for retrograde transport of misfolded proteins during ERAD; required for ubiquitination of a subset of cytosolic misfolded proteins upon heat shock -S000037673 CDS YGL141W 7 238353 241085 W 2011-02-03 1996-07-31 -S000130164 ARS ARS712 chromosome 7 7 241085 241353 2011-02-03 2009-05-07 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000003108 ORF Uncharacterized YGL140C chromosome 7 7 245012 241353 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; contains multiple predicted transmembrane domains -S000037564 CDS YGL140C 7 245012 241353 C 2011-02-03 1996-07-31 -S000003107 ORF Verified YGL139W FLC3 putative flavin adenine dinucleotide transporter|HUF3 chromosome 7 7 245716 248124 W 2011-02-03 1996-07-31 Putative FAD transporter, similar to Flc1p and Flc2p; localized to the ER; FLC3 has a paralog, FLC1, that arose from the whole genome duplication -S000037900 CDS YGL139W 7 245716 248124 W 2011-02-03 1996-07-31 -S000003106 ORF Uncharacterized YGL138C chromosome 7 7 249531 248494 C 2011-02-03 1996-07-31 Putative protein of unknown function; has no significant sequence similarity to any known protein -S000036000 CDS YGL138C 7 249531 248494 C 2011-02-03 1996-07-31 -S000003105 ORF Verified YGL137W SEC27 coatomer subunit beta' chromosome 7 L000001848 7 249869 252738 W 2011-02-03 1996-07-31 Essential beta'-coat protein of the COPI coatomer; involved in ER-to-Golgi and Golgi-to-ER transport; contains WD40 domains that mediate cargo selective interactions; 45% sequence identity to mammalian beta'-COP -S000035921 CDS YGL137W 7 249869 249886 W 2011-02-03 1996-07-31 -S000035922 CDS YGL137W 7 250087 252738 W 2011-02-03 1996-07-31 -S000035923 intron YGL137W 7 249887 250086 W 2011-02-03 1996-07-31 -S000003104 ORF Verified YGL136C MRM2 21S rRNA (uridine2791-2'-O) methyltransferase chromosome 7 7 253859 252897 C 2011-02-03 1996-07-31 Mitochondrial 2' O-ribose methyltransferase; required for methylation of U(2791) in 21S rRNA; MRM2 deletion confers thermosensitive respiration and loss of mitochondrial DNA; has similarity to Spb1p and Trm7p, and to E. coli FtsJ/RrmJ -S000035725 CDS YGL136C 7 253859 252897 C 2011-02-03 1996-07-31 -S000003103 ORF Verified YGL135W RPL1B uL1|ribosomal 60S subunit protein L1B|L1|L1B|SSM2 chromosome 7 L000002658 7 254641 255294 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L1B; N-terminally acetylated; homologous to mammalian ribosomal protein L10A and bacterial L1; RPL1B has a paralog, RPL1A, that arose from the whole genome duplication; rpl1a rpl1b double null mutation is lethal -S000035683 CDS YGL135W 7 254641 255294 W 2011-02-03 1996-07-31 -S000003102 ORF Verified YGL134W PCL10 chromosome 7 L000004042 7 255663 256964 W 2011-02-03 1996-07-31 Pho85p cyclin; recruits, activates, and targets Pho85p cyclin-dependent protein kinase to its substrate; PCL10 has a paralog, PCL8, that arose from the whole genome duplication -S000034682 CDS YGL134W 7 255663 256964 W 2011-02-03 1996-07-31 -S000003101 ORF Verified YGL133W ITC1 chromosome 7 7 257707 261501 W 2011-02-03 1996-07-31 Subunit of ATP-dependent Isw2p-Itc1p chromatin remodeling complex; required for repression of a-specific genes, repression of early meiotic genes during mitotic growth, and repression of INO1; similar to mammalian Acf1p, the regulatory subunit of the mammalian ATP-utilizing chromatin assembly and modifying factor (ACF) complex; ITC1 has a paralog, YPL216W, that arose from the whole genome duplication -S000034589 CDS YGL133W 7 257707 261501 W 2011-02-03 1996-07-31 -S000003100 ORF Dubious YGL132W chromosome 7 7 261580 261915 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SNT2/YGL131C -S000034500 CDS YGL132W 7 261580 261915 W 2011-02-03 1996-07-31 -S000003099 ORF Verified YGL131C SNT2 DNA-binding E3 ubiquitin-protein ligase SNT2 chromosome 7 7 265859 261648 C 2011-02-03 1996-07-31 Subunit of Snt2C complex, RING finger ubiquitin ligase (E3); physically associates with Ecm5p and Rpd3p; along with Ecm5p, recruits Rpd3p to small number of promoters; colocalizes with Ecm5p, independently of Rpd3p, to promoters of stress response genes upon oxidative stress; involved in ubiquitination, degradation of excess histones; interacts with Ubc4p; role in regulating genes encoding amine transporters; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000033546 CDS YGL131C 7 265859 261648 C 2011-02-03 1996-07-31 -S000003098 ORF Verified YGL130W CEG1 mRNA guanylyltransferase chromosome 7 L000000291 7 266145 267524 W 2011-02-03 1996-07-31 Guanylyltransferase involved in mRNA 5' capping; subunit of mRNA capping enzyme, which is a heterotetramer composed of two molecules of Ceg1p and a homodimer of Cet1p, the mRNA 5'-triphosphatase subunit; nuclear import of Ceg1p requires interaction with Cet1p; mammalian capping enzyme is a single bifunctional polypeptide; human homolog RNGTT can complement yeast ceg1 null mutant -S000033518 CDS YGL130W 7 266145 267524 W 2011-02-03 1996-07-31 -S000003097 ORF Verified YGL129C RSM23 mitochondrial 37S ribosomal protein RSM23 chromosome 7 7 269075 267723 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial ribosomal protein of the small subunit; has similarity to mammalian apoptosis mediator proteins; null mutation prevents induction of apoptosis by overproduction of metacaspase Mca1p -S000033944 CDS YGL129C 7 269075 267723 C 2011-02-03 1996-07-31|2011-02-03 -S000003096 ORF Verified YGL128C CWC23 U2-type spliceosomal complex subunit CWC23 chromosome 7 7 270144 269293 C 2011-02-03 2003-09-22|1996-07-31 Component of a complex containing Cef1p; putatively involved in pre-mRNA splicing; has similarity to E. coli DnaJ and other DnaJ-like proteins and to S. pombe Cwf23p -S000033837 CDS YGL128C 7 270144 269293 C 2011-02-03 2003-09-22|1996-07-31 -S000003095 ORF Verified YGL127C SOH1 MED31 chromosome 7 L000001982 7 270775 270392 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; involved in telomere maintenance; conserved with other metazoan MED31 subunits -S000033696 CDS YGL127C 7 270775 270392 C 2011-02-03 1996-07-31 -S000003094 ORF Verified YGL126W SCS3 FIT2B chromosome 7 L000002845 7 270997 272139 W 2011-02-03 1996-07-31 Protein required for inositol prototrophy; required for normal ER membrane biosynthesis; ortholog of the FIT family of proteins involved in triglyceride droplet biosynthesis and homologous to human FIT2; disputed role in the synthesis of inositol phospholipids from inositol -S000033638 CDS YGL126W 7 270997 272139 W 2011-02-03 1996-07-31 -S000003093 ORF Verified YGL125W MET13 methylenetetrahydrofolate reductase (NAD(P)H) MET13|MRPL45|MET11 chromosome 7 L000003570|L000001085 7 272520 274322 W -77 2011-02-03 2003-01-06|1996-07-31 Major isozyme of methylenetetrahydrofolate reductase; catalyzes the reduction of 5,10-methylenetetrahydrofolate to 5-methyltetrahydrofolate in the methionine biosynthesis pathway -S000030346 CDS YGL125W 7 272520 274322 W 2011-02-03 2003-01-06|1996-07-31 -S000003092 ORF Verified YGL124C MON1 AUT12 chromosome 7 7 276714 274780 C 2011-02-03 1996-07-31|2011-02-03 Subunit of a heterodimeric guanine nucleotide exchange factor (GEF); subunit of the Mon1-Ccz1 GEF complex which stimulates nucleotide exchange and activation of Ypt7p, a Rab family GTPase involved in membrane tethering and fusion events at the late endosome and vacuole; GEF activity is stimulated by membrane association and anionic phospholipids; role in localizing Ypt7p to the vacuolar membrane; required for autophagy, the CVT pathway and mitophagy; potential Cdc28 substrate -S000030087 CDS YGL124C 7 276714 274780 C 2011-02-03 1996-07-31|2011-02-03 -S000003091 ORF Verified YGL123W RPS2 uS5|ribosomal 40S subunit protein S2|rp12|Ys5|S5|S4|S2|SUP138|SUP44|SUP38|RPS4 chromosome 7 L000002205 7 277617 278381 W -72 2011-02-03 1996-07-31 Protein component of the small (40S) subunit; essential for control of translational accuracy; phosphorylation by C-terminal domain kinase I (CTDK-I) enhances translational accuracy; methylated on one or more arginine residues by Hmt1p; homologous to mammalian ribosomal protein S2 and bacterial S5 -S000030054 CDS YGL123W 7 277617 278381 W 2011-02-03 1996-07-31 -S000028634 ORF Dubious YGL123C-A chromosome 7 7 277864 277634 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene RPS2/YGL123W -S000032390 CDS YGL123C-A 7 277864 277634 C 2011-02-03 2003-07-29 -S000003090 ORF Verified YGL122C NAB2 mRNA-binding protein NAB2 chromosome 7 L000001227 7 280523 278946 C 2011-02-03 1996-07-31 Nuclear polyadenylated RNA-binding protein; required for nuclear mRNA export and poly(A) tail length control; stimulates RNA polymerase III transcription by enhancing TFIIIB binding to promoters; protects mRNA against decay by the nuclear exosome in a poly(A)-tail-dependent manner; involved in forming export-competent mRNPs in the nucleus; autoregulates mRNA levels; NLS binds Kap104p; protein abundance increases under DNA replication stress; related to human hnRNPs -S000037370 CDS YGL122C 7 280523 278946 C 2011-02-03 1996-07-31 -S000003089 ORF Verified YGL121C GPG1 chromosome 7 7 281157 280777 C 2011-02-03 1996-07-31 Proposed gamma subunit of the heterotrimeric G protein; interacts with the receptor Gpr1p; involved in regulation of pseudohyphal growth; requires Gpb1p or Gpb2p to interact with Gpa2p; overproduction causes prion curing -S000037311 CDS YGL121C 7 281157 280777 C 2011-02-03 1996-07-31 -S000003088 ORF Verified YGL120C PRP43 DEAH-box ATP-dependent RNA helicase PRP43|JA1 chromosome 7 L000003359 7 283937 281634 C 2011-02-03 1996-07-31 RNA helicase in the DEAH-box family; functions in both RNA polymerase I and polymerase II transcript metabolism; catalyzes removal of U2, U5, and U6 snRNPs from the postsplicing lariat-intron ribonucleoprotein complex; required for efficient biogenesis of both small- and large-subunit rRNAs; acts with Sqs1p to promote 20S to 18S rRNA processing catalyzed by endonuclease Nob1p -S000037207 CDS YGL120C 7 283937 281634 C 2011-02-03 1996-07-31 -S000003087 ORF Verified YGL119W COQ8 protein kinase COQ8|ABC1 chromosome 7 L000000010 7 284442 285947 W 2011-02-03 1996-07-31 ATPase required for ubiquinone biosynthesis and respiratory growth; maintains levels of CoQ biosynthetic proteins; binds to CoQ biosynthesis intermediates; UbiB protein kinase-like family member that lacks canonical protein kinase activity; similar to prokaryotic proteins involved in ubiquinone biosynthesis; human homolog ADCK3 complements a coq8 null, is associated with CoQ and respiratory-chain deficiencies, and is mutated in autosomal-recessive cerebellar ataxia type 2 -S000037639 CDS YGL119W 7 284442 285947 W 2011-02-03 1996-07-31 -S000118455 ARS ARS714 ARSVII-286 chromosome 7 7 285991 286081 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000119022 ARS_consensus_sequence ARS714 7 286004 286018 W 2011-02-03 2006-10-03 -S000006771 tRNA_gene tW(CCA)G1 chromosome 7 L000003851 7 287455 287350 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis -S000032524 intron tW(CCA)G1 7 287419 287386 C 2011-02-03 2000-05-19 -S000032523 noncoding_exon tW(CCA)G1 7 287385 287350 C 2011-02-03 2000-05-19 -S000032522 noncoding_exon tW(CCA)G1 7 287455 287420 C 2011-02-03 2000-05-19 -S000003086 ORF Uncharacterized YGL118C chromosome 7 7 288451 288014 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGL118C is not an essential gene -S000037518 CDS YGL118C 7 288451 288014 C 2011-02-03 1996-07-31 -S000130165 ARS ARS715 chromosome 7 7 288451 288512 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000003085 ORF Uncharacterized YGL117W chromosome 7 7 288512 289309 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000037461 CDS YGL117W 7 288512 289309 W 2011-02-03 1996-07-31 -S000003084 ORF Verified YGL116W CDC20 ubiquitin-protein transferase activating protein CDC20|PAC5 chromosome 7 L000000259 7 289809 291641 W -70 2011-02-03 1996-07-31 Activator of anaphase-promoting complex/cyclosome (APC/C); APC/C is required for metaphase/anaphase transition; directs ubiquitination of mitotic cyclins, Pds1p, and other anaphase inhibitors; cell-cycle regulated; potential Cdc28p substrate; relative distribution to the nucleus increases upon DNA replication stress -S000032000 CDS YGL116W 7 289809 291641 W 2011-02-03 1996-07-31 -S000003083 ORF Verified YGL115W SNF4 AMP-activated serine/threonine-protein kinase regulatory subunit SNF4|SCI1|CAT3 chromosome 7 L000001947 7 292033 293001 W 2011-02-03 1996-07-31 Activating gamma subunit of the AMP-activated Snf1p kinase complex; additional subunits of the complex are Snf1p and a Sip1p/Sip2p/Gal83p family member; activates glucose-repressed genes, represses glucose-induced genes; role in sporulation, and peroxisome biogenesis; protein abundance increases in response to DNA replication stress -S000031879 CDS YGL115W 7 292033 293001 W 2011-02-03 1996-07-31 -S000003082 ORF Uncharacterized YGL114W OPT3 chromosome 7 7 293460 295637 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted member of the oligopeptide transporter (OPT) family of membrane transporters -S000031734 CDS YGL114W 7 293460 295637 W 2011-02-03 1996-07-31 -S000003081 ORF Verified YGL113W SLD3 chromosome 7 7 295932 297938 W 2011-02-03 1996-07-31 Protein involved in the initiation of DNA replication; required for proper assembly of replication proteins at the origins of replication; interacts with Cdc45p; localizes to nuclear foci that become diffuse upon DNA replication stress; homologous to the human Treslin/Ticrr protein -S000036243 CDS YGL113W 7 295932 297938 W 2011-02-03 1996-07-31 -S000003080 ORF Verified YGL112C TAF6 TafII60|TAF60 chromosome 7 L000002828 7 299728 298178 C 2011-02-03 1996-07-31 Subunit (60 kDa) of TFIID and SAGA complexes; involved in transcription initiation of RNA polymerase II and in chromatin modification, similar to histone H4; relocalizes to the cytosol in response to hypoxia -S000036054 CDS YGL112C 7 299728 298178 C 2011-02-03 1996-07-31 -S000003079 ORF Verified YGL111W NSA1 ribosome biosynthesis protein NSA1 chromosome 7 7 299978 301369 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; involved in 60S ribosomal subunit biogenesis -S000035260 CDS YGL111W 7 299978 301369 W 2011-02-03 1996-07-31 -S000003078 ORF Verified YGL110C CUE3 chromosome 7 7 303411 301537 C 2011-02-03 1996-07-31 Protein of unknown function; has a CUE domain that binds ubiquitin, which may facilitate intramolecular monoubiquitination -S000035107 CDS YGL110C 7 303411 301537 C 2011-02-03 1996-07-31 -S000003077 ORF Dubious YGL109W chromosome 7 7 303513 303836 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized gene YGL108C -S000034172 CDS YGL109W 7 303513 303836 W 2011-02-03 1996-07-31|2011-02-03 -S000003076 ORF Verified YGL108C chromosome 7 7 304071 303649 C 2011-02-03 1996-07-31 Protein of unknown function, predicted to be palmitoylated; SWAT-GFP, seamless-GFP and mCherry C-terminal fusion proteins localize to the cytosol, while N-terminal GFP fusion protein localizes to the cell periphery; protein abundance increases in response to DNA replication stress -S000034006 CDS YGL108C 7 304071 303649 C 2011-02-03 1996-07-31 -S000003075 ORF Verified YGL107C RMD9 chromosome 7 7 306273 304333 C 2011-02-03 1996-07-31 Mitochondrial protein required for respiratory growth; mutant phenotype and genetic interactions suggest a role in delivering mt mRNAs to ribosomes; located on matrix face of the inner membrane and loosely associated with mitoribosomes; RMD9 has a paralog, YBR238C, that arose from the whole genome duplication -S000033204 CDS YGL107C 7 306273 304333 C 2011-02-03 1996-07-31 -S000003074 ORF Verified YGL106W MLC1 chromosome 7 L000004170 7 306560 307009 W 2011-02-03 1996-07-31 Essential light chain for Myo1p; light chain for Myo2p; stabilizes Myo2p by binding to the neck region; interacts with Myo1p, Iqg1p, and Myo2p to coordinate formation and contraction of the actomyosin ring with targeted membrane deposition -S000033181 CDS YGL106W 7 306560 307009 W 2011-02-03 1996-07-31 -S000003073 ORF Verified YGL105W ARC1 chromosome 7 L000003553 7 307437 308567 W 2011-02-03 1996-07-31 Protein that binds tRNA and methionyl- and glutamyl-tRNA synthetases; involved in tRNA delivery, stimulating catalysis, and ensuring localization; also binds quadruplex nucleic acids; protein abundance increases in response to DNA replication stress; methionyl-tRNA synthetase is Mes1p; glutamyl-tRNA synthetase is Gus1p -S000033089 CDS YGL105W 7 307437 308567 W 2011-02-03 1996-07-31 -S000003072 ORF Verified YGL104C VPS73 putative sugar transporter chromosome 7 7 310173 308713 C 2011-02-03 1996-07-31 Mitochondrial protein; mutation affects vacuolar protein sorting; putative transporter; member of the sugar porter family; VPS73 has a paralog, YBR241C, that arose from the whole genome duplication -S000032120 CDS YGL104C 7 310173 308713 C 2011-02-03 1996-07-31 -S000003071 ORF Verified YGL103W RPL28 uL15|ribosomal 60S subunit protein L28|L15|rp44|YL24|L29|L28|CYH2 chromosome 7 L000000454 7 310967 311927 W -64 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L28; homologous to mammalian ribosomal protein L27A and bacterial L15; may have peptidyl transferase activity; can mutate to cycloheximide resistance -S000032088 CDS YGL103W 7 310967 311015 W 2011-02-03 1996-07-31 -S000032089 CDS YGL103W 7 311527 311927 W 2011-02-03 1996-07-31 -S000032090 intron YGL103W 7 311016 311526 W 2011-02-03 1996-07-31 -S000003070 ORF Dubious YGL102C chromosome 7 7 311933 311505 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 3' end of essential RPL28 gene encoding a large subunit ribosomal protein -S000031837 CDS YGL102C 7 311933 311505 C 2011-02-03 1996-07-31 -S000003069 ORF Uncharacterized YGL101W chromosome 7 7 312193 312840 W 2011-02-03 1996-07-31 Protein of unknown function; non-essential gene; interacts with the DNA helicase Hpr5p; YGL101W has a paralog, YBR242W, that arose from the whole genome duplication -S000031742 CDS YGL101W 7 312193 312840 W 2011-02-03 1996-07-31 -S000003068 ORF Verified YGL100W SEH1 chromosome 7 L000003153 7 313234 314283 W 2011-02-03 1996-07-31 Subunit of the Nup84 nuclear pore and SEACAT subcomplexes; involved in nucleocytoplasmic transport and NPC biogenesis in the nuclear pore subcomplex; subunit of SEACAT, a subcomplex of the SEA complex that inhibits the TORC1 inhibitory role of SEACIT (Iml1p-Npr2p-Npr3p), a GAP for Gtr1p in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; human SEH1 homolog -S000030802 CDS YGL100W 7 313234 314283 W 2011-02-03 1996-07-31 -S000003067 ORF Verified YGL099W LSG1 putative GTPase LSG1|KRE35 chromosome 7 7 314631 316553 W 2011-02-03 1996-07-31 Putative GTPase involved in 60S ribosomal subunit biogenesis; required for the release of Nmd3p from 60S subunits in the cytoplasm -S000032465 CDS YGL099W 7 314631 316553 W 2011-02-03 1996-07-31 -S000028467 snoRNA_gene snR82 SNR82 RUF2 chromosome 7 7 316788 317055 W 2011-02-03 2003-03-06 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U1110, U2349, and U2351 -S000030074 noncoding_exon snR82 7 316788 317055 W 2011-02-03 2003-03-06 -S000003066 ORF Verified YGL098W USE1 SNAP receptor USE1|SLT1 chromosome 7 7 317342 318079 W 2011-02-03 1996-07-31 Essential SNARE protein localized to the ER; involved in retrograde traffic from the Golgi to the ER and Sey1p-independent homotypic ER fusion; required for efficient nuclear fusion during mating; forms a complex with the SNAREs Sec22p, Sec20p and Ufe1p -S000032364 CDS YGL098W 7 317342 318079 W 2011-02-03 1996-07-31 -S000006942 long_terminal_repeat YGLWdelta4 chromosome 7 7 318697 318860 W 2011-02-03 2000-05-19 Ty1 LTR -S000006936 long_terminal_repeat YGLCdelta5 chromosome 7 7 319341 319009 C 2011-02-03 2000-05-19 Ty1 LTR -S000006937 long_terminal_repeat YGLCsigma1 chromosome 7 7 319762 319423 C 2011-02-03 2000-05-19 Ty3 LTR -S000006596 tRNA_gene tH(GUG)G2 chromosome 7 L000003853 7 319781 319852 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000036200 noncoding_exon tH(GUG)G2 7 319781 319852 W 2011-02-03 2000-05-19 -S000006939 long_terminal_repeat YGLCtau3 chromosome 7 7 320707 320355 C 2011-02-03 2000-05-19 Ty4 LTR -S000003065 ORF Verified YGL097W SRM1 Ran guanyl-nucleotide exchange factor|TSM437|PRP20|MTR1 chromosome 7 L000002058|L000001216|S000029621|L000002370 7 321782 323230 W 2011-02-03 1996-07-31 Nucleotide exchange factor for Gsp1p; localizes to the nucleus, required for nucleocytoplasmic trafficking of macromolecules; suppressor of the pheromone response pathway; potentially phosphorylated by Cdc28p; human homolog of the RAN GEF, RCC1, can complement a temperature sensitive point mutant -S000032259 CDS YGL097W 7 321782 323230 W 2011-02-03 1996-07-31 -S000003064 ORF Verified YGL096W TOS8 chromosome 7 7 325331 326161 W 2011-02-03 1996-07-31 Homeodomain-containing protein and putative transcription factor; found associated with chromatin; target of SBF transcription factor; induced during meiosis and under cell-damaging conditions; TOS8 has a paralog, CUP9, that arose from the whole genome duplication -S000031260 CDS YGL096W 7 325331 326161 W 2011-02-03 1996-07-31 -S000006943 long_terminal_repeat YGLWdelta6 chromosome 7 7 327904 328224 W 2011-02-03 2000-05-19 Ty1 LTR -S000006553 tRNA_gene tE(UUC)G1 SOE1 chromosome 7 L000003823|L000001980 7 328583 328654 W -63 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; can mutate to become a missense suppressor tRNA that inserts glutamate residues at lysine codons; target of K. lactis zymocin -S000034645 noncoding_exon tE(UUC)G1 7 328583 328654 W 2011-02-03 2000-05-19 -S000003063 ORF Verified YGL095C VPS45 VPL28|STT10 chromosome 7 L000002478 7 330607 328874 C 2011-02-03 1996-07-31 Protein of the Sec1p/Munc-18 family; essential for vacuolar protein sorting; required for the function of Pep12p and the early endosome/late Golgi SNARE Tlg2p; essential for fusion of Golgi-derived vesicles with the prevacuolar compartment -S000031062 CDS YGL095C 7 330607 328874 C 2011-02-03 1996-07-31 -S000003062 ORF Verified YGL094C PAN2 poly(A)-specific ribonuclease chromosome 7 L000003115 7 334465 331118 C 2011-02-03 1996-07-31 Catalytic subunit of the Pan2p-Pan3p poly(A)-ribonuclease complex; complex acts to control poly(A) tail length and regulate the stoichiometry and activity of postreplication repair complexes -S000030953 CDS YGL094C 7 334465 331118 C 2011-02-03 1996-07-31 -S000003061 ORF Verified YGL093W SPC105 chromosome 7 L000004697 7 334886 337639 W 2011-02-03 1996-07-31 Subunit of a kinetochore-microtubule binding complex; complex bridges centromeric heterochromatin and kinetochore MAPs and motors; required for sister chromatid bi-orientation and kinetochore binding of SAC components; complex also includes Kre28p; modified by sumoylation -S000030038 CDS YGL093W 7 334886 337639 W 2011-02-03 1996-07-31 -S000003060 ORF Verified YGL092W NUP145 nucleocytoplasmic transporter NUP145|RAT10 chromosome 7 L000001294 7 337906 341859 W 2011-02-03 1996-07-31 Essential protein with distinct roles in two nuclear pore subcomplexes; catalyzes its own proteolytic cleavage in vivo to generate a C-terminal fragment that is a structural component of the Nup84p subcomplex (with roles in NPC biogenesis and localization of genes to the nuclear periphery), and an N-terminal fragment that is one of several FG-nucleoporins within the NPC central core directly responsible for nucleocytoplasmic transport; homologous to human NUP98 -S000029907 CDS YGL092W 7 337906 341859 W 2011-02-03 1996-07-31 -S000003059 ORF Verified YGL091C NBP35 Fe-S cluster-binding ATPase chromosome 7 L000003338 7 343042 342056 C 2011-02-03 1996-07-31 Essential cytoplasmic iron-sulfur cluster binding protein; forms a complex with Cfd1p that is involved in iron-sulfur protein assembly in the cytosol; similar to P-loop NTPases -S000037170 CDS YGL091C 7 343042 342056 C 2011-02-03 1996-07-31 -S000003058 ORF Verified YGL090W LIF1 chromosome 7 L000004541 7 343319 344584 W 2011-02-03 1996-07-31 Component of the DNA ligase IV complex; this complex mediates nonhomologous end joining in DNA double-strand break repair; physically interacts with Dnl4p and Nej1p; homologous to mammalian XRCC4 protein -S000037116 CDS YGL090W 7 343319 344584 W 2011-02-03 1996-07-31 -S000003057 ORF Verified YGL089C MF(ALPHA)2 chromosome 7 L000001095 7 345153 344791 C -58 2011-02-03 1996-07-31 Mating pheromone alpha-factor, made by alpha cells; interacts with mating type a cells to induce cell cycle arrest and other responses leading to mating; also encoded by MF(ALPHA)1, which is more highly expressed; binds copper(II) ions -S000036327 CDS YGL089C 7 345153 344791 C 2011-02-03 1996-07-31 -S000003056 ORF Dubious YGL088W chromosome 7 7 345836 346201 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps snR10, a snoRNA required for preRNA processing -S000036288 CDS YGL088W 7 345836 346201 W 2011-02-03 1996-07-31 -S000007499 snoRNA_gene snR10 SNR10 chromosome 7 7 345986 346230 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); essential gene required for for preRNA processing, specifically for cleavage at sites A1 and A2; also guides pseudouridylation of large subunit (LSU) rRNA at position U2923 -S000036589 noncoding_exon snR10 7 345986 346230 W 2011-02-03 2000-05-19 -S000003055 ORF Verified YGL087C MMS2 E2 ubiquitin-conjugating protein MMS2 chromosome 7 L000004015 7 346904 346406 C 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme variant; involved in error-free postreplication repair; forms a heteromeric complex with Ubc13p, an active ubiquitin-conjugating enzyme; cooperates with chromatin-associated RING finger proteins, Rad18p and Rad5p; protein abundance increases in response to DNA replication stress -S000036106 CDS YGL087C 7 346808 346406 C 2011-02-03 1996-07-31 -S000036105 CDS YGL087C 7 346904 346894 C 2011-02-03 1996-07-31 -S000036107 intron YGL087C 7 346893 346809 C 2011-02-03 1996-07-31 -S000003054 ORF Verified YGL086W MAD1 coiled-coil domain-containing protein MAD1 chromosome 7 L000000974 7 347119 349368 W 2011-02-03 1996-07-31 Coiled-coil protein involved in spindle-assembly checkpoint; required for inhibition of karyopherin/importin Pse1p (aka Kap121p) upon spindle assembly checkpoint arrest; phosphorylated by Mps1p upon checkpoint activation which leads to inhibition of anaphase promoting complex activity; forms a complex with Mad2p; gene dosage imbalance between MAD1 and MAD2 leads to chromosome instability -S000035277 CDS YGL086W 7 347119 349368 W 2011-02-03 1996-07-31 -S000003053 ORF Uncharacterized YGL085W LCL3 chromosome 7 7 349616 350440 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutant has long chronological lifespan; has homology to Staphylococcus aureus nuclease; GFP-fusion protein localizes to mitochondria; is induced in response to the DNA-damaging agent MMS -S000035126 CDS YGL085W 7 349616 350440 W 2011-02-03 1996-07-31 -S000003052 ORF Verified YGL084C GUP1 O-acyltransferase chromosome 7 L000004739 7 352298 350616 C 2011-02-03 1996-07-31 Plasma membrane protein involved in remodeling GPI anchors; member of the MBOAT family of putative membrane-bound O-acyltransferases; role in misfolded protein quality control; proposed to be involved in glycerol transport; homolog of the mammalian Hedgehog pathway modulator HHATL; GUP1 has a paralog, GUP2, that arose from the whole genome duplication -S000034877 CDS YGL084C 7 352298 350616 C 2011-02-03 1996-07-31 -S000118456 ARS ARS716 ARSVII-353 chromosome 7 7 352760 352906 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178100 ARS_consensus_sequence ARS716 7 352865 352849 C 2014-11-18 2014-11-18 -S000003051 ORF Verified YGL083W SCY1 chromosome 7 L000003258 7 353058 355472 W 2011-02-03 1996-07-31 Putative kinase; suppressor of GTPase mutant; similar to bovine rhodopsin kinase; may have a role in intracellular sterol transport -S000034832 CDS YGL083W 7 353058 355472 W 2011-02-03 1996-07-31 -S000003050 ORF Uncharacterized YGL082W chromosome 7 7 355827 356972 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted prenylation/proteolysis target of Afc1p and Rce1p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; not an essential gene; YGL082W has a paralog, YPL191C, that arose from the whole genome duplication -S000033922 CDS YGL082W 7 355827 356972 W 2011-02-03 1996-07-31 -S000003049 ORF Uncharacterized YGL081W chromosome 7 7 357377 358339 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; interacts genetically with CHS5, a gene involved in chitin biosynthesis -S000033825 CDS YGL081W 7 357377 358339 W 2011-02-03 1996-07-31 -S000003048 ORF Verified YGL080W MPC1 pyruvate transporter MPC1|FMP37 chromosome 7 7 358636 359028 W 2011-02-03 1996-07-31 Highly conserved subunit of mitochondrial pyruvate carrier (MPC); MPC is a mitochondrial inner membrane complex that mediates pyruvate uptake and comprises Mpc1p and Mpc2p during fermentative growth, or Mcp1p and Mpc3p during respiratory growth; null mutant displays slow growth that is complemented by expression of human or mouse ortholog; mutation in human ortholog MPC1 is associated with lactic acidosis and hyperpyruvatemia -S000033711 CDS YGL080W 7 358636 359028 W 2011-02-03 1996-07-31 -S000003047 ORF Verified YGL079W KXD1 KIB1 chromosome 7 7 359444 360100 W 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; null mutant is sensitive to drug inducing secretion of vacuolar cargo; GFP-fusion protein localizes to the endosome -S000034302 CDS YGL079W 7 359444 360100 W 2011-02-03 1996-07-31 -S000003046 ORF Verified YGL078C DBP3 RNA-dependent ATPase DBP3 chromosome 7 L000000494 7 361859 360288 C 2011-02-03 1996-07-31 RNA-Dependent ATPase, member of DExD/H-box family; involved in cleavage of site A3 within the ITS1 spacer during rRNA processing; not essential for growth, but deletion causes severe slow-growth phenotype -S000034146 CDS YGL078C 7 361859 360288 C 2011-02-03 1996-07-31 -S000003045 ORF Verified YGL077C HNM1 CTR1 chromosome 7 L000000433|L000000795 7 363916 362225 C 2011-02-03 1996-07-31 Plasma membrane transporter for choline, ethanolamine, and carnitine; involved in the uptake of nitrogen mustard and the uptake of glycine betaine during hypersaline stress; co-regulated with phospholipid biosynthetic genes and negatively regulated by choline and myo-inositol -S000034066 CDS YGL077C 7 363916 362225 C 2011-02-03 1996-07-31 -S000007302 snoRNA_gene snR39 SNR39 chromosome 7 L000003054 7 365251 365163 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A807 -S000036769 noncoding_exon snR39 7 365251 365163 C 2011-02-03 2000-05-19 -S000003044 ORF Verified YGL076C RPL7A uL30|ribosomal 60S subunit protein L7A|YL8|L7A|L6A|L30|rp11 chromosome 7 L000002704|L000003255 7 365996 364335 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L7A; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; contains a conserved C-terminal Nucleic acid Binding Domain (NDB2); binds to Domain II of 25S and 5.8S rRNAs; homologous to mammalian ribosomal protein L7 and bacterial L30; RPL7A has a paralog, RPL7B, that arose from the whole genome duplication -S000032065 CDS YGL076C 7 364964 364335 C 2011-02-03 1996-07-31 -S000032064 CDS YGL076C 7 365526 365433 C 2011-02-03 1996-07-31 -S000032063 CDS YGL076C 7 365996 365986 C 2011-02-03 1996-07-31 -S000032067 intron YGL076C 7 365432 364965 C 2011-02-03 1996-07-31 -S000032066 intron YGL076C 7 365985 365527 C 2011-02-03 1996-07-31 -S000007303 snoRNA_gene snR39B SNR39B chromosome 7 L000003494 7 366469 366374 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G805 -S000030654 noncoding_exon snR39B 7 366469 366374 C 2011-02-03 2000-05-19 -S000003043 ORF Verified YGL075C MPS2 MMC1 chromosome 7 L000004546|L000004250 7 368088 366925 C 2011-02-03 1996-07-31 Essential membrane protein localized at nuclear envelope and SPBs; required for insertion of the newly duplicated spindle pole body into the nuclear envelope; potentially phosphorylated by Cdc28p; MPS2 has a paralog, CSM4, that arose from the whole genome duplication -S000031904 CDS YGL075C 7 368088 366925 C 2011-02-03 1996-07-31 -S000003041 ORF Verified YGL073W HSF1 stress-responsive transcription factor HSF1|MAS3|EXA3 chromosome 7 L000000814 7 368753 371254 W 2011-02-03 1996-07-31 Trimeric heat shock transcription factor; activates multiple genes in response to highly diverse stresses; recognizes variable heat shock elements (HSEs) consisting of inverted NGAAN repeats; monitors translational status of cell through an RQC (Ribosomal Quality Control)-mediated translation-stress signal; involved in diauxic shift; posttranslationally regulated; human homolog HSF1 with linker region mutations can complement yeast hsf1 mutant -S000030864 CDS YGL073W 7 368753 371254 W 2011-02-03 1996-07-31 -S000003042 ORF Dubious YGL074C chromosome 7 7 368922 368596 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 5' end of essential HSF1 gene encoding heat shock transcription factor -S000031746 CDS YGL074C 7 368922 368596 C 2011-02-03 1996-07-31 -S000003040 ORF Dubious YGL072C chromosome 7 7 371362 371003 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene HSF1; null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2 -S000030701 CDS YGL072C 7 371362 371003 C 2011-02-03 1996-07-31 -S000003039 ORF Verified YGL071W AFT1 DNA-binding transcription factor AFT1|RCS1 chromosome 7 L000002660|L000001594 7 372012 374084 W 2011-02-03 1996-07-31 Transcription factor involved in iron utilization and homeostasis; binds consensus site PyPuCACCCPu and activates transcription in response to changes in iron availability; in iron-replete conditions localization is regulated by Grx3p, Grx4p, and Fra2p, and promoter binding is negatively regulated via Grx3p-Grx4p binding; AFT1 has a paralog, AFT2, that arose from the whole genome duplication; relative distribution to the nucleus increases upon DNA replication stress -S000030658 CDS YGL071W 7 372012 374084 W 2011-02-03 1996-07-31 -S000003038 ORF Verified YGL070C RPB9 DNA-directed RNA polymerase II core subunit RPB9|B12.6|SSU73|SHI chromosome 7 L000001683|L000001880 7 374827 374459 C 2011-02-03 1996-07-31 RNA polymerase II subunit B12.6; contacts DNA; mutations affect transcription start site selection and fidelity of transcription -S000037754 CDS YGL070C 7 374827 374459 C 2011-02-03 1996-07-31 -S000003036 ORF Verified YGL068W MNP1 mitochondrial nucleoid protein MNP1 chromosome 7 7 375087 375671 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; has similarity to E. coli L7/L12 and human MRPL7 ribosomal proteins; associates with the mitochondrial nucleoid; required for normal respiratory growth -S000030909 CDS YGL068W 7 375087 375671 W 2011-02-03 1996-07-31 -S000003037 ORF Dubious YGL069C SRF3 chromosome 7 7 375514 375050 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 92% of ORF overlaps the uncharacterized ORF YGL068W; deletion in cyr1 mutant results in loss of stress resistance -S000030942 CDS YGL069C 7 375514 375050 C 2011-02-03 1996-07-31 -S000003035 ORF Verified YGL067W NPY1 NAD(+) diphosphatase chromosome 7 S000007505 7 376101 377255 W 2011-02-03 1996-07-31 NADH diphosphatase (pyrophosphatase); hydrolyzes the pyrophosphate linkage in NADH and related nucleotides; localizes to peroxisomes; nudix hydrolase family member -S000029896 CDS YGL067W 7 376101 377255 W 2011-02-03 1996-07-31 -S000003034 ORF Verified YGL066W SGF73 deubiquitination module subunit SGF73|SCA7 chromosome 7 7 377609 379582 W 2011-02-03 1996-07-31 Subunit of DUBm module of SAGA and SLIK; has roles in anchoring deubiquitination module (DUBm) into SAGA and SLIK complexes, maintaining organization and ubiquitin-binding conformation of Ubp8p, thereby contributing to overall DUBm activity; involved in preinitiation complex assembly at promoters; relocalizes to cytosol under hypoxia; human homolog ATXN7 implicated in spinocerebellar ataxia, and can complement yeast null mutant -S000037894 CDS YGL066W 7 377609 379582 W 2011-02-03 1996-07-31 -S000003033 ORF Verified YGL065C ALG2 GDP-Man:Man(1)GlcNAc(2)-PP-dolichol alpha-1,3-mannosyltransferase chromosome 7 L000002798 7 381271 379760 C 2011-02-03 1996-07-31 Mannosyltransferase in the N-linked glycosylation pathway; catalyzes two consecutive steps in the N-linked glycosylation pathway; alg2 mutants exhibit temperature-sensitive growth and abnormal accumulation of the lipid-linked oligosaccharide Man2GlcNAc2-PP-Dol; human ALG2 complements the temperature sensitivity and dolichol-linked oligosaccharide biosynthesis defect of the alg2-1 mutant, but mutant form from a patient with CDG-Ii fails to complement -S000035998 CDS YGL065C 7 381271 379760 C 2011-02-03 1996-07-31 -S000003032 ORF Verified YGL064C MRH4 ATP-dependent RNA helicase chromosome 7 7 383208 381523 C 2011-02-03 1996-07-31 Mitochondrial ATP-dependent RNA helicase of the DEAD-box family; required for assembly of the large subunit of mitochondrial ribosomes; binds to the large subunit rRNA, 21S_rRNA; localizes to the matrix face of the mitochondrial inner membrane and associates with the large subunit precursor and with mature ribosomes -S000035835 CDS YGL064C 7 383208 381523 C 2011-02-03 1996-07-31 -S000003031 ORF Verified YGL063W PUS2 pseudouridine synthase PUS2 chromosome 7 L000003361 7 383654 384766 W 2011-02-03 1996-07-31|2011-02-03 Mitochondrial tRNA:pseudouridine synthase; acts at positions 27 and 28, but not at position 72; efficiently and rapidly targeted to mitochondria, specifically dedicated to mitochondrial tRNA modification; mutation also affects pseudouridylation of some nuclear-encoded mRNAs; PUS2 has a paralog, PUS1, that arose from the whole genome duplication -S000035805 CDS YGL063W 7 383654 384766 W 2011-02-03 1996-07-31|2011-02-03 -S000028633 ORF Dubious YGL063C-A chromosome 7 7 384651 384502 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032389 CDS YGL063C-A 7 384651 384502 C 2011-02-03 2003-07-29 -S000003030 ORF Verified YGL062W PYC1 pyruvate carboxylase 1 chromosome 7 L000001542 7 385196 388732 W 2011-02-03 1996-07-31 Pyruvate carboxylase isoform; cytoplasmic enzyme that converts pyruvate to oxaloacetate; differentially regulated than isoform Pyc2p; mutations in the human homolog are associated with lactic acidosis; PYC1 has a paralog, PYC2, that arose from the whole genome duplication -S000035682 CDS YGL062W 7 385196 388732 W 2011-02-03 1996-07-31 -S000118457 ARS ARS717 ARSVII-389 chromosome 7 7 388658 388891 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119023 ARS_consensus_sequence ARS717 7 388846 388832 C 2011-02-03 2006-10-03 -S000003029 ORF Verified YGL061C DUO1 chromosome 7 L000004421 7 389711 388968 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); cooperates with Dam1p to connect the DASH complex with microtubules (MT); couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis -S000034613 CDS YGL061C 7 389711 388968 C 2011-02-03 1996-07-31 -S000003028 ORF Verified YGL060W YBP2 YBH1 chromosome 7 7 390065 391990 W 2011-02-03 1996-07-31 Central kinetochore associated protein; mediates mitotic progression; interacts with several central kinetochore proteins and centromeric histone Cse4p; role in resistance to oxidative stress; similar to Slk19p; YBP2 has a paralog, YBP1, that arose from the whole genome duplication -S000034586 CDS YGL060W 7 390065 391990 W 2011-02-03 1996-07-31 -S000003027 ORF Verified YGL059W PKP2 protein kinase PKP2 chromosome 7 7 392223 393698 W 2011-02-03 2003-01-02|1996-07-31|2011-02-03 Mitochondrial protein kinase; negatively regulates activity of the pyruvate dehydrogenase complex by phosphorylating the ser-133 residue of the Pda1p subunit; acts in concert with kinase Pkp1p and phosphatases Ptc5p and Ptc6p; relocalizes from mitochondrion to cytoplasm upon DNA replication stress -S000035146 CDS YGL059W 7 392223 393698 W 2011-02-03 2003-01-02|1996-07-31|2011-02-03 -S000003026 ORF Verified YGL058W RAD6 E2 ubiquitin-conjugating protein RAD6|PSO8|UBC2 chromosome 7 L000001560 7 393986 394504 W -44 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme (E2); involved in postreplication repair as a heterodimer with Rad18p, regulation of K63 polyubiquitination in response to oxidative stress, DSBR and checkpoint control as a heterodimer with Bre1p, ubiquitin-mediated N-end rule protein degradation as a heterodimer with Ubr1p, ERAD with Ubr1p in the absence of canonical ER membrane ligases, and Rpn4p turnover as part of proteasome homeostasis, in complex with Ubr2p and Mub1p -S000035031 CDS YGL058W 7 393986 394504 W 2011-02-03 1996-07-31 -S000003025 ORF Verified YGL057C GEP7 chromosome 7 7 395829 394966 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant exhibits a respiratory growth defect and synthetic interactions with prohibitin (phb1) and gem1; authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000034817 CDS YGL057C 7 395829 394966 C 2011-02-03 1996-07-31 -S000003024 ORF Verified YGL056C SDS23 chromosome 7 L000004692 7 397618 396035 C 2011-02-03 1996-07-31|2011-02-03 Protein involved in cell separation during budding; one of two S. cerevisiae homologs (Sds23p and Sds24p) of the S. pombe Sds23 protein, which is implicated in APC/cyclosome regulation; SDS23 has a paralog, SDS24, that arose from the whole genome duplication -S000033939 CDS YGL056C 7 397618 396035 C 2011-02-03 1996-07-31|2011-02-03 -S000003023 ORF Verified YGL055W OLE1 stearoyl-CoA 9-desaturase|MDM2 chromosome 7 L000001052|L000001297 7 398628 400160 W -37 2011-02-03 1996-07-31 Delta(9) fatty acid desaturase; required for monounsaturated fatty acid synthesis and for normal distribution of mitochondria -S000033893 CDS YGL055W 7 398628 400160 W 2011-02-03 1996-07-31 -S000003022 ORF Verified YGL054C ERV14 cornichon family protein chromosome 7 L000004816 7 401287 400871 C 2011-02-03 1996-07-31 COPII-coated vesicle protein; involved in vesicle formation and incorporation of specific secretory cargo; required for the delivery of bud-site selection protein Axl2p and Nha1p antiporter to cell surface; related to Drosophila cornichon; ERV14 has a paralog, ERV15, that arose from the whole genome duplication -S000033689 CDS YGL054C 7 401287 400871 C 2011-02-03 1996-07-31 -S000006554 tRNA_gene tE(UUC)G2 chromosome 7 L000003850 7 401598 401527 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000034647 noncoding_exon tE(UUC)G2 7 401598 401527 C 2011-02-03 2000-05-19 -S000006949 long_terminal_repeat YGLWsigma2 chromosome 7 7 401616 401894 W 2011-02-03 2000-05-19 Ty3 LTR -S000006944 long_terminal_repeat YGLWdelta7 chromosome 7 7 401959 402290 W 2011-02-03 2000-05-19 Ty1 LTR -S000003021 ORF Verified YGL053W PRM8 pheromone-regulated DUP240 family protein PRM8 chromosome 7 7 402589 403302 W 2011-02-03 1996-07-31 Pheromone-regulated protein; contains with 2 predicted transmembrane segments and an FF sequence, a motif involved in COPII binding; forms a complex with Prp9p in the ER; member of DUP240 gene family; PRM8 has a paralog, PRM9, that arose from a segmental duplication -S000033637 CDS YGL053W 7 402589 403302 W 2011-02-03 1996-07-31 -S000003020 ORF Dubious YGL052W chromosome 7 7 403437 403742 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MST27 -S000030345 CDS YGL052W 7 403437 403742 W 2011-02-03 1996-07-31 -S000003019 ORF Verified YGL051W MST27 DUP240 family protein MST27 chromosome 7 7 403687 404391 W 2011-02-03 1996-07-31 Putative integral membrane protein, involved in vesicle formation; forms complex with Mst28p; member of DUP240 gene family; binds COPI and COPII vesicles; MST27 has a paralog, MST28, that arose from a segmental duplication -S000030145 CDS YGL051W 7 403687 404391 W 2011-02-03 1996-07-31 -S000006945 long_terminal_repeat YGLWdelta8 chromosome 7 7 405004 405145 W 2011-02-03 2000-05-19 Ty1 LTR -S000006946 long_terminal_repeat YGLWdelta9 chromosome 7 7 405146 405207 W 2011-02-03 2000-05-19 Ty1 LTR -S000006938 long_terminal_repeat YGLCsigma3 chromosome 7 7 405453 405208 C 2011-02-03 2000-05-19 Ty3 LTR -S000006711 tRNA_gene tR(UCU)G1 chromosome 7 L000003824 7 405470 405541 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000037328 noncoding_exon tR(UCU)G1 7 405470 405541 W 2011-02-03 2000-05-19 -S000003018 ORF Verified YGL050W TYW3 tRNA methyltransferase TYW3 chromosome 7 7 405776 406597 W 2011-02-03 1996-07-31 tRNA methyltransferase required for synthesis of wybutosine; a modified guanosine found at the 3'-position adjacent to the anticodon of phenylalanine tRNA which supports reading frame maintenance by stabilizing codon-anticodon interactions -S000030037 CDS YGL050W 7 405776 406597 W 2011-02-03 1996-07-31 -S000003017 ORF Verified YGL049C TIF4632 translation initiation factor eIF4G|eIF4G2 chromosome 7 L000002310 7 409604 406860 C 2011-02-03 1996-07-31 Translation initiation factor eIF4G; subunit of the mRNA cap-binding protein complex (eIF4F) that also contains eIF4E (Cdc33p); associates with the poly(A)-binding protein Pab1p, also interacts with eIF4A (Tif1p); TIF4632 has a paralog, TIF4631, that arose from the whole genome duplication -S000030563 CDS YGL049C 7 409604 406860 C 2011-02-03 1996-07-31 -S000003016 ORF Verified YGL048C RPT6 proteasome regulatory particle base subunit RPT6|SUG1|SCB68|CRL3|CIM3 chromosome 7 L000002174|L000000406|L000002265 7 411286 410069 C -43 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; bound by ubiquitin-protein ligases Ubr1p and Ufd4p; localized mainly to the nucleus throughout the cell cycle; protein abundance increases in response to DNA replication stress -S000030499 CDS YGL048C 7 411286 410069 C 2011-02-03 1996-07-31 -S000003015 ORF Verified YGL047W ALG13 N-acetylglucosaminyldiphosphodolichol N-acetylglucosaminyltransferase catalytic subunit ALG13 chromosome 7 7 411552 412160 W 2011-02-03 1996-07-31 Catalytic component of UDP-GlcNAc transferase; required for the second step of dolichyl-linked oligosaccharide synthesis; anchored to the ER membrane via interaction with Alg14p; similar to bacterial and human glycosyltransferases; protein abundance increases in response to DNA replication stress; both human homologs ALG13 and ALG14 are required to complement yeast alg13 mutant -S000030465 CDS YGL047W 7 411552 412160 W 2011-02-03 1996-07-31 -S000006755 tRNA_gene tV(AAC)G1 chromosome 7 L000003849 7 412367 412294 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000036903 noncoding_exon tV(AAC)G1 7 412367 412294 C 2011-02-03 2000-05-19 -S000006947 long_terminal_repeat YGLWdelta10 chromosome 7 7 412456 412725 W 2011-02-03 2000-05-19 Ty1 LTR -S000003013 ORF Verified YGL045W RIM8 ART9|YGL046W|PAL3 chromosome 7 L000004171 7 414102 415730 W 2011-02-03 2003-01-09|1996-07-31 Protein involved in proteolytic activation of Rim101p; part of response to alkaline pH; interacts with ESCRT-1 subunits Stp22p and Vps28p; essential for anaerobic growth; member of the arrestin-related trafficking adaptor family -S000037558 CDS YGL045W 7 414102 415730 W 2011-02-03 2003-01-09|1996-07-31 -S000003012 ORF Verified YGL044C RNA15 chromosome 7 L000001651 7 417036 416146 C 2011-02-03 1996-07-31 Component of the cleavage and polyadenylation factor I (CF I); CF 1, composed of the CF 1A complex (Rna14p, Rna15p, Clp1p, Pcf11p) and Hrp1, is involved in cleavage and polyadenylation of mRNA 3' ends; interacts with the A-rich polyadenylation signal in complex with Rna14p and Hrp1p; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay; required for gene looping and maintenance of genome stability -S000037423 CDS YGL044C 7 417036 416146 C 2011-02-03 1996-07-31 -S000003011 ORF Verified YGL043W DST1 SII|S-II|TFIIS|P37|PPR2 chromosome 7 L000001476|L000000530 7 417483 418412 W 24 2011-02-03 1996-07-31 General transcription elongation factor TFIIS; enables RNA polymerase II to read through blocks to elongation by stimulating cleavage of nascent transcripts stalled at transcription arrest sites; maintains RNAPII elongation activity on ribosomal protein genes during conditions of transcriptional stress -S000031998 CDS YGL043W 7 417483 418412 W 2011-02-03 1996-07-31 -S000003010 ORF Dubious YGL042C chromosome 7 7 418593 418288 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion mutation blocks replication of Brome mosaic virus in S. cerevisiae, but this is likely due to effects on the overlapping gene DST1 -S000031778 CDS YGL042C 7 418593 418288 C 2011-02-03 1996-07-31 -S000028826 ORF Uncharacterized YGL041W-A chromosome 7 7 418825 419289 W 2011-02-03 2003-07-29|2011-02-03 Putative protein of unknown function; conserved in fungi; identified by expression profiling and mass spectrometry -S000033650 CDS YGL041W-A 7 418825 419289 W 2011-02-03 2003-07-29|2011-02-03 -S000028548 ORF Uncharacterized YGL041C-B chromosome 7 7 418886 418704 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000031198 CDS YGL041C-B 7 418886 418704 C 2011-02-03 2003-07-29 -S000003009 ORF Dubious YGL041C chromosome 7 7 419225 419022 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029877 CDS YGL041C 7 419225 419022 C 2011-02-03 1996-07-31|2011-02-03 -S000003008 ORF Verified YGL040C HEM2 porphobilinogen synthase HEM2|OLE4|SLU1 chromosome 7 L000000761 7 420555 419527 C 2011-02-03 1996-07-31 Aminolevulinate dehydratase; a homo-octameric enzyme, catalyzes the conversion of 5-aminolevulinate to porphobilinogen, the second step in heme biosynthesis; enzymatic activity is zinc-dependent; localizes to the cytoplasm and nucleus; human homolog ALAD can complement yeast hem2 mutant -S000036193 CDS YGL040C 7 420555 419527 C 2011-02-03 1996-07-31 -S000118458 ARS ARS718 ARSVII-421 chromosome 7 7 421171 421279 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000119024 ARS_consensus_sequence ARS718 7 421279 421265 C 2011-02-03 2006-10-03 -S000006640 tRNA_gene tL(CAA)G2 SUP54 chromosome 7 L000003825|L000002211 7 423092 423205 W -24 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations -S000034245 intron tL(CAA)G2 7 423130 423161 W 2011-02-03 2000-05-19 -S000034243 noncoding_exon tL(CAA)G2 7 423092 423129 W 2011-02-03 2000-05-19 -S000034244 noncoding_exon tL(CAA)G2 7 423162 423205 W 2011-02-03 2000-05-19 -S000003007 ORF Verified YGL039W carbonyl reductase (NADPH-dependent) chromosome 7 7 423961 425007 W 2011-02-03 1996-07-31 Aldehyde reductase; reduces aliphatic aldehyde substrates using NADH as cofactor; shown to reduce carbonyl compounds to chiral alcohols -S000035325 CDS YGL039W 7 423961 425007 W 2011-02-03 1996-07-31 -S000003006 ORF Verified YGL038C OCH1 LDB12|NGD29 chromosome 7 L000001295 7 426804 425362 C -31.86 2011-02-03 1996-07-31 Mannosyltransferase of the cis-Golgi apparatus; initiates the polymannose outer chain elongation of N-linked oligosaccharides of glycoproteins -S000035173 CDS YGL038C 7 426804 425362 C 2011-02-03 1996-07-31 -S000003005 ORF Verified YGL037C PNC1 nicotinamidase chromosome 7 7 427947 427297 C 2011-02-03 1996-07-31 Nicotinamidase that converts nicotinamide to nicotinic acid; part of the NAD(+) salvage pathway; required for life span extension by calorie restriction; lacks a peroxisomal targeting signal but is imported into peroxisomes via binding to Gpd1p; PNC1 expression responds to all known stimuli that extend replicative life span; protein increases in abundance and relative distribution to cytoplasmic foci decreases upon DNA replication stress -S000034206 CDS YGL037C 7 427947 427297 C 2011-02-03 1996-07-31 -S000003004 ORF Uncharacterized YGL036W chromosome 7 L000003392 7 428601 431330 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YGL036W is not an essential gene -S000034168 CDS YGL036W 7 428601 431330 W 2011-02-03 1996-07-31 -S000003003 ORF Verified YGL035C MIG1 transcription factor MIG1|TDS22|SSN1|CAT4 chromosome 7 L000001110 7 433062 431548 C -27 2011-02-03 1996-07-31 Transcription factor involved in glucose repression; sequence specific DNA binding protein containing two Cys2His2 zinc finger motifs; regulated by the SNF1 kinase and the GLC7 phosphatase; regulates filamentous growth along with Mig2p in response to glucose depletion; activated in stochastic pulses of nuclear localization, shuttling between cytosol and nucleus depending on external glucose levels and its phosphorylation state -S000034005 CDS YGL035C 7 433062 431548 C 2011-02-03 1996-07-31 -S000003002 ORF Uncharacterized YGL034C chromosome 7 7 433579 433214 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGL034C is not an essential gene -S000033200 CDS YGL034C 7 433579 433214 C 2011-02-03 1996-07-31 -S000003001 ORF Verified YGL033W HOP2 chromosome 7 L000004230 7 435625 436401 W 2014-11-18 2000-12-01|2014-11-18|1996-07-31 Meiosis-specific protein that localizes to chromosomes; prevents synapsis between nonhomologous chromosomes and ensures synapsis between homologs; complexes with Mnd1p to promote homolog pairing and meiotic double-strand break repair; heterodimer of Hop2p-Mnd1p stimulates the Dmc1p-mediated strand invasion -S000033177 CDS YGL033W 7 435625 435679 W 2011-02-03 2000-12-01|1996-07-31 -S000033178 CDS YGL033W 7 435750 436312 W 2014-11-18 2000-12-01|2014-11-18|1996-07-31 -S000178097 CDS YGL033W 7 436375 436401 W 2014-11-18 2014-11-18 -S000033179 intron YGL033W 7 435680 435749 W 2011-02-03 2000-12-01|1996-07-31 -S000178096 intron YGL033W 7 436313 436374 W 2014-11-18 2014-11-18 -S000003000 ORF Verified YGL032C AGA2 chromosome 7 L000000062 7 436833 436570 C -23.06 2011-02-03 1996-07-31 Adhesion subunit of a-agglutinin of a-cells; C-terminal sequence acts as a ligand for alpha-agglutinin (Sag1p) during agglutination, modified with O-linked oligomannosyl chains, linked to anchorage subunit Aga1p via two disulfide bonds -S000033030 CDS YGL032C 7 436833 436570 C 2011-02-03 1996-07-31 -S000002999 ORF Verified YGL031C RPL24A eL24|ribosomal 60S subunit protein L24A|L24e|rp29|YL21|L30A|L24A|RPL30A chromosome 7 L000001724 7 437934 437467 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L24A; not essential for translation but may be required for normal translation rate; homologous to mammalian ribosomal protein L24, no bacterial homolog; RPL24A has a paralog, RPL24B, that arose from the whole genome duplication -S000032115 CDS YGL031C 7 437934 437467 C 2011-02-03 1996-07-31 -S000122099 five_prime_UTR_intron YGL031C 7 438397 437942 C 2011-02-03 2007-04-04 -S000002998 ORF Verified YGL030W RPL30 eL30|ribosomal 60S subunit protein L30|L30e|rp73|YL38|L32|L30 chromosome 7 L000001726 7 439091 439638 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L30; involved in pre-rRNA processing in the nucleolus; autoregulates splicing of its transcript; homologous to mammalian ribosomal protein L30, no bacterial homolog -S000032082 CDS YGL030W 7 439091 439093 W 2011-02-03 1996-07-31 -S000032083 CDS YGL030W 7 439324 439638 W 2011-02-03 1996-07-31 -S000032084 intron YGL030W 7 439094 439323 W 2011-02-03 1996-07-31 -S000002997 ORF Verified YGL029W CGR1 chromosome 7 S000007411 7 440063 440425 W 2011-02-03 1996-07-31 Protein involved in nucleolar integrity and processing of pre-rRNA; has a role in processing rRNA for the 60S ribosome subunit; transcript is induced in response to cytotoxic stress but not genotoxic stress; relocalizes from nucleus to nucleolus upon DNA replication stress -S000030962 CDS YGL029W 7 440063 440425 W 2011-02-03 1996-07-31 -S000006565 tRNA_gene tF(GAA)G chromosome 7 L000003848 7 440807 440716 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000035389 intron tF(GAA)G 7 440770 440752 C 2011-02-03 2000-05-19 -S000035388 noncoding_exon tF(GAA)G 7 440751 440716 C 2011-02-03 2000-05-19 -S000035387 noncoding_exon tF(GAA)G 7 440807 440771 C 2011-02-03 2000-05-19 -S000002996 ORF Verified YGL028C SCW11 putative glucan endo-1,3-beta-D-glucosidase chromosome 7 7 442909 441281 C 2011-02-03 1996-07-31 Cell wall protein with similarity to glucanases; may play a role in conjugation during mating based on its regulation by Ste12p -S000030849 CDS YGL028C 7 442909 441281 C 2011-02-03 1996-07-31 -S000002995 ORF Verified YGL027C CWH41 DER7|GLS1 chromosome 7 L000003121|L000000715 7 446143 443642 C 2011-02-03 1996-07-31 Processing alpha glucosidase I; ER type II integral membrane N-glycoprotein involved in assembly of cell wall beta 1,6 glucan and asparagine-linked protein glycosylation; also involved in ER protein quality control and sensing of ER stress -S000029845 CDS YGL027C 7 446143 443642 C 2011-02-03 1996-07-31 -S000002994 ORF Verified YGL026C TRP5 tryptophan synthase TRP5 chromosome 7 L000002356 7 448535 446412 C -22 2011-02-03 1996-07-31 Tryptophan synthase; catalyzes the last step of tryptophan biosynthesis; regulated by the general control system of amino acid biosynthesis -S000037836 CDS YGL026C 7 448535 446412 C 2011-02-03 1996-07-31 -S000002992 ORF Dubious YGL024W SST3 chromosome 7 7 449788 450123 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially/completely overlaps the verified ORF PGD1/YGL025C -S000037721 CDS YGL024W 7 449788 450123 W 2011-02-03 1996-07-31 -S000002993 ORF Verified YGL025C PGD1 MED3|HRS1 chromosome 7 L000000811|L000001408 7 449957 448764 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for basal and activated transcription; direct target of Cyc8p-Tup1p transcriptional corepressor -S000037746 CDS YGL025C 7 449957 448764 C 2011-02-03 2003-09-22|1996-07-31 -S000002991 ORF Verified YGL023C PIB2 chromosome 7 S000007475 7 452104 450197 C 2011-02-03 1996-07-31 Protein of unknown function; contains FYVE domain; similar to Fab1 and Vps27 -S000036924 CDS YGL023C 7 452104 450197 C 2011-02-03 1996-07-31 -S000002990 ORF Verified YGL022W STT3 dolichyl-diphosphooligosaccharide--protein glycosyltransferase subunit STT3 chromosome 7 L000002716 7 452404 454560 W 2011-02-03 1996-07-31 Subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins; forms a subcomplex with Ost3p and Ost4p and is directly involved in catalysis -S000036896 CDS YGL022W 7 452404 454560 W 2011-02-03 1996-07-31 -S000002989 ORF Verified YGL021W ALK1 protein kinase ALK1 chromosome 7 L000002852 7 454785 457067 W 2011-02-03 1996-07-31 Protein kinase; along with its paralog, ALK2, required for proper spindle positioning and nuclear segregation following mitotic arrest, proper organization of cell polarity factors in mitosis, proper localization of formins and polarity factors, and survival in cells that activate spindle assembly checkpoint; phosphorylated in response to DNA damage; ALK1 has a paralog, ALK2, that arose from the whole genome duplication; similar to mammalian haspins -S000036836 CDS YGL021W 7 454785 457067 W 2011-02-03 1996-07-31 -S000002988 ORF Verified YGL020C GET1 GET complex subunit GET1|MDM39 chromosome 7 7 457870 457163 C 2011-02-03 1996-07-31 Subunit of the GET complex; involved in insertion of proteins into the ER membrane; required for the retrieval of HDEL proteins from the Golgi to the ER in an ERD2 dependent fashion and for normal mitochondrial morphology and inheritance -S000035892 CDS YGL020C 7 457870 457163 C 2011-02-03 1996-07-31 -S000002987 ORF Verified YGL019W CKB1 casein kinase 2 regulatory subunit CKB1 chromosome 7 L000002856 7 458156 458992 W 2011-02-03 1996-07-31 Beta regulatory subunit of casein kinase 2 (CK2); a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerases -S000034946 CDS YGL019W 7 458156 458992 W 2011-02-03 1996-07-31 -S000002986 ORF Verified YGL018C JAC1 J-type chaperone JAC1 chromosome 7 L000003591 7 459664 459110 C 2011-02-03 1996-07-31 Specialized J-protein that functions in Fe-S cluster biogenesis; functions with Hsp70 in Fe-S cluster biogenesis in mitochondria; involved in iron metabolism; contains a J domain typical to J-type chaperones; localizes to the mitochondrial matrix -S000034703 CDS YGL018C 7 459664 459110 C 2011-02-03 1996-07-31 -S000002985 ORF Verified YGL017W ATE1 arginyltransferase chromosome 7 L000000137 7 459854 461365 W -12 2011-02-03 1996-07-31 Arginyl-tRNA-protein transferase; catalyzes post-translational conjugation of arginine to the amino termini of acceptor proteins which are then subject to degradation via the N-end rule pathway -S000034655 CDS YGL017W 7 459854 461365 W 2011-02-03 1996-07-31 -S000002984 ORF Verified YGL016W KAP122 PDR6 chromosome 7 L000001366 7 461666 464911 W -10 2011-02-03 1996-07-31 Karyopherin beta; responsible for import of the Toa1p-Toa2p complex into the nucleus; binds to nucleoporins Nup1p and Nup2p; may play a role in regulation of pleiotropic drug resistance -S000033773 CDS YGL016W 7 461666 464911 W 2011-02-03 1996-07-31 -S000002983 ORF Uncharacterized YGL015C chromosome 7 7 465435 465043 C 2011-02-03 1996-07-31 Putative protein of unknown function; null mutants accumulate cargo in the Golgi -S000033596 CDS YGL015C 7 465435 465043 C 2011-02-03 1996-07-31 -S000002982 ORF Verified YGL014W PUF4 YGL023 chromosome 7 7 466141 468807 W 2011-02-03 1996-07-31 Member of the PUF protein family; PUF family is defined by the presence of Pumilio homology domains that confer RNA binding activity; preferentially binds mRNAs encoding nucleolar ribosomal RNA-processing factors -S000033567 CDS YGL014W 7 466141 468807 W 2011-02-03 1996-07-31 -S000028825 ORF Dubious YGL014C-A chromosome 7 7 466398 466237 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry -S000033647 CDS YGL014C-A 7 466398 466237 C 2011-02-03 2003-07-29 -S000002981 ORF Verified YGL013C PDR1 drug-responsive transcription factor PDR1|TPE3|TPE1|TIL1|SMR2|NRA2|CYH3|BOR2|ANT1|AMY1 chromosome 7 L000002984|L000003503|L000001361 7 472298 469092 C -8 2011-02-03 1996-07-31 Transcription factor that regulates the pleiotropic drug response; zinc cluster protein that is a master regulator involved in recruiting other zinc cluster proteins to pleiotropic drug response elements (PDREs) to fine tune the regulation of multidrug resistance genes; relocalizes to the cytosol in response to hypoxia; PDR1 has a paralog, PDR3, that arose from the whole genome duplication -S000032756 CDS YGL013C 7 472298 469092 C 2011-02-03 1996-07-31 -S000002980 ORF Verified YGL012W ERG4 delta(24(24(1)))-sterol reductase chromosome 7 L000000571 7 472855 474276 W 2011-02-03 1996-07-31 C-24(28) sterol reductase; catalyzes the final step in ergosterol biosynthesis; mutants are viable, but lack ergosterol -S000032737 CDS YGL012W 7 472855 474276 W 2011-02-03 1996-07-31 -S000002979 ORF Verified YGL011C SCL1 proteasome core particle subunit alpha 1|PRC2 chromosome 7 L000001812 7 475247 474489 C -8 2011-02-03 1996-07-31 Alpha 1 subunit of the 20S proteasome; involved in the degradation of ubiquitinated substrates; 20S proteasome is the core complex of the 26S proteasome; essential for growth; detected in the mitochondria -S000032541 CDS YGL011C 7 475247 474489 C 2011-02-03 1996-07-31 -S000002978 ORF Verified YGL010W MPO1 chromosome 7 7 475545 476069 W 2011-02-03 1996-07-31 Protein involved in metabolism of phytosphingosine; not an essential gene -S000031636 CDS YGL010W 7 475545 476069 W 2011-02-03 1996-07-31 -S000002977 ORF Verified YGL009C LEU1 3-isopropylmalate dehydratase LEU1 chromosome 7 L000000942 7 478652 476313 C -5 2011-02-03 1996-07-31 Isopropylmalate isomerase; catalyzes the second step in the leucine biosynthesis pathway -S000031584 CDS YGL009C 7 478652 476313 C 2011-02-03 1996-07-31 -S000002976 ORF Verified YGL008C PMA1 H(+)-exporting P2-type ATPase PMA1|KTI10 chromosome 7 L000001449 7 482666 479910 C -2 2011-02-03 1996-07-31 Plasma membrane P2-type H+-ATPase; pumps protons out of cell; major regulator of cytoplasmic pH and plasma membrane potential; long-lived protein asymmetrically distributed at plasma membrane between mother cells and buds; accumulates at high levels in mother cells during aging, buds emerge with very low levels of Pma1p, newborn cells have low levels of Pma1p; Hsp30p plays a role in Pma1p regulation; interactions with Std1p appear to propagate [GAR+] -S000030720 CDS YGL008C 7 482666 479910 C 2011-02-03 1996-07-31 -S000028632 ORF Uncharacterized YGL007C-A chromosome 7 7 483027 482941 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; deletion exhibits slow-growth phenotype; computationally predicted to have a role in cell budding -S000032388 CDS YGL007C-A 7 483027 482941 C 2011-02-03 2003-07-29 -S000002975 ORF Uncharacterized YGL007W BRP1 chromosome 7 7 483260 483637 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; located in the upstream region of PMA1; deletion leads to polyamine resistance due to downregulation of PMA1 -S000030678 CDS YGL007W 7 483260 483637 W 2011-02-03 1996-07-31 -S000118459 ARS ARS719 ARSVII-485 chromosome 7 7 484930 485157 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119025 ARS_consensus_sequence ARS719 7 485110 485096 C 2011-02-03 2006-10-03 -S000028769 ORF Uncharacterized YGL006W-A chromosome 7 7 485423 485533 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE -S000033473 CDS YGL006W-A 7 485423 485533 W 2011-02-03 2003-07-29 -S000002974 ORF Verified YGL006W PMC1 calcium-transporting ATPase PMC1 chromosome 7 L000001451 7 485921 489442 W 2011-02-03 1996-07-31 Vacuolar Ca2+ ATPase involved in depleting cytosol of Ca2+ ions; prevents growth inhibition by activation of calcineurin in the presence of elevated concentrations of calcium; similar to mammalian PMCA1a -S000030624 CDS YGL006W 7 485921 489442 W 2011-02-03 1996-07-31 -S000002973 ORF Verified YGL005C COG7 Golgi transport complex subunit COG7|COD5 chromosome 7 7 490547 489708 C 2011-02-03 1996-07-31 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments -S000030391 CDS YGL005C 7 490547 489708 C 2011-02-03 1996-07-31 -S000002972 ORF Verified YGL004C RPN14 chromosome 7 7 491956 490703 C 2011-02-03 1996-07-31 Evolutionarily conserved 19S regulatory particle assembly-chaperone; proteasome-interacting protein involved in the assembly of the base subcomplex of the 19S proteasome regulatory particle (RP); null mutants accumulate ubiquitinated Gcn4p and display decreased 26S proteasome stability; interacts with Rpt5p -S000037620 CDS YGL004C 7 491956 490703 C 2011-02-03 1996-07-31 -S000002971 ORF Verified YGL003C CDH1 HCT1 chromosome 7 L000004229 7 494174 492474 C 2011-02-03 1996-07-31 Activator of anaphase-promoting complex/cyclosome (APC/C); antagonist of the spindle assembly checkpoint; directs ubiquitination of cyclins resulting in mitotic exit; targets the APC/C to specific substrates including: Cdc20p, Ase1p, Cin8p, Fin1p and Clb5p; partially active in metaphase, and fully active in anaphase; cell-cycle regulated -S000037480 CDS YGL003C 7 494174 492474 C 2011-02-03 1996-07-31 -S000002970 ORF Verified YGL002W ERP6 chromosome 7 L000004683 7 494517 495167 W 2011-02-03 1996-07-31 Member of the p24 family involved in ER to Golgi transport; similar to Emp24p and Erv25p; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; ERP6 has a paralog, ERP1, that arose from the whole genome duplication -S000037443 CDS YGL002W 7 494517 495167 W 2011-02-03 1996-07-31 -S000002969 ORF Verified YGL001C ERG26 sterol-4-alpha-carboxylate 3-dehydrogenase (decarboxylating) chromosome 7 7 496502 495453 C 2011-02-03 1996-07-31 C-3 sterol dehydrogenase; catalyzes the second of three steps required to remove two C-4 methyl groups from an intermediate in ergosterol biosynthesis; human homolog NSDHL implicated in CK syndrome, and can complement yeast null mutant; molecular target of natural product and antifungal compound FR171456 -S000036649 CDS YGL001C 7 496502 495453 C 2011-02-03 1996-07-31 -S000006468 centromere CEN7 CEN7 chromosome 7 L000000300 7 497038 496920 C 0 2011-02-03 2000-05-19|2004-10-08|2006-05-09 Chromosome VII centromere -S000077293 centromere_DNA_Element_I CEN7 7 497038 497029 C 2011-02-03 2004-10-08 -S000077294 centromere_DNA_Element_II CEN7 7 497028 496945 C 2011-02-03 2004-10-08 -S000077295 centromere_DNA_Element_III CEN7 7 496944 496920 C 2011-02-03 2004-10-08 -S000003233 ORF Verified YGR001C EFM5 protein-lysine N-methyltransferase|AML1 chromosome 7 7 498034 497133 C 2011-02-03 2000-07-14|1996-07-31 S-adenosylmethionine-dependent lysine methyltransferase; involved in the trimethylation of eEF1A (Tef1p/Tef2p) at lysine 79; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; required for replication of Brome mosaic virus in budding yeast; expresses a circular RNA; originally misclassified as a N-6-adenine specific DNA methyltransferase based on sequence similarity; both Efm5p and human ortholog N6AMT2 can methylate eEF1a from either species in vitro -S000032873 CDS YGR001C 7 497365 497133 C 2011-02-03 1996-07-31 -S000032872 CDS YGR001C 7 497937 497459 C 2011-02-03 2000-07-14|1996-07-31 -S000032871 CDS YGR001C 7 498034 498000 C 2011-02-03 2000-07-14 -S000032875 intron YGR001C 7 497458 497366 C 2011-02-03 1996-07-31 -S000032874 intron YGR001C 7 497999 497938 C 2011-02-03 2000-07-14 -S000003234 ORF Verified YGR002C SWC4 GOD1|EAF2 chromosome 7 7 499906 498476 C 2011-02-03 1996-07-31 Component of the Swr1p complex that incorporates Htz1p into chromatin; component of the NuA4 histone acetyltransferase complex -S000032986 CDS YGR002C 7 499906 498476 C 2011-02-03 1996-07-31 -S000003235 ORF Verified YGR003W CUL3 cullin CUL3|CULLIN B|CULB chromosome 7 7 500132 502366 W 2011-02-03 1996-07-31 Ubiquitin-protein ligase; forms a complex with Elc1p that polyubiquitylates monoubiquitylated RNA polymerase II to trigger its proteolysis; cullin family member with similarity to Cdc53p and human CUL3 -S000033740 CDS YGR003W 7 500132 502366 W 2011-02-03 1996-07-31 -S000003236 ORF Verified YGR004W PEX31 peroxisome biogenesis protein chromosome 7 7 502938 504326 W 2011-02-03 1996-07-31 Peroxisomal integral membrane protein; involved in negative regulation of peroxisome size; partially functionally redundant with Pex30p and Pex32p; probably acts at a step downstream of steps mediated by Pex28p and Pex29p; PEX31 has a paralog, PEX30, that arose from the whole genome duplication -S000033874 CDS YGR004W 7 502938 504326 W 2011-02-03 1996-07-31 -S000003237 ORF Verified YGR005C TFG2 transcription factor IIF subunit TFG2 chromosome 7 L000002633 7 505859 504657 C 2011-02-03 1996-07-31 TFIIF (Transcription Factor II) middle subunit; involved in both transcription initiation and elongation of RNA polymerase II; homologous to human RAP30 -S000033942 CDS YGR005C 7 505859 504657 C 2011-02-03 1996-07-31 -S000003238 ORF Verified YGR006W PRP18 mRNA splicing protein PRP18 chromosome 7 L000001505 7 506070 506825 W 2011-02-03 2004-01-22|1996-07-31 Splicing factor and component of snRNP U5; factor involved in the positioning of the 3' splice site during the second catalytic step of splicing; interacts with Slu7p -S000034938 CDS YGR006W 7 506070 506825 W 2011-02-03 2004-01-22|1996-07-31 -S000003239 ORF Verified YGR007W ECT1 ethanolamine-phosphate cytidylyltransferase|MUQ1 chromosome 7 L000001218 7 506969 507940 W 2011-02-03 1996-07-31 Ethanolamine-phosphate cytidylyltransferase; catalyzes the second step of phosphatidylethanolamine biosynthesis; involved in the maintenance of plasma membrane; similar to mammalian CTP: phosphocholine cytidylyl-transferases; inability of the null mutant to synthesize phosphatidylethanolamine and phosphatidylcholine from ethanolamine is functionally complemented by human PCYT2 -S000035086 CDS YGR007W 7 506969 507940 W 2011-02-03 1996-07-31 -S000003240 ORF Verified YGR008C STF2 ATPase-stabilizing factor family protein chromosome 7 L000002127 7 508364 508110 C 2011-02-03 1996-07-31 Protein involved in resistance to desiccation stress; Stf2p exhibits antioxidant properties, and its overexpression prevents ROS accumulation and apoptosis; binds to F0 sector of mitochondrial F1F0 ATPase in vitro and may modulate the inhibitory action of Inh1p and Stf1p; protein abundance increases in response to DNA replication stress; STF2 has a paralog, TMA10, that arose from the whole genome duplication -S000035152 CDS YGR008C 7 508364 508110 C 2011-02-03 1996-07-31 -S000118460 ARS ARS720 ARSVII-509 chromosome 7 7 508729 508977 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178101 ARS_consensus_sequence ARS720 7 508909 508893 C 2014-11-18 2014-11-18 -S000003241 ORF Verified YGR009C SEC9 HSS7 chromosome 7 L000001835 7 511002 509047 C 2011-02-03 1996-07-31 t-SNARE protein required for secretory vesicle-plasma membrane fusion; similar to but not functionally redundant with Spo20p; interacts non-exocyst bound Sec6p; SNAP-25 homolog -S000035315 CDS YGR009C 7 511002 509047 C 2011-02-03 1996-07-31 -S000003242 ORF Verified YGR010W NMA2 nicotinamide-nucleotide adenylyltransferase NMA2 chromosome 7 7 511545 512732 W 2011-02-03 1996-07-31 Nicotinic acid mononucleotide adenylyltransferase; catalyzes the transfer of the adenylyl moiety of ATP to nicotinamide mononucleotide to form NAD; involved in de novo and salvage synthesis of NAD(+); homolog of human NMNAT; NMA2 has a paralog, NMA1, that arose from the whole genome duplication -S000037117 CDS YGR010W 7 511545 512732 W 2011-02-03 1996-07-31 -S000003243 ORF Dubious YGR011W chromosome 7 7 512497 512823 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037223 CDS YGR011W 7 512497 512823 W 2011-02-03 1996-07-31 -S000003244 ORF Verified YGR012W MCY1 putative cysteine synthase chromosome 7 7 513159 514340 W 2011-02-03 1996-07-31 Putative cysteine synthase; localized to the mitochondrial outer membrane -S000029879 CDS YGR012W 7 513159 514340 W 2011-02-03 1996-07-31 -S000003245 ORF Verified YGR013W SNU71 chromosome 7 L000004363 7 514554 516416 W 2011-02-03 1996-07-31 Component of U1 snRNP required for mRNA splicing via spliceosome; yeast specific, no metazoan counterpart -S000029977 CDS YGR013W 7 514554 516416 W 2011-02-03 1996-07-31 -S000003246 ORF Verified YGR014W MSB2 chromosome 7 L000001185 7 516943 520863 W 2 2011-02-03 1996-07-31 Mucin family member involved in various signaling pathways; functions as osmosensor in the Sho1p-mediated HOG pathway; functions in Cdc42p- and MAP kinase-dependent filamentous growth signaling pathway; processed into secreted and cell-associated forms by aspartyl protease Yps1p; potential Cdc28p substrate -S000030086 CDS YGR014W 7 516943 520863 W 2011-02-03 1996-07-31 -S000003247 ORF Uncharacterized YGR015C putative hydrolase chromosome 7 7 522076 521090 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion -S000030196 CDS YGR015C 7 522076 521090 C 2011-02-03 1996-07-31 -S000003248 ORF Uncharacterized YGR016W chromosome 7 7 522261 522833 W 2011-02-03 1996-07-31 Putative protein of unknown function -S000031230 CDS YGR016W 7 522261 522833 W 2011-02-03 1996-07-31 -S000003249 ORF Uncharacterized YGR017W chromosome 7 7 523787 524680 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the nucleus and the cytoplasm -S000031323 CDS YGR017W 7 523787 524680 W 2011-02-03 1996-07-31 -S000003250 ORF Uncharacterized YGR018C chromosome 7 7 524694 524365 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data; partially overlaps the uncharacterized ORF YGR017W -S000031392 CDS YGR018C 7 524694 524365 C 2011-02-03 1996-07-31 -S000003251 ORF Verified YGR019W UGA1 4-aminobutyrate transaminase chromosome 7 L000002422 7 525229 526644 W 2011-02-03 1996-07-31 Gamma-aminobutyrate (GABA) transaminase; also known as 4-aminobutyrate aminotransferase; involved in the 4-aminobutyrate and glutamate degradation pathways; required for normal oxidative stress tolerance and nitrogen utilization; protein abundance increases in response to DNA replication stress -S000032468 CDS YGR019W 7 525229 526644 W 2011-02-03 1996-07-31 -S000003252 ORF Verified YGR020C VMA7 H(+)-transporting V1 sector ATPase subunit F chromosome 7 L000002462 7 527329 526973 C 2011-02-03 1996-07-31 Subunit F of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; required for the V1 domain to assemble onto the vacuolar membrane; the V1 peripheral membrane domain of vacuolar H+-ATPase (V-ATPase) has eight subunits -S000032415 CDS YGR020C 7 527329 526973 C 2011-02-03 1996-07-31 -S000003253 ORF Uncharacterized YGR021W HAH1 chromosome 7 7 527632 528504 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033286 CDS YGR021W 7 527632 528504 W 2011-02-03 1996-07-31 -S000003255 ORF Verified YGR023W MTL1 chromosome 7 L000004649 7 529264 530919 W 2011-02-03 1996-07-31 Putative plasma membrane sensor; involved in cell integrity signaling and stress response during glucose starvation and oxidative stress; has structural and functional similarity to Mid2p; MTL1 has a paralog, MID2, that arose from the whole genome duplication -S000034269 CDS YGR023W 7 529264 530919 W 2011-02-03 1996-07-31 -S000003254 ORF Dubious YGR022C chromosome 7 7 529586 529257 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps almost completely with the verified ORF MTL1/YGR023W -S000033318 CDS YGR022C 7 529586 529257 C 2011-02-03 1996-07-31 -S000006532 tRNA_gene tD(GUC)G1 chromosome 7 L000003826 7 531610 531681 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000036686 noncoding_exon tD(GUC)G1 7 531610 531681 W 2011-02-03 2000-05-19 -S000003256 ORF Verified YGR024C THG1 tRNA guanylyltransferase chromosome 7 7 532596 531883 C 2011-02-03 1996-07-31 tRNAHis guanylyltransferase; adds a guanosine residue to the 5' end of tRNAH is after transcription and RNase P cleavage; can also catalyze reverse (3'-5') polymerization with certain substrates in a template-dependent reaction; couples nuclear division and migration to cell budding and cytokinesis; essential enzyme conserved among eukaryotes -S000034310 CDS YGR024C 7 532596 531883 C 2011-02-03 1996-07-31 -S000003257 ORF Dubious YGR025W chromosome 7 7 532639 532941 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034440 CDS YGR025W 7 532639 532941 W 2011-02-03 1996-07-31 -S000003258 ORF Uncharacterized YGR026W chromosome 7 7 532985 533821 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery -S000034561 CDS YGR026W 7 532985 533821 W 2011-02-03 1996-07-31 -S000003259 ORF Verified YGR027C RPS25A eS25|ribosomal 40S subunit protein S25A|S25e|rp45|YS23|S31A|S25A|RPS31A chromosome 7 L000003257 7 534458 534132 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S25, no bacterial homolog; RPS25A has a paralog, RPS25B, that arose from the whole genome duplication -S000035521 CDS YGR027C 7 534458 534132 C 2011-02-03 1996-07-31 -S000122101 five_prime_UTR_intron YGR027C 7 534785 534474 C 2011-02-03 2007-04-04 -S000006965 long_terminal_repeat YGRWdelta11 chromosome 7 7 535211 535542 W 2011-02-03 2000-05-19 Ty1 LTR -S000006952 long_terminal_repeat YGRCdelta12 chromosome 7 7 535759 535607 C 2011-02-03 2000-05-19 Ty1 LTR -S000006966 long_terminal_repeat YGRWdelta13 chromosome 7 7 535760 536097 W 2011-02-03 2000-05-19 Ty1 LTR -S000006982 LTR_retrotransposon YGRWTy1-1 Ty1 chromosome 7 7 535760 541685 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007405 transposable_element_gene YGR027W-A gag protein chromosome 7 7 536057 537379 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000036251 CDS YGR027W-A 7 536057 537379 W 2011-02-03 1999-07-17 -S000007406 transposable_element_gene YGR027W-B gag-pol fusion protein chromosome 7 S000029013 7 536057 541325 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000036253 CDS YGR027W-B 7 536057 537361 W 2011-02-03 1999-07-17 -S000036254 CDS YGR027W-B 7 537363 541325 W 2011-02-03 1999-07-17 -S000036255 plus_1_translational_frameshift YGR027W-B 7 537362 537362 W 2011-02-03 1999-07-17 -S000006967 long_terminal_repeat YGRWdelta14 chromosome 7 7 541348 541685 W 2011-02-03 2000-05-19 Ty1 LTR -S000006555 tRNA_gene tE(UUC)G3 chromosome 7 L000003827 7 541850 541921 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin -S000034674 noncoding_exon tE(UUC)G3 7 541850 541921 W 2011-02-03 2000-05-19 -S000003260 ORF Verified YGR028W MSP1 YTA4 chromosome 7 L000001200|L000002558 7 542203 543291 W 2011-02-03 1996-07-31 Highly-conserved N-terminally anchored AAA-ATPase; distributed in the mitochondrial outer membrane and peroxisomes; involved in mitochondrial protein sorting; functions as an extraction engine in local organelle surveillance to remove and initiate degradation of mistargeted proteins, ensuring fidelity of organelle-specific localization of tail-anchored proteins; contains an N-terminal transmembrane domain and C-terminal cytoplasmic ATPase domain -S000035635 CDS YGR028W 7 542203 543291 W 2011-02-03 1996-07-31 -S000003261 ORF Verified YGR029W ERV1 flavin-linked sulfhydryl oxidase chromosome 7 L000000583 7 543553 544205 W 2011-02-03 2000-07-14|1996-07-31 Flavin-linked sulfhydryl oxidase of the mitochondrial IMS; N-terminus is an intrinsically disordered domain that in the cytosol helps target Erv1p to mitochondria, and in the intermembrane space oxidizes Mia40p as part of a disulfide relay system that promotes intermembrane space retention of imported proteins; functional ortholog of human GFER (ALR); human GFER carrying N-terminal 21 amino acids of Erv1p functionally complements the lethality of the erv1 null mutation -S000035763 CDS YGR029W 7 543553 543638 W 2011-02-03 2000-07-14 -S000035764 CDS YGR029W 7 543722 544205 W 2011-02-03 2000-07-14|1996-07-31 -S000035765 intron YGR029W 7 543639 543721 W 2011-02-03 2000-07-14 -S000006533 tRNA_gene tD(GUC)G2 chromosome 7 L000003847 7 544648 544577 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000036692 noncoding_exon tD(GUC)G2 7 544648 544577 C 2011-02-03 2000-05-19 -S000006506 snoRNA_gene snR46 SNR46 chromosome 7 L000003413 7 545370 545566 W 2011-02-03 2000-05-19|2007-05-08 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2865 -S000030619 noncoding_exon snR46 7 545370 545566 W 2011-02-03 2000-05-19|2007-05-08 -S000003262 ORF Verified YGR030C POP6 ribonuclease P/MRP protein subunit POP6 chromosome 7 L000004302 7 546157 545681 C 2011-02-03 1996-07-31 Subunit of RNase MRP, nuclear RNase P and telomerase; forms a soluble heterodimer with Pop7p that binds P3 domain of RNase MRP and RNase P RNAs; RNase MRP cleaves pre-rRNA, nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs, while telomerase replenishes telomeric DNA; relocalizes to the cytosol in response to hypoxia -S000035582 CDS YGR030C 7 546157 545681 C 2011-02-03 1996-07-31 -S000003263 ORF Verified YGR031W IMO32 chromosome 7 7 546441 547469 W 2011-02-03 1996-07-31 Conserved mitochondrial protein of unknown function; processed by both mitochondrial processing peptidase and mitochondrial octapeptidyl aminopeptidase; gene contains the nested antisense gene NAG1 -S000036524 CDS YGR031W 7 546441 547469 W 2011-02-03 1996-07-31 -S000028636 ORF Verified YGR031C-A NAG1 chromosome 7 7 547300 546809 C 2011-02-03 2003-07-29 Protein involved in yeast cell wall biogenesis; localizes to the cell periphery; production of Nag1p is dependent upon the presence of Slt2p and Rlm1p; gene is nested within and antisense to IMO32 -S000032392 CDS YGR031C-A 7 547300 546809 C 2011-02-03 2003-07-29 -S000003264 ORF Verified YGR032W GSC2 1,3-beta-glucan synthase GSC2|FKS2 chromosome 7 L000000716|L000000733 7 548264 553951 W 2011-02-03 1996-07-31 Catalytic subunit of 1,3-beta-glucan synthase; involved in formation of the inner layer of the spore wall; activity positively regulated by Rho1p and negatively by Smk1p; GSC2 has a paralog, FKS1, that arose from the whole genome duplication -S000036645 CDS YGR032W 7 548264 553951 W 2011-02-03 1996-07-31 -S000003265 ORF Verified YGR033C TIM21 FMP17 chromosome 7 7 554967 554248 C 2011-02-03 1996-07-31 Nonessential component of the TIM23 complex; interacts with the Translocase of the Outer Mitochondrial membrane (TOM complex) and with respiratory enzymes; may regulate the Translocase of the Inner Mitochondrial membrane (TIM23 complex) activity -S000036681 CDS YGR033C 7 554967 554248 C 2011-02-03 1996-07-31 -S000003266 ORF Verified YGR034W RPL26B uL24|ribosomal 60S subunit protein L26B|L24|YL33|L33B|L26B chromosome 7 L000004462 7 555812 556672 W 2011-02-03 1996-07-31|2006-10-05 Ribosomal 60S subunit protein L26B; binds to 5.8S rRNA; non-essential even when paralog is also deleted; deletion has minimal affections on ribosome biosynthesis; homologous to mammalian ribosomal protein L26 and bacterial L24; RPL26B has a paralog, RPL26A, that arose from the whole genome duplication -S000037472 CDS YGR034W 7 555812 555830 W 2011-02-03 1996-07-31|2006-10-05 -S000037473 CDS YGR034W 7 556308 556672 W 2011-02-03 1996-07-31 -S000037474 intron YGR034W 7 555831 556307 W 2011-02-03 1996-07-31|2006-10-05 -S000003267 ORF Uncharacterized YGR035C chromosome 7 7 557422 557072 C 2011-02-03 1996-07-31 Putative protein of unknown function, potential Cdc28p substrate; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance; YGR035C has a paralog, YLR346C, that arose from the whole genome duplication -S000037516 CDS YGR035C 7 557422 557072 C 2011-02-03 1996-07-31 -S000028827 ORF Uncharacterized YGR035W-A chromosome 7 7 557565 557786 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000033652 CDS YGR035W-A 7 557565 557786 W 2011-02-03 2003-07-29 -S000003268 ORF Verified YGR036C CAX4 CWH8 chromosome 7 L000002917 7 558868 558149 C 2011-02-03 1996-07-31 Dolichyl pyrophosphate (Dol-P-P) phosphatase; has a luminally oriented active site in the ER; cleaves the anhydride linkage in Dol-P-P; required for Dol-P-P-linked oligosaccharide intermediate synthesis and protein N-glycosylation -S000037649 CDS YGR036C 7 558868 558149 C 2011-02-03 1996-07-31 -S000003269 ORF Verified YGR037C ACB1 long-chain fatty acid transporter ACB1 chromosome 7 L000000016 7 559994 559731 C 2011-02-03 1996-07-31 Acyl-CoA-binding protein; transports newly synthesized acyl-CoA esters from fatty acid synthetase (Fas1p-Fas2p) to acyl-CoA-consuming processes; subject to starvation-induced, Grh1p-mediated unconventional secretion; protein abundance increases in response to DNA replication stress -S000030442 CDS YGR037C 7 559994 559731 C 2011-02-03 1996-07-31 -S000003270 ORF Verified YGR038W ORM1 sphingolipid homeostasis protein ORM1 chromosome 7 L000003422 7 560682 561350 W 2011-02-03 1996-07-31 Protein that mediates sphingolipid homeostasis; evolutionarily conserved, required for resistance to agents that induce unfolded protein response; Orm1p and Orm2p together control membrane biogenesis by coordinating lipid homeostasis with protein quality control; ORM1 has a paralog, ORM2, that arose from the whole genome duplication -S000030632 CDS YGR038W 7 560682 561350 W 2011-02-03 1996-07-31 -S000006725 tRNA_gene tS(AGA)G chromosome 7 L000003846 7 561743 561662 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032368 noncoding_exon tS(AGA)G 7 561743 561662 C 2011-02-03 2000-05-19 -S000006953 long_terminal_repeat YGRCdelta15 chromosome 7 7 562176 561843 C 2011-02-03 2000-05-19 Ty1 LTR -S000007408 transposable_element_gene YGR038C-B gag-pol fusion protein chromosome 7 7 567467 562199 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000031864 CDS YGR038C-B 7 566161 562199 C 2011-02-03 1999-07-17 -S000031863 CDS YGR038C-B 7 567467 566163 C 2011-02-03 1999-07-17 -S000031865 plus_1_translational_frameshift YGR038C-B 7 566162 566162 C 2011-02-03 1999-07-17 -S000007407 transposable_element_gene YGR038C-A gag protein chromosome 7 7 567467 566145 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000031828 CDS YGR038C-A 7 567467 566145 C 2011-02-03 1999-07-17 -S000006962 LTR_retrotransposon YGRCTy1-2 Ty1 chromosome 7 7 567760 561843 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006954 long_terminal_repeat YGRCdelta16 chromosome 7 7 567760 567427 C 2011-02-03 2000-05-19 Ty1 LTR -S000118461 ARS ARS721 ARSVII-569 chromosome 7 7 568490 568737 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119026 ARS_consensus_sequence ARS721 7 568660 568646 C 2011-02-03 2006-10-03 -S000006955 long_terminal_repeat YGRCdelta17 chromosome 7 7 569072 568740 C 2011-02-03 2000-05-19 Ty2 LTR -S000118462 ARS ARS722 ARSVII-575 chromosome 7 7 574622 574915 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178102 ARS_consensus_sequence ARS722 7 574701 574717 W 2014-11-18 2014-11-18 -S000006964 LTR_retrotransposon YGRCTy2-1 Ty2 chromosome 7 7 574700 568740 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C -S000006956 long_terminal_repeat YGRCdelta18 chromosome 7 7 574700 574369 C 2011-02-03 2000-05-19 Ty2 LTR -S000003271 ORF Uncharacterized YGR039W chromosome 7 7 574888 575199 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGR039W is not an essential gene -S000030717 CDS YGR039W 7 574888 575199 W 2011-02-03 1996-07-31 -S000003272 ORF Verified YGR040W KSS1 mitogen-activated serine/threonine-protein kinase KSS1 chromosome 7 L000000922 7 575398 576504 W 2011-02-03 1996-07-31 Mitogen-activated protein kinase (MAPK); involved in signal transduction pathways that control filamentous growth and pheromone response; regulates septum assembly, and may directly phosphorylate Bni4p; the KSS1 gene is nonfunctional in S288C strains and functional in W303 strains -S000031506 CDS YGR040W 7 575398 576504 W 2011-02-03 1996-07-31 -S000130166 ARS ARS723 chromosome 7 7 575484 576346 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000003273 ORF Verified YGR041W BUD9 chromosome 7 L000003939 7 577487 579130 W 2011-02-03 1996-07-31 Protein involved in bud-site selection; mutant has increased aneuploidy tolerance; diploid mutants display a unipolar budding pattern instead of the wild-type bipolar pattern, and bud at the distal pole; BUD9 has a paralog, BUD8, that arose from the whole genome duplication -S000031558 CDS YGR041W 7 577487 579130 W 2011-02-03 1996-07-31 -S000003274 ORF Verified YGR042W MTE1 chromosome 7 7 579476 580291 W 2011-02-03 1996-07-31 Protein of unknown function; involved in maintenance of proper telomere length; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus; forms nuclear foci upon DNA replication stress -S000032536 CDS YGR042W 7 579476 580291 W 2011-02-03 1996-07-31 -S000003275 ORF Verified YGR043C NQM1 sedoheptulose-7-phosphate:D-glyceraldehyde-3-phosphate transaldolase NQM1 chromosome 7 7 581436 580435 C 2011-02-03 1996-07-31 Transaldolase of unknown function; transcription is repressed by Mot1p and induced by alpha-factor and during diauxic shift; NQM1 has a paralog, TAL1, that arose from the whole genome duplication -S000032607 CDS YGR043C 7 581436 580435 C 2011-02-03 1996-07-31 -S000130167 ARS ARS724 chromosome 7 7 581436 582213 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000003276 ORF Verified YGR044C RME1 CSP1 chromosome 7 L000001648 7 583892 582990 C 14 2011-02-03 1996-07-31 Zinc finger protein involved in control of meiosis; prevents meiosis by repressing IME1 expression and promotes mitosis by activating CLN2 expression; directly repressed by a1-alpha2 regulator; mediates cell type control of sporulation; relocalizes from nucleus to cytoplasm upon DNA replication stress -S000032718 CDS YGR044C 7 583892 582990 C 2011-02-03 1996-07-31 -S000003277 ORF Dubious YGR045C chromosome 7 7 584296 583934 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032825 CDS YGR045C 7 584296 583934 C 2011-02-03 1996-07-31 -S000003278 ORF Verified YGR046W TAM41 putative phosphatidate cytidylyltransferase|MMP37 chromosome 7 7 584895 586052 W 2011-02-03 1996-07-31 Mitochondrial phosphatidate cytidylyltransferase (CDP-DAG synthase); required for cardiolipin biosynthesis; viability of null mutant is strain-dependent; mRNA is targeted to the bud; mutant displays defect in mitochondrial protein import, likely due to altered membrane lipid composition -S000033590 CDS YGR046W 7 584895 586052 W 2011-02-03 1996-07-31 -S000003279 ORF Verified YGR047C TFC4 transcription factor TFIIIC subunit TFC4|tau 131|PCF1 chromosome 7 L000001348|L000002288 7 589469 586392 C 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of RNA polymerase III transcription initiation factor complex (TFIIIC); part of the TauA domain of TFIIIC that binds BoxA DNA promoter sites of tRNA and similar genes; has TPR motifs; human homolog is TFIIIC-102 -S000033631 CDS YGR047C 7 589469 586392 C 2011-02-03 1996-07-31 -S000003280 ORF Verified YGR048W UFD1 polyubiquitin-binding protein UFD1 chromosome 7 L000002787 7 589826 590911 W 2011-02-03 1996-07-31 Substrate-recruiting cofactor of the Cdc48p-Npl4p-Ufd1p segregase; polyubiquitin binding protein that assists in the dislocation of misfolded, ERAD substrates that are subsequently delivered to the proteasome for degradation; involved in regulated destruction of ER membrane proteins such as HMG-CoA reductase (Hmg1/2p) and cytoplasmic proteins (Fbp1p); involved in mobilizing membrane bound transcription factors by regulated Ub/proteasome-dependent processing (RUP) -S000033814 CDS YGR048W 7 589826 590911 W 2011-02-03 1996-07-31 -S000003281 ORF Verified YGR049W SCM4 chromosome 7 L000001814 7 591314 591877 W 2011-02-03 1996-07-31 Mitochondrial outer membrane protein of unknown function; predicted to have 4 transmembrane segments; import is mediated by Tom70p and Mim1p; interacts genetically with a cdc4 mutation; SCM4 has a paralog, ATG33, that arose from the whole genome duplication -S000034690 CDS YGR049W 7 591314 591877 W 2011-02-03 1996-07-31 -S000003282 ORF Uncharacterized YGR050C chromosome 7 7 592442 592086 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data -S000035714 CDS YGR050C 7 592442 592086 C 2011-02-03 1996-07-31 -S000003283 ORF Dubious YGR051C chromosome 7 7 593229 592906 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YGR051C is not an essential gene -S000035801 CDS YGR051C 7 593229 592906 C 2011-02-03 1996-07-31 -S000003284 ORF Uncharacterized YGR052W FMP48 protein kinase FMP48 chromosome 7 7 593596 594705 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000036785 CDS YGR052W 7 593596 594705 W 2011-02-03 1996-07-31 -S000003285 ORF Uncharacterized YGR053C chromosome 7 7 595837 594986 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000036816 CDS YGR053C 7 595837 594986 C 2011-02-03 1996-07-31 -S000003286 ORF Verified YGR054W chromosome 7 7 596693 598621 W 2011-02-03 1996-07-31|2011-02-03 Eukaryotic initiation factor eIF2A; associates specifically with both 40S subunits and 80 S ribosomes, and interacts genetically with both eIF5b and eIF4E; homologous to mammalian eIF2A -S000036916 CDS YGR054W 7 596693 598621 W 2011-02-03 1996-07-31|2011-02-03 -S000003287 ORF Verified YGR055W MUP1 chromosome 7 L000003071 7 599417 601141 W 2011-02-03 1996-07-31 High affinity methionine permease; integral membrane protein with 13 putative membrane-spanning regions; also involved in cysteine uptake -S000036973 CDS YGR055W 7 599417 601141 W 2011-02-03 1996-07-31 -S000003288 ORF Verified YGR056W RSC1 RSC subunit protein RSC1 chromosome 7 L000004024 7 601661 604447 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; required for expression of mid-late sporulation-specific genes; contains two essential bromodomains, a bromo-adjacent homology (BAH) domain, and an AT hook; RSC1 has a paralog, RSC2, that arose from the whole genome duplication -S000037741 CDS YGR056W 7 601661 604447 W 2011-02-03 1996-07-31 -S000003289 ORF Verified YGR057C LST7 chromosome 7 L000004355 7 605501 604773 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the Lst4p-Lst7p GTPase activating protein complex for Gtr2p; stimulates the GTPase activity of Rag family GTPase Gtr2p, within the context of the Gtr1p-Gtr2p heterodimer, after amino acid stimulation; required for activation of TORC1 in response to amino acid stimulation; recruited to the vacuolar membrane during amino acid starvation and released from the membrane by TORC1; required for the transport of amino acid permease Gap1p from the Golgi to the cell surface -S000037768 CDS YGR057C 7 605501 604773 C 2011-02-03 2003-09-22|1996-07-31 -S000003290 ORF Verified YGR058W PEF1 chromosome 7 7 606136 607143 W 2011-02-03 1996-07-31|2011-02-03 Penta-EF-hand protein; required for polar bud growth and cell wall abscission; binds calcium and zinc with different affinity; localizes to bud site in G1, bud neck in G2; binds to Sec31p and modulates COPII coat assembly -S000029835 CDS YGR058W 7 606136 607143 W 2011-02-03 1996-07-31|2011-02-03 -S000003291 ORF Verified YGR059W SPR3 septin SPR3 chromosome 7 L000002022 7 607563 609101 W 2011-02-03 1996-07-31 Sporulation-specific homolog of the CDC3/10/11/12 family of genes; septin protein involved in sporulation; regulated by ABFI; the yeast CDC3/10/11/12 family is a family of bud neck microfilament genes -S000030838 CDS YGR059W 7 607563 609101 W 2011-02-03 1996-07-31 -S000006440 snoRNA_gene snR48 SNR48 chromosome 7 L000004518 7 609584 609696 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions G2791 and G2793 -S000030651 noncoding_exon snR48 7 609584 609696 W 2011-02-03 2000-05-19 -S000003292 ORF Verified YGR060W ERG25 methylsterol monooxygenase chromosome 7 L000003089 7 610564 611493 W 2011-02-03 1996-07-31 C-4 methyl sterol oxidase; catalyzes the first of three steps required to remove two C-4 methyl groups from an intermediate in ergosterol biosynthesis; mutants accumulate the sterol intermediate 4,4-dimethylzymosterol; human MSMO1 functionally complements the growth defect caused by repression of ERG25 expression -S000031788 CDS YGR060W 7 610564 611493 W 2011-02-03 1996-07-31 -S000003293 ORF Verified YGR061C ADE6 phosphoribosylformylglycinamidine synthase chromosome 7 L000000036 7 615965 611889 C 39 2011-02-03 1996-07-31 Formylglycinamidine-ribonucleotide (FGAM)-synthetase; catalyzes a step in the 'de novo' purine nucleotide biosynthetic pathway -S000031938 CDS YGR061C 7 615965 611889 C 2011-02-03 1996-07-31 -S000003294 ORF Verified YGR062C COX18 membrane insertase COX18|OXA2 chromosome 7 L000003308 7 617278 616328 C 2011-02-03 1996-07-31 Protein required for membrane insertion of C-terminus of Cox2p; mitochondrial integral inner membrane protein; interacts genetically and physically with Mss2p and Pnt1p; similar to S. cerevisiae Oxa1, N. crassa Oxa2p, and E. coli YidC; respiratory defect of the null mutant is functionally complemented by human COX18 carrying the N-terminal 54 amino acids of S. cerevisiae Cox18p -S000032054 CDS YGR062C 7 617278 616328 C 2011-02-03 1996-07-31 -S000003296 ORF Dubious YGR064W chromosome 7 7 617621 617989 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SPT4/YGR063C -S000033116 CDS YGR064W 7 617621 617989 W 2011-02-03 1996-07-31 -S000003295 ORF Verified YGR063C SPT4 transcription elongation factor SPT4 chromosome 7 L000002030 7 617824 617516 C 40 2011-02-03 1996-07-31 Spt4p/5p (DSIF) transcription elongation factor complex subunit; the Spt4/5 complex binds to ssRNA in a sequence-specific manner, and along with RNAP I and II has multiple roles regulating transcriptional elongation, RNA processing, quality control, and transcription-coupled repair; localizes to kinetochores and heterochromatin, influencing chromosomal dynamics and silencing; required for transcription through long trinucleotide repeats in ORFs and non-protein coding regions -S000032968 CDS YGR063C 7 617824 617516 C 2011-02-03 1996-07-31 -S000003297 ORF Verified YGR065C VHT1 chromosome 7 S000007487 7 619858 618077 C 2011-02-03 1996-07-31 High-affinity plasma membrane H+-biotin (vitamin H) symporter; mutation results in fatty acid auxotrophy; 12 transmembrane domain containing major facilitator subfamily member; mRNA levels negatively regulated by iron deprivation and biotin -S000033152 CDS YGR065C 7 619858 618077 C 2011-02-03 1996-07-31 -S000003298 ORF Uncharacterized YGR066C chromosome 7 7 621799 620921 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000033915 CDS YGR066C 7 621799 620921 C 2011-02-03 1996-07-31 -S000003299 ORF Uncharacterized YGR067C chromosome 7 7 624786 622372 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; contains a zinc finger motif similar to that of Adr1p -S000034061 CDS YGR067C 7 624786 622372 C 2011-02-03 1996-07-31|2011-02-03 -S000028637 ORF Dubious YGR068W-A chromosome 7 7 626294 626389 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with the uncharacterized ORF YGR068C -S000032393 CDS YGR068W-A 7 626294 626389 W 2011-02-03 2003-07-29 -S000003301 ORF Dubious YGR069W chromosome 7 7 627083 627418 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035169 CDS YGR069W 7 627083 627418 W 2011-02-03 1996-07-31 -S000003300 ORF Verified YGR068C ART5 chromosome 7 7 627084 625324 C 2011-02-03 1996-07-31 Protein proposed to regulate endocytosis of plasma membrane proteins; regulates by recruiting the ubiquitin ligase Rsp5p to its target in the plasma membrane; SWAT-GFP and mCherry fusion proteins localize to the cytosol -S000034144 CDS YGR068C 7 627084 625324 C 2011-02-03 1996-07-31 -S000003302 ORF Verified YGR070W ROM1 Rho family guanine nucleotide exchange factor ROM1|SKC1 chromosome 7 L000003181 7 627806 631273 W 2011-02-03 1996-07-31|2011-02-03 Guanine nucleotide exchange factor (GEF) for Rho1p; mutations are synthetically lethal with mutations in rom2, which also encodes a GEP; ROM1 has a paralog, ROM2, that arose from the whole genome duplication -S000036051 CDS YGR070W 7 627806 631273 W 2011-02-03 1996-07-31|2011-02-03 -S000003303 ORF Verified YGR071C ENV11 chromosome 7 7 634063 631481 C 2011-02-03 1996-07-31 Protein proposed to be involved in vacuolar functions; mutant shows defect in CPY processing and fragmented vacuoles; deletion mutant has increased glycogen accumulation and displays elongated buds; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; ENV11 has a paralog, VID22, that arose from the whole genome duplication -S000036097 CDS YGR071C 7 634063 631481 C 2011-02-03 1996-07-31 -S000003304 ORF Verified YGR072W UPF3 SUP112|SUA6 chromosome 7 L000003057|S000029549|L000002231 7 634304 635467 W 32 2011-02-03 1996-07-31 Component of the nonsense-mediated mRNA decay (NMD) pathway; along with Nam7p and Nmd2p; involved in decay of mRNA containing nonsense codons; involved in telomere maintenance -S000029860 CDS YGR072W 7 634304 635467 W 2011-02-03 1996-07-31 -S000003306 ORF Verified YGR074W SMD1 mRNA splicing protein SMD1|SPP92 chromosome 7 L000001928 7 635712 636152 W 2011-02-03 1996-07-31 Core Sm protein Sm D1; part of heteroheptameric complex (with Smb1p, Smd2p, Smd3p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; relocalizes to the cytosol in response to hypoxia; homolog of human Sm D1; protein abundance increases in response to DNA replication stress -S000031921 CDS YGR074W 7 635712 636152 W 2011-02-03 1996-07-31 -S000003305 ORF Dubious YGR073C chromosome 7 7 635986 635615 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; extensively overlaps essential SMD1 gene encoding a U6 snRNP protein -S000031714 CDS YGR073C 7 635986 635615 C 2011-02-03 1996-07-31 -S000003307 ORF Verified YGR075C PRP38 U4/U6-U5 snRNP complex subunit PRP38 chromosome 7 L000001510 7 636875 636147 C 2011-02-03 1996-07-31 Unique component of the U4/U6.U5 tri-snRNP particle; tri-snRNP is required for conformational changes which result in the catalytic activation of the spliceosome; dispensable for spliceosome assembly -S000031968 CDS YGR075C 7 636875 636147 C 2011-02-03 1996-07-31 -S000003308 ORF Verified YGR076C MRPL25 mitochondrial 54S ribosomal protein YmL25|AFO1|YmL25|YMR26 chromosome 7 L000002532 7 637577 637104 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; mutation confers increased replicative lifespan -S000037456 CDS YGR076C 7 637577 637104 C 2011-02-03 1996-07-31 -S000003309 ORF Verified YGR077C PEX8 PAS6 chromosome 7 L000004222|L000003962 7 639513 637744 C 2011-02-03 1996-07-31 Intraperoxisomal organizer of the peroxisomal import machinery; organizes the formation of the importomer complex, bridging the docking complex with the RING finger complex; tightly associated with the lumenal face of the peroxisomal membrane; essential for peroxisome biogenesis; binds PTS1-signal receptor Pex5p, and PTS2-signal receptor Pex7p -S000037552 CDS YGR077C 7 639513 637744 C 2011-02-03 1996-07-31 -S000003310 ORF Verified YGR078C PAC10 tubulin-binding prefolding complex subunit PAC10|RKS2|PFD3|GIM2 chromosome 7 L000002864 7 640371 639772 C 2011-02-03 1996-07-31 Part of the heteromeric co-chaperone GimC/prefoldin complex; complex promotes efficient protein folding -S000037609 CDS YGR078C 7 640371 639772 C 2011-02-03 1996-07-31 -S000003311 ORF Uncharacterized YGR079W chromosome 7 7 640720 641832 W 2011-02-03 1996-07-31 Putative protein of unknown function; YGR079W is not an essential gene -S000030491 CDS YGR079W 7 640720 641832 W 2011-02-03 1996-07-31 -S000003312 ORF Verified YGR080W TWF1 chromosome 7 L000004372 7 642010 643008 W 2011-02-03 1996-07-31 Twinfilin; highly conserved actin monomer-sequestering protein involved in regulation of the cortical actin cytoskeleton; coordinates actin filament severing and monomer sequestering at sites of rapid actin turnover; composed of two cofilin-like regions, stimulates actin depolymerization as does the mouse homolog, mTwf1 -S000037367 CDS YGR080W 7 642010 643008 W 2011-02-03 1996-07-31 -S000003313 ORF Verified YGR081C SLX9 chromosome 7 7 643780 643148 C 2011-02-03 1996-07-31 Protein required for pre-rRNA processing; associated with the 90S pre-ribosome and 43S small ribosomal subunit precursor; interacts with U3 snoRNA; deletion mutant has synthetic fitness defect with an sgs1 deletion mutant -S000037394 CDS YGR081C 7 643780 643148 C 2011-02-03 1996-07-31 -S000003314 ORF Verified YGR082W TOM20 MOM19|MAS20 chromosome 7 L000001029 7 644044 644595 W 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; acts as a receptor for incoming precursor proteins -S000030069 CDS YGR082W 7 644044 644595 W 2011-02-03 1996-07-31 -S000003315 ORF Verified YGR083C GCD2 translation initiation factor eIF2B subunit delta|GCD12 chromosome 7 L000000671 7 646815 644860 C 54 2011-02-03 1996-07-31 Delta subunit of the translation initiation factor eIF2B; the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression -S000030132 CDS YGR083C 7 646815 644860 C 2011-02-03 1996-07-31 -S000003316 ORF Verified YGR084C MRP13 mitochondrial 37S ribosomal protein YmS-A chromosome 7 L000001142|L000001157 7 648142 647123 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000030307 CDS YGR084C 7 648142 647123 C 2011-02-03 1996-07-31 -S000003317 ORF Verified YGR085C RPL11B uL5|ribosomal 60S subunit protein L11B|rp39B|YL22|L5|L16A|L11B chromosome 7 L000001730|L000001713 7 648907 648383 C 56 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L11B; expressed at half the level of Rpl11Ap; involved in ribosomal assembly; depletion causes degradation of 60S proteins and RNA; homologous to mammalian ribosomal protein L11 and bacterial L5; RPL11B has a paralog, RPL11A, that arose from the whole genome duplication -S000033620 CDS YGR085C 7 648907 648383 C 2011-02-03 1996-07-31 -S000003318 ORF Verified YGR086C PIL1 lipid-binding protein PIL1 chromosome 7 7 650617 649598 C 2011-02-03 1996-07-31 Eisosome core component; eisosomes are large immobile cell cortex structures associated with endocytosis; detected in phosphorylated state in mitochondria; phosphorylated on Thr233 upon Pkc1p hyperactivation in a Slt2p MAPK-dependent fashion; null mutant shows activation of Pkc1p/Ypk1p stress resistance pathways; member of BAR domain family; protein increases in abundance and relocalizes from plasma membrane to cytoplasm upon DNA replication stress -S000033727 CDS YGR086C 7 650617 649598 C 2011-02-03 1996-07-31 -S000003319 ORF Verified YGR087C PDC6 indolepyruvate decarboxylase 6 chromosome 7 L000001357 7 652981 651290 C 2011-02-03 1996-07-31 Minor isoform of pyruvate decarboxylase; decarboxylates pyruvate to acetaldehyde, involved in amino acid catabolism; transcription is glucose- and ethanol-dependent, and is strongly induced during sulfur limitation -S000033866 CDS YGR087C 7 652981 651290 C 2011-02-03 1996-07-31 -S000003320 ORF Verified YGR088W CTT1 catalase T|SPS101 chromosome 7 L000000435 7 654634 656322 W 2011-02-03 1996-07-31|2006-01-23 Cytosolic catalase T; has a role in protection from oxidative damage by hydrogen peroxide -S000034811 CDS YGR088W 7 654634 656322 W 2011-02-03 1996-07-31|2006-01-23 -S000003321 ORF Verified YGR089W NNF2 chromosome 7 7 656960 659770 W 2011-02-03 1996-07-31 Protein that exhibits physical and genetic interactions with Rpb8p; Rpb8p is a subunit of RNA polymerases I, II, and III; computational analysis of large-scale protein-protein interaction data suggests a role in chromosome segregation -S000034943 CDS YGR089W 7 656960 659770 W 2011-02-03 1996-07-31 -S000118463 ARS ARS727 ARSVII-660 chromosome 7 7 659907 660002 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000119027 ARS_consensus_sequence ARS727 7 660000 659986 C 2011-02-03 2006-10-03 -S000006749 tRNA_gene tT(UGU)G1 chromosome 7 L000003828 7 661749 661820 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000030910 noncoding_exon tT(UGU)G1 7 661749 661820 W 2011-02-03 2000-05-19 -S000003322 ORF Verified YGR090W UTP22 rRNA-processing protein UTP22 chromosome 7 7 662358 666071 W 2011-02-03 1996-07-31 Component of the small-subunit processome; required for nuclear export of tRNAs; may facilitate binding of Utp8p to aminoacylated tRNAs and their delivery to Los1p for export; conserved from yeast to mammals -S000033602 CDS YGR090W 7 662358 666071 W 2011-02-03 1996-07-31 -S000003323 ORF Verified YGR091W PRP31 U4/U6-U5 snRNP complex subunit PRP31 chromosome 7 L000002947 7 666341 667825 W 2011-02-03 1996-07-31 Splicing factor; component of the U4/U6-U5 snRNP complex -S000034543 CDS YGR091W 7 666341 667825 W 2011-02-03 1996-07-31 -S000003324 ORF Verified YGR092W DBF2 serine/threonine-protein kinase DBF2 chromosome 7 L000000487 7 668189 669907 W 28 2011-02-03 1996-07-31 Ser/Thr kinase involved in transcription and stress response; functions as part of a network of genes in exit from mitosis; localization is cell cycle regulated; activated by Cdc15p during the exit from mitosis; also plays a role in regulating the stability of SWI5 and CLB2 mRNAs; phosphorylates Chs2p to regulate primary septum formation and Hof1p to regulate cytokinesis; DBF2 has a paralog, DBF20, that arose from the whole genome duplication -S000034610 CDS YGR092W 7 668189 669907 W 2011-02-03 1996-07-31 -S000003325 ORF Verified YGR093W DRN1 chromosome 7 7 670388 671911 W 2011-02-03 1996-07-31 Splicing factor that modulates turnover of branched RNAs by Dbr1p; interacts with spliceosomal components and branched RNA splicing products; enhances Dbr1p debranching in vitro; conserved protein with domain organization identical from yeast to human; N-terminal homology to Dbr1p N-terminus, but Dbr1p catalytic residues not conserved; relocalizes to the cytosol in response to hypoxia -S000034725 CDS YGR093W 7 670388 671911 W 2011-02-03 1996-07-31 -S000003326 ORF Verified YGR094W VAS1 valine--tRNA ligase chromosome 7 L000002457 7 672186 675500 W 2011-02-03 1996-07-31 Mitochondrial and cytoplasmic valyl-tRNA synthetase; human homolog VARS2 implicated in mitochondrial diseases, can partially complement yeast null mutant -S000035718 CDS YGR094W 7 672186 675500 W 2011-02-03 1996-07-31 -S000003327 ORF Verified YGR095C RRP46 exosome non-catalytic core subunit RRP46 chromosome 7 L000004579 7 676342 675671 C 2011-02-03 2003-09-22|1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp46p (EXOSC5) -S000035767 CDS YGR095C 7 676342 675671 C 2011-02-03 2003-09-22|1996-07-31 -S000003328 ORF Verified YGR096W TPC1 thiamine transporter TPC1 chromosome 7 7 676621 677565 W 2011-02-03 1996-07-31 Mitochondrial membrane transporter; mediates uptake of the essential cofactor thiamine pyrophosphate (ThPP) into mitochondria; expression appears to be regulated by carbon source; member of the mitochondrial carrier family -S000035962 CDS YGR096W 7 676621 677565 W 2011-02-03 1996-07-31 -S000003329 ORF Verified YGR097W ASK10 RGC2 chromosome 7 L000002770 7 678695 682135 W 2011-02-03 1996-07-31 Regulator of the Fps1p glycerol channel; under nonstress conditions, binds to Fps1p to positively regulate glycerol transport; under osmotic stress, multiple phosphorylation by Hog1p causes Ask10p to dissociate from Fps1p; forms homodimers and heterodimerizes with paralog Rgc1p; phosphorylated in response to oxidative stress; has a role in destruction of Ssn8p; associates with RNA polymerase II holoenzyme -S000037821 CDS YGR097W 7 678695 682135 W 2011-02-03 1996-07-31 -S000003330 ORF Verified YGR098C ESP1 separase chromosome 7 L000000584 7 687458 682566 C 60 2011-02-03 1996-07-31 Separase, a caspase-like cysteine protease; promotes sister chromatid separation by mediating dissociation of the cohesin Scc1p from chromatin; inhibits protein phosphatase 2A-Cdc55p to promote mitotic exit; inhibited by Pds1p; relative distribution to the nucleus increases upon DNA replication stress -S000037871 CDS YGR098C 7 687458 682566 C 2011-02-03 1996-07-31 -S000003331 ORF Verified YGR099W TEL2 chromosome 7 L000002913 7 687899 689965 W 2011-02-03 1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; subunit of the telomere cap complex DNA-binding protein specific to single-stranded yeast telomeric DNA repeats, required for telomere length regulation and telomere position effect; involved in the stability or biogenesis of PIKKs such as TORC1 -S000029946 CDS YGR099W 7 687899 689965 W 2011-02-03 1996-07-31 -S000003332 ORF Verified YGR100W MDR1 GYP2|MIC1 chromosome 7 L000003270 7 690245 693097 W 2011-02-03 1996-07-31 Cytoplasmic GTPase-activating protein; activates Ypt/Rab transport GTPases Ypt6p, Ypt31p and Sec4p; involved in recycling of internalized proteins and regulation of Golgi secretory function -S000035442 CDS YGR100W 7 690245 693097 W 2011-02-03 1996-07-31 -S000003333 ORF Verified YGR101W PCP1 rhomboid protease PCP1|RBD1|MDM37 chromosome 7 7 693363 694403 W 2011-02-03 1996-07-31 Mitochondrial serine protease; required for the processing of various mitochondrial proteins and maintenance of mitochondrial DNA and morphology; belongs to the rhomboid-GlpG superfamily of intramembrane peptidases -S000035497 CDS YGR101W 7 693363 694403 W 2011-02-03 1996-07-31 -S000003334 ORF Verified YGR102C GTF1 glutamyl-tRNA(Gln) amidotransferase subunit F chromosome 7 7 695135 694584 C 2011-02-03 1996-07-31 Subunit of the trimeric GatFAB AmidoTransferase(AdT) complex; involved in the formation of Q-tRNAQ; transposon insertion mutant is salt sensitive and null mutant has growth defects; non-tagged protein is detected in purified mitochondria -S000035523 CDS YGR102C 7 695135 694584 C 2011-02-03 1996-07-31 -S000003335 ORF Verified YGR103W NOP7 mRNA-binding ribosome synthesis protein NOP7|YPH1 chromosome 7 S000007661 7 695417 697234 W 2011-02-03 1996-07-31 Component of several different pre-ribosomal particles; forms a complex with Ytm1p and Erb1p that is required for maturation of the large ribosomal subunit; required for exit from G0 and the initiation of cell proliferation -S000036462 CDS YGR103W 7 695417 697234 W 2011-02-03 1996-07-31 -S000003336 ORF Verified YGR104C SRB5 MED18 chromosome 7 L000002052 7 698368 697445 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; required for proper termination of transcription for some genes; involved in telomere maintenance -S000036489 CDS YGR104C 7 698368 697445 C 2011-02-03 1996-07-31 -S000003337 ORF Verified YGR105W VMA21 chromosome 7 L000002466 7 698599 698832 W 2011-02-03 1996-07-31 Integral membrane protein required for V-ATPase function; not an actual component of the vacuolar H+-ATPase (V-ATPase) complex; diverged ortholog of human XMEA (X-linked Myopathy with Excessive Autophagy); functions in the assembly of the V-ATPase; localized to the yeast endoplasmic reticulum (ER) -S000036647 CDS YGR105W 7 698599 698832 W 2011-02-03 1996-07-31 -S000003338 ORF Verified YGR106C VOA1 chromosome 7 7 699786 698989 C 2011-02-03 1996-07-31 ER protein that functions in assembly of the V0 sector of V-ATPase; functions with other assembly factors; null mutation enhances the vacuolar ATPase (V-ATPase) deficiency of a vma21 mutant impaired in endoplasmic reticulum (ER) retrieval -S000036683 CDS YGR106C 7 699786 698989 C 2011-02-03 1996-07-31 -S000006646 tRNA_gene tL(GAG)G chromosome 7 L000003829 7 700675 700756 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; not essential for viability even though this is the only tRNA that decodes GAG codons -S000031926 noncoding_exon tL(GAG)G 7 700675 700756 W 2011-02-03 2000-05-19 -S000006631 tRNA_gene tK(UUU)G2 chromosome 7 L000003845 7 701048 700953 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000033693 intron tK(UUU)G2 7 701011 700989 C 2011-02-03 2000-05-19 -S000033692 noncoding_exon tK(UUU)G2 7 700988 700953 C 2011-02-03 2000-05-19 -S000033691 noncoding_exon tK(UUU)G2 7 701048 701012 C 2011-02-03 2000-05-19 -S000006968 long_terminal_repeat YGRWdelta19 chromosome 7 7 701104 701350 W 2011-02-03 2000-05-19 Ty1 LTR -S000003339 ORF Dubious YGR107W chromosome 7 7 702667 703116 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037476 CDS YGR107W 7 702667 703116 W 2011-02-03 1996-07-31 -S000003340 ORF Verified YGR108W CLB1 B-type cyclin CLB1|SCB1 chromosome 7 L000000349 7 703636 705051 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the transition from G2 to M phase; accumulates during G2 and M, then targeted via a destruction box motif for ubiquitin-mediated degradation by the proteasome; CLB1 has a paralog, CLB2, that arose from the whole genome duplication -S000037604 CDS YGR108W 7 703636 705051 W 2011-02-03 1996-07-31 -S000003341 ORF Verified YGR109C CLB6 B-type cyclin CLB6 chromosome 7 L000000354 7 706501 705359 C 2011-02-03 1996-07-31 B-type cyclin involved in DNA replication during S phase; activates Cdc28p to promote initiation of DNA synthesis; functions in formation of mitotic spindles along with Clb3p and Clb4p; most abundant during late G1; CLB6 has a paralog, CLB5, that arose from the whole genome duplication -S000037653 CDS YGR109C 7 706501 705359 C 2011-02-03 1996-07-31 -S000006527 tRNA_gene tC(GCA)G chromosome 7 L000003844 7 707179 707108 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis -S000035213 noncoding_exon tC(GCA)G 7 707179 707108 C 2011-02-03 2000-05-19 -S000006978 long_terminal_repeat YGRWsigma4 chromosome 7 7 707195 707534 W 2011-02-03 2000-05-19 Ty3 LTR -S000006984 LTR_retrotransposon YGRWTy3-1 Ty3 chromosome 7 7 707195 712545 W 2011-02-03 2000-05-19 Ty3 element, LTR retrotransposon of the Gypsy (Metaviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; transposition is induced upon exposure to mating pheromone -S000007346 transposable_element_gene YGR109W-A gag protein chromosome 7 7 707610 708482 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000033102 CDS YGR109W-A 7 707610 708482 W 2011-02-03 1999-07-17 -S000007347 transposable_element_gene YGR109W-B gag-pol fusion protein chromosome 7 7 707610 712254 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000033103 CDS YGR109W-B 7 707610 708459 W 2011-02-03 1999-07-17 -S000033104 CDS YGR109W-B 7 708461 712254 W 2011-02-03 1999-07-17 -S000033105 plus_1_translational_frameshift YGR109W-B 7 708460 708460 W 2011-02-03 1999-07-17 -S000006979 long_terminal_repeat YGRWsigma5 chromosome 7 7 712206 712545 W 2011-02-03 2000-05-19 Ty3 LTR -S000006957 long_terminal_repeat YGRCdelta20 chromosome 7 7 713384 713084 C 2011-02-03 2000-05-19 Ty1 LTR -S000003342 ORF Verified YGR110W CLD1 carboxylic ester hydrolase chromosome 7 7 713709 715046 W 2011-02-03 1996-07-31 Mitochondrial cardiolipin-specific phospholipase; functions upstream of Taz1p to generate monolyso-cardiolipin; transcription increases upon genotoxic stress; involved in restricting Ty1 transposition; has homology to mammalian CGI-58 -S000030464 CDS YGR110W 7 713709 715046 W 2011-02-03 1996-07-31 -S000118464 ARS ARS728 ARSVII-715 chromosome 7 7 715312 715377 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000119028 ARS_consensus_sequence ARS728 7 715315 715329 W 2011-02-03 2006-10-03 -S000003343 ORF Uncharacterized YGR111W chromosome 7 7 715828 717030 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000031339 CDS YGR111W 7 715828 717030 W 2011-02-03 1996-07-31 -S000003344 ORF Verified YGR112W SHY1 chromosome 7 L000004140 7 717358 718527 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein required for complex IV assembly; associates with complex IV assembly intermediates and complex III/complex IV supercomplexes; similar to human SURF1 involved in Leigh Syndrome; complex IV is also known as cytochrome c oxidase -S000031421 CDS YGR112W 7 717358 718527 W 2011-02-03 1996-07-31 -S000003345 ORF Verified YGR113W DAM1 chromosome 7 L000004420 7 718893 719924 W 2011-02-03 2001-05-31|1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); cooperates with Duo1p to connect the DASH complex with the microtubules (MT); couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; Ipl1p target for regulating kinetochore-MT attachments -S000031509 CDS YGR113W 7 718893 719924 W 2011-02-03 2001-05-31|1996-07-31 -S000003348 ORF Verified YGR116W SPT6 chromatin-remodeling histone chaperone SPT6|SSN20|CRE2 chromosome 7 L000002032 7 720409 724764 W 87.64 2011-02-03 1996-07-31 Nucleosome remodeling protein; functions in various aspects of transcription, chromatin maintenance, and RNA processing; required for the maintenance of chromatin structure during transcription in order to inhibit transcription from promoters within the coding region; required for H3K36 trimethylation but not dimethylation by Set2p -S000032690 CDS YGR116W 7 720409 724764 W 2011-02-03 1996-07-31 -S000003346 ORF Dubious YGR114C chromosome 7 7 720654 720265 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps 5' end of the essential gene SPT6 -S000031522 CDS YGR114C 7 720654 720265 C 2011-02-03 1996-07-31 -S000003347 ORF Dubious YGR115C chromosome 7 7 721151 720372 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified and essential ORF SPT6/YGR115C -S000031629 CDS YGR115C 7 721151 720372 C 2011-02-03 1996-07-31 -S000003349 ORF Uncharacterized YGR117C chromosome 7 7 726479 725049 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000032722 CDS YGR117C 7 726479 725049 C 2011-02-03 1996-07-31 -S000003350 ORF Verified YGR118W RPS23A uS12|ribosomal 40S subunit protein S23A|rp37|YS14|S28A|S23A|S12 chromosome 7 L000001764 7 726974 727730 W 2011-02-03 1996-07-31|2011-02-03 Ribosomal protein 28 (rp28) of the small (40S) ribosomal subunit; required for translational accuracy; homologous to mammalian ribosomal protein S23 and bacterial S12; RPS23A has a paralog, RPS23B, that arose from the whole genome duplication; deletion of both RPS23A and RPS23B is lethal -S000033494 CDS YGR118W 7 726974 727038 W 2011-02-03 1996-07-31 -S000033495 CDS YGR118W 7 727358 727730 W 2011-02-03 1996-07-31 -S000033496 intron YGR118W 7 727039 727357 W 2011-02-03 1996-07-31|2011-02-03 -S000003351 ORF Verified YGR119C NUP57 FG-nucleoporin NUP57 chromosome 7 L000002619 7 729671 728046 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier; found in stable complex with Nic96p and two other FG-nucleoproteins (Nsp1p and Nup49p) -S000033534 CDS YGR119C 7 729671 728046 C 2011-02-03 1996-07-31 -S000003352 ORF Verified YGR120C COG2 Golgi transport complex subunit COG2|SEC35 chromosome 7 L000004877 7 730821 730033 C 2011-02-03 2003-09-22|1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments; the components of the Golgi complex are Gog1p through Cog8p -S000034667 CDS YGR120C 7 730821 730033 C 2011-02-03 2003-09-22|1996-07-31 -S000006670 tRNA_gene tN(GUU)G chromosome 7 L000003830 7 731137 731210 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis -S000030710 noncoding_exon tN(GUU)G 7 731137 731210 W 2011-02-03 2000-05-19 -S000003353 ORF Verified YGR121C MEP1 ammonium permease MEP1|AMT1 chromosome 7 L000001073 7 732927 731449 C 2011-02-03 1996-07-31 Ammonium permease; belongs to a ubiquitous family of cytoplasmic membrane proteins that transport only ammonium (NH4+); expression is under the nitrogen catabolite repression regulation; human homolog RHCG complements yeast null mutant; mutations in human homolog RHCG implicated in metabolic acidosis; MEP1 has a paralog, MEP3, that arose from the whole genome duplication -S000034743 CDS YGR121C 7 732927 731449 C 2011-02-03 1996-07-31 -S000028550 ORF Uncharacterized YGR121W-A chromosome 7 7 733412 733627 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000031236 CDS YGR121W-A 7 733412 733627 W 2011-02-03 2003-07-29 -S000003354 ORF Verified YGR122W chromosome 7 7 733935 735143 W 2011-02-03 1996-07-31 Protein that may be involved in pH regulation; probable ortholog of A. nidulans PalC, which is involved in pH regulation and binds to the ESCRT-III complex; null mutant does not properly process Rim101p and has decreased resistance to rapamycin; GFP-fusion protein is cytoplasmic; relative distribution to cytoplasm increases upon DNA replication stress -S000035706 CDS YGR122W 7 733935 735143 W 2011-02-03 1996-07-31 -S000006969 long_terminal_repeat YGRWdelta21 chromosome 7 7 735542 735872 W 2011-02-03 2000-05-19 Ty1 LTR -S000007240 ORF Dubious YGR122C-A chromosome 7 7 735758 735630 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; similar to YLR334C and YOL106W -S000032623 CDS YGR122C-A 7 735758 735630 C 2011-02-03 1999-07-17 -S000006980 long_terminal_repeat YGRWsigma6 chromosome 7 7 735982 736322 W 2011-02-03 2000-05-19 Ty3 LTR -S000006713 tRNA_gene tR(UCU)G3 chromosome 7 L000003831 7 736340 736411 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000037332 noncoding_exon tR(UCU)G3 7 736340 736411 W 2011-02-03 2000-05-19 -S000003355 ORF Verified YGR123C PPT1 protein serine/threonine phosphatase chromosome 7 L000002624 7 738203 736662 C 2011-02-03 1996-07-31 Protein serine/threonine phosphatase; regulates Hsp90 chaperone by affecting its ATPase and cochaperone binding activities; has similarity to human phosphatase PP5; present in both the nucleus and cytoplasm; expressed during logarithmic growth -S000035715 CDS YGR123C 7 738203 736662 C 2011-02-03 1996-07-31 -S000006604 tRNA_gene tI(AAU)G chromosome 7 L000003832 7 739122 739195 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000030407 noncoding_exon tI(AAU)G 7 739122 739195 W 2011-02-03 2000-05-19 -S000003356 ORF Verified YGR124W ASN2 asparagine synthase (glutamine-hydrolyzing) 2 chromosome 7 L000003156 7 739944 741662 W 2011-02-03 1996-07-31 Asparagine synthetase; catalyzes the synthesis of L-asparagine from L-aspartate in the asparagine biosynthetic pathway; ASN2 has a paralog, ASN1, that arose from the whole genome duplication -S000035868 CDS YGR124W 7 739944 741662 W 2011-02-03 1996-07-31 -S000003357 ORF Uncharacterized YGR125W chromosome 7 7 742325 745435 W 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant has decreased rapamycin resistance but normal wormannin resistance; green fluorescent protein (GFP)-fusion protein localizes to the vacuole -S000036786 CDS YGR125W 7 742325 745435 W 2011-02-03 1996-07-31 -S000003358 ORF Uncharacterized YGR126W chromosome 7 7 745835 746527 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus and is induced in response to the DNA-damaging agent MMS -S000036861 CDS YGR126W 7 745835 746527 W 2011-02-03 1996-07-31 -S000003359 ORF Uncharacterized YGR127W chromosome 7 7 746798 747736 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression is regulated by Msn2p/Msn4p, indicating a possible role in stress response -S000036917 CDS YGR127W 7 746798 747736 W 2011-02-03 1996-07-31 -S000003360 ORF Verified YGR128C UTP8 chromosome 7 7 750091 747950 C 2011-02-03 1996-07-31 Nucleolar protein required for export of tRNAs from the nucleus; also copurifies with the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA -S000036949 CDS YGR128C 7 750091 747950 C 2011-02-03 1996-07-31 -S000003361 ORF Verified YGR129W SYF2 NTC31 chromosome 7 L000004196 7 750400 751047 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); NTC contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; relocalizes to the cytosol in response to hypoxia; isy1 syf2 cells have defective spindles activiating cell cycle arrest -S000037743 CDS YGR129W 7 750400 751047 W 2011-02-03 1996-07-31 -S000003362 ORF Verified YGR130C chromosome 7 7 753844 751394 C 2011-02-03 1996-07-31 Component of the eisosome with unknown function; GFP-fusion protein localizes to the cytoplasm; specifically phosphorylated in vitro by mammalian diphosphoinositol pentakisphosphate (IP7) -S000030568 CDS YGR130C 7 753844 751394 C 2011-02-03 1996-07-31 -S000003363 ORF Verified YGR131W FHN1 chromosome 7 7 754726 755250 W 2011-02-03 1996-07-31 Protein of unknown function; induced by ketoconazole; promoter region contains sterol regulatory element motif, which has been identified as a Upc2p-binding site; overexpression complements function of Nce102p in NCE102 deletion strain; FHN1 has a paralog, NCE102, that arose from the whole genome duplication -S000030762 CDS YGR131W 7 754726 755250 W 2011-02-03 1996-07-31 -S000003364 ORF Verified YGR132C PHB1 prohibitin subunit PHB1 chromosome 7 L000001416|L000001415 7 756452 755589 C 2011-02-03 1996-07-31 Subunit of the prohibitin complex (Phb1p-Phb2p); prohibitin is a 1.2 MDa ring-shaped inner mitochondrial membrane chaperone that stabilizes newly synthesized proteins; determinant of replicative life span; involved in mitochondrial segregation; prohibitin deficiency induces a mitochondrial unfolded protein response (mtUPR) -S000030798 CDS YGR132C 7 756452 755589 C 2011-02-03 1996-07-31 -S000003365 ORF Verified YGR133W PEX4 E2 ubiquitin-protein ligase peroxin 4|UBC10|PAS2 chromosome 7 L000001338 7 756896 757447 W 2011-02-03 1996-07-31 Peroxisomal ubiquitin conjugating enzyme; required for peroxisomal matrix protein import and peroxisome biogenesis -S000031790 CDS YGR133W 7 756896 757447 W 2011-02-03 1996-07-31 -S000003366 ORF Verified YGR134W CAF130 CCR4-NOT core subunit CAF130 chromosome 7 7 757770 761138 W 2011-02-03 1996-07-31 Subunit of the CCR4-NOT transcriptional regulatory complex; CCR4-NOT complex is evolutionarily-conserved and involved in controlling mRNA initiation, elongation, and degradation -S000031982 CDS YGR134W 7 757770 761138 W 2011-02-03 1996-07-31 -S000003367 ORF Verified YGR135W PRE9 proteasome core particle subunit alpha 3 chromosome 7 L000002701 7 761392 762168 W 2011-02-03 1996-07-31 Alpha 3 subunit of the 20S proteasome; the only nonessential 20S subunit; may be replaced by the alpha 4 subunit (Pre6p) under stress conditions to create a more active proteasomal isoform -S000032101 CDS YGR135W 7 761392 762168 W 2011-02-03 1996-07-31 -S000003368 ORF Verified YGR136W LSB1 chromosome 7 7 762428 763153 W 2011-02-03 1996-07-31 Negative regulator of actin nucleation-promoting factor activity; interacts with Las17p, a homolog of human Wiskott-Aldrich Syndrome protein (WASP), via an N-terminal SH3 domain, and along with PIN3 cooperatively inhibits the nucleation of actin filaments; overexpression blocks receptor-mediated endocytosis; protein increases in abundance and forms nuclear foci in response to DNA replication stress; LSB1 has a paralog, PIN3, that arose from the whole genome duplication -S000033027 CDS YGR136W 7 762428 763153 W 2011-02-03 1996-07-31 -S000003369 ORF Dubious YGR137W chromosome 7 7 762888 763262 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033117 CDS YGR137W 7 762888 763262 W 2011-02-03 1996-07-31 -S000003370 ORF Verified YGR138C TPO2 spermine transporter chromosome 7 7 765606 763762 C 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; specific for spermine; localizes to the plasma membrane; transcription of TPO2 is regulated by Haa1p; TPO2 has a paralog, TPO3, that arose from the whole genome duplication -S000033153 CDS YGR138C 7 765606 763762 C 2011-02-03 1996-07-31 -S000003371 ORF Dubious YGR139W chromosome 7 7 765726 766064 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034004 CDS YGR139W 7 765726 766064 W 2011-02-03 1996-07-31 -S000003372 ORF Verified YGR140W CBF2 CSL5|NDC10|CTF14|CEP2|CBF3A chromosome 7 L000000430|L000001238|L000000221 7 767429 770299 W 2011-02-03 1996-07-31 Essential kinetochore protein; component of the CBF3 multisubunit complex that binds to the CDEIII region of the centromere; Cbf2p also binds to the CDEII region possibly forming a different multimeric complex, ubiquitinated in vivo; sumoylated in an Mms21p-dependent manner; relative distribution to the spindle pole body decreases upon DNA replication stress -S000034959 CDS YGR140W 7 767429 770299 W 2011-02-03 1996-07-31 -S000003373 ORF Verified YGR141W VPS62 chromosome 7 7 770569 771972 W 2011-02-03 1996-07-31 Vacuolar protein sorting (VPS) protein; required for cytoplasm to vacuole targeting of proteins; VPS62 has a paralog, TDA6, that arose from the whole genome duplication -S000035068 CDS YGR141W 7 770569 771972 W 2011-02-03 1996-07-31 -S000003374 ORF Verified YGR142W BTN2 chromosome 7 7 772454 773686 W 2011-02-03 1996-07-31 v-SNARE binding protein; facilitates specific protein retrieval from a late endosome to the Golgi; modulates arginine uptake, possible role in mediating pH homeostasis between the vacuole and plasma membrane H(+)-ATPase; contributes to prion curing; preferentially expressed after severe ethanol stress -S000035175 CDS YGR142W 7 772454 773686 W 2011-02-03 1996-07-31 -S000006970 long_terminal_repeat YGRWdelta22 chromosome 7 7 774040 774162 W 2011-02-03 2000-05-19 Ty1 LTR -S000006512 tRNA_gene tA(AGC)G chromosome 7 L000003833 7 774349 774421 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032279 noncoding_exon tA(AGC)G 7 774349 774421 W 2011-02-03 2000-05-19 -S000003375 ORF Verified YGR143W SKN1 beta-glucan synthesis-associated protein SKN1 chromosome 7 L000001907 7 775193 777508 W 88.14 2011-02-03 1996-07-31 Protein involved in sphingolipid biosynthesis; type II membrane protein; SKN1 has a paralog, KRE6, that arose from the whole genome duplication -S000036052 CDS YGR143W 7 775193 777508 W 2011-02-03 1996-07-31 -S000118465 ARS ARS729 ARSVII-778 chromosome 7 7 777966 778214 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119029 ARS_consensus_sequence ARS729 7 778014 778028 W 2011-02-03 2006-10-03 -S000178103 ARS_consensus_sequence ARS729 7 778196 778180 C 2014-11-18 2014-11-18 -S000006971 long_terminal_repeat YGRWdelta23 chromosome 7 7 778784 779112 W 2011-02-03 2000-05-19 Ty1 LTR -S000006972 long_terminal_repeat YGRWdelta24 chromosome 7 7 779116 779224 W 2011-02-03 2000-05-19 Ty1 LTR -S000006958 long_terminal_repeat YGRCdelta25 chromosome 7 7 779515 779225 C 2011-02-03 2000-05-19 Ty1 LTR -S000006590 tRNA_gene tG(UCC)G SUF4 chromosome 7 L000002152|L000003834 7 779616 779687 W 105 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons -S000037534 noncoding_exon tG(UCC)G 7 779616 779687 W 2011-02-03 2000-05-19 -S000003376 ORF Verified YGR144W THI4 thiamine thiazole synthase|MOL1|ESP35 chromosome 7 L000001133|L000000585 7 780399 781379 W 2011-02-03 1996-07-31 Thiazole synthase; abundant protein involved in the formation of the thiazole moiety of thiamine during thiamine biosynthesis; acts more as a co-substrate rather than an enzyme by providing the sulphur source for thiazole formation; undergoes a single turnover only; required for mitochondrial genome stability in response to DNA damaging agents -S000036192 CDS YGR144W 7 780399 781379 W 2011-02-03 1996-07-31 -S000003377 ORF Verified YGR145W ENP2 ribosome biosynthesis protein ENP2 chromosome 7 7 781767 783890 W 2011-02-03 1996-07-31|2011-02-03 Component of the SSU; required for pre-18S rRNA processing, biogenesis of the small ribosomal subunit; interacts with U3 snoRNA, Mpp10p and Bfr2p; contains WD repeats, and has homology to Spb1p -S000029871 CDS YGR145W 7 781767 783890 W 2011-02-03 1996-07-31|2011-02-03 -S000003378 ORF Verified YGR146C ECL1 chromosome 7 7 784858 784223 C 2011-02-03 1996-07-31 Protein of unknown function; mitochondrial-dependent role in the extension of chronological lifespan; overexpression increases oxygen consumption and respiratory activity while deletion results in reduced oxygen consumption under conditions of caloric restriction; induced by iron homeostasis transcription factor Aft2p; multicopy suppressor of temperature sensitive hsf1 mutant; induced by treatment with 8-methoxypsoralen and UVA irradiation -S000031718 CDS YGR146C 7 784858 784223 C 2011-02-03 1996-07-31 -S000028638 ORF Uncharacterized YGR146C-A chromosome 7 7 785437 785276 C 2011-02-03 2003-07-29 Putative protein of unknown function -S000032394 CDS YGR146C-A 7 785437 785276 C 2011-02-03 2003-07-29 -S000003379 ORF Verified YGR147C NAT2 chromosome 7 L000001233 7 786920 786054 C 2011-02-03 1996-07-31 Protein of unknown function; has an apparent role in acetylation of N-terminal methionine residues -S000031870 CDS YGR147C 7 786920 786054 C 2011-02-03 1996-07-31 -S000003380 ORF Verified YGR148C RPL24B eL24|ribosomal 60S subunit protein L24B|L24e|rp29|YL21|L30B|L24B|RPL30B chromosome 7 L000001725 7 787779 787312 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L24B; not essential for translation but may be required for normal translation rate; homologous to mammalian ribosomal protein L24, no bacterial homolog; RPL24B has a paralog, RPL24A, that arose from the whole genome duplication -S000031971 CDS YGR148C 7 787779 787312 C 2011-02-03 1996-07-31 -S000122102 five_prime_UTR_intron YGR148C 7 788178 787787 C 2011-02-03 2007-04-04 -S000003381 ORF Verified YGR149W GPC1 chromosome 7 7 789031 790329 W 2011-02-03 1996-07-31 Glycerophosphocholine acyltransferase (GPCAT); involved in in phosphatidylcholine (PC) synthesis; uses acetyl-CoA to acylate glycero-3-phosphocholine to yield lyso-PC; also catalyzes acylation of glycerophosphoethanolamine with acyl-CoA; predicted to be an integal membrane protein -S000037495 CDS YGR149W 7 789031 790329 W 2011-02-03 1996-07-31 -S000003382 ORF Verified YGR150C CCM1 DMR1|RRG2 chromosome 7 7 793053 790459 C 2011-02-03 1996-07-31 Mitochondrial 15S rRNA-binding protein; required for intron removal of COB and COX1 pre-mRNAs; has separable roles in stabilizing mitochondrial 15S rRNA and in maturation of the COB and COX1 mRNAs; contains pentatricopeptide repeat (PPR) motifs; mutant is respiratory deficient and has defective plasma membrane electron transport -S000036478 CDS YGR150C 7 793053 790459 C 2011-02-03 1996-07-31 -S000006973 long_terminal_repeat YGRWdelta26 chromosome 7 7 793237 793559 W 2011-02-03 2000-05-19 Ty1 LTR -S000006523 tRNA_gene tA(UGC)G chromosome 7 L000003835 7 794417 794489 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine -S000034874 noncoding_exon tA(UGC)G 7 794417 794489 W 2011-02-03 2000-05-19 -S000003383 ORF Dubious YGR151C chromosome 7 7 794990 794655 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps almost completely with the verified ORF RSR1/BUD1/YGR152C; relative distribution to the nucleus increases upon DNA replication stress -S000037176 CDS YGR151C 7 794990 794655 C 2011-02-03 1996-07-31 -S000003384 ORF Verified YGR152C RSR1 Ras family GTPase RSR1|BUD1 chromosome 7 L000001780 7 795492 794674 C 98 2011-02-03 1996-07-31 GTP-binding protein of the Ras superfamily; required for bud site selection, morphological changes in response to mating pheromone, and efficient cell fusion; localized to the plasma membrane; significantly similar to mammalian Rap GTPases -S000037247 CDS YGR152C 7 795492 794674 C 2011-02-03 1996-07-31 -S000003385 ORF Uncharacterized YGR153W TOS10 chromosome 7 7 796092 796745 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function -S000037368 CDS YGR153W 7 796092 796745 W 2011-02-03 1996-07-31|2011-02-03 -S000003386 ORF Verified YGR154C GTO1 omega-class glutathione transferase chromosome 7 7 797868 796798 C 2011-02-03 1996-07-31 Omega-class glutathione transferase; induced under oxidative stress; putative peroxisomal localization -S000037395 CDS YGR154C 7 797868 796798 C 2011-02-03 1996-07-31 -S000003387 ORF Verified YGR155W CYS4 cystathionine beta-synthase CYS4|VMA41|STR4|NHS5 chromosome 7 L000001248|L000000471 7 798543 800066 W 87.14 2011-02-03 1996-07-31 Cystathionine beta-synthase; catalyzes synthesis of cystathionine from serine and homocysteine, the first committed step in cysteine biosynthesis; responsible for hydrogen sulfide generation; advances passage through START by promoting cell growth which requires catalytic activity, and reducing critical cell size independent of catalytic activity; mutations in human ortholog CBS cause homocystinuria; human CBS can complement yeast null mutant -S000030070 CDS YGR155W 7 798543 800066 W 2011-02-03 1996-07-31 -S000003388 ORF Verified YGR156W PTI1 cleavage polyadenylation factor subunit PTI1 chromosome 7 7 800546 801823 W 2011-02-03 1996-07-31 Essential component of CPF (cleavage and polyadenylation factor); involved in 3' end formation of snoRNA and mRNA; interacts directly with Pta1p; relocalizes to the cytosol in response to hypoxia; similar to mammalian Cleavage-Stimulation Factor CstF-64 -S000030236 CDS YGR156W 7 800546 801823 W 2011-02-03 1996-07-31 -S000003389 ORF Verified YGR157W CHO2 phosphatidylethanolamine N-methyltransferase|PEM1 chromosome 7 L000000328 7 802440 805049 W 2011-02-03 1996-07-31 Phosphatidylethanolamine methyltransferase (PEMT); catalyzes the first step in the conversion of phosphatidylethanolamine to phosphatidylcholine during the methylation pathway of phosphatidylcholine biosynthesis -S000030380 CDS YGR157W 7 802440 805049 W 2011-02-03 1996-07-31 -S000003390 ORF Verified YGR158C MTR3 exosome non-catalytic core subunit MTR3 chromosome 7 L000003982 7 806021 805269 C 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hMtr3p (EXOSC6) -S000033622 CDS YGR158C 7 806021 805269 C 2011-02-03 1996-07-31 -S000003392 ORF Dubious YGR160W chromosome 7 7 807073 807684 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033399 CDS YGR160W 7 807073 807684 W 2011-02-03 1996-07-31 -S000003391 ORF Verified YGR159C NSR1 SHE5 chromosome 7 L000001278 7 807656 806412 C 2011-02-03 1996-07-31 Nucleolar protein that binds nuclear localization sequences; required for pre-rRNA processing and ribosome biogenesis; binds to single stranded telomeric DNA and mRNA; methylated by Hmt1p; interaction with Top1p and nucleolar localization are negatively regulated by polyphosphorylation -S000033736 CDS YGR159C 7 807656 806412 C 2011-02-03 1996-07-31 -S000003393 ORF Uncharacterized YGR161C RTS3 chromosome 7 7 809420 808629 C 2011-02-03 1996-07-31 Putative component of the protein phosphatase type 2A complex -S000033431 CDS YGR161C 7 809420 808629 C 2011-02-03 1996-07-31 -S000029726 ORF Uncharacterized YGR161W-C chromosome 7 7 810227 810505 W 2011-02-03 2004-08-27 Putative protein of unknown function; identified by sequence comparison with hemiascomycetous yeast species -S000036877 CDS YGR161W-C 7 810227 810505 W 2011-02-03 2004-08-27 -S000006974 long_terminal_repeat YGRWdelta27 chromosome 7 7 811447 811778 W 2011-02-03 2000-05-19 Ty2 LTR -S000006983 LTR_retrotransposon YGRWTy2-2 Ty2 chromosome 7 7 811447 817397 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007369 transposable_element_gene YGR161W-A gag protein chromosome 7 7 811738 813054 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000030119 CDS YGR161W-A 7 811738 813054 W 2011-02-03 1999-07-17 -S000007370 transposable_element_gene YGR161W-B gag-pol fusion protein chromosome 7 S000029014 7 811738 817051 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000030122 CDS YGR161W-B 7 811738 813030 W 2011-02-03 1999-07-17 -S000030123 CDS YGR161W-B 7 813032 817051 W 2011-02-03 1999-07-17 -S000030124 plus_1_translational_frameshift YGR161W-B 7 813031 813031 W 2011-02-03 1999-07-17 -S000006975 long_terminal_repeat YGRWdelta28 chromosome 7 7 817074 817397 W 2011-02-03 2000-05-19 Ty2 LTR -S000006959 long_terminal_repeat YGRCdelta29 chromosome 7 7 817724 817393 C 2011-02-03 2000-05-19 Ty1 LTR -S000007368 transposable_element_gene YGR161C-D gag-pol fusion protein chromosome 7 7 823015 817747 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000036390 CDS YGR161C-D 7 821709 817747 C 2011-02-03 1999-07-17 -S000036389 CDS YGR161C-D 7 823015 821711 C 2011-02-03 1999-07-17 -S000036391 plus_1_translational_frameshift YGR161C-D 7 821710 821710 C 2011-02-03 1999-07-17 -S000007367 transposable_element_gene YGR161C-C gag protein chromosome 7 7 823015 821693 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000036388 CDS YGR161C-C 7 823015 821693 C 2011-02-03 1999-07-17 -S000006963 LTR_retrotransposon YGRCTy1-3 Ty1 chromosome 7 7 823306 817393 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000006960 long_terminal_repeat YGRCdelta30 chromosome 7 7 823306 822975 C 2011-02-03 2000-05-19 Ty1 LTR -S000006756 tRNA_gene tV(AAC)G2 chromosome 7 L000003836 7 823482 823555 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000036904 noncoding_exon tV(AAC)G2 7 823482 823555 W 2011-02-03 2000-05-19 -S000003394 ORF Verified YGR162W TIF4631 translation initiation factor eIF4G|eiF4G1 chromosome 7 L000002309 7 824059 826917 W 2011-02-03 1996-07-31 Translation initiation factor eIF4G; subunit of the mRNA cap-binding protein complex (eIF4F) that also contains eIF4E (Cdc33p); interacts with Pab1p and with eIF4A (Tif1p); also has a role in biogenesis of the large ribosomal subunit; TIF4631 has a paralog, TIF4632, that arose from the whole genome duplication -S000033543 CDS YGR162W 7 824059 826917 W 2011-02-03 1996-07-31 -S000003395 ORF Verified YGR163W GTR2 chromosome 7 L000004611 7 827552 828577 W 2011-02-03 1996-07-31 Subunit of a TORC1-stimulating GTPase complex; subunit of the Gtr1-Gtr2 GTPase complex that stimulates TORC1 in response to amino acid stimulation; stimulates the GTPase activity of Gtr1p; negatively regulates the Ran/Tc4 GTPase cycle; activates transcription; tethered to the vacuolar membrane as part of the EGO complex (EGOC); required for sorting of Gap1p; activated by the the Lst4p-Lst7p GAP complex; localizes to cytoplasm and to chromatin; homolog of human RagC and -S000033603 CDS YGR163W 7 827552 828577 W 2011-02-03 1996-07-31 -S000003396 ORF Dubious YGR164W chromosome 7 7 828625 828960 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034546 CDS YGR164W 7 828625 828960 W 2011-02-03 1996-07-31 -S000006712 tRNA_gene tR(UCU)G2 chromosome 7 L000003843 7 828794 828723 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine -S000037330 noncoding_exon tR(UCU)G2 7 828794 828723 C 2011-02-03 2000-05-19 -S000003397 ORF Verified YGR165W MRPS35 mitochondrial 37S ribosomal protein MRPS35 chromosome 7 7 829116 830153 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; null mutant does not grow on glycerol, is sensitive to 2,4-dichlorophenol, and accumulates large lipid droplets -S000034612 CDS YGR165W 7 829116 830153 W 2011-02-03 1996-07-31 -S000003398 ORF Verified YGR166W TRS65 KRE11 chromosome 7 L000000918 7 830515 832197 W 154.34 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic; role in cell wall beta-glucan biosynthesis and the stress response -S000034756 CDS YGR166W 7 830515 832197 W 2011-02-03 1996-07-31 -S000003399 ORF Verified YGR167W CLC1 SCD4 chromosome 7 L000000355 7 832456 833157 W 2011-02-03 1996-07-31 Clathrin light chain; subunit of the major coat protein involved in intracellular protein transport and endocytosis; regulates endocytic progression; thought to regulate clathrin function; the clathrin triskelion is a trimeric molecule composed of three heavy chains that radiate from a vertex and three light chains which bind noncovalently near the vertex of the triskelion -S000035721 CDS YGR167W 7 832456 833157 W 2011-02-03 1996-07-31 -S000003400 ORF Uncharacterized YGR168C chromosome 7 7 834482 833352 C 2011-02-03 1996-07-31 Putative protein of unknown function; YGR168C is not an essential gene -S000035768 CDS YGR168C 7 834482 833352 C 2011-02-03 1996-07-31 -S000118466 ARS ARS731 ARSVII-835 chromosome 7 7 834491 834734 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119030 ARS_consensus_sequence ARS731 7 834664 834650 C 2011-02-03 2006-10-03 -S000003401 ORF Verified YGR169C PUS6 pseudouridine synthase PUS6 chromosome 7 7 835903 834689 C 2011-02-03 1996-07-31 tRNA:pseudouridine synthase; catalyzes the conversion of uridine to pseudouridine at position 31 in cytoplasmic and mitochondrial tRNAs; mutation of Asp168 to Ala abolishes enzyme activity; not essential for viability -S000035880 CDS YGR169C 7 835903 834689 C 2011-02-03 1996-07-31 -S000028521 ORF Verified YGR169C-A LSO2 YGR169C-C chromosome 7 7 836665 836387 C 2011-02-03 2003-07-29 Protein with a potential role in response to iron deprivation; localizes to nucleus and cytoplasm, and nuclear localization is enhanced under iron-replete conditions; null mutant exhibits slow growth during iron deprivation; LSO2 has a paralog, LSO1, that arose from the whole genome duplication -S000030316 CDS YGR169C-A 7 836665 836387 C 2011-02-03 2003-07-29 -S000003402 ORF Verified YGR170W PSD2 phosphatidylserine decarboxylase 2 chromosome 7 L000002817 7 837142 840558 W 2011-02-03 1996-07-31 Phosphatidylserine decarboxylase of the Golgi and vacuolar membranes; converts phosphatidylserine to phosphatidylethanolamine; controls vacuolar membrane phospholipid content by regulating phospholipids in compartments that will eventually give rise to the vacuole; loss of Psd2p causes a specific reduction in vacuolar membrane PE levels while total PE levels are not significantly affected -S000036827 CDS YGR170W 7 837142 840558 W 2011-02-03 1996-07-31 -S000003403 ORF Verified YGR171C MSM1 methionine--tRNA ligase MSM1 chromosome 7 L000001196 7 842551 840824 C 2011-02-03 1996-07-31 Mitochondrial methionyl-tRNA synthetase (MetRS); functions as a monomer in mitochondrial protein synthesis; functions similarly to cytoplasmic MetRS although the cytoplasmic form contains a zinc-binding domain not found in Msm1p -S000036868 CDS YGR171C 7 842551 840824 C 2011-02-03 1996-07-31 -S000003404 ORF Verified YGR172C YIP1 transporter YIP1 chromosome 7 L000003259 7 843591 842845 C 2011-02-03 1996-07-31 Integral membrane protein; required for the biogenesis of ER-derived COPII transport vesicles; interacts with Yif1p and Yos1p; localizes to the Golgi, the ER, and COPII vesicles; human homolog YIPF5 can complement yeast yip1 mutant -S000037595 CDS YGR172C 7 843591 842845 C 2011-02-03 1996-07-31 -S000003405 ORF Verified YGR173W RBG2 GIR1 chromosome 7 7 843854 844960 W 2011-02-03 1996-07-31 Protein with a role in translation; forms a complex with Gir2p; has similarity to mammalian developmentally regulated GTP-binding protein -S000037694 CDS YGR173W 7 843854 844960 W 2011-02-03 1996-07-31 -S000006981 long_terminal_repeat YGRWsigma7 chromosome 7 7 845281 845602 W 2011-02-03 2000-05-19 Ty3 LTR -S000006581 tRNA_gene tG(GCC)G1 chromosome 7 L000003837 7 845649 845719 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000037454 noncoding_exon tG(GCC)G1 7 845649 845719 W 2011-02-03 2000-05-19 -S000003406 ORF Verified YGR174C CBP4 chromosome 7 L000000227 7 846405 845893 C 2011-02-03 1996-07-31 Mitochondrial protein required for assembly of cytochrome bc1 complex; interacts with the Cbp3p-Cbp6p complex and newly synthesized cytochrome b (Cobp) to promote assembly of Cobp into the cytochrome bc1 complex -S000037715 CDS YGR174C 7 846405 845893 C 2011-02-03 1996-07-31 -S000028639 ORF Uncharacterized YGR174W-A chromosome 7 7 846655 846741 W 2011-02-03 2003-07-29 Putative protein of unknown function; predicted to have a role in cell budding based on computational "guilt by association" analysis -S000032395 CDS YGR174W-A 7 846655 846741 W 2011-02-03 2003-07-29 -S000003407 ORF Verified YGR175C ERG1 squalene monooxygenase chromosome 7 L000000568 7 848423 846933 C 2011-02-03 1996-07-31 Squalene epoxidase; catalyzes the epoxidation of squalene to 2,3-oxidosqualene; plays an essential role in the ergosterol-biosynthesis pathway and is the specific target of the antifungal drug terbinafine; human SQLE functionally complements the lethality of the erg1 null mutation -S000037776 CDS YGR175C 7 848423 846933 C 2011-02-03 1996-07-31 -S000003408 ORF Dubious YGR176W chromosome 7 7 848720 849067 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030672 CDS YGR176W 7 848720 849067 W 2011-02-03 1996-07-31 -S000003409 ORF Verified YGR177C ATF2 alcohol O-acetyltransferase chromosome 7 L000003345 7 850436 848829 C 2011-02-03 1996-07-31 Alcohol acetyltransferase; may play a role in steroid detoxification; forms volatile esters during fermentation, which is important for brewing and winemaking -S000030746 CDS YGR177C 7 850436 848829 C 2011-02-03 1996-07-31 -S000003410 ORF Verified YGR178C PBP1 MRS16 chromosome 7 L000003967 7 853215 851047 C 2011-02-03 1996-07-31 Component of glucose deprivation induced stress granules; involved in P-body-dependent granule assembly; similar to human ataxin-2; interacts with Pab1p to regulate mRNA polyadenylation; interacts with Mkt1p to regulate HO translation; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress -S000030834 CDS YGR178C 7 853215 851047 C 2011-02-03 1996-07-31 -S000003411 ORF Verified YGR179C OKP1 chromosome 7 7 854895 853675 C 2011-02-03 1996-07-31 Outer kinetochore protein required for accurate chromosome segregation; component of COMA (Ctf19p, Okp1p, Mcm21p, Ame1p) a kinetochore sub-complex which functions as a platform for kinetochore assembly; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-Q and fission yeast fta7 -S000031845 CDS YGR179C 7 854895 853675 C 2011-02-03 1996-07-31 -S000003412 ORF Verified YGR180C RNR4 ribonucleotide-diphosphate reductase subunit RNR4|PSO3|CRT3 chromosome 7 L000002819|S000029396|L000004184 7 856301 855264 C 2011-02-03 1996-07-31 Ribonucleotide-diphosphate reductase (RNR) small subunit; the RNR complex catalyzes the rate-limiting step in dNTP synthesis and is regulated by DNA replication and DNA damage checkpoint pathways via localization of the small subunits; relocalizes from nucleus to cytoplasm upon DNA replication stress; RNR4 has a paralog, RNR2, that arose from the whole genome duplication -S000031850 CDS YGR180C 7 856301 855264 C 2011-02-03 1996-07-31 -S000006641 tRNA_gene tL(CAA)G3 chromosome 7 L000003842 7 857491 857378 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis -S000034251 intron tL(CAA)G3 7 857453 857422 C 2011-02-03 2000-05-19 -S000034250 noncoding_exon tL(CAA)G3 7 857421 857378 C 2011-02-03 2000-05-19 -S000034249 noncoding_exon tL(CAA)G3 7 857491 857454 C 2011-02-03 2000-05-19 -S000003413 ORF Verified YGR181W TIM13 protein translocase subunit TIM13 chromosome 7 7 858287 858604 W 2011-02-03 1996-07-31 Mitochondrial intermembrane space protein; forms a complex with Tim8p that delivers a subset of hydrophobic proteins to the TIM22 complex for insertion into the inner membrane -S000032812 CDS YGR181W 7 858287 858604 W 2011-02-03 1996-07-31 -S000003414 ORF Dubious YGR182C chromosome 7 7 858904 858551 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF TIM13/YGR181W -S000032855 CDS YGR182C 7 858904 858551 C 2011-02-03 1996-07-31 -S000003415 ORF Verified YGR183C QCR9 ubiquinol--cytochrome-c reductase subunit 9|UCR9 chromosome 7 L000001549 7 859476 859063 C 148 2011-02-03 1996-07-31 Subunit 9 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; required for electron transfer at the ubiquinol oxidase site of the complex -S000032944 CDS YGR183C 7 859260 859063 C 2011-02-03 1996-07-31 -S000032943 CDS YGR183C 7 859476 859474 C 2011-02-03 1996-07-31 -S000032945 intron YGR183C 7 859473 859261 C 2011-02-03 1996-07-31 -S000003416 ORF Verified YGR184C UBR1 E3 ubiquitin-protein ligase UBR1|PTR1 chromosome 7 L000002420 7 865753 859901 C 2011-02-03 1996-07-31 E3 ubiquitin ligase (N-recognin); heterodimerizes with Rad6p to recognize and ubiquitinate substrates of the N-end rule pathway; role in endoplasmic reticulum-associated protein degradation (ERAD) in the absence of canonical ER membrane ligases or after stress; major role in targeting misfolded cytosolic proteins for degradation; regulates peptide transport via Cup9p ubiquitination; mutation in human UBR1 causes Johansson-Blizzard Syndrome (JBS) -S000033034 CDS YGR184C 7 865753 859901 C 2011-02-03 1996-07-31 -S000003417 ORF Verified YGR185C TYS1 tyrosine--tRNA ligase TYS1|TyrRS|TTS1 chromosome 7 L000001105 7 867520 866336 C 2011-02-03 1996-07-31 Cytoplasmic tyrosyl-tRNA synthetase; required for cytoplasmic protein synthesis; interacts with positions 34 and 35 of the tRNATyr anticodon; mutations in human ortholog YARS are associated with Charcot-Marie-Tooth (CMT) neuropathies; human ortholog YARS functionally complements the heat sensitivity of a ts allele; protein abundance increases in response to DNA replication stress -S000033686 CDS YGR185C 7 867520 866336 C 2011-02-03 1996-07-31 -S000003418 ORF Verified YGR186W TFG1 transcription factor IIF subunit TFG1|RAP74|SSU71 chromosome 7 L000002594 7 867774 869981 W 2011-02-03 1996-07-31 TFIIF (Transcription Factor II) largest subunit; involved in both transcription initiation and elongation of RNA polymerase II; homologous to human RAP74 -S000033854 CDS YGR186W 7 867774 869981 W 2011-02-03 1996-07-31 -S000003419 ORF Verified YGR187C HGH1 chromosome 7 L000003003 7 871416 870232 C 2011-02-03 1996-07-31 Nonessential protein of unknown function; predicted to be involved in ribosome biogenesis; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; similar to mammalian BRP16 (Brain protein 16); relative distribution to the nucleus increases upon DNA replication stress -S000033880 CDS YGR187C 7 871416 870232 C 2011-02-03 1996-07-31 -S000003420 ORF Verified YGR188C BUB1 protein kinase BUB1 chromosome 7 L000000196 7 875109 872044 C 150 2011-02-03 1996-07-31 Protein kinase involved in the cell cycle checkpoint into anaphase; in complex with Mad1p and Bub3p, prevents progression into anaphase in presence of spindle damage; Cdc28p-mediated phosphorylation at Bub1p-T566 is important for degradation in anaphase and adaptation of checkpoint to prolonged mitotic arrest; associates with centromere DNA via Skp1p; involved in Sgo1p relocalization in response to sister kinetochore tension; paralog MAD3 arose from whole genome duplication -S000034040 CDS YGR188C 7 875109 872044 C 2011-02-03 1996-07-31 -S000006976 long_terminal_repeat YGRWdelta31 chromosome 7 7 875951 876279 W 2011-02-03 2000-05-19 Ty1 LTR -S000006623 tRNA_gene tK(CUU)G3 chromosome 7 L000003838 7 876394 876466 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000029892 noncoding_exon tK(CUU)G3 7 876394 876466 W 2011-02-03 2000-05-19 -S000003421 ORF Verified YGR189C CRH1 transglycosylase chromosome 7 S000007423 7 878192 876669 C 2011-02-03 1996-07-31 Chitin transglycosylase; functions in the transfer of chitin to beta(1-6) and beta(1-3) glucans in the cell wall; similar and functionally redundant to Utr2; localizes to sites of polarized growth; expression induced by cell wall stress -S000034926 CDS YGR189C 7 878192 876669 C 2011-02-03 1996-07-31 -S000006772 tRNA_gene tW(CCA)G2 chromosome 7 L000003841 7 878815 878710 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis -S000032530 intron tW(CCA)G2 7 878779 878746 C 2011-02-03 2000-05-19 -S000032529 noncoding_exon tW(CCA)G2 7 878745 878710 C 2011-02-03 2000-05-19 -S000032528 noncoding_exon tW(CCA)G2 7 878815 878780 C 2011-02-03 2000-05-19 -S000003423 ORF Verified YGR191W HIP1 histidine permease chromosome 7 L000000775 7 880420 882231 W 146 2011-02-03 1996-07-31 High-affinity histidine permease; also involved in the transport of manganese ions -S000036175 CDS YGR191W 7 880420 882231 W 2011-02-03 1996-07-31 -S000003422 ORF Dubious YGR190C chromosome 7 7 880661 880296 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene HIP1/YGR191W -S000035932 CDS YGR190C 7 880661 880296 C 2011-02-03 1996-07-31 -S000003424 ORF Verified YGR192C TDH3 glyceraldehyde-3-phosphate dehydrogenase (phosphorylating) TDH3|GAPDH|GPD|SSS2|HSP36|HSP35|GLD1 chromosome 7 L000002274 7 883810 882812 C 2011-02-03 1996-07-31 Glyceraldehyde-3-phosphate dehydrogenase (GAPDH), isozyme 3; involved in glycolysis and gluconeogenesis; tetramer that catalyzes the reaction of glyceraldehyde-3-phosphate to 1,3 bis-phosphoglycerate; detected in the cytoplasm and cell wall; GAPDH-derived antimicrobial peptides secreted by S. cerevisiae are active against a wide variety of wine-related yeasts and bacteria; binds AU-rich RNA -S000036226 CDS YGR192C 7 883810 882812 C 2011-02-03 1996-07-31 -S000003425 ORF Verified YGR193C PDX1 chromosome 7 L000001369 7 885741 884509 C 2011-02-03 1996-07-31 E3-binding protein of the mitochondrial pyruvate dehydrogenase complex; plays a structural role in the complex by binding and positioning dihydrolipoamide dehydrogenase (E3) to the dihydrolipoamide acetyltransferase (E2) core -S000036958 CDS YGR193C 7 885741 884509 C 2011-02-03 1996-07-31 -S000003426 ORF Verified YGR194C XKS1 xylulokinase chromosome 7 7 887875 886073 C 2011-02-03 1996-07-31 Xylulokinase; converts D-xylulose and ATP to xylulose 5-phosphate and ADP; rate limiting step in fermentation of xylulose; required for xylose fermentation by recombinant S. cerevisiae strains -S000037017 CDS YGR194C 7 887875 886073 C 2011-02-03 1996-07-31 -S000119032 ARS ARS737 ARSVII-888|ARS731.5 chromosome 7 7 888413 888493 2014-11-18 2014-11-18|2006-10-03 Autonomously Replicating Sequence -S000119033 ARS_consensus_sequence ARS737 7 888414 888430 W 2014-11-18 2014-11-18|2006-10-03 -S000003427 ORF Verified YGR195W SKI6 exosome non-catalytic core subunit SKI6|RRP41|ECM20 chromosome 7 L000003895|L000004426 7 888882 889622 W 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp41p (EXOSC4) -S000037164 CDS YGR195W 7 888882 889622 W 2011-02-03 1996-07-31 -S000003428 ORF Verified YGR196C FYV8 chromosome 7 7 892186 889733 C 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin -S000037853 CDS YGR196C 7 892186 889733 C 2011-02-03 1996-07-31 -S000003429 ORF Verified YGR197C SNG1 chromosome 7 L000002747 7 894140 892497 C 2011-02-03 1996-07-31 Protein involved in resistance to nitrosoguanidine and 6-azauracil; expression is regulated by transcription factors involved in multidrug resistance; SNG1 has a paralog, YJR015W, that arose from the whole genome duplication -S000029875 CDS YGR197C 7 894140 892497 C 2011-02-03 1996-07-31 -S000003430 ORF Verified YGR198W YPP1 chromosome 7 7 894693 897146 W 2011-02-03 1996-07-31 Cargo-transport protein involved in endocytosis; interacts with phosphatidylinositol-4-kinase Stt4p; is required, along with Efr3p, for the assembly and recruitment of multiple copies of the kinase into phosphoinositide kinase (PIK) patches at the plasma membrane; positively regulates Stt4p; GFP-fusion protein localizes to the cytoplasm; YGR198W is an essential gene -S000030951 CDS YGR198W 7 894693 897146 W 2011-02-03 1996-07-31 -S000003431 ORF Verified YGR199W PMT6 dolichyl-phosphate-mannose-protein mannosyltransferase PMT6 chromosome 7 L000004009|L000004020 7 897502 899781 W 2011-02-03 1996-07-31 Protein O-mannosyltransferase; transfers mannose from dolichyl phosphate-D-mannose to protein serine/threonine residues of secretory proteins; reaction is essential for cell wall rigidity; member of a family of mannosyltransferases -S000031053 CDS YGR199W 7 897502 899781 W 2011-02-03 1996-07-31 -S000003432 ORF Verified YGR200C ELP2 Elongator subunit ELP2|KTI3|TOT2 chromosome 7 7 902270 899904 C 2011-02-03 1996-07-31 Subunit of Elongator complex; binds to microtubules via conserved alkaline residues; has two seven-bladed WD40 β propellers; Elongator complex is required for modification of wobble nucleosides in tRNA; target of Kluyveromyces lactis zymocin -S000036532 CDS YGR200C 7 902270 899904 C 2011-02-03 1996-07-31 -S000003433 ORF Uncharacterized YGR201C chromosome 7 7 903197 902520 C 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function -S000036618 CDS YGR201C 7 903197 902520 C 2011-02-03 2003-09-22|1996-07-31 -S000003434 ORF Verified YGR202C PCT1 choline-phosphate cytidylyltransferase|CCT1|BSR2 chromosome 7 L000000240 7 904748 903474 C 2011-02-03 1996-07-31 Cholinephosphate cytidylyltransferase; a rate-determining enzyme of the CDP-choline pathway for phosphatidylcholine synthesis, inhibited by Sec14p, activated upon lipid-binding; contains an element within the regulatory domain involved in both silencing and activation of enzymatic activity -S000036716 CDS YGR202C 7 904748 903474 C 2011-02-03 1996-07-31 -S000003435 ORF Verified YGR203W YCH1 phosphatase YCH1 chromosome 7 7 905237 905683 W 2011-02-03 1996-07-31 Phosphatase with sequence similarity to Cdc25p; Arr2p and Mih1p; member of the single-domain rhodanese homology superfamily; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus -S000030650 CDS YGR203W 7 905237 905683 W 2011-02-03 1996-07-31 -S000003436 ORF Verified YGR204W ADE3 trifunctional formate-tetrahydrofolate ligase/methenyltetrahydrofolate cyclohydrolase/methylenetetrahydrofolate dehydrogenase ADE3 chromosome 7 L000000033 7 905934 908774 W 159 2011-02-03 1996-07-31 Cytoplasmic trifunctional enzyme C1-tetrahydrofolate synthase; involved in single carbon metabolism and required for biosynthesis of purines, thymidylate, methionine, and histidine; null mutation causes auxotrophy for adenine and histidine -S000030764 CDS YGR204W 7 905934 908774 W 2011-02-03 1996-07-31 -S000028640 ORF Uncharacterized YGR204C-A chromosome 7 7 909174 909061 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032416 CDS YGR204C-A 7 909174 909061 C 2011-02-03 2003-07-29 -S000003437 ORF Verified YGR205W TDA10 putative ATP-dependent kinase chromosome 7 7 909213 910085 W 2011-02-03 1996-07-31 ATP-binding protein of unknown function; crystal structure resembles that of E.coli pantothenate kinase and other small kinases; null mutant is sensitive to expression of the top1-T722A allele -S000030854 CDS YGR205W 7 909213 910085 W 2011-02-03 1996-07-31 -S000003438 ORF Verified YGR206W MVB12 ubiquitin-binding ESCRT-I subunit protein MVB12 chromosome 7 7 910432 910737 W 2011-02-03 1996-07-31 ESCRT-I subunit required to stabilize ESCRT-I core complex oligomers; the ESCRT-I core complex (Stp22p, Vps28p, Srn2p) is involved in ubiquitin-dependent sorting of proteins into the endosome; deletion mutant is sensitive to rapamycin and nystatin -S000031833 CDS YGR206W 7 910432 910737 W 2011-02-03 1996-07-31 -S000003439 ORF Verified YGR207C CIR1 chromosome 7 7 911628 910843 C 2011-02-03 1996-07-31 Mitochondrial protein that interacts with frataxin (Yfh1p); putative ortholog of mammalian electron transfer flavoprotein complex subunit ETF-beta; may have a role in oxidative stress response -S000031940 CDS YGR207C 7 911628 910843 C 2011-02-03 1996-07-31 -S000003440 ORF Verified YGR208W SER2 phosphoserine phosphatase chromosome 7 L000001866 7 911883 912812 W 168 2011-02-03 1996-07-31 Phosphoserine phosphatase of the phosphoglycerate pathway; involved in serine and glycine biosynthesis, expression is regulated by the available nitrogen source -S000032117 CDS YGR208W 7 911883 912812 W 2011-02-03 1996-07-31 -S000003441 ORF Verified YGR209C TRX2 thioredoxin TRX2|LMA1 chromosome 7 L000002358 7 913227 912913 C 161 2011-02-03 1996-07-31 Cytoplasmic thioredoxin isoenzyme; part of thioredoxin system which protects cells against oxidative and reductive stress; forms LMA1 complex with Pbi2p; acts as a cofactor for Tsa1p; required for ER-Golgi transport and vacuole inheritance; with Trx1p, facilitates mitochondrial import of small Tims Tim9p, Tim10p, Tim13p by maintaining them in reduced form; abundance increases under DNA replication stress; TRX2 has a paralog, TRX1, that arose from the whole genome duplication -S000032991 CDS YGR209C 7 913227 912913 C 2011-02-03 1996-07-31 -S000003442 ORF Uncharacterized YGR210C chromosome 7 7 914738 913503 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000032713 CDS YGR210C 7 914738 913503 C 2011-02-03 1996-07-31 -S000003443 ORF Verified YGR211W ZPR1 zinc finger-containing protein ZPR1 chromosome 7 L000004700 7 915241 916701 W 2011-02-03 1996-07-31 Essential protein with two zinc fingers; present in nucleus of growing cells, relocates to cytoplasm in starved cells via a process mediated by Cpr1p; binds translation elongation factor eEF-1 (Tef1p); relative distribution to nucleus increases upon DNA replication stress; human ZPR1 gene can complement yeast by allowing growth during down-regulation of yeast zpr1 -S000032885 CDS YGR211W 7 915241 916701 W 2011-02-03 1996-07-31 -S000003444 ORF Verified YGR212W SLI1 N-acetyltransferase chromosome 7 7 917040 918446 W 2011-02-03 1996-07-31 N-acetyltransferase; confers resistance to the sphingolipid biosynthesis inhibitor myriocin (ISP-1) by converting it into N-acetyl-myriocin, co-operates with Ypk1p in mediating resistance to myriocin -S000034830 CDS YGR212W 7 917040 918446 W 2011-02-03 1996-07-31 -S000003445 ORF Verified YGR213C RTA1 chromosome 7 L000003245 7 919465 918512 C 2011-02-03 1996-07-31 Protein involved in 7-aminocholesterol resistance; has seven potential membrane-spanning regions; expression is induced under both low-heme and low-oxygen conditions; member of the fungal lipid-translocating exporter (LTE) family of protein; RTA1 has a paralog, YLR046C, that arose from the whole genome duplication -S000034869 CDS YGR213C 7 919465 918512 C 2011-02-03 1996-07-31 -S000003446 ORF Verified YGR214W RPS0A uS2|ribosomal 40S subunit protein S0A|S2|S0A|YST1|NAB1A|NAB1 chromosome 7 L000001226|L000001225 7 920575 921788 W 2011-02-03 1996-07-31 Ribosomal 40S subunit protein S0A; required for maturation of 18S rRNA along with Rps0Bp; deletion of either RPS0 gene reduces growth rate, deletion of both genes is lethal; homologous to human ribosomal protein SA and bacterial S2; RPS0A has a paralog, RPS0B, that arose from the whole genome duplication; -S000035102 CDS YGR214W 7 920575 920664 W 2011-02-03 1996-07-31 -S000035103 CDS YGR214W 7 921120 921788 W 2011-02-03 1996-07-31 -S000035104 intron YGR214W 7 920665 921119 W 2011-02-03 1996-07-31 -S000003447 ORF Verified YGR215W RSM27 mitochondrial 37S ribosomal protein RSM27 chromosome 7 7 922175 922507 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000035176 CDS YGR215W 7 922175 922507 W 2011-02-03 1996-07-31 -S000003448 ORF Verified YGR216C GPI1 phosphatidylinositol N-acetylglucosaminyltransferase chromosome 7 L000000725 7 924462 922633 C 2011-02-03 1996-07-31 Membrane protein involved in the synthesis of GlcNAc-PI; N-acetylglucosaminyl phosphatidylinositol (GlcNAc-PI) is the first intermediate in the synthesis of glycosylphosphatidylinositol (GPI) anchors; human and mouse GPI1p are functional homologs -S000035248 CDS YGR216C 7 924462 922633 C 2011-02-03 1996-07-31 -S000003449 ORF Verified YGR217W CCH1 chromosome 7 L000003440 7 924696 930815 W 2011-02-03 1996-07-31 Voltage-gated high-affinity calcium channel; involved in calcium influx in response to some environmental stresses as well as exposure to mating pheromones; interacts and partially co-localizes with Mid1p; however, evidence suggests CCH1 is not required for Mid1p function -S000036194 CDS YGR217W 7 924696 930815 W 2011-02-03 1996-07-31 -S000006582 tRNA_gene tG(GCC)G2 chromosome 7 L000003840 7 931023 930953 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis -S000037457 noncoding_exon tG(GCC)G2 7 931023 930953 C 2011-02-03 2000-05-19 -S000006961 long_terminal_repeat YGRCtau3 chromosome 7 7 931540 931171 C 2011-02-03 2000-05-19 Ty4 LTR -S000006977 long_terminal_repeat YGRWdelta32 chromosome 7 7 931688 932019 W 2011-02-03 2000-05-19 Ty1 LTR -S000003450 ORF Verified YGR218W CRM1 exportin CRM1|XPO1|KAP124 chromosome 7 L000000420 7 932541 935795 W 2011-02-03 1996-07-31 Major karyopherin; involved in export of proteins, RNAs, and ribosomal subunits from the nucleus; exportin -S000029874 CDS YGR218W 7 932541 935795 W 2011-02-03 1996-07-31 -S000003451 ORF Dubious YGR219W chromosome 7 7 936035 936376 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MRPL9/YGR220C -S000031776 CDS YGR219W 7 936035 936376 W 2011-02-03 1996-07-31 -S000003452 ORF Verified YGR220C MRPL9 mitochondrial 54S ribosomal protein YmL9|YmL9 chromosome 7 L000001163|L000002525 7 936883 936074 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000036227 CDS YGR220C 7 936883 936074 C 2011-02-03 1996-07-31 -S000003453 ORF Verified YGR221C TOS2 chromosome 7 7 938992 937124 C 2011-02-03 1996-07-31|2011-02-03 Protein involved in localization of Cdc24p to the site of bud growth; may act as a membrane anchor; localizes to the bud neck and bud tip; potentially phosphorylated by Cdc28p; TOS2 has a paralog, SKG6, that arose from the whole genome duplication -S000036329 CDS YGR221C 7 938992 937124 C 2011-02-03 1996-07-31|2011-02-03 -S000006495 snRNA_gene snR7-L SNR7-L U5L|SNR7 chromosome 7 7 939672 939459 C 2011-02-03 2004-03-30 U5 spliceosomal RNA (U5 snRNA), long form; associated with spliceosome -S000033299 noncoding_exon snR7-L 7 939672 939459 C 2011-02-03 2004-03-30 -S000006496 snRNA_gene snR7-S SNR7-S U5S|SNR7 chromosome 7 7 939672 939494 C 2011-02-03 2004-04-01 U5 spliceosomal RNA (U5 snRNA), short form; derived from SNR7-L by 3' end processing; associated with spliceosome -S000033320 noncoding_exon snR7-S 7 939672 939494 C 2011-02-03 2004-04-01 -S000003454 ORF Verified YGR222W PET54 chromosome 7 L000001391 7 939923 940804 W 174 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; binds to the 5' UTR of the COX3 mRNA to activate its translation together with Pet122p and Pet494p; also binds to the COX1 Group I intron AI5 beta to facilitate exon ligation during splicing -S000036470 CDS YGR222W 7 939923 940804 W 2011-02-03 1996-07-31 -S000003455 ORF Verified YGR223C HSV2 chromosome 7 7 942215 940869 C 2011-02-03 1996-07-31 Phosphatidylinositol 3,5-bisphosphate-binding protein; plays a role in micronucleophagy; belongs to the PROPPIN family of proteins; predicted to fold as a seven-bladed beta-propeller; displays punctate cytoplasmic localization -S000036479 CDS YGR223C 7 942215 940869 C 2011-02-03 1996-07-31 -S000003456 ORF Verified YGR224W AZR1 azole transporter chromosome 7 7 942806 944647 W 2011-02-03 1996-07-31 Plasma membrane transporter of the major facilitator superfamily; involved in resistance to azole drugs such as ketoconazole and fluconazole -S000037202 CDS YGR224W 7 942806 944647 W 2011-02-03 1996-07-31 -S000003457 ORF Verified YGR225W AMA1 SPO70 chromosome 7 L000004668 7 945145 947019 W 2011-02-03 2000-12-01|1996-07-31|2005-11-29 Activator of meiotic anaphase promoting complex (APC/C); Cdc20p family member; required for initiation of spore wall assembly; required for Clb1p degradation during meiosis; prevents premature assembly of the meiosis I spindle, required for DSB induced prophase I arrest -S000037306 CDS YGR225W 7 945145 946327 W 2011-02-03 2000-12-01|1996-07-31 -S000037307 CDS YGR225W 7 946421 947019 W 2011-02-03 2000-12-01|2005-11-29 -S000037308 intron YGR225W 7 946328 946420 W 2011-02-03 2000-12-01 -S000003458 ORF Dubious YGR226C chromosome 7 7 947001 946792 C 2011-02-03 1996-07-31|2005-11-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; overlaps significantly with a verified ORF, AMA1/YGR225W -S000037323 CDS YGR226C 7 947001 946792 C 2011-02-03 1996-07-31|2005-11-29 -S000003459 ORF Verified YGR227W DIE2 dolichyl-P-Glc:Glc(2)Man(9)GlcNAc(2)-PP-dolichol alpha-1,2- glucosyltransferase|ALG10 chromosome 7 L000002802 7 947420 948997 W 2011-02-03 1996-07-31|2011-02-03 Dolichyl-phosphoglucose-dependent alpha-1,2-glucosyltransferase; located in the ER; functions in pathway that synthesizes the dolichol-linked oligosaccharide precursor for N-linked protein glycosylation; has a role in regulation of ITR1 and INO1; human homolog ALG10B can complement yeast die2 null mutant -S000029996 CDS YGR227W 7 947420 948997 W 2011-02-03 1996-07-31|2011-02-03 -S000003460 ORF Dubious YGR228W chromosome 7 7 949365 949709 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SMI1/YGR229C -S000030071 CDS YGR228W 7 949365 949709 W 2011-02-03 1996-07-31 -S000003461 ORF Verified YGR229C SMI1 KNR4 chromosome 7 L000000909 7 950899 949382 C 2011-02-03 1996-07-31 Protein involved in the regulation of cell wall synthesis; proposed to be involved in coordinating cell cycle progression with cell wall integrity -S000030134 CDS YGR229C 7 950899 949382 C 2011-02-03 1996-07-31 -S000003462 ORF Verified YGR230W BNS1 chromosome 7 L000004859 7 951894 952307 W 2011-02-03 1996-07-31 Protein of unknown function; overexpression bypasses need for Spo12p, but not required for meiosis; BNS1 has a paralog, SPO12, that arose from the whole genome duplication -S000032548 CDS YGR230W 7 951894 952307 W 2011-02-03 1996-07-31 -S000003463 ORF Verified YGR231C PHB2 prohibitin subunit PHB2 chromosome 7 L000004019 7 953480 952548 C 2011-02-03 2004-07-15|1996-07-31 Subunit of the prohibitin complex (Phb1p-Phb2p); prohibitin is a 1.2 MDa ring-shaped inner mitochondrial membrane chaperone that stabilizes newly synthesized proteins; determinant of replicative life span; involved in mitochondrial segregation; prohibitin deficiency induces a mitochondrial unfolded protein response (mtUPR) -S000032579 CDS YGR231C 7 953480 952548 C 2011-02-03 2004-07-15|1996-07-31 -S000003464 ORF Verified YGR232W NAS6 chromosome 7 7 953960 954646 W 2011-02-03 1996-07-31 Evolutionarily conserved 19S regulatory particle assembly-chaperone; proteasome-interacting protein involved in the assembly of the base subcomplex of the 19S proteasomal regulatory particle (RP); ortholog of human oncoprotein gankyrin, also known as p28, which interacts with the Rb tumor suppressor and CDK4/6 -S000033340 CDS YGR232W 7 953960 954646 W 2011-02-03 1996-07-31 -S000003465 ORF Verified YGR233C PHO81 VAC6|phoS chromosome 7 L000001427|S000029634|L000004050 7 958210 954674 C 2011-02-03 1996-07-31 Cyclin-dependent kinase (CDK) inhibitor; regulates Pho80p-Pho85p and Pcl7p-Pho85p cyclin-CDK complexes in response to phosphate levels; inhibitory activity for Pho80p-Pho85p requires myo-D-inositol heptakisphosphate (IP7) generated by Vip1p; relative distribution to the nucleus increases upon DNA replication stress -S000033365 CDS YGR233C 7 958210 954674 C 2011-02-03 1996-07-31 -S000003466 ORF Verified YGR234W YHB1 flavohemoglobin|YHB4 chromosome 7 L000002510 7 959904 961103 W 2011-02-03 1996-07-31 Nitric oxide oxidoreductase; flavohemoglobin that plays role in oxidative and nitrosative stress responses; protects against nitration of cellular targets and against cell growth inhibition under aerobic or anaerobic conditions; yeast flavohemoglobin Yhb1p and human homolog neuroglobin NGB protect cells against alpha-synuclein cytotoxicity and aggregate formation; protein increases in abundance, relocalizes from nucleus to cytoplasmic foci upon DNA replication stress -S000033479 CDS YGR234W 7 959904 961103 W 2011-02-03 1996-07-31 -S000003467 ORF Verified YGR235C MIC26 MOS2|MCS29|MIO27 chromosome 7 7 962061 961360 C 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; Mic26p is a non-essential component of the complex -S000033513 CDS YGR235C 7 962061 961360 C 2011-02-03 1996-07-31 -S000003468 ORF Verified YGR236C SPG1 chromosome 7 7 962817 962530 C 2011-02-03 1996-07-31|2005-11-22 Protein required for high temperature survival during stationary phase; not required for growth on nonfermentable carbon sources; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000033575 CDS YGR236C 7 962817 962530 C 2011-02-03 1996-07-31|2005-11-22 -S000003469 ORF Uncharacterized YGR237C chromosome 7 7 965655 963298 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000034450 CDS YGR237C 7 965655 963298 C 2011-02-03 1996-07-31 -S000003470 ORF Verified YGR238C KEL2 chromosome 7 L000003593 7 968687 966039 C 2011-02-03 1996-07-31 Protein that negatively regulates mitotic exit; forms a complex with Kel1p and Bud14p that regulates Bnr1p (formin) to affect actin cable assembly, cytokinesis, and polarized growth; functions in a complex with Kel1p, interacts with Tem1p and Lte1p; localizes to regions of polarized growth; potential Cdc28p substrate -S000034584 CDS YGR238C 7 968687 966039 C 2011-02-03 1996-07-31 -S000003471 ORF Verified YGR239C PEX21 chromosome 7 L000004797 7 970053 969187 C 2011-02-03 1996-07-31 Peroxin required for peroxisomal matrix protein targeting; acts on proteins containing the PTS2 targeting sequence; interacts with Pex7p; constitutively expressed; partially redundant with Pex18p; required for import of the Gpd1p-Pnc1p heterodimer in which only Gpd1p has a peroxisomal targeting signal; relative distribution to cytoplasmic foci increases upon DNA replication stress -S000034676 CDS YGR239C 7 970053 969187 C 2011-02-03 1996-07-31 -S000003472 ORF Verified YGR240C PFK1 6-phosphofructokinase subunit alpha chromosome 7 L000001404 7 973734 970771 C 184 2011-02-03 1996-07-31 Alpha subunit of heterooctameric phosphofructokinase; involved in glycolysis, indispensable for anaerobic growth, activated by fructose-2,6-bisphosphate and AMP, mutation inhibits glucose induction of cell cycle-related genes -S000036620 CDS YGR240C 7 973734 970771 C 2011-02-03 1996-07-31 -S000028551 ORF Uncharacterized YGR240C-A chromosome 7 7 974777 974577 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031237 CDS YGR240C-A 7 974777 974577 C 2011-02-03 2003-07-29 -S000003474 ORF Dubious YGR242W chromosome 7 7 976415 976723 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YAP1802/YGR241C -S000036776 CDS YGR242W 7 976415 976723 W 2011-02-03 1996-07-31 -S000003473 ORF Verified YGR241C YAP1802 chromosome 7 L000004199 7 976581 974875 C 2011-02-03 1996-07-31 Protein of the AP180 family, involved in clathrin cage assembly; binds Pan1p and clathrin; YAP1802 has a paralog, YAP1801, that arose from the whole genome duplication -S000036696 CDS YGR241C 7 976581 974875 C 2011-02-03 1996-07-31 -S000003475 ORF Verified YGR243W MPC3 mitochondrial pyruvate carrier|FMP43 chromosome 7 7 977336 977776 W 2011-02-03 1996-07-31 Highly conserved subunit of the mitochondrial pyruvate carrier (MPC); expressed during growth on nonfermentable carbon sources, and heterodimerizes with Mpc1p to form the respiratory isoform of MPC; MPC localizes to the mitochondrial inner membrane and mediates pyruvate uptake; MPC3 paralog, MPC2, heterodimerizes with Mpc1p to form the fermentative MPC isoform; protein abundance increases in response to DNA replication stress -S000036844 CDS YGR243W 7 977336 977776 W 2011-02-03 1996-07-31 -S000118467 ARS ARS733 ARSVII-978 chromosome 7 7 977728 977976 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000119031 ARS_consensus_sequence ARS733 7 977905 977891 C 2011-02-03 2006-10-03 -S000003476 ORF Verified YGR244C LSC2 succinate--CoA ligase (GDP-forming) subunit beta chromosome 7 L000004592 7 979319 978036 C 2011-02-03 1996-07-31 Beta subunit of succinyl-CoA ligase; succinyl-CoA ligase is a mitochondrial enzyme of the TCA cycle that catalyzes the nucleotide-dependent conversion of succinyl-CoA to succinate -S000036869 CDS YGR244C 7 979319 978036 C 2011-02-03 1996-07-31 -S000003477 ORF Verified YGR245C SDA1 chromosome 7 7 982068 979765 C 2011-02-03 1996-07-31 Protein required for actin organization and passage through Start; highly conserved nuclear protein; required for actin cytoskeleton organization; plays a critical role in G1 events; binds Nap1p; involved in 60S ribosome biogenesis -S000037596 CDS YGR245C 7 982068 979765 C 2011-02-03 1996-07-31 -S000003478 ORF Verified YGR246C BRF1 transcription factor TFIIIB subunit BRF1|TFIIIB70|TDS4|PCF4 chromosome 7 L000000193 7 984272 982482 C 2011-02-03 1996-07-31 TFIIIB B-related factor; one of three subunits of RNA polymerase III transcription initiation factor TFIIIB, binds TFIIIC and TBP and recruits RNA pol III to promoters, amino-terminal half is homologous to TFIIB; mutations in human homolog are associated with autosomal recessive cerebellar-facial-dental syndrome -S000037668 CDS YGR246C 7 984272 982482 C 2011-02-03 1996-07-31 -S000003479 ORF Verified YGR247W CPD1 2',3'-cyclic-nucleotide 3'-phosphodiesterase chromosome 7 7 984966 985685 W 2011-02-03 1996-07-31 Cyclic nucleotide phosphodiesterase; hydrolyzes ADP-ribose 1'', 2''-cyclic phosphate to ADP-ribose 1''-phosphate; may have a role in tRNA splicing; no detectable phenotype is conferred by null mutation or by overexpression; protein abundance increases in response to DNA replication stress -S000037753 CDS YGR247W 7 984966 985685 W 2011-02-03 1996-07-31 -S000003480 ORF Verified YGR248W SOL4 6-phosphogluconolactonase SOL4 chromosome 7 L000003365 7 985972 986739 W 2011-02-03 1996-07-31 6-phosphogluconolactonase; protein abundance increases in response to DNA replication stress; SOL4 has a paralog, SOL3, that arose from the whole genome duplication -S000030588 CDS YGR248W 7 985972 986739 W 2011-02-03 1996-07-31 -S000003481 ORF Verified YGR249W MGA1 chromosome 7 L000001100 7 988049 989419 W 2011-02-03 1996-07-31 Protein similar to heat shock transcription factor; multicopy suppressor of pseudohyphal growth defects of ammonium permease mutants -S000030700 CDS YGR249W 7 988049 989419 W 2011-02-03 1996-07-31 -S000003482 ORF Verified YGR250C RIE1 chromosome 7 7 993521 991176 C 2011-02-03 1996-07-31 Putative RNA binding protein; localizes to stress granules induced by glucose deprivation; interacts with Rbg1p in a two-hybrid assay; protein abundance increases in response to DNA replication stress -S000031515 CDS YGR250C 7 993521 991176 C 2011-02-03 1996-07-31 -S000003483 ORF Verified YGR251W NOP19 DHI1 chromosome 7 7 995639 996229 W 2011-02-03 1996-07-31 Ribosome biogenesis factor; nucleolar protein associated with pre-rRNA components of the 90S preribosome, required for cleavage of pre-rRNA at A0, A1 and A2 sites; interacts with RNA helicase Dhr2p and RNA helicase-like protein Utp25p; required for incorporation of Utp25p into preribosomes -S000031667 CDS YGR251W 7 995639 996229 W 2011-02-03 1996-07-31 -S000003484 ORF Verified YGR252W GCN5 histone acetyltransferase GCN5|AAS104|KAT2|SWI9|ADA4 chromosome 7 L000000684 7 996869 998188 W 2011-02-03 1996-07-31 Catalytic subunit of ADA and SAGA histone acetyltransferase complexes; modifies N-terminal lysines on histones H2B and H3; acetylates Rsc4p, a subunit of the RSC chromatin-remodeling complex, altering replication stress tolerance; relocalizes to the cytosol in response to hypoxia; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay; greater involvement in repression of RNAPII-dependent transcription than in activation -S000031757 CDS YGR252W 7 996869 998188 W 2011-02-03 1996-07-31 -S000003485 ORF Verified YGR253C PUP2 proteasome core particle subunit alpha 5|DOA5 chromosome 7 L000001531 7 999140 998358 C 2011-02-03 1996-07-31 Alpha 5 subunit of the 20S proteasome; involved in ubiquitin-dependent catabolism; human homolog is subunit zeta -S000031854 CDS YGR253C 7 999140 998358 C 2011-02-03 1996-07-31 -S000118468 ARS ARS734 ARSVII-999 chromosome 7 7 999456 999576 2014-11-18 2014-11-18|2006-08-30|2011-02-03 Autonomously Replicating Sequence -S000178104 ARS_consensus_sequence ARS734 7 999504 999520 W 2014-11-18 2014-11-18 -S000003486 ORF Verified YGR254W ENO1 phosphopyruvate hydratase ENO1|HSP48 chromosome 7 L000000559 7 1000927 1002240 W 2011-02-03 1996-07-31 Enolase I, a phosphopyruvate hydratase; catalyzes conversion of 2-phosphoglycerate to phosphoenolpyruvate during glycolysis and the reverse reaction during gluconeogenesis; expression repressed in response to glucose; protein abundance increases in response to DNA replication stress; N-terminally propionylated in vivo; ENO1 has a paralog, ENO2, that arose from the whole genome duplication -S000032820 CDS YGR254W 7 1000927 1002240 W 2011-02-03 1996-07-31 -S000130168 ARS ARS735 chromosome 7 7 1002239 1002522 2011-02-03 2009-05-07 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay -S000003487 ORF Verified YGR255C COQ6 putative N,N-dimethylaniline monooxygenase COQ6 chromosome 7 L000003876 7 1003962 1002523 C 2011-02-03 1996-07-31 Flavin-dependent monooxygenase involved in ubiquinone biosynthesis; responsible for hydroxylation at position C5 and deamination at C4 during ubiquinone (Coenzyme Q) biosynthesis; localizes to matrix face of mitochondrial inner membrane in a large complex with other ubiquinone biosynthetic enzymes; human homolog COQ6 can complement yeast null mutant and is implicated in steroid-resistant nephrotic syndrome (SRNS) -S000032856 CDS YGR255C 7 1003962 1002523 C 2011-02-03 1996-07-31 -S000006750 tRNA_gene tT(UGU)G2 chromosome 7 L000003839 7 1004216 1004287 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000030915 noncoding_exon tT(UGU)G2 7 1004216 1004287 W 2011-02-03 2000-05-19 -S000003488 ORF Verified YGR256W GND2 phosphogluconate dehydrogenase (decarboxylating) GND2 chromosome 7 L000003352 7 1004624 1006102 W 2011-02-03 1996-07-31 6-phosphogluconate dehydrogenase (decarboxylating); catalyzes an NADPH regenerating reaction in the pentose phosphate pathway; required for growth on D-glucono-delta-lactone; GND2 has a paralog, GND1, that arose from the whole genome duplication -S000033003 CDS YGR256W 7 1004624 1006102 W 2011-02-03 1996-07-31 -S000003489 ORF Verified YGR257C MTM1 chromosome 7 7 1007305 1006205 C 2011-02-03 1996-07-31 Mitochondrial protein of the mitochondrial carrier family; high affinity pyridoxal 5'-phosphate (PLP) transporter, important for delivery of PLP cofactor to mitochondrial enzymes; involved in mitochondrial iron homeostasis and in activating mitochondrial Sod2p by facilitating insertion of an essential manganese cofactor -S000033036 CDS YGR257C 7 1007305 1006205 C 2011-02-03 1996-07-31 -S000003490 ORF Verified YGR258C RAD2 ssDNA endodeoxyribonuclease RAD2 chromosome 7 L000001556 7 1010766 1007671 C 192 2011-02-03 1996-07-31 Single-stranded DNA endonuclease; cleaves single-stranded DNA during nucleotide excision repair to excise damaged DNA; subunit of Nucleotide Excision Repair Factor 3 (NEF3); homolog of human XPG protein -S000033688 CDS YGR258C 7 1010766 1007671 C 2011-02-03 1996-07-31 -S000077075 matrix_attachment_site ETC4 ETC4 chromosome 7 7 1010927 1010949 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; remains predominantly localized to the nuclear periphery throughout cell cycle; located between divergently transcribed genes RAD2 and TNA1 -S000003492 ORF Verified YGR260W TNA1 chromosome 7 7 1012485 1014089 W 2011-02-03 1996-07-31 High affinity nicotinic acid plasma membrane permease; responsible for uptake of low levels of nicotinic acid; expression of the gene increases in the absence of extracellular nicotinic acid or para-aminobenzoate (PABA) -S000034815 CDS YGR260W 7 1012485 1014089 W 2011-02-03 1996-07-31 -S000003491 ORF Dubious YGR259C chromosome 7 7 1012921 1012481 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps almost completely with the verified ORF TNA1/YGR260W -S000033805 CDS YGR259C 7 1012921 1012481 C 2011-02-03 1996-07-31 -S000003493 ORF Verified YGR261C APL6 YKS5 chromosome 7 L000003034 7 1016750 1014321 C 2011-02-03 1996-07-31 Beta3-like subunit of the yeast AP-3 complex; functions in transport of alkaline phosphatase to the vacuole via the alternate pathway; exists in both cytosolic and peripherally associated membrane-bound pools -S000034880 CDS YGR261C 7 1016750 1014321 C 2011-02-03 1996-07-31 -S000003494 ORF Verified YGR262C BUD32 serine/threonine protein kinase BUD32|LDB14 chromosome 7 7 1017759 1016974 C 2011-02-03 1996-07-31 Protein kinase; component of the EKC/KEOPS complex with Kae1p, Cgi121p, Pcc1p, and Gon7p; Pyrococcus Bud32 ortholog functions as a P-loop ATPase rather than a protein kinase in the context of the complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; mutation is functionally complemented by human TP53RK -S000034994 CDS YGR262C 7 1017759 1016974 C 2011-02-03 1996-07-31 -S000003495 ORF Verified YGR263C SAY1 steryl deacetylase chromosome 7 7 1019241 1017967 C 2011-02-03 1996-07-31 Sterol deacetylase; component of the sterol acetylation/deacetylation cycle along with Atf2p; active both in the endoplasmic reticulum (ER) and in lipid droplets; integral membrane protein with active site in the ER lumen; green fluorescent protein (GFP)-fusion protein localizes to the ER -S000035935 CDS YGR263C 7 1019241 1017967 C 2011-02-03 1996-07-31 -S000003497 ORF Dubious YGR265W chromosome 7 7 1021648 1022058 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MES1/YGR264C, which encodes methionyl-tRNA synthetase -S000036929 CDS YGR265W 7 1021648 1022058 W 2011-02-03 1996-07-31 -S000003496 ORF Verified YGR264C MES1 methionine--tRNA ligase MES1|MetRS|MESI chromosome 7 L000001075 7 1021853 1019598 C 204 2011-02-03 1996-07-31 Methionyl-tRNA synthetase; forms a complex with glutamyl-tRNA synthetase (Gus1p) and Arc1p, which increases the catalytic efficiency of both tRNA synthetases; also has a role in nuclear export of tRNAs; mutations in human ortholog MARS are associated with pediatric pulmonary alveolar proteinosis -S000036088 CDS YGR264C 7 1021853 1019598 C 2011-02-03 1996-07-31 -S000003498 ORF Verified YGR266W chromosome 7 7 1022656 1024761 W 2011-02-03 1996-07-31 Protein of unknown function; predicted to contain a single transmembrane domain; mutant has increased aneuploidy tolerance; localized to both the mitochondrial outer membrane and the plasma membrane; protein abundance increases in response to DNA replication stress -S000036991 CDS YGR266W 7 1022656 1024761 W 2011-02-03 1996-07-31 -S000003499 ORF Verified YGR267C FOL2 GTP cyclohydrolase I chromosome 7 L000000621 7 1025735 1025004 C 215 2011-02-03 1996-07-31 GTP-cyclohydrolase I, catalyzes first step in folic acid biosynthesis; human homolog GCH1 is implicated in dopa-responsive dystonia (DRD), and can complement yeast null mutant -S000037019 CDS YGR267C 7 1025735 1025004 C 2011-02-03 1996-07-31 -S000003501 ORF Dubious YGR269W chromosome 7 7 1026636 1026962 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF HUA1/YGR268C -S000029827 CDS YGR269W 7 1026636 1026962 W 2011-02-03 1996-07-31 -S000003500 ORF Verified YGR268C HUA1 chromosome 7 7 1026653 1026057 C 2011-02-03 1996-07-31 Cytoplasmic protein containing a zinc finger domain; sequence similarity to that of Type I J-proteins; computational analysis of large-scale protein-protein interaction data suggests a possible role in actin patch assembly -S000037084 CDS YGR268C 7 1026653 1026057 C 2011-02-03 1996-07-31 -S000003502 ORF Verified YGR270W YTA7 chromosome 7 L000002561 7 1027370 1031509 W 2011-02-03 1996-07-31 Protein that localizes to chromatin; has a role in regulation of histone gene expression; has a bromodomain-like region that interacts with the N-terminal tail of histone H3, and an ATPase domain; relocalizes to the cytosol in response to hypoxia; potentially phosphorylated by Cdc28p -S000030911 CDS YGR270W 7 1027370 1031509 W 2011-02-03 1996-07-31 -S000028641 ORF Dubious YGR270C-A chromosome 7 7 1027600 1027382 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF YTA7/YGR270W -S000032417 CDS YGR270C-A 7 1027600 1027382 C 2011-02-03 2003-07-29 -S000003503 ORF Verified YGR271W SLH1 putative RNA helicase chromosome 7 7 1031791 1037694 W 2011-02-03 1996-07-31|2011-02-03 Putative RNA helicase related to Ski2p; involved in translation inhibition of non-poly(A) mRNAs; required for repressing propagation of dsRNA viruses -S000030983 CDS YGR271W 7 1031791 1037694 W 2011-02-03 1996-07-31|2011-02-03 -S000007608 ORF Verified YGR271C-A EFG1 YGR272C chromosome 7 7 1038501 1037800 C 2011-02-03 2001-02-26|2007-12-11 Essential protein required for maturation of 18S rRNA; null mutant is sensitive to hydroxyurea and is delayed in recovering from alpha-factor arrest; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus -S000037185 CDS YGR271C-A 7 1038501 1037800 C 2011-02-03 2001-02-26|2007-12-11 -S000003505 ORF Uncharacterized YGR273C IBI1 chromosome 7 7 1039239 1038715 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression downregulated by treatment with 8-methoxypsoralen plus UVA irradiation; not an essential gene; YGR273C has a paralog, YMR295C, that arose from the whole genome duplication -S000031075 CDS YGR273C 7 1039239 1038715 C 2011-02-03 1996-07-31 -S000003506 ORF Verified YGR274C TAF1 KAT4|TafII145|TafII130|TAF145|TAF130 chromosome 7 L000002748 7 1043095 1039895 C 2011-02-03 1996-07-31|2011-02-03 TFIID subunit, involved in RNA pol II transcription initiation; possesses in vitro histone acetyltransferase activity but its role in vivo appears to be minor; involved in promoter binding and G1/S progression; relocalizes to the cytosol in response to hypoxia -S000032074 CDS YGR274C 7 1043095 1039895 C 2011-02-03 1996-07-31|2011-02-03 -S000003507 ORF Verified YGR275W RTT102 chromosome 7 L000004851 7 1043276 1043749 W 2011-02-03 2003-09-22|1996-07-31 Component of both the SWI/SNF and RSC chromatin remodeling complexes; suggested role in chromosome maintenance; possible weak regulator of Ty1 transposition; protein abundance increases in response to DNA replication stress -S000032191 CDS YGR275W 7 1043276 1043749 W 2011-02-03 2003-09-22|1996-07-31 -S000003508 ORF Verified YGR276C RNH70 RNA82|REX1 chromosome 7 L000004048 7 1045480 1043819 C 2011-02-03 1996-07-31 3'-5' exoribonuclease; required for maturation of 3' ends of 5S rRNA and tRNA-Arg3 from dicistronic transcripts -S000032221 CDS YGR276C 7 1045480 1043819 C 2011-02-03 1996-07-31 -S000003509 ORF Verified YGR277C CAB4 putative pantetheine-phosphate adenylyltransferase chromosome 7 7 1046561 1045644 C 2011-02-03 1996-07-31 Subunit of the CoA-Synthesizing Protein Complex (CoA-SPC); subunits of this complex are: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p; probable pantetheine-phosphate adenylyltransferase (PPAT); PPAT catalyzes the fourth step in the biosynthesis of coenzyme A from pantothenate; null mutant lethality is complemented by E. coli coaD (encoding PPAT) and by human COASY -S000032280 CDS YGR277C 7 1046561 1045644 C 2011-02-03 1996-07-31 -S000003510 ORF Verified YGR278W CWC22 U2-type spliceosomal complex subunit CWC22 chromosome 7 7 1046731 1048464 W 2011-02-03 1996-07-31 Spliceosome-associated protein that is required for pre-mRNA splicing; necessary for Prp2p function at the first catalytic step of splicing; has similarity to S. pombe Cwf22p; CWC22 is an essential protein -S000033193 CDS YGR278W 7 1046731 1048464 W 2011-02-03 1996-07-31 -S000003511 ORF Verified YGR279C SCW4 putative family 17 glucosidase chromosome 7 L000004565 7 1049958 1048798 C 2011-02-03 1996-07-31 Cell wall protein with similarity to glucanases; scw4 scw10 double mutants exhibit defects in mating; SCW4 has a paralog, SCW10, that arose from the whole genome duplication -S000033219 CDS YGR279C 7 1049958 1048798 C 2011-02-03 1996-07-31 -S000003512 ORF Verified YGR280C PXR1 telomerase inhibitor|PinX1|GNO1 chromosome 7 S000007659 7 1051725 1050910 C 2011-02-03 1996-07-31 Essential protein involved in rRNA and snoRNA maturation; competes with TLC1 RNA for binding to Est2p, suggesting a role in negative regulation of telomerase; human homolog inhibits telomerase; contains a G-patch RNA interacting domain -S000035203 CDS YGR280C 7 1051725 1050910 C 2011-02-03 1996-07-31 -S000003513 ORF Verified YGR281W YOR1 ATP-binding cassette transporter YOR1|YRS1 chromosome 7 L000003083 7 1052824 1057257 W 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; multidrug transporter mediates export of many different organic anions including oligomycin; homolog of human cystic fibrosis transmembrane receptor (CFTR) -S000035335 CDS YGR281W 7 1052824 1057257 W 2011-02-03 1996-07-31 -S000003514 ORF Verified YGR282C BGL2 glucan 1,3-beta-glucosidase|SCW9 chromosome 7 L000000175|S000029440|L000004570 7 1058724 1057783 C 2011-02-03 1996-07-31 Endo-beta-1,3-glucanase; major protein of the cell wall, involved in cell wall maintenance; involved in incorporation of newly synthesized mannoprotein molecules into the cell wall -S000035378 CDS YGR282C 7 1058724 1057783 C 2011-02-03 1996-07-31 -S000003515 ORF Verified YGR283C putative methyltransferase chromosome 7 7 1060040 1059015 C 2011-02-03 1996-07-31 Putative methyltransferase; may interact with ribosomes, based on co-purification experiments; predicted to be involved in ribosome biogenesis; null mutant is resistant to fluconazole; GFP-fusion protein localizes to the nucleolus; YGR283C has a paralog, YMR310C, that arose from the whole genome duplication -S000035443 CDS YGR283C 7 1060040 1059015 C 2011-02-03 1996-07-31 -S000003516 ORF Verified YGR284C ERV29 chromosome 7 7 1061590 1060658 C 2011-02-03 1996-07-31 Protein localized to COPII-coated vesicles; involved in vesicle formation and incorporation of specific secretory cargo; protein abundance increases in response to DNA replication stress -S000036349 CDS YGR284C 7 1061590 1060658 C 2011-02-03 1996-07-31 -S000003517 ORF Verified YGR285C ZUO1 zuotin chromosome 7 L000002571 7 1063153 1061852 C 2011-02-03 1996-07-31 Ribosome-associated chaperone; zuotin functions in ribosome biogenesis and as a chaperone for nascent polypeptide chains in partnership with Ssz1p and SSb1/2; contains a DnaJ domain and functions as a J-protein partner for Ssb1p and Ssb2p; human gene DNAJC2 can partially complement yeast zuo1 null mutant -S000036447 CDS YGR285C 7 1063153 1061852 C 2011-02-03 1996-07-31 -S000003518 ORF Verified YGR286C BIO2 biotin synthase chromosome 7 L000000181 7 1064940 1063813 C 2011-02-03 1996-07-31 Biotin synthase; catalyzes the conversion of dethiobiotin to biotin, which is the last step of the biotin biosynthesis pathway; complements E. coli bioB mutant -S000036536 CDS YGR286C 7 1064940 1063813 C 2011-02-03 1996-07-31 -S000003519 ORF Verified YGR287C IMA1 oligo-1,6-glucosidase IMA1 chromosome 7 7 1068991 1067222 C 2011-02-03 1996-07-31 Major isomaltase (alpha-1,6-glucosidase/alpha-methylglucosidase); required for isomaltose utilization; preferred specificity for isomaltose, alpha-methylglucoside, and palatinose, but also exhibits alpha-1,2 glucosidase activity on sucrose and kojibiose, and can cleave the 1,3-alpha linkage of nigerose and turanose and the alpha-1,5 linkage of leucrose in vitro; member of the IMA isomaltase family -S000036609 CDS YGR287C 7 1068991 1067222 C 2011-02-03 1996-07-31 -S000003520 ORF Verified YGR288W MAL13 transcription factor MAL13|MALR chromosome 7 L000001010 7 1070293 1071714 W 2011-02-03 1996-07-31 MAL-activator protein; part of complex locus MAL1; nonfunctional in genomic reference strain S288C -S000037379 CDS YGR288W 7 1070293 1071714 W 2011-02-03 1996-07-31 -S000003522 ORF Dubious YGR290W chromosome 7 7 1075482 1075925 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; putative HLH protein; partially overlaps the verified ORF MAL11/YGR289C (a high-affinity maltose transporter) -S000030534 CDS YGR290W 7 1075482 1075925 W 2011-02-03 1996-07-31 -S000003521 ORF Verified YGR289C MAL11 alpha-glucoside permease|MALT|AGT1 chromosome 7 L000002978 7 1075813 1073963 C 2011-02-03 1996-07-31 High-affinity maltose transporter (alpha-glucoside transporter); inducible; encoded in the MAL1 complex locus; broad substrate specificity that includes maltotriose; required for isomaltose utilization -S000037432 CDS YGR289C 7 1075813 1073963 C 2011-02-03 1996-07-31 -S000003523 ORF Dubious YGR291C chromosome 7 7 1076504 1076283 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030599 CDS YGR291C 7 1076504 1076283 C 2011-02-03 1996-07-31 -S000003524 ORF Verified YGR292W MAL12 alpha-glucosidase MAL12|MALS chromosome 7 L000001009 7 1076599 1078353 W 226 2011-02-03 1996-07-31 Maltase (alpha-D-glucosidase); inducible protein involved in maltose catabolism; encoded in the MAL1 complex locus; hydrolyzes the disaccharides maltose, turanose, maltotriose, and sucrose -S000030723 CDS YGR292W 7 1076599 1078353 W 2011-02-03 1996-07-31 -S000003526 ORF Verified YGR294W PAU12 seripauperin PAU12 chromosome 7 7 1080306 1080668 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to both the endoplasmic reticulum and vacuole -S000031646 CDS YGR294W 7 1080306 1080668 W 2011-02-03 1996-07-31 -S000003525 ORF Dubious YGR293C chromosome 7 7 1080346 1079885 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YGR294W -S000030754 CDS YGR293C 7 1080346 1079885 C 2011-02-03 1996-07-31 -S000003527 ORF Verified YGR295C COS6 chromosome 7 L000004064 7 1082729 1081584 C 2011-02-03 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000031677 CDS YGR295C 7 1082729 1081584 C 2011-02-03 1996-07-31 -S000028960 telomere TEL07R chromosome 7 7 1083635 1090940 W 231 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome VII; annotated components include an X element core sequence, X element combinatorial repeats, and a long Y' element; TEL07R does have telomeric repeats (TEL07R-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly -S000028961 X_element TEL07R 7 1083635 1084092 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome VII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028962 X_element_combinatorial_repeat TEL07R 7 1084093 1084346 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr VII; contains repeats of the D, C, and B types; formerly called SubTelomeric Repeats -S000028963 Y_prime_element TEL07R 7 1084347 1090940 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome VII; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YRF1-3/YGR296W, YGR296C-A, YGR296C-B) -S000130170 ARS ARS736 chromosome 7 7 1083795 1084863 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000003528 ORF Verified YGR296W YRF1-3 Y' element ATP-dependent helicase protein 1 copy 3|YRF1 chromosome 7 7 1084864 1090591 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p -S000031882 CDS YGR296W 7 1084864 1084882 W 2011-02-03 1996-07-31 -S000031883 CDS YGR296W 7 1085031 1090591 W 2011-02-03 1996-07-31 -S000031884 intron YGR296W 7 1084883 1085030 W 2011-02-03 1996-07-31 -S000028642 ORF Dubious YGR296C-A chromosome 7 7 1089445 1088870 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps TEL07R -S000032418 CDS YGR296C-A 7 1089445 1088870 C 2011-02-03 2003-07-29 -S000028643 ORF Dubious YGR296C-B chromosome 7 7 1090228 1089746 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; contained completely within TEL07R -S000032419 CDS YGR296C-B 7 1090228 1089746 C 2011-02-03 2003-07-29 -S000028644 ORF Dubious YHL050W-A chromosome 8 8 811 1293 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032420 CDS YHL050W-A 8 811 1293 W 2003-07-29 2003-07-29 -S000001042 ORF Uncharacterized YHL050C chromosome 8 8 3311 445 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; potential Cdc28p substrate -S000030583 CDS YHL050C 8 1897 445 C 1996-07-31 1996-07-31 -S000030582 CDS YHL050C 8 3311 2671 C 2011-02-03 1996-07-31 -S000030584 intron YHL050C 8 2670 1898 C 2011-02-03 1996-07-31|2011-02-03 -S000001041 ORF Uncharacterized YHL049C chromosome 8 8 4541 3726 C 2011-02-03 1996-07-31 Putative protein of unknown function -S000031013 CDS YHL049C 8 4541 3726 C 2011-02-03 1996-07-31 -S000130145 ARS ARS801 chromosome 8 8 5471 6401 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028891 telomere TEL08L chromosome 8 8 5505 1 C -40 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the left arm of Chromosome VIII; composed of an X element core sequence, an X element combinatorial repeat, a short Y' element, and a short terminal stretch of telomeric repeats -S000028892 telomeric_repeat TEL08L 8 34 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome VIII -S000028893 X_element TEL08L 8 5505 5052 C 2011-02-03 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome VIII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028894 X_element_combinatorial_repeat TEL08L 8 5051 4952 C 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr VIII; contains a D-type repeat; formerly called SubTelomeric Repeats -S000028895 Y_prime_element TEL08L 8 4951 35 C 2011-02-03 2003-09-09|2011-02-03 Telomeric short Y' element on the left arm of Chromosome VIII; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YHL049C, YHL050C, YHL050W-A) -S000028829 ORF Uncharacterized YHL048C-A chromosome 8 8 5797 5663 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000033659 CDS YHL048C-A 8 5797 5663 C 2011-02-03 2003-07-29 -S000001040 ORF Verified YHL048W COS8 chromosome 8 L000004066 8 6401 7546 W 2011-02-03 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins -S000030997 CDS YHL048W 8 6401 7546 W 2011-02-03 1996-07-31 -S000118356 ARS ARS802 ARSVIII-8 chromosome 8 8 7702 7767 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178105 ARS_consensus_sequence ARS802 8 7755 7739 C 2014-11-18 2014-11-18 -S000006986 long_terminal_repeat YHLComega1 chromosome 8 8 8225 7994 C 2011-02-03 2000-05-19 Ty5 LTR -S000028775 ORF Dubious YHL046W-A chromosome 8 8 9981 10307 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF ARN2/YHL047C -S000033493 CDS YHL046W-A 8 9981 10307 W 2011-02-03 2003-07-29 -S000001039 ORF Verified YHL047C ARN2 siderophore transporter|TAF1 chromosome 8 8 10213 8351 C 2011-02-03 1996-07-31|2011-02-03 Transporter; member of the ARN family of transporters that specifically recognize siderophore-iron chelates; responsible for uptake of iron bound to the siderophore triacetylfusarinine C -S000029944 CDS YHL047C 8 10213 8351 C 2011-02-03 1996-07-31|2011-02-03 -S000001038 ORF Verified YHL046C PAU13 seripauperin PAU13 chromosome 8 8 12285 11923 C 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; expression is induced after ethanol shock; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000029841 CDS YHL046C 8 12285 11923 C 2011-02-03 1996-07-31 -S000001037 ORF Dubious YHL045W chromosome 8 8 12502 12849 W 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential gene -S000037882 CDS YHL045W 8 12502 12849 W 2011-02-03 1996-07-31 -S000001036 ORF Uncharacterized YHL044W DUP240 family protein chromosome 8 8 13565 14272 W 2011-02-03 1996-07-31 Putative integral membrane protein; member of DUP240 gene family; green fluorescent protein (GFP)-fusion protein localizes to the plasma membrane in a punctate pattern -S000037802 CDS YHL044W 8 13565 14272 W 2011-02-03 1996-07-31 -S000001035 ORF Verified YHL043W ECM34 chromosome 8 L000003903 8 14901 15413 W 2011-02-03 1996-07-31 Protein of unknown function; member of the DUP380 subfamily of conserved, often subtelomerically-encoded proteins; SWAT-GFP, seamless-GFP and mCherry C-terminal fusion proteins localize to the cytosol -S000035918 CDS YHL043W 8 14901 15413 W 2011-02-03 1996-07-31 -S000001034 ORF Uncharacterized YHL042W chromosome 8 8 15667 16119 W 2011-02-03 1996-07-31 Protein of unknown function; member of the DUP380 subfamily of conserved, often subtelomerically-encoded proteins; SWAT-GFP and mCherry fusion proteins localize to the vacuole -S000035803 CDS YHL042W 8 15667 16119 W 2011-02-03 1996-07-31 -S000001033 ORF Dubious YHL041W chromosome 8 8 17392 17841 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035678 CDS YHL041W 8 17392 17841 W 2011-02-03 1996-07-31 -S000001032 ORF Verified YHL040C ARN1 siderophore transporter chromosome 8 8 20971 19088 C 2011-02-03 1996-07-31 ARN family transporter for siderophore-iron chelates; responsible for uptake of iron bound to ferrirubin, ferrirhodin, and related siderophores; protein increases in abundance and relocalizes to the vacuole upon DNA replication stress -S000034609 CDS YHL040C 8 20971 19088 C 2011-02-03 1996-07-31 -S000001031 ORF Verified YHL039W EFM1 protein-lysine N-methyltransferase chromosome 8 8 21783 23540 W 2011-02-03 1996-07-31 Lysine methyltransferase; involved in the monomethylation of eEF1A (Tef1p/Tef2p); SET-domain family member; predicted involvement in ribosome biogenesis; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm -S000036027 CDS YHL039W 8 21783 23540 W 2011-02-03 1996-07-31 -S000001030 ORF Verified YHL038C CBP2 chromosome 8 L000000225 8 25509 23617 C 2011-02-03 1996-07-31 Required for splicing of the group I intron bI5 of the COB pre-mRNA; nuclear-encoded mitochondrial protein that binds to the RNA to promote splicing; also involved in but not essential for splicing of the COB bI2 intron and the intron in the 21S rRNA gene -S000035079 CDS YHL038C 8 25509 23617 C 2011-02-03 1996-07-31 -S000001029 ORF Dubious YHL037C chromosome 8 8 26179 25778 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034940 CDS YHL037C 8 26179 25778 C 2011-02-03 1996-07-31|2011-02-03 -S000001028 ORF Verified YHL036W MUP3 chromosome 8 L000003357 8 26241 27881 W 2011-02-03 1996-07-31 Low affinity methionine permease; similar to Mup1p -S000034885 CDS YHL036W 8 26241 27881 W 2011-02-03 1996-07-31 -S000001027 ORF Verified YHL035C VMR1 putative ATP-binding cassette multidrug transporter VMR1 chromosome 8 8 32756 27978 C 2011-02-03 1996-07-31 Vacuolar membrane protein; involved in multiple drug resistance and metal sensitivity; ATP-binding cassette (ABC) family member involved in drug transport; potential Cdc28p substrate; induced under respiratory conditions; VMR1 has a paralog, YBT1, that arose from the whole genome duplication -S000033937 CDS YHL035C 8 32756 27978 C 2011-02-03 1996-07-31 -S000028774 ORF Dubious YHL034W-A chromosome 8 8 33176 33637 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SBP1/YHL034C -S000033492 CDS YHL034W-A 8 33176 33637 W 2011-02-03 2003-07-29 -S000001026 ORF Verified YHL034C SBP1 SSB1|SSBR1 chromosome 8 L000002628|L000002076 8 34077 33193 C 2011-02-03 1996-07-31 Protein that binds eIF4G and has a role in repression of translation; has an RGG motif; found in cytoplasmic P bodies; binds to mRNAs under glucose starvation stress, most often in the 5' UTR; found associated with small nucleolar RNAs snR10 and snR11; SBP1 has a paralog, RNP1, that arose from the whole genome duplication -S000033834 CDS YHL034C 8 34077 33193 C 2011-02-03 1996-07-31 -S000001025 ORF Verified YHL033C RPL8A eL8|ribosomal 60S subunit protein L8A|L8e|rp6|YL5|L8A|L4A|MAK7 chromosome 8 L000000981|L000001704 8 36025 35255 C -38 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L8A; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; L8 binds to Domain I of 25S and 5.8 S rRNAs; mutation results in decreased amounts of free 60S subunits; homologous to mammalian ribosomal protein L7A, no bacterial homolog; RPL8A has a paralog, RPL8B, that arose from the whole genome duplication -S000033669 CDS YHL033C 8 36025 35255 C 2011-02-03 1996-07-31 -S000001024 ORF Verified YHL032C GUT1 glycerol kinase chromosome 8 L000000746 8 38508 36379 C 2011-02-03 1996-07-31 Glycerol kinase; converts glycerol to glycerol-3-phosphate; glucose repression of expression is mediated by Adr1p and Ino2p-Ino4p; derepression of expression on non-fermentable carbon sources is mediated by Opi1p and Rsf1p -S000030379 CDS YHL032C 8 38508 36379 C 2011-02-03 1996-07-31 -S000028773 ORF Dubious YHL030W-A chromosome 8 8 39074 39535 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene GOS1/YHL031C -S000033490 CDS YHL030W-A 8 39074 39535 W 2011-02-03 2003-07-29 -S000001023 ORF Verified YHL031C GOS1 chromosome 8 L000004085 8 39486 38815 C 2011-02-03 1996-07-31 v-SNARE protein involved in Golgi transport; homolog of the mammalian protein GOS-28/GS28 -S000030199 CDS YHL031C 8 39486 38815 C 2011-02-03 1996-07-31 -S000001022 ORF Verified YHL030W ECM29 chromosome 8 L000003899 8 40084 45690 W 2011-02-03 1996-07-31 Scaffold protein; assists in association of the proteasome core particle with the regulatory particle; inhibits proteasomal ATPase activity; degraded by the mature proteasome after assembly; contains HEAT-like repeats; protein increases in abundance and relocalizes from nucleus to cytoplasm upon DNA replication stress -S000030143 CDS YHL030W 8 40084 45690 W 2011-02-03 1996-07-31 -S000001021 ORF Uncharacterized YHL029C OCA5 chromosome 8 8 47968 45929 C 2011-02-03 1996-07-31 Cytoplasmic protein required for replication of Brome mosaic virus; S. cerevisiae is a model system for studying replication of positive-strand RNA viruses in their natural hosts -S000030645 CDS YHL029C 8 47968 45929 C 2011-02-03 1996-07-31 -S000001020 ORF Verified YHL028W WSC4 YFW1|YHC8 chromosome 8 L000004219 8 48763 50580 W 2011-02-03 1996-07-31 Endoplasmic reticulum (ER) membrane protein; involved in the translocation of soluble secretory proteins and insertion of membrane proteins into the ER membrane; may also have a role in the stress response but has only partial functional overlap with WSC1-3 -S000030604 CDS YHL028W 8 48763 50580 W 2011-02-03 1996-07-31 -S000001019 ORF Verified YHL027W RIM101 alkaline-responsive transcriptional regulator RIM101|RIM1 chromosome 8 L000002818 8 51111 52988 W 2011-02-03 1996-07-31 Cys2His2 zinc-finger transcriptional repressor; involved in alkaline responsive gene repression as part of adaptation to alkaline conditions; involved in cell wall assembly; required for alkaline pH-stimulated haploid invasive growth and sporulation; activated by alkaline-dependent proteolytic processing which results in removal of the C-terminal tail; similar to A. nidulans PacC -S000030530 CDS YHL027W 8 51111 52988 W 2011-02-03 1996-07-31 -S000001018 ORF Uncharacterized YHL026C chromosome 8 8 54166 53219 C 2011-02-03 1996-07-31|2005-11-07 Putative protein of unknown function; transcriptionally regulated by Upc2p via an upstream sterol response element; SWAT-GFP fusion protein localizes to the cell periphery, while mCherry fusion localizes to both the cell periphery and vacuole; YHL026C is not an essential gene; in 2005 the start site was moved 141 nt upstream (see Locus History) -S000037665 CDS YHL026C 8 54166 53219 C 2011-02-03 1996-07-31|2005-11-07 -S000001017 ORF Verified YHL025W SNF6 chromosome 8 L000001949 8 54851 55849 W 2011-02-03 1996-07-31 Subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; functions interdependently in transcriptional activation with Snf2p and Snf5p; relocates to the cytosol under hypoxic conditions -S000037635 CDS YHL025W 8 54851 55849 W 2011-02-03 1996-07-31 -S000001016 ORF Verified YHL024W RIM4 chromosome 8 L000004288|L000004795 8 56649 58790 W 2011-02-03 1996-07-31 Putative RNA-binding protein; required for the expression of early and middle sporulation genes -S000037557 CDS YHL024W 8 56649 58790 W 2011-02-03 1996-07-31 -S000001015 ORF Verified YHL023C NPR3 RMD11 chromosome 8 8 62563 59123 C 2011-02-03 1996-07-31 Subunit of the Iml1p/SEACIT complex; SEACIT (Iml1p-Npr2p-Npr3p) is a subcomplex of SEAC, a coatomer-related complex that associates dynamically with the vacuole; Npr3p may have a structural or regulatory role, supporting Iml1p function as a GAP for the Rag family GTPase Gtr1p, and leading to inhibition of TORC1 signaling in response to amino acid deprivation; SEACIT is required for non-nitrogen-starvation-induced autophagy; null mutant has meiotic defects; human NPRL3 homolog -S000037421 CDS YHL023C 8 62563 59123 C 2011-02-03 1996-07-31 -S000006597 tRNA_gene tH(GUG)H chromosome 8 L000003855 8 62755 62826 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis -S000033884 noncoding_exon tH(GUG)H 8 62755 62826 W 2011-02-03 2000-05-19 -S000001014 ORF Verified YHL022C SPO11 chromosome 8 L000002002 8 64157 62961 C -23 2011-02-03 1996-07-31 Meiosis-specific protein that initiates meiotic recombination; initiates meiotic recombination by catalyzing the formation of double-strand breaks in DNA via a transesterification reaction; required for homologous chromosome pairing and synaptonemal complex formation -S000031919 CDS YHL022C 8 64157 62961 C 2011-02-03 1996-07-31 -S000114849 ARS ARS805 ARS805 ARSVIII-64|SPO11 ARS chromosome 8 8 64296 64371 2014-11-18 2014-11-18|2006-04-13|2006-09-07|2011-02-03 Autonomously Replicating Sequence -S000178106 ARS_consensus_sequence ARS805 8 64299 64315 W 2014-11-18 2014-11-18 -S000001013 ORF Verified YHL021C AIM17 FMP12 chromosome 8 8 65859 64462 C 2011-02-03 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays reduced frequency of mitochondrial genome loss -S000031775 CDS YHL021C 8 65859 64462 C 2011-02-03 1996-07-31 -S000001012 ORF Verified YHL020C OPI1 transcriptional regulator OPI1 chromosome 8 L000001303 8 67456 66242 C 2011-02-03 1996-07-31 Transcriptional regulator of a variety of genes; phosphorylation by protein kinase A stimulates Opi1p function in negative regulation of phospholipid biosynthetic genes; involved in telomere maintenance; null exhibits disrupted mitochondrial metabolism and low cardiolipin content, strongly correlated with overproduction of inositol; binds to phosphatidic acid -S000029857 CDS YHL020C 8 67456 66242 C 2011-02-03 1996-07-31 -S000028772 ORF Dubious YHL019W-A chromosome 8 8 67711 68304 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene APM2/YHL019C -S000033486 CDS YHL019W-A 8 67711 68304 W 2011-02-03 2003-07-29 -S000001011 ORF Verified YHL019C APM2 chromosome 8 L000000095 8 69548 67731 C 2011-02-03 1996-07-31 Protein of unknown function; homologous to the medium chain of mammalian clathrin-associated protein complex; involved in vesicular transport -S000035353 CDS YHL019C 8 69548 67731 C 2011-02-03 1996-07-31 -S000001010 ORF Uncharacterized YHL018W 4a-hydroxytetrahydrobiopterin dehydratase chromosome 8 8 69708 70070 W 2011-02-03 1996-07-31 Putative 4a-hydroxytetrahydrobiopterin dehydratase; green fluorescent protein (GFP)-fusion protein localizes to mitochondria and is induced in response to the DNA-damaging agent MMS -S000035323 CDS YHL018W 8 69708 70070 W 2011-02-03 1996-07-31 -S000001009 ORF Uncharacterized YHL017W chromosome 8 8 70276 71874 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein co-localizes with clathrin-coated vesicles; YHL017W has a paralog, PTM1, that arose from the whole genome duplication -S000035245 CDS YHL017W 8 70276 71874 W 2011-02-03 1996-07-31 -S000001008 ORF Verified YHL016C DUR3 chromosome 8 L000000534 8 74244 72037 C -13 2011-02-03 1996-07-31 Plasma membrane transporter for both urea and polyamines; expression is highly sensitive to nitrogen catabolite repression and induced by allophanate, the last intermediate of the allantoin degradative pathway -S000034197 CDS YHL016C 8 74244 72037 C 2011-02-03 1996-07-31 -S000028828 ORF Uncharacterized YHL015W-A chromosome 8 8 74699 74782 W 2011-02-03 2003-07-29 Putative protein of unknown function -S000033654 CDS YHL015W-A 8 74699 74782 W 2011-02-03 2003-07-29 -S000001007 ORF Verified YHL015W RPS20 uS10|ribosomal 40S subunit protein S20|S10|URP2 chromosome 8 L000002442 8 75412 75777 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; overproduction suppresses mutations affecting RNA polymerase III-dependent transcription; homologous to mammalian ribosomal protein S20 and bacterial S10 -S000034165 CDS YHL015W 8 75412 75777 W 2011-02-03 1996-07-31 -S000001006 ORF Verified YHL014C YLF2 YLF1 chromosome 8 L000002519 8 77314 76097 C 2011-02-03 1996-07-31 Protein of unknown function; has weak similarity to E. coli GTP-binding protein gtp1; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000034003 CDS YHL014C 8 77314 76097 C 2011-02-03 1996-07-31 -S000001005 ORF Verified YHL013C OTU2 chromosome 8 8 78353 77430 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; member of the ovarian tumor-like (OTU) superfamily of predicted cysteine proteases; shows cytoplasmic localization; protein abundance increases in response to DNA replication stress -S000033190 CDS YHL013C 8 78353 77430 C 2011-02-03 1996-07-31 -S000001004 ORF Uncharacterized YHL012W UTP--glucose-1-phosphate uridylyltransferase chromosome 8 8 78936 80417 W 2011-02-03 1996-07-31 Putative UTP glucose-1-phosphate uridylyltransferase; YHL012W has a paralog, UGP1, that arose from the whole genome duplication -S000033163 CDS YHL012W 8 78936 80417 W 2011-02-03 1996-07-31 -S000001003 ORF Verified YHL011C PRS3 ribose phosphate diphosphokinase subunit PRS3 chromosome 8 L000001514 8 81616 80654 C 2011-02-03 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase; synthesizes PRPP, which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes -S000033025 CDS YHL011C 8 81616 80654 C 2011-02-03 1996-07-31 -S000001002 ORF Verified YHL010C ETP1 BRP2 chromosome 8 8 83721 81964 C 2011-02-03 1996-07-31 Protein of unknown function required for growth on ethanol; contains a zinc finger region and has homology to human BRAP2, which is a cytoplasmic protein that binds nuclear localization sequences -S000032099 CDS YHL010C 8 83721 81964 C 2011-02-03 1996-07-31 -S000001001 ORF Verified YHL009C YAP3 chromosome 8 L000004382 8 85060 84068 C 2011-02-03 1996-07-31 Basic leucine zipper (bZIP) transcription factor -S000030991 CDS YHL009C 8 85060 84068 C 2011-02-03 1996-07-31 -S000006758 tRNA_gene tV(AAC)H chromosome 8 L000003865 8 85371 85298 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000032130 noncoding_exon tV(AAC)H 8 85371 85298 C 2011-02-03 2000-05-19 -S000006987 long_terminal_repeat YHLCsigma1 chromosome 8 8 85538 85388 C 2011-02-03 2000-05-19 Ty3 LTR -S000006989 long_terminal_repeat YHLWtau1 chromosome 8 8 85539 85909 W 2011-02-03 2000-05-19 Ty4 LTR -S000006991 LTR_retrotransposon YHLWTy4-1 Ty4 chromosome 8 8 85539 91761 W 2011-02-03 2000-05-19 Ty4 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007371 transposable_element_gene YHL009W-A gag protein chromosome 8 8 85909 87150 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000032880 CDS YHL009W-A 8 85909 87150 W 2011-02-03 1999-07-17 -S000007372 transposable_element_gene YHL009W-B gag-pol fusion protein chromosome 8 S000029015 8 85909 91318 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000032882 CDS YHL009W-B 8 85909 86994 W 2011-02-03 1999-07-17 -S000032883 CDS YHL009W-B 8 86996 91318 W 2011-02-03 1999-07-17 -S000032884 plus_1_translational_frameshift YHL009W-B 8 86995 86995 W 2011-02-03 1999-07-17 -S000006990 long_terminal_repeat YHLWtau2 chromosome 8 8 91391 91761 W 2011-02-03 2000-05-19 Ty4 LTR -S000006985 long_terminal_repeat YHLCdelta1 chromosome 8 8 92099 91772 C 2011-02-03 2000-05-19 Ty1 LTR -S000006988 long_terminal_repeat YHLWdelta2 chromosome 8 8 92240 92390 W 2011-02-03 2000-05-19 Ty1 LTR -S000001000 ORF Uncharacterized YHL008C chromosome 8 8 94510 92627 C 2011-02-03 1996-07-31 Putative protein of unknown function; may be involved in the uptake of chloride ions; does not appear to be involved in monocarboxylic acid transport; green fluorescent protein (GFP)-fusion protein localizes to the vacuole -S000030923 CDS YHL008C 8 94510 92627 C 2011-02-03 1996-07-31 -S000028771 ORF Dubious YHL006W-A chromosome 8 8 97732 98085 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF STE20/YHL007C -S000033485 CDS YHL006W-A 8 97732 98085 W 2011-02-03 2003-07-29 -S000000999 ORF Verified YHL007C STE20 mitogen-activated protein kinase kinase kinase kinase STE20 chromosome 8 L000002123 8 97937 95118 C 2011-02-03 1996-07-31 Cdc42p-activated signal transducing kinase; involved in pheromone response, pseudohyphal/invasive growth, vacuole inheritance, down-regulation of sterol uptake; GBB motif binds Ste4p; member of the PAK (p21-activated kinase) family -S000030840 CDS YHL007C 8 97937 95118 C 2011-02-03 1996-07-31 -S000000998 ORF Verified YHL006C SHU1 chromosome 8 8 98795 98343 C 2011-02-03 2004-01-29|1996-07-31 Component of Shu complex (aka PCSS complex); Shu complex also includes Psy3, Csm2, Shu2, and promotes error-free DNA repair, mediates inhibition of Srs2p function; essential for promoting the establishment of homolog bias during meiotic homologous recombination; promotes both crossover (CO) and non-crossover (NCO) pathways of meiotic recombination and formation of Rad51p filaments -S000029837 CDS YHL006C 8 98795 98343 C 2011-02-03 2004-01-29|1996-07-31 -S000000996 ORF Verified YHL004W MRP4 mitochondrial 37S ribosomal protein MRP4 chromosome 8 L000001154 8 99219 100403 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit -S000037796 CDS YHL004W 8 99219 100403 W 2011-02-03 1996-07-31 -S000000997 ORF Uncharacterized YHL005C chromosome 8 8 99220 98828 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YHL005C is not an essential gene -S000037818 CDS YHL005C 8 99220 98828 C 2011-02-03 1996-07-31 -S000000995 ORF Verified YHL003C LAG1 sphingosine N-acyltransferase LAG1 chromosome 8 L000000928 8 101883 100648 C 2011-02-03 1996-07-31 Ceramide synthase component; involved in synthesis of ceramide from C26(acyl)-coenzyme A and dihydrosphingosine or phytosphingosine, functionally equivalent to Lac1p; forms ER foci upon DNA replication stress; homolog of human CERS2, a tumor metastasis suppressor gene whose silencing enhances invasion/metastasis of prostate cancer cells; LAG1 has a paralog, LAC1, that arose from the whole genome duplication -S000036974 CDS YHL003C 8 101883 100648 C 2011-02-03 1996-07-31 -S000000994 ORF Verified YHL002W HSE1 ESCRT-0 subunit protein HSE1 chromosome 8 8 102612 103970 W 2011-02-03 1996-07-31 Subunit of the endosomal Vps27p-Hse1p complex; complex is required for sorting of ubiquitinated membrane proteins into intralumenal vesicles prior to vacuolar degradation, as well as for recycling of Golgi proteins and formation of lumenal membranes -S000036957 CDS YHL002W 8 102612 103970 W 2011-02-03 1996-07-31 -S000028770 ORF Dubious YHL002C-A chromosome 8 8 103075 102587 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF HSE1/YHL002W -S000033484 CDS YHL002C-A 8 103075 102587 C 2011-02-03 2003-07-29 -S000000993 ORF Verified YHL001W RPL14B eL14|ribosomal 60S subunit protein L14B|L14e|L14B chromosome 8 L000002707 8 104277 105091 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L14B; homologous to mammalian ribosomal protein L14, no bacterial homolog; RPL14B has a paralog, RPL14A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000036892 CDS YHL001W 8 104277 104405 W 2011-02-03 1996-07-31 -S000036893 CDS YHL001W 8 104804 105091 W 2011-02-03 1996-07-31 -S000036894 intron YHL001W 8 104406 104803 W 2011-02-03 1996-07-31 -S000006469 centromere CEN8 CEN8 chromosome 8 L000000301 8 105703 105586 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome VIII centromere -S000077284 centromere_DNA_Element_I CEN8 8 105703 105694 C 2011-02-03 2004-10-08 -S000077285 centromere_DNA_Element_II CEN8 8 105693 105611 C 2011-02-03 2004-10-08 -S000077286 centromere_DNA_Element_III CEN8 8 105610 105586 C 2011-02-03 2004-10-08 -S000001043 ORF Verified YHR001W OSH7 oxysterol-binding protein related protein OSH7 chromosome 8 8 106055 107368 W 2011-02-03 1996-07-31 Oxysterol-binding protein; part of family with seven members in S. cerevisiae; family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; OSH7 has a paralog, OSH6, that arose from the whole genome duplication -S000033353 CDS YHR001W 8 106055 107368 W 2011-02-03 1996-07-31 -S000003529 ORF Verified YHR001W-A QCR10 ubiquinol--cytochrome-c reductase subunit 10 chromosome 8 L000001550 8 107826 108122 W 2011-02-03 1996-07-31 Subunit of the ubiqunol-cytochrome c oxidoreductase complex; this complex comprises part of the mitochondrial respiratory chain; members include Cobp, Rip1p, Cyt1p, Cor1p, Qcr2p, Qcr6p, Qcr7p, Qcr8p, Qcr9p, and Qcr10p and comprises part of the mitochondrial respiratory chain -S000035662 CDS YHR001W-A 8 107826 107831 W 2011-02-03 1996-07-31 -S000035663 CDS YHR001W-A 8 107895 108122 W 2011-02-03 1996-07-31 -S000035664 intron YHR001W-A 8 107832 107894 W 2011-02-03 1996-07-31 -S000001044 ORF Verified YHR002W LEU5 coenzyme A transporter chromosome 8 L000000946 8 108812 109885 W 0 2011-02-03 1996-07-31 Mitochondrial carrier protein; involved in the accumulation of CoA in the mitochondrial matrix; homolog of human Graves disease protein SLC25A16, which complements yeast null mutant; does not encode an isozyme of Leu4p, as first hypothesized -S000034263 CDS YHR002W 8 108812 109885 W 2011-02-03 1996-07-31 -S000001045 ORF Verified YHR003C TCD1 tRNA threonylcarbamoyladenosine dehydratase chromosome 8 8 111317 110028 C 2011-02-03 1996-07-31 tRNA threonylcarbamoyladenosine dehydratase; required for the ct6A tRNA base modification, where an adenosine at position 37 is modified to form a cyclized active ester with an oxazolone ring; localized to the mitochondrial outer membrane; TCD1 has a paralog, TCD2, that arose from the whole genome duplication -S000034299 CDS YHR003C 8 111317 110028 C 2011-02-03 1996-07-31 -S000001046 ORF Verified YHR004C NEM1 Nem1-Spo7 phosphatase catalytic subunit NEM1 chromosome 8 8 113094 111754 C 2011-02-03 1996-07-31 Probable catalytic subunit of Nem1p-Spo7p phosphatase holoenzyme; regulates nuclear growth by controlling phospholipid biosynthesis, required for normal nuclear envelope morphology and sporulation; homolog of the human protein Dullard -S000034400 CDS YHR004C 8 113094 111754 C 2011-02-03 1996-07-31 -S000001047 ORF Verified YHR005C GPA1 guanine nucleotide-binding protein subunit alpha|SCG1|DAC1|CDC70 chromosome 8 L000000720 8 114917 113499 C 3 2011-02-03 1996-07-31 Subunit of the G protein involved in pheromone response; GTP-binding alpha subunit of the heterotrimeric G protein; negatively regulates the mating pathway by sequestering G(beta)gamma and by triggering an adaptive response; activates Vps34p at the endosome; protein abundance increases in response to DNA replication stress -S000034477 CDS YHR005C 8 114917 113499 C 2011-02-03 1996-07-31 -S000003530 ORF Verified YHR005C-A TIM10 protein transporter TIM10|MRS11 chromosome 8 L000003574 8 115901 115620 C 2011-02-03 1999-07-17 Essential protein of the mitochondrial intermembrane space; forms a complex with Tim9p (TIM10 complex) that delivers hydrophobic proteins to the TIM22 complex for insertion into the inner membrane -S000033460 CDS YHR005C-A 8 115901 115620 C 2011-02-03 1999-07-17 -S000006740 tRNA_gene tT(AGU)H chromosome 8 L000003864 8 116179 116107 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000032165 noncoding_exon tT(AGU)H 8 116179 116107 C 2011-02-03 2000-05-19 -S000130146 ARS ARS806 chromosome 8 8 116179 116421 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006992 long_terminal_repeat YHRCdelta3 chromosome 8 8 116752 116421 C 2011-02-03 2000-05-19 Ty1 LTR -S000006993 long_terminal_repeat YHRCdelta4 chromosome 8 8 117061 116763 C 2011-02-03 2000-05-19 Ty1 LTR -S000001048 ORF Verified YHR006W STP2 chromosome 8 L000003370 8 117814 119439 W 2011-02-03 1996-07-31 Transcription factor; activated by proteolytic processing in response to signals from the SPS sensor system for external amino acids; activates transcription of amino acid permease genes; STP2 has a paralog, STP1, that arose from the whole genome duplication -S000035553 CDS YHR006W 8 117814 119439 W 2011-02-03 1996-07-31 -S000001049 ORF Verified YHR007C ERG11 sterol 14-demethylase|CYP51 chromosome 8 L000000577 8 121683 120091 C 12 2011-02-03 1996-07-31 Lanosterol 14-alpha-demethylase; catalyzes C-14 demethylation of lanosterol to form 4,4''-dimethyl cholesta-8,14,24-triene-3-beta-ol in ergosterol biosynthesis pathway; transcriptionally down-regulated when ergosterol is in excess; member of cytochrome P450 family; associated and coordinately regulated with the P450 reductase Ncp1p; human CYP51A1 functionally complements the lethality of the erg11 null mutation -S000035603 CDS YHR007C 8 121683 120091 C 2011-02-03 1996-07-31 -S000028830 ORF Uncharacterized YHR007C-A chromosome 8 8 122765 122550 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry; SWAT-GFP fusion protein localizes to the nucleus -S000034480 CDS YHR007C-A 8 122765 122550 C 2011-02-03 2003-07-29 -S000001050 ORF Verified YHR008C SOD2 superoxide dismutase SOD2 chromosome 8 L000001979 8 123590 122889 C 12 2011-02-03 1996-07-31 Mitochondrial manganese superoxide dismutase; protects cells against oxygen toxicity and oxidative stress; human mitochondrial SOD2 can complement a yeast null mutant and human cytoplasmic SOD1 can also complement when targeted to the mitochondrial matrix -S000035694 CDS YHR008C 8 123590 122889 C 2011-02-03 1996-07-31 -S000001051 ORF Verified YHR009C TDA3 BTN3 chromosome 8 8 125680 124109 C 2011-02-03 1996-07-31 Putative oxidoreductase involved in late endosome to Golgi transport; physical and genetical interactions with Btn2p; null mutant is viable, has extended S phase, and sensitive to expression of top1-T722A allele; similar to human FOXRED1 -S000036628 CDS YHR009C 8 125680 124109 C 2011-02-03 1996-07-31 -S000001052 ORF Verified YHR010W RPL27A eL27|ribosomal 60S subunit protein L27A|L27e|L27A|RPL27 chromosome 8 L000002708 8 126521 127492 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L27A; homologous to mammalian ribosomal protein L27, no bacterial homolog; RPL27A has a paralog, RPL27B, that arose from the whole genome duplication -S000036518 CDS YHR010W 8 126521 126551 W 2011-02-03 1996-07-31 -S000036519 CDS YHR010W 8 127113 127492 W 2011-02-03 1996-07-31 -S000036520 intron YHR010W 8 126552 127112 W 2011-02-03 1996-07-31 -S000001053 ORF Verified YHR011W DIA4 putative serine--tRNA ligase DIA4 chromosome 8 8 127780 129120 W 2011-02-03 1996-07-31 Probable mitochondrial seryl-tRNA synthetase; mutant displays increased invasive and pseudohyphal growth -S000036641 CDS YHR011W 8 127780 129120 W 2011-02-03 1996-07-31 -S000001054 ORF Verified YHR012W VPS29 retromer subunit VPS29|VPT6|PEP11 chromosome 8 L000002840 8 129481 130448 W 2011-02-03 1996-07-31 Subunit of the membrane-associated retromer complex; endosomal protein; essential for endosome-to-Golgi retrograde transport; forms a subcomplex with Vps35p and Vps26p that selects cargo proteins for endosome-to-Golgi retrieval -S000036738 CDS YHR012W 8 129481 129528 W 2011-02-03 1996-07-31 -S000036739 CDS YHR012W 8 129648 130448 W 2011-02-03 1996-07-31 -S000036740 intron YHR012W 8 129529 129647 W 2011-02-03 1996-07-31 -S000001055 ORF Verified YHR013C ARD1 peptide alpha-N-acetyltransferase complex A subunit ARD1|NAA10 chromosome 8 L000000103 8 131446 130730 C 10 2011-02-03 1996-07-31 Subunit of protein N-terminal acetyltransferase NatA; NatA comprises Nat1p, Ard1p, Nat5p; acetylates many proteins to influence telomeric silencing, cell cycle, heat-shock resistance, mating, sporulation, early stages of mitophagy; protein abundance increases under DNA replication stress; mutations in human homolog X-linked NAA10 lead to Ogden syndrome (S37P) and intellectual disability (R116W); expression of human NAA10 and NAA15 can complement ard1 nat1 double mutant -S000037391 CDS YHR013C 8 131446 130730 C 2011-02-03 1996-07-31 -S000001056 ORF Verified YHR014W SPO13 chromosome 8 L000002004 8 132047 132922 W 11 2011-02-03 1996-07-31 Meiotic regulator; involved in maintaining sister chromatid cohesion during meiosis I as well as promoting proper attachment of kinetochores to the spindle during meiosis I and meiosis II; anaphase-promoting complex (APC) substrate that is degraded during anaphase I; expressed only in meiotic cells -S000037600 CDS YHR014W 8 132047 132922 W 2011-02-03 1996-07-31 -S000006726 tRNA_gene tS(AGA)H chromosome 8 L000003863 8 133107 133026 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis -S000032372 noncoding_exon tS(AGA)H 8 133107 133026 C 2011-02-03 2000-05-19 -S000118357 ARS ARS807 ARSVIII-134 chromosome 8 8 133438 133539 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178107 ARS_consensus_sequence ARS807 8 133530 133514 C 2014-11-18 2014-11-18 -S000006994 long_terminal_repeat YHRCdelta5 chromosome 8 8 133442 133201 C 2011-02-03 2000-05-19 Ty1 LTR -S000006995 long_terminal_repeat YHRCdelta6 chromosome 8 8 133684 133565 C 2011-02-03 2000-05-19 Ty1 LTR -S000007007 long_terminal_repeat YHRWdelta7 chromosome 8 8 133685 134009 W 2011-02-03 2000-05-19 Ty1 LTR -S000006698 tRNA_gene tQ(UUG)H chromosome 8 L000003856 8 134321 134392 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000031701 noncoding_exon tQ(UUG)H 8 134321 134392 W 2011-02-03 2000-05-19 -S000001057 ORF Verified YHR015W MIP6 chromosome 8 L000004334 8 134554 136533 W 2011-02-03 1996-07-31 Putative RNA-binding protein; interacts with Mex67p, which is a component of the nuclear pore involved in nuclear mRNA export; MIP6 has a paralog, PES4, that arose from the whole genome duplication -S000030365 CDS YHR015W 8 134554 136533 W 2011-02-03 1996-07-31 -S000001058 ORF Verified YHR016C YSC84 LSB4 chromosome 8 L000003175 8 138455 136881 C 2011-02-03 1996-07-31 Actin-binding protein; involved in bundling of actin filaments and endocytosis of actin cortical patches; activity stimulated by Las17p; contains SH3 domain similar to Rvs167p; YSC84 has a paralog, LSB3, that arose from the whole genome duplication -S000030436 CDS YHR016C 8 138240 136881 C 2011-02-03 1996-07-31 -S000030435 CDS YHR016C 8 138455 138409 C 2011-02-03 1996-07-31 -S000030437 intron YHR016C 8 138408 138241 C 2011-02-03 1996-07-31 -S000001059 ORF Verified YHR017W YSC83 chromosome 8 L000002830 8 138694 139851 W 2011-02-03 1996-07-31 Non-essential mitochondrial protein of unknown function; mRNA induced during meiosis, peaking between mid to late prophase of meiosis I; similar to S. douglasii YSD83 -S000030626 CDS YHR017W 8 138694 139851 W 2011-02-03 1996-07-31 -S000029042 ARS ARS808 ARS2 chromosome 8 L000000122 8 140349 141274 2011-02-03 2006-04-13 Autonomously Replicating Sequence -S000001060 ORF Verified YHR018C ARG4 argininosuccinate lyase ARG4 chromosome 8 L000000109 8 141402 140011 C 12 2011-02-03 1996-07-31 Argininosuccinate lyase; catalyzes the final step in the arginine biosynthesis pathway -S000030670 CDS YHR018C 8 141402 140011 C 2011-02-03 1996-07-31 -S000001061 ORF Verified YHR019C DED81 asparagine--tRNA ligase DED81 chromosome 8 L000002734 8 143558 141894 C 2011-02-03 1996-07-31 Cytosolic asparaginyl-tRNA synthetase; required for protein synthesis, catalyzes the specific attachment of asparagine to its cognate tRNA -S000031533 CDS YHR019C 8 143558 141894 C 2011-02-03 1996-07-31 -S000001062 ORF Verified YHR020W proline--tRNA ligase chromosome 8 8 143996 146062 W 2011-02-03 1996-07-31 Prolyl-tRNA synthetase; N-terminal domain shows weak homology to prokaryotic posttransfer editing domain, but does not possess posttransfer editing activity; may interact with ribosomes, based on co-purification experiments -S000031552 CDS YHR020W 8 143996 146062 W 2011-02-03 1996-07-31 -S000006513 tRNA_gene tA(AGC)H chromosome 8 L000003862 8 146314 146242 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine -S000032282 noncoding_exon tA(AGC)H 8 146314 146242 C 2011-02-03 2000-05-19 -S000007003 long_terminal_repeat YHRCsigma2 chromosome 8 8 146671 146331 C 2011-02-03 2000-05-19 Ty3 LTR -S000007010 long_terminal_repeat YHRWtau3 chromosome 8 8 146844 147114 W 2011-02-03 2000-05-19 Ty4 LTR -S000001063 ORF Verified YHR021C RPS27B eS27|ribosomal 40S subunit protein S27B|S27e|rp61|YS20|S27B chromosome 8 L000002713 8 148669 147871 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S27, no bacterial homolog; RPS27B has a paralog, RPS27A, that arose from the whole genome duplication -S000031620 CDS YHR021C 8 148116 147871 C 2011-02-03 1996-07-31 -S000031619 CDS YHR021C 8 148669 148667 C 2011-02-03 1996-07-31 -S000031621 intron YHR021C 8 148666 148117 C 2011-02-03 1996-07-31 -S000003531 ORF Uncharacterized YHR021W-A ECM12 chromosome 8 L000003887 8 149225 149680 W 2011-02-03 1999-07-17 Putative protein of unknown function; may contribute to cell wall biosynthesis, mutants display zymolyase hypersensitivity -S000034210 CDS YHR021W-A 8 149225 149680 W 2011-02-03 1999-07-17 -S000001064 ORF Uncharacterized YHR022C chromosome 8 8 150345 149575 C 2011-02-03 1996-07-31 Putative protein of unknown function; YHR022C is not an essential gene -S000032603 CDS YHR022C 8 150345 149575 C 2011-02-03 1996-07-31 -S000028645 ORF Uncharacterized YHR022C-A chromosome 8 8 151306 151217 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032421 CDS YHR022C-A 8 151306 151217 C 2011-02-03 2003-07-29 -S000001065 ORF Verified YHR023W MYO1 myosin 1 chromosome 8 L000001222 8 151666 157452 W 2011-02-03 1996-07-31 Type II myosin heavy chain; required for wild-type cytokinesis and cell separation; localizes to the actomyosin ring; binds to myosin light chains Mlc1p and Mlc2p through its IQ1 and IQ2 motifs respectively -S000032750 CDS YHR023W 8 151666 157452 W 2011-02-03 1996-07-31 -S000001066 ORF Verified YHR024C MAS2 mitochondrial-processing protease subunit alpha|MIF2 chromosome 8 L000001027 8 159192 157744 C 26 2011-02-03 1996-07-31 Alpha subunit of the mitochondrial processing protease (MPP); essential processing enzyme that cleaves the N-terminal targeting sequences from mitochondrially imported proteins -S000032823 CDS YHR024C 8 159192 157744 C 2011-02-03 1996-07-31 -S000001067 ORF Verified YHR025W THR1 homoserine kinase chromosome 8 L000002298 8 159438 160511 W 26 2011-02-03 1996-07-31 Homoserine kinase; conserved protein required for threonine biosynthesis; long-lived protein that is preferentially retained in mother cells and forms cytoplasmic filaments; expression is regulated by the GCN4-mediated general amino acid control pathway -S000033588 CDS YHR025W 8 159438 160511 W 2011-02-03 1996-07-31 -S000001068 ORF Verified YHR026W VMA16 H(+)-transporting V0 sector ATPase subunit c''|PPA1 chromosome 8 L000001468 8 160844 161485 W 27 2011-02-03 1996-07-31 Subunit c'' of the vacuolar ATPase; v-ATPase functions in acidification of the vacuole; one of three proteolipid subunits of the V0 domain -S000033662 CDS YHR026W 8 160844 161485 W 2011-02-03 1996-07-31 -S000001069 ORF Verified YHR027C RPN1 proteasome regulatory particle base subunit RPN1|NAS1|HRD2 chromosome 8 L000003039 8 164711 161730 C 2011-02-03 1996-07-31 Non-ATPase base subunit of the 19S RP of the 26S proteasome; may participate in the recognition of several ligands of the proteasome; contains a leucine-rich repeat (LRR) domain, a site for protein-protein interactions; RP is the acronym for regulatory particle -S000033726 CDS YHR027C 8 164711 161730 C 2011-02-03 1996-07-31 -S000028776 ORF Dubious YHR028W-A chromosome 8 8 167352 167672 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF DAP2/YHR028C -S000033498 CDS YHR028W-A 8 167352 167672 W 2011-02-03 2003-07-29 -S000001070 ORF Verified YHR028C DAP2 DPP2 chromosome 8 L000000483 8 167434 164978 C 2011-02-03 1996-07-31 Dipeptidyl aminopeptidase; synthesized as a glycosylated precursor; localizes to the vacuolar membrane; similar to Ste13p -S000034620 CDS YHR028C 8 167434 164978 C 2011-02-03 1996-07-31 -S000118358 ARS ARS809 ARSVIII-169 chromosome 8 8 168549 168723 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000001071 ORF Verified YHR029C YHI9 chromosome 8 8 168561 167677 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant is defective in unfolded protein response; possibly involved in a membrane regulation metabolic pathway; member of the PhzF superfamily, though most likely not involved in phenazine production -S000034772 CDS YHR029C 8 168561 167677 C 2011-02-03 1996-07-31 -S000001072 ORF Verified YHR030C SLT2 mitogen-activated serine/threonine-protein kinase SLT2|LYT2|SLK2|MPK1|BYC2 chromosome 8 L000001919 8 170344 168890 C 2011-02-03 1996-07-31 Serine/threonine MAP kinase; coordinates expression of all 19S regulatory particle assembly-chaperones (RACs) to control proteasome abundance; involved in regulating maintenance of cell wall integrity, cell cycle progression, nuclear mRNA retention in heat shock, septum assembly; required for mitophagy, pexophagy; affects recruitment of mitochondria to phagophore assembly site; plays role in adaptive response of cells to cold; regulated by the PKC1-mediated signaling pathway -S000035799 CDS YHR030C 8 170344 168890 C 2011-02-03 1996-07-31 -S000001073 ORF Verified YHR031C RRM3 RTT104 chromosome 8 S000007420 8 172970 170799 C 2011-02-03 1996-07-31 DNA helicase involved in rDNA replication and Ty1 transposition; binds to and suppresses DNA damage at G4 motifs in vivo; relieves replication fork pauses at telomeric regions; structurally and functionally related to Pif1p -S000035940 CDS YHR031C 8 172970 170799 C 2011-02-03 1996-07-31 -S000001074 ORF Verified YHR032W ERC1 chromosome 8 8 173344 175089 W 2011-02-03 1996-07-31 Member of the multi-drug and toxin extrusion (MATE) family; the MATE family is part of the multidrug/oligosaccharidyl-lipid/polysaccharide (MOP) exporter superfamily; overproduction confers ethionine resistance and accumulation of S-adenosylmethionine -S000036858 CDS YHR032W 8 173344 175089 W 2011-02-03 1996-07-31 -S000028831 ORF Dubious YHR032W-A chromosome 8 8 175195 175374 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YHR032C-A -S000034481 CDS YHR032W-A 8 175195 175374 W 2011-02-03 2003-07-29 -S000028646 ORF Dubious YHR032C-A chromosome 8 8 175394 175275 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YHR032W-A -S000032422 CDS YHR032C-A 8 175394 175275 C 2011-02-03 2003-07-29 -S000001075 ORF Uncharacterized YHR033W putative glutamate 5-kinase chromosome 8 8 175548 176819 W 2011-02-03 1996-07-31 Putative protein of unknown function; epitope-tagged protein localizes to the cytoplasm; YHR033W has a paralog, PRO1, that arose from the whole genome duplication -S000036911 CDS YHR033W 8 175548 176819 W 2011-02-03 1996-07-31 -S000001076 ORF Verified YHR034C PIH1 NOP17 chromosome 8 8 177999 176965 C 2011-02-03 1996-07-31 Component of the conserved R2TP complex (Rvb1-Rvb2-Tah1-Pih1); R2TP complex interacts with Hsp90 (Hsp82p and Hsc82p) to mediate assembly large protein complexes such as box C/D snoRNPs and RNA polymerase II -S000036943 CDS YHR034C 8 177999 176965 C 2011-02-03 1996-07-31 -S000001077 ORF Verified YHR035W NEL1 chromosome 8 8 178219 180111 W 2011-02-03 1996-07-31 Activator of Sar1p GTPase activity; paralog of Sec23 but does not associate with the COPII components; not an essential gene -S000037726 CDS YHR035W 8 178219 180111 W 2011-02-03 1996-07-31 -S000001078 ORF Verified YHR036W BRL1 chromosome 8 8 180345 181760 W 2011-02-03 1996-07-31 Essential nuclear envelope/ER integral membrane protein; interacts and functions with Apq12p and Brr6p in lipid homeostasis; mutants are defective in nuclear pore complex biogenesis, mRNA nuclear export and are sensitive to sterol biosynthesis inhibitors and membrane fluidizing agents; identified as a dosage suppressor of a temperature sensitive mutation in the major karyopherin, CRM1; homologous to Brr6p -S000037810 CDS YHR036W 8 180345 181760 W 2011-02-03 1996-07-31 -S000001079 ORF Verified YHR037W PUT2 1-pyrroline-5-carboxylate dehydrogenase chromosome 8 L000001536 8 181977 183704 W 24 2011-02-03 1996-07-31 Delta-1-pyrroline-5-carboxylate dehydrogenase; nuclear-encoded mitochondrial protein involved in utilization of proline as sole nitrogen source; deficiency of human homolog ALDH4A1 causes type II hyperprolinemia (HPII), an autosomal recessive inborn error of metabolism; human homolog ALDH4A1 can complement yeast null mutant -S000037908 CDS YHR037W 8 181977 183704 W 2011-02-03 1996-07-31 -S000001080 ORF Verified YHR038W RRF1 FIL1|KIM4 chromosome 8 L000004366 8 184066 184758 W 2011-02-03 1996-07-31 Mitochondrial ribosome recycling factor; essential for mitochondrial protein synthesis and for the maintenance of the respiratory function of mitochondria -S000030835 CDS YHR038W 8 184066 184758 W 2011-02-03 1996-07-31 -S000001081 ORF Verified YHR039C MSC7 meiotic recombination directing protein chromosome 8 8 186809 184875 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; msc7 mutants are defective in directing meiotic recombination events to homologous chromatids -S000030880 CDS YHR039C 8 186809 184875 C 2011-02-03 1996-07-31 -S000002100 ORF Verified YHR039C-A VMA10 H(+)-transporting V1 sector ATPase subunit G|YHR039BC|YHR039C-B chromosome 8 L000002954 8 187679 187173 C 2011-02-03 1996-07-31 Subunit G of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; involved in vacuolar acidification; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits -S000035240 CDS YHR039C-A 8 187514 187173 C 2011-02-03 1996-07-31 -S000035239 CDS YHR039C-A 8 187679 187677 C 2011-02-03 1996-07-31 -S000035241 intron YHR039C-A 8 187676 187515 C 2011-02-03 1996-07-31 -S000001082 ORF Verified YHR040W BCD1 chromosome 8 8 187924 189024 W 2011-02-03 1996-07-31 Essential protein required for the accumulation of box C/D snoRNA -S000031978 CDS YHR040W 8 187924 189024 W 2011-02-03 1996-07-31 -S000001083 ORF Verified YHR041C SRB2 MED20|HRS2 chromosome 8 L000002050|L000003586 8 189864 189131 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; general transcription factor involved in telomere maintenance -S000032051 CDS YHR041C 8 189749 189131 C 2011-02-03 1996-07-31 -S000032050 CDS YHR041C 8 189864 189851 C 2011-02-03 1996-07-31 -S000032052 intron YHR041C 8 189850 189750 C 2011-02-03 1996-07-31 -S000001084 ORF Verified YHR042W NCP1 CPR1 chromosome 8 L000001482 8 190543 192618 W 2011-02-03 1996-07-31 NADP-cytochrome P450 reductase; involved in ergosterol biosynthesis; associated and coordinately regulated with Erg11p -S000033000 CDS YHR042W 8 190543 192618 W 2011-02-03 1996-07-31 -S000001085 ORF Verified YHR043C DOG2 2-deoxyglucose-6-phosphatase chromosome 8 L000000516 8 193545 192805 C 2011-02-03 1996-07-31 2-deoxyglucose-6-phosphate phosphatase; member of a family of low molecular weight phosphatases, induced by oxidative and osmotic stress, confers 2-deoxyglucose resistance when overexpressed; DOG2 has a paralog, DOG1, that arose from a single-locus duplication; the last half of DOG1 and DOG2 are subject to gene conversions among S. cerevisiae, S. paradoxus, and S. mikatae -S000033060 CDS YHR043C 8 193545 192805 C 2011-02-03 1996-07-31 -S000001086 ORF Verified YHR044C DOG1 2-deoxyglucose-6-phosphatase chromosome 8 L000000515 8 194808 194068 C 2011-02-03 1996-07-31 2-deoxyglucose-6-phosphate phosphatase; member of a family of low molecular weight phosphatases; confers 2-deoxyglucose resistance when overexpressed; DOG1 has a paralog, DOG2, that arose from a single-locus duplication; the last half of DOG1 and DOG2 are subject to gene conversions among S. cerevisiae, S. paradoxus, and S. mikatae -S000033147 CDS YHR044C 8 194808 194068 C 2011-02-03 1996-07-31 -S000001087 ORF Uncharacterized YHR045W chromosome 8 8 195551 197233 W 2011-02-03 1996-07-31 Putative protein of unknown function; possible role in iron metabolism and/or amino acid and carbohydrate metabolism; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum -S000033998 CDS YHR045W 8 195551 197233 W 2011-02-03 1996-07-31 -S000001088 ORF Verified YHR046C INM1 inositol monophosphate 1-phosphatase INM1 chromosome 8 8 198285 197398 C 2011-02-03 1996-07-31 Inositol monophosphatase; involved in biosynthesis of inositol and in phosphoinositide second messenger signaling; INM1 expression increases in the presence of inositol and decreases upon exposure to antibipolar drugs lithium and valproate -S000034037 CDS YHR046C 8 198285 197398 C 2011-02-03 1996-07-31 -S000001089 ORF Verified YHR047C AAP1 arginine/alanine aminopeptidase|AAP1' chromosome 8 L000000006 8 201310 198740 C 2011-02-03 1996-07-31 Arginine/alanine amino peptidase; overproduction stimulates glycogen accumulation; AAP1 has a paralog, APE2, that arose from the whole genome duplication -S000034139 CDS YHR047C 8 201310 198740 C 2011-02-03 1996-07-31 -S000001090 ORF Uncharacterized YHR048W YHK8 chromosome 8 8 204607 206151 W 2011-02-03 1996-07-31 Presumed antiporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; expression of gene is up-regulated in cells exhibiting reduced susceptibility to azoles -S000035165 CDS YHR048W 8 204607 206151 W 2011-02-03 1996-07-31 -S000001091 ORF Verified YHR049W FSH1 putative serine hydrolase chromosome 8 8 206462 207193 W 2011-02-03 1996-07-31 Putative serine hydrolase; localizes to both the nucleus and cytoplasm; sequence is similar to S. cerevisiae Fsh2p and Fsh3p and the human candidate tumor suppressor OVCA2 -S000035291 CDS YHR049W 8 206462 207193 W 2011-02-03 1996-07-31 -S000003532 ORF Dubious YHR049C-A chromosome 8 8 207530 207234 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031834 CDS YHR049C-A 8 207530 207234 C 2011-02-03 1996-07-31|2011-02-03 -S000001092 ORF Verified YHR050W SMF2 divalent metal ion transporter SMF2 chromosome 8 L000001932|L000001870 8 207654 209303 W 2011-02-03 1996-07-31 Divalent metal ion transporter involved in manganese homeostasis; has broad specificity for di-valent and tri-valent metals; post-translationally regulated by levels of metal ions; member of the Nramp family of metal transport proteins -S000036147 CDS YHR050W 8 207654 209303 W 2011-02-03 1996-07-31 -S000028832 ORF Uncharacterized YHR050W-A chromosome 8 8 209475 209645 W 2011-02-03 2003-07-29 Protein of unknown function; identified by expression profiling and mass spectrometry -S000034482 CDS YHR050W-A 8 209475 209645 W 2011-02-03 2003-07-29 -S000001093 ORF Verified YHR051W COX6 cytochrome c oxidase subunit VI chromosome 8 L000000390 8 209705 210151 W 2011-02-03 1996-07-31 Subunit VI of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; expression is regulated by oxygen levels -S000029851 CDS YHR051W 8 209705 210151 W 2011-02-03 1996-07-31 -S000001094 ORF Verified YHR052W CIC1 NSA3 chromosome 8 8 210848 211978 W 2011-02-03 1996-07-31 Essential protein that interacts with proteasome components; has a potential role in proteasome substrate specificity; also copurifies with 66S pre-ribosomal particles -S000031769 CDS YHR052W 8 210848 211978 W 2011-02-03 1996-07-31 -S000028470 ncRNA_gene RUF5-1 RUF5-1 RUF5 chromosome 8 8 212409 213118 W 2011-02-03 2004-04-01 RNA of Unknown Function -S000030107 noncoding_exon RUF5-1 8 212409 213118 W 2011-02-03 2004-04-01 -S000028647 ORF Dubious YHR052W-A chromosome 8 8 212510 212704 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps CUP1-1 -S000032423 CDS YHR052W-A 8 212510 212704 W 2011-02-03 2003-07-29 -S000001095 ORF Verified YHR053C CUP1-1 metallothionein CUP1|CUP1 chromosome 8 L000000436 8 212720 212535 C 2011-02-03 1996-07-31 Metallothionein; binds copper and mediates resistance to high concentrations of copper and cadmium; locus is variably amplified in different strains, with two copies, CUP1-1 and CUP1-2, in the genomic sequence reference strain S288C; CUP1-1 has a paralog, CUP1-2, that arose from a segmental duplication -S000031831 CDS YHR053C 8 212720 212535 C 2011-02-03 1996-07-31 -S000130147 ARS ARS810 chromosome 8 8 212720 213185 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001096 ORF Uncharacterized YHR054C chromosome 8 8 214249 213185 C 2011-02-03 1996-07-31 Putative protein of unknown function; partial duplicate of RSC30/YHR056C, truncated remnant of segmental duplication -S000031964 CDS YHR054C 8 214249 213185 C 2011-02-03 1996-07-31 -S000028474 ncRNA_gene RUF5-2 RUF5-2 RUF5 chromosome 8 8 214407 215116 W 2011-02-03 2004-04-01 RNA of Unknown Function -S000030115 noncoding_exon RUF5-2 8 214407 215116 W 2011-02-03 2004-04-01 -S000028648 ORF Dubious YHR054W-A chromosome 8 8 214508 214702 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps CUP1-2 -S000032424 CDS YHR054W-A 8 214508 214702 W 2011-02-03 2003-07-29 -S000001097 ORF Verified YHR055C CUP1-2 metallothionein CUP1|CUP1 chromosome 8 8 214718 214533 C 2011-02-03 1996-07-31 Metallothionein; binds copper and mediates resistance to high concentrations of copper and cadmium; locus is variably amplified in different strains, with two copies, CUP1-1 and CUP1-2, in the genomic sequence reference strain S288C; CUP1-2 has a paralog, CUP1-1, that arose from a segmental duplication -S000037453 CDS YHR055C 8 214718 214533 C 2011-02-03 1996-07-31 -S000130148 ARS ARS811 chromosome 8 8 214718 215183 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028777 ORF Dubious YHR056W-A chromosome 8 8 217406 217840 W 2011-02-03 2004-01-29|2011-02-03|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps ORF RSC30/YHR056C -S000033500 CDS YHR056W-A 8 217406 217840 W 2011-02-03 2004-01-29|2003-07-29|2011-02-03 -S000001098 ORF Verified YHR056C RSC30 chromosome 8 8 217834 215183 C 2011-02-03 2004-01-29|1996-07-31|2011-02-03 Component of the RSC chromatin remodeling complex; non-essential gene required for regulation of ribosomal protein genes and the cell wall/stress response; null mutants are osmosensitive; RSC30 has a paralog, RSC3, that arose from the whole genome duplication -S000037529 CDS YHR056C 8 217834 215183 C 2011-02-03 2004-01-29|1996-07-31|2011-02-03 -S000001099 ORF Verified YHR057C CPR2 peptidylprolyl isomerase CPR2|CYP2 chromosome 8 L000000463 8 218843 218226 C 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; potential role in the secretory pathway; seamless-GFP and mCherry fusion proteins localize to the vacuole, while SWAT-GFP fusion localizes to both the endoplasmic reticulum and vacuole; suppresses toxicity of slow-folding human Z-type alpha1-antitrypsin variant associated with liver cirrhosis and emphysema -S000037607 CDS YHR057C 8 218843 218226 C 2011-02-03 1996-07-31 -S000001100 ORF Verified YHR058C MED6 mediator complex subunit MED6 chromosome 8 L000003569 8 219884 218997 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; protein abundance increases in response to DNA replication stress -S000037687 CDS YHR058C 8 219884 218997 C 2011-02-03 1996-07-31 -S000001101 ORF Verified YHR059W FYV4 chromosome 8 8 220108 220500 W 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin -S000030557 CDS YHR059W 8 220108 220500 W 2011-02-03 1996-07-31 -S000001102 ORF Verified YHR060W VMA22 VPH6|CEV1 chromosome 8 L000002789 8 220725 221270 W 2011-02-03 1996-07-31 Protein that is required for vacuolar H+-ATPase (V-ATPase) function; peripheral membrane protein; not an actual component of the V-ATPase complex; functions in the assembly of the V-ATPase; localized to the yeast endoplasmic reticulum (ER) -S000029986 CDS YHR060W 8 220725 221270 W 2011-02-03 1996-07-31 -S000001103 ORF Verified YHR061C GIC1 chromosome 8 L000003313 8 222478 221534 C 2011-02-03 1996-07-31 Protein involved in initiation of budding and cellular polarization; interacts with Cdc42p via the Cdc42/Rac-interactive binding (CRIB) domain; relocalizes from bud neck to nucleus upon DNA replication stress; GIC1 has a paralog, GIC2, that arose from the whole genome duplication -S000030028 CDS YHR061C 8 222478 221534 C 2011-02-03 1996-07-31 -S000001104 ORF Verified YHR062C RPP1 RNA-binding RNA processing protein RPP1 chromosome 8 L000004007 8 223758 222877 C 2011-02-03 1996-07-31 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; relocalizes to the cytosol in response to hypoxia -S000030103 CDS YHR062C 8 223758 222877 C 2011-02-03 1996-07-31 -S000001105 ORF Verified YHR063C PAN5 2-dehydropantoate 2-reductase PAN5 chromosome 8 8 225169 224030 C 2011-02-03 1996-07-31 2-dehydropantoate 2-reductase; part of the pantothenic acid pathway, structurally homologous to E. coli panE -S000030303 CDS YHR063C 8 225169 224030 C 2011-02-03 1996-07-31 -S000028778 ORF Dubious YHR063W-A chromosome 8 8 225442 225777 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SSZ1/YHR064C -S000033501 CDS YHR063W-A 8 225442 225777 W 2011-02-03 2003-07-29 -S000001106 ORF Verified YHR064C SSZ1 PDR13 chromosome 8 L000004029 8 227141 225525 C 2011-02-03 2003-09-22|1996-07-31 Hsp70 protein that interacts with Zuo1p (a DnaJ homolog); interacts with Zuo1p to form a ribosome-associated complex that binds the ribosome via the Zuo1p subunit; also involved in pleiotropic drug resistance via sequential activation of PDR1 and PDR5; binds ATP -S000030385 CDS YHR064C 8 227141 225525 C 2011-02-03 2003-09-22|1996-07-31 -S000001107 ORF Verified YHR065C RRP3 RNA-dependent ATPase RRP3 chromosome 8 L000004225 8 229037 227532 C 2011-02-03 2003-09-22|1996-07-31 Protein involved in rRNA processing; required for maturation of the 35S primary transcript of pre-rRNA and for cleavage leading to mature 18S rRNA; homologous to eIF-4a, which is a DEAD box RNA-dependent ATPase with helicase activity -S000033722 CDS YHR065C 8 229037 227532 C 2011-02-03 2003-09-22|1996-07-31 -S000001108 ORF Verified YHR066W SSF1 rRNA-binding ribosome biosynthesis protein chromosome 8 L000002080 8 229335 230696 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; required for ribosomal large subunit maturation; functionally redundant with Ssf2p; member of the Brix family; SSF1 has a paralog, SSF2, that arose from the whole genome duplication -S000033935 CDS YHR066W 8 229335 230696 W 2011-02-03 1996-07-31 -S000001109 ORF Verified YHR067W HTD2 hydroxyacyl-thioester dehydratase HTD2|RMD12 chromosome 8 8 230970 231812 W 2011-02-03 1996-07-31 Mitochondrial 3-hydroxyacyl-thioester dehydratase; involved in fatty acid biosynthesis, required for respiratory growth and for normal mitochondrial morphology -S000034794 CDS YHR067W 8 230970 231812 W 2011-02-03 1996-07-31 -S000001110 ORF Verified YHR068W DYS1 deoxyhypusine synthase chromosome 8 L000003346 8 232133 233296 W 2011-02-03 1996-07-31 Deoxyhypusine synthase; catalyzes formation of deoxyhypusine, the first step in hypusine biosynthesis; triggers posttranslational hypusination of translation elongation factor eIF-5A and regulates its intracellular levels; tetrameric; human homolog DHPS allows growth of yeast haploid dys1 null mutant after sporulation of heterozygous diploid -S000034934 CDS YHR068W 8 232133 233296 W 2011-02-03 1996-07-31 -S000001111 ORF Verified YHR069C RRP4 exosome non-catalytic core subunit RRP4 chromosome 8 L000003549 8 234658 233579 C 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; predicted to contain RNA binding domains; has similarity to human hRrp4p (EXOSC2) -S000034980 CDS YHR069C 8 234658 233579 C 2011-02-03 1996-07-31 -S000001112 ORF Verified YHR070W TRM5 tRNA (guanine) methyltransferase chromosome 8 8 234881 236380 W 2011-02-03 1996-07-31 tRNA(m(1)G37)methyltransferase; methylates a tRNA base adjacent to the anticodon that has a role in prevention of frameshifting; localized to both cytoplasm and mitochondria, and modifies both cytoplasmic and mitochondrial tRNAs; mutations in human ortholog TRMT5 are associated with skeletal muscle respiratory chain deficiencies, and trm5 mutations analogous to disease mutations decrease respiration -S000034511 CDS YHR070W 8 234881 236380 W 2011-02-03 1996-07-31 -S000028779 ORF Dubious YHR069C-A chromosome 8 8 235236 234874 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps ORF TRM5/YHR070W -S000033503 CDS YHR069C-A 8 235236 234874 C 2011-02-03 2003-07-29 -S000028780 ORF Dubious YHR070C-A chromosome 8 8 236512 236102 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene TRM5/YHR070W -S000033520 CDS YHR070C-A 8 236512 236102 C 2011-02-03 2003-07-29 -S000001113 ORF Verified YHR071W PCL5 chromosome 8 L000004037 8 237004 237693 W 2011-02-03 1996-07-31 Cyclin; interacts with and phosphorylated by Pho85p cyclin-dependent kinase (Cdk), induced by Gcn4p at level of transcription, specifically required for Gcn4p degradation, may be sensor of cellular protein biosynthetic capacity -S000034608 CDS YHR071W 8 237004 237693 W 2011-02-03 1996-07-31 -S000006566 tRNA_gene tF(GAA)H1 chromosome 8 L000003861 8 237939 237848 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000032801 intron tF(GAA)H1 8 237902 237884 C 2011-02-03 2000-05-19 -S000032800 noncoding_exon tF(GAA)H1 8 237883 237848 C 2011-02-03 2000-05-19 -S000032799 noncoding_exon tF(GAA)H1 8 237939 237903 C 2011-02-03 2000-05-19 -S000001114 ORF Verified YHR072W ERG7 lanosterol synthase ERG7 chromosome 8 L000000573 8 239098 241293 W 2011-02-03 1996-07-31|2011-02-03 Lanosterol synthase; an essential enzyme that catalyzes the cyclization of squalene 2,3-epoxide, a step in ergosterol biosynthesis; human LSS functionally complements the lethality of the erg7 null mutation -S000034721 CDS YHR072W 8 239098 241293 W 2011-02-03 1996-07-31|2011-02-03 -S000028781 ORF Dubious YHR071C-A chromosome 8 8 239230 238910 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF ERG7/YHR072W -S000033521 CDS YHR071C-A 8 239230 238910 C 2011-02-03 2003-07-29 -S000007455 ORF Verified YHR072W-A NOP10 snoRNP complex protein NOP10 chromosome 8 8 241664 241840 W 2011-02-03 2000-12-01 Subunit of box H/ACA snoRNP complex; required for pseudouridylation and processing of pre-18S rRNA -S000036439 CDS YHR072W-A 8 241664 241840 W 2011-02-03 2000-12-01 -S000001115 ORF Verified YHR073W OSH3 oxysterol-binding protein related protein OSH3 chromosome 8 8 242582 245572 W 2011-02-03 1996-07-31 Member of an oxysterol-binding protein family; this family has seven members in S. cerevisiae; family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; contains FFAT motif; interacts with ER anchor Scs2p at patches at the plasma membrane; regulated by sterol binding -S000035693 CDS YHR073W 8 242582 245572 W 2011-02-03 1996-07-31 -S000028834 ORF Dubious YHR073W-A chromosome 8 8 242868 243044 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF YHR073W; identified by expression profiling and mass spectrometry -S000034484 CDS YHR073W-A 8 242868 243044 W 2011-02-03 2003-07-29 -S000028833 ORF Dubious YHR073C-B chromosome 8 8 245502 245422 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF YHR073W; identified by expression profiling and mass spectrometry -S000034483 CDS YHR073C-B 8 245502 245422 C 2011-02-03 2003-07-29 -S000118359 ARS ARS813 ARSVIII-246 chromosome 8 8 245773 245847 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178108 ARS_consensus_sequence ARS813 8 245789 245805 W 2014-11-18 2014-11-18 -S000001116 ORF Verified YHR074W QNS1 glutamine-dependent NAD(+) synthetase chromosome 8 S000007569 8 246193 248337 W 2011-02-03 1996-07-31 Glutamine-dependent NAD(+) synthetase; essential for the formation of NAD(+) from nicotinic acid adenine dinucleotide -S000035833 CDS YHR074W 8 246193 248337 W 2011-02-03 1996-07-31 -S000001117 ORF Verified YHR075C PPE1 carboxylesterase-mitochondrial 37S ribosomal protein YmS2|YmS2|MRPS2 chromosome 8 8 249641 248439 C 2011-02-03 1996-07-31 Protein with carboxyl methyl esterase activity; may have a role in demethylation of the phosphoprotein phosphatase catalytic subunit; also identified as a small subunit mitochondrial ribosomal protein -S000035876 CDS YHR075C 8 249641 248439 C 2011-02-03 1996-07-31 -S000001118 ORF Verified YHR076W PTC7 type 2C protein phosphatase PTC7 chromosome 8 8 251101 252225 W 2011-02-03 1996-07-31|2007-07-09 Type 2C serine/threonine protein phosphatase (PP2C); alternatively spliced to create two mRNA isoforms; protein from spliced form localizes to the mitochondria while the one from the unspliced form is localized to the nuclear envelope; activates coenzyme Q6 biosynthesis by dephosphorylation of demethoxy-Q6 hydroxylase Coq7p -S000037820 CDS YHR076W 8 251101 251155 W 2011-02-03 1996-07-31|2007-07-09 -S000123271 CDS YHR076W 8 251249 252225 W 2011-02-03 2007-07-09 -S000123270 intron YHR076W 8 251156 251248 W 2011-02-03 2007-07-09 -S000001119 ORF Verified YHR077C NMD2 SUP111|UPF2|SUA1|IFS1 chromosome 8 L000001257|S000029548|L000002230 8 255756 252374 C 51 2011-02-03 1999-11-17|1996-07-31 Protein involved in the nonsense-mediated mRNA decay (NMD) pathway; interacts with Nam7p and Upf3p; involved in telomere maintenance -S000037864 CDS YHR077C 8 255637 252374 C 2011-02-03 1999-11-17 -S000037863 CDS YHR077C 8 255756 255751 C 2011-02-03 1999-11-17|1996-07-31 -S000037865 intron YHR077C 8 255750 255638 C 2011-02-03 1999-11-17 -S000001120 ORF Uncharacterized YHR078W chromosome 8 8 256360 258018 W 2011-02-03 1996-07-31 High osmolarity-regulated gene of unknown function -S000029926 CDS YHR078W 8 256360 258018 W 2011-02-03 1996-07-31 -S000001121 ORF Verified YHR079C IRE1 bifunctional endoribonuclease/protein kinase IRE1|ERN1 chromosome 8 L000000875 8 261591 258244 C 2011-02-03 1996-07-31 Serine-threonine kinase and endoribonuclease; transmembrane protein that mediates the unfolded protein response (UPR) by regulating Hac1p synthesis through HAC1 mRNA splicing; role in homeostatic adaptation to ER stress; Kar2p binds inactive Ire1p and releases from it upon ER stress -S000029980 CDS YHR079C 8 261591 258244 C 2011-02-03 1996-07-31 -S000001957 ORF Verified YHR079C-A SAE3 YHR079BC|YHR079C-B chromosome 8 L000002893 8 262553 262192 C 2011-02-03 1996-07-31|2005-11-03 Meiosis-specific protein involved in meiotic recombination; involved in DMC1-dependent meiotic recombination; forms heterodimer with Mei5p; proposed to be an assembly factor for Dmc1p -S000087058 CDS YHR079C-A 8 262354 262192 C 2011-02-03 2005-11-03 -S000034792 CDS YHR079C-A 8 262553 262441 C 2011-02-03 1996-07-31|2005-11-03 -S000087057 intron YHR079C-A 8 262440 262355 C 2011-02-03 2005-11-03 -S000001122 ORF Verified YHR080C LAM4 LTC3 chromosome 8 8 266838 262801 C 2011-02-03 1996-07-31 Sterol-binding protein that localizes to puncta in the cortical ER; sterol binding occurs via two StART-like domains; one of six StART-like domain-containing proteins in yeast that may be involved in intracellular sterol transfer between membranes; conserved across eukaryotes; has both GRAM and StART-like (VASt) domains; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies -S000037712 CDS YHR080C 8 266838 262801 C 2011-02-03 1996-07-31 -S000001123 ORF Verified YHR081W LRP1 RRP47|YC1D chromosome 8 8 267538 268092 W 2011-02-03 1996-07-31 Nuclear exosome-associated nucleic acid binding protein; involved in RNA processing, surveillance, degradation, tethering, and export; forms a stable heterodimer with Rrp6p and regulates its exonucleolytic activity; rapidly degraded by the proteasome in the absence of Rrp6p; homolog of mammalian nuclear matrix protein C1D involved in regulation of DNA repair and recombination -S000030578 CDS YHR081W 8 267538 268092 W 2011-02-03 1996-07-31 -S000001124 ORF Verified YHR082C KSP1 putative serine/threonine protein kinase KSP1 chromosome 8 L000000921 8 271548 268459 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; associates with TORC1 and likely involved in TOR signaling cascades; negative regulator of autophagy; nuclear translocation required for haploid filamentous growth; regulates filamentous growth induced nuclear translocation of Bcy1p, Fus3p, and Sks1p; overproduction causes allele-specific suppression of prp20-10; protein abundance increases in response to DNA replication stress -S000030628 CDS YHR082C 8 271548 268459 C 2011-02-03 1996-07-31 -S000001125 ORF Verified YHR083W SAM35 SAM complex subunit SAM35|TOM38|TOB38|FMP20 chromosome 8 8 272627 273616 W 2011-02-03 1996-07-31 Component of the sorting and assembly machinery (SAM) complex; the SAM (or TOB) complex is located in the mitochondrial outer membrane; the complex binds precursors of beta-barrel proteins and facilitates their insertion into the outer membrane -S000030804 CDS YHR083W 8 272627 273616 W 2011-02-03 1996-07-31 -S000001126 ORF Verified YHR084W STE12 homeodomain family transcription factor STE12 chromosome 8 L000002119 8 274174 276240 W 65.64 2011-02-03 1996-07-31 Transcription factor that is activated by a MAPK signaling cascade; activates genes involved in mating or pseudohyphal/invasive growth pathways; cooperates with Tec1p transcription factor to regulate genes specific for invasive growth -S000030898 CDS YHR084W 8 274174 276240 W 2011-02-03 1996-07-31 -S000001127 ORF Verified YHR085W IPI1 chromosome 8 8 276764 277768 W 2011-02-03 1996-07-31 Component of the Rix1 complex and possibly pre-replicative complexes; required for processing of ITS2 sequences from 35S pre-rRNA; component of the pre-60S ribosomal particle with the dynein-related AAA-type ATPase Mdn1p; required for pre-replicative complex (pre-RC) formation and maintenance during DNA replication licensing; relocalizes to the cytosol in response to hypoxia; essential gene -S000031899 CDS YHR085W 8 276764 277768 W 2011-02-03 1996-07-31 -S000001128 ORF Verified YHR086W NAM8 MUD15|MRE2 chromosome 8 L000001147|L000001230 8 278153 279724 W 2011-02-03 1996-07-31 RNA binding protein, component of the U1 snRNP protein; mutants are defective in meiotic recombination and in formation of viable spores, involved in the formation of DSBs through meiosis-specific splicing of REC107 pre-mRNA; Nam8p regulon embraces the meiotic pre-mRNAs of REC107, HFM1, AMA1 SPO22 and PCH2; the putative RNA binding domains RRM2 and RRM3 are required for Nam8p meiotic function -S000032027 CDS YHR086W 8 278153 279724 W 2011-02-03 1996-07-31 -S000028552 ORF Uncharacterized YHR086W-A chromosome 8 8 280231 280392 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively -S000031238 CDS YHR086W-A 8 280231 280392 W 2011-02-03 2003-07-29 -S000001129 ORF Verified YHR087W RTC3 HGI1 chromosome 8 8 280820 281155 W 2011-02-03 1996-07-31 Protein of unknown function involved in RNA metabolism; has structural similarity to SBDS, the human protein mutated in Shwachman-Diamond Syndrome (the yeast SBDS ortholog = SDO1); null mutation suppresses cdc13-1 temperature sensitivity; protein abundance increases in response to DNA replication stress -S000032137 CDS YHR087W 8 280820 281155 W 2011-02-03 1996-07-31 -S000001130 ORF Verified YHR088W RPF1 rRNA-binding ribosome biosynthesis protein RPF1 chromosome 8 8 281495 282382 W 2011-02-03 1996-07-31 Protein involved in assembly and export of the large ribosomal subunit; nucleolar protein; constituent of 66S pre-ribosomal particles; contains a sigma(70)-like motif, which is thought to bind RNA -S000034136 CDS YHR088W 8 281495 282382 W 2011-02-03 1996-07-31 -S000001131 ORF Verified YHR089C GAR1 H/ACA snoRNP pseudouridylase subunit GAR1 chromosome 8 L000000668 8 283298 282681 C 2011-02-03 1996-07-31 Protein component of the H/ACA snoRNP pseudouridylase complex; involved in the modification and cleavage of the 18S pre-rRNA -S000034183 CDS YHR089C 8 283298 282681 C 2011-02-03 1996-07-31 -S000001132 ORF Verified YHR090C YNG2 histone acetyltransferase YNG2|EAF4|NBN1 chromosome 8 L000004452 8 284625 283777 C 2011-02-03 1996-07-31 Subunit of NuA4, an essential histone acetyltransferase complex; positions Piccolo NuA4 for efficient acetylation of histone H4 or histone H2A; relocalizes to the cytosol in response to hypoxia; similar to human tumor suppressor ING1 and its isoforms ING4 and ING5 -S000033033 CDS YHR090C 8 284625 283777 C 2011-02-03 1996-07-31 -S000001133 ORF Verified YHR091C MSR1 arginine--tRNA ligase MSR1 chromosome 8 L000002618 8 286770 284839 C 2011-02-03 1996-07-31 Mitochondrial arginyl-tRNA synthetase; mutations in human ortholog are associated with pontocerebellar hypoplasia type 6; MSR1 has a paralog, YDR341C, that arose from the whole genome duplication -S000033677 CDS YHR091C 8 286770 284839 C 2011-02-03 1996-07-31 -S000130149 ARS ARS814 chromosome 8 8 286770 287128 2011-02-03 2009-05-06|2011-02-03 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001134 ORF Verified YHR092C HXT4 hexose transporter HXT4|RAG1|LGT1 chromosome 8 L000000838 8 288811 287081 C 2011-02-03 1996-07-31|2011-02-03 High-affinity glucose transporter; member of the major facilitator superfamily, expression is induced by low levels of glucose and repressed by high levels of glucose; HXT4 has a paralog, HXT7, that arose from the whole genome duplication -S000033772 CDS YHR092C 8 288811 287081 C 2011-02-03 1996-07-31|2011-02-03 -S000001135 ORF Dubious YHR093W AHT1 chromosome 8 L000000065 8 289142 289690 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; multicopy suppressor of glucose transport defects, likely due to the presence of an HXT4 regulatory element in the region -S000033970 CDS YHR093W 8 289142 289690 W 2011-02-03 1996-07-31 -S000001136 ORF Verified YHR094C HXT1 hexose transporter HXT1|HOR4 chromosome 8 L000000835 8 292625 290913 C 66.54 2011-02-03 1996-07-31 Low-affinity glucose transporter of the major facilitator superfamily; expression is induced by Hxk2p in the presence of glucose and repressed by Rgt1p when glucose is limiting; HXT1 has a paralog, HXT6, what arose from the whole genome duplication -S000034018 CDS YHR094C 8 292625 290913 C 2011-02-03 1996-07-31 -S000001137 ORF Dubious YHR095W chromosome 8 8 292943 293437 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035020 CDS YHR095W 8 292943 293437 W 2011-02-03 1996-07-31|2011-02-03 -S000001138 ORF Verified YHR096C HXT5 hexose transporter HXT5 chromosome 8 L000000839 8 296447 294669 C 2011-02-03 1996-07-31 Hexose transporter with moderate affinity for glucose; induced in the presence of non-fermentable carbon sources, induced by a decrease in growth rate, contains an extended N-terminal domain relative to other HXTs; HXT5 has a paralog, HXT3, that arose from the whole genome duplication -S000035072 CDS YHR096C 8 296447 294669 C 2011-02-03 1996-07-31 -S000130150 ARS ARS815 chromosome 8 8 297060 297179 2014-11-18 2014-11-18|2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001139 ORF Uncharacterized YHR097C chromosome 8 8 298609 297385 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; YHR097C has a paralog, PAL1, that arose from the whole genome duplication -S000035267 CDS YHR097C 8 298360 297385 C 2011-02-03 1996-07-31 -S000035266 CDS YHR097C 8 298609 298485 C 2011-02-03 1996-07-31 -S000035268 intron YHR097C 8 298484 298361 C 2011-02-03 1996-07-31 -S000001140 ORF Verified YHR098C SFB3 LST1 chromosome 8 L000004659 8 301934 299145 C 2011-02-03 1996-07-31 Component of the Sec23p-Sfb3p heterodimer of the COPII vesicle coat; COPII coat is required for cargo selection during vesicle formation in ER to Golgi transport; scaffolding function of Lst1p required to generate vesicles that can accommodate difficult cargo proteins that include large oligomeric assemblies and asymmetrically distributed membrane proteins; homologous to Sec24p and Sfb2p -S000036156 CDS YHR098C 8 301934 299145 C 2011-02-03 1996-07-31 -S000001141 ORF Verified YHR099W TRA1 histone acetyltransferase TRA1 chromosome 8 L000003945 8 302761 313995 W 2011-02-03 1996-07-31 Subunit of SAGA and NuA4 histone acetyltransferase complexes; interacts with acidic activators (e.g., Gal4p) which leads to transcription activation; similar to human TRRAP, which is a cofactor for c-Myc mediated oncogenic transformation -S000036322 CDS YHR099W 8 302761 313995 W 2011-02-03 1996-07-31 -S000001142 ORF Verified YHR100C GEP4 phosphatidylglycerophosphatase chromosome 8 8 314673 314116 C 2011-02-03 1996-07-31 Mitochondrial phosphatidylglycerophosphatase (PGP phosphatase); dephosphorylates phosphatidylglycerolphosphate to generate phosphatidylglycerol, an essential step during cardiolipin biosynthesis; null mutant is sensitive to tunicamycin, DTT -S000034711 CDS YHR100C 8 314673 314116 C 2011-02-03 1996-07-31 -S000001143 ORF Verified YHR101C BIG1 chromosome 8 L000003416 8 315968 314874 C 2011-02-03 1996-07-31 Integral membrane protein of the endoplasmic reticulum; required for normal content of cell wall beta-1,6-glucan -S000035670 CDS YHR101C 8 315771 314874 C 2011-02-03 1996-07-31 -S000035669 CDS YHR101C 8 315968 315859 C 2011-02-03 1996-07-31 -S000035671 intron YHR101C 8 315858 315772 C 2011-02-03 1996-07-31 -S000001144 ORF Verified YHR102W KIC1 putative serine/threonine protein kinase KIC1|NRK1 chromosome 8 L000001276 8 316572 319814 W 2011-02-03 1996-07-31 Protein kinase of the PAK/Ste20 family, required for cell integrity; physically interacts with Cdc31p (centrin), which is a component of the spindle pole body; part of the RAM network that regulates cellular polarity and morphogenesis -S000035759 CDS YHR102W 8 316572 319814 W 2011-02-03 1996-07-31 -S000001145 ORF Verified YHR103W SBE22 chromosome 8 L000003101 8 320414 322972 W 2011-02-03 1996-07-31 Protein involved in bud growth; involved in the transport of cell wall components from the Golgi to the cell surface; similar in structure and functionally redundant with Sbe2p; SBE22 has a paralog, SBE2, that arose from the whole genome duplication -S000035866 CDS YHR103W 8 320414 322972 W 2011-02-03 1996-07-31 -S000001146 ORF Verified YHR104W GRE3 trifunctional aldehyde reductase/xylose reductase/glucose 1-dehydrogenase (NADP(+)) chromosome 8 L000004178 8 323409 324392 W 2011-02-03 1996-07-31 Aldose reductase; involved in methylglyoxal, d-xylose, arabinose, and galactose metabolism; stress induced (osmotic, ionic, oxidative, heat shock, starvation and heavy metals); regulated by the HOG pathway; protein abundance increases in response to DNA replication stress -S000036784 CDS YHR104W 8 323409 324392 W 2011-02-03 1996-07-31 -S000001147 ORF Verified YHR105W YPT35 chromosome 8 8 324766 325410 W 2011-02-03 1996-07-31 Endosomal protein of unknown function; contains a phox (PX) homology domain; binds to both phosphatidylinositol-3-phosphate (PtdIns(3)P) and proteins involved in ER-Golgi or vesicular transport -S000036859 CDS YHR105W 8 324766 325410 W 2011-02-03 1996-07-31 -S000001148 ORF Verified YHR106W TRR2 thioredoxin-disulfide reductase TRR2 chromosome 8 L000003954 8 325598 326626 W 2011-02-03 1996-07-31 Mitochondrial thioredoxin reductase; involved in protection against oxidative stress, required with Glr1p to maintain the redox state of Trx3p; contains active-site motif (CAVC) present in prokaryotic orthologs; binds NADPH and FAD; TRR2 has a paralog, TRR1, that arose from the whole genome duplication -S000036915 CDS YHR106W 8 325598 326626 W 2011-02-03 1996-07-31 -S000001149 ORF Verified YHR107C CDC12 septin CDC12|PSL7|CLA10 chromosome 8 L000000348|L000000252 8 328036 326813 C 68.14 2011-02-03 1996-07-31 Component of the septin ring that is required for cytokinesis; septins are GTP-binding proteins that assemble into rod-like hetero-oligomers that can associate with other rods to form filaments; septin rings at the mother-bud neck act as scaffolds for recruiting cell division factors and as barriers to prevent diffusion of specific proteins between mother and daughter cells -S000036947 CDS YHR107C 8 328036 326813 C 2011-02-03 1996-07-31 -S000001150 ORF Verified YHR108W GGA2 phosphatidylinositol 4-phosphate-binding protein chromosome 8 S000007494 8 328303 330060 W 2011-02-03 1996-07-31 Protein that regulates Arf1p, Arf2p to facilitate Golgi trafficking; binds phosphatidylinositol 4-phosphate, which plays a role in TGN localization; has homology to gamma-adaptin; GGA2 has a paralog, GGA1, that arose from the whole genome duplication -S000037727 CDS YHR108W 8 328303 330060 W 2011-02-03 1996-07-31 -S000001151 ORF Verified YHR109W CTM1 cytochrome c lysine N-methyltransferase chromosome 8 S000007504 8 330310 332067 W 2011-02-03 1996-07-31 Cytochrome c lysine methyltransferase; trimethylates residue 72 of apo-cytochrome c (Cyc1p) in the cytosol; not required for normal respiratory growth -S000037814 CDS YHR109W 8 330310 332067 W 2011-02-03 1996-07-31 -S000001152 ORF Verified YHR110W ERP5 chromosome 8 L000004682 8 332282 332920 W 2011-02-03 1996-07-31 Protein with similarity to Emp24p and Erv25p; member of the p24 family involved in ER to Golgi transport -S000030739 CDS YHR110W 8 332282 332920 W 2011-02-03 1996-07-31 -S000001153 ORF Verified YHR111W UBA4 YHR1 chromosome 8 8 333072 334394 W 2011-02-03 1996-07-31 E1-like protein that activates Urm1p before urmylation; also acts in thiolation of the wobble base of cytoplasmic tRNAs by adenylating and then thiolating Urm1p; receives sulfur from Tum1p -S000030847 CDS YHR111W 8 333072 334394 W 2011-02-03 1996-07-31 -S000001154 ORF Verified YHR112C putative cystathionine beta-lyase chromosome 8 8 335663 334527 C 2011-02-03 1996-07-31 Protein of unknown function; localizes to the cytoplasm and nucleus; overexpression affects protein trafficking through the endocytic pathway -S000031735 CDS YHR112C 8 335663 334527 C 2011-02-03 1996-07-31 -S000001155 ORF Verified YHR113W APE4 aspartyl aminopeptidase chromosome 8 8 336337 337809 W 2011-02-03 1996-07-31 Cytoplasmic aspartyl aminopeptidase with possible vacuole function; Cvt pathway cargo protein; cleaves unblocked N-terminal acidic amino acids from peptide substrates; forms a 12-subunit homo-oligomer; M18 metalloprotease family -S000031980 CDS YHR113W 8 336337 337809 W 2011-02-03 1996-07-31 -S000001156 ORF Verified YHR114W BZZ1 LSB7 chromosome 8 8 338083 339984 W 2011-02-03 1996-07-31 SH3 domain protein implicated in regulating actin polymerization; able to recruit actin polymerization machinery through its SH3 domains; colocalizes with cortical actin patches and Las17p; interacts with type I myosins -S000032098 CDS YHR114W 8 338083 339984 W 2011-02-03 1996-07-31 -S000001157 ORF Verified YHR115C DMA1 ubiquitin-conjugating protein DMA1|CHF1 chromosome 8 S000029719 8 341359 340109 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase (E3); controls septin dynamics, spindle position checkpoint (SPOC) with ligase Dma2p by regulating recruitment of Elm1p to bud neck; regulates levels of eIF2 subunit Gcd11p, as well as abundance, localization, and ubiquitination of Cdk inhibitory kinase Swe1p; ubiquitinates cyclin Pcl1p; ortholog of human RNF8, similar to human Chfr; contains FHA, RING fingers; DMA1 has a paralog, DMA2, that arose from the whole genome duplication -S000032967 CDS YHR115C 8 341359 340109 C 2011-02-03 1996-07-31 -S000001158 ORF Verified YHR116W COX23 chromosome 8 8 341665 342120 W 2011-02-03 1996-07-31 Protein that functions in mitochondrial copper homeostasis; mitochondrial intermembrane space protein; essential for functional cytochrome oxidase expression; homologous to Cox17p; contains twin cysteine-x9-cysteine motifs -S000033114 CDS YHR116W 8 341665 342120 W 2011-02-03 1996-07-31 -S000001159 ORF Verified YHR117W TOM71 protein channel TOM71|TOM72 chromosome 8 L000003252 8 342349 344268 W 2011-02-03 1996-07-31 Mitochondrial outer membrane protein; probable minor component of the TOM (translocase of outer membrane) complex responsible for recognition and import of mitochondrially directed proteins; TOM71 has a paralog, TOM70, that arose from the whole genome duplication -S000033188 CDS YHR117W 8 342349 344268 W 2011-02-03 1996-07-31 -S000001160 ORF Verified YHR118C ORC6 origin recognition complex subunit 6 chromosome 8 L000001306 8 345628 344321 C 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing; phosphorylated by Cdc28p; mutation in the human Orc6p is linked to Meier-Gorlin syndrome -S000033913 CDS YHR118C 8 345628 344321 C 2011-02-03 1996-07-31 -S000001161 ORF Verified YHR119W SET1 histone methyltransferase SET1|KMT2|YTX1 chromosome 8 L000003286 8 346043 349285 W 2011-02-03 1996-07-31 Histone methyltransferase, subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3K4; Set1p-dependent H3K4 trimethylation recruits Nrd1p, allowing efficient termination of snoRNAs and cryptic unstable transcripts (CUTs) by Nrd1p-Nab3p-Sen1p pathway; modulates histone acetylation levels in promoter proximal regions to ensure efficient Nrd1p-dependent termination; required in transcriptional silencing near telomeres and at silent mating type loci; has a SET domain -S000034097 CDS YHR119W 8 346043 349285 W 2011-02-03 1996-07-31 -S000001162 ORF Verified YHR120W MSH1 mismatch repair ATPase MSH1 chromosome 8 L000001189 8 349574 352453 W 70.44 2011-02-03 1996-07-31 DNA-binding protein of the mitochondria; involved in repair of mitochondrial DNA; has ATPase activity and binds to DNA mismatches; has homology to E. coli MutS; transcription is induced during meiosis -S000035066 CDS YHR120W 8 349574 352453 W 2011-02-03 1996-07-31 -S000001163 ORF Verified YHR121W LSM12 chromosome 8 8 352756 353319 W 2011-02-03 1996-07-31 Protein of unknown function that may function in RNA processing; interacts with Pbp1p and Pbp4p and associates with ribosomes; contains an RNA-binding LSM domain and an AD domain; GFP-fusion protein is induced by the DNA-damaging agent MMS; relative distribution to the nucleus increases upon DNA replication stress -S000035174 CDS YHR121W 8 352756 353319 W 2011-02-03 1996-07-31 -S000001164 ORF Verified YHR122W CIA2 iron-sulfur cluster assembly protein CIA2 chromosome 8 8 353625 354320 W 2011-02-03 1996-07-31 Component of cytosolic iron-sulfur protein assembly (CIA) machinery; acts at a late step of Fe-S cluster assembly; forms the CIA targeting complex with Cia1p and Met18p that directs Fe-S cluster incorporation into a subset of proteins involved in methionine biosynthesis, DNA replication and repair, transcription, and telomere maintenance; ortholog of human FAM96B -S000036050 CDS YHR122W 8 353625 354320 W 2011-02-03 1996-07-31 -S000001165 ORF Verified YHR123W EPT1 bifunctional diacylglycerol cholinephosphotransferase/ethanolaminephosphotransferase chromosome 8 L000000563 8 354815 356081 W 2011-02-03 1996-07-31 sn-1,2-diacylglycerol ethanolamine- and cholinephosphotranferase; not essential for viability; EPT1 has a paralog, CPT1, that arose from the whole genome duplication -S000036151 CDS YHR123W 8 354815 354864 W 2011-02-03 1996-07-31 -S000036152 CDS YHR123W 8 354956 356081 W 2011-02-03 1996-07-31 -S000036153 intron YHR123W 8 354865 354955 W 2011-02-03 1996-07-31 -S000001166 ORF Verified YHR124W NDT80 transcription factor NDT80 chromosome 8 L000003016 8 356561 358444 W 2011-02-03 1996-07-31 Meiosis-specific transcription factor; required for exit from pachytene and for full meiotic recombination; activates middle sporulation genes; competes with Sum1p for binding to promoters containing middle sporulation elements (MSE) -S000029855 CDS YHR124W 8 356561 358444 W 2011-02-03 1996-07-31 -S000006567 tRNA_gene tF(GAA)H2 chromosome 8 L000003860 8 358569 358478 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis -S000032804 intron tF(GAA)H2 8 358532 358514 C 2011-02-03 2000-05-19 -S000032803 noncoding_exon tF(GAA)H2 8 358513 358478 C 2011-02-03 2000-05-19 -S000032802 noncoding_exon tF(GAA)H2 8 358569 358533 C 2011-02-03 2000-05-19 -S000006996 long_terminal_repeat YHRCdelta8 chromosome 8 8 358850 358672 C 2011-02-03 2000-05-19 Ty1 LTR -S000001167 ORF Dubious YHR125W chromosome 8 8 358858 359163 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031773 CDS YHR125W 8 358858 359163 W 2011-02-03 1996-07-31 -S000007005 long_terminal_repeat YHRCtau4 chromosome 8 8 359067 358850 C 2011-02-03 2000-05-19 Ty4 LTR -S000007008 long_terminal_repeat YHRWdelta9 chromosome 8 8 359079 359372 W 2011-02-03 2000-05-19 Ty1 LTR -S000001168 ORF Uncharacterized YHR126C ANS1 chromosome 8 8 360181 359702 C 2011-02-03 1996-07-31 Putative GPI protein; SWAT-GFP and mCherry fusion proteins localize to the vacuole; transcription dependent upon Azf1p -S000031832 CDS YHR126C 8 360181 359702 C 2011-02-03 1996-07-31 -S000001169 ORF Verified YHR127W HSN1 chromosome 8 L000004353 8 360913 361644 W 2011-02-03 1996-07-31 Protein of unknown function; localizes to the nucleus; required for asymmetric localization of Kar9p during mitosis -S000032038 CDS YHR127W 8 360913 361644 W 2011-02-03 1996-07-31 -S000001170 ORF Verified YHR128W FUR1 uracil phosphoribosyltransferase chromosome 8 L000000651 8 362115 362765 W 91 2011-02-03 2003-09-22|1996-07-31 Uracil phosphoribosyltransferase; synthesizes UMP from uracil; involved in the pyrimidine salvage pathway -S000037493 CDS YHR128W 8 362115 362765 W 2011-02-03 2003-09-22|1996-07-31 -S000001171 ORF Verified YHR129C ARP1 actin-related protein 1|ACT5 chromosome 8 L000000028 8 364153 362999 C 2011-02-03 1996-07-31 Actin-related protein of the dynactin complex; required for spindle orientation and nuclear migration; forms actin-like short filament composed of 9 or 10 Arp1p monomers; putative ortholog of mammalian centractin -S000037551 CDS YHR129C 8 364153 362999 C 2011-02-03 1996-07-31 -S000001172 ORF Uncharacterized YHR130C chromosome 8 8 365300 364965 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YHR130C is not an essential gene -S000037165 CDS YHR130C 8 365300 364965 C 2011-02-03 1996-07-31 -S000028782 ORF Dubious YHR131W-A chromosome 8 8 367747 367992 W 2011-02-03 2004-07-26|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YHR131C -S000033522 CDS YHR131W-A 8 367747 367992 W 2011-02-03 2004-07-26|2003-07-29 -S000001173 ORF Uncharacterized YHR131C chromosome 8 8 367892 365340 C 2011-02-03 2004-07-26|1996-07-31 Putative protein of unknown function; GFP-fusion protein localizes to the cytoplasm; overexpression causes cell cycle delay or arrest; contains a PH domain and binds phosphatidylinositols and other lipids in a large-scale study; YHR131C has a paralog, YNL144C, that arose from the whole genome duplication -S000037245 CDS YHR131C 8 367892 365340 C 2011-02-03 2004-07-26|1996-07-31 -S000001174 ORF Verified YHR132C ECM14 putative metallocarboxypeptidase chromosome 8 L000003889 8 369794 368502 C 2011-02-03 1996-07-31 Putative metalloprotease with similarity to zinc carboxypeptidases; required for normal cell wall assembly -S000037322 CDS YHR132C 8 369794 368502 C 2011-02-03 1996-07-31 -S000007496 ORF Verified YHR132W-A IGO2 phosphatase regulator chromosome 8 8 370054 370449 W 2011-02-03 2000-01-21 Protein required for initiation of G0 program; prevents degradation of nutrient-regulated mRNAs via the 5'-3' mRNA decay pathway; phosphorylated by Rim15p; GFP protein localizes to the cytoplasm and nucleus; IGO2 has a paralog, IGO1, that arose from the whole genome duplication -S000032170 CDS YHR132W-A 8 370054 370449 W 2011-02-03 2000-01-21 -S000001175 ORF Verified YHR133C NSG1 chromosome 8 8 371597 370722 C 2011-02-03 1996-07-31 Protein involved in regulation of sterol biosynthesis; specifically stabilizes Hmg2p, one of two HMG-CoA isoenzymes that catalyze the rate-limiting step in sterol biosynthesis; forms foci at the nuclear periphery upon DNA replication stress; relocalizes to the cytosol in response to hypoxia; homolog of mammalian INSIG proteins; NSG1 has a paralog, NSG2, that arose from the whole genome duplication -S000037393 CDS YHR133C 8 371597 370722 C 2011-02-03 1996-07-31 -S000001176 ORF Verified YHR134W WSS1 metalloendopeptidase WSS1 chromosome 8 8 371749 372558 W 2011-02-03 1996-07-31 Metalloprotease involved in DNA repair, removes DNA-protein crosslinks at stalled replication forks during replication of damaged DNA; localizes to a single spot on the nuclear periphery of mother cells but not daughters; interacts genetically with SMT3; activated by DNA binding -S000030068 CDS YHR134W 8 371749 372558 W 2011-02-03 1996-07-31 -S000001177 ORF Verified YHR135C YCK1 serine/threonine protein kinase YCK1|CKI2 chromosome 8 L000002500 8 374310 372694 C 2011-02-03 1996-07-31 Palmitoylated plasma membrane-bound casein kinase I (CK1) isoform; shares redundant functions with Yck2p in morphogenesis, proper septin assembly, endocytic trafficking, and glucose sensing; stabilized by Sod1p binding in the presence of glucose and oxygen, causing glucose repression of respiratory metabolism; involved in the phosphorylation and regulation of glucose sensor Rgt2p; YCK1 has a paralog, YCK2, that arose from the whole genome duplication -S000030130 CDS YHR135C 8 374310 372694 C 2011-02-03 1996-07-31 -S000001178 ORF Verified YHR136C SPL2 chromosome 8 L000004174 8 375100 374654 C 2011-02-03 1996-07-31 Protein with similarity to cyclin-dependent kinase inhibitors; downregulates low-affinity phosphate transport during phosphate limitation by targeting Pho87p to the vacuole; upstream region harbors putative hypoxia response element (HRE) cluster; overproduction suppresses a plc1 null mutation; promoter shows an increase in Snf2p occupancy after heat shock; GFP-fusion protein localizes to the cytoplasm -S000030305 CDS YHR136C 8 375100 374654 C 2011-02-03 1996-07-31 -S000001179 ORF Verified YHR137W ARO9 aromatic-amino-acid:2-oxoglutarate transaminase chromosome 8 L000003950 8 375709 377250 W 2011-02-03 1996-07-31 Aromatic aminotransferase II; catalyzes the first step of tryptophan, phenylalanine, and tyrosine catabolism -S000033667 CDS YHR137W 8 375709 377250 W 2011-02-03 1996-07-31 -S000028649 ORF Dubious YHR137C-A chromosome 8 8 376388 375738 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene ARO9/YHR137W; identified by gene-trapping, expression analysis, and genome-wide homology searching -S000032425 CDS YHR137C-A 8 376388 375738 C 2011-02-03 2003-07-29 -S000001180 ORF Verified YHR138C chromosome 8 8 377699 377355 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Pbi2p; double null mutant lacking Pbi2p and Yhr138cp exhibits highly fragmented vacuoles; protein abundance increases in response to DNA replication stress -S000033725 CDS YHR138C 8 377699 377355 C 2011-02-03 1996-07-31 -S000001181 ORF Verified YHR139C SPS100 chromosome 8 L000002027 8 379199 378219 C 2011-02-03 1996-07-31 Protein required for spore wall maturation; expressed during sporulation; may be a component of the spore wall; expression also induced in cells treated with the mycotoxin patulin; SPS100 has a paralog, YGP1, that arose from the whole genome duplication -S000033864 CDS YHR139C 8 379199 378219 C 2011-02-03 1996-07-31 -S000003533 ORF Dubious YHR139C-A chromosome 8 8 380419 380108 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035738 CDS YHR139C-A 8 380419 380108 C 2011-02-03 1996-07-31 -S000001182 ORF Uncharacterized YHR140W chromosome 8 8 380572 381291 W 2011-02-03 1996-07-31 Putative integral membrane protein of unknown function -S000033477 CDS YHR140W 8 380572 381291 W 2011-02-03 1996-07-31 -S000007297 snoRNA_gene snR32 SNR32 chromosome 8 L000001970 8 381540 381727 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2191 -S000036759 noncoding_exon snR32 8 381540 381727 W 2011-02-03 2000-05-19 -S000001183 ORF Verified YHR141C RPL42B eL42|ribosomal 60S subunit protein L42B|L44e|YP44|YL27|L42B|L41B|MAK18 chromosome 8 L000001732|L000000990 8 382751 381990 C 95 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L42B; required for propagation of the killer toxin-encoding M1 double-stranded RNA satellite of the L-A double-stranded RNA virus; homologous to mammalian ribosomal protein L36A, no bacterial homolog; RPL42B has a paralog, RPL42A, that arose from the whole genome duplication -S000033511 CDS YHR141C 8 382306 381990 C 2011-02-03 1996-07-31 -S000033510 CDS YHR141C 8 382751 382748 C 2011-02-03 1996-07-31 -S000033512 intron YHR141C 8 382747 382307 C 2011-02-03 1996-07-31 -S000001184 ORF Verified YHR142W CHS7 chromosome 8 S000007442 8 383538 384488 W 2011-02-03 1996-07-31 Protein of unknown function; may be involved in chitin biosynthesis by regulation of Chs3p export from the ER; relocalizes from bud neck to ER upon DNA replication stress -S000033600 CDS YHR142W 8 383538 384488 W 2011-02-03 1996-07-31 -S000001186 ORF Verified YHR143W DSE2 chromosome 8 8 385510 386487 W 2011-02-03 1996-07-31 Daughter cell-specific secreted protein with similarity to glucanases; degrades cell wall from the daughter side causing daughter to separate from mother; expression is repressed by cAMP -S000034514 CDS YHR143W 8 385510 386487 W 2011-02-03 1996-07-31 -S000001185 ORF Verified YHR143W-A RPC10 DNA-directed RNA polymerase core subunit RPC10|ABC10-alpha|RPB12 chromosome 8 L000001686 8 387233 387445 W 2011-02-03 1996-07-31 RNA polymerase subunit ABC10-alpha, found in RNA pol I, II, and III; relocalizes from nucleolus to cytoplasm upon DNA replication stress -S000036603 CDS YHR143W-A 8 387233 387445 W 2011-02-03 1996-07-31 -S000001187 ORF Verified YHR144C DCD1 deoxycytidine monophosphate deaminase chromosome 8 L000000496 8 388726 387788 C 2011-02-03 1996-07-31 Deoxycytidine monophosphate (dCMP) deaminase; involved in dUMP and dTMP biosynthesis; expression is NOT cell cycle regulated -S000034581 CDS YHR144C 8 388726 387788 C 2011-02-03 1996-07-31 -S000006682 tRNA_gene tP(UGG)H SUF8 chromosome 8 L000002156|L000003859 8 388995 388893 C 82 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons -S000035984 intron tP(UGG)H 8 388959 388929 C 2011-02-03 2000-05-19 -S000035983 noncoding_exon tP(UGG)H 8 388928 388893 C 2011-02-03 2000-05-19 -S000035982 noncoding_exon tP(UGG)H 8 388995 388960 C 2011-02-03 2000-05-19 -S000001188 ORF Dubious YHR145C chromosome 8 8 389337 388981 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034646 CDS YHR145C 8 389337 388981 C 2011-02-03 1996-07-31 -S000006997 long_terminal_repeat YHRCdelta10 chromosome 8 8 389509 389177 C 2011-02-03 2000-05-19 Ty2 LTR -S000006998 long_terminal_repeat YHRCdelta11 chromosome 8 8 389845 389613 C 2011-02-03 2000-05-19 Ty1 LTR -S000001189 ORF Verified YHR146W CRP1 chromosome 8 8 390300 391697 W 2011-02-03 1996-07-31 Protein that binds to cruciform DNA structures; CRP1 has a paralog, MDG1, that arose from the whole genome duplication -S000035695 CDS YHR146W 8 390300 391697 W 2011-02-03 1996-07-31 -S000118360 ARS ARS818 ARSVIII-392 chromosome 8 8 392180 392395 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178109 ARS_consensus_sequence ARS818 8 392249 392233 C 2014-11-18 2014-11-18 -S000001190 ORF Verified YHR147C MRPL6 mitochondrial 54S ribosomal protein YmL16|YmL16 chromosome 8 L000001161 8 393283 392639 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit -S000035761 CDS YHR147C 8 393283 392639 C 2011-02-03 1996-07-31 -S000001191 ORF Verified YHR148W IMP3 snoRNA-binding rRNA-processing protein IMP3 chromosome 8 S000007425 8 393534 394085 W 2011-02-03 1996-07-31 Component of the SSU processome; SSU processome is required for pre-18S rRNA processing, essential protein that interacts with Mpp10p and mediates interactions of Imp4p and Mpp10p with U3 snoRNA -S000035958 CDS YHR148W 8 393534 394085 W 2011-02-03 1996-07-31 -S000001192 ORF Verified YHR149C SKG6 chromosome 8 8 396659 394455 C 2011-02-03 1996-07-31 Integral membrane protein; localizes primarily to growing sites such as the bud tip or the cell periphery; potential Cdc28p substrate; Skg6p interacts with Zds1p and Zds2p; SKG6 has a paralog, TOS2, that arose from the whole genome duplication -S000037794 CDS YHR149C 8 396659 394455 C 2011-02-03 1996-07-31 -S000001193 ORF Verified YHR150W PEX28 chromosome 8 8 397251 398990 W 2011-02-03 1996-07-31 Peroxisomal integral membrane peroxin; involved in the regulation of peroxisomal size, number and distribution; genetic interactions suggest that Pex28p and Pex29p act at steps upstream of those mediated by Pex30p, Pex31p, and Pex32p -S000037560 CDS YHR150W 8 397251 398990 W 2011-02-03 1996-07-31 -S000001194 ORF Verified YHR151C MTC6 chromosome 8 8 400848 399268 C 2011-02-03 1996-07-31 Protein of unknown function; mtc6 is synthetically sick with cdc13-1; SWAT-GFP and mCherry fusion proteins localize to the vacuole while SWAT-GFP fusion also localizes to the endoplasmic reticulum -S000037592 CDS YHR151C 8 400848 399268 C 2011-02-03 1996-07-31 -S000001195 ORF Verified YHR152W SPO12 SDB21 chromosome 8 L000002003|S000029441|L000001821 8 401434 401955 W 83 2011-02-03 1996-07-31 Nucleolar protein of unknown function; positive regulator of mitotic exit; involved in regulating release of Cdc14p from the nucleolus in early anaphase, may play similar role in meiosis; SPO12 has a paralog, BNS1, that arose from the whole genome duplication -S000037692 CDS YHR152W 8 401434 401955 W 2011-02-03 1996-07-31 -S000001196 ORF Verified YHR153C SPO16 chromosome 8 L000002007 8 402682 402086 C 83 2011-02-03 1996-07-31 Meiosis-specific protein involved in synaptonemal complex assembly; implicated in regulation of crossover formation; required for sporulation -S000037713 CDS YHR153C 8 402682 402086 C 2011-02-03 1996-07-31 -S000001197 ORF Verified YHR154W RTT107 ESC4 chromosome 8 L000004424 8 402966 406178 W 2011-02-03 1996-07-31 Protein implicated in Mms22-dependent DNA repair during S phase; involved in recruiting the SMC5/6 complex to double-strand breaks; DNA damage induces phosphorylation by Mec1p at one or more SQ/TQ motifs; interacts with Mms22p and Slx4p; has four BRCT domains; has a role in regulation of Ty1 transposition; relative distribution to nuclear foci increases upon DNA replication stress -S000030580 CDS YHR154W 8 402966 406178 W 2011-02-03 1996-07-31 -S000001198 ORF Verified YHR155W LAM1 YSP1 chromosome 8 8 407103 410789 W 2011-02-03 1996-07-31 Putative sterol transfer protein; localizes to puncta in the cortical ER; probable role in retrograde transport of sterols from the plasma membrane to the ER; one of six StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes; contains GRAM, StART-like (VASt) and two PH-like domains -S000030669 CDS YHR155W 8 407103 410789 W 2011-02-03 1996-07-31 -S000006462 snoRNA_gene snR71 SNR71 chromosome 8 L000004540 8 411228 411317 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2946 -S000031782 noncoding_exon snR71 8 411228 411317 W 2011-02-03 2000-05-19 -S000001199 ORF Verified YHR156C LIN1 U5 snRNP complex subunit LIN1|SNU40 chromosome 8 8 412406 411384 C 2011-02-03 1996-07-31 Non-essential component of U5 snRNP; nuclear protein; physically interacts with Irr1p of cohesin complex; may link together proteins involved in chromosome segregation, mRNA splicing and DNA replication -S000030744 CDS YHR156C 8 412406 411384 C 2011-02-03 1996-07-31 -S000001200 ORF Verified YHR157W REC104 chromosome 8 L000001605 8 412907 413455 W 107 2011-02-03 1996-07-31 Protein involved in early stages of meiotic recombination; required for meiotic crossing over; forms a complex with Rec102p and Spo11p necessary during the initiation of recombination -S000030900 CDS YHR157W 8 412907 413455 W 2011-02-03 1996-07-31 -S000001201 ORF Verified YHR158C KEL1 chromosome 8 L000003592 8 417179 413685 C 2011-02-03 1996-07-31 Protein required for proper cell fusion and cell morphology; forms a complex with Bud14p and Kel2p that regulates Bnr1p (formin) to affect actin cable assembly, cytokinesis, and polarized growth; functions in a complex with Kel2p to negatively regulate mitotic exit, interacts with Tem1p and Lte1p; localizes to regions of polarized growth; potential Cdc28p substrate -S000031842 CDS YHR158C 8 417179 413685 C 2011-02-03 1996-07-31 -S000001202 ORF Uncharacterized YHR159W TDA11 chromosome 8 8 417549 419063 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; potential Cdc28p substrate; null mutant is sensitive to expression of the top1-T722A allele -S000032058 CDS YHR159W 8 417549 419063 W 2011-02-03 1996-07-31 -S000001203 ORF Verified YHR160C PEX18 chromosome 8 L000004796 8 420072 419221 C 2011-02-03 1996-07-31 Peroxin; required for targeting of peroxisomal matrix proteins containing PTS2; interacts with Pex7p; partially redundant with Pex21p; primarily responsible for peroxisomal import during growth on oleate, and expression is induced during oleate growth -S000031912 CDS YHR160C 8 420072 419221 C 2011-02-03 1996-07-31 -S000001204 ORF Verified YHR161C YAP1801 chromosome 8 L000004198 8 422286 420373 C 2011-02-03 1996-07-31 Protein of the AP180 family, involved in clathrin cage assembly; binds Pan1p and clathrin; YAP1801 has a paralog, YAP1802, that arose from the whole genome duplication -S000032851 CDS YHR161C 8 422286 420373 C 2011-02-03 1996-07-31 -S000001205 ORF Verified YHR162W MPC2 mitochondrial pyruvate carrier chromosome 8 8 423072 423461 W 2011-02-03 1996-07-31 Highly conserved subunit of the mitochondrial pyruvate carrier (MPC); expressed during growth on fermentable carbon sources, and heterodimerizes with Mpc1p to form the fermentative isoform of MPC; MPC localizes to the mitochondrial inner membrane and mediates pyruvate uptake; MPC2 paralog, MPC3, heterodimerizes with Mpc1p to form the respiratory MPC isoform -S000033001 CDS YHR162W 8 423072 423461 W 2011-02-03 1996-07-31 -S000001206 ORF Verified YHR163W SOL3 6-phosphogluconolactonase SOL3 chromosome 8 L000003117 8 423724 424473 W 2011-02-03 1996-07-31|2005-11-07 6-phosphogluconolactonase; catalyzes the second step of the pentose phosphate pathway; weak multicopy suppressor of los1-1 mutation; homologous to Sol2p and Sol1p; SOL3 has a paralog, SOL4, that arose from the whole genome duplication -S000033074 CDS YHR163W 8 423724 424473 W 2011-02-03 1996-07-31|2005-11-07 -S000001207 ORF Verified YHR164C DNA2 bifunctional ATP-dependent DNA helicase/ssDNA endodeoxyribonuclease DNA2|WEB2 chromosome 8 L000003158 8 429178 424610 C 2011-02-03 1996-07-31 Tripartite DNA replication factor; single-stranded DNA-dependent ATPase, ATP-dependent nuclease, helicase; tracking protein for flap cleavage during Okazaki fragment maturation; involved in DNA repair/processing of meiotic DNA double strand breaks; component of telomeric chromatin with cell-cycle dependent localization; required for telomerase-dependent telomere synthesis; forms nuclear foci upon DNA replication stress; human homolog DNA2 complements yeast dna2 mutant -S000033680 CDS YHR164C 8 429178 424610 C 2011-02-03 1996-07-31 -S000028783 ORF Dubious YHR165W-A chromosome 8 8 436647 436958 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps ORF PRP8/YHR165C -S000033524 CDS YHR165W-A 8 436647 436958 W 2011-02-03 2003-07-29 -S000001208 ORF Verified YHR165C PRP8 U4/U6-U5 snRNP complex subunit PRP8|USA2|SLT21|RNA8|DNA39|DBF3 chromosome 8 L000001500|L000003226 8 436948 429707 C 2011-02-03 1996-07-31 Component of U4/U6-U5 snRNP complex; involved in second catalytic step of splicing; participates in spliceosomal assembly through its interaction with U1 snRNA; largest and most evolutionarily conserved protein of the spliceosome; mutations in human ortholog, PRPF8, cause Retinitis pigmentosa and missplicing in Myelodysplastic syndrome; mouse ortholog interacts with androgen receptor and may have a role in prostate cancer -S000033804 CDS YHR165C 8 436948 429707 C 2011-02-03 1996-07-31 -S000001209 ORF Verified YHR166C CDC23 anaphase promoting complex subunit CDC23 chromosome 8 L000000261 8 439050 437170 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition -S000033878 CDS YHR166C 8 439050 437170 C 2011-02-03 1996-07-31 -S000001210 ORF Verified YHR167W THP2 chromosome 8 8 439342 440127 W 2011-02-03 1996-07-31 Subunit of the THO and TREX complexes; THO connects transcription elongation and mitotic recombination, and TREX is recruited to activated genes and couples transcription to mRNA export; involved in telomere maintenance -S000034871 CDS YHR167W 8 439342 440127 W 2011-02-03 1996-07-31 -S000001211 ORF Verified YHR168W MTG2 putative GTPase MTG2 chromosome 8 8 440377 441933 W 2011-02-03 1996-07-31|2011-02-03 Putative GTPase; member of the Obg family; peripheral protein of the mitochondrial inner membrane that associates with the large ribosomal subunit; required for mitochondrial translation, possibly via a role in ribosome assembly -S000035023 CDS YHR168W 8 440377 441933 W 2011-02-03 1996-07-31|2011-02-03 -S000001212 ORF Verified YHR169W DBP8 ATP-dependent RNA helicase DBP8 chromosome 8 L000004248 8 442181 443476 W 2011-02-03 1996-07-31 ATPase, putative RNA helicase of the DEAD-box family; component of 90S preribosome complex involved in production of 18S rRNA and assembly of 40S small ribosomal subunit; ATPase activity stimulated by association with Esf2p -S000035188 CDS YHR169W 8 442181 443476 W 2011-02-03 1996-07-31 -S000001213 ORF Verified YHR170W NMD3 ribosome-binding protein NMD3|SRC5 chromosome 8 L000002937 8 443828 445384 W 2011-02-03 1996-07-31 Protein involved in nuclear export of the large ribosomal subunit; acts as a Crm1p-dependent adapter protein for export of nascent ribosomal subunits through the nuclear pore complex -S000036170 CDS YHR170W 8 443828 445384 W 2011-02-03 1996-07-31 -S000001214 ORF Verified YHR171W ATG7 APG11|APG7|CVT2 chromosome 8 L000004701|S000029035|L000004786 8 445713 447605 W 2005-11-07 1996-07-31 Autophagy-related protein and dual specificity member of the E1 family; mediates the attachment of Atg12p to Atg5p and Atg8p to phosphatidylethanolamine which are required steps in autophagosome formation; E1 enzymes are also known as ubiquitin-activating enzymes; involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner -S000036922 CDS YHR171W 8 445713 447605 W 2005-11-07 1996-07-31 -S000118361 ARS ARS820 ARSVIII-448 chromosome 8 8 447714 447795 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178110 ARS_consensus_sequence ARS820 8 447793 447777 C 2014-11-18 2014-11-18 -S000001215 ORF Verified YHR172W SPC97 chromosome 8 L000003543 8 448335 450806 W 2005-11-07 1996-07-31 Component of the microtubule-nucleating Tub4p (gamma-tubulin) complex; interacts with Spc110p at the spindle pole body (SPB) inner plaque and with Spc72p at the SPB outer plaque -S000036987 CDS YHR172W 8 448335 450806 W 2005-11-07 1996-07-31 -S000001216 ORF Uncharacterized YHR173C chromosome 8 8 451153 450815 C 2005-11-07 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; SWAT-GFP and mCherry fusion proteins localize to the vacuole -S000037013 CDS YHR173C 8 451153 450815 C 2005-11-07 1996-07-31 -S000001217 ORF Verified YHR174W ENO2 phosphopyruvate hydratase ENO2 chromosome 8 L000000560 8 451327 452640 W 2005-11-07 1996-07-31 Enolase II, a phosphopyruvate hydratase; catalyzes conversion of 2-phosphoglycerate to phosphoenolpyruvate during glycolysis and the reverse reaction during gluconeogenesis; expression induced in response to glucose; ENO2 has a paralog, ENO1, that arose from the whole genome duplication -S000037161 CDS YHR174W 8 451327 452640 W 2005-11-07 1996-07-31 -S000001218 ORF Verified YHR175W CTR2 low-affinity Cu transporter chromosome 8 L000004070 8 452872 453441 W 2005-11-07 1996-07-31 Low-affinity copper transporter of the vacuolar membrane; mutation confers resistance to toxic copper concentrations, while overexpression confers resistance to copper starvation; regulated by nonsense-mediated mRNA decay pathway -S000029818 CDS YHR175W 8 452872 453441 W 2005-11-07 1996-07-31 -S000028553 ORF Uncharacterized YHR175W-A chromosome 8 8 453558 453707 W 2005-11-07 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031239 CDS YHR175W-A 8 453558 453707 W 2005-11-07 2003-07-29 -S000001219 ORF Verified YHR176W FMO1 N,N-dimethylaniline monooxygenase chromosome 8 8 454229 455527 W 2005-11-07 2004-01-29|1996-07-31 Flavin-containing monooxygenase; localized to the cytoplasmic face of the ER membrane; catalyzes oxidation of biological thiols to maintain the ER redox buffer ratio for correct folding of disulfide-bonded proteins -S000029937 CDS YHR176W 8 454229 455527 W 2005-11-07 2004-01-29|1996-07-31 -S000001220 ORF Verified YHR177W GON3 chromosome 8 8 456591 457952 W 2005-11-07 1996-07-31 Putative transcription factor containing a WOPR domain; binds DNA in vitro; similar to C. albicans Wor1p transcription factor that regulates white-opaque switching; overexpression causes a cell cycle delay or arrest -S000030949 CDS YHR177W 8 456591 457952 W 2005-11-07 1996-07-31 -S000001221 ORF Verified YHR178W STB5 chromosome 8 L000003368 8 459299 461530 W 2005-11-07 1996-07-31 Transcription factor; involved in regulating multidrug resistance and oxidative stress response; forms a heterodimer with Pdr1p; contains a Zn(II)2Cys6 zinc finger domain that interacts with a pleiotropic drug resistance element in vitro -S000031050 CDS YHR178W 8 459299 461530 W 2005-11-07 1996-07-31 -S000001222 ORF Verified YHR179W OYE2 NADPH dehydrogenase chromosome 8 L000001325 8 462502 463704 W 2005-11-07 1996-07-31 Conserved NADPH oxidoreductase containing flavin mononucleotide (FMN); responsible for geraniol reduction into citronellol during fermentation; homologous to Oye3p with different ligand binding and catalytic properties; may be involved in sterol metabolism, oxidative stress response, and programmed cell death; protein abundance increases in response to DNA replication stress -S000031157 CDS YHR179W 8 462502 463704 W 2005-11-07 1996-07-31 -S000006999 long_terminal_repeat YHRCdelta12 chromosome 8 8 464147 463920 C 2005-11-07 2000-05-19 Ty1 LTR -S000001223 ORF Dubious YHR180W chromosome 8 8 465178 465669 W 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000032113 CDS YHR180W 8 465178 465669 W 2005-11-07 1996-07-31 -S000007009 long_terminal_repeat YHRWdelta13 chromosome 8 8 466549 466863 W 2005-11-07 2000-05-19 Ty1 LTR -S000028555 ORF Dubious YHR180W-A chromosome 8 8 466932 467114 W 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious ORF YHR180C-B and long terminal repeat YHRCsigma3 -S000031241 CDS YHR180W-A 8 466932 467114 W 2005-11-07 2003-07-29 -S000007004 long_terminal_repeat YHRCsigma3 chromosome 8 8 466975 466884 C 2005-11-07 2000-05-19 Ty3 LTR -S000006751 tRNA_gene tT(UGU)H chromosome 8 L000003857 8 466990 467061 W 2005-11-07 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000036268 noncoding_exon tT(UGU)H 8 466990 467061 W 2005-11-07 2000-05-19 -S000028554 ORF Dubious YHR180C-B chromosome 8 8 467062 466958 C 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the dubious ORF YHR180W-A -S000031240 CDS YHR180C-B 8 467062 466958 C 2005-11-07 2003-07-29 -S000001224 ORF Verified YHR181W SVP26 ERV26 chromosome 8 8 467228 467914 W 2005-11-07 1996-07-31 Integral membrane protein of the early Golgi apparatus and ER; involved in COP II vesicle transport; may also function to promote retention of proteins in the early Golgi compartment -S000032177 CDS YHR181W 8 467228 467914 W 2005-11-07 1996-07-31 -S000001225 ORF Verified YHR182W chromosome 8 8 468219 470576 W 2005-11-07 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and cytoplasm; relocalizes from bud neck to cytoplasm upon DNA replication stress -S000032262 CDS YHR182W 8 468219 470576 W 2005-11-07 1996-07-31 -S000001226 ORF Verified YHR183W GND1 phosphogluconate dehydrogenase (decarboxylating) GND1 chromosome 8 L000003125 8 470960 472429 W 2005-11-07 1996-07-31 6-phosphogluconate dehydrogenase (decarboxylating); catalyzes an NADPH regenerating reaction in the pentose phosphate pathway; required for growth on D-glucono-delta-lactone and adaptation to oxidative stress; GND1 has a paralog, GND2, that arose from the whole genome duplication -S000033135 CDS YHR183W 8 470960 472429 W 2005-11-07 1996-07-31 -S000028784 ORF Dubious YHR182C-A chromosome 8 8 471412 470939 C 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF GND1/YHR183W -S000033525 CDS YHR182C-A 8 471412 470939 C 2005-11-07 2003-07-29 -S000001227 ORF Verified YHR184W SSP1 SPO3 chromosome 8 L000004410|L000004488 8 472744 474459 W 2005-11-07 1996-07-31 Protein involved in the control of meiotic nuclear division; involved in the coordination of meiosis with spore formation; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane during meiosis II; required for assembly of the leading edge coat and both prospore membrane shaping and organization; transcription is induced midway through meiosis -S000033191 CDS YHR184W 8 472744 474459 W 2005-11-07 1996-07-31 -S000001228 ORF Verified YHR185C PFS1 ADY1 chromosome 8 L000004781 8 475340 474627 C 2005-11-07 1996-07-31 Sporulation protein required for prospore membrane formation; required for prospore membrane formation at selected spindle poles; ensures functionality of all four spindle pole bodies during meiosis II; not required for meiotic recombination or meiotic chromosome segregation -S000033215 CDS YHR185C 8 475340 474627 C 2005-11-07 1996-07-31 -S000006768 tRNA_gene tV(CAC)H chromosome 8 L000003858 8 475778 475706 C 2005-11-07 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis -S000030621 noncoding_exon tV(CAC)H 8 475778 475706 C 2005-11-07 2000-05-19 -S000001229 ORF Verified YHR186C KOG1 ubiquitin-binding TORC1 subunit KOG1|LAS24 chromosome 8 8 480672 475999 C 2005-11-07 1996-07-31 Subunit of TORC1; TORC1 is a rapamycin-sensitive complex involved in growth control that contains Tor1p or Tor2p, Lst8p and Tco89p; contains four HEAT repeats and seven WD-40 repeats; may act as a scaffold protein to couple TOR and its effectors -S000033270 CDS YHR186C 8 480672 475999 C 2005-11-07 1996-07-31 -S000001230 ORF Verified YHR187W IKI1 Elongator subunit IKI1|HAP2|ELP5|TOT5 chromosome 8 L000003562 8 480990 481919 W 2005-11-07 1996-07-31 Subunit of hexameric RecA-like ATPase Elp456 Elongator subcomplex; which is required for modification of wobble nucleosides in tRNA; iki1 mutations confer resistance to the K. lactis toxin zymocin -S000034195 CDS YHR187W 8 480990 481919 W 2005-11-07 1996-07-31 -S000001231 ORF Verified YHR188C GPI16 GPI-anchor transamidase subunit GPI16 chromosome 8 8 483837 482005 C 2005-11-07 1996-07-31 Subunit of the glycosylphosphatidylinositol transamidase complex; transmembrane protein; adds GPIs to newly synthesized proteins; human PIG-Tp homolog -S000034241 CDS YHR188C 8 483837 482005 C 2005-11-07 1996-07-31 -S000001232 ORF Verified YHR189W PTH1 aminoacyl-tRNA hydrolase|PTH chromosome 8 8 484028 484600 W 2005-11-07 1996-07-31 One of two mitochondrially-localized peptidyl-tRNA hydrolases; dispensable for respiratory growth on rich medium, but required for respiratory growth on minimal medium; see also PTH2 -S000034422 CDS YHR189W 8 484028 484600 W 2005-11-07 1996-07-31 -S000001233 ORF Verified YHR190W ERG9 bifunctional farnesyl-diphosphate farnesyltransferase/squalene synthase chromosome 8 L000000575 8 484845 486179 W 2005-11-07 1996-07-31 Farnesyl-diphosphate farnesyl transferase (squalene synthase); joins two farnesyl pyrophosphate moieties to form squalene in the sterol biosynthesis pathway -S000036394 CDS YHR190W 8 484845 486179 W 2005-11-07 1996-07-31 -S000001234 ORF Verified YHR191C CTF8 chromosome 8 L000003309 8 486631 486230 C 2005-11-07 1996-07-31 Subunit of a complex with Ctf18p; shares some subunits with Replication Factor C; required for sister chromatid cohesion -S000036427 CDS YHR191C 8 486631 486230 C 2005-11-07 1996-07-31 -S000001235 ORF Verified YHR192W LNP1 chromosome 8 8 486826 487662 W 2005-11-07 1996-07-31 Lunapark family member involved in ER network formation; regulates the ER asymmetry-induced inheritance block during ER stress; localizes to ER junctions and this localization is regulated by the yeast atlastin ortholog Sey1p; interacts with the reticulon protein Rtn1p; induced in response to the DNA-damaging agent MMS -S000036575 CDS YHR192W 8 486826 487662 W 2005-11-07 1996-07-31 -S000001236 ORF Verified YHR193C EGD2 chromosome 8 L000000546|L000002606 8 488236 487712 C 2005-11-07 1996-07-31 Alpha subunit of the nascent polypeptide-associated complex (NAC); involved in protein sorting and translocation; associated with cytoplasmic ribosomes -S000036606 CDS YHR193C 8 488236 487712 C 2005-11-07 1996-07-31 -S000001237 ORF Verified YHR194W MDM31 chromosome 8 8 488657 490396 W 2005-11-07 1996-07-31 Mitochondrial protein that may have a role in phospholipid metabolism; inner membrane protein with similarity to Mdm32p; required for normal mitochondrial morphology and inheritance; interacts genetically with MMM1, MMM2, MDM10, MDM12, and MDM34 -S000037365 CDS YHR194W 8 488657 490396 W 2005-11-07 1996-07-31 -S000028785 ORF Dubious YHR193C-A chromosome 8 8 489027 488653 C 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified ORF MDM31/YHR194W -S000033528 CDS YHR193C-A 8 489027 488653 C 2005-11-07 2003-07-29 -S000001238 ORF Verified YHR195W NVJ1 VAB36 chromosome 8 8 490747 491712 W 2005-11-07 1996-07-31 Nuclear envelope protein; anchored to the nuclear inner membrane, that interacts with the vacuolar membrane protein Vac8p to promote formation of nucleus-vacuole junctions during piecemeal microautophagy of the nucleus (PMN) -S000037505 CDS YHR195W 8 490747 491712 W 2005-11-07 1996-07-31 -S000001239 ORF Verified YHR196W UTP9 chromosome 8 8 491931 493658 W 2005-11-07 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA -S000030211 CDS YHR196W 8 491931 493658 W 2005-11-07 1996-07-31 -S000001240 ORF Verified YHR197W RIX1 IPI2 chromosome 8 8 493896 496187 W 2005-11-07 1996-07-31|2011-02-03 Component of the Rix1 complex and possibly pre-replicative complexes; required for processing of ITS2 sequences from 35S pre-rRNA; component of the pre-60S ribosomal particle with the dynein-related AAA-type ATPase Mdn1p; required for pre-replicative complex (pre-RC) formation and maintenance during DNA replication licensing; relocalizes to the cytosol in response to hypoxia; essential gene -S000030393 CDS YHR197W 8 493896 496187 W 2005-11-07 1996-07-31|2011-02-03 -S000001241 ORF Verified YHR198C AIM18 FMP22 chromosome 8 8 497280 496315 C 2005-11-07 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays elevated frequency of mitochondrial genome loss -S000030441 CDS YHR198C 8 497280 496315 C 2005-11-07 1996-07-31 -S000001242 ORF Verified YHR199C AIM46 FMP34 chromosome 8 8 498422 497490 C 2005-11-07 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays elevated frequency of mitochondrial genome loss -S000031364 CDS YHR199C 8 498422 497490 C 2005-11-07 1996-07-31 -S000029704 ORF Verified YHR199C-A NBL1 MCL1 chromosome 8 8 498859 498571 C 2005-11-07 2004-02-20 Subunit of the conserved chromosomal passenger complex (CPC); complex regulates mitotic chromosome segregation; not required for the kinase activity of the complex; mediates the interaction of Sli15p and Bir1p; other complex members are Ipl1p, Sli15p, and Bir1p -S000036811 CDS YHR199C-A 8 498719 498571 C 2005-11-07 2004-02-20 -S000036810 CDS YHR199C-A 8 498859 498787 C 2005-11-07 2004-02-20 -S000036812 intron YHR199C-A 8 498786 498720 C 2005-11-07 2004-02-20 -S000001243 ORF Verified YHR200W RPN10 proteasome regulatory particle base subunit RPN10|SUN1|MCB1 chromosome 8 L000003108 8 499079 499885 W 2005-11-07 1996-07-31 Non-ATPase base subunit of the 19S RP of the 26S proteasome; N-terminus plays a role in maintaining the structural integrity of the regulatory particle (RP); binds selectively to polyubiquitin chains; homolog of the mammalian S5a protein -S000036384 CDS YHR200W 8 499079 499885 W 2005-11-07 1996-07-31 -S000001244 ORF Verified YHR201C PPX1 exopolyphosphatase chromosome 8 L000001477 8 501143 499950 C 2005-11-07 1996-07-31 Exopolyphosphatase; hydrolyzes inorganic polyphosphate (poly P) into Pi residues; located in the cytosol, plasma membrane, and mitochondrial matrix -S000036416 CDS YHR201C 8 501143 499950 C 2005-11-07 1996-07-31 -S000118362 ARS ARS822 ARSVIII-502 chromosome 8 8 501756 501996 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000001245 ORF Uncharacterized YHR202W chromosome 8 8 502388 504196 W 2005-11-07 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole, while HA-tagged protein is found in the soluble fraction, suggesting cytoplasmic localization -S000037129 CDS YHR202W 8 502388 504196 W 2005-11-07 1996-07-31 -S000001246 ORF Verified YHR203C RPS4B eS4|ribosomal 40S subunit protein S4B|S4e|rp5|YS6|S7B|S4B chromosome 8 L000001750 8 505530 504476 C 2005-11-07 1999-07-17|1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S4, no bacterial homolog; RPS4B has a paralog, RPS4A, that arose from the whole genome duplication -S000037172 CDS YHR203C 8 505247 504476 C 2005-11-07 1999-07-17|1996-07-31 -S000037171 CDS YHR203C 8 505530 505517 C 2005-11-07 1999-07-17|1996-07-31 -S000037173 intron YHR203C 8 505516 505248 C 2005-11-07 1999-07-17|1996-07-31 -S000001247 ORF Verified YHR204W MNL1 alpha-1,2-mannosidase MNL1|HTM1 chromosome 8 8 506319 508709 W 2005-11-07 1996-07-31 Alpha-1,2-specific exomannosidase of the endoplasmic reticulum; involved in glycan trimming of both folded and misfolded glycoproteins; complexes with Pdi1p, and trims a mannose from Man8GlcNac2 glycans to generate Man7GlcNac2, an oligosaccharide signal on glycoproteins destined for ER-associated protein degradation; requires Pdi1p for stability and substrate recognition; human homolog EDEM1 can complement yeast null mutant -S000037304 CDS YHR204W 8 506319 508709 W 2005-11-07 1996-07-31 -S000001248 ORF Verified YHR205W SCH9 serine/threonine protein kinase SCH9|HRM2|KOM1 chromosome 8 L000001810 8 509363 511837 W 2005-11-07 1996-07-31 AGC family protein kinase; functional ortholog of mammalian S6 kinase; phosphorylated by Tor1p and required for TORC1-mediated regulation of ribosome biogenesis, translation initiation, and entry into G0 phase; involved in transactivation of osmostress-responsive genes; regulates G1 progression, cAPK activity and nitrogen activation of the FGM pathway; integrates nutrient signals and stress signals from sphingolipids to regulate lifespan -S000037366 CDS YHR205W 8 509363 511837 W 2005-11-07 1996-07-31 -S000001249 ORF Verified YHR206W SKN7 kinase-regulated stress-responsive transcription factor SKN7|POS9|BRY1 chromosome 8 L000001908 8 512732 514600 W 2005-11-07 1996-07-31 Nuclear response regulator and transcription factor; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; part of a branched two-component signaling system; required for optimal induction of heat-shock genes in response to oxidative stress; involved in osmoregulation; relocalizes to the cytosol in response to hypoxia; SKN7 has a paralog, HMS2, that arose from the whole genome duplication -S000029994 CDS YHR206W 8 512732 514600 W 2005-11-07 1996-07-31 -S000001250 ORF Verified YHR207C SET5 S-adenosylmethionine-dependent methyltransferase chromosome 8 8 516485 514905 C 2005-11-07 1996-07-31 Methyltransferase involved in methylation of histone H4 Lys5, -8, -12; S-adenosylmethionine-dependent; zinc-finger protein, contains one canonical and two unusual fingers in unusual arrangements; deletion enhances replication of positive-strand RNA virus -S000030030 CDS YHR207C 8 516485 514905 C 2005-11-07 1996-07-31 -S000001251 ORF Verified YHR208W BAT1 branched-chain-amino-acid transaminase BAT1|TWT1|ECA39 chromosome 8 L000002396 8 517532 518713 W 2005-11-07 1996-07-31 Mitochondrial branched-chain amino acid (BCAA) aminotransferase; preferentially involved in BCAA biosynthesis; homolog of murine ECA39; highly expressed during logarithmic phase and repressed during stationary phase; BAT1 has a paralog, BAT2, that arose from the whole genome duplication -S000030198 CDS YHR208W 8 517532 518713 W 2005-11-07 1996-07-31 -S000001252 ORF Verified YHR209W CRG1 S-adenosylmethionine-dependent methyltransferase chromosome 8 8 519437 520312 W 2005-11-07 1996-07-31 S-AdoMet-dependent methyltransferase involved in lipid homeostasis; mediates resistance to a drug cantharidin -S000030378 CDS YHR209W 8 519437 520312 W 2005-11-07 1996-07-31 -S000001253 ORF Uncharacterized YHR210C aldose 1-epimerase superfamily protein chromosome 8 8 521737 520712 C 2005-11-07 1996-07-31 Putative aldose 1-epimerase superfamily protein; non-essential gene; highly expressed under anaeorbic conditions -S000032576 CDS YHR210C 8 521737 520712 C 2005-11-07 1996-07-31 -S000001254 ORF Verified YHR211W FLO5 flocculin FLO5 chromosome 8 L000000618 8 525392 528619 W 2005-11-07 1996-07-31 Lectin-like cell wall protein (flocculin) involved in flocculation; binds mannose chains on the surface of other cells, confers floc-forming ability that is chymotrypsin resistant but heat labile; important for co-flocculation with other yeasts, mediating interaction with specific species; FLO5 has a paralog, FLO1, that arose from a segmental duplication -S000033338 CDS YHR211W 8 525392 528619 W 2005-11-07 1996-07-31 -S000007000 long_terminal_repeat YHRCdelta14 chromosome 8 8 530379 530049 C 2005-11-07 2000-05-19 Ty1 LTR -S000001255 ORF Dubious YHR212C chromosome 8 8 538094 537759 C 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YHR212C has a paralog, YAR060C, that arose from a segmental duplication -S000033360 CDS YHR212C 8 538094 537759 C 2005-11-07 1996-07-31 -S000028650 ORF Uncharacterized YHR212W-A chromosome 8 8 538742 538945 W 2005-11-07 2003-07-29 Pseudogenic fragment with similarity to flocculins; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YHR212W-A has a paralog, YAR061W, that arose from a segmental duplication -S000032453 CDS YHR212W-A 8 538742 538945 W 2005-11-07 2003-07-29 -S000001256 ORF Uncharacterized YHR213W chromosome 8 8 539151 539747 W 2005-11-07 1996-07-31 Pseudogenic fragment with similarity to flocculins; YHR213W has a paralog, YAR062W, that arose from a segmental duplication -S000033478 CDS YHR213W 8 539151 539747 W 2005-11-07 1996-07-31 -S000028651 ORF Uncharacterized YHR213W-A chromosome 8 8 540549 540782 W 2005-11-07 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032454 CDS YHR213W-A 8 540549 540782 W 2005-11-07 2003-07-29 -S000028652 ORF Uncharacterized YHR213W-B chromosome 8 8 540800 541099 W 2005-11-07 2003-07-29 Pseudogenic fragment with similarity to flocculins; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; YHR213W-B has a paralog, YAR064W, that arose from a segmental duplication -S000032455 CDS YHR213W-B 8 540800 541099 W 2005-11-07 2003-07-29 -S000001257 ORF Uncharacterized YHR214W chromosome 8 8 541651 542262 W 2005-11-07 1996-07-31 Putative protein of unknown function; predicted to be a glycosylphosphatidylinositol-modified (GPI) protein; YHR214W has a paralog, YAR066W, that arose from a segmental duplication -S000033542 CDS YHR214W 8 541651 542262 W 2005-11-07 1996-07-31 -S000003535 ORF Dubious YHR214W-A chromosome 8 8 543008 543493 W 2005-11-07 1996-07-31 Dubious open reading frame; induced by zinc deficiency; YHR214W-A has a paralog, YAR068W, that arose from a segmental duplication -S000035568 CDS YHR214W-A 8 543008 543493 W 2005-11-07 1996-07-31 -S000007001 long_terminal_repeat YHRCdelta15 chromosome 8 8 543941 543610 C 2005-11-07 2000-05-19 Ty1 LTR -S000003534 transposable_element_gene YHR214C-B gag-pol fusion protein chromosome 8 8 549346 543964 C 2005-11-07 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes; YHR214C-B has a paralog, YAR070C, that arose from a segmental duplication -S000035139 CDS YHR214C-B 8 547929 543964 C 2005-11-07 1996-07-31 -S000035138 CDS YHR214C-B 8 549346 547931 C 2005-11-07 1996-07-31 -S000035140 plus_1_translational_frameshift YHR214C-B 8 547930 547930 C 2005-11-07 1996-07-31 -S000007421 transposable_element_gene YHR214C-C gag protein chromosome 8 8 549346 547910 C 2005-11-07 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000035142 CDS YHR214C-C 8 549346 547910 C 2005-11-07 1999-07-17 -S000007006 LTR_retrotransposon YHRCTy1-1 Ty1 chromosome 8 8 549637 543610 C 2005-11-07 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats -S000007002 long_terminal_repeat YHRCdelta16 chromosome 8 8 549637 549306 C 2005-11-07 2000-05-19 Ty1 LTR -S000028653 ORF Uncharacterized YHR214C-D chromosome 8 8 550941 550648 C 2005-11-07 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; SWAT-GFP and mCherry fusion proteins localize to the nucleus and endoplasmic reticulum respectively; YHR214C-D has a paralog, YAR069C, that arose from a segmental duplication -S000032456 CDS YHR214C-D 8 550941 550648 C 2005-11-07 2003-07-29 -S000028654 ORF Uncharacterized YHR214C-E chromosome 8 8 551499 551200 C 2005-11-07 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032457 CDS YHR214C-E 8 551499 551200 C 2005-11-07 2003-07-29 -S000001258 ORF Verified YHR215W PHO12 acid phosphatase PHO12|PHO10 chromosome 8 L000001424 8 552099 553502 W 2005-11-07 1996-07-31 One of three repressible acid phosphatases; glycoprotein that is transported to the cell surface by the secretory pathway; pregulated by phosphate starvation; PHO12 has a paralog, PHO11, that arose from a segmental duplication -S000033601 CDS YHR215W 8 552099 553502 W 2005-11-07 1996-07-31 -S000001259 ORF Verified YHR216W IMD2 IMP dehydrogenase IMD2|PUR5 chromosome 8 8 554396 555967 W 2005-11-07 1996-07-31 Inosine monophosphate dehydrogenase; catalyzes the rate-limiting step in GTP biosynthesis, expression is induced by mycophenolic acid resulting in resistance to the drug, expression is repressed by nutrient limitation; IMD2 has a paralog, YAR073W/YAR075W, that arose from a segmental duplication -S000034515 CDS YHR216W 8 554396 555967 W 2005-11-07 1996-07-31 -S000118363 ARS ARS824 ARSVIII-556 chromosome 8 8 556001 556331 2006-08-30 2006-08-30 Autonomously Replicating Sequence -S000028964 telomere TEL08R chromosome 8 8 556105 562643 W 131 2005-11-07 2003-09-09 Telomeric region on the right arm of Chromosome VIII; composed of an X element core sequence, X element combinatorial repeats, an internal stretch of telomeric repeats, a short Y' element, and a terminal stretch of telomeric repeats -S000028966 telomeric_repeat TEL08R 8 556832 556985 W 2005-11-07 2003-09-09 Internal telomeric repeats on the right arm of Chromosome VIII -S000028965 telomeric_repeat TEL08R 8 562457 562643 W 2005-11-07 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome VIII -S000028967 X_element TEL08R 8 556105 556575 W 2005-11-07 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome VIII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028968 X_element_combinatorial_repeat TEL08R 8 556576 556831 W 2005-11-07 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr VIII; contains repeats of the D, C, and B types; formerly called SubTelomeric Repeats -S000028969 Y_prime_element TEL08R 8 556986 562456 W 2005-11-07 2003-09-09 Telomeric short Y' element on the right arm of Chromosome VIII; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs (YHR218W, YHR219W, YHR218W-A, YHR219C-A) -S000001260 ORF Dubious YHR217C chromosome 8 8 557042 556581 C 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; located in the telomeric region TEL08R -S000034583 CDS YHR217C 8 557042 556581 C 2005-11-07 1996-07-31 -S000001261 ORF Uncharacterized YHR218W chromosome 8 8 558014 559924 W 2005-11-07 1996-07-31 Helicase-like protein encoded within the telomeric Y' element -S000034722 CDS YHR218W 8 558014 558615 W 2005-11-07 1996-07-31 -S000034723 CDS YHR218W 8 558715 559924 W 2005-11-07 1996-07-31 -S000034724 intron YHR218W 8 558616 558714 W 2005-11-07 1996-07-31 -S000028786 ORF Dubious YHR218W-A chromosome 8 8 559932 560249 W 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely within telomere TEL08L -S000033530 CDS YHR218W-A 8 559932 560249 W 2005-11-07 2003-07-29 -S000001262 ORF Uncharacterized YHR219W chromosome 8 8 560173 562047 W 2005-11-07 1996-07-31 Putative protein of unknown function with similarity to helicases; located in the telomere region on the right arm of chromosome VIII -S000035716 CDS YHR219W 8 560173 562047 W 2005-11-07 1996-07-31 -S000028655 ORF Dubious YHR219C-A chromosome 8 8 561681 561199 C 2005-11-07 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching -S000032458 CDS YHR219C-A 8 561681 561199 C 2005-11-07 2003-07-29 -S000028658 ORF Dubious YIL177W-A chromosome 9 9 846 1328 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene YIL177C -S000032462 CDS YIL177W-A 9 846 1328 W 2003-07-29 2003-07-29 -S000001439 ORF Uncharacterized YIL177C Y' element ATP-dependent helicase chromosome 9 9 6147 483 C 1994-12-10 1994-12-10 Putative Y' element ATP-dependent helicase -S000034517 CDS YIL177C 9 4598 483 C 1994-12-10 1994-12-10 -S000034516 CDS YIL177C 9 6147 4987 C 1994-12-10 1994-12-10 -S000034518 intron YIL177C 9 4986 4599 C 1994-12-10 1994-12-10 -S000130156 ARS ARS902 chromosome 9 9 7470 8793 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028896 telomere TEL09L chromosome 9 9 7784 1 C -155 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome IX; composed of an X element core sequence, X element combinatorial repeats, a long Y' element, and a short terminal stretch of telomeric repeats -S000028897 telomeric_repeat TEL09L 9 77 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome IX -S000028898 X_element TEL09L 9 7784 7322 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome IX; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028899 X_element_combinatorial_repeat TEL09L 9 7321 6949 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr IX; contains a repeat of the D type with a group I mitochondrial bI4 intron insertion; formerly called SubTelomeric Repeats -S000028900 Y_prime_element TEL09L 9 6948 78 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome IX; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YIL177C and YIL177W-A -S000001438 ORF Uncharacterized YIL176C PAU14 seripauperin PAU14 chromosome 9 9 9155 8793 C 1994-12-10 1994-12-10 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; identical to Pau1p -S000034408 CDS YIL176C 9 9155 8793 C 1994-12-10 1994-12-10 -S000001437 pseudogene YIL175W chromosome 9 9 9183 9500 W 1994-12-10 1994-12-10 Hypothetical protein; classified as pseudogene because there is no ATG at the beginning of this ORF -S000034372 CDS YIL175W 9 9183 9500 W 1994-12-10 1994-12-10 -S000001436 pseudogene YIL174W chromosome 9 9 9469 9696 W 1994-12-10 1994-12-10 Hypothetical protein -S000034275 CDS YIL174W 9 9469 9696 W 1994-12-10 1994-12-10 -S000001435 ORF Verified YIL173W VTH1 signal sequence-binding protein chromosome 9 9 11492 16141 W 1994-12-10 1994-12-10 Putative membrane glycoprotein; has strong similarity to Vth2p and Pep1p/Vps10p; may be involved in vacuolar protein sorting -S000033367 CDS YIL173W 9 11492 16141 W 1994-12-10 1994-12-10 -S000130157 ARS ARS904 chromosome 9 9 16141 16784 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028798 ORF Dubious YIL171W-A chromosome 9 9 18260 18712 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF IMA3/YIL172C -S000033565 CDS YIL171W-A 9 18260 18712 W 2003-07-29 2003-07-29 -S000001434 ORF Verified YIL172C IMA3 oligo-1,6-glucosidase IMA3 chromosome 9 9 18553 16784 C 1994-12-10 1994-12-10 Alpha-glucosidase; weak, but broad substrate specificity for alpha-1,4- and alpha-1,6-glucosides; member of IMA isomaltase family; not required for isomaltose utilization, but Ima3p overexpression allows the ima1 null mutant to grow on isomaltose; lower activitiy and thermostability in vitro than Ima2p despite sequence difference of only 3 amino acids; cleaves alpha-1,3 linkage of nigerose and turanose, but not alpha-1,5 of leucrose; identical to IMA4 -S000033269 CDS YIL172C 9 18553 16784 C 1994-12-10 1994-12-10 -S000001433 pseudogene YIL171W HXT12 chromosome 9 L000002639 9 19515 19844 W 1994-12-10 1994-12-10 Possible pseudogene in strain S288C; YIL171W and the adjacent ORF, YIL170W/HXT12, together encode a non-functional member of the hexose transporter family -S000033235 CDS YIL171W 9 19515 19844 W 1994-12-10 1994-12-10 -S000001432 pseudogene YIL170W HXT12 chromosome 9 9 19847 21220 W 1994-12-10 1994-12-10 Possible pseudogene in strain S288C; YIL170W/HXT12 and the adjacent ORF, YIL171W, together encode a non-functional member of the hexose transporter family -S000032383 CDS YIL170W 9 19847 21220 W 1994-12-10 1994-12-10 -S000001431 ORF Verified YIL169C CSS1 HPF1' chromosome 9 9 26106 23119 C 1994-12-10 1994-12-10 Protein of unknown function, secreted when constitutively expressed; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cell periphery, SWAT-GFP fusion also localizes to the extracellular region, and mCherry fusion also localizes to the vacuole; S/T rich and highly similar to YOL155C, a putative glucan alpha-1,4-glucosidase; transcript is induced in both high and low pH environments; non-essential gene -S000031425 CDS YIL169C 9 26106 23119 C 1994-12-10 1994-12-10 -S000001429 blocked_reading_frame YIL167W SDL1 YIL168W chromosome 9 9 29032 30048 W 2014-11-18 1994-12-10|2014-11-18 Blocked reading frame otherwise encoding L-serine dehydratase -S000031256 CDS YIL167W 9 29032 30048 W 2014-11-18 1994-12-10|2014-11-18 -S000001428 ORF Uncharacterized YIL166C chromosome 9 9 32566 30938 C 1994-12-10 1994-12-10 Putative protein with similarity to allantoate permease; similar to the allantoate permease (Dal5p) subfamily of the major facilitator superfamily; mRNA expression is elevated by sulfur limitation; YIL166C is a non-essential gene -S000030233 CDS YIL166C 9 32566 30938 C 1994-12-10 1994-12-10 -S000001427 ORF Uncharacterized YIL165C chromosome 9 9 34077 33718 C 1994-12-10 1994-12-10 Putative protein of unknown function; mutant exhibits mitophagy defects; in closely related species and other S. cerevisiae strain backgrounds YIL165C and adjacent ORF, YIL164C, likely constitute a single ORF encoding a nitrilase gene -S000030045 CDS YIL165C 9 34077 33718 C 1994-12-10 1994-12-10 -S000001426 ORF Verified YIL164C NIT1 chromosome 9 L000004211 9 34686 34087 C 1994-12-10 1994-12-10 Nitrilase; member of the nitrilase branch of the nitrilase superfamily; in closely related species and other S. cerevisiae strain backgrounds YIL164C and adjacent ORF, YIL165C, likely constitute a single ORF encoding a nitrilase gene -S000029934 CDS YIL164C 9 34686 34087 C 1994-12-10 1994-12-10 -S000001425 ORF Uncharacterized YIL163C chromosome 9 9 37252 36899 C 1994-12-10 1994-12-10 Protein of unknown function; mRNA identified as translated by ribosome profiling data -S000037273 CDS YIL163C 9 37252 36899 C 1994-12-10 1994-12-10 -S000001424 ORF Verified YIL162W SUC2 beta-fructofuranosidase SUC2 chromosome 9 L000002144 9 37385 38983 W -153 1994-12-10 1994-12-10 Invertase; sucrose hydrolyzing enzyme; a secreted, glycosylated form is regulated by glucose repression, and an intracellular, nonglycosylated enzyme is produced constitutively -S000037231 CDS YIL162W 9 37385 38983 W 1994-12-10 1994-12-10 -S000001423 ORF Uncharacterized YIL161W chromosome 9 9 39433 40140 W 1994-12-10 1994-12-10 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; mRNA is enriched in Scp160p-associated mRNPs; YIL161W is a non-essential gene -S000037133 CDS YIL161W 9 39433 40140 W 1994-12-10 1994-12-10 -S000001422 ORF Verified YIL160C POT1 acetyl-CoA C-acyltransferase|POX3|FOX3 chromosome 9 L000001466 9 41444 40191 C 1994-12-10 1994-12-10 3-ketoacyl-CoA thiolase with broad chain length specificity; cleaves 3-ketoacyl-CoA into acyl-CoA and acetyl-CoA during beta-oxidation of fatty acids -S000037007 CDS YIL160C 9 41444 40191 C 1994-12-10 1994-12-10 -S000001421 ORF Verified YIL159W BNR1 formin BNR1 chromosome 9 L000004058 9 41825 45952 W 1994-12-10 1994-12-10 Formin; nucleates the formation of linear actin filaments; involved in processes such as budding and mitotic spindle orientation which require the formation of polarized actin cables; activity is regulated by Hof1p and by the Bud14p-Kel1p-Kel2p complex; dephosphorylated and delocalized from the division site in a Glc7p/Ref2p-dependent manner; functionally redundant with BNI1 -S000035282 CDS YIL159W 9 41825 45952 W 1994-12-10 1994-12-10 -S000001420 ORF Verified YIL158W AIM20 chromosome 9 9 46201 46815 W 1994-12-10 1994-12-10 Protein of unknown function; overexpression causes cell cycle delay or arrest; green fluorescent protein (GFP)-fusion protein localizes to vacuole; null mutant displays elevated frequency of mitochondrial genome loss; relocalizes from nucleus to cytoplasm upon DNA replication stress; AIM20 has a paralog, SKG1, that arose from the whole genome duplication -S000035094 CDS YIL158W 9 46201 46815 W 1994-12-10 1994-12-10 -S000028797 ORF Dubious YIL156W-A chromosome 9 9 47292 47693 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF COA1/YIL157C -S000033563 CDS YIL156W-A 9 47292 47693 W 2003-07-29 2003-07-29 -S000001419 ORF Verified YIL157C COA1 FMP35 chromosome 9 9 47542 46949 C 1994-12-10 1994-12-10 Mitochondrial inner membrane protein; required for assembly of the cytochrome c oxidase complex (complex IV); interacts with complex IV assembly factor Shy1p during the early stages of assembly -S000034088 CDS YIL157C 9 47542 46949 C 1994-12-10 1994-12-10 -S000028511 ORF Uncharacterized YIL156W-B chromosome 9 9 47690 47973 W 2003-07-29 2003-07-29 Putative protein of unknown function; originally identified based on homology to Ashbya gossypii and other related yeasts; SWAT-GFP and mCherry fusion proteins localize to the vacuole, while SWAT-GFP fusion also localizes to the endoplasmic reticulum -S000030265 CDS YIL156W-B 9 47690 47698 W 2003-07-29 2003-07-29 -S000030266 CDS YIL156W-B 9 47761 47973 W 2003-07-29 2003-07-29 -S000030267 intron YIL156W-B 9 47699 47760 W 2003-07-29 2003-07-29 -S000001418 ORF Verified YIL156W UBP7 ubiquitin-specific protease UBP7 chromosome 9 L000003169 9 48091 51306 W 1994-12-10 1994-12-10 Ubiquitin-specific protease that cleaves ubiquitin-protein fusions; UBP7 has a paralog, UBP11, that arose from the whole genome duplication -S000034053 CDS YIL156W 9 48091 51306 W 1994-12-10 1994-12-10 -S000001417 ORF Verified YIL155C GUT2 glycerol-3-phosphate dehydrogenase chromosome 9 L000000747 9 53708 51759 C 1994-12-10 1994-12-10 Mitochondrial glycerol-3-phosphate dehydrogenase; expression is repressed by both glucose and cAMP and derepressed by non-fermentable carbon sources in a Snf1p, Rsf1p, Hap2/3/4/5 complex dependent manner -S000033832 CDS YIL155C 9 53708 51759 C 1994-12-10 1994-12-10 -S000001416 ORF Verified YIL154C IMP2' IMP2 chromosome 9 L000000865 9 55021 53981 C 1994-12-10 1994-12-10 Transcriptional activator involved in maintenance of ion homeostasis; also involved in protection against DNA damage caused by bleomycin and other oxidants; contains a C-terminal leucine-rich repeat -S000033080 CDS YIL154C 9 55021 53981 C 1994-12-10 1994-12-10 -S000001415 ORF Verified YIL153W RRD1 peptidylprolyl isomerase RRD1|YPA1 chromosome 9 L000004483 9 55198 56379 W 1994-12-10 1994-12-10 Peptidyl-prolyl cis/trans-isomerase; activator of the phosphotyrosyl phosphatase activity of PP2A; involved in G1 phase progression, microtubule dynamics, bud morphogenesis and DNA repair; required for rapid reduction of Sgs1p levels in response to rapamycin; subunit of the Tap42p-Sit4p-Rrd1p complex; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress -S000033043 CDS YIL153W 9 55198 56379 W 1994-12-10 1994-12-10 -S000001414 ORF Uncharacterized YIL152W chromosome 9 9 56545 57252 W 1994-12-10 1994-12-10 Putative protein of unknown function -S000032954 CDS YIL152W 9 56545 57252 W 1994-12-10 1994-12-10 -S000001413 ORF Uncharacterized YIL151C ESL1 chromosome 9 9 60694 57338 C 1994-12-10 1994-12-10 hEST1A/B (SMG5/6)-like protein; contributes to environment-sensing adaptive gene expression responses; Esl1p and Esl2p contain a 14-3-3-like domain and a putative PilT N-terminus ribonuclease domain; ESL1 has a paralog, ESL2, that arose from the whole genome duplication -S000032789 CDS YIL151C 9 60694 57338 C 1994-12-10 1994-12-10 -S000001412 ORF Verified YIL150C MCM10 DNA43 chromosome 9 L000000512 9 62728 61013 C 1994-12-10 1994-12-10 Essential chromatin-associated protein; involved in initiation of DNA replication; required for association of MCM2-7 complex with replication origins; required to stabilize catalytic subunit of DNA polymerase-alpha; self-associates through its N-terminal domain -S000031878 CDS YIL150C 9 62728 61013 C 1994-12-10 1994-12-10 -S000001411 ORF Verified YIL149C MLP2 chromosome 9 S000007510 9 68067 63028 C 1994-12-10 1994-12-10 Myosin-like protein associated with the nuclear envelope; nuclear basket protein that connects the nuclear pore complex with the nuclear interior; involved in the Tel1p pathway that controls telomere length; MLP2 has a paralog, MLP1, that arose from the whole genome duplication -S000031703 CDS YIL149C 9 68067 63028 C 1994-12-10 1994-12-10 -S000001410 ORF Verified YIL148W RPL40A eL40|ubiquitin-ribosomal 60S subunit protein L40A fusion protein|L40e|L40A|UB11|UBI1|CEP52A chromosome 9 L000002411|L000000313 9 68708 69528 W 1994-12-10 1994-12-10 Ubiquitin-ribosomal 60S subunit protein L40A fusion protein; cleaved to yield ubiquitin and ribosomal protein L40A; ubiquitin may facilitate assembly of the ribosomal protein into ribosomes; homologous to mammalian ribosomal protein L40, no bacterial homolog; RPL40A has a paralog, RPL40B, that arose from the whole genome duplication; relative distribution to the nucleus increases upon DNA replication stress -S000031651 CDS YIL148W 9 68708 68715 W 1994-12-10 1994-12-10 -S000031652 CDS YIL148W 9 69150 69528 W 1994-12-10 1994-12-10 -S000031653 intron YIL148W 9 68716 69149 W 1994-12-10 1994-12-10 -S000001409 ORF Verified YIL147C SLN1 YPD2 chromosome 9 L000001916 9 73453 69791 C 1994-12-10 1994-12-10 Transmembrane histidine phosphotransfer kinase and osmosensor; regulates MAP kinase cascade; transmembrane protein with an intracellular kinase domain that signals to Ypd1p and Ssk1p, thereby forming a phosphorelay system similar to bacterial two-component regulators -S000031443 CDS YIL147C 9 73453 69791 C 1994-12-10 1994-12-10 -S000178111 ARS ARS907 chromosome 9 9 73820 73991 2014-11-18 2014-11-18 Autonomously replicating sequence -S000001408 ORF Verified YIL146C ATG32 mitophagy protein ATG32|ECM37 chromosome 9 L000003904 9 75773 74184 C 1994-12-10 1994-12-10 Mitochondrial outer membrane protein required to initiate mitophagy; recruits the autophagy adaptor protein Atg11p and the ubiquitin-like protein Atg8p to the mitochondrial surface to initiate mitophagy, the selective vacuolar degradation of mitochondria in response to starvation; can promote pexophagy when placed ectopically in the peroxisomal membrane; regulates mitophagy and ethanol production during alcoholic fermentation -S000030520 CDS YIL146C 9 75773 74184 C 1994-12-10 1994-12-10 -S000001407 ORF Verified YIL145C PAN6 pantoate--beta-alanine ligase PAN6 chromosome 9 9 77283 76354 C 2003-09-22 2003-09-22|1994-12-10 Pantothenate synthase; also known as pantoate-beta-alanine ligase, required for pantothenic acid biosynthesis, deletion causes pantothenic acid auxotrophy, homologous to E. coli panC -S000030395 CDS YIL145C 9 77283 76354 C 2003-09-22 2003-09-22|1994-12-10 -S000001406 ORF Verified YIL144W NDC80 kinetochore-associated Ndc80 complex subunit NDC80|TID3|HEC1 chromosome 9 L000004311 9 78074 80149 W 1994-12-10 1994-12-10 Component of the kinetochore-associated Ndc80 complex; conserved coiled-coil protein involved in chromosome segregation, spindle checkpoint activity, and kinetochore assembly and clustering; evolutionarily conserved; complex members include Ndc80p, Nuf2p, Scp24p, and Spc25p; modified by sumoylation -S000030319 CDS YIL144W 9 78074 80149 W 1994-12-10 1994-12-10 -S000001405 ORF Verified YIL143C SSL2 TFIIH/NER complex ATPase/helicase subunit SSL2|RAD25|LOM3 chromosome 9 L000002086 9 83041 80510 C 1994-12-10 1994-12-10 Component of RNA polymerase transcription factor TFIIH holoenzyme; acts as dsDNA-dependent translocase in context of TFIIH, unwinds DNA strands during initiation and promotes transcription start site (TSS) scanning; has DNA-dependent ATPase/helicase activity; interacts functionally with TFIIB, has roles in TSS selection and gene looping to juxtapose initiation and termination regions; involved in DNA repair; relocalizes to cytosol under hypoxia; homolog of human ERCC3 -S000037507 CDS YIL143C 9 83041 80510 C 1994-12-10 1994-12-10 -S000001404 ORF Verified YIL142W CCT2 chaperonin-containing T-complex subunit CCT2|TCP2|BIN3 chromosome 9 L000002269 9 83302 84885 W 1994-12-10 1994-12-10 Subunit beta of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo -S000037439 CDS YIL142W 9 83302 84885 W 1994-12-10 1994-12-10 -S000028796 ORF Dubious YIL142C-A chromosome 9 9 83540 83208 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF CCT2/YIL142W -S000033561 CDS YIL142C-A 9 83540 83208 C 2003-07-29 2003-07-29 -S000001403 ORF Dubious YIL141W chromosome 9 9 85053 85442 W 1994-12-10 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000037327 CDS YIL141W 9 85053 85442 W 1994-12-10 1994-12-10 -S000001402 ORF Verified YIL140W AXL2 SRO4|BUD10 chromosome 9 L000003104 9 85366 87837 W 1994-12-10 1994-12-10 Integral plasma membrane protein; required for axial budding in haploid cells; localizes to the incipient bud site and bud neck; glycosylated by Pmt4p; potential Cdc28p substrate -S000037249 CDS YIL140W 9 85366 87837 W 1994-12-10 1994-12-10 -S000001401 ORF Verified YIL139C REV7 chromosome 9 L000001618 9 88716 87979 C -101 1994-12-10 1994-12-10 Accessory subunit of DNA polymerase zeta; involved in translesion synthesis during post-replication repair; required for mutagenesis induced by DNA damage; involved in double-strand break repair; forms a complex with Rev3p, Pol31p and Pol32p -S000035566 CDS YIL139C 9 88716 87979 C 1994-12-10 1994-12-10 -S000001400 ORF Verified YIL138C TPM2 tropomyosin TPM2 chromosome 9 L000002329 9 89715 89230 C 1994-12-10 1994-12-10 Minor isoform of tropomyosin; binds to and stabilizes actin cables and filaments, which direct polarized cell growth and the distribution of several organelles; appears to have distinct and also overlapping functions with Tpm1p; TPM2 has a paralog, TPM1, that arose from the whole genome duplication -S000035475 CDS YIL138C 9 89715 89230 C 1994-12-10 1994-12-10 -S000001399 ORF Verified YIL137C TMA108 TAE3|RBF108 chromosome 9 9 92788 89948 C 1994-12-10 1994-12-10 Ribosome-associated, nascent chain binding factor; binds N-terminal region of nascent peptides during translation; recognizes target proteins via its putative metallopeptidase peptide-binding pocket -S000035340 CDS YIL137C 9 92788 89948 C 1994-12-10 1994-12-10 -S000001398 ORF Verified YIL136W OM45 chromosome 9 L000001301 9 93619 94800 W 1994-12-10 1994-12-10 Mitochondrial outer membrane protein of unknown function; major constituent of the outer membrane, extending into the intermembrane space; interacts with porin (Por1p) and with Om14p; imported via the presequence pathway involving the TOM and TIM23 complexes, then assembled in the outer membrane by Mim1p; protein abundance increases in response to DNA replication stress -S000034390 CDS YIL136W 9 93619 94800 W 1994-12-10 1994-12-10 -S000001397 ORF Verified YIL135C VHS2 chromosome 9 9 96375 95065 C 1994-12-10 1994-12-10 Regulator of septin dynamics; involved in the regulation of septin dynamics at bud neck after mitotic entry, likely by stabilizing septin structure; regulated at post-translational level by cell cycle dependent phosphorylation; likely phosphorylated by Cdc28p and dephosphorylated by Cdc14p before cytokinesis; high-copy suppressor of synthetic lethality of sis2 sit4 double mutant; VHS2 has a paralog, MLF3, that arose from the whole genome duplication -S000034198 CDS YIL135C 9 96375 95065 C 1994-12-10 1994-12-10 -S000028556 ORF Uncharacterized YIL134C-A chromosome 9 9 96725 96522 C 2003-07-29 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR -S000031242 CDS YIL134C-A 9 96725 96522 C 2003-07-29 2003-07-29 -S000006459 snoRNA_gene snR68 SNR68 chromosome 9 L000004537 9 97111 97246 W 1994-12-10 1994-12-10 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2640 -S000030855 noncoding_exon snR68 9 97111 97246 W 1994-12-10 1994-12-10 -S000001396 ORF Verified YIL134W FLX1 flavin adenine dinucleotide transporter FLX1 chromosome 9 L000002664 9 97395 98330 W 1994-12-10 1994-12-10 Mitochondrial flavin adenine dinucleotide transporter; FAD is a synthesis product of riboflavin; human homolog SLC25A32 is implicated in multiple acyl-CoA dehydrogenase deficiency (MADD) or glutaric aciduria type II (GAII), and can complement yeast null mutant -S000034150 CDS YIL134W 9 97395 98330 W 1994-12-10 1994-12-10 -S000001395 ORF Verified YIL133C RPL16A uL13|ribosomal 60S subunit protein L16A|L13|rp22|YL15|L21A|L16A|RPL13 chromosome 9 L000001709 9 99416 98527 C 1994-12-10 1994-12-10 Ribosomal 60S subunit protein L16A; N-terminally acetylated, binds 5.8 S rRNA; transcriptionally regulated by Rap1p; homologous to mammalian ribosomal protein L13A and bacterial L13; RPL16A has a paralog, RPL16B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress -S000033253 CDS YIL133C 9 99095 98527 C 1994-12-10 1994-12-10 -S000033252 CDS YIL133C 9 99416 99386 C 1994-12-10 1994-12-10 -S000033254 intron YIL133C 9 99385 99096 C 1994-12-10 1994-12-10 -S000001394 ORF Verified YIL132C CSM2 chromosome 9 9 100501 99860 C 1994-12-10 1994-12-10 Component of Shu complex (aka PCSS complex); Shu complex also includes Psy3, Shu1, Shu2, and promotes error-free DNA repair,; Shu complex mediates inhibition of Srs2p function; promotes formation of Rad51p filaments; Psy3p and Csm2p contain similar DNA-binding regions which work together to form a single DNA binding site; required for accurate chromosome segregation during meiosis -S000033192 CDS YIL132C 9 100501 99860 C 1994-12-10 1994-12-10 -S000001393 ORF Verified YIL131C FKH1 forkhead family transcription factor FKH1 chromosome 9 L000002607 9 102235 100781 C 1994-12-10 1994-12-10 Forkhead family transcription factor; rate-limiting replication origin activator; evolutionarily conserved lifespan regulator; binds multiple chromosomal elements with distinct specificities, cell cycle dynamics; regulates transcription elongation, chromatin silencing at mating loci, expression of G2/M phase genes; facilitates clustering, activation of early-firing replication origins; binds HML recombination enhancer, regulates donor preference during mating-type switching -S000033138 CDS YIL131C 9 102235 100781 C 1994-12-10 1994-12-10 -S000001392 ORF Verified YIL130W ASG1 chromosome 9 9 102782 105676 W 1994-12-10 1994-12-10 Zinc cluster protein proposed to be a transcriptional regulator; regulator involved in the stress response; null mutants have a respiratory deficiency, calcofluor white sensitivity and slightly increased cycloheximide resistance -S000032296 CDS YIL130W 9 102782 105676 W 1994-12-10 1994-12-10 -S000118394 ARS ARS909 ARSIX-106 chromosome 9 9 105870 106053 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000001391 ORF Verified YIL129C TAO3 PAG1 chromosome 9 9 113237 106107 C 1994-12-10 1994-12-10 Component of the RAM signaling network; is involved in regulation of Ace2p activity and cellular morphogenesis, interacts with protein kinase Cbk1p and also with Kic1p -S000032290 CDS YIL129C 9 113237 106107 C 1994-12-10 1994-12-10 -S000130158 ARS ARS910 chromosome 9 9 113237 113806 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001390 ORF Verified YIL128W MET18 MMS19 chromosome 9 L000003468 9 113806 116904 W 1994-12-10 1994-12-10 Component of cytosolic iron-sulfur protein assembly (CIA) machinery; acts at a late step of Fe-S cluster assembly; forms the CIA targeting complex with Cia1p and Cia2p that directs Fe-S cluster incorporation into a subset of proteins involved in methionine biosynthesis, DNA replication and repair, transcription, and telomere maintenance; ortholog of human MMS19 -S000032232 CDS YIL128W 9 113806 116904 W 1994-12-10 1994-12-10 -S000001389 ORF Uncharacterized YIL127C RRT14 chromosome 9 9 117644 117024 C 1994-12-10 1994-12-10 Putative protein of unknown function; identified in a screen for mutants with decreased levels of rDNA transcription; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; predicted to be involved in ribosome biogenesis -S000031158 CDS YIL127C 9 117644 117024 C 1994-12-10 1994-12-10 -S000001388 ORF Verified YIL126W STH1 RSC chromatin remodeling complex ATPase subunit STH1|NPS1 chromosome 9 L000002128 9 117992 122071 W -91 1994-12-10 1994-12-10 ATPase component of the RSC chromatin remodeling complex; required for expression of early meiotic genes; promotes base excision repair in chromatin; essential helicase-related protein homologous to Snf2p -S000031113 CDS YIL126W 9 117992 122071 W 1994-12-10 1994-12-10 -S000001387 ORF Verified YIL125W KGD1 alpha-ketoglutarate dehydrogenase KGD1|OGD1 chromosome 9 L000000897 9 122689 125733 W -91 1994-12-10 1994-12-10 Subunit of the mitochondrial alpha-ketoglutarate dehydrogenase complex; catalyzes a key step in the tricarboxylic acid (TCA) cycle, the oxidative decarboxylation of alpha-ketoglutarate to form succinyl-CoA -S000031016 CDS YIL125W 9 122689 125733 W 1994-12-10 1994-12-10 -S000001386 ORF Verified YIL124W AYR1 GBG1|acylglycerone-phosphate reductase chromosome 9 S000007473 9 126204 127097 W 1994-12-10 1994-12-10 Bifunctional triacylglycerol lipase and 1-acyl DHAP reductase; NADPH-dependent 1-acyl dihydroxyacetone phosphate reductase involved in phosphatidic acid biosynthesis; lipid droplet triacylglycerol lipase involved in the mobilization of non-polar lipids; found in lipid particles, the endoplasmic reticulum and the mitochondrial outer membrane; required for spore germination; role in cell wall biosynthesis; capable of metabolizing steroid hormones; oleic acid inducible -S000030012 CDS YIL124W 9 126204 127097 W 1994-12-10 1994-12-10 -S000001385 ORF Verified YIL123W SIM1 putative glucosidase SIM1 chromosome 9 L000003937 9 128151 129581 W 2011-02-03 1994-12-10|2011-02-03 Protein of the SUN family (Sim1p, Uth1p, Nca3p, Sun4p); may participate in DNA replication; promoter contains SCB regulation box at -300 bp indicating that expression may be cell cycle-regulated; SIM1 has a paralog, SUN4, that arose from the whole genome duplication -S000029900 CDS YIL123W 9 128151 129581 W 2011-02-03 1994-12-10|2011-02-03 -S000122103 five_prime_UTR_intron YIL123W 9 127662 128148 W 2007-04-04 2007-04-04 -S000001384 ORF Verified YIL122W POG1 chromosome 9 9 130610 131665 W 2011-02-03 1994-12-10 Nuclear chromatin-associated protein of unknown function; may have a role in cell cycle regulation; overexpression promotes recovery from pheromone induced arrest and suppresses the stress sensitivity caused by a mutation in the E3 ubiquitin ligase Rsp5p; binds upstream of BAR1 and cell cycle-related genes; phsosphoylated form may be ubiquitinated by Dma2p; potential Cdc28p substrate; SBF regulated -S000037860 CDS YIL122W 9 130610 131665 W 2011-02-03 1994-12-10 -S000001383 ORF Verified YIL121W QDR2 cation transporter chromosome 9 9 132244 133872 W 2011-02-03 1994-12-10 Plasma membrane transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; exports copper; has broad substrate specificity and can transport many mono- and divalent cations; transports a variety of drugs and is required for resistance to quinidine, barban, cisplatin, and bleomycin; contributes to potassium homeostasis; expression is regulated by copper -S000037111 CDS YIL121W 9 132244 133872 W 2011-02-03 1994-12-10 -S000001382 ORF Verified YIL120W QDR1 multidrug transporter chromosome 9 9 134417 136108 W 2011-02-03 1994-12-10 Multidrug transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; involved in spore wall assembly; sequence similarity to DTR1 and QDR3, and the triple mutant dtr1 qdr1 qdr3 exhibits reduced dityrosine fluorescence relative to the single mutants; required for resistance to quinidine, ketoconazole, fluconazole, and barban; QDR1 has a paralog, AQR1, that arose from the whole genome duplication -S000037040 CDS YIL120W 9 134417 136108 W 2011-02-03 1994-12-10 -S000118395 ARS ARS911 ARSIX-136 chromosome 9 9 136098 136338 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178112 ARS_consensus_sequence ARS911 9 136288 136272 C 2014-11-18 2014-11-18 -S000001381 ORF Verified YIL119C RPI1 chromosome 9 L000001697 9 137877 136654 C 2011-02-03 1994-12-10 Transcription factor, allelic differences between S288C and Sigma1278b; mediates fermentation stress tolerance by modulating cell wall integrity; overexpression suppresses heat shock sensitivity of wild-type RAS2 overexpression and also suppresses cell lysis defect of mpk1 mutation; allele from S288c can confer fMAPK pathway independent transcription of FLO11; S288C and Sigma1278b alleles differ in number of tandem repeats within ORF -S000036217 CDS YIL119C 9 137877 136654 C 2011-02-03 1994-12-10 -S000001380 ORF Verified YIL118W RHO3 Rho family GTPase RHO3 chromosome 9 L000001632 9 139752 140447 W 2011-02-03 1994-12-10 Non-essential small GTPase of the Rho/Rac family of Ras-like proteins; involved in the establishment of cell polarity; GTPase activity positively regulated by the GTPase activating protein (GAP) Rgd1p -S000036201 CDS YIL118W 9 139752 140447 W 2011-02-03 1994-12-10 -S000001379 ORF Verified YIL117C PRM5 pheromone-regulated protein PRM5 chromosome 9 9 141569 140613 C 2011-02-03 1994-12-10 Pheromone-regulated protein, predicted to have 1 transmembrane segment; induced during cell integrity signaling; PRM5 has a paralog, YNL058C, that arose from the whole genome duplication -S000035189 CDS YIL117C 9 141569 140613 C 2011-02-03 1994-12-10 -S000001378 ORF Verified YIL116W HIS5 histidinol-phosphate transaminase chromosome 9 L000000782 9 142928 144085 W -89 2011-02-03 1994-12-10 Histidinol-phosphate aminotransferase; catalyzes the seventh step in histidine biosynthesis; responsive to general control of amino acid biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts -S000035124 CDS YIL116W 9 142928 144085 W 2011-02-03 1994-12-10 -S000028795 ORF Dubious YIL115W-A chromosome 9 9 144268 144639 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene NUP159/YIL115C -S000033557 CDS YIL115W-A 9 144268 144639 W 2011-02-03 2003-07-29 -S000001377 ORF Verified YIL115C NUP159 FG-nucleoporin NUP159|RAT7|NUP158 chromosome 9 L000002782 9 148709 144327 C 2011-02-03 1994-12-10 FG-nucleoporin component of central core of the nuclear pore complex; also part of the nuclear pore complex (NPC) cytoplasmic filaments; contributes directly to nucleocytoplasmic transport; regulates ADP release from the ATP-dependent RNA helicase Dbp5p; forms a stable association with Nup82p, Gle2p and two other FG-nucleoporins (Nsp1p and Nup116p) -S000034872 CDS YIL115C 9 148709 144327 C 2011-02-03 1994-12-10 -S000001376 ORF Verified YIL114C POR2 putative porin POR2|YVDAC2 chromosome 9 L000003425 9 149988 149143 C 2011-02-03 1994-12-10 Putative mitochondrial porin (voltage-dependent anion channel); not required for mitochondrial membrane permeability or mitochondrial osmotic stability; POR2 has a paralog, POR1, that arose from the whole genome duplication -S000033971 CDS YIL114C 9 149988 149143 C 2011-02-03 1994-12-10 -S000001375 ORF Verified YIL113W SDP1 mitogen-activated protein kinase tyrosine protein phosphatase SDP1 chromosome 9 L000004339 9 150559 151188 W 2011-02-03 1994-12-10 Stress-inducible dual-specificity MAP kinase phosphatase; negatively regulates Slt2p MAP kinase by direct dephosphorylation, diffuse localization under normal conditions shifts to punctate localization after heat shock; SDP1 has a paralog, MSG5, that arose from the whole genome duplication -S000033917 CDS YIL113W 9 150559 151188 W 2011-02-03 1994-12-10 -S000001374 ORF Verified YIL112W HOS4 chromosome 9 9 151595 154846 W 2011-02-03 1994-12-10 Subunit of the Set3 complex; complex is a meiotic-specific repressor of sporulation specific genes that contains deacetylase activity; potential Cdc28p substrate -S000033813 CDS YIL112W 9 151595 154846 W 2011-02-03 1994-12-10 -S000001373 ORF Verified YIL111W COX5B cytochrome c oxidase subunit Vb chromosome 9 L000000389 9 155222 155765 W 2011-02-03 1994-12-10 Subunit Vb of cytochrome c oxidase; cytochrome c oxidase is the terminal member of the mitochondrial inner membrane electron transport chain; Cox5Bp is predominantly expressed during anaerobic growth while its isoform Va (Cox5Ap) is expressed during aerobic growth; COX5B has a paralog, COX5A, that arose from the whole genome duplication -S000033706 CDS YIL111W 9 155222 155222 W 2011-02-03 1994-12-10 -S000033707 CDS YIL111W 9 155311 155765 W 2011-02-03 1994-12-10 -S000033708 intron YIL111W 9 155223 155310 W 2011-02-03 1994-12-10 -S000001372 ORF Verified YIL110W HPM1 MNI1 chromosome 9 9 156045 157178 W 2011-02-03 1994-12-10 AdoMet-dependent methyltransferase; involved in a novel 3-methylhistidine modification of ribosomal protein Rpl3p; seven beta-strand MTase family member; null mutant exhibits a weak vacuolar protein sorting defect and caspofungin resistance -S000033038 CDS YIL110W 9 156045 157178 W 2011-02-03 1994-12-10 -S000001371 ORF Verified YIL109C SEC24 COPII subunit SEC24|ANU1 chromosome 9 L000004360 9 160165 157385 C 2011-02-03 1994-12-10 Component of the Sec23p-Sec24p heterodimer of the COPII vesicle coat; required for cargo selection during vesicle formation in ER to Golgi transport; homologous to Sfb3p; SEC24 has a paralog, SFB2, that arose from the whole genome duplication -S000034140 CDS YIL109C 9 160165 157385 C 2011-02-03 1994-12-10 -S000001370 ORF Verified YIL108W putative metalloendopeptidase chromosome 9 9 160887 162977 W 2011-02-03 1994-12-10 Putative metalloendopeptidase; forms cytoplasmic foci upon DNA replication stress -S000034098 CDS YIL108W 9 160887 162977 W 2011-02-03 1994-12-10 -S000001369 ORF Verified YIL107C PFK26 PFK-2|PFK2 chromosome 9 L000001406 9 165761 163278 C 2011-02-03 1994-12-10 6-phosphofructo-2-kinase; inhibited by phosphoenolpyruvate and sn-glycerol 3-phosphate; has negligible fructose-2,6-bisphosphatase activity; transcriptional regulation involves protein kinase A -S000032029 CDS YIL107C 9 165761 163278 C 2011-02-03 1994-12-10 -S000001368 ORF Verified YIL106W MOB1 chromosome 9 L000003356 9 166415 167444 W 2011-02-03 1999-11-17|1994-12-10 Component of the mitotic exit network; associates with and is required for the activation and Cdc15p-dependent phosphorylation of the Dbf2p kinase; required for cytokinesis and cell separation; component of the CCR4 transcriptional complex; relocalizes from cytoplasm to the nuclear periphery upon DNA replication stress -S000031985 CDS YIL106W 9 166415 166434 W 2011-02-03 1999-11-17|1994-12-10 -S000031986 CDS YIL106W 9 166520 167444 W 2011-02-03 1999-11-17 -S000031987 intron YIL106W 9 166435 166519 W 2011-02-03 1999-11-17 -S000028657 ORF Uncharacterized YIL105W-A chromosome 9 9 167664 167804 W 2011-02-03 2003-07-29 Protein of unknown function; completely overlaps the verified gene SLM1; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; mRNA identified as translated by ribosome profiling data -S000032461 CDS YIL105W-A 9 167664 167804 W 2011-02-03 2003-07-29 -S000001367 ORF Verified YIL105C SLM1 phosphatidylinositol 4,5-bisphosphate-binding protein|LIT2 chromosome 9 9 169641 167581 C 2011-02-03 1994-12-10 Phosphoinositide PI4,5P(2) binding protein, forms a complex with Slm2p; acts downstream of Mss4p in a pathway regulating actin cytoskeleton organization in response to stress; TORC2 complex substrate and effector; protein abundance increases in response to DNA replication stress; SLM1 has a paralog, SLM2, that arose from the whole genome duplication -S000030899 CDS YIL105C 9 169641 167581 C 2011-02-03 1994-12-10 -S000001366 ORF Verified YIL104C SHQ1 Hsp90 cochaperone SHQ1 chromosome 9 9 171505 169982 C 2011-02-03 1994-12-10 Chaperone protein; required for the assembly of box H/ACA snoRNPs and thus for pre-rRNA processing; functions as an RNA mimic; forms a complex with Naf1p and interacts with H/ACA snoRNP components Nhp2p and Cbf5p; homology with known Hsp90p cochaperones; relocalizes to the cytosol in response to hypoxia -S000030805 CDS YIL104C 9 171505 169982 C 2011-02-03 1994-12-10 -S000001365 ORF Verified YIL103W DPH1 KIF48 chromosome 9 9 171751 173028 W 2011-02-03 1994-12-10 Protein required for synthesis of diphthamide; required along with Dph2p, Kti11p, Jjj3p, and Dph5p; diphthamide is a modified histidine residue of translation elongation factor 2 (Eft1p or Eft2p); may act in a complex with Dph2p and Kti11p -S000030777 CDS YIL103W 9 171751 173028 W 2011-02-03 1994-12-10 -S000113587 ORF Uncharacterized YIL102C-A chromosome 9 9 173592 173365 C 2011-02-03 2005-11-21 Putative protein of unknown function; identified based on comparisons of the genome sequences of six Saccharomyces species; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum -S000113588 CDS YIL102C-A 9 173592 173365 C 2011-02-03 2005-11-21 -S000001364 ORF Uncharacterized YIL102C chromosome 9 9 174887 174582 C 2011-02-03 1994-12-10 Putative protein of unknown function -S000030579 CDS YIL102C 9 174887 174582 C 2011-02-03 1994-12-10 -S000006741 tRNA_gene tT(AGU)I1 chromosome 9 L000003866 9 175031 175103 W 2011-02-03 1994-12-10 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000036345 noncoding_exon tT(AGU)I1 9 175031 175103 W 2011-02-03 1994-12-10 -S000118396 ARS ARS912 ARSIX-175 chromosome 9 9 175038 175358 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178113 ARS_consensus_sequence ARS912 9 175170 175186 W 2014-11-18 2014-11-18 -S000001363 ORF Verified YIL101C XBP1 chromosome 9 L000004246 9 177250 175307 C 2011-02-03 1994-12-10 Transcriptional repressor; binds promoter sequences of cyclin genes, CYS3, and SMF2; not expressed during log phase of growth, but induced by stress or starvation during mitosis, and late in meiosis; represses 15% of all yeast genes as cells transition to quiescence; important for maintaining G1 arrest and for longevity of quiescent cells; member of Swi4p/Mbp1p family; phosphorylated by Cdc28p; relative distribution to nucleus increases upon DNA replication stress -S000037752 CDS YIL101C 9 177250 175307 C 2011-02-03 1994-12-10 -S000001362 ORF Dubious YIL100W chromosome 9 9 177373 177726 W 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the dubious ORF YIL100C-A -S000037716 CDS YIL100W 9 177373 177726 W 2011-02-03 1994-12-10 -S000028794 ORF Dubious YIL100C-A chromosome 9 9 177681 177343 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033555 CDS YIL100C-A 9 177681 177343 C 2011-02-03 2003-07-29 -S000001361 ORF Verified YIL099W SGA1 glucan 1,4-alpha-glucosidase chromosome 9 L000001875 9 178004 179653 W 2011-02-03 1994-12-10 Intracellular sporulation-specific glucoamylase; involved in glycogen degradation; induced during starvation of a/a diploids late in sporulation, but dispensable for sporulation -S000032666 CDS YIL099W 9 178004 179653 W 2011-02-03 1994-12-10 -S000001360 ORF Verified YIL098C FMC1 chromosome 9 L000004436 9 180239 179772 C 2011-02-03 1994-12-10 Mitochondrial matrix protein; required for assembly or stability at high temperature of the F1 sector of mitochondrial F1F0 ATP synthase; null mutant temperature sensitive growth on glycerol is suppressed by multicopy expression of Odc1p -S000032508 CDS YIL098C 9 180239 179772 C 2011-02-03 1994-12-10 -S000001359 ORF Verified YIL097W FYV10 glucose-induced degradation complex subunit FYV10|GID9 chromosome 9 9 180427 181977 W 2011-02-03 1994-12-10 Subunit of GID complex; involved in proteasome-dependent catabolite inactivation of gluconeogenic enzymes FBPase, PEPCK, and c-MDH; forms dimer with Rmd5p that is then recruited to GID Complex by Gid8p; contains a degenerate RING finger motif needed for GID complex ubiquitin ligase activity in vivo, as well as CTLH and CRA domains; plays role in anti-apoptosis; required for survival upon exposure to K1 killer toxin -S000032474 CDS YIL097W 9 180427 181977 W 2011-02-03 1994-12-10 -S000001358 ORF Verified YIL096C BMT5 25S rRNA (uracil2634-N3)-methyltransferase chromosome 9 9 183127 182117 C 2011-02-03 1994-12-10 Methyltransferase required for m3U2634 methylation of the 25S rRNA; S-adenosylmethionine-dependent; associates with precursors of the 60S ribosomal subunit; predicted to be involved in ribosome biogenesis -S000031394 CDS YIL096C 9 183127 182117 C 2011-02-03 1994-12-10 -S000006605 tRNA_gene tI(AAU)I1 chromosome 9 L000003875 9 183513 183440 C 2011-02-03 1994-12-10 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000030348 noncoding_exon tI(AAU)I1 9 183513 183440 C 2011-02-03 1994-12-10 -S000001357 ORF Verified YIL095W PRK1 serine/threonine protein kinase PRK1|PAK1 chromosome 9 L000002879 9 183937 186369 W 2011-02-03 1994-12-10 Protein serine/threonine kinase; regulates the organization and function of the actin cytoskeleton and reduces endocytic ability of cell through the phosphorylation of the Pan1p-Sla1p-End3p protein complex; PRK1 has a paralog, ARK1, that arose from the whole genome duplication -S000031347 CDS YIL095W 9 183937 186369 W 2011-02-03 1994-12-10 -S000001356 ORF Verified YIL094C LYS12 homoisocitrate dehydrogenase|LYS11|LYS10 chromosome 9 L000000970 9 187632 186517 C 2011-02-03 1994-12-10 Homo-isocitrate dehydrogenase; an NAD-linked mitochondrial enzyme required for the fourth step in the biosynthesis of lysine, in which homo-isocitrate is oxidatively decarboxylated to alpha-ketoadipate -S000031160 CDS YIL094C 9 187632 186517 C 2011-02-03 1994-12-10 -S000001355 ORF Verified YIL093C RSM25 mitochondrial 37S ribosomal protein RSM25 chromosome 9 9 188784 187990 C 2011-02-03 1994-12-10 Mitochondrial ribosomal protein of the small subunit -S000030231 CDS YIL093C 9 188784 187990 C 2011-02-03 1994-12-10 -S000001354 ORF Uncharacterized YIL092W chromosome 9 9 189066 190967 W 2011-02-03 1994-12-10 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to the nucleus -S000030095 CDS YIL092W 9 189066 190967 W 2011-02-03 1994-12-10 -S000001353 ORF Verified YIL091C UTP25 rRNA-binding ribosome biosynthesis protein UTP25 chromosome 9 9 193195 191030 C 2011-02-03 1994-12-10 Nucleolar protein; required for 35S pre-RNA processing and 40S ribosomal subunit biogenesis -S000029923 CDS YIL091C 9 193195 191030 C 2011-02-03 1994-12-10 -S000001352 ORF Verified YIL090W ICE2 chromosome 9 9 193595 195070 W 2011-02-03 1994-12-10 Integral ER membrane protein with type-III transmembrane domains; required for maintenance of ER zinc homeostasis; necessary for efficient targeting of Trm1p tRNA methyltransferase to inner nuclear membrane; mutations cause defects in cortical ER morphology in both the mother and daughter cells -S000029886 CDS YIL090W 9 193595 195070 W 2011-02-03 1994-12-10 -S000001351 ORF Verified YIL089W chromosome 9 9 195599 196216 W 2011-02-03 1994-12-10 Protein of unknown function found in the ER and vacuole lumen; overexpression of YIL089W affects endocytic protein trafficking -S000036415 CDS YIL089W 9 195599 196216 W 2011-02-03 1994-12-10 -S000007015 long_terminal_repeat YILCtau1 chromosome 9 9 197023 196653 C 2011-02-03 1994-12-10 Ty4 LTR -S000007011 long_terminal_repeat YILCdelta1 chromosome 9 9 197488 197140 C 2011-02-03 1994-12-10 Ty1 LTR -S000006547 tRNA_gene tE(CUC)I chromosome 9 L000003867 9 197592 197663 W 2011-02-03 1994-12-10 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis -S000031939 noncoding_exon tE(CUC)I 9 197592 197663 W 2011-02-03 1994-12-10 -S000001350 ORF Verified YIL088C AVT7 chromosome 9 9 199403 197931 C 2011-02-03 1994-12-10 Putative transporter; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters -S000036264 CDS YIL088C 9 199403 197931 C 2011-02-03 1994-12-10 -S000001349 ORF Verified YIL087C AIM19 LRC2 chromosome 9 9 200119 199646 C 2011-02-03 1994-12-10 Protein of unknown function; mitochondrial protein that physically interacts with Tim23p; null mutant displays reduced respiratory growth -S000035319 CDS YIL087C 9 200119 199646 C 2011-02-03 1994-12-10 -S000001348 ORF Dubious YIL086C chromosome 9 9 200461 200153 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000035155 CDS YIL086C 9 200461 200153 C 2011-02-03 1994-12-10 -S000001347 ORF Verified YIL085C KTR7 putative mannosyltransferase chromosome 9 L000004100 9 202043 200490 C 2011-02-03 1994-12-10 Putative mannosyltransferase involved in protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; KTR7 has a paralog, KTR5, that arose from the whole genome duplication -S000035010 CDS YIL085C 9 202043 200490 C 2011-02-03 1994-12-10 -S000001346 ORF Verified YIL084C SDS3 chromosome 9 L000003384 9 203259 202276 C 2011-02-03 1994-12-10 Component of the Rpd3L histone deacetylase complex; required for its structural integrity and catalytic activity, involved in transcriptional silencing and required for sporulation; relocalizes to the cytosol in response to hypoxia; cells defective in SDS3 display pleiotropic phenotypes -S000034086 CDS YIL084C 9 203259 202276 C 2011-02-03 1994-12-10 -S000001345 ORF Verified YIL083C CAB2 phosphopantothenate--cysteine ligase CAB2 chromosome 9 9 204653 203556 C 2011-02-03 1994-12-10|2011-02-03 Subunit of the CoA-Synthesizing Protein Complex (CoA-SPC); subunits of this complex are: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p; probable phosphopantothenoylcysteine synthetase (PPCS), which catalyzes the second step of coenzyme A biosynthesis from pantothenate; null mutant lethality is complemented by human homolog PPCS and by E. coli coaBC (encoding a bifunctional enzyme with PPCS activity) -S000033946 CDS YIL083C 9 204653 203556 C 2011-02-03 1994-12-10|2011-02-03 -S000007017 long_terminal_repeat YILWsigma1 chromosome 9 9 205220 205559 W 2011-02-03 1994-12-10 Ty3 LTR -S000007020 LTR_retrotransposon YILWTy3-1 Ty3 chromosome 9 9 205220 210647 W 2011-02-03 1994-12-10 Ty3 element, LTR retrotransposon of the Gypsy (Metaviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; transposition is induced upon exposure to mating pheromone -S000001344 ORF Dubious YIL082W chromosome 9 9 205635 206507 W 2011-02-03 1994-12-10 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag -S000033890 CDS YIL082W 9 205635 206507 W 2011-02-03 1994-12-10 -S000003537 transposable_element_gene YIL082W-A gag-pol fusion protein chromosome 9 9 205635 210132 W 2011-02-03 1994-12-10|1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes -S000030100 CDS YIL082W-A 9 205635 206485 W 2011-02-03 1999-07-17|1994-12-10 -S000030101 CDS YIL082W-A 9 206487 210132 W 2011-02-03 1999-07-17|1994-12-10 -S000030102 plus_1_translational_frameshift YIL082W-A 9 206486 206486 W 2011-02-03 1999-07-17|1994-12-10 -S000007018 long_terminal_repeat YILWsigma2 chromosome 9 9 210308 210647 W 2011-02-03 1994-12-10 Ty3 LTR -S000006606 tRNA_gene tI(AAU)I2 chromosome 9 L000003868 9 210665 210738 W 2011-02-03 1994-12-10 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis -S000030349 noncoding_exon tI(AAU)I2 9 210665 210738 W 2011-02-03 1994-12-10 -S000001341 ORF Verified YIL079C AIR1 TRAMP complex RNA-binding subunit chromosome 9 S000028413 9 212005 210923 C 2011-02-03 1994-12-10 Zinc knuckle protein; involved in nuclear RNA processing and degradation as a component of the TRAMP complex; stimulates the poly(A) polymerase activity of Pap2p in vitro; AIR1 has a paralog, AIR2, that arose from the whole genome duplication; although Air1p and Air2p are homologous TRAMP subunits, they have nonredundant roles in regulation of substrate specificity of the exosome -S000032850 CDS YIL079C 9 212005 210923 C 2011-02-03 1994-12-10 -S000001340 ORF Verified YIL078W THS1 threonine--tRNA ligase THS1 chromosome 9 L000002301 9 212499 214703 W 2011-02-03 1994-12-10 Threonyl-tRNA synthetase; essential cytoplasmic protein; human homolog TARS can complement yeast null mutant -S000032807 CDS YIL078W 9 212499 214703 W 2011-02-03 1994-12-10 -S000007644 ARS ARS913 ARS901 ARSIX-215|ARS249 chromosome 9 9 214624 214754 2014-11-18 2001-03-06|2014-11-18|2006-09-08 Autonomously Replicating Sequence -S000178114 ARS_consensus_sequence ARS913 9 214732 214748 W 2014-11-18 2014-11-18 -S000001339 ORF Uncharacterized YIL077C chromosome 9 9 215953 214991 C 2011-02-03 1994-12-10 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) -S000032673 CDS YIL077C 9 215953 214991 C 2011-02-03 1994-12-10 -S000001338 ORF Verified YIL076W SEC28 coatomer subunit epsilon|ANU2 chromosome 9 L000004402 9 216658 217548 W 2011-02-03 1994-12-10|2005-11-22 Epsilon-COP subunit of the coatomer; regulates retrograde Golgi-to-ER protein traffic; stabilizes Cop1p, the alpha-COP and the coatomer complex; non-essential for cell growth; protein abundance increases in response to DNA replication stress -S000032630 CDS YIL076W 9 216658 217548 W 2011-02-03 1994-12-10|2005-11-22 -S000001337 ORF Verified YIL075C RPN2 proteasome regulatory particle base subunit RPN2|SEN3 chromosome 9 L000001864 9 220700 217863 C 2011-02-03 1994-12-10 Subunit of the 26S proteasome; substrate of the N-acetyltransferase Nat1p; protein abundance increases in response to DNA replication stress -S000031543 CDS YIL075C 9 220700 217863 C 2011-02-03 1994-12-10 -S000001336 ORF Verified YIL074C SER33 phosphoglycerate dehydrogenase SER33 chromosome 9 S000007458 9 222490 221081 C 2011-02-03 1994-12-10 3-phosphoglycerate dehydrogenase and alpha-ketoglutarate reductase; 3PG dehydrogenase that catalyzes the first step in serine and glycine biosynthesis; also functions as an alpha-ketoglutarate reductase, converting alpha-ketoglutarate to D-2-hydroxyglutarate (D-2HG); localizes to the cytoplasm; SER33 has a paralog, SER3, that arose from the whole genome duplication -S000031439 CDS YIL074C 9 222490 221081 C 2011-02-03 1994-12-10 -S000001335 ORF Verified YIL073C SPO22 ZIP4 chromosome 9 9 225954 222937 C 2011-02-03 2003-09-27|1994-12-10 Meiosis-specific protein essential for chromosome synapsis; involved in completion of nuclear divisions during meiosis; induced early in meiosis -S000030517 CDS YIL073C 9 225809 222937 C 2011-02-03 2003-09-27 -S000030516 CDS YIL073C 9 225954 225900 C 2011-02-03 2003-09-27|1994-12-10 -S000030518 intron YIL073C 9 225899 225810 C 2011-02-03 2003-09-27 -S000001334 ORF Verified YIL072W HOP1 chromosome 9 L000000802 9 226602 228419 W -59 2011-02-03 1994-12-10 Meiosis-specific protein required for chromosome synapsis; displays Red1p dependent localization to the unsynapsed axial-lateral elements of the synaptonemal complex; required for chiasma formation; in vitro, displays the ability to promote intra- and intermolecular synapsis between double-stranded DNA molecules and to fold DNA into rigid protein-DNA filaments -S000030472 CDS YIL072W 9 226602 228419 W 2011-02-03 1994-12-10 -S000028793 ORF Dubious YIL071W-A chromosome 9 9 228550 229026 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF PCI8/YIL071C -S000033552 CDS YIL071W-A 9 228550 229026 W 2011-02-03 2003-07-29 -S000001333 ORF Verified YIL071C PCI8 YIL071W|CSN11|YIH1 chromosome 9 S000007580 9 229994 228660 C 2011-02-03 1994-12-10 Possible shared subunit of Cop9 signalosome (CSN) and eIF3; binds eIF3b subunit Prt1p, has possible dual functions in transcriptional and translational control, contains a PCI (Proteasome-COP9 signalosome (CSN)-eIF3) domain -S000030209 CDS YIL071C 9 229994 228660 C 2011-02-03 1994-12-10 -S000001332 ORF Verified YIL070C MAM33 chromosome 9 9 231072 230272 C 2011-02-03 1994-12-10 Specific translational activator for the mitochondrial COX1 mRNA; acidic protein of the mitochondrial matrix; related to the human complement receptor gC1q-R -S000037502 CDS YIL070C 9 231072 230272 C 2011-02-03 1994-12-10 -S000001331 ORF Verified YIL069C RPS24B eS24|ribosomal 40S subunit protein S24B|S24e|S24B|RPS24EB chromosome 9 L000002711 9 232369 231553 C 2011-02-03 1994-12-10 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S24, no bacterial homolog; RPS24B has a paralog, RPS24A, that arose from the whole genome duplication -S000036651 CDS YIL069C 9 231957 231553 C 2011-02-03 1994-12-10 -S000036650 CDS YIL069C 9 232369 232367 C 2011-02-03 1994-12-10 -S000036652 intron YIL069C 9 232366 231958 C 2011-02-03 1994-12-10 -S000028792 ORF Dubious YIL068W-A chromosome 9 9 233013 233396 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SEC6/YIL068C -S000033551 CDS YIL068W-A 9 233013 233396 W 2011-02-03 2003-07-29 -S000001330 ORF Verified YIL068C SEC6 SNARE-binding exocyst subunit SEC6 chromosome 9 L000001832 9 235474 233057 C 2011-02-03 1994-12-10 Essential 88kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion; anchors the assembled complex to sites of secretion; interacts with SM-like protein and SNARE regulator Sec1p and may recruit it to sites of secretion; binds to SNARE complexes binteracting with Sec9p -S000036567 CDS YIL068C 9 235474 233057 C 2011-02-03 1994-12-10 -S000028791 ORF Dubious YIL066W-A chromosome 9 9 237366 237809 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF YIL067C -S000033550 CDS YIL066W-A 9 237366 237809 W 2011-02-03 2003-07-29 -S000001329 ORF Uncharacterized YIL067C chromosome 9 9 237760 235724 C 2011-02-03 1994-12-10 Uncharacterized protein of unknown function -S000035626 CDS YIL067C 9 237760 235724 C 2011-02-03 1994-12-10 -S000001328 ORF Verified YIL066C RNR3 ribonucleotide-diphosphate reductase subunit RNR3|RIR3|DIN1 chromosome 9 L000001644|L000001657 9 240708 238099 C 2011-02-03 1994-12-10 Minor isoform of large subunit of ribonucleotide-diphosphate reductase; the RNR complex catalyzes rate-limiting step in dNTP synthesis, regulated by DNA replication and DNA damage checkpoint pathways via localization of small subunits; RNR3 has a paralog, RNR1, that arose from the whole genome duplication -S000035554 CDS YIL066C 9 240708 238099 C 2011-02-03 1994-12-10 -S000001327 ORF Verified YIL065C FIS1 MDV2 chromosome 9 9 241775 241308 C 2011-02-03 1994-12-10 Protein involved in mitochondrial fission and peroxisome abundance; may have a distinct role in tethering protein aggregates to mitochondria in order to retain them in the mother cell; required for localization of Dnm1p and Mdv1p during mitochondrial division; mediates ethanol-induced apoptosis and ethanol-induced mitochondrial fragmentation -S000035474 CDS YIL065C 9 241775 241308 C 2011-02-03 1994-12-10 -S000001326 ORF Verified YIL064W EFM4 SEE1 chromosome 9 9 241943 242716 W 2011-02-03 1994-12-10 Lysine methyltransferase; involved in the dimethylation of eEF1A (Tef1p/Tef2p) at lysine 316; sequence similarity to S-adenosylmethionine-dependent methyltransferases of the seven beta-strand family; role in vesicular transport -S000035414 CDS YIL064W 9 241943 242716 W 2011-02-03 1994-12-10 -S000001325 ORF Verified YIL063C YRB2 chromosome 9 L000002886 9 243744 242761 C 2011-02-03 1994-12-10 Protein of unknown function; involved in nuclear processes of the Ran-GTPase cycle; involved in nuclear protein export; contains Ran Binding Domain and FxFG repeats; interacts with Srm1p, GTP-Gsp1p, Rna1p and Crm1p; relocalizes to the cytosol in response to hypoxia; not essential for viability -S000034323 CDS YIL063C 9 243744 242761 C 2011-02-03 1994-12-10 -S000001324 ORF Verified YIL062C ARC15 chromosome 9 L000004032 9 244462 243998 C 2011-02-03 1994-12-10 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches; has mRNA binding activity -S000034193 CDS YIL062C 9 244462 243998 C 2011-02-03 1994-12-10 -S000001323 ORF Verified YIL061C SNP1 U1 snRNP complex subunit SNP1|U1-70K chromosome 9 L000001954 9 245559 244657 C 2011-02-03 1994-12-10 Component of U1 snRNP required for mRNA splicing via spliceosome; substrate of the arginine methyltransferase Hmt1p; may interact with poly(A) polymerase to regulate polyadenylation; homolog of human U1 70K protein; protein abundance increases in response to DNA replication stress -S000033301 CDS YIL061C 9 245559 244657 C 2011-02-03 1994-12-10 -S000119034 ARS ARS923 ARSIX-246|ARS913.5 chromosome 9 9 245756 245925 2014-11-18 2014-11-18|2006-10-03 Autonomously Replicating Sequence -S000178115 ARS_consensus_sequence ARS923 9 245880 245864 C 2014-11-18 2014-11-18 -S000007012 long_terminal_repeat YILWdelta2 YILCdelta2 chromosome 9 9 246220 246552 W 2011-02-03 1994-12-10|2007-04-03 Ty2 LTR -S000001322 ORF Verified YIL060W chromosome 9 9 246392 246826 W 2011-02-03 1994-12-10 Mitochondrial protein of unknown function; required for respiratory growth; mutant accumulates less glycogen than does wild type; null mutation results in a decrease in plasma membrane electron transport; YIL060W is not an essential gene -S000033276 CDS YIL060W 9 246392 246826 W 2011-02-03 1994-12-10 -S000001320 ORF Dubious YIL058W chromosome 9 9 246914 247198 W 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034459 CDS YIL058W 9 246914 247198 W 2011-02-03 1994-12-10 -S000001321 ORF Dubious YIL059C chromosome 9 9 246915 246550 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YIL060W -S000034503 CDS YIL059C 9 246915 246550 C 2011-02-03 1994-12-10 -S000118397 ARS ARS914 ARSIX-248 chromosome 9 9 247705 247760 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178116 ARS_consensus_sequence ARS914 9 247752 247736 C 2014-11-18 2014-11-18 -S000001319 ORF Verified YIL057C RGI2 chromosome 9 9 248396 247902 C 2011-02-03 1994-12-10 Protein of unknown function; involved in energy metabolism under respiratory conditions; expression induced under carbon limitation and repressed under high glucose; RGI2 has a paralog, RGI1, that arose from the whole genome duplication -S000032397 CDS YIL057C 9 248396 247902 C 2011-02-03 1994-12-10 -S000130159 ARS ARS915 chromosome 9 9 248396 248850 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000006735 tRNA_gene tS(UGA)I SUP17 chromosome 9 L000002191|L000003869 9 248850 248931 W -53 2011-02-03 1994-12-10 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations -S000034050 noncoding_exon tS(UGA)I 9 248850 248931 W 2011-02-03 1994-12-10 -S000001318 ORF Verified YIL056W VHR1 chromosome 9 9 249991 251913 W 2011-02-03 1994-12-10 Transcriptional activator; required for the vitamin H-responsive element (VHRE) mediated induction of VHT1 (Vitamin H transporter) and BIO5 (biotin biosynthesis intermediate transporter) in response to low biotin concentrations; VHR1 has a paralog, VHR2, that arose from the whole genome duplication -S000032356 CDS YIL056W 9 249991 251913 W 2011-02-03 1994-12-10 -S000001317 ORF Uncharacterized YIL055C chromosome 9 9 253925 252042 C 2011-02-03 1994-12-10 Putative protein of unknown function -S000031292 CDS YIL055C 9 253925 252042 C 2011-02-03 1994-12-10 -S000001316 ORF Uncharacterized YIL054W chromosome 9 9 254543 254860 W 2011-02-03 1994-12-10 Protein of unknown function; expressed at both mRNA and protein levels -S000031254 CDS YIL054W 9 254543 254860 W 2011-02-03 1994-12-10 -S000001315 ORF Verified YIL053W GPP1 RHR2|glycerol-1-phosphatase RHR2 chromosome 9 L000003988 9 255115 255867 W 2011-02-03 1994-12-10|2006-01-24 Constitutively expressed DL-glycerol-3-phosphate phosphatase; also known as glycerol-1-phosphatase; involved in glycerol biosynthesis, induced in response to both anaerobic and osmotic stress; GPP1 has a paralog, GPP2, that arose from the whole genome duplication -S000031111 CDS YIL053W 9 255115 255867 W 2011-02-03 1994-12-10|2006-01-24 -S000001314 ORF Verified YIL052C RPL34B eL34|ribosomal 60S subunit protein L34B|L34e|L34B chromosome 9 L000004466 9 257063 256226 C 2011-02-03 1994-12-10 Ribosomal 60S subunit protein L34B; homologous to mammalian ribosomal protein L34, no bacterial homolog; RPL34B has a paralog, RPL34A, that arose from the whole genome duplication -S000030947 CDS YIL052C 9 256554 256226 C 2011-02-03 1994-12-10 -S000030946 CDS YIL052C 9 257063 257027 C 2011-02-03 1994-12-10 -S000030948 intron YIL052C 9 257026 256555 C 2011-02-03 1994-12-10 -S000001313 ORF Verified YIL051C MMF1 isoleucine biosynthesis protein MMF1|IBM1 chromosome 9 L000004449 9 258280 257843 C 2011-02-03 1994-12-10 Mitochondrial protein required for transamination of isoleucine; but not of valine or leucine; may regulate specificity of branched-chain transaminases Bat1p and Bat2p; induction of expression in response to stress is mediated by a Hog1p-regulated antisense RNA and gene looping; interacts genetically with mitochondrial ribosomal protein genes; MMF1 has a paralog, HMF1, that arose from the whole genome duplication -S000029935 CDS YIL051C 9 258280 257843 C 2011-02-03 1994-12-10 -S000001312 ORF Verified YIL050W PCL7 chromosome 9 L000004039 9 258913 259770 W 2011-02-03 1994-12-10 Pho85p cyclin of the Pho80p subfamily; forms a functional kinase complex with Pho85p which phosphorylates Mmr1p and is regulated by Pho81p; involved in glycogen metabolism, expression is cell-cycle regulated; PCL7 has a paralog, PCL6, that arose from the whole genome duplication -S000029899 CDS YIL050W 9 258913 259770 W 2011-02-03 1994-12-10 -S000001311 ORF Verified YIL049W DFG10 putative polyprenol reductase chromosome 9 L000004073 9 260158 260919 W 2011-02-03 1994-12-10 Probable polyprenol reductase; catalyzes conversion of polyprenol to dolichol, the precursor for N-glycosylation; involved in filamentous growth; mutations in human homolog SRD5A3 confer CDG (Congenital Disorders of Glycosylation); human SRD5A3 can complement yeast null mutant -S000030228 CDS YIL049W 9 260158 260919 W 2011-02-03 1994-12-10 -S000001310 ORF Verified YIL048W NEO1 putative aminophospholipid-translocating P4-type ATPase NEO1 chromosome 9 L000004112 9 261437 264892 W 2011-02-03 1994-12-10 Phospholipid translocase (flippase), role in phospholipid asymmetry of plasma membrane; involved in endocytosis, vacuolar biogenesis and Golgi to ER vesicle-mediated transport; localizes to endosomes and the Golgi apparatus -S000030109 CDS YIL048W 9 261437 264892 W 2011-02-03 1994-12-10 -S000028790 ORF Dubious YIL047C-A chromosome 9 9 265467 265099 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SYG1/YIL047C -S000033549 CDS YIL047C-A 9 265467 265099 C 2011-02-03 2003-07-29 -S000001309 ORF Verified YIL047C SYG1 chromosome 9 L000002256 9 267823 265115 C 2011-02-03 1994-12-10 Plasma membrane protein of unknown function; truncation and overexpression suppresses lethality of G-alpha protein deficiency -S000036323 CDS YIL047C 9 267823 265115 C 2011-02-03 1994-12-10 -S000028836 ORF Uncharacterized YIL046W-A chromosome 9 9 268309 268473 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034486 CDS YIL046W-A 9 268309 268473 W 2011-02-03 2003-07-29 -S000001308 ORF Verified YIL046W MET30 ubiquitin-binding SDF ubiquitin ligase complex subunit MET30|ZRG11 chromosome 9 L000001093 9 268651 270573 W 2011-02-03 1994-12-10 F-box protein containing five copies of the WD40 motif; controls cell cycle function, sulfur metabolism, and methionine biosynthesis as part of the ubiquitin ligase complex; interacts with and regulates Met4p, localizes within the nucleus; dissociation of Met30p from SCF complex in response to cadmium stress is regulated by Cdc48p -S000036284 CDS YIL046W 9 268651 270573 W 2011-02-03 1994-12-10 -S000001307 ORF Verified YIL045W PIG2 putative protein phosphatase regulator PIG2 chromosome 9 L000001437 9 271161 272777 W 2011-02-03 1994-12-10 Putative type-1 protein phosphatase targeting subunit; tethers Glc7p type-1 protein phosphatase to Gsy2p glycogen synthase; PIG2 has a paralog, GIP2, that arose from the whole genome duplication -S000036173 CDS YIL045W 9 271161 272777 W 2011-02-03 1994-12-10 -S000001306 ORF Verified YIL044C AGE2 SAT2 chromosome 9 S000007503 9 273846 272950 C 2011-02-03 1994-12-10 ADP-ribosylation factor (ARF) GTPase activating protein (GAP) effector; involved in Trans-Golgi-Network (TGN) transport; contains C2C2H2 cysteine/histidine motif -S000035184 CDS YIL044C 9 273846 272950 C 2011-02-03 1994-12-10 -S000001305 ORF Verified YIL043C CBR1 CBR5 chromosome 9 L000000229 9 274926 274072 C 2011-02-03 1994-12-10|2006-01-23 Cytochrome b reductase; not essential for viability; also detected in mitochondria; mutation in conserved NADH binding domain of the human ortholog results in type I methemoglobinemia -S000035022 CDS YIL043C 9 274926 274072 C 2011-02-03 1994-12-10|2006-01-23 -S000001304 ORF Verified YIL042C PKP1 protein kinase PKP1 chromosome 9 9 276292 275108 C 2011-02-03 1994-12-10 Mitochondrial protein kinase; involved in negative regulation of pyruvate dehydrogenase complex activity by phosphorylating the ser-133 residue of the Pda1p subunit; acts in concert with kinase Pkp2p and phosphatases Ptc5p and Ptc6p -S000034870 CDS YIL042C 9 276292 275108 C 2011-02-03 1994-12-10 -S000001303 ORF Verified YIL041W GVP36 chromosome 9 9 276525 277505 W 2011-02-03 1994-12-10 BAR domain protein that localizes to early and late Golgi vesicles; required for adaptation to varying nutrient concentrations, fluid-phase endocytosis, polarization of the actin cytoskeleton, and vacuole biogenesis -S000034047 CDS YIL041W 9 276525 277505 W 2011-02-03 1994-12-10 -S000001302 ORF Verified YIL040W APQ12 chromosome 9 9 277723 278139 W 2011-02-03 1994-12-10 Nuclear envelope/ER integral membrane protein; interacts and functions with Brr6p and Brl1p in lipid homeostasis; mutants are defective in nuclear pore complex biogenesis, nuclear envelope morphology, mRNA export from the nucleus and are sensitive to sterol biosynthesis inhibitors and membrane fluidizing agents; exhibits synthetic lethal genetic interactions with genes involved in lipid metabolism -S000033887 CDS YIL040W 9 277723 278139 W 2011-02-03 1994-12-10 -S000001301 ORF Verified YIL039W TED1 chromosome 9 9 278426 279847 W 2011-02-03 1994-12-10 GPI-glycan remodelase; conserved phosphoesterase domain-containing protein; acts together with Emp24p/Erv25p in cargo exit from the ER; functional ortholog of mammalian GPI-glycan remodelase PGAP5; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) -S000035327 CDS YIL039W 9 278426 279847 W 2011-02-03 1994-12-10 -S000001300 ORF Verified YIL038C NOT3 CCR4-NOT core subunit NOT3 chromosome 9 L000001265 9 282652 280142 C 2011-02-03 1994-12-10 Component of the CCR4-NOT core complex, involved in mRNA decapping; involved in transcription initiation and elongation and in mRNA degradation; conserved lysine in human homolog of Not3p and Not5p is mutated in cancers -S000034315 CDS YIL038C 9 282652 280142 C 2011-02-03 1994-12-10 -S000001299 ORF Verified YIL037C PRM2 pheromone-regulated protein PRM2 chromosome 9 9 284999 283029 C 2011-02-03 1994-12-10 Pheromone-regulated protein; predicted to have 4 transmembrane segments and a coiled coil domain; regulated by Ste12p; required for efficient nuclear fusion -S000034252 CDS YIL037C 9 284999 283029 C 2011-02-03 1994-12-10 -S000001298 ORF Verified YIL036W CST6 SHF1|ACA2 chromosome 9 L000002995 9 285666 287429 W 2011-02-03 1994-12-10 Basic leucine zipper (bZIP) transcription factor from ATF/CREB family involved in stress-responsive regulatory network; mediates transcriptional activation of NCE103 in response to low CO2 levels; proposed to be a regulator of oleate responsive genes; involved in utilization of non-optimal carbon sources and chromosome stability; relocalizes to the cytosol in response to hypoxia; CST6 has a paralog, ACA1, that arose from the whole genome duplication -S000034215 CDS YIL036W 9 285666 287429 W 2011-02-03 1994-12-10 -S000001297 ORF Verified YIL035C CKA1 casein kinase 2 catalytic subunit CKA1 chromosome 9 L000000343 9 288908 287790 C -29 2011-02-03 1994-12-10 Alpha catalytic subunit of casein kinase 2 (CK2); a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerases; regulates Fkh1p-mediated donor preference during mating-type switching -S000032136 CDS YIL035C 9 288908 287790 C 2011-02-03 1994-12-10 -S000001296 ORF Verified YIL034C CAP2 F-actin-capping protein subunit beta chromosome 9 L000000215 9 290089 289226 C -28 2011-02-03 1994-12-10 Beta subunit of the capping protein heterodimer (Cap1p and Cap2p); capping protein (CP) binds to the barbed ends of actin filaments preventing further polymerization; localized predominantly to cortical actin patches; protein increases in abundance and relocalizes from bud neck to plasma membrane upon DNA replication stress -S000032026 CDS YIL034C 9 290089 289226 C 2011-02-03 1994-12-10 -S000001295 ORF Verified YIL033C BCY1 cAMP-dependent protein kinase regulatory subunit BCY1|SRA1 chromosome 9 L000002044 9 291669 290419 C -28 2011-02-03 1994-12-10 Regulatory subunit of the cyclic AMP-dependent protein kinase (PKA); PKA is a component of a signaling pathway that controls a variety of cellular processes, including metabolism, cell cycle, stress response, stationary phase, and sporulation -S000031897 CDS YIL033C 9 291669 290419 C 2011-02-03 1994-12-10 -S000001294 ORF Dubious YIL032C chromosome 9 9 292317 291961 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030897 CDS YIL032C 9 292317 291961 C 2011-02-03 1994-12-10 -S000001293 ORF Verified YIL031W ULP2 SUMO protease ULP2|SMT4 chromosome 9 L000001939 9 292633 295737 W 2011-02-03 1994-12-10 Peptidase that deconjugates Smt3/SUMO-1 peptides from proteins; plays a role in chromosome cohesion at centromeric regions and recovery from checkpoint arrest induced by DNA damage or DNA replication defects; potential Cdc28p substrate; human homolog PML implicated in promyelocytic leukemia can partially complement yeast null mutant -S000030862 CDS YIL031W 9 292633 295737 W 2011-02-03 1994-12-10 -S000028789 ORF Dubious YIL030W-A chromosome 9 9 295565 295903 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF ULP2/YIL031W -S000033536 CDS YIL030W-A 9 295565 295903 W 2011-02-03 2003-07-29 -S000028788 ORF Dubious YIL029W-A chromosome 9 9 299735 300106 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SSM4/YIL030C -S000033533 CDS YIL029W-A 9 299735 300106 W 2011-02-03 2003-07-29 -S000001292 ORF Verified YIL030C SSM4 E3 ubiquitin-protein ligase SSM4|KIS3|DOA10 chromosome 9 L000002087 9 300009 296050 C 2011-02-03 1994-12-10 Membrane-embedded ubiquitin-protein ligase; ER and inner nuclear membrane localized RING-CH domain E3 ligase involved in ER-associated protein degradation (ERAD); targets misfolded cytosolic/nucleoplasmic domains of soluble and membrane embedded proteins (ERAD-C) and a transmembrane domain containing substrate (ERAD-M), Sbh2p; C-terminal element (CTE), conserved in human ortholog MARCH10/TEB4, determines substrate selectivity -S000030668 CDS YIL030C 9 300009 296050 C 2011-02-03 1994-12-10 -S000006624 tRNA_gene tK(CUU)I chromosome 9 L000003874 9 300300 300228 C 2011-02-03 1994-12-10|2011-02-03 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced -S000036023 noncoding_exon tK(CUU)I 9 300300 300228 C 2011-02-03 1994-12-10|2011-02-03 -S000007013 long_terminal_repeat YILCdelta3 chromosome 9 9 300727 300409 C 2011-02-03 1994-12-10 Ty1 LTR -S000001291 ORF Uncharacterized YIL029C chromosome 9 9 301257 300829 C 2011-02-03 1994-12-10 Putative protein of unknown function; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO); YIL029C has a paralog, YPR071W, that arose from a single-locus duplication -S000031121 CDS YIL029C 9 301257 300829 C 2011-02-03 1994-12-10 -S000001290 ORF Dubious YIL028W chromosome 9 9 302100 302498 W 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000031076 CDS YIL028W 9 302100 302498 W 2011-02-03 1994-12-10 -S000001289 ORF Verified YIL027C EMC5 KRE27 chromosome 9 9 304104 303679 C 2011-02-03 1994-12-10 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response, and also shows K1 killer toxin resistance; homologous to worm B0334.15/EMC-5, fly CG15168, human MMGT -S000030935 CDS YIL027C 9 304104 303679 C 2011-02-03 1994-12-10 -S000001288 ORF Verified YIL026C IRR1 SCC3 chromosome 9 L000003590 9 307929 304477 C 2011-02-03 1994-12-10 Subunit of the cohesin complex; which is required for sister chromatid cohesion during mitosis and meiosis and interacts with centromeres and chromosome arms; relocalizes to the cytosol in response to hypoxia; essential for viability -S000029925 CDS YIL026C 9 307929 304477 C 2011-02-03 1994-12-10 -S000001287 ORF Dubious YIL025C chromosome 9 9 308575 308201 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000029834 CDS YIL025C 9 308575 308201 C 2011-02-03 1994-12-10 -S000001286 ORF Uncharacterized YIL024C chromosome 9 9 309171 308602 C 2011-02-03 1994-12-10 Putative protein of unknown function; non-essential gene; expression directly regulated by the metabolic and meiotic transcriptional regulator Ume6p -S000037819 CDS YIL024C 9 309171 308602 C 2011-02-03 1994-12-10 -S000001285 ORF Verified YIL023C YKE4 Zn(2+) transporter YKE4 chromosome 9 9 310426 309386 C 2011-02-03 1994-12-10 Zinc transporter; localizes to the ER; null mutant is sensitive to calcofluor white, leads to zinc accumulation in cytosol; ortholog of the mouse KE4 and member of the ZIP (ZRT, IRT-like Protein) family -S000035957 CDS YIL023C 9 310426 309386 C 2011-02-03 1994-12-10 -S000001284 ORF Verified YIL022W TIM44 protein translocase subunit TIM44|MPI1|MIM44|ISP45 chromosome 9 L000001138 9 311165 312460 W 2011-02-03 1994-12-10 Essential component of the TIM23 complex; tethers the import motor and regulatory factors (PAM complex) to the translocation channel (Tim23p-Tim17p core complex); TIM23 complex is short for the translocase of the inner mitochondrial membrane -S000035916 CDS YIL022W 9 311165 312460 W 2011-02-03 1994-12-10 -S000001283 ORF Verified YIL021W RPB3 DNA-directed RNA polymerase II core subunit RPB3|B44 chromosome 9 L000001677|L000001589 9 312905 313861 W -17 2011-02-03 1994-12-10 RNA polymerase II third largest subunit B44; part of central core; similar to prokaryotic alpha subunit -S000035800 CDS YIL021W 9 312905 313861 W 2011-02-03 1994-12-10 -S000028656 ORF Dubious YIL021C-A chromosome 9 9 313468 313199 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene RPB3/YIL021W; identified by gene-trapping, expression analysis, and genome-wide homology searching -S000032459 CDS YIL021C-A 9 313468 313199 C 2011-02-03 2003-07-29 -S000130160 ARS ARS918 chromosome 9 9 313861 314035 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000028787 ORF Dubious YIL020C-A chromosome 9 9 314051 313713 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps origin of replication ARS918, partially overlaps ORF RPB3/YIL021W -S000033532 CDS YIL020C-A 9 314051 313713 C 2011-02-03 2003-07-29 -S000001282 ORF Verified YIL020C HIS6 1-(5-phosphoribosyl)-5- ((5-phosphoribosylamino)methylideneamino)imidazole-4-carboxamide isomerase HIS6 chromosome 9 L000000783 9 314820 314035 C -17 2011-02-03 1994-12-10 Enzyme that catalyzes the fourth step in the histidine pathway; Phosphoribosylformimino-5-aminoimidazole carboxamide ribotide isomerase; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts -S000034720 CDS YIL020C 9 314820 314035 C 2011-02-03 1994-12-10 -S000001281 ORF Verified YIL019W FAF1 chromosome 9 9 315093 316133 W 2011-02-03 1994-12-10 Protein required for pre-rRNA processing; also required for 40S ribosomal subunit assembly -S000036117 CDS YIL019W 9 315093 316133 W 2011-02-03 1994-12-10 -S000001280 ORF Verified YIL018W RPL2B uL2|ribosomal 60S subunit protein L2B|L2|rp8|YL6|L5B|L2B|LOT2|RPL5A chromosome 9 L000001707 9 316768 317932 W 2011-02-03 1994-12-10 Ribosomal 60S subunit protein L2B; homologous to mammalian ribosomal protein L2 and bacterial L2; RPL2B has a paralog, RPL2A, that arose from the whole genome duplication; expression is upregulated at low temperatures -S000036024 CDS YIL018W 9 316768 316771 W 2011-02-03 1994-12-10 -S000036025 CDS YIL018W 9 317172 317932 W 2011-02-03 1994-12-10 -S000036026 intron YIL018W 9 316772 317171 W 2011-02-03 1994-12-10 -S000001279 ORF Verified YIL017C VID28 glucose-induced degradation complex subunit VID28|YIL017W|GID5 chromosome 9 9 320965 318200 C 2011-02-03 1994-12-10 GID Complex subunit, serves as adaptor for regulatory subunit Vid24p; protein involved in proteasome-dependent catabolite degradation of fructose-1,6-bisphosphatase (FBPase); localized to the nucleus and the cytoplasm -S000035053 CDS YIL017C 9 320965 318200 C 2011-02-03 1994-12-10 -S000001278 ORF Verified YIL016W SNL1 chromosome 9 L000004403 9 321454 321933 W 2011-02-03 1994-12-10 Ribosome-associated protein; proposed to act in protein synthesis and nuclear pore complex biogenesis and maintenance as well as protein folding; has similarity to the mammalian BAG-1 protein -S000035003 CDS YIL016W 9 321454 321933 W 2011-02-03 1994-12-10 -S000001277 ORF Verified YIL015W BAR1 aspartyl protease BAR1|SST1 chromosome 9 L000000160 9 322342 324105 W -12 2011-02-03 1994-12-10 Aspartyl protease; secreted into the periplasmic space of mating type a cell; helps cells find mating partners; cleaves and inactivates alpha factor allowing cells to recover from alpha-factor-induced cell cycle arrest -S000034859 CDS YIL015W 9 322342 324105 W 2011-02-03 1994-12-10 -S000006534 tRNA_gene tD(GUC)I1 chromosome 9 L000003873 9 324374 324303 C 2011-02-03 1994-12-10 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030656 noncoding_exon tD(GUC)I1 9 324374 324303 C 2011-02-03 1994-12-10 -S000007019 long_terminal_repeat YILWsigma3 chromosome 9 9 324391 324734 W 2011-02-03 1994-12-10 Ty3 LTR -S000007016 long_terminal_repeat YILWdelta4 chromosome 9 9 324831 325164 W 2011-02-03 1994-12-10 Ty1 LTR -S000003536 ORF Uncharacterized YIL014C-A YIL015C-A chromosome 9 9 325526 325212 C 2011-02-03 1994-12-10 Putative protein of unknown function -S000035773 CDS YIL014C-A 9 325526 325212 C 2011-02-03 1994-12-10 -S000006742 tRNA_gene tT(AGU)I2 chromosome 9 L000003870 9 325748 325820 W 2011-02-03 1994-12-10 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis -S000036347 noncoding_exon tT(AGU)I2 9 325748 325820 W 2011-02-03 1994-12-10 -S000001276 ORF Verified YIL014W MNT3 alpha-1,3-mannosyltransferase MNT3 chromosome 9 9 326103 327995 W 2011-02-03 1994-12-10 Alpha-1,3-mannosyltransferase; adds the fourth and fifth alpha-1,3-linked mannose residues to O-linked glycans during protein O-glycosylation -S000033990 CDS YIL014W 9 326103 327995 W 2011-02-03 1994-12-10 -S000001275 ORF Verified YIL013C PDR11 ATP-binding cassette multidrug transporter PDR11 chromosome 9 L000003163 9 332442 328207 C 2011-02-03 1994-12-10 ATP-binding cassette (ABC) transporter; multidrug transporter involved in multiple drug resistance; mediates sterol uptake when sterol biosynthesis is compromised; regulated by Pdr1p; required for anaerobic growth; PDR11 has a paralog, AUS1, that arose from the whole genome duplication -S000033824 CDS YIL013C 9 332442 328207 C 2011-02-03 1994-12-10 -S000001274 ORF Dubious YIL012W chromosome 9 9 333011 333352 W 2011-02-03 1994-12-10|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033748 CDS YIL012W 9 333011 333352 W 2011-02-03 1994-12-10|2011-02-03 -S000001273 ORF Verified YIL011W TIR3 YIB1 chromosome 9 9 333727 334536 W 2011-02-03 1994-12-10 Cell wall mannoprotein; member of Srp1p/Tip1p family of serine-alanine-rich proteins; expressed under anaerobic conditions and required for anaerobic growth; TIR3 has a paralog, TIR2, that arose from the whole genome duplication -S000033633 CDS YIL011W 9 333727 334536 W 2011-02-03 1994-12-10 -S000001272 ORF Verified YIL010W DOT5 thioredoxin peroxidase DOT5 chromosome 9 L000004392 9 334882 335529 W 2011-02-03 1994-12-10 Nuclear thiol peroxidase; functions as an alkyl-hydroperoxide reductase during post-diauxic growth -S000030341 CDS YIL010W 9 334882 335529 W 2011-02-03 1994-12-10 -S000006432 ORF Verified YIL009C-A EST3 telomerase subunit EST3 chromosome 9 L000004271 9 336212 335666 C 2011-02-03 1997-10-20 Component of the telomerase holoenzyme; involved in telomere replication; synthesis of the full-length protein results from a programmed +1 ribosomal frameshift -S000031928 CDS YIL009C-A 9 335935 335666 C 2011-02-03 1997-10-20 -S000031927 CDS YIL009C-A 9 336212 335937 C 2011-02-03 1997-10-20 -S000031929 plus_1_translational_frameshift YIL009C-A 9 335936 335936 C 2011-02-03 1997-10-20 -S000006535 tRNA_gene tD(GUC)I2 chromosome 9 L000003872 9 336420 336349 C 2011-02-03 1994-12-10 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis -S000030659 noncoding_exon tD(GUC)I2 9 336420 336349 C 2011-02-03 1994-12-10 -S000007014 long_terminal_repeat YILCdelta5 chromosome 9 9 336897 336708 C 2011-02-03 1994-12-10 Ty1 LTR -S000001271 ORF Verified YIL009W FAA3 long-chain fatty acid-CoA ligase FAA3 chromosome 9 L000000596 9 339344 341428 W 2011-02-03 1994-12-10 Long chain fatty acyl-CoA synthetase; activates imported fatty acids with a preference for C16:0-C18:0 chain lengths; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery -S000030759 CDS YIL009W 9 339344 341428 W 2011-02-03 1994-12-10 -S000118398 ARS ARS919 ARSIX-342 chromosome 9 9 341976 342045 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000001270 ORF Verified YIL008W URM1 ubiquitin-related modifier URM1 chromosome 9 S000007535 9 342536 342835 W 2011-02-03 1994-12-10 Ubiquitin-like protein involved in thiolation of cytoplasmic tRNAs; receives sulfur from the E1-like enzyme Uba4p and transfers it to tRNA; also functions as a protein tag with roles in nutrient sensing and oxidative stress response -S000030686 CDS YIL008W 9 342536 342835 W 2011-02-03 1994-12-10 -S000001269 ORF Verified YIL007C NAS2 chromosome 9 9 343656 342994 C 2011-02-03 1994-12-10 Evolutionarily conserved 19S regulatory particle assembly-chaperone; involved in assembly of the base subcomplex of the 19S proteasomal regulatory particle (RP); non-essential gene; interacts with Rpn4p; protein abundance increases in response to DNA replication stress; ortholog of human p27 -S000030556 CDS YIL007C 9 343656 342994 C 2011-02-03 1994-12-10 -S000001268 ORF Verified YIL006W YIA6 NAD+ transporter|NDT1 chromosome 9 9 344062 345183 W 2011-02-03 1994-12-10 Mitochondrial NAD+ transporter; involved in the transport of NAD+ into the mitochondria (see also YEA6); member of the mitochondrial carrier subfamily; disputed role as a pyruvate transporter; has putative mouse and human orthologs; YIA6 has a paralog, YEA6, that arose from the whole genome duplication -S000030529 CDS YIL006W 9 344062 345183 W 2011-02-03 1994-12-10 -S000001267 ORF Verified YIL005W EPS1 protein disulfide isomerase EPS1 chromosome 9 9 345692 347797 W 2011-02-03 1994-12-10 ER protein with chaperone and co-chaperone activity; involved in retention of resident ER proteins; has a role in recognizing proteins targeted for ER-associated degradation (ERAD), member of the protein disulfide isomerase family -S000030455 CDS YIL005W 9 345692 347797 W 2011-02-03 1994-12-10 -S000001266 ORF Verified YIL004C BET1 SLY12 chromosome 9 L000000171 9 348505 347946 C 2011-02-03 1994-12-10 Type II membrane protein required for vesicular transport; required for vesicular transport between the endoplasmic reticulum and Golgi complex; v-SNARE with similarity to synaptobrevins -S000037580 CDS YIL004C 9 348363 347946 C 2011-02-03 1994-12-10 -S000037579 CDS YIL004C 9 348505 348495 C 2011-02-03 1994-12-10 -S000037581 intron YIL004C 9 348494 348364 C 2011-02-03 1994-12-10 -S000001265 ORF Verified YIL003W CFD1 iron-sulfur cluster assembly protein CFD1|DRE3 chromosome 9 9 349122 350003 W 2011-02-03 1994-12-10 Highly conserved iron-sulfur cluster binding protein; localized in the cytoplasm; forms a complex with Nbp35p that is involved in iron-sulfur protein assembly in the cytosol -S000037556 CDS YIL003W 9 349122 350003 W 2011-02-03 1994-12-10 -S000028835 ORF Uncharacterized YIL002W-A chromosome 9 9 350301 350510 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034485 CDS YIL002W-A 9 350301 350510 W 2011-02-03 2003-07-29 -S000001264 ORF Verified YIL002C INP51 phosphoinositide 5-phosphatase INP51|SJL1 chromosome 9 L000003319 9 353431 350591 C 2011-02-03 1994-12-10 Phosphatidylinositol 4,5-bisphosphate 5-phosphatase; synaptojanin-like protein with an N-terminal Sac1 domain, plays a role in phosphatidylinositol 4,5-bisphosphate homeostasis and in endocytosis; null mutation confers cold-tolerant growth -S000032035 CDS YIL002C 9 353431 350591 C 2011-02-03 1994-12-10 -S000001263 ORF Uncharacterized YIL001W chromosome 9 9 353940 355481 W 2011-02-03 1994-12-10 Putative protein of unknown function; contains a BTB/POZ domain which generally function in protein interactions; deletion slightly improved competitive fitness in rich media; GFP-tagged protein is localized to the cytoplasm -S000031993 CDS YIL001W 9 353940 355481 W 2011-02-03 1994-12-10 -S000006470 centromere CEN9 CEN9 chromosome 9 L000000302 9 355629 355745 W 0 2011-02-03 1994-12-10|2006-05-09 Chromosome IX centromere -S000077275 centromere_DNA_Element_I CEN9 9 355629 355638 W 2011-02-03 2004-10-05 -S000077276 centromere_DNA_Element_II CEN9 9 355639 355720 W 2011-02-03 2004-10-05 -S000077277 centromere_DNA_Element_III CEN9 9 355721 355745 W 2011-02-03 2004-10-05 -S000001440 ORF Verified YIR001C SGN1 RBP29|RBP1 chromosome 9 9 356895 356143 C 2011-02-03 1994-12-10 Cytoplasmic RNA-binding protein; contains an RNA recognition motif (RRM); may have a role in mRNA translation, as suggested by genetic interactions with genes encoding proteins involved in translational initiation -S000032594 CDS YIR001C 9 356895 356143 C 2011-02-03 1994-12-10 -S000118399 ARS ARS920 ARSIX-357 chromosome 9 9 357160 357396 2011-02-03 2006-08-30 Autonomously Replicating Sequence -S000178117 ARS_consensus_sequence ARS920 9 357222 357238 W 2014-11-18 2014-11-18 -S000001441 ORF Verified YIR002C MPH1 3'-5' DNA helicase chromosome 9 9 360396 357415 C 2011-02-03 1994-12-10 3'-5' DNA helicase involved in error-free bypass of DNA lesions; binds flap DNA, stimulates activity of Rad27p and Dna2p; prevents crossovers between ectopic sequences by removing substrates for Mus81-Mms4 or Rad1-Rad10 cleavage; homolog of human FANCM Fanconi anemia protein that is involved in stabilizing and remodeling blocked replication forks; member of SF2 DExD/H superfamily of helicases; nonsense or missense mutations in FANCM can make people more likely to get cancer -S000032716 CDS YIR002C 9 360396 357415 C 2011-02-03 1994-12-10 -S000001442 ORF Verified YIR003W AIM21 chromosome 9 9 360885 362924 W 2011-02-03 1994-12-10 Protein of unknown function; involved in mitochondrial migration along actin filament; may interact with ribosomes; GFP-fusion protein colocalizes with Sac1p to the actin cytoskeleton -S000032876 CDS YIR003W 9 360885 362924 W 2011-02-03 1994-12-10 -S000130161 ARS ARS921 chromosome 9 9 362924 363221 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay -S000001443 ORF Verified YIR004W DJP1 PAS22|ICS1 chromosome 9 L000003966 9 363221 364519 W 2011-02-03 1994-12-10 Cytosolic J-domain-containing protein; required for peroxisomal protein import and involved in peroxisome assembly; facilitates import of Mim1p and Mim2p into the mitochondrial outer membrane; homologous to E. coli DnaJ -S000033586 CDS YIR004W 9 363221 364519 W 2011-02-03 1994-12-10 -S000001444 ORF Verified YIR005W IST3 U2 snRNP complex subunit IST3|SNU17 chromosome 9 9 364889 365335 W 2011-02-03 1994-12-10 Component of the U2 snRNP; required for the first catalytic step of splicing and for spliceosomal assembly; interacts with Rds3p and is required for Mer1p-activated splicing; diploid mutants have a specific defect in MATa1 pre-mRNA splicing which leads to haploid gene expression in diploids -S000033658 CDS YIR005W 9 364889 365335 W 2011-02-03 1994-12-10 -S000001445 ORF Verified YIR006C PAN1 DIM2|MIP3|MDP3 chromosome 9 L000001335 9 369908 365466 C 2011-02-03 1994-12-10 Part of actin cytoskeleton-regulatory complex Pan1p-Sla1p-End3p; associates with actin patches on cell cortex; promotes protein-protein interactions essential for endocytosis; binds to and activates Arp2/3 complex in vitro; phosphorylation of Thr-1225 is regulated by MAPK Hog1p in response to osmotic stress; previously thought to be a subunit of poly(A) ribonuclease -S000033724 CDS YIR006C 9 369908 365466 C 2011-02-03 1994-12-10 -S000006556 tRNA_gene tE(UUC)I chromosome 9 L000003871 9 370417 370488 W 2011-02-03 1994-12-10 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p -S000035987 noncoding_exon tE(UUC)I 9 370417 370488 W 2011-02-03 1994-12-10 -S000001446 ORF Verified YIR007W EGH1 hydrolase chromosome 9 9 370704 372998 W 2011-02-03 1994-12-10 Steryl-beta-glucosidase with broad specificity for aglycones; has a role in ergosteryl-beta-glucoside catabolism; required for normal vacuolar morphology; has similarity to the C. neoformans ergosteryl-beta-glucosidase EGCrP2; localizes to the cytosol -S000034669 CDS YIR007W 9 370704 372998 W 2011-02-03 1994-12-10 -S000001447 ORF Verified YIR008C PRI1 DNA primase subunit PRI1 chromosome 9 L000001489 9 374306 373077 C 2011-02-03 1994-12-10 Subunit of DNA primase; DNA primase is required for DNA synthesis and double-strand break repair -S000034753 CDS YIR008C 9 374306 373077 C 2011-02-03 1994-12-10 -S000001448 ORF Verified YIR009W MSL1 U2 snRNP complex subunit MSL1|YIB9|YIB9w chromosome 9 L000004502 9 374525 374860 W 2011-02-03 1994-12-10 U2B component of U2 snRNP; involved in splicing, binds the U2 snRNA stem-loop IV in vitro but requires association of Lea1p for in vivo binding; does not contain the conserved C-terminal RNA binding domain found in other family members -S000034977 CDS YIR009W 9 374525 374860 W 2011-02-03 1994-12-10 -S000001449 ORF Verified YIR010W DSN1 MIND complex subunit DSN1 chromosome 9 L000004645 9 375431 377161 W 2011-02-03 1994-12-10 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; Dsn1p phosphorylation promotes interaction between outer and inner kinetochore proteins; kinetochore receptor for monopolin, via interaction with subunit Csm1p; essential for meiotic but not mitotic chromosome segregation; MIND complex consists of Mtw1p, Nnf1p, Nsl1p and Dsn1p; modified by sumoylation; phosphorylated by monopolin subunit Hrr25p -S000035994 CDS YIR010W 9 375431 377161 W 2011-02-03 1994-12-10 -S000001450 ORF Verified YIR011C STS1 SSM5|DBF8 chromosome 9 L000000489 9 378246 377287 C 2011-02-03 1994-12-10 Protein required for localizing proteasomes to the nucleus; involved in cotranslational protein degradation; mediates interaction between nuclear import factor Srp1p and the proteasome; Sts1p and Srp1p couple proteasomes to nascent polypeptides emerging from the ribosome for cotranslational degradation; involved in ubiquitin-mediated protein degradation -S000036807 CDS YIR011C 9 378246 377287 C 2011-02-03 1994-12-10 -S000001451 ORF Verified YIR012W SQT1 chromosome 9 L000003431 9 378486 379781 W 2011-02-03 1994-12-10 Specific chaperone for ribosomal protein Rpl10p; binds nascent Rpl10p during translation; contains multiple WD repeats; interacts with Qsr1p in a two-hybrid assay; protein abundance increases in response to DNA replication stress -S000036906 CDS YIR012W 9 378486 379781 W 2011-02-03 1994-12-10 -S000001452 ORF Verified YIR013C GAT4 chromosome 9 S000007452 9 380384 380019 C 2011-02-03 1994-12-10 Protein containing GATA family zinc finger motifs; involved in spore wall assembly; sequence similarity to GAT3, and the double mutant gat3 gat4 exhibits reduced dityrosine fluorescence relative to the single mutants -S000036935 CDS YIR013C 9 380384 380019 C 2011-02-03 1994-12-10 -S000001453 ORF Uncharacterized YIR014W chromosome 9 9 381086 381814 W 2011-02-03 2003-09-22|1994-12-10 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; expression directly regulated by the metabolic and meiotic transcriptional regulator Ume6p; YIR014W is a non-essential gene -S000037725 CDS YIR014W 9 381086 381814 W 2011-02-03 2003-09-22|1994-12-10 -S000001454 ORF Verified YIR015W RPR2 ribonuclease P protein subunit RPR2 chromosome 9 L000004310 9 381948 382382 W 2011-02-03 1994-12-10 Subunit of nuclear RNase P; nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; not shared between RNase MRP and RNase P, in contrast to all other RNase P protein subunits; protein abundance increases in response to DNA replication stress -S000037806 CDS YIR015W 9 381948 382382 W 2011-02-03 1994-12-10 -S000001455 ORF Uncharacterized YIR016W chromosome 9 9 382628 383425 W 2011-02-03 1994-12-10 Putative protein of unknown function; expression directly regulated by the metabolic and meiotic transcriptional regulator Ume6p; overexpression causes a cell cycle delay or arrest; non-essential gene; YIR016W has a paralog, YOL036W, that arose from the whole genome duplication -S000037904 CDS YIR016W 9 382628 383425 W 2011-02-03 1994-12-10 -S000028799 ORF Dubious YIR017W-A chromosome 9 9 383566 384165 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000033566 CDS YIR017W-A 9 383566 384165 W 2011-02-03 2003-07-29 -S000001456 ORF Verified YIR017C MET28 chromosome 9 L000001092 9 384119 383556 C 2011-02-03 1994-12-10 bZIP transcriptional activator in the Cbf1p-Met4p-Met28p complex; participates in the regulation of sulfur metabolism -S000030791 CDS YIR017C 9 384119 383556 C 2011-02-03 1994-12-10 -S000001457 ORF Verified YIR018W YAP5 chromosome 9 L000004343 9 384609 385346 W 2011-02-03 1994-12-10 Basic leucine zipper (bZIP) iron-sensing transcription factor; involved in diauxic shift; YAP5 has a paralog, YAP7, that arose from the whole genome duplication -S000030914 CDS YIR018W 9 384609 385346 W 2011-02-03 1994-12-10 -S000028837 ORF Uncharacterized YIR018C-A chromosome 9 9 385701 385564 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034488 CDS YIR018C-A 9 385701 385564 C 2011-02-03 2003-07-29 -S000001458 ORF Verified YIR019C FLO11 MUC1|STA4 chromosome 9 L000002104 9 393675 389572 C 2011-02-03 1994-12-10 GPI-anchored cell surface glycoprotein (flocculin); required for pseudohyphal and invasive growth, flocculation, and biofilm formation; major determinant of colony morphology; transcription regulated by the MAPK pathway (Ste12p and Tec1p) and the cAMP pathway (Flo8p); required for formation of fibrous interconnections between cells of a wild strain; role in co-flocculation with other yeast species; cleaved and shed from cells, contributing to their surface properties -S000030936 CDS YIR019C 9 393675 389572 C 2011-02-03 1994-12-10 -S000001459 ORF Uncharacterized YIR020C chromosome 9 9 394557 394255 C 2011-02-03 1994-12-10 Protein of unknown function; mRNA identified as translated by ribosome profiling data; SWAT-GFP fusion protein localizes to the endoplasmic reticulum -S000032045 CDS YIR020C 9 394557 394255 C 2011-02-03 1994-12-10 -S000007241 ORF Dubious YIR020W-A YIR020W-B chromosome 9 9 394917 395159 W 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000034820 CDS YIR020W-A 9 394917 395159 W 2011-02-03 1999-07-17 -S000132614 ncRNA_gene PWR1 PWR1 chromosome 9 9 395999 396939 W 2011-02-03 2010-01-05 Intergenic regulatory ncRNA; one of two long ncRNAs that play key roles in regulating transcription of the nearby protein-coding ORF FLO11; PWR1 promotes FLO11 transcription by interfering with ncRNA ICR1, which is transcribed across the FLO11 promoter -S000132615 noncoding_exon PWR1 9 395999 396939 W 2011-02-03 2010-01-05 -S000132612 ncRNA_gene ICR1 ICR1 chromosome 9 9 397082 393884 C 2011-02-03 2010-01-05 Long intergenic regulatory ncRNA; has a key role in regulating transcription of the nearby protein-coding ORF FLO11; initiated far upstream from FLO11 and transcribed across much of the large promoter of FLO11, repressing FLO11 transcription in cis -S000132613 noncoding_exon ICR1 9 397082 393884 C 2011-02-03 2010-01-05 -S000001460 ORF Verified YIR021W MRS1 PET157 chromosome 9 9 397294 398385 W 2011-02-03 1994-12-10 Splicing protein; required for splicing of two mitochondrial group I introns (BI3 in COB and AI5beta in COX1); forms a splicing complex, containing four subunits of Mrs1p and two subunits of the BI3-encoded maturase, that binds to the BI3 RNA; MRS1 has a paralog, CCE1, that arose from the whole genome duplication -S000032999 CDS YIR021W 9 397294 398385 W 2011-02-03 1994-12-10 -S000028800 ORF Dubious YIR020C-B chromosome 9 9 397949 397215 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF MRS1 -S000033580 CDS YIR020C-B 9 397949 397215 C 2011-02-03 2003-07-29 -S000028838 ORF Uncharacterized YIR021W-A chromosome 9 9 398514 398726 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry -S000034490 CDS YIR021W-A 9 398514 398726 W 2011-02-03 2003-07-29 -S000001461 ORF Verified YIR022W SEC11 signal peptidase complex catalytic subunit SEC11 chromosome 9 L000001836 9 398733 399236 W 22 2011-02-03 1994-12-10 18kDa catalytic subunit of the Signal Peptidase Complex (SPC); the Signal Peptidase Complex cleaves the signal sequence of proteins targeted to the endoplasmic reticulum; other members are Spc1p, Spc2p, Spc3p, and Sec11p -S000033111 CDS YIR022W 9 398733 399236 W 2011-02-03 1994-12-10 -S000001462 ORF Verified YIR023W DAL81 DURL|UGA35 chromosome 9 L000000481 9 399777 402689 W 22 2011-02-03 1994-12-10 Positive regulator of genes in multiple nitrogen degradation pathways; contains DNA binding domain but does not appear to bind the dodecanucleotide sequence present in the promoter region of many genes involved in allantoin catabolism -S000033187 CDS YIR023W 9 399777 402689 W 2011-02-03 1994-12-10 -S000028801 ORF Dubious YIR023C-A chromosome 9 9 402706 402383 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF DAL81/YIR023W -S000033581 CDS YIR023C-A 9 402706 402383 C 2011-02-03 2003-07-29 -S000001463 ORF Verified YIR024C INA22 GIF1 chromosome 9 L000004438 9 403491 402841 C 2011-02-03 1994-12-10 F1F0 ATP synthase peripheral stalk assembly factor; subunit of the matrix-exposed inner mitochondrial membrane localized INA complex (Ina22p-Ina17p) involved in assembly of the F1F0 peripheral stalk; co-purifies with Aim43p, ATP synthase subunits, and cytochrome bc1 complex assembly factors; interacts with Arh1p, a mitochondrial oxidoreductase; deletion mutant has a respiratory growth defect -S000033910 CDS YIR024C 9 403491 402841 C 2011-02-03 1994-12-10 -S000001464 ORF Verified YIR025W MND2 chromosome 9 9 403659 404765 W 2011-02-03 1994-12-10 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); necessary for maintaining sister chromatid cohesion in prophase I of meiosis by inhibiting premature ubiquitination and subsequent degradation of substrates by the APC(Ama1) ubiquitin ligase -S000034094 CDS YIR025W 9 403659 404765 W 2011-02-03 1994-12-10 -S000001465 ORF Verified YIR026C YVH1 tyrosine protein phosphatase YVH1 chromosome 9 L000002567 9 405967 404873 C 31 2011-02-03 1994-12-10 Dual specificity protein phosphatase; regulates growth, sporulation, and glycogen accumulation in a cAMP-dependent protein kinase cascade dependent manner; mutants are defective in 60S ribosome assembly; positively regulates pre-autophagosomal structure (PAS) formation upon nitrogen starvation or rapamycin treatment -S000034138 CDS YIR026C 9 405967 404873 C 2011-02-03 1994-12-10 -S000001466 ORF Verified YIR027C DAL1 allantoinase chromosome 9 L000000474 9 407642 406260 C 32.1 2011-02-03 1994-12-10 Allantoinase; converts allantoin to allantoate in the first step of allantoin degradation; expression sensitive to nitrogen catabolite repression -S000034253 CDS YIR027C 9 407642 406260 C 2011-02-03 1994-12-10 -S000001467 ORF Verified YIR028W DAL4 allantoin permease chromosome 9 L000000477 9 408468 410375 W 34 2011-02-03 1994-12-10 Allantoin permease; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation -S000035258 CDS YIR028W 9 408468 410375 W 2011-02-03 1994-12-10 -S000001468 ORF Verified YIR029W DAL2 allantoicase|ALC1 chromosome 9 L000000475 9 410807 411838 W 36.1 2011-02-03 1994-12-10 Allantoicase; converts allantoate to urea and ureidoglycolate in the second step of allantoin degradation; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation -S000035347 CDS YIR029W 9 410807 411838 W 2011-02-03 1994-12-10 -S000118400 ARS ARS922 ARSIX-412 chromosome 9 9 411935 412011 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence -S000178118 ARS_consensus_sequence ARS922 9 412001 411985 C 2014-11-18 2014-11-18 -S000001469 ORF Verified YIR030C DCG1 chromosome 9 L000000497 9 412770 412036 C 36.4 2011-02-03 1994-12-10 Protein of unknown function; expression is sensitive to nitrogen catabolite repression and regulated by Dal80p; contains transmembrane domain -S000036237 CDS YIR030C 9 412770 412036 C 2011-02-03 1994-12-10 -S000028802 ORF Dubious YIR030W-A chromosome 9 9 412899 413282 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF DAL7/YIR031C -S000033582 CDS YIR030W-A 9 412899 413282 W 2011-02-03 2003-07-29 -S000001470 ORF Verified YIR031C DAL7 malate synthase DAL7|MSL2|MLS2 chromosome 9 L000000479 9 414679 413015 C 36.9 2011-02-03 1994-12-10 Malate synthase; can accept butyryl-CoA as acyl-CoA donor in addition to traditional substrate acetyl-CoA; recycles glyoxylate generated during allantoin degradation; SWAT-GFP and mCherry fusion proteins localize to the cytosol; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation -S000031686 CDS YIR031C 9 414679 413015 C 2011-02-03 1994-12-10 -S000001471 ORF Verified YIR032C DAL3 ureidoglycolate hydrolase chromosome 9 L000000476 9 415617 415030 C 37 2011-02-03 1994-12-10 Ureidoglycolate lyase; converts ureidoglycolate to glyoxylate and urea in the third step of allantoin degradation; expression is sensitive to nitrogen catabolite repression; this enzyme is sometimes referred to "ureidoglycolate hydrolase" but should not be confused with the Arabidopsis thaliana ureidoglycolate hydrolase enzyme which converts ureidoglycolate to glyoxylate, ammonia and carbon dioxide -S000031829 CDS YIR032C 9 415617 415030 C 2011-02-03 1994-12-10 -S000001472 ORF Verified YIR033W MGA2 chromosome 9 L000004181 9 416124 419465 W 2011-02-03 1994-12-10 ER membrane protein involved in regulation of OLE1 transcription; inactive ER form dimerizes and one subunit is then activated by ubiquitin/proteasome-dependent processing followed by nuclear targeting; MGA2 has a paralog, SPT23, that arose from the whole genome duplication -S000032031 CDS YIR033W 9 416124 419465 W 2011-02-03 1994-12-10 -S000001473 ORF Verified YIR034C LYS1 saccharopine dehydrogenase (NAD+, L-lysine-forming) chromosome 9 L000000964 9 420736 419615 C 40 2011-02-03 1994-12-10 Saccharopine dehydrogenase (NAD+, L-lysine-forming); catalyzes the conversion of saccharopine to L-lysine, which is the final step in the lysine biosynthesis pathway; also has mRNA binding activity -S000037430 CDS YIR034C 9 420736 419615 C 2011-02-03 1994-12-10 -S000001474 ORF Uncharacterized YIR035C sepiapterin reductase family protein chromosome 9 9 421790 421026 C 2011-02-03 1994-12-10 Putative cytoplasmic short-chain dehydrogenase/reductase -S000037528 CDS YIR035C 9 421790 421026 C 2011-02-03 1994-12-10 -S000028803 ORF Dubious YIR036W-A chromosome 9 9 422635 423036 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF IRC24/YIR036C -S000033584 CDS YIR036W-A 9 422635 423036 W 2011-02-03 2003-07-29 -S000001475 ORF Verified YIR036C IRC24 sepiapterin reductase family protein IRC24 chromosome 9 9 422865 422074 C 2011-02-03 1994-12-10 Putative benzil reductase;(GFP)-fusion protein localizes to the cytoplasm and is induced by the DNA-damaging agent MMS; sequence similarity with short-chain dehydrogenase/reductases; null mutant has increased spontaneous Rad52p foci -S000037606 CDS YIR036C 9 422865 422074 C 2011-02-03 1994-12-10 -S000001476 ORF Verified YIR037W HYR1 peroxiredoxin HYR1|ORP1|GPX3 chromosome 9 L000002612 9 423128 423619 W 2011-02-03 1994-12-10 Thiol peroxidase; functions as a hydroperoxide receptor to sense intracellular hydroperoxide levels and transduce a redox signal to the Yap1p transcription factor; HYR1 has a paralog, GPX1, that arose from the whole genome duplication -S000030468 CDS YIR037W 9 423128 423619 W 2011-02-03 1994-12-10 -S000001477 ORF Verified YIR038C GTT1 bifunctional glutathione transferase/peroxidase chromosome 9 L000004612 9 424513 423809 C 2011-02-03 1994-12-10 ER associated glutathione S-transferase capable of homodimerization; expression induced during the diauxic shift and throughout stationary phase; functional overlap with Gtt2p, Grx1p, and Grx2p -S000030525 CDS YIR038C 9 424513 423809 C 2011-02-03 1994-12-10 -S000007021 long_terminal_repeat YIRCdelta6 chromosome 9 9 426425 426201 C 2011-02-03 1994-12-10 Ty1 LTR -S000001478 ORF Verified YIR039C YPS6 aspartyl protease chromosome 9 L000004386 9 432111 430498 C 2011-02-03 1994-12-10 Putative GPI-anchored aspartic protease; member of the yapsin family of proteases involved in cell wall growth and maintenance -S000030600 CDS YIR039C 9 432111 430498 C 2011-02-03 1994-12-10 -S000001479 ORF Dubious YIR040C chromosome 9 9 433721 433389 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data -S000030026 CDS YIR040C 9 433721 433389 C 2011-02-03 1994-12-10 -S000001480 ORF Verified YIR041W PAU15 seripauperin PAU15 chromosome 9 9 433929 434303 W 2011-02-03 1994-12-10 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole -S000030194 CDS YIR041W 9 433929 434303 W 2011-02-03 1994-12-10 -S000001481 ORF Uncharacterized YIR042C chromosome 9 9 435983 435273 C 2011-02-03 1994-12-10 Putative protein of unknown function; YIR042C is a non-essential gene -S000030300 CDS YIR042C 9 435983 435273 C 2011-02-03 1994-12-10 -S000001482 blocked_reading_frame YIR043C YIR044C chromosome 9 9 438179 437043 C 2014-11-18 1994-12-10|2014-11-18 Blocked reading frame; may encode a non-functional member of the conserved, often subtelomerically-encoded Cos protein family -S000030384 CDS YIR043C 9 438179 437043 C 2014-11-18 1994-12-10|2014-11-18 -S000028970 telomere TEL09R chromosome 9 9 439068 439888 W 43 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome IX; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats -S000028971 telomeric_repeat TEL09R 9 439816 439888 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome IX -S000028972 X_element TEL09R 9 439068 439533 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome IX; contains an ARS consensus sequence and an Abf1p binding site consensus sequence -S000028973 X_element_combinatorial_repeat TEL09R 9 439534 439815 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr IX; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats -S000178596 not physically mapped OTO1 Protein whose overexpression inhibits growth; encoded by a previously unannotated ORF located between YGR227W and YGR228W in the "C" direction; overexpression of PRM1 or UBP7 suppresses the growth inhibition caused by OTO1 overexpression; "orphan" ORF not conserved in any other known species -S000182414 not physically mapped SMT1 -S000029044 not physically mapped ASL1 S000029006 -S000155235 not physically mapped PDR19 -S000155237 not physically mapped PDR20 -S000155238 not physically mapped PDR21 -S000183332 not physically mapped HTC1 -S000183742 not physically mapped YPL2 -S000183740 not physically mapped YPL1 -S000151128 not physically mapped AIP5 -S000029237 not in systematic sequence of S288C KHR1 KHR1 KHR L000000899 Killer toxin; encoded on the left arm of chromosome IX in some strains, including YJM789 -S000029522 not in systematic sequence of S288C STA1 STA1 MAL5|DEX2 chromosome 9 L000003928 9 Glucoamylase (glucan 1,4-alpha-glucosidase) -S000029524 not in systematic sequence of S288C STA2 STA2 L000002105 Glucoamylase (glucan 1,4-alpha-glucosidase); allows yeast to degrade starch -S000029525 not in systematic sequence of S288C STA3 STA3 L000002106 Starch hydrolysis -S000029679 not in systematic sequence of S288C STRP STRP L000002135 Transmembrane protein with a highly basic C-terminal region -S000029531 not in systematic sequence of S288C SUC1 SUC1 chromosome 7 L000002143 7 228 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) -S000029532 not in systematic sequence of S288C SUC3 SUC3 chromosome 2 L000002145 2 146 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) -S000029533 not in systematic sequence of S288C SUC4 SUC4 SUC6 chromosome 13 L000002146 13 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) -S000029534 not in systematic sequence of S288C SUC5 SUC5 chromosome 4 L000002147 4 -152 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) -S000029535 not in systematic sequence of S288C SUC7 SUC7 chromosome 8 L000002148 8 Invertase; sucrose hydrolyzing enzyme; seven related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in strain S288C; unlike other forms of invertase, Suc7p is unable to hydrolyze raffinose -S000029417 not in systematic sequence of S288C RF2 RF2 chromosome 17 S000007533 17 Maturase-like coding sequence downstream of COX3/Q0275; present in some S. cerevisiae strains and other Saccharomyces species; compound ORF with homology to other group I open reading frames; in S288C is interrupted by two GC clusters, both of which ultimately result in a -1 frameshlft -S000029677 not in systematic sequence of S288C RTM1 RTM1 L000001785 Member of the lipid-translocating exporter (LTE) family; present in multiple copies associated with SUC telomeric loci, amplified in yeasts used for industrial biomass or ethanol production with molasses as substrate -S000029656 not in systematic sequence of S288C MAL2 MAL2 chromosome 3 L000001001 3 95 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL23 trans-acting MAL-activator, MAL21 maltose permease, and MAL22 maltase; on the right arm of Chromosome III, but not in strain S288C -S000029681 not in systematic sequence of S288C MAL21 MAL21 MALT L000001011 Maltose permease; part of the complex locus MAL2 -S000029682 not in systematic sequence of S288C MAL22 MAL22 MALS L000001012 Maltase (alpha-D-glucosidase); encoded within the complex locus MAL2 -S000029685 not in systematic sequence of S288C MAL4 MAL4 chromosome 11 L000001006 11 85 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL43 trans-acting MAL-activator, MAL41 maltose permease, and MAL42 maltase; on right arm of Chromosome XI, but not in strain S288C -S000029686 not in systematic sequence of S288C MAL41 MAL41 MALT L000001018 Maltose permease; part of the complex locus MAL4 -S000029687 not in systematic sequence of S288C MAL42 MAL42 MALS L000001019 Maltase (alpha-D-glucosidase); encoded within the complex locus MAL4 -S000029688 not in systematic sequence of S288C MAL43 MAL43 MALR L000001020 MAL-activator protein; encoded within the complex locus MAL4 -S000029689 not in systematic sequence of S288C MAL6 MAL6 L000001007 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL63 trans-acting MAL-activator, MAL61 maltose permease, and MAL62 maltase; on the left arm of Chromosome VIII, but not in strain S288C -S000029690 not in systematic sequence of S288C MAL62 MAL62 MALS L000001022 Maltase (alpha-D-glucosidase); encoded within the complex locus MAL6 -S000029659 not in systematic sequence of S288C MAL63 MAL63 MALR L000001023 MAL-activator protein; transcription factor; part of the complex locus MAL6, plays a positive role in the regulation of maltose fermentation -S000029660 not in systematic sequence of S288C MATA1 MATA1 A1 L000002970 Expressed copy (at MATa) of a1; homeobox-domain protein that, along with alpha2, represses transcription of haploid-specific genes in diploid cells; MATa1 pre-mRNA splicing requires Bud13p and Ist3p; a1 sequence is not present in SGD because the sequenced S288C strain is MATalpha, not MATa -S000029661 not in systematic sequence of S288C MATA2 MATA2 A2 L000002971 Protein of unknown function; identical to the C-terminal 119 amino acid residues of the MATalpha2 protein; a2 sequence is not present in SGD because the sequenced S288C strain is MATalpha, not MATa -S000029662 not in systematic sequence of S288C MEL1 MEL1 chromosome 2 L000001063 2 -77 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose; regulated by several GAL genes -S000029692 not in systematic sequence of S288C MEL10 MEL10 chromosome 12 L000001072 12 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029663 not in systematic sequence of S288C MEL2 MEL2 L000001064 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029693 not in systematic sequence of S288C MEL3 MEL3 chromosome 16 L000001065 16 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029694 not in systematic sequence of S288C MEL4 MEL4 chromosome 11 L000001066 11 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029664 not in systematic sequence of S288C MEL5 MEL5 chromosome 4 L000001067 4 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029665 not in systematic sequence of S288C MEL6 MEL6 chromosome 13 L000001068 13 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029695 not in systematic sequence of S288C MEL7 MEL7 chromosome 6 L000001069 6 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029696 not in systematic sequence of S288C MEL8 MEL8 chromosome 15 L000001070 15 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029697 not in systematic sequence of S288C MEL9 MEL9 L000001071 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose -S000029666 not in systematic sequence of S288C MPR1 MPR1 S000007536 L-azetidine-2-carboxylic acid acetyltransferase; reduces intracellular ROS and contributes to L-proline analog resistance and tolerance to ethanol and freezing; member of N-acetyltransferase superfamily; not found in S288C, only present in strains with Sigma1278b background; located on left arm of chromosome XIV approximately 15 kb from telomere -S000029328 not in systematic sequence of S288C NTS1-1 NTS1-1 NTS1 L000001282 Nontranscribed region of the rDNA repeat between the 3'ETS and RDN5; required for rDNA repeat expansion; contains RNA polymerase I termination site -S000080162 not in systematic sequence of S288C KHS1 KHS1 Thermolabile killer toxin encoded on the right arm of Chromosome V -S000029703 not in systematic sequence of S288C AWA1 AWA1 Putative GPI-anchored protein; localized to the cell wall; involved in foam formation in sake mash by conferring hydrophobicity to the cell surface -S000029723 not in systematic sequence of S288C YAR069W-A BIO6 Putative 7-keto-8-aminopelargonic acid (KAPA) synthetase; in sake strains and S. cerevisiae strains YJM627 and A364a; involved in the biotin biosynthesis pathway; homologs present in S. bayanus, S. paradoxus, S. mikatae and S. kudriavzevii -S000029698 not in systematic sequence of S288C ENS2 ENS2 Endo.SceI|RF3 L000001619|L000000562 Mitochondrially-encoded 50 kD subunit of Endo.SceI; a dimeric multi-site-specific endonuclease that introduces double-stranded breaks at a number of well-defined sites on the mitochondrial DNA, inducing homologous recombination -S000134352 not in systematic sequence of S288C SUC8 SUC8 chromosome 10 10 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) -S000130715 not in systematic sequence of S288C ENA6 ENA6 chromosome 4 4 Plasma membrane sodium-pumping ATPase; the ENA6 gene is found in the PMR2 locus in the CEN.PK113-7D strain of S. cerevisiae, where other common lab strains have a varying number of the ENA genes (ENA1-ENA5) at the same locus -S000124112 not in systematic sequence of S288C TAT3 TAT3 Permease identified in lager brewing yeast strain Weihenstephan Nr.34; also in RM11-1a, but not S288C; subject to nitrogen catabolite repression and post-translational control, cellular localization dependent on nitrogen source quality -S000124955 not in systematic sequence of S288C MATA MATA MAT Mating type locus; note that the systematic sequence in SGD contains MATalpha sequences -S000125018 not in systematic sequence of S288C YAR070W-A BIO1 Putative pimeloyl-CoA synthetase involved in biotin biosynthesis; highly degraded pseudogenic paralog of YJR154W; functional copies present in S. cerevisiae strains YJM627 and A364a; functional pimeloyl-CoA synthetase (PCAS) genes are homologs of the bioW gene in Bacillus sp. and the bioC-bioH complex of E. coli -S000125021 not in systematic sequence of S288C YHR214W-F BIO8 Putative 7-keto-8-aminopelargonic acid (KAPA) synthetase; highly degraded pseudogenic copy of BIO6/YAR069W-A; functional copy present in S. cerevisiae strains YJM627 and A364a; involved in the biotin biosynthesis pathway -S000125022 not in systematic sequence of S288C YHR214W-G BIO7 Putative pimeloyl-CoA synthetase involved in biotin biosynthesis; in S. cerevisiae strains YJM627 and A364a; highly degraded pseudogenic copy of BIO1/YAR070W-A, which is a paralog of YJR154W -S000029657 not in systematic sequence of S288C MAL23 MAL23 MALR L000001013 MAL-activator protein; encoded within the complex locus MAL2; required for maltose and isomaltose utilization -S000029684 not in systematic sequence of S288C MAL34 MAL34 L000001017 ORF with sequence and positional similarity to the MAL64 gene; the MAL64 gene is thought to be a nonfunctional copy of MAL63; encoded within the complex locus MAL3 in some strains of S. cerevisiae, but not in S288C -S000029691 not in systematic sequence of S288C MAL64 MAL64 L000001024 MAL64 is a nonfunctional homolog of the MAL63 trans-activator; encoded within the complex locus MAL6 -S000029658 not in systematic sequence of S288C MAL61 MAL61 MALT L000001021 High-affinity maltose transporter; narrow substrate specificity, transporting maltose and turanose but not other alpha-glucosides; other names include alpha-glucoside transporter and maltose permease -S000145155 not in systematic sequence of S288C FPG1 FPG1 Putative cell wall mannoprotein involved in foam formation; contains a signal peptide and a putative GPI anchor; protein precursor homologous to Awa1p and Hpf1p -S000133140 not in systematic sequence of S288C XDH1 XDH1 chromosome 15 15 Xylitol dehydrogenase; involved in utilization of xylose as a carbon source; not present in S288C, but located in a 65kb insertion on the right arm of chromosome XV in many wine strains such as EC1118 and AWRI1631 -S000149345 not in systematic sequence of S288C IMI1 IMI1 Protein involved in maintaining mitochondrial integrity and glutathione homeostasis; localized to the cytoplasm; in W303 strain IMI1 is encoded by one continuous open reading frame comprising of YDL037C, the intergenic region and YDL039C, while in the reference sequence of S288C, YDL037C encodes Bsc1p and YDL039C encodes Prm7p. -S000150108 not in systematic sequence of S288C MPR2 MPR2 L-azetidine-2-carboxylic acid acetyltransferase; reduces intracellular ROS, contributes to L-proline analog resistance and tolerance to ethanol and freezing; member of N-acetyltransferase superfamily; not found in S288C, present in strains with Sigma1278b background; located on left arm of Chr X ~ 15 kb from telomere; identical to MPR1 except for one base at position 254, leading to Gly at position 85 in MPR1 and Glu in MPR2; present also in Japanese industrial baker's yeast +S000002143 ORF Dubious YAL069W chromosome 1 1 335 649 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031098 CDS YAL069W 1 335 649 W 1996-07-31 1996-07-31 +S000028594 ORF Dubious YAL068W-A chromosome 1 1 538 792 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031372 CDS YAL068W-A 1 538 792 W 2003-07-29 2003-07-29 +S000121252 ARS ARS102 ARSI-1 chromosome 1 1 707 776 2014-11-18 2014-11-18|2007-03-07 Autonomously Replicating Sequence +S000028862 telomere TEL01L chromosome 1 1 801 1 C -64 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome I; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028864 telomeric_repeat TEL01L 1 62 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome I +S000028865 X_element TEL01L 1 801 337 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome I; contains an ARS consensus sequence, an Abf1p binding site consensus sequence and two small overlapping ORFs (YAL068W-A and YAL069W) +S000028866 X_element_combinatorial_repeat TEL01L 1 336 63 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr I; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000002142 ORF Verified YAL068C PAU8 seripauperin PAU8 chromosome 1 1 2169 1807 C 1996-07-31 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions +S000030944 CDS YAL068C 1 2169 1807 C 1996-07-31 1996-07-31 +S000028593 ORF Uncharacterized YAL067W-A chromosome 1 1 2480 2707 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031368 CDS YAL067W-A 1 2480 2707 W 2003-07-29 2003-07-29 +S000121253 ARS ARS103 ARSI-8 chromosome 1 1 7997 8547 2011-02-03 2007-03-07 Autonomously Replicating Sequence; replication origin of very weak function +S000000062 ORF Verified YAL067C SEO1 putative permease SEO1 chromosome 1 L000003363 1 9016 7235 C 2011-02-03 1996-07-31 Putative permease; member of the allantoate transporter subfamily of the major facilitator superfamily; mutation confers resistance to ethionine sulfoxide +S000029932 CDS YAL067C 1 9016 7235 C 2011-02-03 1996-07-31 +S000000061 ORF Dubious YAL066W chromosome 1 1 10091 10399 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029887 CDS YAL066W 1 10091 10399 W 2011-02-03 1996-07-31 +S000001817 ORF Uncharacterized YAL065C chromosome 1 1 11951 11565 C 2011-02-03 1996-07-31 Putative protein of unknown function; shows sequence similarity to FLO1 and other flocculins +S000037154 CDS YAL065C 1 11951 11565 C 2011-02-03 1996-07-31 +S000002141 ORF Uncharacterized YAL064W-B chromosome 1 1 12046 12426 W 2011-02-03 1999-07-17 Fungal-specific protein of unknown function +S000034793 CDS YAL064W-B 1 12046 12426 W 2011-02-03 1999-07-17 +S000002140 ORF Uncharacterized YAL064C-A TDA8 YAL065C-A chromosome 1 1 13743 13363 C 2011-02-03 1996-07-31 Putative protein of unknown function; null mutant is sensitive to expression of the top1-T722A allele; not an essential gene +S000031541 CDS YAL064C-A 1 13743 13363 C 2011-02-03 1996-07-31 +S000000060 ORF Verified YAL064W chromosome 1 1 21566 21850 W 2011-02-03 1996-07-31|2011-02-03 Protein of unknown function; may interact with ribosomes, based on co-purification experiments +S000037087 CDS YAL064W 1 21566 21850 W 2011-02-03 1996-07-31|2011-02-03 +S000006787 long_terminal_repeat YALWdelta1 chromosome 1 1 22230 22552 W 2011-02-03 2000-05-19 Ty1 LTR +S000028813 ORF Uncharacterized YAL063C-A chromosome 1 1 22685 22395 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000033613 CDS YAL063C-A 1 22685 22395 C 2011-02-03 2003-07-29 +S000000059 ORF Verified YAL063C FLO9 flocculin FLO9 chromosome 1 L000003331 1 27968 24000 C 2011-02-03 1996-07-31 Lectin-like protein with similarity to Flo1p; thought to be expressed and involved in flocculation +S000036982 CDS YAL063C 1 27968 24000 C 2011-02-03 1996-07-31 +S000118317 ARS ARS104 ARSI-31 chromosome 1 1 30946 31183 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178034 ARS_consensus_sequence ARS104 1 31002 31018 W 2014-11-18 2014-11-18 +S000000058 ORF Verified YAL062W GDH3 glutamate dehydrogenase (NADP(+)) GDH3|FUN51 chromosome 1 L000000698 1 31567 32940 W 2011-02-03 1996-07-31 NADP(+)-dependent glutamate dehydrogenase; synthesizes glutamate from ammonia and alpha-ketoglutarate; rate of alpha-ketoglutarate utilization differs from Gdh1p; expression regulated by nitrogen and carbon sources; GDH3 has a paralog, GDH1, that arose from the whole genome duplication +S000036963 CDS YAL062W 1 31567 32940 W 2011-02-03 1996-07-31 +S000000057 ORF Uncharacterized YAL061W BDH2 putative dehydrogenase BDH2 chromosome 1 1 33448 34701 W 2011-02-03 1996-07-31 Putative medium-chain alcohol dehydrogenase with similarity to BDH1; transcription induced by constitutively active PDR1 and PDR3 +S000036902 CDS YAL061W 1 33448 34701 W 2011-02-03 1996-07-31 +S000000056 ORF Verified YAL060W BDH1 (R,R)-butanediol dehydrogenase|BDH chromosome 1 1 35155 36303 W 2011-02-03 1996-07-31|2011-02-03 NAD-dependent (R,R)-butanediol dehydrogenase; catalyzes oxidation of (R,R)-2,3-butanediol to (3R)-acetoin, oxidation of meso-butanediol to (3S)-acetoin, and reduction of acetoin; enhances use of 2,3-butanediol as an aerobic carbon source +S000036089 CDS YAL060W 1 35155 36303 W 2011-02-03 1996-07-31|2011-02-03 +S000000055 ORF Verified YAL059W ECM1 chromosome 1 L000003052 1 36509 37147 W 2011-02-03 1996-07-31|2011-02-03 Pre-ribosomal factor involved in 60S ribosomal protein subunit export; associates with the pre-60S particle; shuttles between the nucleus and cytoplasm +S000035122 CDS YAL059W 1 36509 37147 W 2011-02-03 1996-07-31|2011-02-03 +S000028734 ORF Dubious YAL059C-A chromosome 1 1 36918 36496 C 2011-02-03 2003-07-29|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene ECM1/YAL059W +S000033378 CDS YAL059C-A 1 36918 36496 C 2011-02-03 2003-07-29|2011-02-03 +S000000054 ORF Verified YAL058W CNE1 calnexin|FUN48 chromosome 1 L000000373 1 37464 38972 W 2011-02-03 1996-07-31 Calnexin; integral membrane ER chaperone involved in folding and quality control of glycoproteins; chaperone activity is inhibited by Mpd1p, with which Cne1p interacts; 24% identical to mammalian calnexin; Ca+ binding not yet shown in yeast +S000034933 CDS YAL058W 1 37464 38972 W 2011-02-03 1996-07-31 +S000002139 ORF Dubious YAL056C-A YAL058C-A chromosome 1 1 39046 38696 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035879 CDS YAL056C-A 1 39046 38696 C 2011-02-03 1996-07-31 +S000000052 ORF Verified YAL056W GPB2 KRH1 chromosome 1 1 39259 41901 W 2011-02-03 2004-01-20|1996-07-31|2011-02-03 Multistep regulator of cAMP-PKA signaling; inhibits PKA downstream of Gpa2p and Cyr1p, thereby increasing cAMP dependency; inhibits Ras activity through direct interactions with Ira1p/2p; regulated by G-alpha protein Gpa2p; GPB2 has a paralog, GPB1, that arose from the whole genome duplication +S000033885 CDS YAL056W 1 39259 41901 W 2011-02-03 2004-01-20|1996-07-31|2011-02-03 +S000121254 ARS ARS105 ARSI-42 chromosome 1 1 41992 42151 2014-11-18 2014-11-18|2007-03-07 Autonomously Replicating Sequence +S000000051 ORF Verified YAL055W PEX22 ubiquitin-protein transferase activating protein PEX22|YAF5 chromosome 1 1 42177 42719 W 2011-02-03 1996-07-31 Putative peroxisomal membrane protein; required for import of peroxisomal proteins; functionally complements a Pichia pastoris pex22 mutation +S000033812 CDS YAL055W 1 42177 42719 W 2011-02-03 1996-07-31 +S000000050 ORF Verified YAL054C ACS1 acetate--CoA ligase 1|FUN44 chromosome 1 L000000024 1 45022 42881 C -63.11 2011-02-03 1996-07-31 Acetyl-coA synthetase isoform; along with Acs2p, acetyl-coA synthetase isoform is the nuclear source of acetyl-coA for histone acetylation; expressed during growth on nonfermentable carbon sources and under aerobic conditions +S000033073 CDS YAL054C 1 45022 42881 C 2011-02-03 1996-07-31 +S000000049 ORF Verified YAL053W FLC2 flavin adenine dinucleotide transporter FLC2|HUF2 chromosome 1 1 45899 48250 W 2011-02-03 1996-07-31|2011-02-03 Putative calcium channel involved in calcium release under hypotonic stress; required for uptake of FAD into endoplasmic reticulum; involved in cell wall maintenance; FLC2 has a paralog, YOR365C, that arose from the whole genome duplication +S000033037 CDS YAL053W 1 45899 48250 W 2011-02-03 1996-07-31|2011-02-03 +S000000048 ORF Verified YAL051W OAF1 oleate-activated transcription factor OAF1|YAF1 chromosome 1 L000004197 1 48564 51707 W 2011-02-03 2004-07-20|1996-07-31|2011-02-03 Oleate-activated transcription factor; subunit of a heterodimeric complex with Pip2p, which binds to oleate-response elements (ORE) in the promoter of genes involved in beta-oxidation of fatty acids, peroxisome organization and biogenesis, activating transcription in the presence of oleate; regulates chromatin silencing at telomeres; involved in diauxic shift; OAF1 has a paralog, PIP2, that arose from the whole genome duplication +S000032862 CDS YAL051W 1 48564 51707 W 2011-02-03 2004-07-20|1996-07-31|2011-02-03 +S000000047 ORF Verified YAL049C AIM2 protein AIM2 chromosome 1 1 52595 51855 C 2011-02-03 1996-07-31 Cytoplasmic protein involved in mitochondrial function or organization; null mutant displays reduced frequency of mitochondrial genome loss; potential Hsp82p interactor +S000031896 CDS YAL049C 1 52595 51855 C 2011-02-03 1996-07-31 +S000028733 ORF Dubious YAL047W-A chromosome 1 1 54584 54913 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF GEM1/YAL048C +S000033377 CDS YAL047W-A 1 54584 54913 W 2011-02-03 2003-07-29 +S000000046 ORF Verified YAL048C GEM1 ERMES complex Ca(2+)-binding regulatory GTPase GEM1|GON1 chromosome 1 1 54789 52801 C 2011-02-03 1996-07-31 Outer mitochondrial membrane GTPase, subunit of the ERMES complex; potential regulatory subunit of the ERMES complex that links the ER to mitochondria and may promote inter-organellar calcium and phospholipid exchange as well as coordinating mitochondrial DNA replication and growth; cells lacking Gem1p contain collapsed, globular, or grape-like mitochondria; ortholog of metazoan Miro GTPases +S000030895 CDS YAL048C 1 54789 52801 C 2011-02-03 1996-07-31 +S000000045 ORF Verified YAL047C SPC72 gamma-tubulin complex subunit SPC72|LDB4 chromosome 1 L000003455 1 56857 54989 C 2011-02-03 1996-07-31|2011-02-03 Gamma-tubulin small complex (gamma-TuSC) receptor; recruits the gamma-TuSC complex to the cytoplasmic side of the SPB, connecting nuclear microtubules to the SPB; involved in astral microtubule formation, stabilization, and with Stu2p, anchoring astral MTs at the cytoplasmic face of the SPB, and regulating plus-end MT dynamics; regulated by Cdc5 kinase +S000030803 CDS YAL047C 1 56857 54989 C 2011-02-03 1996-07-31|2011-02-03 +S000000044 ORF Verified YAL046C BOL3 AIM1 chromosome 1 1 57385 57029 C 2011-02-03 1996-07-31 Protein involved in Fe-S cluster transfer to mitochondrial clients; protects [4Fe-4S] clusters from damage due to oxidative stress by acting along with Nfu1p at a late step in the transfer of [4Fe-4S] clusters from the ISA complex to mitochondrial client proteins like lipoate synthase and succinate dehydrogenase; sequence similarity to human BOLA family member, BOLA3, mutations of which are associated with Multiple Mitochondria Dysfunctions Syndrome (MMDS2) +S000030666 CDS YAL046C 1 57385 57029 C 2011-02-03 1996-07-31 +S000007586 ORF Verified YAL044W-A BOL1 chromosome 1 1 57518 57850 W 2011-02-03 2001-01-30 Mitochondrial matrix protein involved in Fe-S cluster biogenesis; facilitates [4Fe-2S] cluster inception into mitochondrial proteins such as lipoate synthase and succinate dehydrogenase; interacts and may function with Grx5p at an early step in Fe-S cluster biosynthesis; forms dimeric complexes with Grx5p and Nfu1p that alter the stability of shared Fe/S clusters; sequence similarity to human BOLA family member, BOLA1 and S. pombe uvi31, a putative DNA repair protein +S000037097 CDS YAL044W-A 1 57518 57850 W 2011-02-03 2001-01-30 +S000000043 ORF Dubious YAL045C chromosome 1 1 57796 57488 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps YAL044W-A +S000030576 CDS YAL045C 1 57796 57488 C 2011-02-03 1996-07-31 +S000000042 ORF Verified YAL044C GCV3 glycine decarboxylase subunit H chromosome 1 L000003501 1 58462 57950 C 2011-02-03 2003-09-22|1996-07-31|2008-03-05 H subunit of the mitochondrial glycine decarboxylase complex; glycine decarboxylase is required for the catabolism of glycine to 5,10-methylene-THF; also required for all protein lipoylation; expression is regulated by levels of 5,10-methylene-THF +S000037751 CDS YAL044C 1 58462 57950 C 2011-02-03 2003-09-22|1996-07-31|2008-03-05 +S000000041 ORF Verified YAL043C PTA1 RNA-processing protein PTA1|FUN39 chromosome 1 L000001522 1 61052 58695 C 2011-02-03 1996-07-31 Subunit of holo-CPF; holo-CPF is a multiprotein complex and functional homolog of mammalian CPSF, required for the cleavage and polyadenylation of mRNA and snoRNA 3' ends; involved in pre-tRNA processing; binds to the phosphorylated CTD of RNAPII +S000037691 CDS YAL043C 1 61052 58695 C 2011-02-03 1996-07-31 +S000000040 ORF Verified YAL042W ERV46 FUN9 chromosome 1 L000000633 1 61316 62563 W 2011-02-03 1996-07-31 Protein localized to COPII-coated vesicles; forms a complex with Erv41p; involved in the membrane fusion stage of transport +S000037669 CDS YAL042W 1 61316 62563 W 2011-02-03 1996-07-31 +S000002138 ORF Dubious YAL042C-A YAL043C-A chromosome 1 1 61608 61231 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF ERV46/YAL042W; YAL042C-A is a non-essential gene +S000030422 CDS YAL042C-A 1 61608 61231 C 2011-02-03 1996-07-31 +S000000039 ORF Verified YAL041W CDC24 Rho family guanine nucleotide exchange factor CDC24|CLS4 chromosome 1 L000000262 1 62840 65404 W -56 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Cdc42p; required for polarity establishment and maintenance, and mutants have morphological defects in bud formation and shmooing; relocalizes from nucleus to cytoplasm upon DNA replication stress; thermosensitivity of the cdc24-4 mutant in the presence of sorbitol is functionally complemented by human CDC42 +S000037599 CDS YAL041W 1 62840 65404 W 2011-02-03 1996-07-31 +S000000038 ORF Verified YAL040C CLN3 cyclin CLN3|WHI1|FUN10|DAF1 chromosome 1 L000000359 1 67520 65778 C -56 2011-02-03 1996-07-31 G1 cyclin involved in cell cycle progression; activates Cdc28p kinase to promote G1 to S phase transition; plays a role in regulating transcription of other G1 cyclins, CLN1 and CLN2; regulated by phosphorylation and proteolysis; acetyl-CoA induces CLN3 transcription in response to nutrient repletion to promote cell-cycle entry; cell cycle arrest phenotype of the cln1 cln2 cln3 triple null mutant is complemented by any of human cyclins CCNA2, CCNB1, CCNC, CCND1, or CCNE1 +S000036825 CDS YAL040C 1 67520 65778 C 2011-02-03 1996-07-31 +S000000037 ORF Verified YAL039C CYC3 holocytochrome c synthase CYC3|CCHL chromosome 1 L000000450 1 69525 68716 C -47 2011-02-03 1996-07-31 Cytochrome c heme lyase (holocytochrome c synthase); attaches heme to apo-cytochrome c (Cyc1p or Cyc7p) in mitochondrial intermembrane space; human homolog HCCS implicated in microphthalmia with linear skin defects (MLS), and can complement yeast null mutant +S000035956 CDS YAL039C 1 69525 68716 C 2011-02-03 1996-07-31 +S000118318 ARS ARS106 ARSI-70 chromosome 1 1 70300 70469 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178035 ARS_consensus_sequence ARS106 1 70434 70418 C 2014-11-18 2014-11-18 +S000000036 ORF Verified YAL038W CDC19 pyruvate kinase CDC19|PYK1 chromosome 1 L000000258 1 71786 73288 W -45 2011-02-03 1996-07-31 Pyruvate kinase; functions as a homotetramer in glycolysis to convert phosphoenolpyruvate to pyruvate, the input for aerobic (TCA cycle) or anaerobic (glucose fermentation) respiration; regulated via allosteric activation by fructose bisphosphate; CDC19 has a paralog, PYK2, that arose from the whole genome duplication +S000035915 CDS YAL038W 1 71786 73288 W 2011-02-03 1996-07-31 +S000028592 ORF Dubious YAL037C-B chromosome 1 1 73300 72326 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031366 CDS YAL037C-B 1 73300 72326 C 2011-02-03 2003-07-29 +S000028732 ORF Uncharacterized YAL037C-A chromosome 1 1 73518 73426 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000033376 CDS YAL037C-A 1 73518 73426 C 2011-02-03 2003-07-29 +S000000035 ORF Uncharacterized YAL037W chromosome 1 1 74020 74823 W 2011-02-03 1996-07-31 Putative protein of unknown function; YAL037W has a paralog, YOR342C, that arose from the whole genome duplication +S000035798 CDS YAL037W 1 74020 74823 W 2011-02-03 1996-07-31 +S000000034 ORF Verified YAL036C RBG1 GTP-binding protein RBG1|FUN11 chromosome 1 L000000634 1 76152 75043 C 2011-02-03 1996-07-31 Member of the DRG family of GTP-binding proteins; associates with translating ribosomes; interacts with Tma46p, Ygr250cp, Gir2p and Yap1p via two-hybrid +S000034719 CDS YAL036C 1 76152 75043 C 2011-02-03 1996-07-31 +S000000033 ORF Verified YAL035W FUN12 translation initiation factor eIF5B|eIF5B|yIF2 chromosome 1 L000000635 1 76427 79435 W 2011-02-03 1996-07-31 Translation initiation factor eIF5B; GTPase that promotes Met-tRNAiMet binding to ribosomes and ribosomal subunit joining; promotes GTP-dependent maturation of 18S rRNA by Nob1p; protein abundance increases in response to DNA replication stress; homolog of bacterial IF2 +S000034678 CDS YAL035W 1 76427 79435 W 2011-02-03 1996-07-31 +S000000032 ORF Verified YAL034W-A MTW1 MIND complex subunit MTW1|NSL2|DSN3 chromosome 1 S000007418 1 79718 80587 W 2011-02-03 1996-07-31 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; critical to kinetochore assembly; complex consists of Mtw1p Including Nnf1p-Nsl1p-Dsn1p (MIND) +S000031836 CDS YAL034W-A 1 79718 80587 W 2011-02-03 1996-07-31 +S000002137 ORF Dubious YAL034C-B YAL035C-A chromosome 1 1 79842 79489 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031374 CDS YAL034C-B 1 79842 79489 C 2011-02-03 1996-07-31 +S000002134 ORF Verified YAL034C FUN19 chromosome 1 L000000637 1 81951 80710 C 2011-02-03 2003-09-22|1996-07-31 Non-essential protein of unknown function; expression induced in response to heat stress; FUN19 has a paralog, YOR338W, that arose from the whole genome duplication +S000034508 CDS YAL034C 1 81951 80710 C 2011-02-03 2003-09-22|1996-07-31 +S000000031 ORF Verified YAL033W POP5 RNA-binding protein POP5|FUN53 chromosome 1 L000004301|L000000649 1 82706 83227 W 2011-02-03 1996-07-31 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs +S000034465 CDS YAL033W 1 82706 83227 W 2011-02-03 1996-07-31 +S000000030 ORF Verified YAL032C PRP45 mRNA splicing protein PRP45|FUN20 chromosome 1 L000000638 1 84474 83335 C 2011-02-03 1996-07-31 Protein required for pre-mRNA splicing; associates with the spliceosome and interacts with splicing factors Prp22p and Prp46p; orthologous to human transcriptional coactivator SKIP and can activate transcription of a reporter gene +S000033541 CDS YAL032C 1 84474 83335 C 2011-02-03 1996-07-31 +S000028731 ORF Dubious YAL031W-A chromosome 1 1 84669 84977 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF GIP4/YAL031C +S000033375 CDS YAL031W-A 1 84669 84977 W 2011-02-03 2003-07-29 +S000000029 ORF Verified YAL031C GIP4 protein phosphatase regulator GIP4|FUN21 chromosome 1 L000000639 1 87031 84749 C 2011-02-03 1996-07-31 Cytoplasmic protein that regulates protein phosphatase 1 Glc7p; protein overexpression relocalizes Glc7p from the nucleus and prevents chromosome segregation; potential Cdc28p substrate +S000033476 CDS YAL031C 1 87031 84749 C 2011-02-03 1996-07-31 +S000000028 ORF Verified YAL030W SNC1 SNAP receptor SNC1 chromosome 1 L000001942 1 87286 87752 W 2011-02-03 1996-07-31 Vesicle membrane receptor protein (v-SNARE); involved in the fusion between Golgi-derived secretory vesicles with the plasma membrane; proposed to be involved in endocytosis; member of the synaptobrevin/VAMP family of R-type v-SNARE proteins; SNC1 has a paralog, SNC2, that arose from the whole genome duplication +S000033437 CDS YAL030W 1 87286 87387 W 2011-02-03 1996-07-31 +S000033438 CDS YAL030W 1 87501 87752 W 2011-02-03 1996-07-31 +S000033439 intron YAL030W 1 87388 87500 W 2011-02-03 1996-07-31 +S000000027 ORF Verified YAL029C MYO4 myosin 4|SHE1|FUN22 chromosome 1 L000000640|L000001224 1 92270 87855 C 2011-02-03 1996-07-31 Type V myosin motor involved in actin-based transport of cargos; required for mRNA transport, including ASH1 mRNA, and facilitating the growth and movement of ER tubules into the growing bud along with She3p; MYO4 has a paralog, MYO2, that arose from the whole genome duplication +S000033821 CDS YAL029C 1 92270 87855 C 2011-02-03 1996-07-31 +S000000026 ORF Verified YAL028W FRT2 HPH2 chromosome 1 1 92900 94486 W 2011-02-03 1996-07-31 Tail-anchored ER membrane protein of unknown function; interacts with homolog Frt1p; promotes growth in conditions of high Na+, alkaline pH, or cell wall stress, possibly via a role in posttranslational translocation; potential Cdc28p substrate; FRT2 has a paralog, FRT1, that arose from the whole genome duplication +S000033747 CDS YAL028W 1 92900 94486 W 2011-02-03 1996-07-31 +S000000025 ORF Verified YAL027W SAW1 DNA-binding protein SAW1 chromosome 1 1 94687 95472 W 2011-02-03 1996-07-31 5'- and 3'-flap DNA binding protein; recruits Rad1p-Rad10p to single-strand annealing intermediates with 3' non-homologous tails for removal during double-strand break repair; complexes with Rad1p-Rad10p and stimulates its endonuclease activity; green fluorescent protein (GFP)-fusion protein localizes to the nucleus +S000033629 CDS YAL027W 1 94687 95472 W 2011-02-03 1996-07-31 +S000028730 ORF Dubious YAL026C-A chromosome 1 1 95823 95386 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YAL027W and the verified gene DRS2 +S000033374 CDS YAL026C-A 1 95823 95386 C 2011-02-03 2003-07-29 +S000119380 ncRNA_gene HRA1 HRA1 chromosome 1 1 99305 99868 W 2011-02-03 2007-02-06|2007-05-08|2011-02-03 Non-protein-coding RNA; substrate of RNase P, possibly involved in rRNA processing, specifically maturation of 20S precursor into the mature 18S rRNA +S000120654 noncoding_exon HRA1 1 99305 99868 W 2011-02-03 2007-02-06|2007-05-08|2011-02-03 +S000000024 ORF Verified YAL026C DRS2 aminophospholipid-translocating P4-type ATPase DRS2|SWA3|FUN38 chromosome 1 L000000526 1 99697 95630 C 2011-02-03 1996-07-31|2011-02-03 Trans-golgi network aminophospholipid translocase (flippase); maintains membrane lipid asymmetry in post-Golgi secretory vesicles; contributes to clathrin-coated vesicle formation, endocytosis, protein trafficking between the Golgi and endosomal system and the cellular response to mating pheromone; autoinhibited by its C-terminal tail; localizes to the trans-Golgi network; mutations in human homolog ATP8B1 result in liver disease +S000030197 CDS YAL026C 1 99697 95630 C 2011-02-03 1996-07-31|2011-02-03 +S000000023 ORF Verified YAL025C MAK16 ribosome biosynthesis protein MAK16 chromosome 1 L000000989 1 101145 100225 C -31 2011-02-03 1996-07-31|2011-02-03 Essential nuclear protein; constituent of 66S pre-ribosomal particles; required for maturation of 25S and 5.8S rRNAs; required for maintenance of M1 satellite double-stranded RNA of the L-A virus +S000030064 CDS YAL025C 1 101145 100225 C 2011-02-03 1996-07-31|2011-02-03 +S000000022 ORF Verified YAL024C LTE1 mitotic regulator LTE1|MSI2 chromosome 1 L000000955 1 105872 101565 C -31 2011-02-03 1996-07-31 Protein similar to GDP/GTP exchange factors; without detectable GEF activity; required for asymmetric localization of Bfa1p at daughter-directed spindle pole bodies and for mitotic exit at low temperatures +S000029981 CDS YAL024C 1 105872 101565 C 2011-02-03 1996-07-31 +S000000021 ORF Verified YAL023C PMT2 dolichyl-phosphate-mannose-protein mannosyltransferase PMT2|FUN25 chromosome 1 L000000642|L000001459 1 108551 106272 C 2011-02-03 2002-12-17|1996-07-31 Protein O-mannosyltransferase of the ER membrane; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; involved in ER quality control; acts in a complex with Pmt1p, can instead interact with Pmt5p; antifungal drug target; PMT2 has a paralog, PMT3, that arose from the whole genome duplication +S000037355 CDS YAL023C 1 108551 106272 C 2011-02-03 2002-12-17|1996-07-31 +S000000020 ORF Verified YAL022C FUN26 nucleoside transmembrane transporter FUN26 chromosome 1 L000000643 1 110430 108877 C 2011-02-03 1996-07-31 High affinity, broad selectivity, nucleoside/nucleobase transporter; vacuolar membrane localized transporter which may regulate the balance of nicotinamide riboside (NmR) levels between the cytosol and vacuole, contributing to salvage of NmR for use in cytosolic NAD+ synthesis; equilibrative nucleoside transporter (ENT) family member +S000037286 CDS YAL022C 1 110430 108877 C 2011-02-03 1996-07-31 +S000000019 ORF Verified YAL021C CCR4 CCR4-NOT core exoribonuclease subunit CCR4|NUT21|FUN27 chromosome 1 L000000239 1 113359 110846 C -25 2011-02-03 1996-07-31 Component of the CCR4-NOT transcriptional complex; CCR4-NOT is involved in regulation of gene expression; component of the major cytoplasmic deadenylase, which is involved in mRNA poly(A) tail shortening +S000037200 CDS YAL021C 1 113359 110846 C 2011-02-03 1996-07-31 +S000028729 ORF Dubious YAL019W-A chromosome 1 1 114250 114819 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF ATS1/YAL020C +S000032720 CDS YAL019W-A 1 114250 114819 W 2011-02-03 2003-07-29 +S000000018 ORF Verified YAL020C ATS1 KTI13|FUN28 chromosome 1 L000000644|L000000154 1 114615 113614 C 2011-02-03 1996-07-31|2011-02-03 Protein required for modification of wobble nucleosides in tRNA; acts with Elongator complex, Kti11p, and Kti12p; has a potential role in regulatory interactions between microtubules and the cell cycle; forms a stable heterodimer with Kti11p +S000037124 CDS YAL020C 1 114615 113614 C 2011-02-03 1996-07-31|2011-02-03 +S000000017 ORF Verified YAL019W FUN30 DNA-dependent ATPase FUN30 chromosome 1 L000000645 1 114919 118314 W 2011-02-03 1996-07-31 Snf2p family member with ATP-dependent chromatin remodeling activity; has a role in silencing at the mating type locus, telomeres and centromeres; enriched at centromeres and is required for correct chromatin structure around centromeres, as well as at the boundary element of the silent HMR; recruited to DNA double-strand breaks (DSBs) where it promotes 5' strand resection of DSBs; potential Cdc28p substrate +S000037555 CDS YAL019W 1 114919 118314 W 2011-02-03 1996-07-31 +S000000016 ORF Verified YAL018C LDS1 chromosome 1 1 119541 118564 C 2011-02-03 1996-07-31 Protein Involved in spore wall assembly; localizes to lipid droplets found on or outside of the prospore membrane; shares similarity with Lds2p and Rrt8p, and a strain mutant for all 3 genes exhibits reduced dityrosine fluorescence relative to the single mutants +S000032033 CDS YAL018C 1 119541 118564 C 2011-02-03 1996-07-31 +S000000015 ORF Verified YAL017W PSK1 serine/threonine protein kinase PSK1|FUN31 chromosome 1 L000000646 1 120225 124295 W 2011-02-03 1996-07-31|2011-02-03 PAS domain-containing serine/threonine protein kinase; coordinately regulates protein synthesis and carbohydrate metabolism and storage in response to a unknown metabolite that reflects nutritional status; PSK1 has a paralog, PSK2, that arose from the whole genome duplication +S000031992 CDS YAL017W 1 120225 124295 W 2011-02-03 1996-07-31|2011-02-03 +S000118319 ARS ARS107 ARSI-125 chromosome 1 1 124349 124597 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178036 ARS_consensus_sequence ARS107 1 124479 124463 C 2014-11-18 2014-11-18 +S000028528 ORF Dubious YAL016C-B chromosome 1 1 124492 124307 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030333 CDS YAL016C-B 1 124492 124307 C 2011-02-03 2003-07-29 +S000000014 ORF Verified YAL016W TPD3 protein phosphatase 2A structural subunit TPD3|FUN32 chromosome 1 L000002325 1 124879 126786 W .5 2011-02-03 1996-07-31 Regulatory subunit A of the heterotrimeric PP2A complex; the heterotrimeric protein phosphatase 2A (PP2A) complex also contains regulatory subunit Cdc55p and either catalytic subunit Pph21p or Pph22p; required for cell morphogenesis and transcription by RNA polymerase III +S000031874 CDS YAL016W 1 124879 126786 W 2011-02-03 1996-07-31 +S000028728 ORF Dubious YAL016C-A chromosome 1 1 125069 124755 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF TPD3/YAL016W +S000032719 CDS YAL016C-A 1 125069 124755 C 2011-02-03 2003-07-29 +S000000013 ORF Verified YAL015C NTG1 bifunctional N-glycosylase/AP lyase NTG1|ogg2|SCR1|FUN33 chromosome 1 L000004114 1 128102 126903 C 2011-02-03 1996-07-31 DNA N-glycosylase and apurinic/apyrimidinic (AP) lyase; involved in base excision repair; acts in both nucleus and mitochondrion; creates a double-strand break at mtDNA origins that stimulates replication in response to oxidative stress; required for maintaining mitochondrial genome integrity; NTG1 has a paralog, NTG2, that arose from the whole genome duplication +S000036247 CDS YAL015C 1 128102 126903 C 2011-02-03 1996-07-31 +S000000012 ORF Verified YAL014C SYN8 syntaxin|SLT2|UIP2 chromosome 1 1 129019 128252 C 2011-02-03 2002-12-17|1996-07-31 Endosomal SNARE related to mammalian syntaxin 8 +S000036146 CDS YAL014C 1 129019 128252 C 2011-02-03 2002-12-17|1996-07-31 +S000000011 ORF Verified YAL013W DEP1 Rpd3L histone deacetylase complex subunit DEP1|FUN54 chromosome 1 L000000502 1 129270 130487 W 12 2011-02-03 2003-12-15|1996-07-31|2011-02-03 Component of the Rpd3L histone deacetylase complex; required for diauxic shift-induced histone H2B deposition onto rDNA genes; transcriptional modulator involved in regulation of structural phospholipid biosynthesis genes and metabolically unrelated genes, as well as maintenance of telomeres, mating efficiency, and sporulation +S000036100 CDS YAL013W 1 129270 130487 W 2011-02-03 2003-12-15|1996-07-31|2011-02-03 +S000000010 ORF Verified YAL012W CYS3 cystathionine gamma-lyase CYS3|STR1|FUN35|CYI1 chromosome 1 L000000470 1 130799 131983 W -16 2011-02-03 1996-07-31 Cystathionine gamma-lyase; catalyzes one of the two reactions involved in the transsulfuration pathway that yields cysteine from homocysteine with the intermediary formation of cystathionine; protein abundance increases in response to DNA replication stress +S000035250 CDS YAL012W 1 130799 131983 W 2011-02-03 1996-07-31 +S000000009 ORF Verified YAL011W SWC3 SWC1 chromosome 1 1 132199 134076 W 2011-02-03 2003-09-22|1996-07-31 Protein of unknown function; component of the SWR1 complex, which exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; required for formation of nuclear-associated array of smooth endoplasmic reticulum known as karmellae +S000035116 CDS YAL011W 1 132199 134076 W 2011-02-03 2003-09-22|1996-07-31 +S000000008 ORF Verified YAL010C MDM10 FUN37 chromosome 1 L000000648|L000001053 1 135665 134184 C 2011-02-03 1996-07-31|2011-02-03 Subunit of both the ERMES and the SAM complex; component of ERMES complex which acts as a molecular tether between the mitochondria and the ER, necessary for efficient phospholipid exchange between organelles and for mitophagy; SAM/TOB complex component that functions in the assembly of outer membrane beta-barrel proteins; involved in mitochondrial inheritance and morphology; ERMES complex is often co-localized with peroxisomes and concentrated areas of pyruvate dehydrogenase +S000034958 CDS YAL010C 1 135665 134184 C 2011-02-03 1996-07-31|2011-02-03 +S000000007 ORF Verified YAL009W SPO7 Nem1-Spo7 phosphatase regulatory subunit SPO7 chromosome 1 L000002000 1 135854 136633 W -4 2011-02-03 1996-07-31 Putative regulatory subunit of Nem1p-Spo7p phosphatase holoenzyme; regulates nuclear growth by controlling phospholipid biosynthesis, required for normal nuclear envelope morphology, premeiotic replication, and sporulation +S000034070 CDS YAL009W 1 135854 136633 W 2011-02-03 1996-07-31 +S000000006 ORF Verified YAL008W FUN14 MCP3 chromosome 1 L000000636 1 136914 137510 W 2011-02-03 1996-07-31 Integral mitochondrial outer membrane (MOM) protein; dosage suppressor of an MDM10 null that reduces ERMES-related phenotypes, such as alterations in mitochondrial morphology, protein complex assembly, and lipid profile; dosage suppressor of MDM12, MDM34, and MMM1 null mutant growth defects; novel mechanism of MOM import involving Tom70p, the TOM complex, and the TIM23 complex, requiring mitochondrial membrane potential and processing by the IMP complex for correct biogenesis +S000033957 CDS YAL008W 1 136914 137510 W 2011-02-03 1996-07-31 +S000000005 ORF Verified YAL007C ERP2 chromosome 1 L000004679 1 138345 137698 C 2011-02-03 1996-07-31 Member of the p24 family involved in ER to Golgi transport; similar to Emp24p and Erv25p; role in misfolded protein quality control; forms a heterotrimeric complex with Erp1p, Emp24p, and Erv25p; localized to COPII-coated vesicles; ERP2 has a paralog, ERP4, that arose from the whole genome duplication +S000033112 CDS YAL007C 1 138345 137698 C 2011-02-03 1996-07-31 +S000006786 long_terminal_repeat YALCdelta2 chromosome 1 1 138992 138831 C 2011-02-03 2000-05-19 Ty1 LTR +S000006680 tRNA_gene tP(UGG)A TRN1 chromosome 1 L000003601 1 139152 139254 W -2 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons +S000035969 intron tP(UGG)A 1 139188 139218 W 2011-02-03 2000-05-19 +S000035967 noncoding_exon tP(UGG)A 1 139152 139187 W 2011-02-03 2000-05-19 +S000035968 noncoding_exon tP(UGG)A 1 139219 139254 W 2011-02-03 2000-05-19 +S000002136 ORF Dubious YAL004W chromosome 1 1 140760 141407 W 2011-02-03 1996-07-31|2007-04-05 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene SSA1/YAL005C +S000032057 CDS YAL004W 1 140760 141407 W 2011-02-03 1996-07-31|2007-04-05 +S000000004 ORF Verified YAL005C SSA1 Hsp70 family ATPase SSA1|YG100 chromosome 1 L000002069 1 141431 139503 C -1 2011-02-03 1996-07-31|2007-04-05 ATPase involved in protein folding and NLS-directed nuclear transport; member of HSP70 family; required for ubiquitin-dependent degradation of short-lived proteins; forms chaperone complex with Ydj1p; localized to nucleus, cytoplasm, cell wall; 98% identical to paralog Ssa2p with different functional specificity in propagation of yeast [URE3] prions, vacuolar-mediated degradations of gluconeogenesis enzymes; general targeting factor of Hsp104p to prion fibrils +S000032096 CDS YAL005C 1 141431 139503 C 2011-02-03 1996-07-31|2007-04-05 +S000000003 ORF Verified YAL003W EFB1 translation elongation factor 1 subunit beta|EF-1beta|eEF1Balpha|TEF5 chromosome 1 L000000542 1 142174 143160 W 2011-02-03 1996-07-31|1999-07-17 Translation elongation factor 1 beta; stimulates nucleotide exchange to regenerate EF-1 alpha-GTP for the next elongation cycle; part of the EF-1 complex, which facilitates binding of aminoacyl-tRNA to the ribosomal A site; human homolog EEF1B2 can complement yeast efb1 mutants +S000031941 CDS YAL003W 1 142174 142253 W 2011-02-03 1999-07-17|1996-07-31 +S000031942 CDS YAL003W 1 142620 143160 W 2011-02-03 1999-07-17|1996-07-31 +S000031943 intron YAL003W 1 142254 142619 W 2011-02-03 1999-07-17|1996-07-31 +S000007500 snoRNA_gene snR18 SNR18 chromosome 1 1 142367 142468 W 2011-02-03 2000-05-19|2007-05-08 C/D box small nucleolar RNA (snoRNA); commonly referred to as U18; guides 2'-O-methylation of large subunit (LSU) rRNA at positions A649 and C650 +S000036595 noncoding_exon snR18 1 142367 142468 W 2011-02-03 2000-05-19|2007-05-08 +S000000002 ORF Verified YAL002W VPS8 CORVET complex membrane-binding subunit VPS8|VPL8|VPT8|FUN15 chromosome 1 L000003013 1 143707 147531 W 2011-02-03 2004-01-14|1996-07-31 Membrane-binding component of the CORVET complex; involved in endosomal vesicle tethering and fusion in the endosome to vacuole protein targeting pathway; interacts with Vps21p; contains RING finger motif +S000031737 CDS YAL002W 1 143707 147531 W 2011-02-03 2004-01-14|1996-07-31 +S000121255 ARS ARS108 ARSI-147 chromosome 1 1 147398 147717 2014-11-18 2014-11-18|2007-03-07 Autonomously Replicating Sequence +S000000001 ORF Verified YAL001C TFC3 transcription factor TFIIIC subunit TFC3|tau 138|TSV115|FUN24 chromosome 1 L000000641|L000002287 1 151166 147594 C -1 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; part of the TauB domain of TFIIIC that binds DNA at the BoxB promoter sites of tRNA and similar genes; cooperates with Tfc6p in DNA binding; largest of six subunits of the RNA polymerase III transcription initiation factor complex (TFIIIC) +S000030735 CDS YAL001C 1 151006 147594 C 2011-02-03 1996-07-31 +S000030734 CDS YAL001C 1 151166 151097 C 2011-02-03 1996-07-31 +S000030736 intron YAL001C 1 151096 151007 C 2011-02-03 1996-07-31 +S000006463 centromere CEN1 CEN1 chromosome 1 L000000294 1 151465 151582 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome I centromere +S000077257 centromere_DNA_Element_I CEN1 1 151465 151474 W 2011-02-03 2004-10-04 +S000077258 centromere_DNA_Element_II CEN1 1 151475 151557 W 2011-02-03 2004-10-04 +S000077259 centromere_DNA_Element_III CEN1 1 151558 151582 W 2011-02-03 2004-10-04 +S000000063 ORF Verified YAR002W NUP60 FG-nucleoporin NUP60 chromosome 1 1 152257 153876 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier and is involved in gene tethering at the nuclear periphery; relocalizes to the cytosol in response to hypoxia; both NUP1 and NUP60 are homologous to human NUP153 +S000035473 CDS YAR002W 1 152257 153876 W 2011-02-03 1996-07-31 +S000002129 ORF Verified YAR002C-A ERP1 chromosome 1 L000004678 1 154724 154065 C 2011-02-03 1999-07-17 Member of the p24 family involved in ER to Golgi transport; role in misfolded protein quality control; forms heterotrimeric complex with Erp2p, Emp24p, and Erv25p; localized to COPII-coated vesicles; ERP1 has a paralog, ERP6, that arose from the whole genome duplication +S000032940 CDS YAR002C-A 1 154724 154065 C 2011-02-03 1999-07-17 +S000000064 ORF Verified YAR003W SWD1 COMPASS subunit protein SWD1|SAF49|CPS50|FUN16 chromosome 1 1 155005 156285 W 2011-02-03 1996-07-31 Subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3 on lysine 4 and is required in transcriptional silencing near telomeres; WD40 beta propeller superfamily member with similarity to mammalian Rbbp7 +S000035547 CDS YAR003W 1 155005 156285 W 2011-02-03 1996-07-31 +S000000065 ORF Verified YAR007C RFA1 replication factor A subunit protein RFA1|RPA70|RPA1|FUN3|BUF2 chromosome 1 L000000204|L000001620 1 158619 156754 C -3 2011-02-03 1996-07-31 Subunit of heterotrimeric Replication Protein A (RPA); RPA is a highly conserved single-stranded DNA binding protein involved in DNA replication, repair, and recombination; RPA protects against inappropriate telomere recombination, and upon telomere uncapping, prevents cell proliferation by a checkpoint-independent pathway; role in DNA catenation/decatenation pathway of chromosome disentangling; relocalizes to the cytosol in response to hypoxia +S000036676 CDS YAR007C 1 158619 156754 C 2011-02-03 1996-07-31 +S000000066 ORF Verified YAR008W SEN34 tRNA splicing endonuclease subunit SEN34|FUN4 chromosome 1 L000003973 1 158966 159793 W 2011-02-03 1996-07-31 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface; Sen34p contains the active site for tRNA 3' splice site cleavage and has similarity to Sen2p and to Archaeal tRNA splicing endonuclease +S000037450 CDS YAR008W 1 158966 159793 W 2011-02-03 1996-07-31 +S000077372 ARS ARS109 ARS101 ARSI-160 chromosome 1 1 159907 160127 2011-02-03 2004-10-18|2006-09-06 ARS containing multiple redundant ORC binding sites; ORC is the acronym for origin recognition complex +S000121251 ARS_consensus_sequence ARS109 1 159945 159935 C 2011-02-03 2007-03-07 +S000118986 ARS_consensus_sequence ARS109 1 159952 159966 W 2011-02-03 2006-10-02 +S000006788 long_terminal_repeat YARCdelta3 chromosome 1 1 160237 160105 C 2011-02-03 2000-05-19 Ty1 LTR +S000006789 long_terminal_repeat YARCdelta4 chromosome 1 1 160574 160238 C 2011-02-03 2000-05-19 Ty1 LTR +S000000067 transposable_element_gene YAR009C truncated gag-pol fusion protein|YARCTyB1-1 chromosome 1 1 164187 160597 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; Gag processing produces capsid proteins, Pol is cleaved to produce protease, reverse transcriptase and integrase activities; in YARCTy1-1 TYB is mutant and probably non-functional; protein product forms cytoplasmic foci upon DNA replication stress +S000037508 CDS YAR009C 1 164187 160597 C 2011-02-03 1996-07-31 +S000000068 transposable_element_gene YAR010C gag protein|YARCTyA1-1 chromosome 1 1 165866 164544 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; Gag processing produces capsid proteins; in YARCTy1-1 TYB is mutant and probably non-functional +S000030210 CDS YAR010C 1 165866 164544 C 2011-02-03 1996-07-31 +S000006792 LTR_retrotransposon YARCTy1-1 Ty1 chromosome 1 1 166162 160238 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C +S000006790 long_terminal_repeat YARCdelta5 chromosome 1 1 166162 165826 C 2011-02-03 2000-05-19 Ty1 LTR +S000006521 tRNA_gene tA(UGC)A TGA1 chromosome 1 L000003602|S000029601|L000002292 1 166267 166339 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine +S000034842 noncoding_exon tA(UGC)A 1 166267 166339 W 2011-02-03 2000-05-19 +S000000069 ORF Verified YAR014C BUD14 protein phosphatase regulator BUD14 chromosome 1 1 168871 166742 C 2011-02-03 2004-01-27|1996-07-31|2011-02-03 Protein involved in bud-site selection; Bud14p-Glc7p complex is a cortical regulator of dynein; forms a complex with Kel1p and Kel2p that regulates Bnr1p (formin) to affect actin cable assembly, cytokinesis, and polarized growth; diploid mutants display a random budding pattern instead of the wild-type bipolar pattern; relative distribution to the nucleus increases upon DNA replication stress +S000031457 CDS YAR014C 1 168871 166742 C 2011-02-03 2004-01-27|1996-07-31|2011-02-03 +S000000070 ORF Verified YAR015W ADE1 phosphoribosylaminoimidazolesuccinocarboxamide synthase chromosome 1 L000000031 1 169375 170295 W 4 2011-02-03 1996-07-31 N-succinyl-5-aminoimidazole-4-carboxamide ribotide synthetase; required for 'de novo' purine nucleotide biosynthesis; red pigment accumulates in mutant cells deprived of adenine; protein abundance increases in response to DNA replication stress +S000031548 CDS YAR015W 1 169375 170295 W 2011-02-03 1996-07-31 +S000000071 ORF Verified YAR018C KIN3 serine/threonine protein kinase KIN3|NPK1|FUN52 chromosome 1 L000000903 1 171703 170396 C 2011-02-03 1996-07-31 Nonessential serine/threonine protein kinase; possible role in DNA damage response; influences tolerance to high levels of ethanol +S000032711 CDS YAR018C 1 171703 170396 C 2011-02-03 1996-07-31 +S000028735 ORF Dubious YAR019W-A chromosome 1 1 174998 175330 W 2011-02-03 2003-07-29|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF CDC15/YAR019C +S000033379 CDS YAR019W-A 1 174998 175330 W 2011-02-03 2003-07-29|2011-02-03 +S000000072 ORF Verified YAR019C CDC15 serine/threonine protein kinase CDC15|LYT1 chromosome 1 L000000255 1 175135 172211 C 6 2011-02-03 1996-07-31|2011-02-03 Protein kinase of the Mitotic Exit Network; localized to the spindle pole bodies at late anaphase; promotes mitotic exit by directly switching on the kinase activity of Dbf2p; required for spindle disassembly after meiosis II; relocalizes to the cytoplasm upon DNA replication stress +S000032794 CDS YAR019C 1 175135 172211 C 2011-02-03 1996-07-31|2011-02-03 +S000114488 ARS ARS110 ARS110 ARSI-176 chromosome 1 1 176157 176404 2011-02-03 2006-09-06|2006-02-28 Autonomously Replicating Sequence; originally referred to as ADE1 ARS +S000178037 ARS_consensus_sequence ARS110 1 176232 176248 W 2014-11-18 2014-11-18 +S000000073 ORF Verified YAR020C PAU7 seripauperin PAU7 chromosome 1 1 177023 176856 C 2011-02-03 1996-07-31 Member of the seripauperin multigene family; active during alcoholic fermentation, regulated by anaerobiosis, inhibited by oxygen, repressed by heme +S000034578 CDS YAR020C 1 177023 176856 C 2011-02-03 1996-07-31 +S000000074 ORF Uncharacterized YAR023C DUP240 family protein chromosome 1 1 179820 179281 C 2011-02-03 1996-07-31|2011-02-03 Putative integral membrane protein; member of DUP240 gene family +S000035643 CDS YAR023C 1 179820 179281 C 2011-02-03 1996-07-31|2011-02-03 +S000006636 tRNA_gene tL(CAA)A SUP56 chromosome 1 L000003603 1 181141 181254 W 10 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations +S000033745 intron tL(CAA)A 1 181179 181210 W 2011-02-03 2000-05-19 +S000033743 noncoding_exon tL(CAA)A 1 181141 181178 W 2011-02-03 2000-05-19 +S000033744 noncoding_exon tL(CAA)A 1 181211 181254 W 2011-02-03 2000-05-19 +S000006719 tRNA_gene tS(AGA)A chromosome 1 L000003604 1 182603 182522 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032337 noncoding_exon tS(AGA)A 1 182603 182522 C 2011-02-03 2000-05-19 +S000006795 long_terminal_repeat YARWsigma1 chromosome 1 1 182620 182959 W 2011-02-03 2000-05-19 Ty3 LTR +S000006793 long_terminal_repeat YARWdelta6 chromosome 1 1 183142 183474 W 2011-02-03 2000-05-19 Ty1 LTR +S000000075 ORF Verified YAR027W UIP3 DUP240 family protein UIP3 chromosome 1 1 183770 184477 W 2011-02-03 1996-07-31 Putative integral membrane protein of unknown function; interacts with Ulp1p at the nuclear periphery; member of DUP240 gene family +S000036855 CDS YAR027W 1 183770 184477 W 2011-02-03 1996-07-31 +S000000076 ORF Uncharacterized YAR028W DUP240 family protein chromosome 1 1 184892 185596 W 2011-02-03 1996-07-31 Putative integral membrane protein; member of DUP240 gene family; GFP-fusion protein is induced in response to the DNA-damaging agent MMS +S000036899 CDS YAR028W 1 184892 185596 W 2011-02-03 1996-07-31 +S000000077 ORF Uncharacterized YAR029W DUP240 family protein chromosome 1 1 186321 186545 W 2011-02-03 1996-07-31 Member of DUP240 gene family but contains no transmembrane domains; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000036967 CDS YAR029W 1 186321 186545 W 2011-02-03 1996-07-31 +S000000078 ORF Verified YAR031W PRM9 pheromone-regulated DUP240 family protein PRM9 chromosome 1 1 186836 187732 W 2011-02-03 1996-07-31 Pheromone-regulated protein; contains 3 predicted transmembrane segments and an FF sequence, a motif involved in COPII binding; member of DUP240 gene family; PRM9 has a paralog, PRM8, that arose from a segmental duplication +S000030609 CDS YAR031W 1 186836 187732 W 2011-02-03 1996-07-31 +S000001821 ORF Dubious YAR030C chromosome 1 1 186853 186512 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YAR029W and the verified gene PRM9 +S000036694 CDS YAR030C 1 186853 186512 C 2011-02-03 1996-07-31 +S000000079 ORF Verified YAR033W MST28 DUP240 family protein MST28 chromosome 1 1 188107 188811 W 2011-02-03 1996-07-31 Putative integral membrane protein, involved in vesicle formation; forms complex with Mst27p; member of DUP240 gene family; binds COPI and COPII vesicles; MST28 has a paralog, MST27, that arose from a segmental duplication +S000030819 CDS YAR033W 1 188107 188811 W 2011-02-03 1996-07-31 +S000006794 long_terminal_repeat YARWdelta7 chromosome 1 1 189426 189757 W 2011-02-03 2000-05-19 Ty2 LTR +S000000080 ORF Verified YAR035W YAT1 carnitine O-acetyltransferase YAT1 chromosome 1 L000002497 1 190193 192256 W 2011-02-03 1996-07-31 Outer mitochondrial carnitine acetyltransferase; minor ethanol-inducible enzyme involved in transport of activated acyl groups from the cytoplasm into the mitochondrial matrix; phosphorylated +S000031976 CDS YAR035W 1 190193 192256 W 2011-02-03 1996-07-31 +S000028595 ORF Uncharacterized YAR035C-A chromosome 1 1 192417 192337 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; predicted to have a role in cell budding based on computational "guilt by association" analysis +S000031375 CDS YAR035C-A 1 192417 192337 C 2011-02-03 2003-07-29 +S000000081 ORF Verified YAR042W SWH1 oxysterol-binding protein related protein SWH1|OSH1|YAR044W chromosome 1 L000002249 1 192619 196185 W 2011-02-03 2003-09-27|2006-01-19|1996-07-31 Protein similar to mammalian oxysterol-binding protein; contains ankyrin repeats and FFAT motif; interacts with ER anchor Scs2p at the nucleus-vacuole junction; regulated by sterol binding; SWH1 has a paralog, OSH2, that arose from the whole genome duplication +S000035065 CDS YAR042W 1 192619 196185 W 2011-02-03 2003-09-27|2006-01-19|1996-07-31 +S000000083 ORF Dubious YAR047C chromosome 1 1 201787 201467 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031684 CDS YAR047C 1 201787 201467 C 2011-02-03 1996-07-31 +S000000084 ORF Verified YAR050W FLO1 flocculin FLO1|FLO4|FLO2 chromosome 1 L000000617|L000000616 1 203403 208016 W 44 2011-02-03 1998-09-02|1996-07-31 Lectin-like protein involved in flocculation; cell wall protein that binds mannose chains on the surface of other cells, confers floc-forming ability that is chymotrypsin sensitive and heat resistant; important for co-flocculation with other yeasts, mediating interaction with specific species; FLO1 has a paralog, FLO5, that arose from a segmental duplication +S000036444 CDS YAR050W 1 203403 208016 W 2011-02-03 1998-09-02|1996-07-31 +S000000085 ORF Dubious YAR053W chromosome 1 1 208367 208663 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037285 CDS YAR053W 1 208367 208663 W 2011-02-03 1996-07-31 +S000006791 long_terminal_repeat YARCdelta8 chromosome 1 1 209778 209448 C 2011-02-03 2000-05-19 Ty1 LTR +S000121256 ARS ARS111 ARSI-215 chromosome 1 1 214888 215644 2011-02-03 2007-03-07 Autonomously Replicating Sequence +S000178038 ARS_consensus_sequence ARS111 1 215028 215012 C 2014-11-18 2014-11-18 +S000000086 ORF Dubious YAR060C chromosome 1 1 217492 217157 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YAR060C has a paralog, YHR212C, that arose from a segmental duplication +S000032661 CDS YAR060C 1 217492 217157 C 2011-02-03 1996-07-31 +S000000087 pseudogene YAR061W YAR062W chromosome 1 1 218140 219145 W 2014-11-18 1996-07-31|2014-11-18 Pseudogenic fragment with similarity to flocculins; YAR061W has a paralog, YHR212W-A, that arose from a segmental duplication +S000033393 CDS YAR061W 1 218140 219145 W 2014-11-18 1996-07-31|2014-11-18 +S000000089 ORF Uncharacterized YAR064W chromosome 1 1 220198 220497 W 2011-02-03 1996-07-31 Pseudogenic fragment with similarity to flocculins; YAR064W has a paralog, YHR213W-B, that arose from a segmental duplication +S000033577 CDS YAR064W 1 220198 220497 W 2011-02-03 1996-07-31 +S000002144 ORF Uncharacterized YAR066W chromosome 1 1 221049 221660 W 2011-02-03 1996-07-31 Putative GPI protein; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; YAR066W has a paralog, YHR214W, that arose from a segmental duplication +S000034603 CDS YAR066W 1 221049 221660 W 2011-02-03 1996-07-31 +S000000091 ORF Uncharacterized YAR068W chromosome 1 1 222406 222891 W 2011-02-03 1996-07-31 Fungal-specific protein of unknown function; induced in respiratory-deficient cells; YAR068W has a paralog, YHR214W-A, that arose from a segmental duplication +S000035691 CDS YAR068W 1 222406 222891 W 2011-02-03 1996-07-31 +S000121257 ARS ARS112 ARSI-223 chromosome 1 1 222880 224046 2011-02-03 2007-03-07 Autonomously Replicating Sequence +S000000092 ORF Dubious YAR069C chromosome 1 1 224304 224011 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; YAR069C has a paralog, YHR214C-D, that arose from a segmental duplication +S000035758 CDS YAR069C 1 224304 224011 C 2011-02-03 1996-07-31 +S000000093 ORF Dubious YAR070C chromosome 1 1 224862 224563 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; YAR070C has a paralog, YHR214C-B, that arose from a segmental duplication +S000036733 CDS YAR070C 1 224862 224563 C 2011-02-03 1996-07-31 +S000000094 ORF Verified YAR071W PHO11 acid phosphatase PHO11 chromosome 1 L000001423 1 225460 226863 W 48 2011-02-03 1996-07-31 One of three repressible acid phosphatases; glycoprotein that is transported to the cell surface by the secretory pathway; induced by phosphate starvation and coordinately regulated by PHO4 and PHO2; PHO11 has a paralog, PHO12, that arose from a segmental duplication +S000036824 CDS YAR071W 1 225460 226863 W 2011-02-03 1996-07-31 +S000000095 ORF Dubious YAR073W IMD1 chromosome 1 1 227742 228953 W 2011-02-03 1996-07-31 Nonfunctional protein with homology to IMP dehydrogenase; blocked reading frame, located close to the telomere; not expressed at detectable levels; YAR073W and YAR075W comprise a continuous reading frame in most strains of S. cerevisiae; YAR073W/YAR075W together have a paralog, IMD2, that arose from a segmental duplication +S000037618 CDS YAR073W 1 227742 228953 W 2011-02-03 1996-07-31 +S000002145 ORF Dubious YAR075W chromosome 1 1 228844 229317 W 2011-02-03 1996-07-31 Non-functional protein with homology IMP dehydrogenase; YAR073W/IMD1 and YAR075W comprise a continuous reading frame in most strains of S. cerevisiae; YAR073W/YAR075W together have a paralog, IMD2, that arose from a segmental duplication +S000037740 CDS YAR075W 1 228844 229317 W 2011-02-03 1996-07-31 +S000028937 telomere TEL01R chromosome 1 1 229411 230218 W 51 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the right arm of Chromosome I; composed of an X element core sequence and a short terminal stretch of telomeric repeats +S000028938 telomeric_repeat TEL01R 1 230121 230218 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome I +S000028939 X_element TEL01R 1 229411 229871 W 2011-02-03 2003-09-09|2011-02-03 Telomeric X element Core sequence on the right arm of Chromosome I; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028438 ARS ARS1001 chromosome 10 10 65 577 2002-12-16 2002-12-16 Autonomously Replicating Sequence +S000028665 ORF Dubious YJL225W-A chromosome 10 10 829 1311 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene YJL225C +S000032490 CDS YJL225W-A 10 829 1311 W 2003-07-29 2003-07-29 +S000003760 ORF Uncharacterized YJL225C Y' element ATP-dependent helicase chromosome 10 10 6130 466 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase +S000033322 CDS YJL225C 10 4581 466 C 1996-07-31 1996-07-31 +S000033321 CDS YJL225C 10 6130 4970 C 1996-07-31 1996-07-31 +S000033323 intron YJL225C 10 4969 4582 C 1996-07-31 1996-07-31 +S000028439 ARS ARS1002 chromosome 10 10 7445 7943 2002-12-16 2002-12-16 Autonomously Replicating Sequence +S000028901 telomere TEL10L chromosome 10 10 7767 1 C -125 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome X; composed of an X element core sequence, X element combinatorial repeats, a long Y' element, and a short terminal stretch of telomeric repeats +S000028902 telomeric_repeat TEL10L 10 60 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome X +S000028903 X_element TEL10L 10 7767 7305 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome X; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028904 X_element_combinatorial_repeat TEL10L 10 7304 6932 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr X; contains a repeat of the D type with a group I mitochondrial bI4 intron insertion; formerly called SubTelomeric Repeats +S000028905 Y_prime_element TEL10L 10 6931 61 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome X; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YJL225C and YJL225W-A +S000003759 ORF Verified YJL223C PAU1 seripauperin PAU1 chromosome 10 L000001343 10 9138 8776 C 1996-07-31 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole; active during alcoholic fermentation; regulated by anaerobiosis, negatively regulated by oxygen; repressed by heme; identical to Pau14p +S000032445 CDS YJL223C 10 9138 8776 C 1996-07-31 1996-07-31 +S000028664 ORF Dubious YJL222W-B chromosome 10 10 9346 9483 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032489 CDS YJL222W-B 10 9346 9483 W 2003-07-29 2003-07-29 +S000028663 ORF Dubious YJL222W-A chromosome 10 10 9452 9679 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032488 CDS YJL222W-A 10 9452 9679 W 2003-07-29 2003-07-29 +S000003758 ORF Verified YJL222W VTH2 signal sequence-binding protein chromosome 10 10 11475 16124 W 1996-07-31 1996-07-31 Putative membrane glycoprotein; has strong similarity to Vth1p and Pep1p/Vps10p; may be involved in vacuolar protein sorting +S000032381 CDS YJL222W 10 11475 16124 W 1996-07-31 1996-07-31 +S000028440 ARS ARS1003 chromosome 10 10 16124 16762 2002-12-16 2002-12-16 Autonomously Replicating Sequence +S000003756 ORF Dubious YJL220W chromosome 10 10 18243 18695 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL221C/FSP2 +S000032208 CDS YJL220W 10 18243 18695 W 1996-07-31 1996-07-31 +S000003757 ORF Verified YJL221C IMA4 oligo-1,6-glucosidase IMA4|FSP2 chromosome 10 L000002901 10 18536 16767 C 1996-07-31 1996-07-31 Alpha-glucosidase; weak, but broad substrate specificity for alpha-1,4- and alpha-1,6-glucosides; member of IMA isomaltase family; not required for isomaltose utilization, but Ima4p overexpression allows the ima1 null mutant to grow on isomaltose; identical to IMA3 +S000032237 CDS YJL221C 10 18536 16767 C 1996-07-31 1996-07-31 +S000003755 ORF Verified YJL219W HXT9 hexose transporter HXT9 chromosome 10 L000000843 10 19497 21200 W 1996-07-31 1996-07-31 Putative hexose transporter that is nearly identical to Hxt11p; has similarity to major facilitator superfamily (MFS) transporters, expression of HXT9 is regulated by transcription factors Pdr1p and Pdr3p +S000031251 CDS YJL219W 10 19497 21200 W 1996-07-31 1996-07-31 +S000003754 ORF Uncharacterized YJL218W acetyltransferase chromosome 10 10 21973 22563 W 1996-07-31 1996-07-31 Putative acetyltransferase; similar to bacterial galactoside O-acetyltransferases; induced by oleate in an OAF1/PIP2-dependent manner; promoter contains an oleate response element consensus sequence; non-essential gene +S000031119 CDS YJL218W 10 21973 22563 W 1996-07-31 1996-07-31 +S000003753 ORF Verified YJL217W REE1 chromosome 10 10 23133 23729 W 1996-07-31 1996-07-31 Cytoplasmic protein involved in the regulation of enolase (ENO1); mRNA expression is induced by calcium shortage, copper deficiency (via Mac1p) and the presence of galactose (via Gal4p); mRNA expression is also regulated by the cell cycle +S000030093 CDS YJL217W 10 23133 23729 W 1996-07-31 1996-07-31 +S000028441 ARS ARS1004 chromosome 10 10 23662 24158 2002-12-16 2002-12-16 Autonomously Replicating Sequence +S000178121 ARS_consensus_sequence ARS1004 10 23819 23835 W 2014-11-18 2014-11-18 +S000003752 ORF Verified YJL216C IMA5 oligo-1,6-glucosidase IMA5 chromosome 10 10 26086 24341 C 1996-07-31 1996-07-31 Alpha-glucosidase; specificity for isomaltose, maltose, and palatinose, but not alpha-methylglucoside; most distant member of the IMA isomaltase family, but with similar catalytic properties as Ima1p and Ima2p; not required for isomaltose utilization, but Ima5p overexpression allows the ima1 null mutant to grow on isomaltose; can cleave alpha-1,3 linkage of nigerose and turanose and alpha-1,5 linkage of leucrose and is very sensitive to temperature in vitro +S000029921 CDS YJL216C 10 26086 24341 C 1996-07-31 1996-07-31 +S000003751 ORF Dubious YJL215C chromosome 10 10 26771 26412 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037269 CDS YJL215C 10 26771 26412 C 1996-07-31 1996-07-31 +S000003750 ORF Verified YJL214W HXT8 hexose transporter HXT8 chromosome 10 L000000842 10 26887 28596 W 1996-07-31 1996-07-31 Protein of unknown function with similarity to hexose transporters; expression is induced by low levels of glucose and repressed by high levels of glucose +S000037229 CDS YJL214W 10 26887 28596 W 1996-07-31 1996-07-31 +S000003749 ORF Verified YJL213W chromosome 10 10 32163 33158 W 1996-07-31 1996-07-31 Protein of unknown function that may interact with ribosomes; periodically expressed during the yeast metabolic cycle; phosphorylated in vitro by the mitotic exit network (MEN) kinase complex, Dbf2p/Mob1p +S000037130 CDS YJL213W 10 32163 33158 W 1996-07-31 1996-07-31 +S000003748 ORF Verified YJL212C OPT1 oligopeptide transporter OPT1|GSH11|HGT1 chromosome 10 10 36249 33850 C 1996-07-31 1996-07-31 Proton-coupled oligopeptide transporter of the plasma membrane; also transports glutathione and phytochelatin; member of the OPT family +S000037000 CDS YJL212C 10 36249 33850 C 1996-07-31 1996-07-31 +S000003746 ORF Verified YJL210W PEX2 ubiquitin-protein ligase peroxin 2|PAS5|CRT1 chromosome 10 L000000422|L000003076 10 36919 37734 W 1996-07-31 1996-07-31 RING-finger peroxin and E3 ubiquitin ligase; peroxisomal membrane protein with a C-terminal zinc-binding RING domain, forms translocation subcomplex with Pex10p and Pex12p which functions in peroxisomal matrix protein import +S000036292 CDS YJL210W 10 36919 37734 W 1996-07-31 1996-07-31 +S000003747 ORF Dubious YJL211C chromosome 10 10 37200 36757 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL210W/PEX2 +S000036326 CDS YJL211C 10 37200 36757 C 1996-07-31 1996-07-31 +S000003745 ORF Verified YJL209W CBP1 chromosome 10 L000000224 10 38005 39969 W 1996-07-31 1996-07-31 Mitochondrial protein, regulator of COB mRNA stability and translation; interacts with the 5'-untranslated region of the COB mRNA; found in a complex at the inner membrane along with Pet309p; localizes to mitochondrial foci upon DNA replication stress +S000034944 CDS YJL209W 10 38005 39969 W 1996-07-31 1996-07-31 +S000003744 ORF Verified YJL208C NUC1 ribonuclease chromosome 10 L000001283 10 41183 40194 C 1996-07-31 1996-07-31 Major mitochondrial nuclease; has RNAse and DNA endo- and exonucleolytic activities; roles in mitochondrial recombination, apoptosis and maintenance of polyploidy; involved in fragmentation of genomic DNA during PND (programmed nuclear destruction); encodes ortholog of mammalian endoG +S000033945 CDS YJL208C 10 41183 40194 C 1996-07-31 1996-07-31 +S000003743 ORF Verified YJL207C LAA1 chromosome 10 10 47433 41389 C 1996-07-31 1996-07-31 AP-1 accessory protein; colocalizes with clathrin to the late-Golgi apparatus; involved in TGN-endosome transport; physically interacts with AP-1; similar to the mammalian p200; may interact with ribosomes; YJL207C is a non-essential gene +S000033803 CDS YJL207C 10 47433 41389 C 1996-07-31 1996-07-31 +S000003741 ORF Uncharacterized YJL206C chromosome 10 10 49935 47659 C 1996-07-31 1996-07-31 Putative protein of unknown function; similar to transcriptional regulators from the Zn[2]-Cys[6] binuclear cluster protein family; mRNA is weakly cell cycle regulated, peaking in S phase; induced rapidly upon MMS treatment +S000033077 CDS YJL206C 10 49935 47659 C 1996-07-31 1996-07-31 +S000003742 ORF Verified YJL205C NCE101 YJL205C-A|YJL206C-A|NCE1 chromosome 10 L000003097 10 50443 50139 C 1996-07-31 1996-07-31 Protein of unknown function; involved in secretion of proteins that lack classical secretory signal sequences; SWAT-GFP and mCherry fusion proteins localize to the cytosol +S000034430 CDS YJL205C 10 50268 50139 C 1996-07-31 1996-07-31 +S000034429 CDS YJL205C 10 50443 50412 C 1996-07-31 1996-07-31 +S000034431 intron YJL205C 10 50411 50269 C 1996-07-31 1996-07-31 +S000003740 ORF Verified YJL204C RCY1 chromosome 10 10 53151 50629 C 1996-07-31 1996-07-31 F-box protein involved in recycling endocytosed proteins; involved in recycling plasma membrane proteins internalized by endocytosis; localized to sites of polarized growth; direct interaction with C-terminal cytoplasmic region of Drs2p plays an important role for Drs2p function in endocytic recycling pathway +S000032878 CDS YJL204C 10 53151 50629 C 1996-07-31 1996-07-31 +S000003739 ORF Verified YJL203W PRP21 SPP91 chromosome 10 L000001507 10 53341 54183 W 1996-07-31 1996-07-31 Subunit of the SF3a splicing factor complex; required for spliceosome assembly +S000032839 CDS YJL203W 10 53341 54183 W 1996-07-31 1996-07-31 +S000003738 ORF Dubious YJL202C chromosome 10 10 54290 53943 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 3' end of essential PRP21 gene encoding a subunit of the SF3a splicing factor complex +S000031876 CDS YJL202C 10 54290 53943 C 1996-07-31 1996-07-31 +S000003737 ORF Verified YJL201W ECM25 chromosome 10 L000003897 10 54379 56178 W 1996-07-31 1996-07-31 Non-essential protein of unknown function; promoter contains a consensus binding sequence for factor Abf1p +S000031819 CDS YJL201W 10 54379 56178 W 1996-07-31 1996-07-31 +S000003736 ORF Verified YJL200C ACO2 aconitate hydratase ACO2 chromosome 10 10 58813 56444 C 1996-07-31 1996-07-31 Putative mitochondrial aconitase isozyme; similarity to Aco1p, an aconitase required for the TCA cycle; expression induced during growth on glucose, by amino acid starvation via Gcn4p, and repressed on ethanol +S000031641 CDS YJL200C 10 58813 56444 C 1996-07-31 1996-07-31 +S000006743 tRNA_gene tT(AGU)J chromosome 10 L000003628 10 59172 59100 C 2000-05-19 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000032173 noncoding_exon tT(AGU)J 10 59172 59100 C 2000-05-19 2000-05-19 +S000007027 long_terminal_repeat YJLWdelta1 chromosome 10 10 59505 59784 W 2011-02-03 2000-05-19 Ty1 LTR +S000003735 ORF Uncharacterized YJL199C MBB1 chromosome 10 10 60182 59856 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains, not conserved in closely related Saccharomyces species; protein detected in large-scale protein-protein interaction studies; YJL199C is not an essential gene +S000035098 CDS YJL199C 10 60182 59856 C 2011-02-03 1996-07-31 +S000003734 ORF Verified YJL198W PHO90 SPX domain-containing inorganic phosphate transporter chromosome 10 10 60844 63489 W 2011-02-03 1996-07-31 Low-affinity phosphate transporter; acts upstream of Pho81p in regulation of the PHO pathway; deletion of pho84, pho87, pho89, pho90, and pho91 causes synthetic lethality; transcription independent of Pi and Pho4p activity; overexpression results in vigorous growth; PHO90 has a paralog, PHO87, that arose from the whole genome duplication +S000034201 CDS YJL198W 10 60844 63489 W 2011-02-03 1996-07-31 +S000003733 ORF Verified YJL197W UBP12 putative ubiquitin-specific protease UBP12 chromosome 10 L000003033 10 63805 67569 W 2011-02-03 1996-07-31 Ubiquitin-specific protease; cleaves ubiquitin from ubiquitinated proteins; present in the nucleus and cytoplasm +S000034104 CDS YJL197W 10 63805 67569 W 2011-02-03 1996-07-31 +S000028839 ORF Dubious YJL197C-A chromosome 10 10 66086 65805 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL197C/UBP12 +S000034494 CDS YJL197C-A 10 66086 65805 C 2011-02-03 2003-07-29 +S000028442 ARS ARS1005 chromosome 10 10 67663 67736 2014-11-18 2002-12-16|2014-11-18 Autonomously Replicating Sequence +S000003732 ORF Verified YJL196C ELO1 fatty acid elongase ELO1 chromosome 10 L000003442 10 68782 67850 C 2011-02-03 1996-07-31 Elongase I, medium-chain acyl elongase; catalyzes carboxy-terminal elongation of unsaturated C12-C16 fatty acyl-CoAs to C16-C18 fatty acids; ELO1 has a paralog, ELO2, that arose from the whole genome duplication +S000033953 CDS YJL196C 10 68782 67850 C 2011-02-03 1996-07-31 +S000003730 ORF Verified YJL194W CDC6 AAA family ATPase CDC6 chromosome 10 L000000246 10 69338 70879 W -124 2011-02-03 1996-07-31 Essential ATP-binding protein required for DNA replication; component of the pre-replicative complex (pre-RC) which requires ORC to associate with chromatin and is in turn required for Mcm2-7p DNA association; homologous to S. pombe Cdc18p; relocalizes from nucleus to cytoplasm upon DNA replication stress; degraded in response to plasma membrane stress +S000033118 CDS YJL194W 10 69338 70879 W 2011-02-03 1996-07-31 +S000003731 ORF Dubious YJL195C chromosome 10 10 69942 69241 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL194W/CDC6 +S000033155 CDS YJL195C 10 69942 69241 C 2011-02-03 1996-07-31 +S000003729 ORF Uncharacterized YJL193W chromosome 10 10 71366 72574 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to encode a triose phosphate transporter subfamily member based on phylogenetic analysis; similar to YOR307C/SLY41; deletion mutant has a respiratory growth defect +S000033028 CDS YJL193W 10 71366 72574 W 2011-02-03 1996-07-31 +S000003728 ORF Verified YJL192C SOP4 EMC7 chromosome 10 10 73414 72710 C 2011-02-03 1996-07-31 ER-membrane protein; subunit of evolutionarily conserved EMC (Endoplasmic Reticulum Membrane Complex) implicated in ERAD (ER-associated degradation) and proper assembly of multi-pass transmembrane (TM) proteins; EMC acts in yeast as an ER-mitochondria tether that interacts with outer membrane protein Tom5 of TOM (Translocase of the Mitochondrial Outer Membrane) complex; suppressor of pma1-7, deletion of SOP4 slows down export of wild-type Pma1p and Pma1-7 from the ER +S000032055 CDS YJL192C 10 73414 72710 C 2011-02-03 1996-07-31 +S000003727 ORF Verified YJL191W RPS14B uS11|ribosomal 40S subunit protein S14B|S11|rp59B|S14B|CRY2 chromosome 10 L000000424 10 73787 74611 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; required for ribosome assembly and 20S pre-rRNA processing; mutations confer cryptopleurine resistance; homologous to mammalian ribosomal protein S14 and bacterial S11; RPS14B has a paralog, RPS14A, that arose from the whole genome duplication +S000032004 CDS YJL191W 10 73787 73796 W 2011-02-03 1996-07-31 +S000032005 CDS YJL191W 10 74205 74611 W 2011-02-03 1996-07-31 +S000032006 intron YJL191W 10 73797 74204 W 2011-02-03 1996-07-31 +S000003726 ORF Verified YJL190C RPS22A uS8|ribosomal 40S subunit protein S22A|S8|rp50|YS22|S24A|S22A|RPS24 chromosome 10 L000003150|L000001760 10 75302 74910 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S15A and bacterial S8; RPS22A has a paralog, RPS22B, that arose from the whole genome duplication +S000031736 CDS YJL190C 10 75302 74910 C 2011-02-03 1996-07-31 +S000003725 ORF Verified YJL189W RPL39 eL39|ribosomal 60S subunit protein L39|L39e|YL40|L46|L39|SPB2|RPL46 chromosome 10 L000001737 10 75933 76474 W 2011-02-03 1996-07-31|2011-02-03 Ribosomal 60S subunit protein L39; required for ribosome biogenesis; loss of both Rpl31p and Rpl39p confers lethality; also exhibits genetic interactions with SIS1 and PAB1; homologous to mammalian ribosomal protein L39, no bacterial homolog +S000030844 CDS YJL189W 10 75933 75938 W 2011-02-03 1996-07-31 +S000030845 CDS YJL189W 10 76325 76474 W 2011-02-03 1996-07-31 +S000030846 intron YJL189W 10 75939 76324 W 2011-02-03 1996-07-31|2011-02-03 +S000003724 ORF Dubious YJL188C BUD19 chromosome 10 10 76510 76202 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 88% of ORF overlaps the verified gene RPL39; diploid mutant displays a weak budding pattern phenotype in a systematic assay +S000037873 CDS YJL188C 10 76510 76202 C 2011-02-03 1996-07-31|2011-02-03 +S000003723 ORF Verified YJL187C SWE1 tyrosine protein kinase SWE1|WEE1 chromosome 10 L000002248 10 79262 76803 C 2011-02-03 1996-07-31 Protein kinase that regulates the G2/M transition; negative regulator of the Cdc28p kinase; morphogenesis checkpoint kinase; positive regulator of sphingolipid biosynthesis via Orm2p; phosphorylates a tyrosine residue in the N-terminus of Hsp90 in a cell-cycle associated manner, thus modulating the ability of Hsp90 to chaperone a selected clientele; localizes to the nucleus and to the daughter side of the mother-bud neck; homolog of S. pombe Wee1p; potential Cdc28p substrate +S000037770 CDS YJL187C 10 79262 76803 C 2011-02-03 1996-07-31 +S000003722 ORF Verified YJL186W MNN5 alpha-1,2-mannosyltransferase MNN5 chromosome 10 L000004918 10 80155 81915 W 2011-02-03 1996-07-31|2011-02-03 Alpha-1,2-mannosyltransferase; responsible for addition of the second alpha-1,2-linked mannose of the branches on the mannan backbone of oligosaccharides, localizes to an early Golgi compartment +S000037744 CDS YJL186W 10 80155 81915 W 2011-02-03 1996-07-31|2011-02-03 +S000003721 ORF Verified YJL185C ATG36 chromosome 10 10 82976 82095 C 2011-02-03 1996-07-31 Pex3p interacting protein, required for pexophagy; interacts with Atg8p and Atg11p; mRNA is weakly cell cycle regulated, peaking in G2 phase; YJL185C is a non-essential gene +S000036951 CDS YJL185C 10 82976 82095 C 2011-02-03 1996-07-31 +S000003720 ORF Verified YJL184W GON7 chromatin DNA-binding EKC/KEOPS complex subunit GON7|PCC2|LDB6 chromosome 10 10 83448 83819 W 2011-02-03 1996-07-31 Component of the EKC/KEOPS protein complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; implicated in osmotic stress response; other complex members are Kae1p, Cgi121p, Pcc1p, and Bud32p +S000036918 CDS YJL184W 10 83448 83819 W 2011-02-03 1996-07-31 +S000003719 ORF Verified YJL183W MNN11 alpha-1,6-mannosyltransferase chromosome 10 L000004260 10 84068 85336 W 2011-02-03 1996-07-31|2011-02-03 Subunit of a Golgi mannosyltransferase complex; this complex also contains Anp1p, Mnn9p, Mnn10p, and Hoc1p, and mediates elongation of the polysaccharide mannan backbone; has homology to Mnn10p +S000036862 CDS YJL183W 10 84068 85336 W 2011-02-03 1996-07-31|2011-02-03 +S000003717 ORF Uncharacterized YJL181W RBH1 RBH1 chromosome 10 10 85660 87495 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression is cell-cycle regulated as shown by microarray analysis; potential regulatory target of Mbp1p, which binds to the YJL181W promoter region; contains a PH-like domain; RBH1 has a paralog, RBH2, that arose from the whole genome duplication +S000035872 CDS YJL181W 10 85660 87495 W 2011-02-03 1996-07-31 +S000003718 ORF Dubious YJL182C chromosome 10 10 85752 85435 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YJL181W +S000035944 CDS YJL182C 10 85752 85435 C 2011-02-03 1996-07-31 +S000003716 ORF Verified YJL180C ATP12 ATP synthase complex assembly protein ATP12 chromosome 10 L000000149 10 88560 87583 C 2011-02-03 1996-07-31 Assembly factor for F1 sector of mitochondrial F1F0 ATP synthase; conserved protein; required for assembly of alpha and beta subunits into F1 sector of mitochondrial F1F0 ATP synthase; human homolog ATPAF2 can complement yeast atp12 mutant; mutation of human homolog reduces active ATP synthase levels and is associated with the disorder ATPAF2 deficiency +S000035717 CDS YJL180C 10 88560 87583 C 2011-02-03 1996-07-31 +S000003715 ORF Verified YJL179W PFD1 prefolding complex chaperone subunit|GIM6 chromosome 10 L000004367 10 88787 89116 W 2011-02-03 1996-07-31|2011-02-03 Subunit of heterohexameric prefoldin; prefoldin binds cytosolic chaperonin and transfers target proteins to it; involved in the biogenesis of actin and of alpha- and gamma-tubulin; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation +S000034696 CDS YJL179W 10 88787 89116 W 2011-02-03 1996-07-31|2011-02-03 +S000003714 ORF Verified YJL178C ATG27 ETF1 chromosome 10 10 90097 89282 C 2011-02-03 2004-02-12|1996-07-31 Type I membrane protein involved in autophagy and the Cvt pathway; may be involved in membrane delivery to the phagophore assembly site +S000033739 CDS YJL178C 10 90097 89282 C 2011-02-03 2004-02-12|1996-07-31 +S000003713 ORF Verified YJL177W RPL17B uL22|ribosomal 60S subunit protein L17B|L22|YL17|L20B|L17B chromosome 10 L000004457 10 90786 91657 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L17B; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; homologous to mammalian ribosomal protein L17 and bacterial L22; RPL17B has a paralog, RPL17A, that arose from the whole genome duplication +S000033683 CDS YJL177W 10 90786 91094 W 2011-02-03 1996-07-31 +S000033684 CDS YJL177W 10 91412 91657 W 2011-02-03 1996-07-31 +S000033685 intron YJL177W 10 91095 91411 W 2011-02-03 1996-07-31 +S000003711 ORF Dubious YJL175W chromosome 10 10 94049 94561 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; deletion confers resistance to cisplatin, hypersensitivity to 5-fluorouracil, and growth defect at high pH with high calcium; overlaps gene for SWI3 transcription factor +S000033497 CDS YJL175W 10 94049 94561 W 2011-02-03 1996-07-31 +S000003712 ORF Verified YJL176C SWI3 HAF2|TYE2 chromosome 10 L000002251 10 94530 92053 C 2011-02-03 1996-07-31 Subunit of the SWI/SNF chromatin remodeling complex; SWI/SNF regulates transcription by remodeling chromosomes; contains SANT domain that is required for SWI/SNF assembly; is essential for displacement of histone H2A-H2B dimers during ATP-dependent remodeling; required for transcription of many genes, including ADH1, ADH2, GAL1, HO, INO1 and SUC2; relocates to the cytosol under hypoxic conditions +S000033535 CDS YJL176C 10 94530 92053 C 2011-02-03 1996-07-31 +S000003710 ORF Verified YJL174W KRE9 chromosome 10 L000000916 10 95092 95922 W -111.26 2011-02-03 1996-07-31 Glycoprotein involved in cell wall beta-glucan assembly; null mutation leads to severe growth defects, aberrant multibudded morphology, and mating defects +S000032753 CDS YJL174W 10 95092 95922 W 2011-02-03 1996-07-31 +S000003709 ORF Verified YJL173C RFA3 RPA14|RPA3 chromosome 10 L000001622 10 96529 96161 C 2011-02-03 1996-07-31 Subunit of heterotrimeric Replication Protein A (RPA); RPA is a highly conserved single-stranded DNA binding protein complex involved in DNA replication, repair, recombination; RPA protects against inappropriate telomere recombination, and upon telomere uncapping, prevents cell proliferation by a checkpoint-independent pathway; with Sgs1p-Top2p-Rmi1p, stimulates DNA catenation/decatenation activity of Top3p; protein abundance increases in response to DNA replication stress +S000032609 CDS YJL173C 10 96529 96161 C 2011-02-03 1996-07-31 +S000003708 ORF Verified YJL172W CPS1 Gly-Xaa carboxypeptidase chromosome 10 L000000403 10 97737 99467 W 2011-02-03 1996-07-31 Vacuolar carboxypeptidase S; expression is induced under low-nitrogen conditions +S000032538 CDS YJL172W 10 97737 99467 W 2011-02-03 1996-07-31 +S000028443 ARS ARS1006 chromosome 10 10 99458 99678 2014-11-18 2002-12-16|2014-11-18|2011-02-03 Autonomously Replicating Sequence +S000178122 ARS_consensus_sequence ARS1006 10 99617 99601 C 2014-11-18 2014-11-18 +S000003707 ORF Verified YJL171C TOH1 chromosome 10 10 100894 99704 C 2011-02-03 1996-07-31|2011-02-03 GPI-anchored cell wall protein of unknown function; induced in response to cell wall damaging agents and by mutations in genes involved in cell wall biogenesis; sequence similarity to YBR162C/TOS1, a covalently bound cell wall protein; protein abundance increases in response to DNA replication stress +S000031523 CDS YJL171C 10 100894 99704 C 2011-02-03 1996-07-31|2011-02-03 +S000003706 ORF Verified YJL170C ASG7 chromosome 10 L000004055 10 101779 101150 C 2011-02-03 1996-07-31|2006-01-18 Protein that regulates signaling from G protein beta subunit Ste4p; contributes to relocalization of Ste4p within the cell; specific to a-cells and induced by alpha-factor +S000031474 CDS YJL170C 10 101779 101150 C 2011-02-03 1996-07-31|2006-01-18 +S000003705 ORF Dubious YJL169W chromosome 10 10 102099 102467 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL168C/SET2 +S000030718 CDS YJL169W 10 102099 102467 W 2011-02-03 1996-07-31|2011-02-03 +S000003704 ORF Verified YJL168C SET2 histone methyltransferase SET2|KMT3|EZL1 chromosome 10 L000003090 10 104428 102227 C 2011-02-03 1996-07-31|2011-02-03 Histone methyltransferase with a role in transcriptional elongation; methylates H3 lysine 36 (H3K36), which suppresses incorporation of acetylated histones and signals for the deacetylation of these histones within transcribed genes; associates with the C-terminal domain(CTD) of Rpo21p; H3K36me3 (trimethylation) requires Spt6p, proline 38 on H3, CTD of Rpo21p, Ctk1p, and C-terminal SRI domain of Ste2p; relocalizes to the cytosol in response to hypoxia +S000030590 CDS YJL168C 10 104428 102227 C 2011-02-03 1996-07-31|2011-02-03 +S000003703 ORF Verified YJL167W ERG20 bifunctional (2E,6E)-farnesyl diphosphate synthase/dimethylallyltranstransferase|FPP1|FDS1|BOT3 chromosome 10 L000000579 10 105014 106072 W 2011-02-03 1996-07-31 Farnesyl pyrophosphate synthetase; has both dimethylallyltranstransferase and geranyltranstransferase activities; catalyzes the formation of C15 farnesyl pyrophosphate units for isoprenoid and sterol biosynthesis +S000030519 CDS YJL167W 10 105014 106072 W 2011-02-03 1996-07-31 +S000003702 ORF Verified YJL166W QCR8 ubiquinol--cytochrome-c reductase subunit 8|COR5 chromosome 10 L000001548 10 106434 106718 W 2011-02-03 1996-07-31 Subunit 8 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; oriented facing the intermembrane space; expression is regulated by Abf1p and Cpf1p +S000030370 CDS YJL166W 10 106434 106718 W 2011-02-03 1996-07-31 +S000003701 ORF Verified YJL165C HAL5 protein kinase HAL5 chromosome 10 L000000751 10 109461 106894 C 2011-02-03 1996-07-31 Putative protein kinase; overexpression increases sodium and lithium tolerance, whereas gene disruption increases cation and low pH sensitivity and impairs potassium uptake, suggesting a role in regulation of Trk1p and/or Trk2p transporters; HAL5 has a paralog, KKQ8, that arose from the whole genome duplication +S000037517 CDS YJL165C 10 109461 106894 C 2011-02-03 1996-07-31 +S000003700 ORF Verified YJL164C TPK1 cAMP-dependent protein kinase catalytic subunit TPK1|SRA3|PKA1 chromosome 10 L000002045 10 111159 109966 C -106 2011-02-03 1996-07-31|2011-02-03 cAMP-dependent protein kinase catalytic subunit; promotes vegetative growth in response to nutrients via the Ras-cAMP signaling pathway; inhibited by regulatory subunit Bcy1p in the absence of cAMP; phosphorylates and inhibits Whi3p to promote G1/S phase passage; partially redundant with Tpk2p and Tpk3p; phosphorylates pre-Tom40p, which impairs its import into mitochondria under non-respiratory conditions; TPK1 has a paralog, TPK3, that arose from the whole genome duplication +S000037409 CDS YJL164C 10 111159 109966 C 2011-02-03 1996-07-31|2011-02-03 +S000003699 ORF Uncharacterized YJL163C chromosome 10 10 113333 111666 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000036682 CDS YJL163C 10 113333 111666 C 2011-02-03 1996-07-31 +S000028444 ARS ARS1007 chromosome 10 10 113678 113749 2014-11-18 2002-12-16|2014-11-18 Autonomously Replicating Sequence +S000178123 ARS_consensus_sequence ARS1007 10 113744 113728 C 2014-11-18 2014-11-18 +S000003698 ORF Verified YJL162C JJJ2 chromosome 10 10 115629 113878 C 2011-02-03 1996-07-31|2006-01-18 Protein of unknown function; contains a J-domain, which is a region with homology to the E. coli DnaJ protein +S000036580 CDS YJL162C 10 115629 113878 C 2011-02-03 1996-07-31|2006-01-18 +S000006557 tRNA_gene tE(UUC)J chromosome 10 L000003627 10 116010 115939 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin +S000035988 noncoding_exon tE(UUC)J 10 116010 115939 C 2011-02-03 2000-05-19 +S000003697 ORF Uncharacterized YJL161W FMP33 chromosome 10 10 117245 117787 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000036525 CDS YJL161W 10 117245 117787 W 2011-02-03 1996-07-31 +S000003696 ORF Uncharacterized YJL160C PIR5 beta-1,3-glucan linked protein chromosome 10 10 118825 117962 C 2011-02-03 2004-02-19|1996-07-31 Putative protein of unknown function; member of the PIR (Proteins with Internal Repeats) family of cell wall proteins; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, and mCherry fusion localizes to the vacuole; non-essential gene that is required for sporulation; mRNA is weakly cell cycle regulated, peaking in mitosis; YJL160C has a paralog, PIR1, that arose from the whole genome duplication +S000035585 CDS YJL160C 10 118825 117962 C 2011-02-03 2004-02-19|1996-07-31 +S000003695 ORF Verified YJL159W HSP150 heat shock protein HSP150|PIR2|ORE1|CCW7 chromosome 10 L000000824|L000001442 10 120449 121690 W 2011-02-03 2004-02-18|1996-07-31|2006-10-04 O-mannosylated heat shock protein; secreted and covalently attached to the cell wall via beta-1,3-glucan and disulfide bridges; required for cell wall stability; induced by heat shock, oxidative stress, and nitrogen limitation; HSP150 has a paralog, PIR3, that arose from the whole genome duplication +S000035769 CDS YJL159W 10 120449 121690 W 2011-02-03 2004-02-18|1996-07-31|2006-10-04 +S000003694 ORF Verified YJL158C CIS3 SCW8|CCW5|PIR4|CCW11 chromosome 10 S000029072|L000003951|L000004553|S000029439|L000004569 10 122948 122265 C 2011-02-03 1996-07-31 Mannose-containing glycoprotein constituent of the cell wall; member of the PIR (proteins with internal repeats) family +S000035606 CDS YJL158C 10 122948 122265 C 2011-02-03 1996-07-31 +S000003693 ORF Verified YJL157C FAR1 cyclin-dependent protein serine/threonine kinase inhibiting protein FAR1 chromosome 10 L000000600 10 126328 123836 C 2011-02-03 1996-07-31 CDK inhibitor and nuclear anchor; during the cell cycle Far1p sequesters the GEF Cdc24p in the nucleus; phosphorylation by Cdc28p-Cln results in SCFCdc4 complex-mediated ubiquitin-dependent degradation, releasing Cdc24p for export and activation of GTPase Cdc42p; in response to pheromone, phosphorylation of Far1p by MAPK Fus3p results in association with, and inhibition of Cdc28p-Cln, as well as Msn5p mediated nuclear export of Far1p-Cdc24p, targeting Cdc24p to polarity sites +S000035524 CDS YJL157C 10 126328 123836 C 2011-02-03 1996-07-31 +S000007613 ORF Dubious YJL156W-A chromosome 10 10 126604 126825 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037190 CDS YJL156W-A 10 126604 126825 W 2011-02-03 2001-02-26 +S000003692 ORF Verified YJL156C SSY5 RAA3 chromosome 10 L000003187|S000029401|L000004045 10 128952 126853 C 2011-02-03 1996-07-31|2009-02-18 Serine protease of SPS plasma membrane amino acid sensor system; contains an inhibitory domain that dissociates in response to extracellular amino acids, freeing a catalytic domain to activate transcription factor Stp1p; other members are Ssy1p and Ptr3p +S000034507 CDS YJL156C 10 128952 126853 C 2011-02-03 1996-07-31|2009-02-18 +S000003691 ORF Verified YJL155C FBP26 fructose-2,6-bisphosphatase chromosome 10 L000000606 10 130643 129285 C 2011-02-03 1996-07-31 Fructose-2,6-bisphosphatase, required for glucose metabolism; protein abundance increases in response to DNA replication stress +S000034402 CDS YJL155C 10 130643 129285 C 2011-02-03 1996-07-31 +S000003690 ORF Verified YJL154C VPS35 retromer subunit VPS35|VPT7|GRD9 chromosome 10 L000002477 10 133935 131101 C -102 2011-02-03 1996-07-31 Endosomal subunit of membrane-associated retromer complex; required for retrograde transport; receptor that recognizes retrieval signals on cargo proteins, forms subcomplex with Vps26p and Vps29p that selects cargo proteins for retrieval; interacts with Ypt7p; overexpression of wild-type human VPS35 or Parkinson's-associated vps35-D686N or vps35-P299S variants complements Ni2+ resistance and Cd2+ sensitivity of yeast vps35 null mutant +S000034312 CDS YJL154C 10 133935 131101 C 2011-02-03 1996-07-31 +S000003689 ORF Verified YJL153C INO1 inositol-3-phosphate synthase INO1|APR1 chromosome 10 L000000867 10 135933 134332 C -101 2011-02-03 2003-09-22|1996-07-31 Inositol-3-phosphate synthase; involved in synthesis of inositol phosphates and inositol-containing phospholipids; transcription is coregulated with other phospholipid biosynthetic genes by Ino2p and Ino4p, which bind the UASINO DNA element +S000033398 CDS YJL153C 10 135933 134332 C 2011-02-03 2003-09-22|1996-07-31 +S000003688 ORF Dubious YJL152W chromosome 10 10 136174 136533 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033364 CDS YJL152W 10 136174 136533 W 2011-02-03 1996-07-31 +S000003687 ORF Verified YJL151C SNA3 chromosome 10 10 136773 136372 C 2011-02-03 1996-07-31 Protein involved in efficient MVB sorting of proteins to the vacuole; may function as an RSP5 adapter protein for MVB cargos; integral membrane protein localized to vacuolar intralumenal vesicles +S000033267 CDS YJL151C 10 136773 136372 C 2011-02-03 1996-07-31 +S000003686 ORF Dubious YJL150W chromosome 10 10 137123 137425 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033233 CDS YJL150W 10 137123 137425 W 2011-02-03 1996-07-31 +S000003685 ORF Verified YJL149W DAS1 DUH1|SCF ubiquitin ligase complex subunit DAS1 chromosome 10 10 137379 139370 W 2011-02-03 1996-07-31 Putative SCF ubiquitin ligase F-box protein; interacts physically with both Cdc53p and Skp1 and genetically with CDC34; similar to putative F-box protein YDR131C +S000032472 CDS YJL149W 10 137379 139370 W 2011-02-03 1996-07-31 +S000006508 snoRNA_gene snR128 SNR128 U14 chromosome 10 L000001975 10 139691 139566 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); referred to as U14; essential gene required for cleavage of 35S primary rRNA transcript to release the precursor to the 18S rRNA; guides 2'-O-methylation of small subunit (SSU) rRNA at position C414 +S000035225 noncoding_exon snR128 10 139691 139566 C 2011-02-03 2000-05-19 +S000006509 snoRNA_gene snR190 SNR190 chromosome 10 L000001977 10 139950 139761 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); predicted to guide 2'-O-methylation of large subunit (LSU) rRNA at position G2395; not shown to be active +S000030414 noncoding_exon snR190 10 139950 139761 C 2011-02-03 2000-05-19 +S000003684 ORF Verified YJL148W RPA34 DNA-directed RNA polymerase I subunit RPA34|CST21|A34.5 chromosome 10 L000004132|L000003000|S000029123 10 140437 141138 W 2011-02-03 1996-07-31 RNA polymerase I subunit A34.5; essential for nucleolar assembly and for high polymerase loading rate; nucleolar localization depends on Rpa49p +S000032342 CDS YJL148W 10 140437 141138 W 2011-02-03 1996-07-31 +S000003683 ORF Uncharacterized YJL147C MRX5 chromosome 10 10 142567 141419 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; homozygous diploid deletion strain has a sporulation defect characterized by elevated dityrosine in the soluble fraction; expression induced by calcium shortage; YJL147W is a non-essential gene +S000031289 CDS YJL147C 10 142567 141419 C 2011-02-03 1996-07-31 +S000003682 ORF Verified YJL146W IDS2 chromosome 10 L000000853 10 143292 144701 W 2011-02-03 1996-07-31 Protein involved in modulation of Ime2p activity during meiosis; appears to act indirectly to promote Ime2p-mediated late meiotic functions; found in growing cells and degraded during sporulation +S000031249 CDS YJL146W 10 143292 144701 W 2011-02-03 1996-07-31 +S000003681 ORF Verified YJL145W SFH5 chromosome 10 10 145160 146044 W 2011-02-03 1996-07-31 Non-classical phosphatidylinositol transfer protein (PITP); exhibits PI- but not PC-transfer activity; localizes to the peripheral endoplasmic reticulum, cytosol and microsomes; similar to Sec14p; partially relocalizes to the plasma membrane upon DNA replication stress +S000031116 CDS YJL145W 10 145160 146044 W 2011-02-03 1996-07-31 +S000003680 ORF Verified YJL144W chromosome 10 10 146359 146673 W 2011-02-03 1996-07-31 Cytoplasmic hydrophilin essential in desiccation-rehydration process; expression induced by osmotic stress, starvation and during stationary phase; protein abundance increases in response to DNA replication stress +S000030090 CDS YJL144W 10 146359 146673 W 2011-02-03 1996-07-31 +S000003679 ORF Verified YJL143W TIM17 protein transporter TIM17|SMS1|MPI2|MIM17 chromosome 10 L000001139 10 147101 147577 W 2011-02-03 1996-07-31 Essential component of the TIM23 complex; with Tim23p, contributes to the architecture and function of the import channel; may link the import motor to the core Translocase of the Inner Mitochondrial membrane (TIM23 complex) +S000029979 CDS YJL143W 10 147101 147577 W 2011-02-03 1996-07-31 +S000003678 ORF Dubious YJL142C IRC9 chromosome 10 10 148211 147819 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene YJL141C; null mutant displays increased levels of spontaneous Rad52p foci +S000037267 CDS YJL142C 10 148211 147819 C 2011-02-03 1996-07-31 +S000003677 ORF Verified YJL141C YAK1 serine/threonine protein kinase YAK1 chromosome 10 L000002490 10 150390 147967 C 2011-02-03 1996-07-31 Serine-threonine protein kinase; component of a glucose-sensing system that inhibits growth in response to glucose availability; upon nutrient deprivation Yak1p phosphorylates Pop2p to regulate mRNA deadenylation, the co-repressor Crf1p to inhibit transcription of ribosomal genes, and the stress-responsive transcription factors Hsf1p and Msn2p; nuclear localization negatively regulated by the Ras/PKA signaling pathway in the presence of glucose +S000037175 CDS YJL141C 10 150390 147967 C 2011-02-03 1996-07-31 +S000003676 ORF Verified YJL140W RPB4 DNA-directed RNA polymerase II subunit RPB4|B32|CTF15 chromosome 10 L000001678 10 150961 151626 W 2011-02-03 1996-07-31 RNA polymerase II subunit B32; forms dissociable heterodimer with Rpb7p; Rpb4/7 dissociates from RNAPII as Ser2 CTD phosphorylation increases; Rpb4/7 regulates cellular lifespan via mRNA decay process; involved in recruitment of 3'-end processing factors to transcribing RNAPII complex, export of mRNA to cytoplasm under stress conditions; also involved in translation initiation +S000037123 CDS YJL140W 10 150961 151626 W 2011-02-03 1996-07-31 +S000003675 ORF Verified YJL139C YUR1 mannosyltransferase YUR1 chromosome 10 L000002566 10 152999 151713 C -90.66 2011-02-03 1996-07-31 Mannosyltransferase involved in protein N-glycosylation; member of the KTR1 family; located in the Golgi apparatus; YUR1 has a paralog, KTR2, that arose from the whole genome duplication +S000035317 CDS YJL139C 10 152999 151713 C 2011-02-03 1996-07-31 +S000003674 ORF Verified YJL138C TIF2 translation initiation factor eIF4A|eIF4A chromosome 10 L000002303 10 154691 153504 C -92 2011-02-03 1996-07-31 Translation initiation factor eIF4A; DEA(D/H)-box RNA helicase that couples ATPase activity to RNA binding and unwinding; forms a dumbbell structure of two compact domains connected by a linker; interacts with eIF4G; protein abundance increases in response to DNA replication stress; TIF2 has a paralog, TIF1, that arose from the whole genome duplication +S000035154 CDS YJL138C 10 154691 153504 C 2011-02-03 1996-07-31 +S000003673 ORF Verified YJL137C GLG2 glycogenin glucosyltransferase GLG2 chromosome 10 L000003159 10 156127 154985 C 2011-02-03 1996-07-31 Glycogenin glucosyltransferase; self-glucosylating initiator of glycogen synthesis, also glucosylates n-dodecyl-beta-D-maltoside; similar to mammalian glycogenin; GLG2 has a paralog, GLG1, that arose from the whole genome duplication +S000035008 CDS YJL137C 10 156127 154985 C 2011-02-03 1996-07-31 +S000028806 ORF Uncharacterized YJL136W-A chromosome 10 10 156169 156252 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE +S000033589 CDS YJL136W-A 10 156169 156252 W 2011-02-03 2003-07-29 +S000003672 ORF Verified YJL136C RPS21B eS21|ribosomal 40S subunit protein S21B|S21e|YS25|S26B|S21B chromosome 10 L000003031 10 157273 156550 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S21, no bacterial homolog; RPS21B has a paralog, RPS21A, that arose from the whole genome duplication +S000034084 CDS YJL136C 10 156789 156550 C 2011-02-03 1996-07-31 +S000034083 CDS YJL136C 10 157273 157250 C 2011-02-03 1996-07-31 +S000034085 intron YJL136C 10 157249 156790 C 2011-02-03 1996-07-31 +S000003671 ORF Dubious YJL135W chromosome 10 10 157877 158194 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified genes YJL134W/LCB3 +S000034027 CDS YJL135W 10 157877 158194 W 2011-02-03 1996-07-31 +S000003670 ORF Verified YJL134W LCB3 sphinganine kinase LCB3|YSR2|LBP1 chromosome 10 L000004101 10 158188 159417 W 2011-02-03 1996-07-31 Long-chain base-1-phosphate phosphatase; specific for dihydrosphingosine-1-phosphate, regulates ceramide and long-chain base phosphates levels, involved in incorporation of exogenous long chain bases in sphingolipids; LCB3 has a paralog, YSR3, that arose from the whole genome duplication +S000033888 CDS YJL134W 10 158188 159417 W 2011-02-03 1996-07-31 +S000028805 ORF Uncharacterized YJL133C-A chromosome 10 10 159847 159623 C 2011-02-03 2003-07-29 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033587 CDS YJL133C-A 10 159847 159623 C 2011-02-03 2003-07-29 +S000003669 ORF Verified YJL133W MRS3 Fe(2+) transporter chromosome 10 L000001179 10 160619 161563 W 2011-02-03 1996-07-31 Iron transporter, mediates Fe2+ transport across inner mito membrane; mitochondrial carrier family member; active under low-iron conditions; may transport other cations; MRS3 has a paralog, MRS4, that arose from the whole genome duplication +S000033746 CDS YJL133W 10 160619 161563 W 2011-02-03 1996-07-31 +S000003668 ORF Uncharacterized YJL132W chromosome 10 10 161914 164166 W 2011-02-03 1996-07-31 Putative protein of unknown function; localizes to the membrane fraction; possible Zap1p-regulated target gene induced by zinc deficiency; YJL132W is a non-essential gene +S000033018 CDS YJL132W 10 161914 164166 W 2011-02-03 1996-07-31 +S000003667 ORF Verified YJL131C AIM23 chromosome 10 10 165348 164278 C 2011-02-03 1996-07-31 Mitochondrial translation initiation factor 3 (IF3, mIF3); evolutionarily conserved; binds to E. coli ribosomes in vitro; null mutant displays severe respiratory growth defect and elevated frequency of mitochondrial genome loss +S000032877 CDS YJL131C 10 165348 164278 C 2011-02-03 1996-07-31 +S000003666 ORF Verified YJL130C URA2 bifunctional carbamoylphosphate synthetase/aspartate transcarbamylase chromosome 10 L000002431 10 172367 165723 C -89 2011-02-03 1996-07-31|2011-02-03 Bifunctional carbamoylphosphate synthetase/aspartate transcarbamylase; catalyzes the first two enzymatic steps in the de novo biosynthesis of pyrimidines; both activities are subject to feedback inhibition by UTP +S000031969 CDS YJL130C 10 172367 165723 C 2011-02-03 1996-07-31|2011-02-03 +S000122104 five_prime_UTR_intron YJL130C 10 172752 172433 C 2011-02-03 2007-04-04 +S000003665 ORF Verified YJL129C TRK1 chromosome 10 L000002334 10 177306 173599 C 2011-02-03 1996-07-31 Component of the Trk1p-Trk2p potassium transport system; 180 kDa high affinity potassium transporter; phosphorylated in vivo and interacts physically with the phosphatase Ppz1p, suggesting Trk1p acitivy is regulated by phosphorylation; TRK1 has a paralog, TRK2, that arose from the whole genome duplication +S000032672 CDS YJL129C 10 177306 173599 C 2011-02-03 1996-07-31 +S000003664 ORF Verified YJL128C PBS2 mitogen-activated protein kinase kinase PBS2|SSK4|SFS4|HOG4 chromosome 10 L000001346|L000001874 10 180103 178097 C -85 2011-02-03 1996-07-31|2011-02-03 MAP kinase kinase of the HOG signaling pathway; activated under severe osmotic stress; mitophagy-specific regulator; plays a role in regulating Ty1 transposition +S000031693 CDS YJL128C 10 180103 178097 C 2011-02-03 1996-07-31|2011-02-03 +S000007612 ORF Dubious YJL127W-A YJL127W-B chromosome 10 10 180194 180310 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037189 CDS YJL127W-A 10 180194 180310 W 2011-02-03 2001-02-26 +S000028522 ORF Uncharacterized YJL127C-B YJL127C-A chromosome 10 10 181709 181551 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified based on homology to the filamentous fungus, Ashbya gossypii; SWAT-GFP and seamless-GFP fusion proteins localize to the mitochondria +S000030318 CDS YJL127C-B 10 181709 181551 C 2011-02-03 2003-07-29 +S000003663 ORF Verified YJL127C SPT10 SUD1|CRE1 chromosome 10 L000002035 10 184220 182298 C -87 2011-02-03 1996-07-31 Histone H3 acetylase with a role in transcriptional regulation; sequence-specific activator of histone genes, binds specifically and cooperatively to pairs of UAS elements in core histone promoters, functions at or near TATA box; involved in S phase-specific acetylation of H3K56 at histone promoters, which is required for recruitment of SWI/SNF nucleosome remodeling complex and subsequent transcription +S000031537 CDS YJL127C 10 184220 182298 C 2011-02-03 1996-07-31 +S000003662 ORF Verified YJL126W NIT2 putative hydrolase chromosome 10 L000004212 10 184501 185424 W 2011-02-03 1996-07-31 Nit protein; one of two proteins in S. cerevisiae with similarity to the Nit domain of NitFhit from fly and worm and to the mouse and human Nit protein which interacts with the Fhit tumor suppressor; nitrilase superfamily member +S000031498 CDS YJL126W 10 184501 185424 W 2011-02-03 1996-07-31 +S000003661 ORF Verified YJL125C GCD14 tRNA 1-methyladenosine methyltransferase subunit GCD14|TRM61 chromosome 10 L000002902 10 186679 185528 C 2011-02-03 1996-07-31 Subunit of tRNA (1-methyladenosine) methyltransferase; required, along with Gcd10p, for the modification of the adenine at position 58 in tRNAs, especially tRNAi-Met; first identified as a negative regulator of GCN4 expression +S000030509 CDS YJL125C 10 186679 185528 C 2011-02-03 1996-07-31 +S000003660 ORF Verified YJL124C LSM1 SPB8 chromosome 10 L000004427 10 187644 187126 C 2011-02-03 1996-07-31 Lsm (Like Sm) protein; forms heteroheptameric complex (with Lsm2p, Lsm3p, Lsm4p, Lsm5p, Lsm6p, and Lsm7p) involved in degradation of cytoplasmic mRNAs; also enters the nucleus and positively regulates transcription initiation; unlike most Sm-like proteins, Lsm1p requires both its SM-domain and C-terminal domain for RNA-binding; binds to mRNAs under glucose starvation, most often in the 3' UTR; forms cytoplasmic foci upon DNA replication stress +S000030388 CDS YJL124C 10 187644 187126 C 2011-02-03 1996-07-31 +S000003659 ORF Verified YJL123C MTC1 chromosome 10 10 189440 188004 C 2011-02-03 1996-07-31 Protein of unknown function that may interact with ribosomes; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to COPI-coated vesicles (early Golgi); mtc1 is synthetically lethal with cdc13-1 +S000030206 CDS YJL123C 10 189440 188004 C 2011-02-03 1996-07-31 +S000003658 ORF Verified YJL122W ALB1 chromosome 10 10 189716 190243 W 2011-02-03 1996-07-31 Shuttling pre-60S factor; involved in the biogenesis of ribosomal large subunit; interacts directly with Arx1p; responsible for Tif6p recycling defects in absence of Rei1p +S000037544 CDS YJL122W 10 189716 190243 W 2011-02-03 1996-07-31 +S000003656 ORF Dubious YJL120W chromosome 10 10 191022 191345 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YJL121C/RPE1; deletion confers sensitivity to GSAO +S000037326 CDS YJL120W 10 191022 191345 W 2011-02-03 1996-07-31 +S000003657 ORF Verified YJL121C RPE1 ribulose-phosphate 3-epimerase RPE1|POS18|EPI1 chromosome 10 L000004023|L000002588 10 191090 190374 C 2011-02-03 1996-07-31 D-ribulose-5-phosphate 3-epimerase; catalyzes a reaction in the non-oxidative part of the pentose-phosphate pathway; mutants are sensitive to oxidative stress +S000037363 CDS YJL121C 10 191090 190374 C 2011-02-03 1996-07-31 +S000003654 ORF Verified YJL118W chromosome 10 10 191639 192298 W 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; YJL118W is a non-essential gene; deletion enhances the toxicity of heterologously expressed human alpha-synuclein +S000035604 CDS YJL118W 10 191639 192298 W 2011-02-03 1996-07-31 +S000003655 ORF Dubious YJL119C chromosome 10 10 191895 191572 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035622 CDS YJL119C 10 191895 191572 C 2011-02-03 1996-07-31 +S000003653 ORF Verified YJL117W PHO86 chromosome 10 L000002945 10 192531 193466 W 2011-02-03 1996-07-31 Endoplasmic reticulum (ER) resident protein; required for ER exit of the high-affinity phosphate transporter Pho84p, specifically required for packaging of Pho84p into COPII vesicles; protein abundance increases in response to DNA replication stress +S000035509 CDS YJL117W 10 192531 193466 W 2011-02-03 1996-07-31 +S000003652 ORF Verified YJL116C NCA3 SUN family protein NCA3 chromosome 10 L000002936 10 194873 193860 C 2011-02-03 1996-07-31 Protein involved in mitochondrion organization; functions with Nca2p to regulate mitochondrial expression of subunits 6 (Atp6p) and 8 (Atp8p) of the Fo-F1 ATP synthase; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the vacuole; member of the SUN family; expression induced in cells treated with the mycotoxin patulin; NCA3 has a paralog, UTH1, that arose from the whole genome duplication +S000034420 CDS YJL116C 10 194873 193860 C 2011-02-03 1996-07-31 +S000003651 ORF Verified YJL115W ASF1 nucleosome assembly factor ASF1|CIA1 chromosome 10 L000000126 10 196287 197126 W -80.06 2011-02-03 1996-07-31 Nucleosome assembly factor; involved in chromatin assembly, disassembly; required for recovery after DSB repair; role in H3K56 acetylation required for expression homeostasis, buffering mRNA synthesis rate against gene dosage changes in S phase; anti-silencing protein, derepresses silent loci when overexpressed; role in regulating Ty1 transposition; relocalizes to cytosol under hypoxia; growth defect of asf1 null is functionally complemented by either human ASF1A or ASF1B +S000034387 CDS YJL115W 10 196287 197126 W 2011-02-03 1996-07-31 +S000006514 tRNA_gene tA(AGC)J chromosome 10 L000003626 10 197385 197313 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032283 noncoding_exon tA(AGC)J 10 197385 197313 C 2011-02-03 2000-05-19 +S000007035 long_terminal_repeat YJLWsigma1 chromosome 10 10 197401 197494 W 2011-02-03 2000-05-19 Ty3 LTR +S000007036 long_terminal_repeat YJLWtau1 chromosome 10 10 197545 197915 W 2011-02-03 2000-05-19 Ty4 LTR +S000007039 LTR_retrotransposon YJLWTy4-1 Ty4 chromosome 10 10 197545 203768 W 2011-02-03 2000-05-19|2011-02-03 Ty4 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000003650 transposable_element_gene YJL114W gag protein chromosome 10 10 197915 198595 W 2011-02-03 1996-07-31|2011-02-03 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034265 CDS YJL114W 10 197915 198595 W 2011-02-03 1996-07-31|2011-02-03 +S000003649 transposable_element_gene YJL113W gag-pol fusion protein chromosome 10 10 198678 203325 W 2011-02-03 1996-07-31|2011-02-03 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034131 CDS YJL113W 10 198678 198998 W 2011-02-03 1996-07-31|2011-02-03 +S000034132 CDS YJL113W 10 199000 203325 W 2011-02-03 1996-07-31 +S000034133 plus_1_translational_frameshift YJL113W 10 198999 198999 W 2011-02-03 1996-07-31 +S000007037 long_terminal_repeat YJLWtau2 chromosome 10 10 203398 203768 W 2011-02-03 2000-05-19 Ty4 LTR +S000028445 ARS ARS1008 chromosome 10 10 204029 204917 2011-02-03 2002-12-16|2011-02-03 Autonomously Replicating Sequence +S000178124 ARS_consensus_sequence ARS1008 10 204241 204225 C 2014-11-18 2014-11-18 +S000007022 long_terminal_repeat YJLCdelta3 chromosome 10 10 204114 203783 C 2011-02-03 2000-05-19 Ty1 LTR +S000006536 tRNA_gene tD(GUC)J1 chromosome 10 L000003605 10 204735 204806 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030769 noncoding_exon tD(GUC)J1 10 204735 204806 W 2011-02-03 2000-05-19 +S000003648 ORF Verified YJL112W MDV1 NET2|GAG3|FIS2 chromosome 10 10 205305 207449 W 2011-02-03 1996-07-31|2011-02-03 Peripheral protein of cytosolic face of mitochondrial outer membrane; required for mitochondrial fission; interacts with Fis1p and with the self-assembled oligomeric form of the dynamin-related GTPase Dnm1p; contains WD repeats; MDV1 has a paralog, CAF4, that arose from the whole genome duplication +S000033273 CDS YJL112W 10 205305 207449 W 2011-02-03 1996-07-31|2011-02-03 +S000003647 ORF Verified YJL111W CCT7 chaperonin-containing T-complex subunit CCT7|TCP7 chromosome 10 L000002763 10 207877 209529 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo; mutant has increased aneuploidy tolerance +S000033222 CDS YJL111W 10 207877 209529 W 2011-02-03 1996-07-31 +S000003646 ORF Verified YJL110C GZF3 NIL2|DEH1 chromosome 10 L000002858|L000003382 10 211577 209922 C 2011-02-03 1996-07-31 GATA zinc finger protein; negatively regulates nitrogen catabolic gene expression by competing with Gat1p for GATA site binding; function requires a repressive carbon source; dimerizes with Dal80p and binds to Tor1p; GZF3 has a paralog, DAL80, that arose from the whole genome duplication +S000033132 CDS YJL110C 10 211577 209922 C 2011-02-03 1996-07-31 +S000003645 ORF Verified YJL109C UTP10 snoRNA-binding rRNA-processing protein UTP10 chromosome 10 10 217309 212000 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA; mutant has increased aneuploidy tolerance +S000032396 CDS YJL109C 10 217309 212000 C 2011-02-03 1996-07-31 +S000003644 ORF Verified YJL108C PRM10 pheromone-regulated protein PRM10 chromosome 10 10 218856 217705 C 2011-02-03 1996-07-31 Pheromone-regulated protein; proposed to be involved in mating; predicted to have 5 transmembrane segments; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000032288 CDS YJL108C 10 218856 217705 C 2011-02-03 1996-07-31 +S000003643 ORF Uncharacterized YJL107C chromosome 10 10 220016 218853 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression is induced by activation of the HOG1 mitogen-activated signaling pathway and this induction is Hog1p/Pbs2p dependent; YJL107C and adjacent ORF, YJL108C are merged in related fungi +S000031290 CDS YJL107C 10 220016 218853 C 2011-02-03 1996-07-31 +S000003642 ORF Verified YJL106W IME2 protein kinase IME2|SME1 chromosome 10 L000000862 10 221390 223327 W 2011-02-03 1996-07-31 Serine/threonine protein kinase involved in activation of meiosis; associates with Ime1p and mediates its stability, activates Ndt80p; IME2 expression is positively regulated by Ime1p; human CDK2 can complement ime2 null mutant +S000031252 CDS YJL106W 10 221390 223327 W 2011-02-03 1996-07-31 +S000003641 ORF Verified YJL105W SET4 chromosome 10 10 225055 226737 W 2011-02-03 1996-07-31 Protein of unknown function, contains a SET domain; SET4 has a paralog, SET3, that arose from the whole genome duplication +S000031110 CDS YJL105W 10 225055 226737 W 2011-02-03 1996-07-31 +S000003640 ORF Verified YJL104W PAM16 import motor complex subunit PAM16|TIM16|MIA1 chromosome 10 10 227327 227776 W 2011-02-03 1996-07-31 Subunit of the import motor (PAM complex); the PAM complex is a component of the Translocase of the Inner Mitochondrial membrane (TIM23 complex); forms a 1:1 subcomplex with Pam18p and inhibits its cochaperone activity; contains a J-like domain +S000031000 CDS YJL104W 10 227327 227776 W 2011-02-03 1996-07-31 +S000006501 snoRNA_gene snR37 SNR37 chromosome 10 L000003502 10 228479 228094 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2944 +S000036767 noncoding_exon snR37 10 228479 228094 C 2011-02-03 2000-05-19 +S000028446 ARS ARS1009 chromosome 10 10 228552 229043 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000178125 ARS_consensus_sequence ARS1009 10 228575 228559 C 2014-11-18 2014-11-18 +S000003639 ORF Verified YJL103C GSM1 chromosome 10 10 230881 229025 C 2011-02-03 1996-07-31 Putative zinc cluster protein of unknown function; proposed to be involved in the regulation of energy metabolism, based on patterns of expression and sequence analysis +S000029933 CDS YJL103C 10 230881 229025 C 2011-02-03 1996-07-31 +S000003638 ORF Verified YJL102W MEF2 chromosome 10 L000001058 10 231301 233760 W 2011-02-03 1996-07-31 Mitochondrial elongation factor involved in translational elongation +S000029898 CDS YJL102W 10 231301 233760 W 2011-02-03 1996-07-31 +S000006702 tRNA_gene tR(ACG)J chromosome 10 L000003606 10 233939 234011 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030405 noncoding_exon tR(ACG)J 10 233939 234011 W 2011-02-03 2000-05-19 +S000003637 ORF Verified YJL101C GSH1 glutamate--cysteine ligase chromosome 10 L000000735 10 236356 234320 C 2011-02-03 1996-07-31 Gamma glutamylcysteine synthetase; catalyzes the first step in glutathione (GSH) biosynthesis; expression induced by oxidants, cadmium, and mercury; protein abundance increases in response to DNA replication stress +S000037157 CDS YJL101C 10 236356 234320 C 2011-02-03 1996-07-31 +S000003636 ORF Verified YJL100W LSB6 1-phosphatidylinositol 4-kinase LSB6 chromosome 10 10 237263 239086 W 2011-02-03 1996-07-31 Type II phosphatidylinositol 4-kinase; binds Las17p, a homolog of human Wiskott-Aldrich Syndrome protein involved in actin patch assembly and actin polymerization +S000037110 CDS YJL100W 10 237263 239086 W 2011-02-03 1996-07-31 +S000003635 ORF Verified YJL099W CHS6 CSD3 chromosome 10 L000000334 10 239414 241654 W 2011-02-03 1996-07-31 Member of the ChAPs (Chs5p-Arf1p-binding proteins) family; part of the exomer complex that mediates export of specific cargo proteins, including Chs3p, from the Golgi to the plasma membrane; primary component of the Chs5/6 complex that binds directly to membranes; CHS6 has a paralog, BCH2, that arose from the whole genome duplication +S000031796 CDS YJL099W 10 239414 241654 W 2011-02-03 1996-07-31 +S000003634 ORF Verified YJL098W SAP185 chromosome 10 L000003246 10 242082 245258 W 2011-02-03 1996-07-31 Protein that forms a complex with the Sit4p protein phosphatase; required for Sit4p function; member of a family of similar proteins including Sap4p, Sap155p, and Sap190p; SAP185 has a paralog, SAP190, that arose from the whole genome duplication +S000031694 CDS YJL098W 10 242082 245258 W 2011-02-03 1996-07-31 +S000003633 ORF Verified YJL097W PHS1 enoyl-CoA hydratase PHS1 chromosome 10 10 245591 246244 W 2011-02-03 1996-07-31 Essential 3-hydroxyacyl-CoA dehydratase of the ER membrane; involved in elongation of very long-chain fatty acids; evolutionarily conserved, similar to mammalian PTPLA and PTPLB; involved in sphingolipid biosynthesis and protein trafficking +S000031576 CDS YJL097W 10 245591 246244 W 2011-02-03 1996-07-31 +S000003632 ORF Verified YJL096W MRPL49 mitochondrial 54S ribosomal protein YmL49|YmL49 chromosome 10 10 246490 246975 W 2011-02-03 2003-09-22|1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000030716 CDS YJL096W 10 246490 246975 W 2011-02-03 2003-09-22|1996-07-31 +S000077074 matrix_attachment_site ETC3 ETC3 chromosome 10 10 247060 247082 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; located between MRPL49 and BCK1 +S000003631 ORF Verified YJL095W BCK1 mitogen-activated protein kinase kinase kinase BCK1|SSP31|SLK1|SAP3|LAS3 chromosome 10 L000000162 10 247255 251691 W -64 2011-02-03 1996-07-31 MAPKKK acting in the protein kinase C signaling pathway; the kinase C signaling pathway controls cell integrity; upon activation by Pkc1p phosphorylates downstream kinases Mkk1p and Mkk2p; MAPKKK is an acronym for mitogen-activated protein (MAP) kinase kinase kinase +S000030629 CDS YJL095W 10 247255 251691 W 2011-02-03 1996-07-31 +S000003630 ORF Verified YJL094C KHA1 chromosome 10 10 254442 251821 C 2011-02-03 1996-07-31 Putative K+/H+ antiporter; has a probable role in intracellular cation homeostasis; localized to Golgi vesicles and detected in highly purified mitochondria in high-throughput studies +S000030439 CDS YJL094C 10 254442 251821 C 2011-02-03 1996-07-31 +S000003629 ORF Verified YJL093C TOK1 YPK1|YORK|YKC1|DUK1 chromosome 10 L000003009 10 256812 254737 C 2011-02-03 1996-07-31 Outward-rectifier potassium channel of the plasma membrane; has two pore domains in tandem, each of which forms a functional channel permeable to potassium; carboxy tail functions to prevent inner gate closures; target of K1 toxin +S000037648 CDS YJL093C 10 256812 254737 C 2011-02-03 1996-07-31 +S000003628 ORF Verified YJL092W SRS2 DNA helicase SRS2|HPR5|RADH1|RADH chromosome 10 L000000809|L000001578 10 257423 260947 W -61 2011-02-03 1996-07-31 DNA helicase and DNA-dependent ATPase; involved in DNA repair and checkpoint recovery, needed for proper timing of commitment to meiotic recombination and transition from Meiosis I to II; blocks trinucleotide repeat expansion; affects genome stability; disassembles Rad51p nucleoprotein filaments during meiotic recombination; stimulates activity of the Mus81p-Mms4p endonuclease, independently of Srs2p catalytic activity; functional homolog of human RTEL1 +S000037603 CDS YJL092W 10 257423 260947 W 2011-02-03 1996-07-31 +S000003627 ORF Verified YJL091C GWT1 glucosaminyl-phosphotidylinositol O-acyltransferase chromosome 10 10 262552 261080 C 2011-02-03 2003-09-22|1996-07-31 Protein involved in the inositol acylation of GlcN-PI; the inositol acylation of glucosaminyl phosphatidylinositol (GlcN-PI) forms glucosaminyl(acyl)phosphatidylinositol (GlcN(acyl)PI), an intermediate in the biosynthesis of glycosylphosphatidylinositol (GPI) anchors +S000037407 CDS YJL091C 10 262552 261080 C 2011-02-03 2003-09-22|1996-07-31 +S000003626 ORF Verified YJL090C DPB11 protein kinase activating protein DPB11 chromosome 10 L000003001 10 265051 262757 C 2011-02-03 1996-07-31 DNA replication initiation protein; loads DNA pol epsilon onto pre-replication complexes at origins; checkpoint sensor recruited to stalled replication forks by the checkpoint clamp complex where it activates Mec1p; along with Rfa1p, binds to ultrafine anaphase bridges in mitotic cells and prevents accumulation of chromatin bridges by stimulating the Mec1p kinase and suppressing homologous recombination; ortholog of human TopBP1; forms nuclear foci upon DNA replication stress +S000036680 CDS YJL090C 10 265051 262757 C 2011-02-03 1996-07-31 +S000003625 ORF Verified YJL089W SIP4 chromosome 10 L000001893 10 265926 268415 W 2011-02-03 1996-07-31 C6 zinc cluster transcriptional activator; binds to the carbon source-responsive element (CSRE) of gluconeogenic genes; involved in the positive regulation of gluconeogenesis; regulated by Snf1p protein kinase; localized to the nucleus +S000036795 CDS YJL089W 10 265926 268415 W 2011-02-03 1996-07-31 +S000003624 ORF Verified YJL088W ARG3 ornithine carbamoyltransferase|argF chromosome 10 L000000108 10 268799 269815 W -61 2011-02-03 1999-02-28|1996-07-31 Ornithine carbamoyltransferase; also known as carbamoylphosphate:L-ornithine carbamoyltransferase; catalyzes the biosynthesis of the arginine precursor citrulline +S000036728 CDS YJL088W 10 268799 269815 W 2011-02-03 1999-02-28|1996-07-31 +S000003623 ORF Verified YJL087C TRL1 tRNA ligase|RLG1|LIG1 chromosome 10 L000002336 10 272485 270002 C 2011-02-03 1996-07-31 tRNA ligase; required for tRNA splicing and for both splicing and translation of HAC1 mRNA in the UPR; has phosphodiesterase, polynucleotide kinase, and ligase activities; localized at the inner nuclear envelope and partially to polysomes +S000036631 CDS YJL087C 10 272485 270002 C 2011-02-03 1996-07-31 +S000003621 ORF Verified YJL085W EXO70 GTP-Rho binding exocyst subunit EXO70 chromosome 10 L000003349 10 272827 274698 W 2011-02-03 1996-07-31 Subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis prior to SNARE-mediated fusion; PtdIns[4,5]P2-binding protein that localizes to exocytic sites in an actin-independent manner, targeting and anchoring the exocyst with Sec3p; involved in exocyst assembly; direct downstream effector of Rho3p and Cdc42p; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000035634 CDS YJL085W 10 272827 274698 W 2011-02-03 1996-07-31 +S000003622 ORF Dubious YJL086C chromosome 10 10 272846 272478 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified genes YJL085W/EXO70 and YJL087C/TRL1 +S000035697 CDS YJL086C 10 272846 272478 C 2011-02-03 1996-07-31 +S000003620 ORF Verified YJL084C ALY2 ART3 chromosome 10 10 278002 274862 C 2011-02-03 1997-07-27|1996-07-31 Alpha arrestin; controls nutrient-mediated intracellular sorting of permease Gap1p; interacts with AP-1 subunit Apl4p; phosphorylated by Npr1p and also by cyclin-CDK complex Pcl7p-Pho85p; promotes endocytosis of plasma membrane proteins; ALY2 has a paralog, ALY1, that arose from the whole genome duplication +S000035516 CDS YJL084C 10 278002 274862 C 2011-02-03 1997-07-27|1996-07-31 +S000003619 ORF Verified YJL083W TAX4 chromosome 10 10 278841 280655 W 2011-02-03 1996-07-31 EH domain-containing protein; involved in regulating phosphatidylinositol 4,5-bisphosphate levels and autophagy; Irs4p and Tax4p bind and activate the PtdIns phosphatase Inp51p; Irs4p and Tax4p are involved in localizing Atg17p to the PAS; TAX4 has a paralog, IRS4, that arose from the whole genome duplication +S000034560 CDS YJL083W 10 278841 280655 W 2011-02-03 1996-07-31 +S000003618 ORF Verified YJL082W IML2 chromosome 10 10 281185 283380 W 2011-02-03 1996-07-31 Protein required for clearance of inclusion bodies; localizes to the inclusion bodies formed under protein misfolding stress; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress; IML2 has a paralog, YKR018C, that arose from the whole genome duplication +S000034438 CDS YJL082W 10 281185 283380 W 2011-02-03 1996-07-31 +S000003617 ORF Verified YJL081C ARP4 ACT3 chromosome 10 L000000027 10 285271 283802 C 2011-02-03 1996-07-31 Nuclear actin-related protein involved in chromatin remodeling; component of chromatin-remodeling enzyme complexes +S000034308 CDS YJL081C 10 285271 283802 C 2011-02-03 1996-07-31 +S000003616 ORF Verified YJL080C SCP160 chromosome 10 L000001817 10 289226 285558 C 2011-02-03 1996-07-31 Essential RNA-binding G protein effector of mating response pathway; ligand-activated RNA-binding protein that delivers RNAs involved in polarization and perpetualizing mating signal to shmoo tip during pheromone signaling; Scp160p-mediated RNA trafficking essential for chemotropism and successful mating; mainly associated with nuclear envelope and ER, interacts in mRNA-dependent manner with translating ribosomes via multiple KH domains, similar to vertebrate vigilins +S000033394 CDS YJL080C 10 289226 285558 C 2011-02-03 1996-07-31 +S000003615 ORF Verified YJL079C PRY1 sterol-binding protein chromosome 10 L000003216 10 290774 289875 C 2011-02-03 1996-07-31 Sterol binding protein involved in the export of acetylated sterols; secreted glycoprotein and member of the CAP protein superfamily (cysteine-rich secretory proteins (CRISP), antigen 5, and pathogenesis related 1 proteins); sterol export function is redundant with that of PRY2; may be involved in detoxification of hydrophobic compounds; PRY1 has a paralog, PRY2, that arose from the whole genome duplication +S000033334 CDS YJL079C 10 290774 289875 C 2011-02-03 1996-07-31 +S000003614 ORF Verified YJL078C PRY3 chromosome 10 L000003218 10 293981 291336 C 2011-02-03 1996-07-31 Cell wall-associated protein involved in export of acetylated sterols; member of the CAP protein superfamily (cysteine-rich secretory proteins (CRISP), antigen 5, and pathogenesis related 1 proteins); role in mating efficiency; expression of full-length transcript is daughter cell-specific; in response to alpha factor, a short transcript starting at +452 is expressed and the long form is repressed by Ste12p +S000032582 CDS YJL078C 10 293981 291336 C 2011-02-03 1996-07-31 +S000028662 ORF Uncharacterized YJL077W-B chromosome 10 10 294047 294145 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032487 CDS YJL077W-B 10 294047 294145 W 2011-02-03 2003-07-29 +S000028661 ORF Uncharacterized YJL077W-A chromosome 10 10 294799 294885 W 2011-02-03 2003-07-29 Protein of unknown function; mRNA identified as translated by ribosome profiling data; completely overlaps the verified gene YJL077C/ICS3 +S000032486 CDS YJL077W-A 10 294799 294885 W 2011-02-03 2003-07-29 +S000003613 ORF Verified YJL077C ICS3 chromosome 10 10 295061 294666 C 2011-02-03 1996-07-31 Protein with a role in copper homeostasis; possible role in vacuolar sorting and processing of secretory proteins; null mutants are hypersensitive to sortin2 +S000032502 CDS YJL077C 10 295061 294666 C 2011-02-03 1996-07-31 +S000003612 ORF Verified YJL076W NET1 SRM8|CFI1|ESC5 chromosome 10 L000004425 10 295245 298814 W 2011-02-03 1996-07-31 Core subunit of the RENT complex; involved in nucleolar silencing and telophase exit; stimulates transcription by RNA polymerase I and regulates nucleolar structure; NET1 has a paralog, TOF2, that arose from the whole genome duplication +S000032450 CDS YJL076W 10 295245 298814 W 2011-02-03 1996-07-31 +S000003611 ORF Dubious YJL075C APQ13 chromosome 10 10 298876 298460 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 85% of ORF overlaps the verified gene NET1; null mutant is sensitive to sorbate +S000031391 CDS YJL075C 10 298876 298460 C 2011-02-03 1996-07-31 +S000028447 ARS ARS1010 chromosome 10 10 298981 299245 2014-11-18 2002-12-16|2014-11-18 Autonomously Replicating Sequence +S000003610 ORF Verified YJL074C SMC3 cohesin subunit SMC3 chromosome 10 L000003992 10 302849 299157 C 2011-02-03 1996-07-31 Subunit of the multiprotein cohesin complex; required for sister chromatid cohesion in mitotic cells; also required, with Rec8p, for cohesion and recombination during meiosis; phylogenetically conserved SMC chromosomal ATPase family member +S000031287 CDS YJL074C 10 302849 299157 C 2011-02-03 1996-07-31 +S000003609 ORF Verified YJL073W JEM1 KAR8 chromosome 10 L000003533 10 303181 305118 W 2011-02-03 1997-10-20|1996-07-31 DnaJ-like chaperone required for nuclear membrane fusion during mating; localizes to the ER membrane; exhibits genetic interactions with KAR2 +S000031229 CDS YJL073W 10 303181 305118 W 2011-02-03 1997-10-20|1996-07-31 +S000003608 ORF Verified YJL072C PSF2 DNA replication protein PSF2|CDC102 chromosome 10 10 305862 305221 C 2011-02-03 1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery +S000030195 CDS YJL072C 10 305862 305221 C 2011-02-03 1996-07-31 +S000003607 ORF Verified YJL071W ARG2 acetyl-CoA:L-glutamate N-acetyltransferase|HRB574 chromosome 10 L000003263 10 306132 307856 W 2011-02-03 1996-07-31 Acetylglutamate synthase (glutamate N-acetyltransferase); mitochondrial enzyme that catalyzes the first step in the biosynthesis of the arginine precursor ornithine; forms a complex with Arg5,6p +S000030084 CDS YJL071W 10 306132 307856 W 2011-02-03 1996-07-31 +S000003606 ORF Uncharacterized YJL070C metallo-dependent hydrolase superfamily protein chromosome 10 10 310637 307971 C 2011-02-03 1996-07-31 Putative metallo-dependent hydrolase superfamily protein; similar to AMP deaminases but lacks key catalytic residues and does not rescue purine nucleotide metabolic defect of quadruple aah1 ade8 amd1 his1 mutant; may regulate purine nucleotide homeostasis as overexpression in an AMD1 strain grown in adenine results in greatly reduced GDP and GTP intracellular levels; not an essential gene; YJL070C has a paralog, YBR284W, that arose from the whole genome duplication +S000029919 CDS YJL070C 10 310637 307971 C 2011-02-03 1996-07-31 +S000003605 ORF Verified YJL069C UTP18 chromosome 10 10 312706 310922 C 2011-02-03 1996-07-31 Small-subunit processome protein involved in pre-18S rRNA maturation; part of a subunit of the 90S preribosomal particle capable of interacting directly with the 5' ETS of the 35S pre-rRNA; contains WD40 repeats +S000036438 CDS YJL069C 10 312706 310922 C 2011-02-03 1996-07-31 +S000003604 ORF Verified YJL068C S-formylglutathione hydrolase|SFGH chromosome 10 10 313915 313016 C 2011-02-03 1996-07-31 Esterase that can function as an S-formylglutathione hydrolase; non-essential intracellular esterase; may be involved in the detoxification of formaldehyde, which can be metabolized to S-formylglutathione; similar to human esterase D +S000036339 CDS YJL068C 10 313915 313016 C 2011-02-03 1996-07-31 +S000003603 ORF Dubious YJL067W chromosome 10 10 314084 314434 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036295 CDS YJL067W 10 314084 314434 W 2011-02-03 1996-07-31 +S000003602 ORF Verified YJL066C MPM1 chromosome 10 10 314872 314114 C 2011-02-03 1996-07-31 Mitochondrial intermembrane space protein of unknown function +S000035314 CDS YJL066C 10 314872 314114 C 2011-02-03 1996-07-31 +S000003600 ORF Dubious YJL064W chromosome 10 10 315175 315570 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL065C/DLS1 +S000035084 CDS YJL064W 10 315175 315570 W 2011-02-03 1996-07-31 +S000003601 ORF Verified YJL065C DLS1 chromosome 10 10 315557 315054 C 2011-02-03 1996-07-31 Subunit of ISW2/yCHRAC chromatin accessibility complex; ISW2/yCHRAC also includes Itc1p, Isw2p, and Dpb4p; involved in inheritance of telomeric silencing; DLS1 has a paralog, DPB3, that arose from the whole genome duplication +S000035150 CDS YJL065C 10 315557 315054 C 2011-02-03 1996-07-31 +S000003599 ORF Verified YJL063C MRPL8 mitochondrial 54S ribosomal protein YmL8|YmL8|HRD238 chromosome 10 L000001162|L000002524 10 316475 315759 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000034082 CDS YJL063C 10 316475 315759 C 2011-02-03 1996-07-31 +S000007611 ORF Verified YJL062W-A COA3 COX25|RRG10 chromosome 10 10 316723 316980 W 2011-02-03 2001-02-26 Mitochondrial protein required for cytochrome c oxidase assembly; also involved in translational regulation of Cox1p and prevention of Cox1p aggregation before assembly; located in the mitochondrial inner membrane +S000037188 CDS YJL062W-A 10 316723 316980 W 2011-02-03 2001-02-26 +S000003598 ORF Verified YJL062W LAS21 mannose-ethanolamine phosphotransferase LAS21|GPI7 chromosome 10 L000004283|L000004818 10 317284 319776 W 2011-02-03 1996-07-31 Integral plasma membrane protein; involved in the synthesis of the glycosylphosphatidylinositol (GPI) core structure; mutations affect cell wall integrity +S000034026 CDS YJL062W 10 317284 319776 W 2011-02-03 1996-07-31 +S000003597 ORF Verified YJL061W NUP82 linker nucleoporin NUP82|HRB187 chromosome 10 L000002941 10 320016 322157 W 2011-02-03 1996-07-31 Linker nucleoporin component of the nuclear pore complex (NPC); also part of the NPC cytoplasmic filaments; contributes to nucleocytoplasmic transport and NPC biogenesis; forms stable associations with three FG-nucleoporins (Nsp1p, Nup159p, and Nup116p); relocalizes to the cytosol in response to hypoxia +S000033873 CDS YJL061W 10 320016 322157 W 2011-02-03 1996-07-31 +S000003596 ORF Verified YJL060W BNA3 kynurenine--oxoglutarate transaminase chromosome 10 10 323386 324720 W 2011-02-03 1996-07-31 Kynurenine aminotransferase; catalyzes formation of kynurenic acid from kynurenine; potential Cdc28p substrate +S000033737 CDS YJL060W 10 323386 324720 W 2011-02-03 1996-07-31 +S000003595 ORF Verified YJL059W YHC3 amino acid transporter YHC3|BTN1 chromosome 10 L000003332|L000003284 10 324964 326190 W 2011-02-03 1996-07-31 Protein required for the ATP-dependent transport of arginine; vacuolar membrane protein; involved in the ATP-dependent transport of arginine into the vacuole and possibly in balancing ion homeostasis; human homolog CLN3 involved in Batten disease (juvenile onset neuronal ceroid lipofuscinosis) can complement yeast null mutant +S000034862 CDS YJL059W 10 324964 326190 W 2011-02-03 1996-07-31 +S000003594 ORF Verified YJL058C BIT61 chromosome 10 10 327873 326242 C 2011-02-03 1996-07-31 Subunit of TORC2 membrane-associated complex; involved in regulation of cell cycle-dependent actin cytoskeletal dynamics during polarized growth and cell wall integrity; BIT61 has a paralog, BIT2, that arose from the whole genome duplication +S000032844 CDS YJL058C 10 327873 326242 C 2011-02-03 1996-07-31 +S000003593 ORF Verified YJL057C IKS1 protein kinase IKS1 chromosome 10 L000004209 10 330121 328118 C 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; putative serine/threonine kinase; expression is induced during mild heat stress; deletion mutants are hypersensitive to copper sulphate and resistant to sorbate; interacts with an N-terminal fragment of Sst2p +S000032730 CDS YJL057C 10 330121 328118 C 2011-02-03 1996-07-31 +S000003592 ORF Verified YJL056C ZAP1 ZRG10 chromosome 10 L000003321 10 333073 330431 C 2011-02-03 1996-07-31 Zinc-regulated transcription factor; binds to zinc-responsive promoters to induce transcription of certain genes in presence of zinc, represses other genes in low zinc; regulates its own transcription; contains seven zinc-finger domains +S000032670 CDS YJL056C 10 333073 330431 C 2011-02-03 1996-07-31 +S000003591 ORF Uncharacterized YJL055W chromosome 10 10 333357 334094 W 2011-02-03 1996-07-31 Putative protein of unknown function; functions together with HAM1 to mediate resistance to 5-FU; specifically reduces the incorporation of 5-FU into RNA, without affecting uptake or incorporation of uracil into RNA; proposed to be involved in the metabolism of purine and pyrimidine base analogues; deletion mutants are sensitive to HAP and AHA +S000032627 CDS YJL055W 10 333357 334094 W 2011-02-03 1996-07-31 +S000003590 ORF Verified YJL054W TIM54 chromosome 10 L000004342 10 334265 335701 W 2011-02-03 1996-07-31 Component of the mitochondrial TIM22 complex; involved in insertion of polytopic proteins into the inner membrane +S000031626 CDS YJL054W 10 334265 335701 W 2011-02-03 1996-07-31 +S000003589 ORF Verified YJL053W PEP8 retromer subunit PEP8|VPT4|VPS26|GRD6 chromosome 10 L000001378 10 335898 337037 W 2011-02-03 1996-07-31 Vacuolar protein component of the retromer; forms part of the multimeric membrane-associated retromer complex involved in vacuolar protein sorting along with Vps35p, Vps29p, Vps17p, and Vps5p; essential for endosome-to-Golgi retrograde protein transport; interacts with Ypt7p; protein abundance increases in response to DNA replication stress +S000031497 CDS YJL053W 10 335898 337037 W 2011-02-03 1996-07-31 +S000028448 ARS ARS1011 ARSX-337 chromosome 10 10 337281 337529 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000007610 ORF Uncharacterized YJL052C-A chromosome 10 10 338003 337884 C 2011-02-03 2001-02-26 Putative protein of unknown function; identified based on comparison to related yeast species; mCherry fusion protein localizes to the vacuole +S000037187 CDS YJL052C-A 10 338003 337884 C 2011-02-03 2001-02-26 +S000003588 ORF Verified YJL052W TDH1 glyceraldehyde-3-phosphate dehydrogenase (phosphorylating) TDH1|GAPDH|GLD3 chromosome 10 L000002272 10 338271 339269 W 2011-02-03 1996-07-31 Glyceraldehyde-3-phosphate dehydrogenase (GAPDH), isozyme 1; involved in glycolysis and gluconeogenesis; tetramer that catalyzes the reaction of glyceraldehyde-3-phosphate to 1,3 bis-phosphoglycerate; detected in the cytoplasm and cell wall; protein abundance increases in response to DNA replication stress; GAPDH-derived antimicrobial peptides secreted by S. cerevisiae are active against a wide variety of wine-related yeasts and bateria +S000031373 CDS YJL052W 10 338271 339269 W 2011-02-03 1996-07-31 +S000003587 ORF Verified YJL051W IRC8 chromosome 10 10 339787 342255 W 2011-02-03 1996-07-31 Bud tip localized protein of unknown function; mRNA is targeted to the bud by a She2p dependent transport system; mRNA is cell cycle regulated via Fkh2p, peaking in G2/M phase; null mutant displays increased levels of spontaneous Rad52p foc +S000030449 CDS YJL051W 10 339787 342255 W 2011-02-03 1996-07-31 +S000003586 ORF Verified YJL050W MTR4 ATP-dependent RNA helicase MTR4|DOB1 chromosome 10 L000004110 10 342522 345743 W 2011-02-03 1996-07-31 ATP-dependent 3'-5' RNA helicase of the DExD/H family; involved in nuclear RNA processing and degradation both as a component of TRAMP complex and in TRAMP-independent processes; TRAMP unwinds RNA duplexes, with Mtr4p unwinding activity stimulated by Pap2p/Air2p but not dependent on ongoing polyadenylation; contains an arch domain, with two coiled-coil arms/stalks and a globular fist/KOW domain, which has RNA binding activity and is required for 5.8S rRNA processing +S000030313 CDS YJL050W 10 342522 345743 W 2011-02-03 1996-07-31 +S000003585 ORF Uncharacterized YJL049W CHM7 chromosome 10 10 345973 347325 W 2011-02-03 1996-07-31 Yeast homolog of human CHMP7, localizes to the endoplasmic reticulum presumably as part of an ESCRT-III like complex; null mutant has growth defect at 37 C in an apq12 deletion background; non-essential gene +S000036773 CDS YJL049W 10 345973 347325 W 2011-02-03 1996-07-31 +S000003584 ORF Verified YJL048C UBX6 CUI2 chromosome 10 10 348637 347447 C 2011-02-03 1996-07-31 UBX (ubiquitin regulatory X) domain-containing protein; interacts with Cdc48p, transcription is repressed when cells are grown in media containing inositol and choline; UBX6 has a paralog, UBX7, that arose from the whole genome duplication +S000036634 CDS YJL048C 10 348637 347447 C 2011-02-03 1996-07-31 +S000028804 ORF Uncharacterized YJL047C-A chromosome 10 10 349178 349044 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000033585 CDS YJL047C-A 10 349178 349044 C 2011-02-03 2003-07-29 +S000006451 snoRNA_gene snR60 SNR60 chromosome 10 L000004529 10 349233 349130 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions A817 and G908 +S000030821 noncoding_exon snR60 10 349233 349130 C 2011-02-03 2000-05-19 +S000003583 ORF Verified YJL047C RTT101 cullin RTT101|CULC|CUL8 chromosome 10 L000004737 10 352108 349580 C 2011-02-03 1996-07-31 Cullin subunit of a Roc1p-dependent E3 ubiquitin ligase complex; role in anaphase progression; required for recovery after DSB repair; implicated in Mms22-dependent DNA repair; involved with Mms1p in nonfunctional rRNA decay; modified by the ubiquitin-like protein, Rub1p +S000036565 CDS YJL047C 10 352108 349580 C 2011-02-03 1996-07-31 +S000003582 ORF Verified YJL046W AIM22 putative lipoate--protein ligase|RRG3|LIP3 chromosome 10 10 352386 353615 W 2011-02-03 1996-07-31|2005-12-01 Putative lipoate-protein ligase; required along with Lip2 and Lip5 for lipoylation of Lat1p and Kgd2p; similar to E. coli LplA; null mutant displays reduced frequency of mitochondrial genome loss +S000036505 CDS YJL046W 10 352386 353615 W 2011-02-03 1996-07-31|2005-12-01 +S000006781 tRNA_gene tY(GUA)J1 SUP7 chromosome 10 L000003607|L000002186 10 354244 354332 W -32 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000032080 intron tY(GUA)J1 10 354283 354296 W 2011-02-03 2000-05-19 +S000032078 noncoding_exon tY(GUA)J1 10 354244 354282 W 2011-02-03 2000-05-19 +S000032079 noncoding_exon tY(GUA)J1 10 354297 354332 W 2011-02-03 2000-05-19 +S000007024 long_terminal_repeat YJLCdelta5 chromosome 10 10 355175 354844 C 2011-02-03 2000-05-19 Ty1 LTR +S000007023 long_terminal_repeat YJLCdelta4 chromosome 10 10 355204 354538 C 2011-02-03 2000-05-19 Ty1 LTR +S000006714 tRNA_gene tR(UCU)J1 chromosome 10 L000003608 10 355374 355445 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030321 noncoding_exon tR(UCU)J1 10 355374 355445 W 2011-02-03 2000-05-19 +S000006537 tRNA_gene tD(GUC)J2 chromosome 10 L000003609 10 355456 355527 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030790 noncoding_exon tD(GUC)J2 10 355456 355527 W 2011-02-03 2000-05-19 +S000003581 ORF Verified YJL045W succinate dehydrogenase SDH1b|SDH1b chromosome 10 10 356024 357928 W 2011-02-03 1996-07-31 Minor succinate dehydrogenase isozyme; participates in oxidation of succinate and transfer of electrons to ubiquinone; induced during the diauxic shift in a Cat8p-dependent manner; YJL045W has a paralog, SDH1, that arose from the whole genome duplication +S000035600 CDS YJL045W 10 356024 357928 W 2011-02-03 1996-07-31 +S000003580 ORF Verified YJL044C GYP6 chromosome 10 L000000748 10 359676 358300 C 2011-02-03 1996-07-31 GTPase-activating protein (GAP) for yeast Rab family member Ypt6p; involved in vesicle mediated protein transport +S000035463 CDS YJL044C 10 359676 358300 C 2011-02-03 1996-07-31 +S000003579 ORF Uncharacterized YJL043W chromosome 10 10 360130 360903 W 2011-02-03 1996-07-31 Putative protein of unknown function; YJL043W is a non-essential gene +S000035409 CDS YJL043W 10 360130 360903 W 2011-02-03 1996-07-31 +S000003578 ORF Verified YJL042W MHP1 chromosome 10 L000002720 10 361249 365445 W 2011-02-03 1996-07-31 Microtubule-associated protein involved in microtubule organization; involved in assembly and stabilization of microtubules; overproduction results in cell cycle arrest at G2 phase; similar to Drosophila protein MAP and to mammalian MAP4 proteins +S000034384 CDS YJL042W 10 361249 365445 W 2011-02-03 1996-07-31 +S000003577 ORF Verified YJL041W NSP1 FG-nucleoporin NSP1 chromosome 10 L000001277 10 365784 368373 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; also part of the nuclear pore complex (NPC) nuclear basket; contributes directly to nucleocytoplasmic transport and maintenance of the NPC permeability barrier; found in stable complex with Nup82p, Gle2p and two other FG-nucleoporins (Nup159p and Nup116p); also found in stable complex with Nic96p and two other FG-nucleoproteins (Nup49p and Nup57p) +S000034258 CDS YJL041W 10 365784 365784 W 2011-02-03 1996-07-31 +S000034259 CDS YJL041W 10 365903 368373 W 2011-02-03 1996-07-31 +S000034260 intron YJL041W 10 365785 365902 W 2011-02-03 1996-07-31 +S000003576 ORF Verified YJL039C NUP192 chromosome 10 S000007465 10 373799 368748 C 2011-02-03 1996-07-31 Essential subunit of inner ring of nuclear pore complex (NPC); plays a role in modulating transport through the NPC; homologous to human NUP205 +S000034602 CDS YJL039C 10 373799 368748 C 2011-02-03 1996-07-31 +S000006538 tRNA_gene tD(GUC)J3 chromosome 10 L000003625 10 374495 374424 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030793 noncoding_exon tD(GUC)J3 10 374495 374424 C 2011-02-03 2000-05-19 +S000006715 tRNA_gene tR(UCU)J2 chromosome 10 L000003624 10 374577 374506 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030328 noncoding_exon tR(UCU)J2 10 374577 374506 C 2011-02-03 2000-05-19 +S000028449 ARS ARS1012 ARSX-375 chromosome 10 10 374880 375122 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000007025 long_terminal_repeat YJLCdelta6 chromosome 10 10 374935 374844 C 2011-02-03 2000-05-19 Ty1 LTR +S000028450 ARS ARS1013 chromosome 10 10 375706 376227 2011-02-03 2002-12-16 Autonomously Replicating Sequence; inefficient as chromosomal replication origin; replication capacity dependent upon Sum1p +S000003575 ORF Verified YJL038C LOH1 OSW4 chromosome 10 10 375774 375115 C 2011-02-03 1996-07-31 Protein involved in outer spore wall assembly; likely involved directly in dityrosine layer assembly; induced during sporulation; repressed during vegetative growth by Sum1p and Hst1p; sequence similar to adjacent ORF, IRC18/YJL037W, and the irc18 loh1 double mutant exhibits reduced dityrosine fluorescence relative to the single mutants; SWAT-GFP and mCherry fusion proteins localize to the cytosol; proposed role in maintenance of genome integrity +S000034497 CDS YJL038C 10 375774 375115 C 2011-02-03 1996-07-31 +S000003574 ORF Verified YJL037W IRC18 OSW6 chromosome 10 10 376662 377336 W 2011-02-03 1996-07-31 Protein involved in outer spore wall assembly; possible role in assembly of the dityrosine layer; similar to adjacent ORF, LOH1; irc18 loh1 double mutant exhibits reduced dityrosine fluorescence relative to single mutants; SWAT-GFP fusion protein localizes to the ER and vacuole, while mCherry fusion localizes to the vacuole; expression induced in respiratory-deficient cells and carbon-limited chemostat culture; null mutant displays increased levels of spontaneous Rad52p foci +S000034457 CDS YJL037W 10 376662 377336 W 2011-02-03 1996-07-31 +S000007026 long_terminal_repeat YJLCdelta7 chromosome 10 10 377870 377598 C 2011-02-03 2000-05-19 Ty1 LTR +S000006759 tRNA_gene tV(AAC)J chromosome 10 L000003610 10 378360 378433 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000032964 noncoding_exon tV(AAC)J 10 378360 378433 W 2011-02-03 2000-05-19 +S000003573 ORF Verified YJL036W SNX4 ATG24|CVT13 chromosome 10 S000007467|L000004764 10 378825 380096 W 2011-02-03 1996-07-31 Sorting nexin; involved in retrieval of late-Golgi SNAREs from post-Golgi endosomes to the trans-Golgi network and in cytoplasm to vacuole transport; contains a PX phosphoinositide-binding domain; forms complexes with Snx41p and with Atg20p +S000032435 CDS YJL036W 10 378825 380096 W 2011-02-03 1996-07-31 +S000003572 ORF Verified YJL035C TAD2 tRNA(adenine34) deaminase chromosome 10 S000007489 10 381001 380249 C 2011-02-03 1996-07-31 Subunit of tRNA-specific adenosine-34 deaminase; forms a heterodimer with Tad3p that converts adenosine to inosine at the wobble position of several tRNAs +S000032286 CDS YJL035C 10 381001 380249 C 2011-02-03 1996-07-31 +S000003571 ORF Verified YJL034W KAR2 Hsp70 family ATPase KAR2|BIP|GRP78 chromosome 10 L000000887 10 381327 383375 W 2011-02-03 1996-07-31 ATPase involved in protein import into the ER; also acts as a chaperone to mediate protein folding in the ER and may play a role in ER export of soluble proteins; regulates the unfolded protein response via interaction with Ire1p +S000032230 CDS YJL034W 10 381327 383375 W 2011-02-03 1996-07-31 +S000003570 ORF Verified YJL033W HCA4 RNA-dependent ATPase HCA4|ECM24|DBP4 chromosome 10 L000003421 10 383837 386149 W 2011-02-03 1996-07-31 DEAD box RNA helicase; component of the SSU; interacts with Bfr2p and Enp2p; high-copy number suppression of a U14 snoRNA processing mutant suggests an involvement in 18S rRNA synthesis +S000031248 CDS YJL033W 10 383837 386149 W 2011-02-03 1996-07-31 +S000003569 ORF Dubious YJL032W chromosome 10 10 386348 386662 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 3' end of essential BET4 gene encoding the alpha subunit of Type II geranylgeranyltransferase +S000031093 CDS YJL032W 10 386348 386662 W 2011-02-03 1996-07-31 +S000003568 ORF Verified YJL031C BET4 Rab geranylgeranyltransferase BET4 chromosome 10 L000000173 10 387438 386368 C 2011-02-03 2004-01-27|1996-07-31 Alpha subunit of Type II geranylgeranyltransferase; required for vesicular transport between the endoplasmic reticulum and the Golgi; provides a membrane attachment moiety to Rab-like proteins Ypt1p and Sec4p +S000030060 CDS YJL031C 10 387348 386368 C 2011-02-03 2004-01-27 +S000030059 CDS YJL031C 10 387438 387436 C 2011-02-03 2004-01-27|1996-07-31 +S000030061 intron YJL031C 10 387435 387349 C 2011-02-03 2004-01-27 +S000003567 ORF Verified YJL030W MAD2 spindle checkpoint protein MAD2 chromosome 10 L000000975 10 387657 388247 W 2011-02-03 1996-07-31 Component of the spindle-assembly checkpoint complex; delays onset of anaphase in cells with defects in mitotic spindle assembly; forms a complex with Mad1p; regulates APC/C activity during prometaphase and metaphase of meiosis I; gene dosage imbalance between MAD1 and MAD2 leads to chromosome instability +S000030009 CDS YJL030W 10 387657 388247 W 2011-02-03 1996-07-31 +S000003566 ORF Verified YJL029C VPS53 chromosome 10 10 390853 388385 C 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; required for vacuolar protein sorting; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p; human ortholog is implicated in progressive cerebello-cerebral atrophy type 2 (PCCA2) +S000030293 CDS YJL029C 10 390853 388385 C 2011-02-03 1996-07-31 +S000006661 tRNA_gene tM(CAU)J1 EMT5 chromosome 10 L000000555|L000003623 10 391115 391043 C 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis +S000029920 noncoding_exon tM(CAU)J1 10 391115 391043 C 2011-02-03 2000-05-19 +S000003565 ORF Verified YJL028W chromosome 10 10 391311 391646 W 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments +S000030214 CDS YJL028W 10 391311 391646 W 2011-02-03 1996-07-31 +S000003564 ORF Uncharacterized YJL027C chromosome 10 10 392249 391833 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000036407 CDS YJL027C 10 392249 391833 C 2011-02-03 1996-07-31 +S000003563 ORF Verified YJL026W RNR2 ribonucleotide-diphosphate reductase subunit RNR2|CRT6 chromosome 10 L000001656 10 392404 393603 W 0 2011-02-03 1996-07-31 Ribonucleotide-diphosphate reductase (RNR), small subunit; the RNR complex catalyzes the rate-limiting step in dNTP synthesis and is regulated by DNA replication and DNA damage checkpoint pathways via localization of the small subunits; RNR2 has a paralog, RNR4, that arose from the whole genome duplication +S000036365 CDS YJL026W 10 392404 393603 W 2011-02-03 1996-07-31 +S000028660 ORF Dubious YJL026C-A chromosome 10 10 393287 393066 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL026W/RNR2 +S000032485 CDS YJL026C-A 10 393287 393066 C 2011-02-03 2003-07-29 +S000003562 ORF Verified YJL025W RRN7 chromosome 10 L000001773 10 393967 395511 W 2011-02-03 1996-07-31 Component of the core factor (CF) rDNA transcription factor complex; CF is required for transcription of 35S rRNA genes by RNA polymerase I and is composed of Rrn6p, Rrn7p, and Rrn11p +S000036283 CDS YJL025W 10 393967 395511 W 2011-02-03 1996-07-31 +S000003561 ORF Verified YJL024C APS3 YKS7 chromosome 10 L000003174 10 396592 395931 C 2011-02-03 1996-07-31 Small subunit of the clathrin-associated adaptor complex AP-3; involved in vacuolar protein sorting; related to the sigma subunit of the mammalian clathrin AP-3 complex; suppressor of loss of casein kinase 1 function; protein abundance increases in response to DNA replication stress +S000036076 CDS YJL024C 10 396493 395931 C 2011-02-03 1996-07-31 +S000036075 CDS YJL024C 10 396592 396571 C 2011-02-03 1996-07-31 +S000036077 intron YJL024C 10 396570 396494 C 2011-02-03 1996-07-31 +S000006583 tRNA_gene tG(GCC)J1 chromosome 10 L000003622 10 396796 396726 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000030415 noncoding_exon tG(GCC)J1 10 396796 396726 C 2011-02-03 2000-05-19 +S000003559 ORF Dubious YJL022W chromosome 10 10 398109 398417 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene PET130 +S000035121 CDS YJL022W 10 398109 398417 W 2011-02-03 1996-07-31 +S000003560 ORF Verified YJL023C PET130 chromosome 10 L000003025 10 398398 397355 C 2011-02-03 1996-07-31 Protein required for respiratory growth; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000035183 CDS YJL023C 10 398398 397355 C 2011-02-03 1996-07-31 +S000028659 ORF Dubious YJL020W-A chromosome 10 10 400981 401238 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YJL020C/BBC1 +S000032463 CDS YJL020W-A 10 400981 401238 W 2011-02-03 2003-07-29 +S000003557 ORF Verified YJL020C BBC1 YJL021C|MTI1 chromosome 10 10 402410 398937 C 2011-02-03 2001-06-28|1996-07-31 Protein possibly involved in assembly of actin patches; interacts with an actin assembly factor Las17p and with the SH3 domains of Type I myosins Myo3p and Myo5p; localized predominantly to cortical actin patches +S000033969 CDS YJL020C 10 402410 398937 C 2011-02-03 2001-06-28|1996-07-31 +S000003556 ORF Verified YJL019W MPS3 YJL018W|NEP98 chromosome 10 10 402897 404945 W 2011-02-03 2003-01-02|1996-07-31 Nuclear envelope protein; required for SPB insertion, SPB duplication, Kar5p localization near the SPB and nuclear fusion; interacts with Mps2p to tether half-bridge to core SPB; N-terminal acetylation by Eco1p regulates its role in nuclear organization; localizes to the SPB half bridge and telomeres during meiosis; required with Ndj1p and Csm4p for meiotic bouquet formation and telomere-led rapid prophase movement; member of the SUN protein family (Sad1-UNC-84 homology) +S000035368 CDS YJL019W 10 402897 404945 W 2011-02-03 2003-01-02|1996-07-31 +S000003553 ORF Uncharacterized YJL016W TPH3 YJL017W chromosome 10 10 405588 407273 W 2011-02-03 2003-09-29|1996-07-31 Putative protein of unknown function; GFP-fusion protein localizes to the cytoplasm; contains two adjacent PH-like domains; conserved in closely related Saccharomyces species +S000034286 CDS YJL016W 10 405588 407273 W 2011-02-03 2003-09-29|1996-07-31 +S000003552 ORF Dubious YJL015C chromosome 10 10 407426 407142 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame unlikely to encode a functional protein; expression if heat-inducible; located in promoter region of essential CCT3 gene encoding a subunit of the cytosolic chaperonin Cct ring complex, overlaps ORF YJL016W +S000034109 CDS YJL015C 10 407426 407142 C 2011-02-03 1996-07-31|2011-02-03 +S000003551 ORF Verified YJL014W CCT3 chaperonin-containing T-complex subunit CCT3|TCP3|BIN2 chromosome 10 L000002270 10 407558 409162 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo; capable of binding Q/N rich proteins and mediating their folding +S000034079 CDS YJL014W 10 407558 409162 W 2011-02-03 1996-07-31 +S000003550 ORF Verified YJL013C MAD3 chromosome 10 L000003179 10 411040 409493 C 2011-02-03 1996-07-31 Subunit of spindle-assembly checkpoint complex; involved in delaying anaphase onset in cells with defects in mitotic spindle assembly; pseudosubstrate inhibitor of APC(Cdc20), the anaphase promoting complex involved in securin (Pds1p) turnover; MAD3 has a paralog, BUB1, that arose from the whole genome duplication +S000032025 CDS YJL013C 10 411040 409493 C 2011-02-03 1996-07-31 +S000003549 ORF Verified YJL012C VTC4 YJL012C-A|PHM3 chromosome 10 S000007513 10 413399 411234 C 2011-02-03 2004-02-19|1996-07-31 Vacuolar membrane polyphosphate polymerase; subunit of the vacuolar transporter chaperone (VTC) complex involved in synthesis and transfer of polyP to the vacuole; regulates membrane trafficking; role in non-autophagic vacuolar fusion; protein abundance increases in response to DNA replication stress +S000031895 CDS YJL012C 10 413399 411234 C 2011-02-03 2004-02-19|1996-07-31 +S000003548 ORF Verified YJL011C RPC17 DNA-directed RNA polymerase III subunit RPC17|C17 chromosome 10 10 414770 414285 C 2011-02-03 1996-07-31|2011-02-03 RNA polymerase III subunit C17; physically interacts with C31, C11, and TFIIIB70; may be involved in the recruitment of pol III by the preinitiation complex; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia +S000030894 CDS YJL011C 10 414770 414285 C 2011-02-03 1996-07-31|2011-02-03 +S000006625 tRNA_gene tK(CUU)J chromosome 10 L000003611 10 414966 415038 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000036030 noncoding_exon tK(CUU)J 10 414966 415038 W 2011-02-03 2000-05-19 +S000006773 tRNA_gene tW(CCA)J chromosome 10 L000003621 10 416036 415931 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis +S000033314 intron tW(CCA)J 10 416000 415967 C 2011-02-03 2000-05-19 +S000033313 noncoding_exon tW(CCA)J 10 415966 415931 C 2011-02-03 2000-05-19 +S000033312 noncoding_exon tW(CCA)J 10 416036 416001 C 2011-02-03 2000-05-19 +S000007047 long_terminal_repeat YJLWtau3 YJRWtau3 chromosome 10 10 416266 416441 W 2011-02-03 2000-05-19 Ty4 LTR +S000007029 long_terminal_repeat YJLWdelta8 chromosome 10 10 416506 416650 W 2011-02-03 2000-05-19 Ty1 LTR +S000007030 long_terminal_repeat YJLWdelta9 chromosome 10 10 416899 417026 W 2011-02-03 2000-05-19 Ty1 LTR +S000028451 ARS ARS1014 ARSX-417 chromosome 10 10 417195 417440 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000003547 ORF Verified YJL010C NOP9 RNA-binding RNA processing protein NOP9 chromosome 10 10 419562 417562 C 2011-02-03 1996-07-31 Essential subunit of U3-containing 90S preribosome; involved in production of 18S rRNA and assembly of small ribosomal subunit; also part of pre-40S ribosome and required for its export into cytoplasm; binds RNA and contains pumilio domain +S000030801 CDS YJL010C 10 419562 417562 C 2011-02-03 1996-07-31 +S000003546 ORF Dubious YJL009W chromosome 10 10 419855 420181 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps CCT8/YJL008C, a verified gene encoding a subunit of the cytosolic chaperonin Cct ring complex +S000031233 CDS YJL009W 10 419855 420181 W 2011-02-03 1996-07-31 +S000003545 ORF Verified YJL008C CCT8 chaperonin-containing T-complex subunit CCT8 chromosome 10 L000002764 10 421663 419957 C 2011-02-03 1996-07-31|2011-02-03 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo +S000031107 CDS YJL008C 10 421663 419957 C 2011-02-03 1996-07-31|2011-02-03 +S000007038 long_terminal_repeat YJLWtau4 chromosome 10 10 421946 422295 W 2011-02-03 2000-05-19|2011-02-03 Ty4 LTR +S000007031 long_terminal_repeat YJLWdelta10 chromosome 10 10 422601 422887 W 2011-02-03 2000-05-19 Ty1 LTR +S000006662 tRNA_gene tM(CAU)J2 EMT3 chromosome 10 L000000553|L000003612 10 422937 423009 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis +S000029922 noncoding_exon tM(CAU)J2 10 422937 423009 W 2011-02-03 2000-05-19 +S000003544 ORF Dubious YJL007C chromosome 10 10 423012 422698 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031008 CDS YJL007C 10 423012 422698 C 2011-02-03 1996-07-31 +S000003543 ORF Verified YJL006C CTK2 chromosome 10 L000003011 10 424109 423138 C 2011-02-03 1996-07-31 Beta subunit of C-terminal domain kinase I (CTDK-I); which phosphorylates both RNA pol II subunit Rpo21p to affect transcription and pre-mRNA 3' end processing, and ribosomal protein Rps2p to increase translational fidelity; relocalizes to the cytosol in response to hypoxia +S000030929 CDS YJL006C 10 424109 423138 C 2011-02-03 1996-07-31 +S000006650 tRNA_gene tL(UAA)J SUP51 SUP52 chromosome 10 L000002209|L000003620 10 424515 424432 C 0 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations +S000037406 noncoding_exon tL(UAA)J 10 424515 424432 C 2011-02-03 2000-05-19 +S000003542 ORF Verified YJL005W CYR1 adenylate cyclase|FIL1|TSM0185|SRA4|HSR1|CDC35 chromosome 10 L000000467 10 425157 431237 W 2 2011-02-03 1996-07-31 Adenylate cyclase; required for cAMP production and cAMP-dependent protein kinase signaling; the cAMP pathway controls a variety of cellular processes, including metabolism, cell cycle, stress response, stationary phase, and sporulation +S000029993 CDS YJL005W 10 425157 431237 W 2011-02-03 1996-07-31 +S000003541 ORF Verified YJL004C SYS1 chromosome 10 L000004153 10 432200 431589 C 2011-02-03 1996-07-31 Integral membrane protein of the Golgi; required for targeting of the Arf-like GTPase Arl3p to the Golgi; multicopy suppressor of ypt6 null mutation +S000037910 CDS YJL004C 10 432200 431589 C 2011-02-03 1996-07-31 +S000003540 ORF Verified YJL003W COX16 chromosome 10 10 432644 433000 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; required for assembly of cytochrome c oxidase +S000037880 CDS YJL003W 10 432644 433000 W 2011-02-03 1996-07-31 +S000003539 ORF Verified YJL002C OST1 dolichyl-diphosphooligosaccharide--protein glycotransferase subunit OST1|NLT1 chromosome 10 L000002649 10 434651 433221 C 2011-02-03 1996-07-31 Alpha subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins +S000035955 CDS YJL002C 10 434651 433221 C 2011-02-03 1996-07-31 +S000003538 ORF Verified YJL001W PRE3 proteasome core particle subunit beta 1|CRL21 chromosome 10 L000000418|L000001485 10 435163 435926 W 2011-02-03 1996-07-31 Beta 1 subunit of the 20S proteasome; responsible for cleavage after acidic residues in peptides +S000035909 CDS YJL001W 10 435163 435227 W 2011-02-03 1996-07-31 +S000035910 CDS YJL001W 10 435344 435926 W 2011-02-03 1996-07-31 +S000035911 intron YJL001W 10 435228 435343 W 2011-02-03 1996-07-31 +S000006471 centromere CEN10 CEN10 chromosome 10 L000000303 10 436425 436307 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome X centromere +S000077296 centromere_DNA_Element_I CEN10 10 436425 436416 C 2011-02-03 2004-10-08 +S000077297 centromere_DNA_Element_II CEN10 10 436415 436332 C 2011-02-03 2004-10-08 +S000077298 centromere_DNA_Element_III CEN10 10 436331 436307 C 2011-02-03 2004-10-08 +S000003761 ORF Verified YJR001W AVT1 chromosome 10 10 436802 438610 W 2011-02-03 1996-07-31 Vacuolar transporter; imports large neutral amino acids into the vacuole; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters +S000033093 CDS YJR001W 10 436802 438610 W 2011-02-03 1996-07-31 +S000003762 ORF Verified YJR002W MPP10 rRNA-processing protein MPP10 chromosome 10 L000004335 10 438865 440646 W 2011-02-03 1996-07-31 Component of the SSU processome and 90S preribosome; required for pre-18S rRNA processing, interacts with and controls the stability of Imp3p and Imp4p, essential for viability; similar to human Mpp10p +S000033184 CDS YJR002W 10 438865 440646 W 2011-02-03 1996-07-31 +S000003763 ORF Uncharacterized YJR003C MRX12 chromosome 10 10 442553 440994 C 2011-02-03 1996-07-31|2006-05-09 Protein that associates with mitochondrial ribosome; detected in highly purified mitochondria in high-throughput studies; predicted to be involved in ribosome biogenesis +S000033209 CDS YJR003C 10 442553 440994 C 2011-02-03 1996-07-31|2006-05-09 +S000028452 ARS ARS1015 chromosome 10 10 442556 442965 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000003764 ORF Verified YJR004C SAG1 AG(ALPHA)1 chromosome 10 L000001796 10 444861 442909 C 2 2011-02-03 1996-07-31 Alpha-agglutinin of alpha-cells; binds to Aga1p during agglutination, N-terminal half is homologous to the immunoglobulin superfamily and contains binding site for a-agglutinin, C-terminal half is highly glycosylated and contains GPI anchor +S000034030 CDS YJR004C 10 444861 442909 C 2011-02-03 1996-07-31 +S000003765 ORF Verified YJR005W APL1 YAP80 chromosome 10 L000002495 10 445923 448025 W 2011-02-03 1996-07-31 Beta-adaptin; large subunit of the clathrin associated protein complex (AP-2); involved in vesicle mediated transport; similar to mammalian beta-chain of the clathrin associated protein complex +S000034176 CDS YJR005W 10 445923 448025 W 2011-02-03 1996-07-31 +S000028523 ORF Verified YJR005C-A LSO1 chromosome 10 10 448758 448477 C 2011-02-03 2003-07-29 Protein with a potential role in response to iron deprivation; transcription increases during iron deprivation and during treatment with 2-(6-benzyl-2-pyridyl)quinazoline (BPQ) and copper; regulated by Aft1p and, to a lesser extent, by Aft2p; originally identified as a syntenic homolog of an Ashbya gossypii gene; localizes to nucleus and cytoplasm, and nuclear localization is enhanced under iron-replete conditions +S000030322 CDS YJR005C-A 10 448758 448477 C 2011-02-03 2003-07-29 +S000003766 ORF Verified YJR006W POL31 DNA-directed DNA polymerase delta subunit POL31|HYS2|SDP5|HUS2 chromosome 10 L000002981 10 449202 450665 W 2011-02-03 1996-07-31 Subunit of DNA polymerase delta (polymerase III); essential for cell viability; involved in DNA replication and DNA repair; forms a complex with Rev3p, Rev7p and Pol32p; relocalizes to the cytosol in response to hypoxia +S000035159 CDS YJR006W 10 449202 450665 W 2011-02-03 1996-07-31 +S000003767 ORF Verified YJR007W SUI2 translation initiation factor eIF2 subunit alpha chromosome 10 L000002178 10 451020 451934 W 2 2011-02-03 1996-07-31 Alpha subunit of the translation initiation factor eIF2; eIF2 is involved in identification of the start codon; phosphorylation of Ser51 is required for regulation of translation by inhibiting the exchange of GDP for GTP; protein abundance increases in response to DNA replication stress +S000035254 CDS YJR007W 10 451020 451934 W 2011-02-03 1996-07-31 +S000003768 ORF Verified YJR008W MHO1 chromosome 10 10 452430 453446 W 2011-02-03 1996-07-31 Protein of unknown function; inhibits haploid invasive growth when overexpressed; synthetically lethal with phospholipase C (PLC1); expression induced by mild heat-stress on a non-fermentable carbon source, upon entry into stationary phase and upon nitrogen deprivation; repressed by inosine and choline in an Opi1p-dependent manner; highly conserved from bacteria to human; Memo, the human homolog, is an ErbB2 interacting protein with an essential function in cell motility +S000035336 CDS YJR008W 10 452430 453446 W 2011-02-03 1996-07-31 +S000028453 ARS ARS1016 chromosome 10 10 454584 455555 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000003769 ORF Verified YJR009C TDH2 glyceraldehyde-3-phosphate dehydrogenase (phosphorylating) TDH2|GAPDH|GLD2 chromosome 10 L000002273 10 454681 453683 C 2.95 2011-02-03 1996-07-31 Glyceraldehyde-3-phosphate dehydrogenase (GAPDH), isozyme 2; involved in glycolysis and gluconeogenesis; tetramer that catalyzes reaction of glyceraldehyde-3-phosphate to 1,3 bis-phosphoglycerate; detected in cytoplasm and cell wall; protein abundance increases in response to DNA replication stress; GAPDH-derived antimicrobial peptides are active against a wide variety of wine-related yeasts and bateria; TDH2 has a paralog, TDH3, that arose from the whole genome duplication +S000035380 CDS YJR009C 10 454681 453683 C 2011-02-03 1996-07-31 +S000003771 ORF Verified YJR010W MET3 sulfate adenylyltransferase chromosome 10 L000001078 10 456239 457774 W 3 2011-02-03 1996-07-31 ATP sulfurylase; catalyzes the primary step of intracellular sulfate activation, essential for assimilatory reduction of sulfate to sulfide, involved in methionine metabolism; human homolog PAPSS2 complements yeast null mutant +S000031767 CDS YJR010W 10 456239 457774 W 2011-02-03 1996-07-31 +S000003770 ORF Verified YJR010C-A SPC1 signal peptidase complex subunit SPC1 chromosome 10 L000003006 10 458361 458077 C 2011-02-03 1996-07-31 Subunit of the signal peptidase complex (SPC); SPC cleaves the signal sequence from proteins targeted to the endoplasmic reticulum (ER); homolog of the SPC12 subunit of mammalian signal peptidase complex; protein abundance increases in response to DNA replication stress +S000037612 CDS YJR010C-A 10 458361 458077 C 2011-02-03 1996-07-31 +S000028454 ARS ARS1017 chromosome 10 10 459337 459895 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000003772 ORF Uncharacterized YJR011C chromosome 10 10 459426 458641 C 2011-02-03 1996-07-31 Putative protein of unknown function; GFP-fusion protein expression is induced in response to the DNA-damaging agent MMS +S000031827 CDS YJR011C 10 459426 458641 C 2011-02-03 1996-07-31 +S000003774 ORF Verified YJR013W GPI14 glycosylphosphatidylinositol-alpha 1,4 mannosyltransferase I|PMH1 chromosome 10 10 460382 461593 W 2011-02-03 2004-02-12|1996-07-31 Glycosylphosphatidylinositol-alpha 1,4 mannosyltransferase I; involved in GPI anchor biosynthesis, requires Pbn1p for function; homolog of mammalian PIG-M +S000037491 CDS YJR013W 10 460382 461593 W 2011-02-03 2004-02-12|1996-07-31 +S000003773 ORF Uncharacterized YJR012C chromosome 10 10 460418 459795 C 2011-02-03 1996-07-31 Essential protein of unknown function; proposed involvement in transport based on mass spectrometry analysis of copurifying proteins; partially overlaps neighboring ORF, GPI14/YJR013W +S000031960 CDS YJR012C 10 460418 459795 C 2011-02-03 1996-07-31 +S000003775 ORF Verified YJR014W TMA22 RBF22 chromosome 10 10 461829 462425 W 2011-02-03 1996-07-31 Protein of unknown function; associates with ribosomes and has a putative RNA binding domain; interacts with Tma20p; similar to human GRAP and human DRP1, which interacts with human Tma20p homolog MCT-1; protein abundance increases in response to DNA replication stress +S000037578 CDS YJR014W 10 461829 462425 W 2011-02-03 1996-07-31 +S000003776 ORF Uncharacterized YJR015W chromosome 10 10 462721 464253 W 2011-02-03 1996-07-31 Putative protein of unknown function; localizes to endoplasmic reticulum and cytoplasm; predicted to encode a membrane transporter based on phylogenetic analysis; not an essential gene; YJR015W has a paralog, SNG1, that arose from the whole genome duplication +S000037660 CDS YJR015W 10 462721 464253 W 2011-02-03 1996-07-31 +S000003777 ORF Verified YJR016C ILV3 dihydroxy-acid dehydratase ILV3 chromosome 10 L000000859 10 466208 464451 C 10 2011-02-03 1996-07-31 Dihydroxyacid dehydratase; catalyzes third step in the common pathway leading to biosynthesis of branched-chain amino acids +S000037686 CDS YJR016C 10 466208 464451 C 2011-02-03 1996-07-31 +S000003779 ORF Dubious YJR018W chromosome 10 10 466786 467148 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030641 CDS YJR018W 10 466786 467148 W 2011-02-03 1996-07-31 +S000003778 ORF Verified YJR017C ESS1 peptidylprolyl isomerase ESS1|PIN1|PTF1 chromosome 10 L000000587 10 467033 466521 C 17 2011-02-03 2003-09-22|1996-07-31 Peptidylprolyl-cis/trans-isomerase (PPIase); specific for phosphorylated S/T residues N-terminal to proline; regulates phosphorylation of RNAPII large subunit (Rpo21p) C-terminal domain (CTD) at Ser7; associates with phospho-Ser5 form of RNAPII in vivo; present along entire coding length of genes; represses initiation of CUTs; required for efficient termination of mRNA transcription, trimethylation of histone H3; human ortholog PIN1 can complement yeast null and ts mutants +S000030503 CDS YJR017C 10 467033 466521 C 2011-02-03 2003-09-22|1996-07-31 +S000003781 ORF Dubious YJR020W chromosome 10 10 468001 468333 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030190 CDS YJR020W 10 468001 468333 W 2011-02-03 1996-07-31 +S000003780 ORF Verified YJR019C TES1 PTE1 chromosome 10 L000003343 10 468281 467232 C 2011-02-03 1996-07-31 Peroxisomal acyl-CoA thioesterase; likely to be involved in fatty acid oxidation rather than fatty acid synthesis; conserved protein also found in human peroxisomes; TES1 mRNA levels increase during growth on fatty acids +S000030681 CDS YJR019C 10 468281 467232 C 2011-02-03 1996-07-31 +S000003782 ORF Verified YJR021C REC107 MER2 chromosome 10 L000001606 10 469579 468555 C 2011-02-03 1996-07-31 Protein involved in early stages of meiotic recombination; involved in coordination between the initiation of recombination and the first division of meiosis; part of a complex (Rec107p-Mei4p-Rec114p) required for ds break formation +S000030251 CDS YJR021C 10 469183 468555 C 2011-02-03 1996-07-31 +S000030250 CDS YJR021C 10 469579 469264 C 2011-02-03 1996-07-31 +S000030252 intron YJR021C 10 469263 469184 C 2011-02-03 1996-07-31 +S000003783 ORF Verified YJR022W LSM8 U4/U6-U5 snRNP complex subunit LSM8 chromosome 10 L000004687 10 469784 470113 W 2011-02-03 2003-09-22|1996-07-31 Lsm (Like Sm) protein; forms heteroheptameric complex (with Lsm2p, Lsm3p, Lsm4p, Lsm5p, Lsm6p, and Lsm7p) that is part of spliceosomal U6 snRNP and is also implicated in processing of pre-tRNA, pre-snoRNA, and pre-rRNA +S000033657 CDS YJR022W 10 469784 470113 W 2011-02-03 2003-09-22|1996-07-31 +S000003784 ORF Dubious YJR023C chromosome 10 10 470205 469804 C 2011-02-03 1996-07-31 Putative protein of unknown function; open reading frame overlaps LSM8/YJR022W encoding an essential snRNP protein required for RNA processing and splicing +S000033704 CDS YJR023C 10 470205 469804 C 2011-02-03 1996-07-31 +S000003785 ORF Verified YJR024C MDE1 methylthioribulose 1-phosphate dehydratase MDE1 chromosome 10 10 470964 470230 C 2011-02-03 1996-07-31 5'-methylthioribulose-1-phosphate dehydratase; acts in the methionine salvage pathway; potential Smt3p sumoylation substrate; expression downregulated by caspofungin and deletion mutant is caspofungin resistant +S000033856 CDS YJR024C 10 470964 470230 C 2011-02-03 1996-07-31 +S000003786 ORF Verified YJR025C BNA1 3-hydroxyanthranilate 3,4-dioxygenase|HAD1 chromosome 10 L000003490 10 471671 471138 C 2011-02-03 1996-07-31 3-hydroxyanthranilic acid dioxygenase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p +S000033981 CDS YJR025C 10 471671 471138 C 2011-02-03 1996-07-31 +S000007040 long_terminal_repeat YJRWdelta11 chromosome 10 10 472463 472800 W 2011-02-03 2000-05-19 Ty1 LTR +S000007048 LTR_retrotransposon YJRWTy1-1 Ty1 chromosome 10 10 472463 478384 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000003787 transposable_element_gene YJR026W gag protein chromosome 10 10 472760 474082 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034898 CDS YJR026W 10 472760 474082 W 2011-02-03 1996-07-31 +S000003788 transposable_element_gene YJR027W gag-pol fusion protein chromosome 10 10 472760 478028 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000035049 CDS YJR027W 10 472760 474061 W 2011-02-03 1996-07-31 +S000035050 CDS YJR027W 10 474063 478028 W 2011-02-03 1996-07-31 +S000035051 plus_1_translational_frameshift YJR027W 10 474062 474062 W 2011-02-03 1996-07-31 +S000007041 long_terminal_repeat YJRWdelta12 chromosome 10 10 478051 478384 W 2011-02-03 2000-05-19 Ty1 LTR +S000007049 LTR_retrotransposon YJRWTy1-2 Ty1 chromosome 10 10 478051 483972 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000003789 transposable_element_gene YJR028W gag protein chromosome 10 10 478344 479666 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035151 CDS YJR028W 10 478344 479666 W 2011-02-03 1996-07-31 +S000003790 transposable_element_gene YJR029W gag-pol fusion protein chromosome 10 10 478344 483612 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000036043 CDS YJR029W 10 478344 479644 W 2011-02-03 1996-07-31 +S000036044 CDS YJR029W 10 479646 483612 W 2011-02-03 1996-07-31 +S000036045 plus_1_translational_frameshift YJR029W 10 479645 479645 W 2011-02-03 1996-07-31 +S000007042 long_terminal_repeat YJRWdelta13 chromosome 10 10 483635 483972 W 2011-02-03 2000-05-19 Ty1 LTR +S000003791 ORF Uncharacterized YJR030C RBH2 RBH2 chromosome 10 10 486196 483959 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression repressed in carbon limited vs carbon replete chemostat cultures; non-essential gene; contains a PH-like domain; RBH2 has a paralog, RBH1, that arose from the whole genome duplication +S000034642 CDS YJR030C 10 486196 483959 C 2011-02-03 1996-07-31 +S000003792 ORF Verified YJR031C GEA1 Arf family guanine nucleotide exchange factor GEA1 chromosome 10 L000004312 10 490812 486586 C 2011-02-03 1996-07-31 Guanine nucleotide exchange factor for ADP ribosylation factors (ARFs); involved in vesicular transport between the Golgi and ER, Golgi organization, and actin cytoskeleton organization; GEA1 has a paralog, GEA2, that arose from the whole genome duplication +S000034771 CDS YJR031C 10 490812 486586 C 2011-02-03 1996-07-31 +S000003793 ORF Verified YJR032W CPR7 peptidylprolyl isomerase CPR7 chromosome 10 L000003230 10 491081 492262 W 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; binds to Hsp82p and contributes to chaperone activity; plays a role in determining prion variants +S000035830 CDS YJR032W 10 491081 492262 W 2011-02-03 1996-07-31 +S000003794 ORF Verified YJR033C RAV1 SOI3 chromosome 10 S000029472|L000002969 10 496451 492378 C 2011-02-03 1996-07-31 Subunit of RAVE complex (Rav1p, Rav2p, Skp1p); the RAVE complex promotes assembly of the V-ATPase holoenzyme; required for transport between the early and late endosome/PVC and for localization of TGN membrane proteins; potential Cdc28p substrate +S000035875 CDS YJR033C 10 496451 492378 C 2011-02-03 1996-07-31 +S000003795 ORF Verified YJR034W PET191 chromosome 10 L000001400 10 496683 497009 W 2011-02-03 1996-07-31 Protein required for assembly of cytochrome c oxidase; exists as an oligomer; described as both an integral mitochondrial inner membrane protein facing the intermembrane space (IMS) and as a soluble IMS protein; contains a twin Cx9C motif; imported into the IMS via the MIA import machinery +S000037813 CDS YJR034W 10 496683 497009 W 2011-02-03 1996-07-31 +S000003796 ORF Verified YJR035W RAD26 DNA-dependent ATPase RAD26 chromosome 10 L000001569 10 497355 500612 W 2011-02-03 1996-07-31 Protein involved in transcription-coupled nucleotide excision repair; repairs UV-induced DNA lesions; recruitment to DNA lesions is dependent on an elongating RNA polymerase II; homolog of human CSB protein +S000037907 CDS YJR035W 10 497355 500612 W 2011-02-03 1996-07-31 +S000003798 ORF Dubious YJR037W chromosome 10 10 503102 503485 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene HUL4/YJR036C; deletion mutant has decreased spore survival in Drosophila feces +S000030927 CDS YJR037W 10 503102 503485 W 2011-02-03 1996-07-31 +S000003797 ORF Verified YJR036C HUL4 putative E3 ubiquitin-protein ligase HUL4 chromosome 10 10 503391 500713 C 2011-02-03 1996-07-31 Protein with similarity to hect domain E3 ubiquitin-protein ligases; not essential for viability; found in association with Trf4 in TRAMP complex +S000029850 CDS YJR036C 10 503391 500713 C 2011-02-03 1996-07-31 +S000003800 ORF Uncharacterized YJR039W chromosome 10 10 503936 507301 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000031105 CDS YJR039W 10 503936 507301 W 2011-02-03 1996-07-31 +S000003799 ORF Dubious YJR038C chromosome 10 10 504072 503710 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030967 CDS YJR038C 10 504072 503710 C 2011-02-03 1996-07-31 +S000003801 ORF Verified YJR040W GEF1 CLC chromosome 10 L000000701 10 507746 510085 W 2011-02-03 1996-07-31 Voltage-gated chloride channel; localized to the golgi, the endosomal system, and plasma membrane; involved in cation homeostasis; highly homologous to vertebrate voltage-gated chloride channels; modulates TBSV model (+) RNA virus replication by regulating copper metabolism +S000030664 CDS YJR040W 10 507746 510085 W 2011-02-03 1996-07-31 +S000003802 ORF Verified YJR041C URB2 NPA2 chromosome 10 10 513763 510239 C 2011-02-03 1996-07-31 Protein required for normal metabolism of the rRNA primary transcript; nucleolar protein; proposed to be involved in ribosome biogenesis +S000030713 CDS YJR041C 10 513763 510239 C 2011-02-03 1996-07-31 +S000003803 ORF Verified YJR042W NUP85 RAT9 chromosome 10 L000003023 10 514055 516289 W 2011-02-03 1996-07-31 Subunit of the Nup84p subcomplex of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport and NPC biogenesis and is involved in establishment of a normal nucleocytoplasmic concentration gradient of the GTPase Gsp1p; also plays roles in several processes that may require localization of genes or chromosomes at the nuclear periphery, including double-strand break repair, transcription and chromatin silencing; homologous to human NUP85 aka NUP75 +S000030892 CDS YJR042W 10 514055 516289 W 2011-02-03 1996-07-31 +S000003804 ORF Verified YJR043C POL32 DNA polymerase delta subunit POL32|REV5 chromosome 10 L000004337|S000029416|L000001617 10 517513 516461 C 2011-02-03 1996-07-31 Third subunit of DNA polymerase delta; involved in chromosomal DNA replication; required for error-prone DNA synthesis in the presence of DNA damage and processivity; forms a complex with Rev3p, Rev7p and Pol31p; interacts with Hys2p, PCNA (Pol30p), and Pol1p +S000031802 CDS YJR043C 10 517513 516461 C 2011-02-03 1996-07-31 +S000006663 tRNA_gene tM(CAU)J3 IMT3 chromosome 10 L000003619 10 517884 517813 C 2011-02-03 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation +S000029924 noncoding_exon tM(CAU)J3 10 517884 517813 C 2011-02-03 2000-05-19 +S000007043 long_terminal_repeat YJRWdelta14 chromosome 10 10 517959 518099 W 2011-02-03 2000-05-19 Ty1 LTR +S000003805 ORF Verified YJR044C VPS55 chromosome 10 10 519185 518763 C 2011-02-03 1996-07-31 Late endosomal protein involved in late endosome to vacuole transport; functional homolog of human obesity receptor gene-related protein (OB-RGRP) +S000031950 CDS YJR044C 10 519185 518763 C 2011-02-03 1996-07-31 +S000003806 ORF Verified YJR045C SSC1 Hsp70 family ATPase SSC1|mtHSP70|ENS1 chromosome 10 L000000561 10 521602 519638 C 2011-02-03 1996-07-31 Hsp70 family ATPase; constituent of the import motor component of the Translocase of the Inner Mitochondrial membrane (TIM23 complex); involved in protein translocation and folding; subunit of SceI endonuclease; SSC1 has a paralog, ECM10, that arose from the whole genome duplication +S000032104 CDS YJR045C 10 521602 519638 C 2011-02-03 1996-07-31 +S000003807 ORF Verified YJR046W TAH11 CDT1|SID2 chromosome 10 L000004733 10 522048 523862 W 2011-02-03 1996-07-31 DNA replication licensing factor; required for pre-replication complex assembly +S000034108 CDS YJR046W 10 522048 523862 W 2011-02-03 1996-07-31 +S000006727 tRNA_gene tS(AGA)J chromosome 10 L000003618 10 524093 524012 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032380 noncoding_exon tS(AGA)J 10 524093 524012 C 2011-02-03 2000-05-19 +S000003808 ORF Verified YJR047C ANB1 translation elongation factor eIF-5A|eIF-5A|eIF5A|TIF51B|HYP1 chromosome 10 L000000085|L000000846|L000002308 10 525381 524908 C 2011-02-03 1996-07-31 Translation elongation factor eIF-5A; previously thought to function in translation initiation; undergoes an essential hypusination modification; expressed under anaerobic conditions; ANB1 has a paralog, HYP2, that arose from the whole genome duplication; human EIF5A complements the inviability of the yeast hyp2 anb1 double null mutant +S000034179 CDS YJR047C 10 525381 524908 C 2011-02-03 1996-07-31 +S000003809 ORF Verified YJR048W CYC1 cytochrome c isoform 1 chromosome 10 L000000448 10 526335 526664 W 34 2011-02-03 1996-07-31 Cytochrome c, isoform 1; also known as iso-1-cytochrome c; electron carrier of mitochondrial intermembrane space that transfers electrons from ubiquinone-cytochrome c oxidoreductase to cytochrome c oxidase during cellular respiration; CYC1 has a paralog, CYC7, that arose from the whole genome duplication; human homolog CYC1 can complement yeast null mutant; mutations in human CYC1 cause insulin-responsive hyperglycemia +S000034309 CDS YJR048W 10 526335 526664 W 2011-02-03 1996-07-31 +S000003810 ORF Verified YJR049C UTR1 NADH/NAD(+) kinase chromosome 10 L000002680 10 528476 526884 C 2011-02-03 1996-07-31 ATP-NADH kinase; phosphorylates both NAD and NADH; active as a hexamer; enhances the activity of ferric reductase (Fre1p); UTR1 has a paralog, YEF1, that arose from the whole genome duplication +S000034337 CDS YJR049C 10 528476 526884 C 2011-02-03 1996-07-31 +S000003811 ORF Verified YJR050W ISY1 NTC30|UTR3 chromosome 10 L000002730 10 528697 529404 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); NTC contains Prp19p and stabilizes U6 snRNA in catalytic forms of spliceosome containing U2, U5, and U6 snRNAs; interacts with Prp16p to modulate splicing fidelity; isy1 syf2 cells have defective spindles +S000033850 CDS YJR050W 10 528697 529404 W 2011-02-03 1996-07-31 +S000003812 ORF Verified YJR051W OSM1 fumarate reductase|FRDS2 chromosome 10 L000001317 10 529861 531366 W 34 2011-02-03 1996-07-31 Fumarate reductase, catalyzes the reduction of fumarate to succinate; required for the reoxidation of intracellular NADH under anaerobic conditions; mutations cause osmotic sensitivity; has two translation start sites, one at the annotated start codon which produces an ER-targeted form required for anaerobic growth, and one at codon 32 which produces a mitochondrially-targeted form; OSM1 has a paralog, FRD1, that arose from the whole genome duplication +S000033966 CDS YJR051W 10 529861 531366 W 2011-02-03 1996-07-31 +S000007032 long_terminal_repeat YJRCdelta15 YJLWdelta15 chromosome 10 10 531675 531516 C 2011-02-03 2000-05-19|2007-04-04 Ty1 LTR +S000006584 tRNA_gene tG(GCC)J2 SUF23 chromosome 10 L000003613|S000029541|L000002170 10 531828 531898 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly); can mutate to suppress +1 frameshift mutations +S000030417 noncoding_exon tG(GCC)J2 10 531828 531898 W 2011-02-03 2000-05-19 +S000003813 ORF Verified YJR052W RAD7 UV-damaged DNA-binding protein RAD7 chromosome 10 L000001561 10 532062 533759 W 35 2011-02-03 1996-07-31 Nucleotide excision repair (NER) protein; binds damaged DNA during NER; binds DNA in an ATP-dependent manner (with Rad16p) during NER; required for repair of non-transcribed chromatin; subunit of Nucleotide Excision Repair Factor 4 (NEF4) and the Elongin-Cullin-Socs (ECS) ligase complex +S000034844 CDS YJR052W 10 532062 533759 W 2011-02-03 1996-07-31 +S000003814 ORF Verified YJR053W BFA1 IBD1 chromosome 10 10 534027 535751 W 2011-02-03 1996-07-31 Subunit of a two-component GTPase-activating protein, Bfa1p-Bub2p; contributes to GAP activity, inactivating Tem1 by stimulating GTP hydrolysis following damage or misalignment of the mitotic spindle; functions as a guanine-nucleotide exchange inhibitor (GDI) for Tem1p; involved in multiple cell cycle checkpoint pathways that control mitotic exit; required when telomeres are damaged, but not for all types of chromosomal DNA damage; phosphorylated by the Polo-like kinase Cdc5p +S000034983 CDS YJR053W 10 534027 535751 W 2011-02-03 1996-07-31 +S000003815 ORF Verified YJR054W KCH1 ERM6 chromosome 10 10 536056 537549 W 2011-02-03 1996-07-31 Potassium transporter that mediates K+ influx; activates high-affinity Ca2+ influx system (HACS) during mating pheromone response; expression up-regulated in response to alpha factor; localized to sites of polarized growth; member of a fungal-specific gene family; potential Cdc28p substrate; KCH1 has a paralog, PRM6, that arose from the whole genome duplication +S000035180 CDS YJR054W 10 536056 537549 W 2011-02-03 1996-07-31 +S000007033 long_terminal_repeat YJRCdelta16 YJLWdelta16 chromosome 10 10 538041 537741 C 2011-02-03 2000-05-19|2007-04-04 Ty1 LTR +S000007044 long_terminal_repeat YJRWdelta17 chromosome 10 10 538103 538434 W 2011-02-03 2000-05-19 Ty1 LTR +S000006707 tRNA_gene tR(CCU)J HSX1 chromosome 10 10 538555 538626 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; low abundance tRNA required for growth on nonfermentable carbon sources at high temperatures, for synthesis of heat shock protein Ssc1p, and for Ty1 retrotransposition through the regulation of translational frameshifting +S000032860 noncoding_exon tR(CCU)J 10 538555 538626 W 2011-02-03 2000-05-19 +S000003816 ORF Verified YJR055W HIT1 chromosome 10 L000000786 10 538772 539266 W 2011-02-03 1996-07-31 Protein involved in C/D snoRNP assembly; regulates abundance of Rsa1p; required for growth at high temperature; similar to human ZNHIT3 +S000036066 CDS YJR055W 10 538772 539266 W 2011-02-03 1996-07-31 +S000028455 ARS ARS1018 ARSX-540 chromosome 10 10 540546 540780 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000007045 long_terminal_repeat YJRWdelta18 chromosome 10 10 540766 541087 W 2011-02-03 2000-05-19 Ty1 LTR +S000007034 long_terminal_repeat YJRCdelta19 YJLWdelta19 chromosome 10 10 541427 541095 C 2011-02-03 2000-05-19|2007-04-04 Ty1 LTR +S000006539 tRNA_gene tD(GUC)J4 chromosome 10 L000003615 10 541508 541579 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030795 noncoding_exon tD(GUC)J4 10 541508 541579 W 2011-02-03 2000-05-19 +S000003817 ORF Verified YJR056C chromosome 10 10 542502 541792 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus; relative distribution to the nucleus increases upon DNA replication stress +S000036154 CDS YJR056C 10 542502 541792 C 2011-02-03 1996-07-31 +S000006782 tRNA_gene tY(GUA)J2 SUP4 chromosome 10 L000003617|L000002183 10 543044 542956 C 36 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000032087 intron tY(GUA)J2 10 543005 542992 C 2011-02-03 2000-05-19 +S000032086 noncoding_exon tY(GUA)J2 10 542991 542956 C 2011-02-03 2000-05-19 +S000032085 noncoding_exon tY(GUA)J2 10 543044 543006 C 2011-02-03 2000-05-19 +S000007046 long_terminal_repeat YJRWdelta20 chromosome 10 10 543448 543770 W 2011-02-03 2000-05-19 Ty1 LTR +S000003818 ORF Verified YJR057W CDC8 bifunctional thymidylate/uridylate kinase chromosome 10 L000000248 10 544062 544712 W 36 2011-02-03 1996-07-31 Thymidylate and uridylate kinase; functions in de novo biosynthesis of pyrimidine deoxyribonucleotides; converts dTMP to dTDP and dUMP to dUTP; essential for mitotic and meiotic DNA replication; homologous to S. pombe tmp1; human homolog DTYMK can complement yeast cdc8 null mutant +S000036320 CDS YJR057W 10 544062 544712 W 2011-02-03 1996-07-31 +S000003819 ORF Verified YJR058C APS2 YAP17 chromosome 10 L000002492 10 545175 544732 C 2011-02-03 1996-07-31 Small subunit of the clathrin-associated adaptor complex AP-2; AP-2 is involved in protein sorting at the plasma membrane; related to the sigma subunit of the mammalian plasma membrane clathrin-associated protein (AP-2) complex +S000036359 CDS YJR058C 10 545175 544732 C 2011-02-03 1996-07-31 +S000003820 ORF Verified YJR059W PTK2 protein kinase PTK2|STK2 chromosome 10 L000003492 10 545787 548243 W 2011-02-03 1996-07-31 Serine/threonine protein kinase; involved in regulation of ion transport across plasma membrane; carboxyl terminus is essential for glucose-dependent Pma1p activation via phosphorylation of Pma1p-Ser899; enhances spermine uptake; PTK2 has a paralog, PTK1, that arose from the whole genome duplication +S000030117 CDS YJR059W 10 545787 548243 W 2011-02-03 1996-07-31 +S000003821 ORF Verified YJR060W CBF1 GFII|CP1|CPF1|CEP1 chromosome 10 L000000311|L000000401 10 548759 549814 W 40 2011-02-03 1996-07-31 Basic helix-loop-helix (bHLH) protein; forms homodimer to bind E-box consensus sequence CACGTG present at MET gene promoters and centromere DNA element I (CDEI); affects nucleosome positioning at this motif; associates with other transcription factors such as Met4p and Isw1p to mediate transcriptional activation or repression; associates with kinetochore proteins, required for chromosome segregation; protein abundance increases in response to DNA replication stress +S000037892 CDS YJR060W 10 548759 549814 W 2011-02-03 1996-07-31 +S000003822 ORF Uncharacterized YJR061W chromosome 10 10 550511 553318 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; transcription repressed by Rm101p; YJR061W has a paralog, MNN4, that arose from the whole genome duplication +S000029930 CDS YJR061W 10 550511 553318 W 2011-02-03 1996-07-31 +S000003823 ORF Verified YJR062C NTA1 amidase|DEA1 chromosome 10 L000001279 10 554849 553476 C 2011-02-03 1996-07-31 Amidase; removes the amide group from N-terminal asparagine and glutamine residues to generate proteins with N-terminal aspartate and glutamate residues that are targets of ubiquitin-mediated degradation +S000029976 CDS YJR062C 10 554849 553476 C 2011-02-03 1996-07-31 +S000003824 ORF Verified YJR063W RPA12 DNA-directed RNA polymerase I core subunit RPA12|A12.2|RRN4 chromosome 10 L000001672 10 555195 555572 W 2011-02-03 1996-07-31 RNA polymerase I subunit A12.2; contains two zinc binding domains, and the N terminal domain is responsible for anchoring to the RNA pol I complex; physically interacts with transcriptional activator Msn4p, to regulate transcription of AYR1, a gene involved in lipid metabolism +S000031049 CDS YJR063W 10 555195 555572 W 2011-02-03 1996-07-31 +S000003825 ORF Verified YJR064W CCT5 chaperonin-containing T-complex subunit CCT5|TCP5 chromosome 10 L000002717 10 555914 557602 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo +S000031152 CDS YJR064W 10 555914 557602 W 2011-02-03 1996-07-31 +S000003826 ORF Verified YJR065C ARP3 actin-related protein 3|ACT4 chromosome 10 L000003198 10 559158 557809 C 2011-02-03 1996-07-31 Essential component of the Arp2/3 complex; Arp2/3 is a highly conserved actin nucleation center required for the motility and integrity of actin patches; involved in endocytosis and membrane growth and polarity +S000031207 CDS YJR065C 10 559158 557809 C 2011-02-03 1996-07-31 +S000003827 ORF Verified YJR066W TOR1 phosphatidylinositol kinase-related protein kinase TOR1|DRR1 chromosome 10 L000002322 10 559416 566828 W 44.84 2011-02-03 1996-07-31 PIK-related protein kinase and rapamycin target; subunit of TORC1, a complex that controls growth in response to nutrients by regulating translation, transcription, ribosome biogenesis, nutrient transport and autophagy; involved in meiosis; TOR1 has a paralog, TOR2, that arose from the whole genome duplication +S000032272 CDS YJR066W 10 559416 566828 W 2011-02-03 1996-07-31 +S000003828 ORF Verified YJR067C YAE1 chromosome 10 L000004159 10 567444 567019 C 2011-02-03 1996-07-31 Protein that forms a complex with Lto1p and Rli1p; essential for growth under standard (aerobic) conditions but not under anaerobic conditions; may have a role in protection of ribosomal assembly and function from damage due to reactive oxygen species +S000032323 CDS YJR067C 10 567444 567019 C 2011-02-03 1996-07-31 +S000003829 ORF Verified YJR068W RFC2 replication factor C subunit 2 chromosome 10 L000001623 10 567643 568704 W 2011-02-03 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); RF-C is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon +S000032475 CDS YJR068W 10 567643 568704 W 2011-02-03 1996-07-31 +S000003830 ORF Verified YJR069C HAM1 nucleoside triphosphate pyrophosphohydrolase HAM1 chromosome 10 L000003233 10 569399 568806 C 2011-02-03 1996-07-31 Nucleoside triphosphate pyrophosphohydrolase; active against various substrates including ITP, dITP and XTP; mediates exclusion of non canonical purines, pyrimidines from dNTP pools; functions with YJL055W to mediate resistance to 5-FU; specifically reduces the incorporation of 5-FU into RNA without affecting uptake or incorporation of uracil into RNA; protein abundance increases in response to DNA replication stress; yeast HAM1 can complement knockdown of human homolog ITPA +S000034432 CDS YJR069C 10 569399 568806 C 2011-02-03 1996-07-31 +S000003832 ORF Dubious YJR071W chromosome 10 10 570405 570773 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033295 CDS YJR071W 10 570405 570773 W 2011-02-03 1996-07-31 +S000003831 ORF Verified YJR070C LIA1 MMD1 chromosome 10 10 570598 569621 C 2011-02-03 1996-07-31 Deoxyhypusine hydroxylase; HEAT-repeat containing metalloenzyme that catalyzes hypusine formation; binds to and is required for the modification of Hyp2p (eIF5A); complements S. pombe mmd1 mutants defective in mitochondrial positioning; protein abundance increases in response to DNA replication stress +S000033205 CDS YJR070C 10 570598 569621 C 2011-02-03 1996-07-31 +S000003833 ORF Verified YJR072C NPA3 GTPase NPA3|GPN1|EPA1 chromosome 10 10 572124 570967 C 2011-02-03 1996-07-31 Member of the conserved GPN-loop GTPase family; has a role in transport of RNA polymerase II to the nucleus; exhibits GTP-dependent binding to PolII; has ATPase activity; involved in sister chromatid cohesion; phosphorylated by the Pcl1p-Pho85p kinase complex; human homolog XAB1 interacts with human RNA polymerase II; protein abundance increases in response to DNA replication stress +S000034114 CDS YJR072C 10 572124 570967 C 2011-02-03 1996-07-31 +S000003834 ORF Verified YJR073C OPI3 bifunctional phosphatidyl-N-methylethanolamine N-methyltransferase/phosphatidyl-N-dimethylethanolamine N-methyltransferase|PEM2 chromosome 10 L000001304 10 572935 572315 C 2011-02-03 1996-07-31 Methylene-fatty-acyl-phospholipid synthase; catalyzes the last two steps in phosphatidylcholine biosynthesis; also known as phospholipid methyltransferase +S000034233 CDS YJR073C 10 572935 572315 C 2011-02-03 1996-07-31 +S000003835 ORF Verified YJR074W MOG1 Ran GTPase-binding protein MOG1 chromosome 10 L000004615 10 573095 573751 W 2011-02-03 1996-07-31 Conserved nuclear protein that interacts with GTP-Gsp1p; stimulates nucleotide release from Gsp1p; involved in nuclear protein import; nucleotide release is inhibited by Yrb1p +S000034411 CDS YJR074W 10 573095 573751 W 2011-02-03 1996-07-31 +S000003836 ORF Verified YJR075W HOC1 alpha-1,6-mannosyltransferase chromosome 10 L000003274 10 573981 575171 W 2011-02-03 1996-07-31 Alpha-1,6-mannosyltransferase; involved in cell wall mannan biosynthesis; subunit of a Golgi-localized complex that also contains Anp1p, Mnn9p, Mnn11p, and Mnn10p; identified as a suppressor of a cell lysis sensitive pkc1-371 allele +S000035455 CDS YJR075W 10 573981 575171 W 2011-02-03 1996-07-31 +S000003837 ORF Verified YJR076C CDC11 septin CDC11|PSL9 chromosome 10 L000000251 10 576601 575354 C 54 2011-02-03 1996-07-31 Component of the septin ring that is required for cytokinesis; present at the ends of rod-like septin hetero-oligomers; C-terminal extension is important for recruitment of Bni5p to the mother-bud neck, which in turn is required for Myo1p recruitment and cytokinesis; septin rings at the mother-bud neck act as scaffolds for recruiting cell division factors and as barriers to prevent diffusion of specific proteins between mother and daughter cells +S000035494 CDS YJR076C 10 576601 575354 C 2011-02-03 1996-07-31 +S000003838 ORF Verified YJR077C MIR1 PTP chromosome 10 L000001114 10 578190 577255 C 2011-02-03 1996-07-31 Mitochondrial phosphate carrier; imports inorganic phosphate into mitochondria; functionally redundant with Pic2p but more abundant than Pic2p under normal conditions; phosphorylated +S000035596 CDS YJR077C 10 578190 577255 C 2011-02-03 1996-07-31 +S000003839 ORF Verified YJR078W BNA2 dioxygenase BNA2 chromosome 10 10 578860 580221 W 2011-02-03 1996-07-31 Tryptophan 2,3-dioxygenase or indoleamine 2,3-dioxygenase; required for de novo biosynthesis of NAD from tryptophan via kynurenine; interacts genetically with telomere capping gene CDC13; regulated by Hst1p and Aftp +S000036561 CDS YJR078W 10 578860 580221 W 2011-02-03 1996-07-31 +S000003840 ORF Uncharacterized YJR079W chromosome 10 10 580205 581239 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutation results in impaired mitochondrial respiration +S000036624 CDS YJR079W 10 580205 580347 W 2011-02-03 1996-07-31 +S000036625 CDS YJR079W 10 581053 581239 W 2011-02-03 1996-07-31 +S000036626 intron YJR079W 10 580348 581052 W 2011-02-03 1996-07-31 +S000003841 ORF Verified YJR080C AIM24 FMP26 chromosome 10 10 581616 580432 C 2011-02-03 1996-07-31 Protein with a role in determining mitochondrial architecture; inner membrane protein that interacts physically and genetically with the MICOS complex and is required for its integrity +S000037402 CDS YJR080C 10 581616 580432 C 2011-02-03 1996-07-31 +S000003842 ORF Verified YJR082C EAF6 chromosome 10 10 582255 581914 C 2011-02-03 1996-07-31 Subunit of the NuA4 acetyltransferase complex; this complex acetylates histone H4 and NuA3 acetyltransferase complex that acetylates histone H3 +S000030287 CDS YJR082C 10 582255 581914 C 2011-02-03 1996-07-31 +S000003843 ORF Verified YJR083C ACF4 chromosome 10 10 583537 582608 C 2011-02-03 1996-07-31 Protein of unknown function; computational analysis of large-scale protein-protein interaction data suggests a possible role in actin cytoskeleton organization; potential Cdc28p substrate +S000030434 CDS YJR083C 10 583537 582608 C 2011-02-03 1996-07-31 +S000003844 ORF Verified YJR084W CSN12 chromosome 10 S000007581 10 583733 585004 W 2011-02-03 1996-07-31 Protein that forms a complex with Thp3p; may have a role in transcription elongation and/or mRNA splicing; identified as a COP9 signalosome component but phenotype and interactions suggest it may not be involved with the signalosome +S000031409 CDS YJR084W 10 583733 585004 W 2011-02-03 1996-07-31 +S000003845 ORF Verified YJR085C chromosome 10 10 585437 585120 C 2011-02-03 1996-07-31 Protein of unknown function; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress +S000031477 CDS YJR085C 10 585437 585120 C 2011-02-03 1996-07-31 +S000003846 ORF Verified YJR086W STE18 chromosome 10 L000002122 10 586068 586400 W 59 2011-02-03 1996-07-31 G protein gamma subunit; forms a dimer with Ste4p to activate the mating signaling pathway, forms a heterotrimer with Gpa1p and Ste4p to dampen signaling; C-terminus is palmitoylated and farnesylated, which are required for normal signaling +S000031665 CDS YJR086W 10 586068 586400 W 2011-02-03 1996-07-31 +S000003847 ORF Dubious YJR087W chromosome 10 10 586400 586750 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified genes STE18 and ECM2 +S000032646 CDS YJR087W 10 586400 586750 W 2011-02-03 1996-07-31 +S000003848 ORF Verified YJR088C EMC2 chromosome 10 10 587373 586495 C 2011-02-03 1996-07-31 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; homologous to worm Y57G7A.10/EMC-2, fly CG17556, human TTC35 +S000032686 CDS YJR088C 10 587373 586495 C 2011-02-03 1996-07-31 +S000003849 ORF Verified YJR089W BIR1 chromosome 10 L000004754 10 587718 590582 W 2011-02-03 1996-07-31 Subunit of chromosomal passenger complex (CPC); CPC is comprised of Ipl1p-Sli15p-Bir1p-Nbl1p and regulates chromosome segregation; required for chromosome bi-orientation and for spindle assembly checkpoint activation upon reduced sister kinetochore tension; relative distribution to shortened microtubules increases upon DNA replication stress; sumoylated in an Mms21p-dependent manner; human survivin homolog +S000032816 CDS YJR089W 10 587718 590582 W 2011-02-03 1996-07-31 +S000003850 ORF Verified YJR090C GRR1 SCF ubiquitin ligase complex subunit GRR1|SDC1|SSU2|COT2|CAT80 chromosome 10 L000000730 10 594327 590872 C 60 2011-02-03 1996-07-31 F-box protein component of an SCF ubiquitin-ligase complex; modular substrate specificity factor which associates with core SCF (Cdc53p, Skp1p and Hrt1p/Rbx1p) to form the SCF(Grr1) complex; SCF(Grr1) acts as a ubiquitin-protein ligase directing ubiquitination of substrates such as: Gic2p, Mks1p, Mth1p, Cln1p, Cln2p and Cln3p; involved in carbon catabolite repression, glucose-dependent divalent cation transport, glucose transport, morphogenesis, and sulfite detoxification +S000032905 CDS YJR090C 10 594327 590872 C 2011-02-03 1996-07-31 +S000003851 ORF Verified YJR091C JSN1 PUF1 chromosome 10 L000002964 10 598336 595061 C 2011-02-03 1996-07-31 Member of the Puf family of RNA-binding proteins; interacts with mRNAs encoding membrane-associated proteins; involved in localizing the Arp2/3 complex to mitochondria; overexpression causes increased sensitivity to benomyl; JSN1 has a paralog, PUF2, that arose from the whole genome duplication +S000033011 CDS YJR091C 10 598336 595061 C 2011-02-03 1996-07-31 +S000003852 ORF Verified YJR092W BUD4 chromosome 10 L000000201 10 598735 603078 W 2011-02-03 2004-04-20|1996-07-31|1997-07-27|2008-06-04 Anillin-like protein involved in bud-site selection; required for the axial budding pattern; required for the formation and disassembly of the double septin ring structure, and generally for septin organization; functions as a platform linking the cytokinesis tag septins to the axial landmark through its multiple domains; in vivo substrate of Cdc28p/Clb2p +S000033797 CDS YJR092W 10 598735 603078 W 2011-02-03 2004-04-20|1996-07-31|1997-07-27|2008-06-04 +S000003853 ORF Verified YJR093C FIP1 cleavage polyadenylation factor subunit FIP1 chromosome 10 L000002775 10 604203 603220 C 2011-02-03 1996-07-31 Subunit of cleavage polyadenylation factor (CPF); interacts directly with poly(A) polymerase (Pap1p) to regulate its activity; bridging factor that links Pap1p and the CPF complex via Yth1p +S000033863 CDS YJR093C 10 604203 603220 C 2011-02-03 1996-07-31 +S000003854 ORF Verified YJR094C IME1 transcription factor IME1 chromosome 10 L000000861 10 605651 604569 C 2011-02-03 1996-07-31 Master regulator of meiosis that is active only during meiotic events; activates transcription of early meiotic genes through interaction with Ume6p; degraded by the 26S proteasome following phosphorylation by Ime2p; transcription is negatively regulated in cis by the IRT1 long noncoding antisense RNA +S000034019 CDS YJR094C 10 605651 604569 C 2011-02-03 1996-07-31 +S000178119 ncRNA_gene IRT1 IRT1 SUT643 chromosome 10 10 607424 605936 C 2014-11-18 2014-11-18 Long noncoding RNA that governs mating-type control of gametogenesis; located in the IME1 promoter; in haploids, expression of IME1, the central inducer of gametogenesis, is inhibited in cis by transcription of IRT1, which recruits the Set2p histone methyltransferase and the Set3p histone deacetylase complex to establish repressive chromatin at the IME1 promoter +S000178120 noncoding_exon IRT1 10 607424 605936 C 2014-11-18 2014-11-18 +S000003855 ORF Verified YJR094W-A RPL43B eL43|ribosomal 60S subunit protein L43B|L43e|L43B chromosome 10 L000004470 10 608305 608858 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L43B; homologous to mammalian ribosomal protein L37A, no bacterial homolog; RPL43B has a paralog, RPL43A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000034757 CDS YJR094W-A 10 608305 608306 W 2011-02-03 1996-07-31 +S000034758 CDS YJR094W-A 10 608582 608858 W 2011-02-03 1996-07-31 +S000034759 intron YJR094W-A 10 608307 608581 W 2011-02-03 1996-07-31 +S000003856 ORF Verified YJR095W SFC1 ACR1 chromosome 10 L000000023 10 609773 610741 W 2011-02-03 1996-07-31 Mitochondrial succinate-fumarate transporter; transports succinate into and fumarate out of the mitochondrion; required for ethanol and acetate utilization +S000034990 CDS YJR095W 10 609773 610741 W 2011-02-03 1996-07-31 +S000003857 ORF Verified YJR096W aldo-keto reductase superfamily protein chromosome 10 10 611195 612043 W 2011-02-03 1996-07-31 Xylose and arabinose reductase; member of the aldo-keto reductase (AKR) family; GFP-fusion protein is induced in response to the DNA-damaging agent MMS +S000035147 CDS YJR096W 10 611195 612043 W 2011-02-03 1996-07-31 +S000003858 ORF Verified YJR097W JJJ3 DPH4 chromosome 10 10 612413 612931 W 2011-02-03 1996-07-31 Protein of unknown function; contains a CSL Zn finger and a DnaJ-domain; involved in diphthamide biosynthesis; ortholog human Dph4 +S000035313 CDS YJR097W 10 612413 612931 W 2011-02-03 1996-07-31 +S000028456 ARS ARS1019 chromosome 10 10 612846 613278 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000003859 ORF Uncharacterized YJR098C chromosome 10 10 615156 613186 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000036139 CDS YJR098C 10 615156 613186 C 2011-02-03 1996-07-31|2011-02-03 +S000003860 ORF Verified YJR099W YUH1 ubiquitin-specific protease YUH1 chromosome 10 L000002565 10 615576 616286 W 57 2011-02-03 1996-07-31 Ubiquitin C-terminal hydrolase; cleaves ubiquitin-protein fusions to generate monomeric ubiquitin; hydrolyzes the peptide bond at the C-terminus of ubiquitin; also the major processing enzyme for the ubiquitin-like protein Rub1p +S000036337 CDS YJR099W 10 615576 616286 W 2011-02-03 1996-07-31 +S000003861 ORF Verified YJR100C AIM25 SLM35 chromosome 10 10 617334 616351 C 2011-02-03 1996-07-31 Mitochondria protein of unknown function; interacts genetically with TOR1 to regulate chronological lifespan, and the response to both heat shock and oxidative stress; involved in maintaining the integrity of the mitochondrial network; negative regulator of mitophagy flux; non-tagged protein is detected in purified mitochondria in high-throughput studies; null mutant is viable and displays an elevated frequency of mitochondrial genome loss; similar to murine NOR1 +S000033573 CDS YJR100C 10 617334 616351 C 2011-02-03 1996-07-31 +S000006654 tRNA_gene tL(UAG)J chromosome 10 L000003616 10 617919 618019 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000035855 intron tL(UAG)J 10 617957 617975 W 2011-02-03 2000-05-19 +S000035853 noncoding_exon tL(UAG)J 10 617919 617956 W 2011-02-03 2000-05-19 +S000035854 noncoding_exon tL(UAG)J 10 617976 618019 W 2011-02-03 2000-05-19 +S000003862 ORF Verified YJR101W RSM26 mitochondrial 37S ribosomal protein RSM26 chromosome 10 10 618234 619034 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000034505 CDS YJR101W 10 618234 619034 W 2011-02-03 1996-07-31 +S000003863 ORF Verified YJR102C VPS25 ESCRT-II subunit protein VPS25|VPL12|VPT25 chromosome 10 10 619765 619157 C 2011-02-03 1996-07-31 Component of the ESCRT-II complex; ESCRT-II is involved in ubiquitin-dependent sorting of proteins into the endosome +S000034557 CDS YJR102C 10 619765 619157 C 2011-02-03 1996-07-31 +S000003864 ORF Verified YJR103W URA8 CTP synthase URA8 chromosome 10 L000002437 10 620754 622490 W 2011-02-03 1996-07-31|2011-02-03 Minor CTP synthase isozyme (see also URA7); catalyzes the ATP-dependent transfer of the amide nitrogen from glutamine to UTP, forming CTP, the final step in de novo biosynthesis of pyrimidines; involved in phospholipid biosynthesis; capable of forming cytoplasmic filaments termed cytoophidium, especially during conditions of glucose depletion; URA8 has a paralog, URA7, that arose from the whole genome duplication +S000034718 CDS YJR103W 10 620754 622490 W 2011-02-03 1996-07-31|2011-02-03 +S000003865 ORF Verified YJR104C SOD1 superoxide dismutase SOD1|CRS4 chromosome 10 L000001978 10 623014 622550 C 2011-02-03 1996-07-31 Cytosolic copper-zinc superoxide dismutase; detoxifies superoxide; stabilizes Yck1p and Yck2p kinases in glucose to repress respiration; phosphorylated by Dun1p, enters nucleus under oxidative stress to promote transcription of stress response genes; human ortholog SOD1 implicated in ALS complements a null allele; abundance increases under DNA replication stress and during exposure to boric acid; localization to mitochondrial intermembrane space is modulated by MICOS complex +S000035647 CDS YJR104C 10 623014 622550 C 2011-02-03 1996-07-31 +S000003866 ORF Verified YJR105W ADO1 adenosine kinase chromosome 10 10 623581 624603 W 2011-02-03 1996-07-31 Adenosine kinase; required for the utilization of S-adenosylmethionine (AdoMet); may be involved in recycling adenosine produced through the methyl cycle +S000035831 CDS YJR105W 10 623581 624603 W 2011-02-03 1996-07-31 +S000003867 ORF Verified YJR106W ECM27 chromosome 10 L000003898 10 624838 627015 W 2011-02-03 1996-07-31|2011-02-03 Protein involved in calcium homeostasis and exit from quiescence; required for proper trehalose levels during quiescence; may play a role in cell wall biosynthesis, mutants are hypersensitive to antifungal, Papulacandin B; null mutants have increased plasmid loss; interacts with Pdr5p +S000035951 CDS YJR106W 10 624838 627015 W 2011-02-03 1996-07-31|2011-02-03 +S000003868 ORF Uncharacterized YJR107W LIH1 putative lipase chromosome 10 10 627340 628326 W 2011-02-03 1996-07-31|2011-02-03 Putative lipase +S000037815 CDS YJR107W 10 627340 628326 W 2011-02-03 1996-07-31|2011-02-03 +S000003869 ORF Verified YJR108W ABM1 chromosome 10 10 628712 629083 W 2011-02-03 1996-07-31 Protein of unknown function; required for normal microtubule organization +S000037909 CDS YJR108W 10 628712 629083 W 2011-02-03 1996-07-31 +S000003870 ORF Verified YJR109C CPA2 carbamoyl-phosphate synthase (glutamine-hydrolyzing) CPA2 chromosome 10 L000000400 10 632941 629585 C 2011-02-03 1996-07-31 Large subunit of carbamoyl phosphate synthetase; carbamoyl phosphate synthetase catalyzes a step in the synthesis of citrulline, an arginine precursor +S000029885 CDS YJR109C 10 632941 629585 C 2011-02-03 1996-07-31 +S000003871 ORF Verified YJR110W YMR1 phosphatidylinositol-3-phosphatase YMR1 chromosome 10 10 633615 635681 W 2011-02-03 1996-07-31 Phosphatidylinositol 3-phosphate (PI3P) phosphatase; involved in various protein sorting pathways, including CVT targeting and endosome to vacuole transport; has similarity to the conserved myotubularin dual specificity phosphatase family +S000037677 CDS YJR110W 10 633615 635681 W 2011-02-03 1996-07-31 +S000003872 ORF Verified YJR111C PXP2 chromosome 10 10 636706 635855 C 2011-02-03 1996-07-31 Peroxisomal matrix protein with naturally active promoter; well-conserved in fungi; localized to peroxisomes under physiological growth conditions; levels of some amino acids are altered upon both knockout and overexpression, suggesting potential involvement of Pxp2p in amino acid metabolism or related cellular metabolic processes (needs further study); GFP-fusion protein displays inherent dual localization with large proportion localizing to cytosol +S000037709 CDS YJR111C 10 636706 635855 C 2011-02-03 1996-07-31 +S000003873 ORF Verified YJR112W NNF1 MIND complex subunit NNF1 chromosome 10 L000003072 10 637030 637635 W 2011-02-03 1996-07-31 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; required for accurate chromosome segregation; complex consists of Mtw1p Including Nnf1p-Nsl1p-Dsn1p (MIND) +S000037783 CDS YJR112W 10 637030 637635 W 2011-02-03 1996-07-31 +S000028513 ORF Uncharacterized YJR112W-A chromosome 10 10 637790 638168 W 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; identified based on homology to Ashbya gossypii +S000030277 CDS YJR112W-A 10 637790 637809 W 2011-02-03 2003-07-29 +S000030278 CDS YJR112W-A 10 637859 638168 W 2011-02-03 2003-07-29 +S000030279 intron YJR112W-A 10 637810 637858 W 2011-02-03 2003-07-29 +S000003875 ORF Dubious YJR114W SRF2 chromosome 10 10 638659 639051 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RSM7/YJR113C +S000030784 CDS YJR114W 10 638659 639051 W 2011-02-03 1996-07-31 +S000003874 ORF Verified YJR113C RSM7 mitochondrial 37S ribosomal protein RSM7 chromosome 10 10 638975 638232 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S7 ribosomal protein +S000030623 CDS YJR113C 10 638975 638232 C 2011-02-03 1996-07-31 +S000003876 ORF Uncharacterized YJR115W chromosome 10 10 639942 640451 W 2011-02-03 1996-07-31 Putative protein of unknown function; YJR115W has a paralog, ECM13, that arose from the whole genome duplication +S000030893 CDS YJR115W 10 639942 640451 W 2011-02-03 1996-07-31 +S000003877 ORF Uncharacterized YJR116W TDA4 chromosome 10 10 640825 641664 W 2011-02-03 1996-07-31 Putative protein of unknown function; null mutant is sensitive to expression of the top1-T722A allele +S000031858 CDS YJR116W 10 640825 641664 W 2011-02-03 1996-07-31 +S000003878 ORF Verified YJR117W STE24 zinc metalloprotease|PIO2|AFC1 chromosome 10 L000003457 10 642007 643368 W 2011-02-03 1996-07-31 Highly conserved zinc metalloprotease; functions in two steps of a-factor maturation, C-terminal CAAX proteolysis and the first step of N-terminal proteolytic processing; cleaves both isoprenylated and non-prenylated oligopeptides; contains multiple transmembrane spans; human homolog ZMPSTE24 implicated in mandibuloacral dysplasia (MAD), and can complement yeast null mutant +S000032024 CDS YJR117W 10 642007 643368 W 2011-02-03 1996-07-31 +S000003879 ORF Verified YJR118C ILM1 chromosome 10 10 644101 643490 C 2011-02-03 1996-07-31 Protein of unknown function; may be involved in mitochondrial DNA maintenance; required for slowed DNA synthesis-induced filamentous growth +S000032105 CDS YJR118C 10 644101 643490 C 2011-02-03 1996-07-31 +S000003880 ORF Verified YJR119C JHD2 histone demethylase|KDM5 chromosome 10 10 646490 644304 C 2011-02-03 1996-07-31 JmjC domain family histone demethylase; promotes global demethylation of H3K4 and repression of noncoding intergenic transcription during sporulation; removes methyl groups added by Set1p methyltransferase; negatively regulated by H3K14 acetylation; protein levels regulated by Not4p polyubiquitin-mediated degradation; regulates sporulation timing by extending period of active transcription in opposition to programmed global transcriptional quiescence; regulates rDNA silencing +S000034072 CDS YJR119C 10 646490 644304 C 2011-02-03 1996-07-31 +S000003881 ORF Verified YJR120W chromosome 10 10 647126 647476 W 2011-02-03 1996-07-31 Protein of unknown function; essential for growth under anaerobic conditions; mutation causes decreased expression of ATP2, impaired respiration, defective sterol uptake, and altered levels/localization of ABC transporters Aus1p and Pdr11p +S000032979 CDS YJR120W 10 647126 647476 W 2011-02-03 1996-07-31 +S000003882 ORF Verified YJR121W ATP2 F1F0 ATP synthase subunit beta chromosome 10 L000000142 10 647607 649142 W 2011-02-03 1996-07-31 Beta subunit of the F1 sector of mitochondrial F1F0 ATP synthase; which is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated +S000033071 CDS YJR121W 10 647607 649142 W 2011-02-03 1996-07-31 +S000003883 ORF Verified YJR122W IBA57 CAF17 chromosome 10 L000003419 10 649776 651269 W 2011-02-03 1996-07-31 Protein involved in incorporating iron-sulfur clusters into proteins; mitochondrial matrix protein; involved in the incorporation of iron-sulfur clusters into mitochondrial aconitase-type proteins; activates the radical-SAM family members Bio2p and Lip5p; interacts with Ccr4p in the two-hybrid system +S000033750 CDS YJR122W 10 649776 651269 W 2011-02-03 1996-07-31 +S000003884 ORF Verified YJR123W RPS5 uS7|ribosomal 40S subunit protein S5|S7|rp14|YS8|S5|S2 chromosome 10 L000002821 10 651901 652578 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; least basic of non-acidic ribosomal proteins; phosphorylated in vivo; essential for viability; homologous to mammalian ribosomal protein S5 and bacterial S7 +S000033852 CDS YJR123W 10 651901 652578 W 2011-02-03 1996-07-31 +S000003885 ORF Uncharacterized YJR124C chromosome 10 10 654238 652892 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression induced under calcium shortage +S000033876 CDS YJR124C 10 654238 652892 C 2011-02-03 1996-07-31 +S000028457 ARS ARS1020 ARSX-654 chromosome 10 10 654375 654614 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000003886 ORF Verified YJR125C ENT3 chromosome 10 10 655963 654737 C 2011-02-03 1996-07-31 Protein containing an N-terminal epsin-like domain; involved in clathrin recruitment and traffic between the Golgi and endosomes; associates with the clathrin adaptor Gga2p +S000034017 CDS YJR125C 10 655963 654737 C 2011-02-03 1996-07-31 +S000003887 ORF Verified YJR126C VPS70 putative zinc metalloprotease chromosome 10 10 658689 656254 C 2011-02-03 1996-07-31 Protein of unknown function involved in vacuolar protein sorting; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000034920 CDS YJR126C 10 658689 656254 C 2011-02-03 1996-07-31 +S000003889 ORF Dubious YJR128W chromosome 10 10 662921 663280 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RSF2 +S000036069 CDS YJR128W 10 662921 663280 W 2011-02-03 1996-07-31 +S000003888 ORF Verified YJR127C RSF2 ZMS1 chromosome 10 L000002569 10 663059 658917 C 2011-02-03 1996-07-31 Zinc-finger protein; involved in transcriptional control of both nuclear and mitochondrial genes, many of which specify products required for glycerol-based growth, respiration, and other functions; RSF2 has a paralog, TDA9, that arose from the whole genome duplication; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000035071 CDS YJR127C 10 663059 658917 C 2011-02-03 1996-07-31 +S000006492 snoRNA_gene snR3 SNR3 chromosome 10 L000001958 10 663749 663942 W 2011-02-03 2000-05-19|2007-05-08 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U2129, U2133, and U2264 +S000034301 noncoding_exon snR3 10 663749 663942 W 2011-02-03 2000-05-19|2007-05-08 +S000003890 ORF Verified YJR129C EFM3 protein-lysine N-methyltransferase chromosome 10 10 665019 664000 C 2011-02-03 1996-07-31|2011-02-03 S-adenosylmethionine-dependent methyltransferase; seven-beta-strand lysine methyltransferase which trimethylates translation elongation factor EF2 (Eft1p and Eft2p) at lysine 509; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; ortholog of human gene FAM86A +S000036155 CDS YJR129C 10 665019 664000 C 2011-02-03 1996-07-31|2011-02-03 +S000003891 ORF Verified YJR130C STR2 cystathionine gamma-synthase chromosome 10 10 667137 665218 C 2011-02-03 1996-07-31 Cystathionine gamma-synthase, converts cysteine into cystathionine; STR2 has a paralog, YML082W, that arose from the whole genome duplication +S000036945 CDS YJR130C 10 667137 665218 C 2011-02-03 1996-07-31 +S000003892 ORF Verified YJR131W MNS1 mannosyl-oligosaccharide 1,2-alpha-mannosidase chromosome 10 L000001130 10 667644 669293 W 2011-02-03 1996-07-31 Alpha-1,2-mannosidase; involved in ER-associated protein degradation (ERAD); catalyzes the removal of one mannose residue from a glycosylated protein, converting the modification from Man9GlcNAc to Man8GlcNAc; catalyzes the last step in glycoprotein maturation in the ER and is critical for ER protein degradation +S000037068 CDS YJR131W 10 667644 669293 W 2011-02-03 1996-07-31 +S000003893 ORF Verified YJR132W NMD5 KAP119 chromosome 10 L000002939 10 669522 672668 W 2011-02-03 1996-07-31|2011-02-03 Karyopherin; a carrier protein involved in nuclear import of proteins; importin beta homolog +S000037153 CDS YJR132W 10 669522 672668 W 2011-02-03 1996-07-31|2011-02-03 +S000003894 ORF Verified YJR133W XPT1 xanthine phosphoribosyltransferase chromosome 10 10 672991 673620 W 2011-02-03 1996-07-31 Xanthine-guanine phosphoribosyl transferase; required for xanthine utilization and for optimal utilization of guanine +S000037899 CDS YJR133W 10 672991 673620 W 2011-02-03 1996-07-31 +S000003895 ORF Verified YJR134C SGM1 chromosome 10 10 675852 673729 C 2011-02-03 1996-07-31 Protein of unknown function; required for wild-type growth rate on galactose and mannose; localizes to COPI coated vesicles and the Golgi apparatus +S000029858 CDS YJR134C 10 675852 673729 C 2011-02-03 1996-07-31 +S000003896 ORF Verified YJR135C MCM22 chromosome 10 L000003999 10 676778 676059 C 2011-02-03 1996-07-31 Outer kinetochore protein and component of the Ctf3 subcomplex; binds to centromeric DNA in a Ctf19p-dependent manner; involved in chromosome segregation and minichromosome maintenance; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-K and fission yeast sim4 +S000030000 CDS YJR135C 10 676778 676059 C 2011-02-03 1996-07-31 +S000007348 ORF Verified YJR135W-A TIM8 protein transporter TIM8 chromosome 10 10 676971 677234 W 2011-02-03 1999-07-17 Mitochondrial intermembrane space protein; forms a complex with Tim13p that delivers a subset of hydrophobic proteins to the TIM22 complex for inner membrane insertion; homolog of human TIMM8A, implicated in Mohr-Tranebjaerg syndrome, also known as deafness-dystonia-optic neuronopathy (DDON) syndrome; human TIMM8A can complement yeast null mutant +S000032075 CDS YJR135W-A 10 676971 677234 W 2011-02-03 1999-07-17 +S000003897 ORF Verified YJR136C TTI2 chromosome 10 10 678706 677441 C 2011-02-03 1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; telomere length regulator involved in the stability or biogenesis of PIKKs such as TORC1; involved in the cellular stress response; similar to S. pombe Tti2p; may interact with Rsm23p; GFP-fusion protein localizes to the cytoplasm +S000030982 CDS YJR136C 10 678706 677441 C 2011-02-03 1996-07-31 +S000003898 ORF Verified YJR137C MET5 sulfite reductase (NADPH) subunit beta|ECM17 chromosome 10 L000001080|L000003892 10 683285 678957 C 84 2011-02-03 1996-07-31 Sulfite reductase beta subunit; involved in amino acid biosynthesis, transcription repressed by methionine +S000031082 CDS YJR137C 10 683285 678957 C 2011-02-03 1996-07-31 +S000007553 ARS ARS1021 ARS121 chromosome 10 10 684009 684098 2014-11-18 2000-10-17|2014-11-18 Autonomously Replicating Sequence +S000003899 ORF Verified YJR138W IML1 SEA1 chromosome 10 10 684567 689321 W 2011-02-03 1996-07-31|2011-02-03 GTPase-activating protein (GAP) subunit of the Iml1p/SEACIT complex; SEACIT (Iml1p-Npr2p-Npr3p) is a subcomplex of the SEA complex, a coatomer-related complex that associates dynamically with the vacuole; Iml1p functions in the SEACIT complex as a GAP for the Rag family GTPase Gtr1p (EGOC subunit), resulting in the inhibition of TORC1 signaling in response to amino acid deprivation; the Iml1p/SEACIT complex is required for non-nitrogen-starvation (NNS)-induced autophagy +S000031284 CDS YJR138W 10 684567 689321 W 2011-02-03 1996-07-31|2011-02-03 +S000003900 ORF Verified YJR139C HOM6 homoserine dehydrogenase|THR6 chromosome 10 L000000801 10 690524 689445 C 87 2011-02-03 1996-07-31 Homoserine dehydrogenase (L-homoserine:NADP oxidoreductase); dimeric enzyme that catalyzes the third step in the common pathway for methionine and threonine biosynthesis; enzyme has nucleotide-binding, dimerization and catalytic regions +S000032214 CDS YJR139C 10 690524 689445 C 2011-02-03 1996-07-31 +S000028666 ORF Dubious YJR140W-A chromosome 10 10 690961 691110 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene HIR3; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032491 CDS YJR140W-A 10 690961 691110 W 2011-02-03 2003-07-29 +S000003901 ORF Verified YJR140C HIR3 HPC1 chromosome 10 L000003127 10 695696 690750 C 2011-02-03 1996-07-31 Subunit of the HIR complex; a nucleosome assembly complex involved in regulation of histone gene transcription; involved in position-dependent gene silencing and nucleosome reassembly; ortholog of human CABIN1 protein +S000032216 CDS YJR140C 10 695696 690750 C 2011-02-03 1996-07-31 +S000003902 ORF Uncharacterized YJR141W IPA1 putative polyadenylation protein chromosome 10 10 695906 696949 W 2011-02-03 1996-07-31 Essential protein of unknown function +S000033127 CDS YJR141W 10 695906 696949 W 2011-02-03 1996-07-31 +S000003903 ORF Verified YJR142W chromosome 10 10 697141 698169 W 2011-02-03 1996-07-31 8-oxo-dGTP diphosphatase of the Nudix hydrolase family; converts diphosphates of damaged forms of thiamin to monophosphates; GST fusion protein is a Dbf2p-Mob1p phosphorylation target in a proteome chip analysis; synthetic lethal with PH085 deletion; plays a role in restricting Ty1 transposition +S000033186 CDS YJR142W 10 697141 698169 W 2011-02-03 1996-07-31 +S000003904 ORF Verified YJR143C PMT4 dolichyl-phosphate-mannose-protein mannosyltransferase chromosome 10 L000002623 10 700614 698326 C 2011-02-03 1996-07-31 Protein O-mannosyltransferase; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; appears to form homodimers in vivo and does not complex with other Pmt proteins; target for new antifungals +S000033214 CDS YJR143C 10 700614 698326 C 2011-02-03 1996-07-31 +S000003905 ORF Verified YJR144W MGM101 MGM9 chromosome 10 L000001104 10 700882 701691 W 2011-02-03 1996-07-31 Protein with a role in mitochondrial DNA recombinational repair; also involved in interstrand cross-link repair; binds to and catalyzes the annealing of single-stranded mtDNA; oligomerizes to form rings and filaments; related to Rad52-type recombination proteins, with limited overall similarity but sharing conserved functionally important residues; component of the mitochondrial nucleoid, required for the repair of oxidative mtDNA damage and mitochondrial genome maintenance +S000033297 CDS YJR144W 10 700882 701691 W 2011-02-03 1996-07-31 +S000003906 ORF Verified YJR145C RPS4A eS4|ribosomal 40S subunit protein S4A|S4e|rp5|YS6|S7A|S4A chromosome 10 L000001751 10 703068 702027 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; mutation affects 20S pre-rRNA processing; homologous to mammalian ribosomal protein S4, no bacterial homolog; RPS4A has a paralog, RPS4B, that arose from the whole genome duplication +S000034116 CDS YJR145C 10 702798 702027 C 2011-02-03 1996-07-31 +S000034115 CDS YJR145C 10 703068 703055 C 2011-02-03 1996-07-31 +S000034117 intron YJR145C 10 703054 702799 C 2011-02-03 1996-07-31 +S000003907 ORF Uncharacterized YJR146W chromosome 10 10 703885 704238 W 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; partially overlaps HMS2 +S000034307 CDS YJR146W 10 703885 704238 W 2011-02-03 1996-07-31 +S000003908 ORF Verified YJR147W HMS2 chromosome 10 L000004442 10 704196 705272 W 2011-02-03 1996-07-31 Protein with similarity to heat shock transcription factors; overexpression suppresses the pseudohyphal filamentation defect of a diploid mep1 mep2 homozygous null mutant; HMS2 has a paralog, SKN7, that arose from the whole genome duplication +S000034417 CDS YJR147W 10 704196 705272 W 2011-02-03 1996-07-31 +S000003909 ORF Verified YJR148W BAT2 branched-chain-amino-acid transaminase BAT2|ECA40|TWT2 chromosome 10 L000003082 10 705744 706874 W 2011-02-03 1996-07-31 Cytosolic branched-chain amino acid (BCAA) aminotransferase; preferentially involved in BCAA catabolism; homolog of murine ECA39; highly expressed during stationary phase and repressed during logarithmic phase; BAT2 has a paralog, BAT1, that arose from the whole genome duplication +S000035457 CDS YJR148W 10 705744 706874 W 2011-02-03 1996-07-31 +S000003910 ORF Uncharacterized YJR149W putative nitronate monooxygenase chromosome 10 10 707160 708374 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000035545 CDS YJR149W 10 707160 708374 W 2011-02-03 1996-07-31|2011-02-03 +S000003911 ORF Verified YJR150C DAN1 CCW13 chromosome 10 L000003381 10 709707 708811 C 2011-02-03 1996-07-31|2011-02-03 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; expressed under anaerobic conditions, completely repressed during aerobic growth +S000036513 CDS YJR150C 10 709707 708811 C 2011-02-03 1996-07-31|2011-02-03 +S000028458 ARS ARS1022 ARSX-712 chromosome 10 10 711896 712142 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000003912 ORF Verified YJR151C DAN4 chromosome 10 10 715740 712255 C 2011-02-03 1996-07-31|2011-02-03 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; expressed under anaerobic conditions, completely repressed during aerobic growth +S000036600 CDS YJR151C 10 715740 712255 C 2011-02-03 1996-07-31|2011-02-03 +S000028557 ORF Uncharacterized YJR151W-A chromosome 10 10 717580 717630 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR; predicted to have a role in transcription based on computational "guilt by association" analysis +S000031243 CDS YJR151W-A 10 717580 717630 W 2011-02-03 2003-07-29 +S000003913 ORF Verified YJR152W DAL5 allantoate permease|UREP1 chromosome 10 L000000478 10 719666 721297 W 97 2011-02-03 1996-07-31 Allantoate permease; ureidosuccinate permease; also transports dipeptides, though with lower affinity than for allantoate and ureidosuccinate; expression is constitutive but sensitive to nitrogen catabolite repression +S000037362 CDS YJR152W 10 719666 721297 W 2011-02-03 1996-07-31 +S000003914 ORF Verified YJR153W PGU1 PSM1|PGL1 chromosome 10 L000004371|L000004261 10 722815 723900 W 2011-02-03 1996-07-31 Endo-polygalacturonase; pectolytic enzyme that hydrolyzes the alpha-1,4-glycosidic bonds in the rhamnogalacturonan chains in pectins +S000037481 CDS YJR153W 10 722815 723900 W 2011-02-03 1996-07-31 +S000003915 ORF Uncharacterized YJR154W chromosome 10 10 725784 726824 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000030205 CDS YJR154W 10 725784 726824 W 2011-02-03 1996-07-31 +S000003916 ORF Verified YJR155W AAD10 putative aryl-alcohol dehydrogenase chromosome 10 L000004639 10 727405 728271 W 2011-02-03 1996-07-31 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family +S000030387 CDS YJR155W 10 727405 728271 W 2011-02-03 1996-07-31 +S000003917 ORF Verified YJR156C THI11 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 10 L000003222 10 729596 728574 C 2011-02-03 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP +S000030438 CDS YJR156C 10 729596 728574 C 2011-02-03 1996-07-31 +S000028459 ARS ARS1023 chromosome 10 10 729983 730513 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000003918 ORF Dubious YJR157W chromosome 10 10 730515 730877 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031435 CDS YJR157W 10 730515 730877 W 2011-02-03 1996-07-31 +S000003919 ORF Verified YJR158W HXT16 HLT3|hexose transporter HXT16 chromosome 10 L000003264 10 732440 734143 W 2011-02-03 1996-07-31 Putative transmembrane polyol transporter; supports growth on and uptake of sorbitol with moderate affinity and mannitol with lower affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; similarity to hexose transporters; expression is repressed by high levels of glucose +S000031532 CDS YJR158W 10 732440 734143 W 2011-02-03 1996-07-31 +S000003920 ORF Verified YJR159W SOR1 L-iditol 2-dehydrogenase SOR1|SDH1 chromosome 10 L000002753 10 736044 737117 W 2011-02-03 1996-07-31 Sorbitol dehydrogenase; protein sequence is 99% identical to the Sor2p sorbitol dehydrogenase; expression is induced in the presence of sorbitol or xylose +S000031666 CDS YJR159W 10 736044 737117 W 2011-02-03 1996-07-31 +S000028460 ARS ARS1024 ARSX-737 chromosome 10 10 737034 737275 2011-02-03 2002-12-16|2006-09-07 Autonomously Replicating Sequence +S000003921 ORF Verified YJR160C MPH3 alpha-glucoside permease chromosome 10 10 739816 738008 C 2011-02-03 1996-07-31 Alpha-glucoside permease; transports maltose, maltotriose, alpha-methylglucoside, and turanose; identical to Mph2p; encoded in a subtelomeric position in a region likely to have undergone duplication +S000031772 CDS YJR160C 10 739816 738008 C 2011-02-03 1996-07-31 +S000003922 ORF Verified YJR161C COS5 chromosome 10 L000004063 10 743999 742848 C 2011-02-03 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000031918 CDS YJR161C 10 743999 742848 C 2011-02-03 1996-07-31 +S000028461 ARS ARS1025 chromosome 10 10 744408 745008 2011-02-03 2002-12-16 Autonomously Replicating Sequence +S000178126 ARS_consensus_sequence ARS1025 10 744632 744648 W 2014-11-18 2014-11-18 +S000028974 telomere TEL10R chromosome 10 10 744902 745751 W 100 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome X; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028975 telomeric_repeat TEL10R 10 745663 745751 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome X +S000028976 X_element TEL10R 10 744902 745361 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome X; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YJR162C +S000028977 X_element_combinatorial_repeat TEL10R 10 745362 745662 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr X; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000003923 ORF Dubious YJR162C chromosome 10 10 745261 744911 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032831 CDS YJR162C 10 745261 744911 C 2011-02-03 1996-07-31 +S000001708 ORF Dubious YKL225W chromosome 11 11 451 798 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032685 CDS YKL225W 11 451 798 W 2011-02-03 1996-07-31 +S000028906 telomere TEL11L chromosome 11 11 807 1 C -162 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the left arm of Chromosome XI; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028907 telomeric_repeat TEL11L 11 67 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XI +S000028908 X_element TEL11L 11 807 347 C 2011-02-03 2003-09-09|2011-02-03 Telomeric X element Core sequence on the left arm of Chromosome XI; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YKL225W +S000028909 X_element_combinatorial_repeat TEL11L 11 346 68 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XI; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000001707 ORF Verified YKL224C PAU16 seripauperin PAU16 chromosome 11 11 2181 1810 C 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole +S000031625 CDS YKL224C 11 2181 1810 C 2011-02-03 1996-07-31 +S000001706 ORF Dubious YKL223W chromosome 11 11 2389 2721 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031556 CDS YKL223W 11 2389 2721 W 2011-02-03 1996-07-31 +S000001705 ORF Verified YKL222C chromosome 11 11 5620 3503 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; similar to transcriptional regulators from the zinc cluster (binuclear cluster) family; null mutant is sensitive to caffeine +S000031466 CDS YKL222C 11 5620 3503 C 2011-02-03 1996-07-31 +S000001704 ORF Verified YKL221W MCH2 chromosome 11 11 6107 7528 W 2011-02-03 1996-07-31|2011-02-03 Protein with similarity to mammalian monocarboxylate permeases; monocarboxylate permeases are involved in transport of monocarboxylic acids across the plasma membrane but mutant is not deficient in monocarboxylate transport +S000031419 CDS YKL221W 11 6107 7528 W 2011-02-03 1996-07-31|2011-02-03 +S000130137 ARS ARS1102 ARSXI-8 chromosome 11 11 7528 8309 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001703 ORF Verified YKL220C FRE2 ferric/cupric-chelate reductase chromosome 11 L000002805 11 11226 9091 C 2011-02-03 1996-07-31 Ferric reductase and cupric reductase; reduces siderophore-bound iron and oxidized copper prior to uptake by transporters; expression induced by low iron levels but not by low copper levels +S000031305 CDS YKL220C 11 11226 9091 C 2011-02-03 1996-07-31 +S000001702 ORF Verified YKL219W COS9 chromosome 11 L000004067 11 14485 15708 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000030515 CDS YKL219W 11 14485 15708 W 1996-07-31 1996-07-31 +S000001701 ORF Verified YKL218C SRY1 threo-3-hydroxy-L-aspartate ammonia-lyase SRY1 chromosome 11 S000007485 11 18339 17359 C 1996-07-31 1996-07-31 3-hydroxyaspartate dehydratase; deaminates L-threo-3-hydroxyaspartate to form oxaloacetate and ammonia; required in the presence of hydroxyaspartate; highly similar to mouse serine racemase (Srr) but has no serine racemase activity +S000037646 CDS YKL218C 11 18339 17359 C 1996-07-31 1996-07-31 +S000001700 ORF Verified YKL217W JEN1 chromosome 11 L000002666 11 22234 24084 W 1996-07-31 1996-07-31 Monocarboxylate/proton symporter of the plasma membrane; transport activity is dependent on the pH gradient across the membrane; mediates high-affinity uptake of carbon sources lactate, pyuvate, and acetate, and also of the micronutrient selenite, whose structure mimics that of monocarboxylates; expression and localization are tightly regulated, with transcription repression, mRNA degradation, and protein endocytosis and degradation all occurring in the presence of glucose +S000037602 CDS YKL217W 11 22234 24084 W 1996-07-31 1996-07-31 +S000001699 ORF Verified YKL216W URA1 dihydroorotate dehydrogenase chromosome 11 L000002430 11 25215 26159 W -159.7 2011-02-03 1996-07-31 Dihydroorotate dehydrogenase; catalyzes the fourth enzymatic step in the de novo biosynthesis of pyrimidines, converting dihydroorotic acid into orotic acid +S000037467 CDS YKL216W 11 25215 26159 W 2011-02-03 1996-07-31 +S000001698 ORF Verified YKL215C OXP1 5-oxoprolinase chromosome 11 11 30687 26827 C 2011-02-03 1996-07-31 5-oxoprolinase; enzyme is ATP-dependent and functions as a dimer; similar to mouse Oplah gene; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; protein abundance increases in response to DNA replication stress +S000036677 CDS YKL215C 11 30687 26827 C 2011-02-03 1996-07-31 +S000001697 ORF Verified YKL214C YRA2 chromosome 11 11 31693 31082 C 2011-02-03 1996-07-31 Member of the REF (RNA and export factor binding proteins) family; when overexpressed, can substitute for the function of Yra1p in export of poly(A)+ mRNA from the nucleus +S000036577 CDS YKL214C 11 31693 31082 C 2011-02-03 1996-07-31 +S000001696 ORF Verified YKL213C DOA1 ZZZ4|UFD3 chromosome 11 L000002961 11 34107 31960 C 2011-02-03 1996-07-31 WD repeat protein required for ubiquitin-mediated protein degradation; ubiquitin binding cofactor that complexes with Cdc48p; required for ribophagy; controls cellular ubiquitin concentration; promotes efficient NHEJ in postdiauxic/stationary phase; facilitates N-terminus-dependent proteolysis of centromeric histone H3 (Cse4p) for faithful chromosome segregation; protein increases in abundance and relocalizes from nucleus to nuclear periphery upon DNA replication stress +S000036488 CDS YKL213C 11 34107 31960 C 2011-02-03 1996-07-31 +S000001695 ORF Verified YKL212W SAC1 phosphatidylinositol-3-phosphatase SAC1|RSD1 chromosome 11 L000001790 11 34543 36414 W -153.8 2011-02-03 1996-07-31 Phosphatidylinositol phosphate (PtdInsP) phosphatase; involved in hydrolysis of PtdIns[4]P in the early and medial Golgi; regulated by interaction with Vps74p; ER localized transmembrane protein which cycles through the Golgi; involved in protein trafficking and processing, secretion, and cell wall maintenance; regulates sphingolipid biosynthesis through the modulation of PtdIns(4)P metabolism +S000036459 CDS YKL212W 11 34543 36414 W 2011-02-03 1996-07-31 +S000001694 ORF Verified YKL211C TRP3 bifunctional anthranilate synthase/indole-3-glycerol-phosphate synthase chromosome 11 L000002354 11 38153 36699 C -153.8 2011-02-03 1996-07-31 Indole-3-glycerol-phosphate synthase; forms bifunctional hetero-oligomeric anthranilate synthase:indole-3-glycerol phosphate synthase enzyme complex with Trp2p +S000035520 CDS YKL211C 11 38153 36699 C 2011-02-03 1996-07-31 +S000006455 snoRNA_gene snR64 SNR64 chromosome 11 L000004533 11 38811 38911 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2337 +S000030843 noncoding_exon snR64 11 38811 38911 W 2011-02-03 2000-05-19 +S000001693 ORF Verified YKL210W UBA1 E1 ubiquitin-activating protein UBA1 chromosome 11 L000002405 11 39163 42237 W -153.3 2011-02-03 1996-07-31 Ubiquitin activating enzyme (E1); involved in ubiquitin-mediated protein degradation and essential for viability; protein abundance increases in response to DNA replication stress +S000035493 CDS YKL210W 11 39163 42237 W 2011-02-03 1996-07-31 +S000001692 ORF Verified YKL209C STE6 ATP-binding cassette a-factor transporter STE6 chromosome 11 L000002116 11 46295 42423 C -152.3 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; required for the export of a-factor, catalyzes ATP hydrolysis coupled to a-factor transport; contains 12 transmembrane domains and two ATP binding domains; expressed only in MATa cells; human homolog ABCB1 mediates multidrug resistance in many chemotherapy-resistant tumors by effluxing toxic compounds from the cell +S000035512 CDS YKL209C 11 46295 42423 C 2011-02-03 1996-07-31 +S000006748 tRNA_gene tT(CGU)K TRT2 chromosome 11 L000003644 11 46806 46735 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis; correct folding and efficient aminoacylation require Lhp1p +S000032223 noncoding_exon tT(CGU)K 11 46806 46735 C 2011-02-03 2000-05-19 +S000001691 ORF Verified YKL208W CBT1 SOC1 chromosome 11 L000004295|S000029465|L000004597 11 47157 47972 W 2011-02-03 1996-07-31 Protein involved in 5' RNA end processing; substrates include mitochondrial COB, 15S_rRNA, and RPM1 transcripts; may also have a role in 3' end processing of the COB pre-mRNA; displays genetic interaction with cell cycle-regulated kinase Dbf2p +S000034559 CDS YKL208W 11 47157 47972 W 2011-02-03 1996-07-31 +S000001690 ORF Verified YKL207W EMC3 AIM27|LRC3 chromosome 11 11 48194 48955 W 2011-02-03 2004-02-13|1996-07-31|2006-05-08 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; required for respiratory growth; null mutant displays induction of the unfolded protein response; homologous to worm Y62E10A.10/EMC-3, fly CG6750, human TMEM111 +S000034425 CDS YKL207W 11 48194 48955 W 2011-02-03 2004-02-13|1996-07-31|2006-05-08 +S000001689 ORF Verified YKL206C ADD66 POC2|PBA2 chromosome 11 11 49809 49006 C 2011-02-03 1996-07-31 Protein involved in 20S proteasome assembly; forms a heterodimer with Pba1p that binds to proteasome precursors; interaction with Pba1p-Add66p may affect function of the mature proteasome and its role in maintaining respiratory metabolism; similar to human PAC2 constituent of the PAC1-PAC2 complex involved in proteasome assembly +S000034304 CDS YKL206C 11 49809 49006 C 2011-02-03 1996-07-31 +S000001688 ORF Verified YKL205W LOS1 Ran GTPase-binding protein LOS1 chromosome 11 L000000950 11 50051 53353 W -149.7 2011-02-03 1996-07-31 Nuclear pore protein; involved in nuclear export of pre-tRNA and in re-export of mature tRNAs after their retrograde import from the cytoplasm; deletion mutation extends replicative lifespan, as does exclusion of Los1p from the nucleus in response to caloric restriction +S000034266 CDS YKL205W 11 50051 53353 W 2011-02-03 1996-07-31 +S000001687 ORF Verified YKL204W EAP1 chromosome 11 11 53704 55602 W 2011-02-03 1996-07-31 eIF4E-associated protein, competes with eIF4G for binding to eIF4E; accelerates mRNA degradation by promoting decapping, facilitated by interaction with eIF4E; essential for Puf5p mediated repression; associates with Puf5p and Dhh1p; inhibits cap-dependent translation; functions independently of eIF4E to maintain genetic stability; plays a role in cell growth, implicated in the TOR signaling cascade +S000033363 CDS YKL204W 11 53704 55602 W 2011-02-03 1996-07-31 +S000118401 ARS ARS1103 ARSXI-56 chromosome 11 11 55671 55917 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178127 ARS_consensus_sequence ARS1103 11 55867 55851 C 2014-11-18 2014-11-18 +S000001686 ORF Verified YKL203C TOR2 phosphatidylinositol kinase-related protein kinase TOR2|DRR2 chromosome 11 L000002323 11 63359 55935 C -152.3 2011-02-03 2004-02-13|1996-07-31 PIK-related protein kinase and rapamycin target; subunit of TORC1, a complex that regulates growth in response to nutrients and TORC2, a complex that regulates cell-cycle dependent polarization of the actin cytoskeleton; involved in meiosis; TOR2 has a paralog, TOR1, that arose from the whole genome duplication +S000033266 CDS YKL203C 11 63359 55935 C 2011-02-03 2004-02-13|1996-07-31 +S000001685 ORF Dubious YKL202W chromosome 11 11 63821 64402 W 2011-02-03 2001-05-31|1996-07-31|1999-03-12 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033230 CDS YKL202W 11 63821 64402 W 2011-02-03 2001-05-31|1996-07-31|1999-03-12 +S000001684 ORF Verified YKL201C MNN4 YKL200C chromosome 11 L000001128 11 67466 63930 C -132.6 2011-02-03 2001-05-31|1996-07-31|1999-03-12 Putative positive regulator of mannosylphosphate transferase Mnn6p; involved in mannosylphosphorylation of N-linked oligosaccharides; expression increases in late-logarithmic and stationary growth phases; coding sequence contains length polymorphisms in different strains; MNN4 has a paralog, YJR061W, that arose from the whole genome duplication +S000032315 CDS YKL201C 11 67466 63930 C 2011-02-03 2001-05-31|1999-03-12|1996-07-31 +S000001681 ORF Verified YKL198C PTK1 putative serine/threonine protein kinase PTK1|POT1|YKT9|YKL199C|STK1|KKT8 chromosome 11 L000003491 11 70220 68232 C 2011-02-03 2003-01-08|1999-03-12|1996-07-31|2011-02-03 Putative serine/threonine protein kinase; regulates spermine uptake; involved in polyamine transport; possible mitochondrial protein; PTK1 has a paralog, PTK2, that arose from the whole genome duplication +S000034854 CDS YKL198C 11 70220 68232 C 2011-02-03 2003-01-08|1996-07-31|1999-03-12|2011-02-03 +S000001680 ORF Verified YKL197C PEX1 AAA family ATPase peroxin 1|PAS1 chromosome 11 L000001337 11 73865 70734 C 2011-02-03 1996-07-31 AAA-peroxin; heterodimerizes with AAA-peroxin Pex6p and participates in the recycling of peroxisomal signal receptor Pex5p from the peroxisomal membrane to the cystosol; induced by oleic acid and upregulated during anaerobiosis; mutations in human PEX1 can lead to severe peroxisomal disorders and early death +S000033983 CDS YKL197C 11 73865 70734 C 2011-02-03 1996-07-31 +S000007055 long_terminal_repeat YKLWdelta1 chromosome 11 11 74236 74518 W 2011-02-03 2000-05-19 Ty1 LTR +S000006671 tRNA_gene tN(GUU)K chromosome 11 L000003629 11 74624 74697 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000030740 noncoding_exon tN(GUU)K 11 74624 74697 W 2011-02-03 2000-05-19 +S000001679 ORF Verified YKL196C YKT6 palmitoyltransferase YKT6 chromosome 11 L000004163 11 75534 74932 C 2011-02-03 1996-07-31 Vesicle membrane protein (v-SNARE) with acyltransferase activity; involved in trafficking to and within the Golgi, endocytic trafficking to the vacuole, and vacuolar fusion; membrane localization due to prenylation at the carboxy-terminus; human homolog YKT6 can complement yeast ykt6 mutant +S000033862 CDS YKL196C 11 75534 74932 C 2011-02-03 1996-07-31 +S000001678 ORF Verified YKL195W MIA40 TIM40|FMP15 chromosome 11 11 75821 77032 W 2011-02-03 2003-09-22|1996-07-31 Import and assembly protein in mitochondrial intermembrane space; component of MIA pathway which mediates import and oxidative folding of substrates including small proteins containing twin cysteine motifs; acts in concert with Erv1p, which oxidizes the cysteine residues of Mia40p to comprise a disulfide relay system that catalyzes import; also mediates folding of Atp23p via a chaperone-like activity; forms a dimer that binds iron-sulfur cluster in vitro +S000033827 CDS YKL195W 11 75821 77032 W 2011-02-03 2003-09-22|1996-07-31 +S000001677 ORF Verified YKL194C MST1 threonine--tRNA ligase MST1 chromosome 11 L000001207 11 78646 77258 C 2011-02-03 1996-07-31 Mitochondrial threonyl-tRNA synthetase; aminoacylates both the canonical threonine tRNA tT(UGU)Q1 and the unusual threonine tRNA tT(UAG)Q2 in vitro; lacks a typical editing domain, but has pre-transfer editing activity stimulated by the unusual tRNA-Thr +S000030386 CDS YKL194C 11 78646 77258 C 2011-02-03 1996-07-31 +S000001676 ORF Verified YKL193C SDS22 type 1 protein phosphatase-activating protein SDS22|EGP1 chromosome 11 L000002590 11 79882 78866 C 2011-02-03 1996-07-31 Regulatory subunit of the type 1 protein phosphatase (PP1) Glc7p; whether it functions as a positive or negative regulator of Glc7p is controversial; involved in the regulation of Glc7p nuclear localization and function +S000030304 CDS YKL193C 11 79882 78866 C 2011-02-03 1996-07-31 +S000001675 ORF Verified YKL192C ACP1 acyl carrier protein chromosome 11 L000004843 11 80537 80160 C 2011-02-03 1996-07-31 Mitochondrial matrix acyl carrier protein; involved in biosynthesis of octanoate, which is a precursor to lipoic acid; activated by phosphopantetheinylation catalyzed by Ppt2p +S000030104 CDS YKL192C 11 80537 80160 C 2011-02-03 1996-07-31 +S000001674 ORF Verified YKL191W DPH2 chromosome 11 L000000522 11 81035 82639 W 2011-02-03 1996-07-31 Protein required for synthesis of diphthamide; required along with Dph1p, Kti11p, Jjj3p, and Dph5p; diphthamide is a modified histidine residue of translation elongation factor 2 (Eft1p or Eft2p); may act in a complex with Dph1p and Kti11p +S000030067 CDS YKL191W 11 81035 82639 W 2011-02-03 1996-07-31 +S000001673 ORF Verified YKL190W CNB1 calcineurin regulatory subunit B|YCN2|CRV1 chromosome 11 L000000371 11 82947 83550 W 2011-02-03 1996-07-31 Calcineurin B; regulatory subunit of calcineurin, a Ca++/calmodulin-regulated type 2B protein phosphatase which regulates Crz1p (stress-response transcription factor); other calcineurin subunit encoded by CNA1 and/or CMP1; regulates function of Aly1p alpha-arrestin; myristoylation by Nmt1p reduces calcineurin activity in response to submaximal Ca signals, is needed to prevent constitutive phosphatase activity; protein abundance increases in response to DNA replication stress +S000029989 CDS YKL190W 11 82947 82998 W 2011-02-03 1996-07-31 +S000029990 CDS YKL190W 11 83075 83550 W 2011-02-03 1996-07-31 +S000029991 intron YKL190W 11 82999 83074 W 2011-02-03 1996-07-31 +S000007050 long_terminal_repeat YKLCdelta2 chromosome 11 11 84115 83808 C 2011-02-03 2000-05-19 Ty1 LTR +S000006651 tRNA_gene tL(UAA)K chromosome 11 L000003630 11 84208 84291 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000037408 noncoding_exon tL(UAA)K 11 84208 84291 W 2011-02-03 2000-05-19 +S000001672 ORF Verified YKL189W HYM1 chromosome 11 L000004365 11 84704 85903 W 2011-02-03 1996-07-31 Component of the RAM signaling network; is involved in regulation of Ace2p activity and cellular morphogenesis, interacts with Kic1p and Sog2p, localizes to sites of polarized growth during budding and during the mating response +S000030561 CDS YKL189W 11 84704 85903 W 2011-02-03 1996-07-31 +S000001671 ORF Verified YKL188C PXA2 ATP-binding cassette long-chain fatty acid transporter PXA2|PAT1 chromosome 11 L000003538 11 88786 86225 C 2011-02-03 1996-07-31 Subunit of heterodimeric peroxisomal ABC transport complex, with Pxa1p; required for import of long-chain fatty acids into peroxisomes; similar to human adrenoleukodystrophy transportesr ABCD1 and ABCD2, and ALD-related proteins; mutations in ABCD1 cause X-linked adrenoleukodystrophy (X-ALD), a peroxisomal disorder; human ABCD1 and ABCD2 can each partially complement yeast pxa1 pxa2 double null mutant +S000030413 CDS YKL188C 11 88786 86225 C 2011-02-03 1996-07-31 +S000130138 ARS ARS1104 ARSXI-89 chromosome 11 11 88789 89287 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001670 ORF Verified YKL187C FAT3 chromosome 11 11 91536 89284 C 2011-02-03 1996-07-31 Protein required for fatty acid uptake; protein abundance increases in cortical patches in response to oleate exposure; the authentic, non-tagged protein is detected in a phosphorylated state in highly purified mitochondria in high-throughput studies; FAT3 has a paralog, YLR413W, that arose from the whole genome duplication +S000037608 CDS YKL187C 11 91536 89284 C 2011-02-03 1996-07-31 +S000001669 ORF Verified YKL186C MTR2 chromosome 11 L000002934 11 93298 92744 C 2011-02-03 1996-07-31 mRNA transport regulator; essential nuclear protein; Mex67p and Mtr2p form a mRNA export complex which binds to RNA +S000037550 CDS YKL186C 11 93298 92744 C 2011-02-03 1996-07-31 +S000122106 five_prime_UTR_intron YKL186C 11 93465 93312 C 2011-02-03 2007-04-04 +S000001668 ORF Verified YKL185W ASH1 DNA-binding transcription repressor ASH1 chromosome 11 L000003058 11 94499 96265 W 2011-02-03 1996-07-31 Component of the Rpd3L histone deacetylase complex; zinc-finger inhibitor of HO transcription; mRNA is localized and translated in the distal tip of anaphase cells, resulting in accumulation of Ash1p in daughter cell nuclei and inhibition of HO expression; potential Cdc28p substrate +S000037492 CDS YKL185W 11 94499 96265 W 2011-02-03 1996-07-31 +S000001667 ORF Verified YKL184W SPE1 ornithine decarboxylase SPE1|SPE10|ORD1 chromosome 11 L000001307|L000001993|L000001995 11 96757 98157 W -130.3 2011-02-03 1996-07-31 Ornithine decarboxylase; catalyzes the first step in polyamine biosynthesis; degraded in a proteasome-dependent manner in the presence of excess polyamines; deletion decreases lifespan, and increases necrotic cell death and ROS generation +S000032037 CDS YKL184W 11 96757 98157 W 2011-02-03 1996-07-31 +S000119035 ARS ARS1125 ARSXI-98|ARS1104.5 chromosome 11 11 98364 98523 2014-11-18 2014-11-18|2006-10-03 Autonomously Replicating Sequence +S000178128 ARS_consensus_sequence ARS1125 11 98385 98401 W 2014-11-18 2014-11-18 +S000028558 ORF Uncharacterized YKL183C-A chromosome 11 11 98607 98395 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031244 CDS YKL183C-A 11 98607 98395 C 2011-02-03 2003-07-29 +S000001666 ORF Verified YKL183W LOT5 chromosome 11 11 98721 99641 W 2011-02-03 1996-07-31 Protein of unknown function; gene expression increases in cultures shifted to a lower temperature; protein abundance increases in response to DNA replication stress +S000031917 CDS YKL183W 11 98721 99641 W 2011-02-03 1996-07-31 +S000001665 ORF Verified YKL182W FAS1 tetrafunctional fatty acid synthase subunit FAS1 chromosome 11 L000000601 11 100671 106826 W -116.7 2011-02-03 1996-07-31 Beta subunit of fatty acid synthetase; complex catalyzes the synthesis of long-chain saturated fatty acids; contains acetyltransacylase, dehydratase, enoyl reductase, malonyl transacylase, and palmitoyl transacylase activities +S000031771 CDS YKL182W 11 100671 106826 W 2011-02-03 1996-07-31 +S000001664 ORF Verified YKL181W PRS1 ribose phosphate diphosphokinase subunit PRS1|PRP1 chromosome 11 L000001494 11 107316 108599 W 2011-02-03 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase; synthesizes PRPP, which is required for nucleotide, histidine, and tryptophan biosynthesis; plays a key role in cell wall integrity (CWI) pathway; one of five related enzymes, which are active as heteromultimeric complexes; missense mutations in human homolog PRPS1 are associated with neuropathic Arts syndrome and Charcot-Marie Tooth (CMTX5) disease +S000029853 CDS YKL181W 11 107316 108599 W 2011-02-03 1996-07-31 +S000001663 ORF Verified YKL180W RPL17A uL22|ribosomal 60S subunit protein L17A|L22|YL17|L20A|L17A|RPL17 chromosome 11 L000001715 11 109269 110129 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L17A; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; copurifies with the Dam1 complex (aka DASH complex); homologous to mammalian ribosomal protein L17 and bacterial L22; RPL17A has a paralog, RPL17B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000036148 CDS YKL180W 11 109269 109577 W 2011-02-03 1996-07-31 +S000036149 CDS YKL180W 11 109884 110129 W 2011-02-03 1996-07-31 +S000036150 intron YKL180W 11 109578 109883 W 2011-02-03 1996-07-31 +S000001662 ORF Verified YKL179C COY1 chromosome 11 11 112503 110464 C 2011-02-03 1996-07-31 Golgi membrane protein with similarity to mammalian CASP; genetic interactions with GOS1 (encoding a Golgi snare protein) suggest a role in Golgi function +S000035207 CDS YKL179C 11 112503 110464 C 2011-02-03 1996-07-31 +S000001660 ORF Dubious YKL177W chromosome 11 11 114356 114694 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene STE3 +S000034192 CDS YKL177W 11 114356 114694 W 2011-02-03 1996-07-31 +S000001661 ORF Verified YKL178C STE3 DAF2 chromosome 11 L000002113 11 114627 113215 C 2011-02-03 1996-07-31 Receptor for a factor pheromone; couples to MAP kinase cascade to mediate pheromone response; transcribed in alpha cells and required for mating by alpha cells, ligand bound receptors endocytosed and recycled to the plasma membrane; GPCR +S000035096 CDS YKL178C 11 114627 113215 C 2011-02-03 1996-07-31 +S000001659 ORF Verified YKL176C LST4 chromosome 11 L000004354 11 117986 115500 C 2011-02-03 1996-07-31 Subunit of the Lst4p-Lst7p GTPase activating protein complex for Gtr2p; stimulates the GTPase activity of Rag family GTPase Gtr2p, within the context of the Gtr1p-Gtr2p heterodimer, after amino acid stimulation; required for activation of TORC1 in response to amino acid stimulation; recruited to the vacuolar membrane during amino acid starvation and released from the membrane by TORC1; required for the transport of amino acid permease Gap1p from the Golgi to the cell surface +S000034038 CDS YKL176C 11 117986 115500 C 2011-02-03 1996-07-31 +S000001658 ORF Verified YKL175W ZRT3 Zn(2+) transporter ZRT3 chromosome 11 11 118793 120304 W 2011-02-03 1996-07-31 Vacuolar membrane zinc transporter; transports zinc from storage in the vacuole to the cytoplasm when needed; transcription is induced under conditions of zinc deficiency +S000033999 CDS YKL175W 11 118793 120304 W 2011-02-03 1996-07-31 +S000001657 ORF Verified YKL174C TPO5 chromosome 11 11 122236 120380 C 2011-02-03 1996-07-31 Protein involved in excretion of putrescine and spermidine; putative polyamine transporter in the Golgi or post-Golgi vesicles +S000033149 CDS YKL174C 11 122236 120380 C 2011-02-03 1996-07-31 +S000001656 ORF Verified YKL173W SNU114 U5 snRNP GTPase SNU114|GIN10 chromosome 11 L000003541 11 122517 125543 W 2011-02-03 1996-07-31 GTPase component of U5 snRNP involved in mRNA splicing via spliceosome; binds directly to U5 snRNA; proposed to be involved in conformational changes of the spliceosome; similarity to ribosomal translocation factor EF-2 +S000033113 CDS YKL173W 11 122517 125543 W 2011-02-03 1996-07-31 +S000001655 ORF Verified YKL172W EBP2 chromosome 11 L000004646 11 125759 127042 W 2011-02-03 1996-07-31 Required for 25S rRNA maturation and 60S ribosomal subunit assembly; localizes to the nucleolus and in foci along nuclear periphery; constituent of 66S pre-ribosomal particles; cooperates with Rrs1p and Mps3p to mediate telomere clustering by binding Sir4p, but is not involved in telomere tethering +S000033024 CDS YKL172W 11 125759 127042 W 2011-02-03 1996-07-31 +S000001654 ORF Verified YKL171W NNK1 protein kinase NNK1 chromosome 11 11 127475 130261 W 2011-02-03 1996-07-31 Protein kinase; implicated in proteasome function; interacts with TORC1, Ure2 and Gdh2; overexpression leads to hypersensitivity to rapamycin and nuclear accumulation of Gln3; epitope-tagged protein localizes to the cytoplasm +S000032097 CDS YKL171W 11 127475 130261 W 2011-02-03 1996-07-31 +S000001653 ORF Verified YKL170W MRPL38 mitochondrial 54S ribosomal protein YmL38/YmL34|YmL38|YmL34|MRPL34 chromosome 11 S000029310|L000002693|L000001173 11 130634 131050 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; appears as two protein spots (YmL34 and YmL38) on two-dimensional SDS gels; protein abundance increases in response to DNA replication stress +S000031979 CDS YKL170W 11 130634 131050 W 2011-02-03 1996-07-31 +S000001652 ORF Dubious YKL169C chromosome 11 11 131068 130685 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene MRPL38 +S000030884 CDS YKL169C 11 131068 130685 C 2011-02-03 1996-07-31 +S000001651 ORF Verified YKL168C KKQ8 putative serine/threonine protein kinase KKQ8 chromosome 11 L000004097 11 133462 131288 C 2011-02-03 1996-07-31|2006-05-08 Putative serine/threonine protein kinase with unknown cellular role; KKQ8 has a paralog, HAL5, that arose from the whole genome duplication +S000030812 CDS YKL168C 11 133462 131288 C 2011-02-03 1996-07-31|2006-05-08 +S000001650 ORF Verified YKL167C MRP49 mitochondrial 54S ribosomal protein MRP49 chromosome 11 L000001159 11 134134 133721 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; not essential for mitochondrial translation +S000037870 CDS YKL167C 11 134134 133721 C 2011-02-03 1996-07-31 +S000001649 ORF Verified YKL166C TPK3 cAMP-dependent protein kinase catalytic subunit TPK3 chromosome 11 L000002327 11 135705 134509 C 2011-02-03 1996-07-31 cAMP-dependent protein kinase catalytic subunit; promotes vegetative growth in response to nutrients via the Ras-cAMP signaling pathway; partially redundant with Tpk1p and Tpk2p; localizes to P-bodies during stationary phase; TPK3 has a paralog, TPK1, that arose from the whole genome duplication +S000037767 CDS YKL166C 11 135705 134509 C 2011-02-03 1996-07-31 +S000007617 ORF Dubious YKL165C-A chromosome 11 11 136023 135790 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037215 CDS YKL165C-A 11 136023 135790 C 2011-02-03 2001-02-26 +S000001648 ORF Verified YKL165C MCD4 mannose-ethanolamine phosphotransferase MCD4|FSR2|SSU21|ZRG16 chromosome 11 L000003913|S000029172|L000003584 11 140691 137932 C 2011-02-03 1996-07-31 Protein involved in GPI anchor synthesis; multimembrane-spanning protein that localizes to the endoplasmic reticulum; highly conserved among eukaryotes; GPI stands for glycosylphosphatidylinositol +S000037706 CDS YKL165C 11 140691 137932 C 2011-02-03 1996-07-31 +S000006558 tRNA_gene tE(UUC)K chromosome 11 L000003643 11 141089 141018 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000036005 noncoding_exon tE(UUC)K 11 141089 141018 C 2011-02-03 2000-05-19 +S000001647 ORF Verified YKL164C PIR1 beta-1,3-glucan linked protein|CCW6 chromosome 11 L000001441 11 142819 141794 C 2011-02-03 1996-07-31 O-glycosylated protein required for cell wall stability; attached to the cell wall via beta-1,3-glucan; mediates mitochondrial translocation of Apn1p; expression regulated by the cell integrity pathway and by Swi5p during the cell cycle; PIR1 has a paralog, YJL160C, that arose from the whole genome duplication +S000036944 CDS YKL164C 11 142819 141794 C 2011-02-03 1996-07-31 +S000001646 ORF Verified YKL163W PIR3 beta-1,3-glucan linked protein|CCW8 chromosome 11 L000001443 11 144401 145378 W 2011-02-03 1996-07-31 O-glycosylated covalently-bound cell wall protein; required for cell wall stability; expression is cell cycle regulated, peaking in M/G1 and also subject to regulation by the cell integrity pathway; coding sequence contains length polymorphisms in different strains; PIR3 has a paralog, HSP150, that arose from the whole genome duplication +S000036912 CDS YKL163W 11 144401 145378 W 2011-02-03 1996-07-31 +S000007244 ORF Dubious YKL162C-A chromosome 11 11 146074 145922 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032863 CDS YKL162C-A 11 146074 145922 C 2011-02-03 1999-07-17 +S000001645 ORF Uncharacterized YKL162C chromosome 11 11 148838 147630 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion +S000036809 CDS YKL162C 11 148838 147630 C 2011-02-03 1996-07-31 +S000001644 ORF Verified YKL161C KDX1 putative protein kinase KDX1|MLP1 chromosome 11 11 150687 149386 C 2011-02-03 1996-07-31 Protein kinase; implicated in Slt2p mitogen-activated (MAP) kinase signaling pathway; interacts with numerous components in the mating pheromone and CWI MAPK pathways; associates with Rlm1p; KDX1 has a paralog, SLT2, that arose from the whole genome duplication +S000035941 CDS YKL161C 11 150687 149386 C 2011-02-03 1996-07-31 +S000118402 ARS ARS1106 ARSXI-153 chromosome 11 11 153020 153135 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178129 ARS_consensus_sequence ARS1106 11 153122 153106 C 2014-11-18 2014-11-18 +S000001643 ORF Verified YKL160W ELF1 chromosome 11 11 153269 153706 W 2011-02-03 1996-07-31 Transcription elongation factor with a conserved zinc finger domain; implicated in the maintenance of proper chromatin structure in actively transcribed regions; deletion inhibits Brome mosaic virus (BMV) gene expression +S000035865 CDS YKL160W 11 153269 153706 W 2011-02-03 1996-07-31 +S000001642 ORF Verified YKL159C RCN1 chromosome 11 S000007456 11 154451 153816 C 2011-02-03 1996-07-31 Protein involved in calcineurin regulation during calcium signaling; has similarity to H. sapiens DSCR1 which is found in the Down Syndrome candidate region +S000034776 CDS YKL159C 11 154451 153816 C 2011-02-03 1996-07-31 +S000001640 ORF Verified YKL157W APE2 metallo-aminopeptidase|YKL158W|LAP1 chromosome 11 S000001641|L000000092 11 154991 158232 W -124.8 2011-02-03 2000-07-14|1996-07-31|2011-02-03 Aminopeptidase yscII; may have a role in obtaining leucine from dipeptide substrates; APE2 has a paralog, AAP1, that arose from the whole genome duplication +S000033809 CDS YKL157W 11 154991 155271 W 2011-02-03 2000-07-14|1996-07-31 +S000033810 CDS YKL157W 11 155655 158232 W 2011-02-03 2000-07-14|2011-02-03 +S000033811 intron YKL157W 11 155272 155654 W 2011-02-03 2000-07-14 +S000001639 ORF Verified YKL156W RPS27A eS27|ribosomal 40S subunit protein S27A|S27e|rp61|YS20|S27A chromosome 11 L000002712 11 158613 159212 W 2011-02-03 1996-07-31|2011-02-03 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S27, no bacterial homolog; RPS27A has a paralog, RPS27B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000033664 CDS YKL156W 11 158613 158615 W 2011-02-03 1996-07-31 +S000033665 CDS YKL156W 11 158967 159212 W 2011-02-03 1996-07-31 +S000033666 intron YKL156W 11 158616 158966 W 2011-02-03 1996-07-31|2011-02-03 +S000028668 ORF Dubious YKL156C-A chromosome 11 11 159091 158975 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene RPS27A; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032493 CDS YKL156C-A 11 159091 158975 C 2011-02-03 2003-07-29 +S000001638 ORF Verified YKL155C RSM22 mitochondrial 37S ribosomal protein RSM22 chromosome 11 11 161342 159456 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; also predicted to be an S-adenosylmethionine-dependent RNA methyltransferase +S000033531 CDS YKL155C 11 161342 159456 C 2011-02-03 1996-07-31 +S000001637 ORF Verified YKL154W SRP102 Signal recognition particle receptor subunit beta chromosome 11 11 161601 162335 W 2011-02-03 1996-07-31 Signal recognition particle (SRP) receptor beta subunit; involved in SRP-dependent protein targeting; anchors the alpha subunit, Srp101p to the ER membrane +S000033491 CDS YKL154W 11 161601 162335 W 2011-02-03 1996-07-31 +S000006716 tRNA_gene tR(UCU)K chromosome 11 L000003642 11 162558 162487 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000037862 noncoding_exon tR(UCU)K 11 162558 162487 C 2011-02-03 2000-05-19 +S000007056 long_terminal_repeat YKLWdelta3 chromosome 11 11 162831 163169 W 2011-02-03 2000-05-19 Ty1 LTR +S000001636 ORF Dubious YKL153W chromosome 11 11 163600 164109 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription of both YLK153W and the overlapping essential gene GPM1 is reduced in the gcr1 null mutant +S000032752 CDS YKL153W 11 163600 164109 W 2011-02-03 1996-07-31 +S000001635 ORF Verified YKL152C GPM1 phosphoglycerate mutase GPM1 chromosome 11 L000000726 11 164385 163642 C 2011-02-03 1996-07-31 Tetrameric phosphoglycerate mutase; mediates the conversion of 3-phosphoglycerate to 2-phosphoglycerate during glycolysis and the reverse reaction during gluconeogenesis +S000032605 CDS YKL152C 11 164385 163642 C 2011-02-03 1996-07-31 +S000001634 ORF Verified YKL151C NNR2 NADHX dehydratase chromosome 11 11 165930 164917 C 2011-02-03 1996-07-31 Widely-conserved NADHX dehydratase; converts (S)-NADHX to NADH in ATP-dependent manner; YKL151C promoter contains STREs (stress response elements) and expression is induced by heat shock or methyl methanesulfonate; downstream intergenic region drives antisense expression and mediates coordinated regulation of YKL151C and GPM1 phosphoglycerate mutase; protein abundance increases in response to DNA replication stress; homolog of Carkd in mammals and C-terminus of YjeF in E.coli +S000031623 CDS YKL151C 11 165930 164917 C 2011-02-03 1996-07-31 +S000001633 ORF Verified YKL150W MCR1 cytochrome-b5 reductase chromosome 11 L000003134 11 166544 167452 W 2011-02-03 1996-07-31 Mitochondrial NADH-cytochrome b5 reductase; involved in ergosterol biosynthesis +S000031554 CDS YKL150W 11 166544 167452 W 2011-02-03 1996-07-31 +S000122105 five_prime_UTR_intron YKL150W 11 166400 166487 W 2011-02-03 2007-04-04 +S000001632 ORF Verified YKL149C DBR1 RNA lariat debranching enzyme|PRP26 chromosome 11 L000000495 11 168829 167612 C -106.4 2011-02-03 1996-07-31 RNA lariat debranching enzyme; catalyzes debranching of lariat introns formed during pre-mRNA splicing; required for efficient Ty1 transposition; knockdown of human homolog Dbr1 rescues toxicity of RNA-binding proteins TDP-43 and FUS which are implicated in amyotrophic lateral sclerosis (ALS), suggests potential therapeutic target for ALS and related TDP-43 proteinopathies; human homolog DBR1 can complement yeast dbr1 null mutant +S000031536 CDS YKL149C 11 168829 167612 C 2011-02-03 1996-07-31 +S000001631 ORF Verified YKL148C SDH1 succinate dehydrogenase flavoprotein subunit SDH1|SDHA chromosome 11 L000001823 11 171129 169207 C 2011-02-03 1996-07-31 Flavoprotein subunit of succinate dehydrogenase; couples the oxidation of succinate to the transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; FAD binding to Sdh1p is required for the assembly of the succinate dehydrogenase subunits; mutations in human ortholog SDHA are associated with Leigh syndrome +S000030671 CDS YKL148C 11 171129 169207 C 2011-02-03 1996-07-31 +S000001629 ORF Verified YKL146W AVT3 chromosome 11 11 171783 173861 W 2011-02-03 1996-07-31 Vacuolar transporter; exports large neutral amino acids from the vacuole; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters +S000030513 CDS YKL146W 11 171783 173861 W 2011-02-03 1996-07-31 +S000001630 ORF Dubious YKL147C chromosome 11 11 172168 171551 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified gene AVT3 +S000030585 CDS YKL147C 11 172168 171551 C 2011-02-03 1996-07-31 +S000001628 ORF Verified YKL145W RPT1 proteasome regulatory particle base subunit RPT1|YTA3|CIM5 chromosome 11 L000002557 11 174213 175616 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; required for optimal CDC20 transcription; interacts with Rpn12p and Ubr1p; mutant has aneuploidy tolerance +S000030368 CDS YKL145W 11 174213 175616 W 2011-02-03 1996-07-31 +S000028841 ORF Dubious YKL145W-A chromosome 11 11 174958 175050 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified essential gene RPT1; identified by expression profiling and mass spectrometry +S000034526 CDS YKL145W-A 11 174958 175050 W 2011-02-03 2003-07-29 +S000001627 ORF Verified YKL144C RPC25 DNA-directed RNA polymerase III subunit RPC25|C25|YKL1 chromosome 11 L000002427 11 176481 175843 C 2011-02-03 1996-07-31 RNA polymerase III subunit C25; required for transcription initiation; forms a heterodimer with Rpc17p; paralog of Rpb7p +S000037515 CDS YKL144C 11 176481 175843 C 2011-02-03 1996-07-31 +S000001626 ORF Verified YKL143W LTV1 YKL2 chromosome 11 L000000962 11 176781 178172 W 2011-02-03 1996-07-31 Component of the GSE complex; GSE is required for proper sorting of amino acid permease Gap1p; required for ribosomal small subunit export from nucleus; required for growth at low temperature +S000037465 CDS YKL143W 11 176781 178172 W 2011-02-03 1996-07-31 +S000001625 ORF Verified YKL142W MRP8 YKL3 chromosome 11 L000001156 11 178515 179174 W 2011-02-03 1996-07-31 Protein of unknown function; undergoes sumoylation; transcription induced under cell wall stress; protein levels are reduced under anaerobic conditions; protein abundance increases in response to DNA replication stress; originally thought to be a mitochondrial ribosomal protein based on sequence analysis +S000036742 CDS YKL142W 11 178515 179174 W 2011-02-03 1996-07-31 +S000001624 ORF Verified YKL141W SDH3 succinate dehydrogenase cytochrome b subunit SDH3|YKL4|CYB3 chromosome 11 L000001825 11 179667 180263 W 2011-02-03 1996-07-31 Subunit of succinate dehydrogenase and of TIM22 translocase; functions as cytochrome b subunit of succinate dehydrogenase, which couples oxidation of succinate to transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; also required for mitochondrial inner membrane protein import as part of the TIM22 complex; SDH3 has a paralog, SHH3, that arose from the whole genome duplication +S000036643 CDS YKL141W 11 179667 180263 W 2011-02-03 1996-07-31 +S000001623 ORF Verified YKL140W TGL1 YKL5 chromosome 11 L000002293 11 180779 182425 W 2011-02-03 1996-07-31 Steryl ester hydrolase; one of three gene products (Yeh1p, Yeh2p, Tgl1p) responsible for steryl ester hydrolase activity and involved in sterol homeostasis; localized to lipid particle membranes +S000036522 CDS YKL140W 11 180779 182425 W 2011-02-03 1996-07-31 +S000001622 ORF Verified YKL139W CTK1 cyclin-dependent serine/threonine protein kinase CTK1 chromosome 11 L000000432 11 182958 184544 W 2011-02-03 1996-07-31 Catalytic (alpha) subunit of C-terminal domain kinase I (CTDK-I); phosphorylates both RNA pol II subunit Rpo21p to affect transcription and pre-mRNA 3' end processing, and ribosomal protein Rps2p to increase translational fidelity; required for H3K36 trimethylation but not dimethylation by Set2p; suggested stimulatory role in 80S formation during translation initiation; similar to the Drosophila dCDK12 and human CDK12 and probably CDK13 +S000036668 CDS YKL139W 11 182958 184544 W 2011-02-03 1996-07-31 +S000028421 ORF Verified YKL138C-A HSK3 chromosome 11 S000028418 11 185012 184803 C 2011-02-03 2002-06-20 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis +S000029957 CDS YKL138C-A 11 185012 184803 C 2011-02-03 2002-06-20 +S000001621 ORF Verified YKL138C MRPL31 mitochondrial 54S ribosomal protein YmL31|YmL31 chromosome 11 L000001168|L000002529 11 185681 185286 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000035696 CDS YKL138C 11 185681 185286 C 2011-02-03 1996-07-31 +S000001620 ORF Verified YKL137W CMC1 chromosome 11 11 185957 186292 W 2011-02-03 1996-07-31|2005-12-15 Copper-binding protein of the mitochondrial intermembrane space; evolutionarily conserved; may be involved in delivering copper from the matrix to the cytochrome c oxidase complex; contains a twin CX9C motif +S000035632 CDS YKL137W 11 185957 186292 W 2011-02-03 1996-07-31|2005-12-15 +S000001619 ORF Dubious YKL136W chromosome 11 11 186416 186814 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF APL2/YKL135C +S000035555 CDS YKL136W 11 186416 186814 W 2011-02-03 1996-07-31 +S000001618 ORF Verified YKL135C APL2 chromosome 11 L000000094 11 188640 186460 C 2011-02-03 1996-07-31 Beta-adaptin subunit of the clathrin-associated protein (AP-1) complex; binds clathrin; involved in clathrin-dependent Golgi protein sorting; protein abundance increases in response to DNA replication stress +S000034478 CDS YKL135C 11 188640 186460 C 2011-02-03 1996-07-31 +S000001617 ORF Verified YKL134C OCT1 metalloendopeptidase chromosome 11 L000004860 11 191442 189124 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial intermediate peptidase; cleaves destabilizing N-terminal residues of a subset of proteins upon import, after their cleavage by mitochondrial processing peptidase (Mas1p-Mas2p); may contribute to mitochondrial iron homeostasis +S000034401 CDS YKL134C 11 191442 189124 C 2011-02-03 1996-07-31|2011-02-03 +S000001616 ORF Uncharacterized YKL133C chromosome 11 11 193070 191679 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; not required for growth of cells lacking the mitochondrial genome; SWAT-GFP and mCherry fusion proteins localize to the mitochondria; YKL133C has a paralog, MGR3, that arose from the whole genome duplication +S000034300 CDS YKL133C 11 193070 191679 C 2011-02-03 1996-07-31|2011-02-03 +S000001614 ORF Dubious YKL131W chromosome 11 11 194478 194999 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033359 CDS YKL131W 11 194478 194999 W 2011-02-03 1996-07-31 +S000001615 ORF Verified YKL132C RMA1 putative tetrahydrofolate synthase chromosome 11 11 194866 193574 C 2011-02-03 1996-07-31 Putative dihydrofolate synthetase; similar to E. coli folylpolyglutamate synthetase/dihydrofolate synthetase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; RMA1 has a paralog, FOL3, that arose from the whole genome duplication +S000033390 CDS YKL132C 11 194866 193574 C 2011-02-03 1996-07-31 +S000001613 ORF Verified YKL130C SHE2 chromosome 11 L000004571 11 196028 195288 C 2011-02-03 1996-07-31 RNA-binding protein that binds specific mRNAs and interacts with She3p; part of the mRNA localization machinery that restricts accumulation of certain proteins to the bud; binds to ER-derived membranes and targets mRNAs to cortical ER +S000033257 CDS YKL130C 11 196028 195288 C 2011-02-03 1996-07-31 +S000119036 ARS ARS1126 ARSXI-196|ARS1106.3 chromosome 11 11 196042 196287 2011-02-03 2006-10-03 Autonomously Replicating Sequence +S000001612 ORF Verified YKL129C MYO3 myosin 3 chromosome 11 L000002889 11 200167 196349 C 2011-02-03 1996-07-31|2011-02-03 One of two type I myosins; localizes to actin cortical patches; deletion of MYO3 has little effect on growth, but myo3 myo5 double deletion causes severe defects in growth and actin cytoskeleton organization; MYO3 has a paralog, MYO5, that arose from the whole genome duplication +S000032500 CDS YKL129C 11 200167 196349 C 2011-02-03 1996-07-31|2011-02-03 +S000001611 ORF Verified YKL128C PMU1 putative phosphomutase chromosome 11 L000003276 11 201771 200884 C 2011-02-03 1996-07-31 Putative phosphomutase; contains a region homologous to the active site of phosphomutases; overexpression suppresses the histidine auxotrophy of an ade3 ade16 ade17 triple mutant and the temperature sensitivity of a tps2 mutant +S000032407 CDS YKL128C 11 201771 200884 C 2011-02-03 1996-07-31 +S000007054 long_terminal_repeat YKLCsigma1 chromosome 11 11 202983 202644 C 2011-02-03 2000-05-19 Ty3 LTR +S000006626 tRNA_gene tK(CUU)K chromosome 11 L000003631 11 202999 203071 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000036035 noncoding_exon tK(CUU)K 11 202999 203071 W 2011-02-03 2000-05-19 +S000001610 ORF Verified YKL127W PGM1 phosphoglucomutase PGM1 chromosome 11 L000001412 11 203541 205253 W -108.4 2011-02-03 1996-07-31 Phosphoglucomutase, minor isoform; catalyzes the conversion from glucose-1-phosphate to glucose-6-phosphate, which is a key step in hexose metabolism; PGM1 has a paralog, PGM2, that arose from the whole genome duplication +S000032331 CDS YKL127W 11 203541 205253 W 2011-02-03 1996-07-31 +S000001609 ORF Verified YKL126W YPK1 serine/threonine protein kinase YPK1|SLI2 chromosome 11 L000002541 11 205707 207749 W -97.7 2011-02-03 1996-07-31 S/T protein kinase; phosphorylates, downregulates flippase activator Fpk1p; inactivates Orm1p and Orm2p by phosphorylation in response to compromised sphingolipid synthesis; involved in the TORC-dependent phosphorylation of ribosomal proteins Rps6a/b (S6); mutations affect receptor-mediated endocytosis and sphingolipid-mediated and cell integrity signaling pathways; human homolog SGK1 can complement a null mutant; human homolog SGK2 can complement a ypk1 ypk2 double mutant +S000031322 CDS YKL126W 11 205707 207749 W 2011-02-03 1996-07-31 +S000001608 ORF Verified YKL125W RRN3 rDNA-binding RNA polymerase I transcriptional factor chromosome 11 L000003362 11 208247 210130 W 2011-02-03 1996-07-31 Protein required for transcription of rDNA by RNA polymerase I; transcription factor independent of DNA template; involved in recruitment of RNA polymerase I to rDNA; structure reveals unique HEAT repeat fold and a surface serine patch; phosphorylation of serine patch impairs cell growth and reduces RNA polymerase I binding in vitro and RNA polymerase I recruitment to the rDNA gene in vivo +S000031219 CDS YKL125W 11 208247 210130 W 2011-02-03 1996-07-31 +S000001607 ORF Verified YKL124W SSH4 MLF4 chromosome 11 L000002951 11 210593 212332 W 2011-02-03 1996-07-31 Specificity factor required for Rsp5p-dependent ubiquitination; also required for sorting of cargo proteins at the multivesicular body; identified as a high-copy suppressor of a SHR3 deletion, increasing steady-state levels of amino acid permeases +S000031112 CDS YKL124W 11 210593 212332 W 2011-02-03 1996-07-31 +S000001606 ORF Dubious YKL123W chromosome 11 11 212043 212423 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SSH4 +S000030083 CDS YKL123W 11 212043 212423 W 2011-02-03 1996-07-31 +S000001605 ORF Verified YKL122C SRP21 signal recognition particle subunit SRP21 chromosome 11 L000002062 11 212998 212495 C 2011-02-03 1996-07-31 Subunit of the signal recognition particle (SRP); SRP functions in protein targeting to the endoplasmic reticulum membrane; not found in mammalian SRP; forms a pre-SRP structure in the nucleolus that is translocated to the cytoplasm +S000029913 CDS YKL122C 11 212998 212495 C 2011-02-03 1996-07-31 +S000119037 ARS ARS1127 ARSXI-213|ARS1106.7 chromosome 11 11 213439 213743 2011-02-03 2006-10-03 Autonomously Replicating Sequence +S000001604 ORF Uncharacterized YKL121W DGR2 chromosome 11 11 214142 216700 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant is resistant to 2-deoxy-D-glucose and displays abnormally elongated buds; DGR2 has a paralog, YMR102C, that arose from the whole genome duplication +S000029872 CDS YKL121W 11 214142 216700 W 2011-02-03 1996-07-31 +S000001603 ORF Verified YKL120W OAC1 chromosome 11 S000007413 11 217344 218318 W 2011-02-03 1996-07-31 Mitochondrial inner membrane transporter; transports oxaloacetate, sulfate, thiosulfate, and isopropylmalate; member of the mitochondrial carrier family +S000037208 CDS YKL120W 11 217344 218318 W 2011-02-03 1996-07-31 +S000001601 ORF Dubious YKL118W chromosome 11 11 219126 219437 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene VPH2 +S000036185 CDS YKL118W 11 219126 219437 W 2011-02-03 1996-07-31 +S000001602 ORF Verified YKL119C VPH2 VMA12|CLS10 chromosome 11 L000002468 11 219217 218570 C 2011-02-03 1996-07-31 Integral membrane protein required for V-ATPase function; not an actual component of the vacuolar H+-ATPase (V-ATPase) complex; functions in the assembly of the V-ATPase; localized to the endoplasmic reticulum (ER); involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner +S000036236 CDS YKL119C 11 219217 218570 C 2011-02-03 1996-07-31 +S000007051 long_terminal_repeat YKLCdelta4 chromosome 11 11 219723 219395 C 2011-02-03 2000-05-19 Ty1 LTR +S000006515 tRNA_gene tA(AGC)K1 chromosome 11 L000003632 11 219895 219967 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000036246 noncoding_exon tA(AGC)K1 11 219895 219967 W 2011-02-03 2000-05-19 +S000001600 ORF Verified YKL117W SBA1 Hsp90 cochaperone SBA1|CST18 chromosome 11 L000004284|L000002999|S000029122 11 220324 220974 W 2011-02-03 1996-07-31 Co-chaperone that binds and regulates Hsp90 family chaperones; plays a role in determining prion variants; important for pp60v-src activity in yeast; homologous to the mammalian p23 proteins, and like p23 can regulate telomerase activity; protein abundance increases in response to DNA replication stress +S000035238 CDS YKL117W 11 220324 220974 W 2011-02-03 1996-07-31 +S000001599 ORF Verified YKL116C PRR1 serine/threonine protein kinase PRR1 chromosome 11 11 222900 221344 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; inhibits pheromone induced signaling downstream of MAPK, possibly at the level of the Ste12p transcription factor +S000034995 CDS YKL116C 11 222900 221344 C 2011-02-03 1996-07-31 +S000001598 ORF Dubious YKL115C chromosome 11 11 223285 222893 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene PRR1 +S000034081 CDS YKL115C 11 223285 222893 C 2011-02-03 1996-07-31 +S000001597 ORF Verified YKL114C APN1 DNA-(apurinic or apyrimidinic site) lyase APN1 chromosome 11 L000000096 11 224455 223352 C 2011-02-03 1996-07-31 Major apurinic/apyrimidinic endonuclease; 3'-repair diesterase; involved in repair of DNA damage by oxidation and alkylating agents; also functions as a 3'-5' exonuclease to repair 7,8-dihydro-8-oxodeoxyguanosine; genetically interacts with NTG1 to maintain mitochondrial genome integrity +S000033938 CDS YKL114C 11 224455 223352 C 2011-02-03 1996-07-31 +S000001596 ORF Verified YKL113C RAD27 multifunctional nuclease RAD27|FEN1|RTH1|ERC11 chromosome 11 L000002742|L000000565 11 225875 224727 C 2011-02-03 1996-07-31 5' to 3' exonuclease, 5' flap endonuclease; required for Okazaki fragment processing and maturation, for long-patch base-excision repair and large loop repair (LLR), ribonucleotide excision repair; member of the S. pombe RAD2/FEN1 family; relocalizes to the cytosol in response to hypoxia +S000033801 CDS YKL113C 11 225875 224727 C 2011-02-03 1996-07-31 +S000001595 ORF Verified YKL112W ABF1 GFI|SBF-B|DNA-binding protein ABF1|SBF1|REB2|OBF1|BAF1 chromosome 11 L000000159 11 226570 228765 W 2011-02-03 1996-07-31 DNA binding protein with possible chromatin-reorganizing activity; involved in transcriptional activation, gene silencing, and DNA replication and repair +S000033734 CDS YKL112W 11 226570 228765 W 2011-02-03 1996-07-31 +S000001594 ORF Dubious YKL111C chromosome 11 11 228799 228464 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified essential gene ABF1 +S000032984 CDS YKL111C 11 228799 228464 C 2011-02-03 1996-07-31 +S000001593 ORF Verified YKL110C KTI12 TOT4 chromosome 11 L000000923 11 229880 228939 C 2011-02-03 1996-07-31 Protein that plays a role in modification of tRNA wobble nucleosides; protein plays role in tRNA wobble nucleoside modification with Elongator complex; involved in sensitivity to G1 arrest induced by zymocin; interacts with chromatin throughout the genome; also interacts with Cdc19p +S000032867 CDS YKL110C 11 229880 228939 C 2011-02-03 1996-07-31 +S000001592 ORF Verified YKL109W HAP4 transcription factor HAP4 chromosome 11 L000000754 11 232227 233891 W 2011-02-03 1996-07-31 Transcription factor; subunit of the heme-activated, glucose-repressed Hap2p/3p/4p/5p CCAAT-binding complex, a transcriptional activator and global regulator of respiratory gene expression; provides the principal activation function of the complex; involved in diauxic shift +S000032773 CDS YKL109W 11 232227 233891 W 2011-02-03 1996-07-31 +S000001591 ORF Verified YKL108W SLD2 DRC1 chromosome 11 L000004708 11 234426 235787 W 2011-02-03 1996-07-31 Single-stranded DNA origin-binding and annealing protein; required for initiation of DNA replication; phosphorylated in S phase by cyclin-dependent kinases (Cdks), promoting origin binding, DNA replication and Dpb11p complex formation; component of the preloading complex; binds the Mcm2-7p complex to prevent inappropriate Mcm2-7p interaction with the GINS complex in G1; required for S phase checkpoint; relative distribution to the nucleus increases upon DNA replication stress +S000032698 CDS YKL108W 11 234426 235787 W 2011-02-03 1996-07-31 +S000001590 ORF Uncharacterized YKL107W putative short-chain dehydrogenase/reductase chromosome 11 11 236141 237070 W 2011-02-03 1996-07-31 Putative short-chain dehydrogenase/reductase; proposed to be a palmitoylated membrane protein +S000032626 CDS YKL107W 11 236141 237070 W 2011-02-03 1996-07-31 +S000007616 ORF Uncharacterized YKL106C-A chromosome 11 11 237266 237147 C 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology to uncharacterized proteins in other fungi +S000037214 CDS YKL106C-A 11 237266 237147 C 2011-02-03 2001-02-26 +S000001589 ORF Verified YKL106W AAT1 aspartate transaminase AAT1 chromosome 11 L000000009 11 237536 238891 W 2011-02-03 1996-07-31 Mitochondrial aspartate aminotransferase; catalyzes the conversion of oxaloacetate to aspartate in aspartate and asparagine biosynthesis +S000031616 CDS YKL106W 11 237536 238891 W 2011-02-03 1996-07-31 +S000001588 ORF Verified YKL105C SEG2 chromosome 11 11 242583 239185 C 2011-02-03 1996-07-31 Eisosome component; likely plays only a minor role in eisosome assembly; shown to interact with Seg1p by affinity purification and mass spec; SWAT-GFP and mCherry fusion proteins localize to the cell periphery; similar to A. gossypii SEG gene which is important for stabilizing eisosomes; SEG2 has a paralog, SEG1, that arose from the whole genome duplication +S000031413 CDS YKL105C 11 242583 239185 C 2011-02-03 1996-07-31 +S000001587 ORF Verified YKL104C GFA1 glutamine--fructose-6-phosphate transaminase (isomerizing) GFA1 chromosome 11 L000000702 11 245373 243220 C 2011-02-03 1996-07-31 Glutamine-fructose-6-phosphate amidotransferase; catalyzes the formation of glucosamine-6-P and glutamate from fructose-6-P and glutamine in the first step of chitin biosynthesis; GFA1 has a paralogous region, comprising ORFs YMR084W-YMR085W, that arose from the whole genome duplication +S000030506 CDS YKL104C 11 245373 243220 C 2011-02-03 1996-07-31 +S000001586 ORF Verified YKL103C APE1 metalloaminopeptidase APE1|LAP4|API|YSC1 chromosome 11 L000000930 11 247682 246138 C -138 2011-02-03 1996-07-31 Vacuolar aminopeptidase yscI; zinc metalloproteinase that belongs to the peptidase family M18; often used as a marker protein in studies of autophagy and cytosol to vacuole targeting (CVT) pathway; protein increases in abundance and relative distribution to cytoplasmic foci increases upon DNA replication stress +S000030363 CDS YKL103C 11 247682 246138 C 2011-02-03 1996-07-31 +S000001585 ORF Dubious YKL102C chromosome 11 11 248367 248062 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; deletion confers sensitivity to citric acid; predicted protein would include a thiol-disulfide oxidoreductase active site +S000030203 CDS YKL102C 11 248367 248062 C 2011-02-03 1996-07-31 +S000001584 ORF Verified YKL101W HSL1 protein kinase HSL1|ELM2|NIK1 chromosome 11 L000003129|L000002839 11 248920 253476 W 2011-02-03 1996-07-31|2011-02-03 Nim1p-related protein kinase; septin-binding kinase that localizes to the bud neck septin ring and regulates the morphogenesis checkpoint; phosphorylates Hsl7p and cooperates with Elm1p to recruit Hsl7p to the mother-bud neck, as a prerequisite for the subsequent recruitment, phosphorylation, and degradation of Swe1p; autophosphorylation enhances interactions with Hsl7p +S000037537 CDS YKL101W 11 248920 253476 W 2011-02-03 1996-07-31|2011-02-03 +S000028840 ORF Dubious YKL100W-A chromosome 11 11 254159 254248 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034525 CDS YKL100W-A 11 254159 254248 W 2011-02-03 2003-07-29 +S000001583 ORF Verified YKL100C YPF1 aspartic endopeptidase chromosome 11 11 255460 253697 C 2011-02-03 1996-07-31 Intramembrane aspartyl protease of the perinuclear ER membrane; acts in a branch of ER-associated degradation (ERAD) that degrades functional proteins rather than misfolded proteins; regulates abundance of high-affinity plasma membrane transporters, such as Ctr1p and Zrt1p, during the starvation response; has a presenilin fold; member of the GxGD family of intramembrane proteases; closest human homolog is signal peptide peptidase (SPP) +S000037360 CDS YKL100C 11 255460 253697 C 2011-02-03 1996-07-31 +S000001582 ORF Verified YKL099C UTP11 rRNA-processing protein UTP11 chromosome 11 11 256472 255720 C 2011-02-03 1996-07-31|2005-12-15 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit +S000031999 CDS YKL099C 11 256472 255720 C 2011-02-03 1996-07-31|2005-12-15 +S000001581 ORF Verified YKL098W MTC2 chromosome 11 11 256770 257843 W 2011-02-03 1996-07-31 Protein of unknown function; mtc2 is synthetically sick with cdc13-1 +S000031070 CDS YKL098W 11 256770 257843 W 2011-02-03 1996-07-31 +S000001580 ORF Dubious YKL097C chromosome 11 11 258913 258503 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species +S000030940 CDS YKL097C 11 258913 258503 C 2011-02-03 1996-07-31 +S000028667 ORF Uncharacterized YKL096C-B chromosome 11 11 259222 259073 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032492 CDS YKL096C-B 11 259222 259073 C 2011-02-03 2003-07-29 +S000001956 ORF Verified YKL096W-A CWP2 YKL097W-A|LPR1 chromosome 11 L000000952|L000002857 11 259253 259531 W 2011-02-03 1996-07-31 Covalently linked cell wall mannoprotein; major constituent of the cell wall; plays a role in stabilizing the cell wall; involved in low pH resistance; precursor is GPI-anchored +S000037786 CDS YKL096W-A 11 259253 259531 W 2011-02-03 1996-07-31 +S000001579 ORF Verified YKL096W CWP1 YJU1 chromosome 11 L000000446|L000002512 11 261132 261851 W 2011-02-03 1996-07-31 Cell wall mannoprotein that localizes to birth scars of daughter cells; linked to a beta-1,3- and beta-1,6-glucan heteropolymer through a phosphodiester bond; required for propionic acid resistance +S000030917 CDS YKL096W 11 261132 261851 W 2011-02-03 1996-07-31 +S000001578 ORF Verified YKL095W YJU2 mRNA splicing protein YJU2|CWC16 chromosome 11 L000002513 11 262277 263113 W 2011-02-03 1996-07-31 Essential protein required for pre-mRNA splicing; associates transiently with the spliceosomal NTC ("nineteen complex") and acts after Prp2p to promote the first catalytic reaction of splicing +S000030823 CDS YKL095W 11 262277 263113 W 2011-02-03 1996-07-31 +S000001577 ORF Verified YKL094W YJU3 acylglycerol lipase chromosome 11 L000002514 11 263349 264290 W 2011-02-03 1996-07-31 Monoglyceride lipase (MGL); functional ortholog of mammalian MGL, localizes to lipid particles and membranes, also member of the eukaryotic serine hydrolase family +S000037906 CDS YKL094W 11 263349 264290 W 2011-02-03 1996-07-31 +S000001576 ORF Verified YKL093W MBR1 chromosome 11 L000001033 11 264789 265808 W 2011-02-03 1996-07-31 Protein involved in mitochondrial functions and stress response; overexpression suppresses growth defects of hap2, hap3, and hap4 mutants; MBR1 has a paralog, ISF1, that arose from the whole genome duplication +S000037808 CDS YKL093W 11 264789 265808 W 2011-02-03 1996-07-31 +S000001575 ORF Verified YKL092C BUD2 ERC25|CLA2 chromosome 11 L000000199 11 269459 266145 C 2011-02-03 1996-07-31 GTPase activating factor for Rsr1p/Bud1p; plays a role in spindle position checkpoint distinct from its role in bud site selection; required for both axial and bipolar budding patterns; mutants exhibit random budding in all cell types; contains two PH-like domains +S000037705 CDS YKL092C 11 269459 266145 C 2011-02-03 1996-07-31 +S000001574 ORF Verified YKL091C phosphatidylinositol/phosphatidylcholine-binding protein|SFH1 chromosome 11 11 270650 269718 C 2011-02-03 1996-07-31 Putative phosphatidylinositol/phosphatidylcholine transfer protein; possibly involved in lipid metabolism; localizes to the nucleus; contains a CRAL/TRIO domain and binds several lipids in a large-scale study; YKL091C has a paralog, SEC14, that arose from the whole genome duplication +S000036936 CDS YKL091C 11 270650 269718 C 2011-02-03 1996-07-31 +S000001573 ORF Verified YKL090W CUE2 chromosome 11 11 271878 273209 W 2011-02-03 1996-07-31 Protein of unknown function; has two CUE domains that bind ubiquitin, which may facilitate intramolecular monoubiquitination +S000036908 CDS YKL090W 11 271878 273209 W 2011-02-03 1996-07-31 +S000001572 ORF Verified YKL089W MIF2 chromosome 11 L000001109 11 273394 275043 W -43 2011-02-03 1996-07-31 Protein required for structural integrity of elongating spindles; localizes to the kinetochore; interacts with histones H2A, H2B, and H4; phosphorylated by Ipl1p; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-C and fission yeast cnp3 +S000036033 CDS YKL089W 11 273394 275043 W 2011-02-03 1996-07-31 +S000001571 ORF Verified YKL088W CAB3 phosphopantothenoylcysteine decarboxylase complex subunit CAB3 chromosome 11 11 275283 276998 W 2011-02-03 1996-07-31 Subunit of PPCDC and CoA-SPC complexes involved in CoA biosynthesis; subunits of the phosphopantothenoylcysteine decarboxylase (PPCDC) complex are: Cab3p, Sis2p, Vhs3p, while the subunits of the CoA-synthesizing protein complex (CoA-SPC) are: Cab2p, Cab3p, Cab4p, and Cab5p as well as Sis2p and Vhs3p; null mutant lethality is complemented by E. coli coaBC +S000035891 CDS YKL088W 11 275283 276998 W 2011-02-03 1996-07-31 +S000001570 ORF Verified YKL087C CYT2 cytochrome c1 heme lyase CYT2|CC1HL chromosome 11 L000000473 11 277863 277189 C 2011-02-03 1996-07-31 Cytochrome c1 heme lyase; involved in maturation of cytochrome c1, which is a subunit of the mitochondrial ubiquinol-cytochrome-c reductase; links heme covalently to apocytochrome c1; human homolog HCCS can complement yeast cyt2 null mutant +S000034890 CDS YKL087C 11 277863 277189 C 2011-02-03 1996-07-31 +S000001569 ORF Verified YKL086W SRX1 sulfiredoxin chromosome 11 11 278281 278664 W 2011-02-03 1996-07-31 Sulfiredoxin; contributes to oxidative stress resistance by reducing cysteine-sulfinic acid groups in the peroxiredoxin Tsa1p, which is formed upon exposure to oxidants; conserved in higher eukaryotes; protein abundance increases in response to DNA replication stress +S000034838 CDS YKL086W 11 278281 278664 W 2011-02-03 1996-07-31 +S000001568 ORF Verified YKL085W MDH1 malate dehydrogenase MDH1 chromosome 11 L000001045 11 279123 280127 W 2011-02-03 1996-07-31 Mitochondrial malate dehydrogenase; catalyzes interconversion of malate and oxaloacetate; involved in the tricarboxylic acid (TCA) cycle; phosphorylated +S000034670 CDS YKL085W 11 279123 280127 W 2011-02-03 1996-07-31 +S000001567 ORF Verified YKL084W HOT13 chromosome 11 11 280509 280859 W 2011-02-03 1996-07-31 Zinc-binding mitochondrial intermembrane space (IMS) protein; involved in a disulfide relay system for IMS import of cysteine-containing proteins; binds Mia40p and stimulates its Erv1p-dependent oxidation, probably by sequestering zinc +S000033808 CDS YKL084W 11 280509 280859 W 2011-02-03 1996-07-31 +S000001566 ORF Dubious YKL083W chromosome 11 11 280921 281535 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified essential gene RRP14 +S000033660 CDS YKL083W 11 280921 281535 W 2011-02-03 1996-07-31 +S000001565 ORF Verified YKL082C RRP14 ribosome biosynthesis protein RRP14 chromosome 11 11 282329 281025 C 2011-02-03 1996-07-31 Essential protein, constituent of 66S pre-ribosomal particles; interacts with proteins involved in ribosomal biogenesis and cell polarity; member of the SURF-6 family +S000033529 CDS YKL082C 11 282329 281025 C 2011-02-03 1996-07-31 +S000001564 ORF Verified YKL081W TEF4 translation elongation factor EF1B gamma|EFC1 chromosome 11 L000002280 11 282891 284455 W 2011-02-03 1996-07-31 Gamma subunit of translational elongation factor eEF1B; stimulates the binding of aminoacyl-tRNA (AA-tRNA) to ribosomes by releasing eEF1A (Tef1p/Tef2p) from the ribosomal complex +S000033487 CDS YKL081W 11 282891 283095 W 2011-02-03 1996-07-31 +S000033488 CDS YKL081W 11 283422 284455 W 2011-02-03 1996-07-31 +S000033489 intron YKL081W 11 283096 283421 W 2011-02-03 1996-07-31 +S000007301 snoRNA_gene snR38 SNR38 chromosome 11 L000003053 11 283185 283279 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G2815 +S000036768 noncoding_exon snR38 11 283185 283279 W 2011-02-03 2000-05-19 +S000001563 ORF Verified YKL080W VMA5 H(+)-transporting V1 sector ATPase subunit C|VAT3|CSL5 chromosome 11 L000002460 11 285030 286208 W 2011-02-03 1996-07-31 Subunit C of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; required for the V1 domain to assemble onto the vacuolar membrane; the V1 peripheral membrane domain of vacuolar H+-ATPase (V-ATPase) has eight subunits +S000032748 CDS YKL080W 11 285030 286208 W 2011-02-03 1996-07-31 +S000001562 ORF Verified YKL079W SMY1 chromosome 11 L000001940 11 286603 288573 W 2011-02-03 1996-07-31 Kinesin-like myosin passenger-protein; interacts with Myo2p and enhances its interaction with Sec4p during transport of secretory vesicles; controls actin cable structure and dynamics +S000031903 CDS YKL079W 11 286603 288573 W 2011-02-03 1996-07-31 +S000001561 ORF Verified YKL078W DHR2 RNA helicase chromosome 11 11 288845 291052 W 2011-02-03 1996-07-31 Predominantly nucleolar DEAH-box ATP-dependent RNA helicase; required for 18S rRNA synthesis +S000031760 CDS YKL078W 11 288845 291052 W 2011-02-03 1996-07-31 +S000001560 ORF Uncharacterized YKL077W chromosome 11 11 291453 292631 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole +S000031669 CDS YKL077W 11 291453 292631 W 2011-02-03 1996-07-31 +S000001559 ORF Dubious YKL076C PSY1 chromosome 11 11 293221 292838 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 69% of ORF overlaps the uncharacterized ORF YKL075C +S000031531 CDS YKL076C 11 293221 292838 C 2011-02-03 1996-07-31 +S000001558 ORF Uncharacterized YKL075C chromosome 11 11 294308 292956 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; proposed to be involved in resistance to streptozotocin and camptothecin +S000030667 CDS YKL075C 11 294308 292956 C 2011-02-03 1996-07-31 +S000001557 ORF Verified YKL074C MUD2 chromosome 11 L000002794 11 296193 294610 C 2011-02-03 1996-07-31 Protein involved in early pre-mRNA splicing; component of the pre-mRNA-U1 snRNP complex, the commitment complex; interacts with Msl5p/BBP splicing factor and Sub2p; similar to metazoan splicing factor U2AF65 +S000030581 CDS YKL074C 11 296193 294610 C 2011-02-03 1996-07-31 +S000001556 ORF Verified YKL073W LHS1 Hsp70 family chaperone LHS1|SSI1|CER1 chromosome 11 L000004102 11 296430 299075 W 2011-02-03 1996-07-31 Molecular chaperone of the endoplasmic reticulum lumen; involved in polypeptide translocation and folding; nucleotide exchange factor for the ER lumenal Hsp70 chaperone Kar2p; regulated by the unfolded protein response pathway +S000030511 CDS YKL073W 11 296430 299075 W 2011-02-03 1996-07-31 +S000001555 ORF Verified YKL072W STB6 chromosome 11 L000003369 11 299582 301882 W 2011-02-03 1996-07-31 Protein that binds Sin3p in a two-hybrid assay; STB6 has a paralog, STB2, that arose from the whole genome duplication +S000030364 CDS YKL072W 11 299582 301882 W 2011-02-03 1996-07-31 +S000007052 long_terminal_repeat YKLCdelta5 chromosome 11 11 302625 302334 C 2011-02-03 2000-05-19 Ty1 LTR +S000006774 tRNA_gene tW(CCA)K chromosome 11 L000003633 11 302918 303023 W 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis +S000033327 intron tW(CCA)K 11 302954 302987 W 2011-02-03 2000-05-19 +S000033325 noncoding_exon tW(CCA)K 11 302918 302953 W 2011-02-03 2000-05-19 +S000033326 noncoding_exon tW(CCA)K 11 302988 303023 W 2011-02-03 2000-05-19 +S000001554 ORF Uncharacterized YKL071W chromosome 11 11 305114 305884 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression induced in cells treated with the mycotoxin patulin, and also the quinone methide triterpene celastrol; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000037597 CDS YKL071W 11 305114 305884 W 2011-02-03 1996-07-31 +S000001553 ORF Uncharacterized YKL070W chromosome 11 11 306211 306720 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression induced in cells treated with mycotoxins patulin or citrinin; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000037452 CDS YKL070W 11 306211 306720 W 2011-02-03 1996-07-31 +S000001552 ORF Verified YKL069W L-methionine (R)-S-oxide reductase|fRMsr|YKG9 chromosome 11 11 307285 307827 W 2011-02-03 1996-07-31 Methionine-R-sulfoxide reductase; reduces the R enantiomer of free Met-SO, in contrast to Ycl033Cp which reduces Met-R-SO in a peptide linkage; has a role in protection against oxidative stress; relative distribution to the nucleus increases upon DNA replication stress +S000036847 CDS YKL069W 11 307285 307827 W 2011-02-03 1996-07-31 +S000006760 tRNA_gene tV(AAC)K1 chromosome 11 L000003641 11 308217 308144 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000037869 noncoding_exon tV(AAC)K1 11 308217 308144 C 2011-02-03 2000-05-19 +S000028524 ORF Uncharacterized YKL068W-A chromosome 11 11 309206 309442 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by homology to Ashbya gossypii +S000030323 CDS YKL068W-A 11 309206 309442 W 2011-02-03 2003-07-29 +S000001551 ORF Verified YKL068W NUP100 FG-nucleoporin NUP100|[NUP100+]|NSP100 chromosome 11 L000001292 11 310199 313078 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier and is involved in gene tethering at the nuclear periphery; NUP100 has a paralog, NUP116, that arose from the whole genome duplication +S000036782 CDS YKL068W 11 310199 313078 W 2011-02-03 1996-07-31 +S000006598 tRNA_gene tH(GUG)K chromosome 11 L000003640 11 313472 313401 C 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000033889 noncoding_exon tH(GUG)K 11 313472 313401 C 2011-02-03 2000-05-19 +S000007053 long_terminal_repeat YKLCdelta6 chromosome 11 11 313919 313602 C 2011-02-03 2000-05-19 Ty1 LTR +S000007057 long_terminal_repeat YKLWdelta7 chromosome 11 11 314193 314524 W 2011-02-03 2000-05-19 Ty1 LTR +S000001550 ORF Verified YKL067W YNK1 nucleoside diphosphate kinase|NDK1 chromosome 11 L000002536 11 314812 315273 W 2011-02-03 1996-07-31 Nucleoside diphosphate kinase; catalyzes the transfer of gamma phosphates from nucleoside triphosphates, usually ATP, to nucleoside diphosphates by a mechanism that involves formation of an autophosphorylated enzyme intermediate; protein abundance increases in response to DNA replication stress +S000036722 CDS YKL067W 11 314812 315273 W 2011-02-03 1996-07-31 +S000001549 ORF Dubious YKL066W chromosome 11 11 315281 315724 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified gene YNK1 +S000036665 CDS YKL066W 11 315281 315724 W 2011-02-03 1996-07-31 +S000113563 ORF Uncharacterized YKL065W-A chromosome 11 11 315954 316175 W 2011-02-03 2005-11-17 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum (ER) while mCherry fusion localizes to both the ER and vacuole +S000113565 CDS YKL065W-A 11 315954 316175 W 2011-02-03 2005-11-17 +S000001548 ORF Verified YKL065C YET1 chromosome 11 L000003484 11 317057 316437 C 2011-02-03 1996-07-31|2011-02-03 Endoplasmic reticulum transmembrane protein; may interact with ribosomes, based on co-purification experiments; homolog of human BAP31 protein; YET1 has a paralog, YET2, that arose from the whole genome duplication +S000035692 CDS YKL065C 11 317057 316437 C 2011-02-03 1996-07-31|2011-02-03 +S000001547 ORF Verified YKL064W MNR2 putative Mg(2+) transporter MNR2 chromosome 11 L000003203 11 317764 320673 W 2011-02-03 1996-07-31 Vacuolar membrane protein required for magnesium homeostasis; putative magnesium transporter; has similarity to Alr1p and Alr2p, which mediate influx of Mg2+ and other divalent cations; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs) +S000035630 CDS YKL064W 11 317764 320673 W 2011-02-03 1996-07-31 +S000001546 ORF Uncharacterized YKL063C chromosome 11 11 321518 321015 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the Golgi +S000035510 CDS YKL063C 11 321518 321015 C 2011-02-03 1996-07-31 +S000001545 ORF Verified YKL062W MSN4 stress-responsive transcriptional activator MSN4 chromosome 11 L000001199 11 323228 325120 W 2011-02-03 1996-07-31 Stress-responsive transcriptional activator; activated in stochastic pulses of nuclear localization in response to various stress conditions; binds DNA at stress response elements of responsive genes, inducing gene expression; involved in diauxic shift +S000034556 CDS YKL062W 11 323228 325120 W 2011-02-03 1996-07-31 +S000001544 ORF Verified YKL061W BLI1 chromosome 11 11 325771 326112 W 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Msb3p; green fluorescent protein (GFP)-fusion protein localizes to the endosome +S000034423 CDS YKL061W 11 325771 326112 W 2011-02-03 1996-07-31 +S000001543 ORF Verified YKL060C FBA1 fructose-bisphosphate aldolase FBA1|LOT1 chromosome 11 L000000604 11 327487 326408 C 2011-02-03 1996-07-31 Fructose 1,6-bisphosphate aldolase; required for glycolysis and gluconeogenesis; catalyzes conversion of fructose 1,6 bisphosphate to glyceraldehyde-3-P and dihydroxyacetone-P; locates to mitochondrial outer surface upon oxidative stress; N-terminally propionylated in vivo +S000034296 CDS YKL060C 11 327487 326408 C 2011-02-03 1996-07-31 +S000001542 ORF Verified YKL059C MPE1 cleavage polyadenylation factor subunit MPE1 chromosome 11 11 329443 328118 C 2011-02-03 1996-07-31 Essential conserved subunit of CPF cleavage and polyadenylation factor; plays a role in 3' end formation of mRNA via the specific cleavage and polyadenylation of pre-mRNA; contains a ubiquitin-like (UBL) domain, a RNA-binding zinc knuckle motif and a RING finger domain; both the zinc knuckle and RING finger are required for pre-mRNA binding; possible role in ubiquitination of Pap1p; relocalizes to the cytosol in response to hypoxia +S000033369 CDS YKL059C 11 329443 328118 C 2011-02-03 1996-07-31 +S000118403 ARS ARS1109 ARSXI-329 chromosome 11 11 329682 329930 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000001541 ORF Verified YKL058W TOA2 transcription initiation factor IIA subunit gamma chromosome 11 L000002317 11 330166 330534 W 2011-02-03 1996-07-31 TFIIA small subunit; involved in transcriptional activation, acts as antirepressor or as coactivator; required, along with Toa1p, for ribosomal protein gene transcription in vivo; homologous to smallest subunit of human and Drosophila TFIIA; protein abundance increases in response to DNA replication stress +S000033347 CDS YKL058W 11 330166 330534 W 2011-02-03 1996-07-31 +S000001540 ORF Verified YKL057C NUP120 RAT2 chromosome 11 L000003138 11 333969 330856 C 2011-02-03 1996-07-31 Subunit of the Nup84p subcomplex of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport and NPC biogenesis and is involved in establishment of a normal nucleocytoplasmic concentration gradient of the GTPase Gsp1p; also plays roles in several processes that may require localization of genes or chromosomes at the nuclear periphery, including double-strand break repair, transcription and chromatin silencing; homologous to human NUP160 +S000032581 CDS YKL057C 11 333969 330856 C 2011-02-03 1996-07-31 +S000001539 ORF Verified YKL056C TMA19 MMI1|RBF18 chromosome 11 11 334915 334412 C 2011-02-03 1996-07-31 Protein that associates with ribosomes; homolog of translationally controlled tumor protein; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and relocates to the mitochondrial outer surface upon oxidative stress +S000032498 CDS YKL056C 11 334915 334412 C 2011-02-03 1996-07-31 +S000001538 ORF Verified YKL055C OAR1 3-oxoacyl-[acyl-carrier-protein] reductase (NADPH) chromosome 11 11 336157 335321 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial 3-oxoacyl-[acyl-carrier-protein] reductase; may comprise a type II mitochondrial fatty acid synthase along with Mct1p; human homolog CBR4 complements yeast null mutant +S000032402 CDS YKL055C 11 336157 335321 C 2011-02-03 1996-07-31|2011-02-03 +S000001537 ORF Verified YKL054C DEF1 DNA damage-responsive RNA polymerase-degradation factor DEF1|VID31 chromosome 11 11 338753 336537 C 2011-02-03 1996-07-31 RNAPII degradation factor; forms a complex with Rad26p in chromatin, enables ubiquitination and proteolysis of RNAPII present in an elongation complex; mutant is deficient in Zip1p loading onto chromosomes during meiosis +S000031390 CDS YKL054C 11 338753 336537 C 2011-02-03 1996-07-31 +S000007243 ORF Verified YKL053C-A MDM35 chromosome 11 11 339442 339182 C 2011-02-03 1999-07-17 Mitochondrial intermembrane space protein; forms complex with Ups2p that transfers phosphatidylserine from outer membrane to inner membrane for phosphatidylethanolamine synthesis; mutation affects mitochondrial distribution and morphology; contains twin cysteine-x9-cysteine motifs; protein abundance increases in response to DNA replication stress +S000032996 CDS YKL053C-A 11 339442 339182 C 2011-02-03 1999-07-17 +S000001536 ORF Dubious YKL053W chromosome 11 11 339572 339946 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF ASK1 +S000031321 CDS YKL053W 11 339572 339946 W 2011-02-03 1996-07-31 +S000001535 ORF Verified YKL052C ASK1 chromosome 11 11 340546 339668 C 2011-02-03 1996-07-31|2008-06-03 Essential subunit of the Dam1 complex (aka DASH complex); couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; phosphorylated during the cell cycle by cyclin-dependent kinases; sumoylated in an Mms21p-dependent manner; protein abundance increases in response to DNA replication stress +S000031156 CDS YKL052C 11 340546 339668 C 2011-02-03 1996-07-31|2008-06-03 +S000001534 ORF Verified YKL051W SFK1 chromosome 11 11 341312 342373 W 2011-02-03 1996-07-31 Plasma membrane protein that may act to generate normal levels of PI4P; may act together with or upstream of Stt4p; at least partially mediates proper localization of Stt4p to the plasma membrane +S000031104 CDS YKL051W 11 341312 342373 W 2011-02-03 1996-07-31 +S000001533 ORF Verified YKL050C chromosome 11 11 345620 342852 C 2011-02-03 1996-07-31 Protein of unknown function; the YKL050W protein is a target of the SCFCdc4 ubiquitin ligase complex and YKL050W transcription is regulated by Azf1p; YKL050C has a paralog, EIS1, that arose from the whole genome duplication +S000030029 CDS YKL050C 11 345620 342852 C 2011-02-03 1996-07-31 +S000001532 ORF Verified YKL049C CSE4 centromeric DNA-binding histone H3-like protein CSE4|CSL2 chromosome 11 L000002719 11 346764 346075 C 2011-02-03 2003-01-10|1996-07-31|2003-01-08 Histone H3-like centromere protein; associated with promoters, accessible chromatin, RNAPII-bound regions; phosphorylated Cse4p associates with centromeres; required for proper kinetochore function; levels regulated by E3 ubiquitin ligase Psh1p; phosphorylation may destabilize defective kinetochores to promote bi-orientation; ubiquitination of N-terminus regulates proteolysis for faithful chromosome segregation; yeast CSE4 can complement mutations in human homolog CENPA +S000037076 CDS YKL049C 11 346764 346075 C 2011-02-03 2003-01-10|1996-07-31|2003-01-08 +S000001531 ORF Verified YKL048C ELM1 serine/threonine protein kinase ELM1|LDB9 chromosome 11 L000000548 11 349136 347214 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; regulates the orientation checkpoint, the morphogenesis checkpoint and the metabolic switch from fermentative to oxidative metabolism by phosphorylating the activation loop of Kin4p, Hsl1p and Snf4p respectively; cooperates with Hsl7p in recruiting Hsl1p to the septin ring, a prerequisite for subsequent recruitment, phosphorylation, and degradation of Swe1p; forms part of the bud neck ring; regulates cytokinesis +S000036436 CDS YKL048C 11 349136 347214 C 2011-02-03 1996-07-31 +S000001530 ORF Verified YKL047W ANR2 chromosome 11 S000114863 11 349463 351013 W 2011-02-03 1996-07-31 Protein of unknown function; may have a role in lipid metabolism, based on localization to lipid droplets; predicted to be palmitoylated +S000036411 CDS YKL047W 11 349463 351013 W 2011-02-03 1996-07-31 +S000001529 ORF Verified YKL046C DCW1 putative mannan endo-1,6-alpha-mannosidase chromosome 11 11 352624 351275 C 2011-02-03 1996-07-31 Putative mannosidase; GPI-anchored membrane protein required for cell wall biosynthesis in bud formation;homologous to Dfg5p +S000036235 CDS YKL046C 11 352624 351275 C 2011-02-03 1996-07-31 +S000001528 ORF Verified YKL045W PRI2 DNA primase subunit PRI2 chromosome 11 L000001490 11 353493 355079 W 2011-02-03 1996-07-31 Subunit of DNA primase; DNA primase is required for DNA synthesis and double-strand break repair +S000036183 CDS YKL045W 11 353493 355079 W 2011-02-03 1996-07-31 +S000001527 ORF Verified YKL044W MMO1 chromosome 11 11 356322 356642 W 2011-02-03 1996-07-31 Protein of unknown function; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the mitochondria; mRNA identified as translated by ribosome profiling data; MMO1 is a non-essential gene +S000035237 CDS YKL044W 11 356322 356642 W 2011-02-03 1996-07-31 +S000001526 ORF Verified YKL043W PHD1 chromosome 11 L000001417 11 356748 357848 W 2011-02-03 1996-07-31 Transcriptional activator that enhances pseudohyphal growth; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; regulates expression of FLO11, an adhesin required for pseudohyphal filament formation; similar to StuA, an A. nidulans developmental regulator; potential Cdc28p substrate; PHD1 has a paralog, SOK2, that arose from the whole genome duplication +S000035082 CDS YKL043W 11 356748 357848 W 2011-02-03 1996-07-31 +S000001525 ORF Verified YKL042W SPC42 chromosome 11 L000004148 11 358475 359566 W 2011-02-03 1996-07-31 Central plaque component of spindle pole body (SPB); involved in SPB duplication, may facilitate attachment of the SPB to the nuclear membrane +S000034904 CDS YKL042W 11 358475 359566 W 2011-02-03 1996-07-31 +S000001524 ORF Verified YKL041W VPS24 ESCRT-III subunit protein VPS24|VPL26|DID3 chromosome 11 L000004158 11 360143 360817 W 2011-02-03 1996-07-31 One of four subunits of the ESCRT-III complex; forms an endosomal sorting complex required for transport III (ESCRT-III) subcomplex with Did4p; involved in the sorting of transmembrane proteins into the multivesicular body (MVB) pathway +S000034024 CDS YKL041W 11 360143 360817 W 2011-02-03 1996-07-31 +S000001523 ORF Verified YKL040C NFU1 NUB1 chromosome 11 L000004771 11 361828 361058 C 2011-02-03 1996-07-31 Protein involved in Fe-S cluster transfer to mitochondrial clients; protects [4Fe-4S] clusters from damage due to oxidative stress; acts along with Bol3 at a late step in the transfer of [4Fe-4S] clusters from the ISA complex to client proteins; Fe-S loaded homodimer at steady state; similar to NifU, a bacterial protein required for Fe/S cluster maturation; ortholog of the human NFU1, mutations of which are associated with Multiple Mitochondria Dysfunctions Syndrome (MMDS1) +S000033793 CDS YKL040C 11 361828 361058 C 2011-02-03 1996-07-31 +S000001522 ORF Verified YKL039W PTM1 chromosome 11 L000001524 11 362622 364193 W 2011-02-03 1996-07-31|2005-12-15 Protein of unknown function; copurifies with late Golgi vesicles containing the v-SNARE Tlg2p; PTM1 has a paralog, YHL017W, that arose from the whole genome duplication +S000035013 CDS YKL039W 11 362622 364193 W 2011-02-03 1996-07-31|2005-12-15 +S000006460 snoRNA_gene snR69 SNR69 chromosome 11 L000004538 11 364776 364876 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2948 +S000030857 noncoding_exon snR69 11 364776 364876 W 2011-02-03 2000-05-19 +S000001521 ORF Verified YKL038W RGT1 chromosome 11 L000003482 11 365605 369117 W 2011-02-03 1996-07-31 Glucose-responsive transcription factor; regulates expression of several glucose transporter (HXT) genes in response to glucose; binds to promoters and acts both as a transcriptional activator and repressor; recruits Tup1p/Cyc8p to target gene promoters; RGT1 has a paralog, EDS1, that arose from the whole genome duplication +S000034833 CDS YKL038W 11 365605 369117 W 2011-02-03 1996-07-31 +S000001520 ORF Verified YKL037W AIM26 chromosome 11 11 369365 369721 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant is viable and displays elevated frequency of mitochondrial genome loss; null mutation confers sensitivity to tunicamycin and DTT +S000032888 CDS YKL037W 11 369365 369721 W 2011-02-03 1996-07-31 +S000001518 ORF Verified YKL035W UGP1 UTP glucose-1-phosphate uridylyltransferase chromosome 11 L000003118 11 369891 371390 W 2011-02-03 1996-07-31 UDP-glucose pyrophosphorylase (UGPase); catalyses the reversible formation of UDP-Glc from glucose 1-phosphate and UTP, involved in a wide variety of metabolic pathways, expression modulated by Pho85p through Pho4p; involved in PKA-mediated oxidative stress resistance and long-term survival in stationary phase; UGP1 has a paralog, YHL012W, that arose from the whole genome duplication +S000032697 CDS YKL035W 11 369891 371390 W 2011-02-03 1996-07-31 +S000001519 ORF Dubious YKL036C chromosome 11 11 369920 369528 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the essential gene UGP1 gene and uncharacterized ORF YKL037W +S000032729 CDS YKL036C 11 369920 369528 C 2011-02-03 1996-07-31 +S000001517 ORF Verified YKL034W TUL1 ubiquitin-protein ligase TUL1 chromosome 11 11 371829 374105 W 2011-02-03 1996-07-31 Subunit of the DSC ubiquitin ligase complex; golgi-localized RING-finger ubiquitin ligase (E3) involved in sorting polar transmembrane domain containing membrane proteins to multivesicular bodies for delivery to the vacuole; proposed involvement in the quality control of misfolded TMD containing proteins; ortholog of fission yeast dsc1 +S000032625 CDS YKL034W 11 371829 374105 W 2011-02-03 1996-07-31 +S000007242 ORF Uncharacterized YKL033W-A putative hydrolase chromosome 11 11 374505 375215 W 2011-02-03 2004-02-13|1999-07-17 Putative protein of unknown function; similar to uncharacterized proteins from other fungi +S000036238 CDS YKL033W-A 11 374505 375215 W 2011-02-03 2004-02-13|1999-07-17 +S000001516 ORF Verified YKL033W TTI1 FMP47 chromosome 11 11 375456 378572 W 2011-02-03 1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; telomere length regulator involved in the stability or biogenesis of PIKKs such as TORC1; similar to S. pombe Tti1p; detected in highly purified mitochondria in high-throughput studies +S000031614 CDS YKL033W 11 375456 378572 W 2011-02-03 1996-07-31 +S000006761 tRNA_gene tV(AAC)K2 chromosome 11 L000003634 11 379680 379753 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000037883 noncoding_exon tV(AAC)K2 11 379680 379753 W 2011-02-03 2000-05-19 +S000001515 ORF Verified YKL032C IXR1 DNA-binding transcription repressor IXR1|ORD1 chromosome 11 L000000881 11 381858 380065 C 2011-02-03 1996-07-31 Transcriptional repressor that regulates hypoxic genes during normoxia; involved in the aerobic repression of genes such as COX5b, TIR1, and HEM13; binds DNA intrastrand cross-links formed by cisplatin; HMG (high mobility group box) domain containing protein which binds and bends cisplatin-modified DNA, blocking excision repair; IXR1 has a paralog, ABF2, that arose from the whole genome duplication +S000031407 CDS YKL032C 11 381858 380065 C 2011-02-03 1996-07-31 +S000001514 ORF Dubious YKL031W chromosome 11 11 382072 382485 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species +S000031365 CDS YKL031W 11 382072 382485 W 2011-02-03 1996-07-31 +S000001513 ORF Dubious YKL030W chromosome 11 11 382498 383103 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; partially overlaps the verified gene MAE1 +S000030446 CDS YKL030W 11 382498 383103 W 2011-02-03 1996-07-31 +S000001512 ORF Verified YKL029C MAE1 malate dehydrogenase (oxaloacetate-decarboxylating) chromosome 11 L000003506 11 384725 382716 C 2011-02-03 1996-07-31 Mitochondrial malic enzyme; catalyzes the oxidative decarboxylation of malate to pyruvate, which is a key intermediate in sugar metabolism and a precursor for synthesis of several amino acids +S000030570 CDS YKL029C 11 384725 382716 C 2011-02-03 1996-07-31 +S000001511 ORF Verified YKL028W TFA1 transcription factor TFIIE subunit TFA1 chromosome 11 L000002595 11 385758 387206 W 2011-02-03 1996-07-31 TFIIE large subunit; involved in recruitment of RNA polymerase II to the promoter, activation of TFIIH, and promoter opening +S000036771 CDS YKL028W 11 385758 387206 W 2011-02-03 1996-07-31 +S000001510 ORF Verified YKL027W TCD2 tRNA threonylcarbamoyladenosine dehydratase chromosome 11 11 387562 388905 W 2011-02-03 1996-07-31 tRNA threonylcarbamoyladenosine dehydratase; required for the ct6A tRNA base modification, where an adenosine at position 37 is modified to form a cyclized active ester with an oxazolone ring; localized to the mitochondrial outer membrane; TCD2 has a paralog, TCD1, that arose from the whole genome duplication +S000036685 CDS YKL027W 11 387562 388905 W 2011-02-03 1996-07-31 +S000118404 ARS ARS1112 ARSXI-389 chromosome 11 11 388970 389264 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000001509 ORF Verified YKL026C GPX1 glutathione peroxidase GPX1 chromosome 11 11 389883 389380 C 2011-02-03 1996-07-31 Phospholipid hydroperoxide glutathione peroxidase; induced by glucose starvation that protects cells from phospholipid hydroperoxides and nonphospholipid peroxides during oxidative stress; GPX1 has a paralog, HYR1, that arose from the whole genome duplication +S000036560 CDS YKL026C 11 389883 389380 C 2011-02-03 1996-07-31 +S000001508 ORF Verified YKL025C PAN3 ECM35 chromosome 11 L000003340 11 392279 390240 C 2011-02-03 1996-07-31 Essential subunit of the Pan2p-Pan3p poly(A)-ribonuclease complex; poly (A) mRNA binding subunit which recruits mRNA to the complex; the Pan2p-Pan3p complex controls poly(A) tail length and regulates the stoichiometry and activity of postreplication repair complexes +S000035620 CDS YKL025C 11 392279 390240 C 2011-02-03 1996-07-31 +S000001507 ORF Verified YKL024C URA6 bifunctional uridylate/adenylate kinase|SOC8 chromosome 11 L000002435 11 393140 392526 C 18 2011-02-03 1996-07-31 Uridylate kinase; catalyzes the seventh enzymatic step in the de novo biosynthesis of pyrimidines, converting uridine monophosphate (UMP) into uridine-5'-diphosphate (UDP) +S000035543 CDS YKL024C 11 393140 392526 C 2011-02-03 1996-07-31 +S000113559 ORF Uncharacterized YKL023C-A chromosome 11 11 393373 393146 C 2011-02-03 2005-11-17 Putative protein of unknown function +S000113560 CDS YKL023C-A 11 393373 393146 C 2011-02-03 2005-11-17 +S000001506 ORF Uncharacterized YKL023W chromosome 11 11 393721 394554 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; predicted by computational methods to be involved in mRNA degradation; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000035506 CDS YKL023W 11 393721 394554 W 2011-02-03 1996-07-31|2011-02-03 +S000001505 ORF Verified YKL022C CDC16 anaphase promoting complex subunit CDC16 chromosome 11 L000000256 11 397248 394726 C -15 2011-02-03 1996-07-31 Subunit of the anaphase-promoting complex/cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; required for sporulation; relocalizes to the cytosol in response to hypoxia +S000034410 CDS YKL022C 11 397248 394726 C 2011-02-03 1996-07-31 +S000001504 ORF Verified YKL021C MAK11 chromosome 11 L000000984 11 398750 397344 C -16 2011-02-03 1996-07-31 Protein involved in an early step of 60S ribosomal subunit biogenesis; essential for cell growth and replication of killer M1 dsRNA virus; contains four beta-transducin repeats +S000034298 CDS YKL021C 11 398750 397344 C 2011-02-03 1996-07-31 +S000001503 ORF Verified YKL020C SPT23 chromosome 11 L000002041 11 402080 398832 C 2011-02-03 1996-07-31 ER membrane protein involved in regulation of OLE1 transcription; inactive ER form dimerizes and one subunit is then activated by ubiquitin/proteasome-dependent processing followed by nuclear targeting; SPT23 has a paralog, MGA2, that arose from the whole genome duplication +S000034167 CDS YKL020C 11 402080 398832 C 2011-02-03 1996-07-31 +S000001502 ORF Verified YKL019W RAM2 bifunctional protein farnesyltransferase/protein geranylgeranyltransferase chromosome 11 L000001580 11 402568 403518 W 2011-02-03 1996-07-31 Alpha subunit of farnesyltransferase and geranylgeranyltransferase-I; farnesyltransferase (Ram2p-Ram1p heterodimer) catalyzes the addition of 15-carbon isoprenoid farnesyl to substrate proteins containing a CAAX consensus motif; type I geranylgeranyltransferase (Ram2p-Cdc43p heterodimer) catalyzes the addition of the 20-carbon isoprenoid geranylgeranyl to substrate proteins containing a CaaL consensus motif; required for membrane localization of Ras proteins and a-factor +S000034702 CDS YKL019W 11 402568 403518 W 2011-02-03 1996-07-31 +S000007615 ORF Uncharacterized YKL018C-A chromosome 11 11 403879 403580 C 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000037213 CDS YKL018C-A 11 403879 403580 C 2011-02-03 2001-02-26 +S000001501 ORF Verified YKL018W SWD2 WD-repeat containing protein SWD2|SAF37|CPS35 chromosome 11 11 404102 405091 W 2011-02-03 1996-07-31 Subunit of the COMPASS (Set1C) histone H3K4 methyltransferase complex; required for Set1C stability and optimal activity; COMPASS methylates histone H3 on lys 4 and is involved in telomeric silencing; subunit of CPF (cleavage and polyadenylation factor), a complex involved in RNAP II transcription termination +S000034635 CDS YKL018W 11 404102 405091 W 2011-02-03 1996-07-31 +S000001500 ORF Verified YKL017C HCS1 ATP-dependent 5'-3' DNA helicase HCS1|DIP1 chromosome 11 L000003087|L000004272 11 407241 405190 C 2011-02-03 1996-07-31 Hexameric DNA polymerase alpha-associated DNA helicase A; involved in lagging strand DNA synthesis; contains single-stranded DNA stimulated ATPase and dATPase activities; replication protein A stimulates helicase and ATPase activities +S000034495 CDS YKL017C 11 407241 405190 C 2011-02-03 1996-07-31 +S000001499 ORF Verified YKL016C ATP7 F1F0 ATP synthase subunit d chromosome 11 L000000146 11 407989 407465 C 2011-02-03 1996-07-31 Subunit d of the stator stalk of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis +S000032473 CDS YKL016C 11 407989 407465 C 2011-02-03 1996-07-31 +S000001498 ORF Verified YKL015W PUT3 chromosome 11 L000001537|L000001528 11 408544 411483 W -5 2011-02-03 1996-07-31 Transcriptional activator; binds specific gene recruitment sequences and is required for DNA zip code-mediated targeting of genes to nuclear periphery; regulates proline utilization genes, constitutively binds PUT1 and PUT2 promoters as a dimer, undergoes conformational change to form active state; binds other promoters only under activating conditions; differentially phosphorylated in presence of different nitrogen sources; has a Zn(2)-Cys(6) binuclear cluster domain +S000032428 CDS YKL015W 11 408544 411483 W 2011-02-03 1996-07-31 +S000001497 ORF Verified YKL014C URB1 NPA1 chromosome 11 11 416913 411619 C 2011-02-03 1996-07-31 Protein required for the normal accumulation of 25S and 5.8S rRNAs; nucleolar protein; associated with the 27SA2 pre-ribosomal particle; proposed to be involved in the biogenesis of the 60S ribosomal subunit +S000032267 CDS YKL014C 11 416913 411619 C 2011-02-03 1996-07-31 +S000118405 ARS ARS1113 ARSXI-417 chromosome 11 11 417185 417417 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000001496 ORF Verified YKL013C ARC19 chromosome 11 L000004034 11 418023 417508 C 2011-02-03 1996-07-31 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches; mutation is functionally complemented by human ARPC4 +S000031281 CDS YKL013C 11 418023 417508 C 2011-02-03 1996-07-31 +S000001495 ORF Verified YKL012W PRP40 chromosome 11 L000003078 11 418310 420061 W 2011-02-03 1996-07-31 U1 snRNP protein involved in splicing; interacts with the branchpoint-binding protein during the formation of the second commitment complex +S000031220 CDS YKL012W 11 418310 420061 W 2011-02-03 1996-07-31 +S000001494 ORF Verified YKL011C CCE1 cruciform cutting endonuclease|MGT1 chromosome 11 L000000236 11 421216 420155 C -2 2011-02-03 1996-07-31 Mitochondrial cruciform cutting endonuclease; cleaves Holliday junctions formed during recombination of mitochondrial DNA; CCE1 has a paralog, MRS1, that arose from the whole genome duplication +S000031036 CDS YKL011C 11 421216 420155 C 2011-02-03 1996-07-31 +S000001493 ORF Verified YKL010C UFD4 putative ubiquitin-protein ligase UFD4 chromosome 11 L000003509 11 425875 421424 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase (E3); interacts with Rpt4p and Rpt6p, two subunits of the 19S particle of the 26S proteasome; cytoplasmic E3 involved in the degradation of ubiquitin fusion proteins; relative distribution to the nucleus increases upon DNA replication stress +S000030049 CDS YKL010C 11 425875 421424 C 2011-02-03 1996-07-31 +S000001492 ORF Verified YKL009W MRT4 chromosome 11 L000004450 11 426242 426952 W 2011-02-03 1996-07-31 Protein involved in mRNA turnover and ribosome assembly; required at post-transcriptional step for efficient retrotransposition; localizes to the nucleolus +S000030485 CDS YKL009W 11 426242 426952 W 2011-02-03 1996-07-31 +S000001491 ORF Verified YKL008C LAC1 sphingosine N-acyltransferase LAC1|DGT1 chromosome 11 11 428551 427295 C 2011-02-03 1996-07-31 Ceramide synthase component; involved in synthesis of ceramide from C26(acyl)-coenzyme A and dihydrosphingosine or phytosphingosine, functionally equivalent to Lag1p; LAC1 has a paralog, LAG1, that arose from the whole genome duplication +S000030290 CDS YKL008C 11 428551 427295 C 2011-02-03 1996-07-31 +S000001490 ORF Verified YKL007W CAP1 chromosome 11 L000000214 11 429302 430108 W -2 2011-02-03 1996-07-31 Alpha subunit of the capping protein heterodimer (Cap1p and Cap2p); capping protein (CP) binds to the barbed ends of actin filaments preventing further polymerization; localized predominantly to cortical actin patches; protein increases in abundance and relocalizes from bud neck to plasma membrane upon DNA replication stress +S000030183 CDS YKL007W 11 429302 430108 W 2011-02-03 1996-07-31 +S000002101 ORF Verified YKL006C-A SFT1 chromosome 11 L000002949 11 430632 430198 C 2011-02-03 1996-07-31 Intra-Golgi v-SNARE; required for transport of proteins between an early and a later Golgi compartment +S000037319 CDS YKL006C-A 11 430455 430198 C 2011-02-03 1996-07-31 +S000037318 CDS YKL006C-A 11 430632 430597 C 2011-02-03 1996-07-31 +S000037320 intron YKL006C-A 11 430596 430456 C 2011-02-03 1996-07-31 +S000114301 snoRNA_gene snR87 SNR87 chromosome 11 11 431138 431030 C 2011-02-03 2006-03-02 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A436 +S000114518 noncoding_exon snR87 11 431138 431030 C 2011-02-03 2006-03-02 +S000001489 ORF Verified YKL006W RPL14A eL14|ribosomal 60S subunit protein L14A|L14e|L14A chromosome 11 L000002706 11 431906 432720 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L14A; N-terminally acetylated; homologous to mammalian ribosomal protein L14, no bacterial homolog; RPL14A has a paralog, RPL14B, that arose from the whole genome duplication +S000030075 CDS YKL006W 11 431906 432034 W 2011-02-03 1996-07-31 +S000030076 CDS YKL006W 11 432433 432720 W 2011-02-03 1996-07-31 +S000030077 intron YKL006W 11 432035 432432 W 2011-02-03 1996-07-31 +S000001488 ORF Verified YKL005C BYE1 chromosome 11 11 434877 433093 C 2011-02-03 1996-07-31 Negative regulator of transcription elongation; contains a TFIIS-like domain that associates with chromatin and a PHD domain that interacts with H3K4me3; multicopy suppressor of temperature-sensitive ess1 mutations, binds RNA polymerase II large subunit +S000036319 CDS YKL005C 11 434877 433093 C 2011-02-03 1996-07-31 +S000001487 ORF Verified YKL004W AUR1 inositol phosphorylceramide synthase chromosome 11 L000002767 11 435580 436785 W 2011-02-03 1996-07-31 Phosphatidylinositol:ceramide phosphoinositol transferase; required for sphingolipid synthesis; can mutate to confer aureobasidin A resistance; also known as IPC synthase +S000036280 CDS YKL004W 11 435580 436785 W 2011-02-03 1996-07-31 +S000001486 ORF Verified YKL003C MRP17 mitochondrial 37S ribosomal protein YmS16 chromosome 11 L000002616 11 437492 437097 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; MRP17 exhibits genetic interactions with PET122, encoding a COX3-specific translational activator +S000036065 CDS YKL003C 11 437492 437097 C 2011-02-03 1996-07-31 +S000001485 ORF Verified YKL002W DID4 ESCRT-III subunit protein DID4|VPS14|CHM2|VPS2|VPT14|VPL2|REN1|GRD7 chromosome 11 L000002955 11 437778 438544 W 2011-02-03 2000-07-22|1996-07-31 Class E Vps protein of the ESCRT-III complex; required for sorting of integral membrane proteins into lumenal vesicles of multivesicular bodies, and for delivery of newly synthesized vacuolar enzymes to the vacuole, involved in endocytosis +S000035271 CDS YKL002W 11 437778 437837 W 2011-02-03 2000-07-22|1996-07-31 +S000035272 CDS YKL002W 11 437906 438544 W 2011-02-03 2000-07-22 +S000035273 intron YKL002W 11 437838 437905 W 2011-02-03 2000-07-22 +S000001484 ORF Verified YKL001C MET14 adenylyl-sulfate kinase chromosome 11 L000001086 11 439385 438777 C .8 2011-02-03 1996-07-31 Adenylylsulfate kinase; required for sulfate assimilation and involved in methionine metabolism; human homolog PAPSS2 complements yeast null mutant +S000034979 CDS YKL001C 11 439385 438777 C 2011-02-03 1996-07-31 +S000006472 centromere CEN11 CEN11 chromosome 11 L000000304 11 440246 440129 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XI centromere +S000077299 centromere_DNA_Element_I CEN11 11 440246 440237 C 2011-02-03 2004-10-08 +S000077300 centromere_DNA_Element_II CEN11 11 440236 440154 C 2011-02-03 2004-10-08 +S000077301 centromere_DNA_Element_III CEN11 11 440153 440129 C 2011-02-03 2004-10-08 +S000001709 ORF Verified YKR001C VPS1 dynamin-like GTPase VPS1|VPT26|VPL1|SPO15|LAM1|GRD1 chromosome 11 L000002006 11 442722 440608 C -1 2011-02-03 1996-07-31 Dynamin-like GTPase required for vacuolar sorting; also involved in actin cytoskeleton organization, endocytosis, late Golgi-retention of some proteins, regulation of peroxisome biogenesis +S000030382 CDS YKR001C 11 442722 440608 C 2011-02-03 1996-07-31 +S000001710 ORF Verified YKR002W PAP1 polynucleotide adenylyltransferase PAP1 chromosome 11 L000001336 11 443232 444938 W -1 2011-02-03 1996-07-31 Poly(A) polymerase; one of three factors required for mRNA 3'-end polyadenylation, forms multiprotein complex with polyadenylation factor I (PF I), also required for mRNA nuclear export; may also polyadenylate rRNAs; required for gene looping +S000033778 CDS YKR002W 11 443232 444938 W 2011-02-03 1996-07-31 +S000001711 ORF Verified YKR003W OSH6 oxysterol-binding protein OSH6 chromosome 11 11 445381 446727 W 2011-02-03 1996-07-31 Member of an oxysterol-binding protein family; family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; GFP-fusion protein localizes to the cell periphery; overexpression extends lifespan by promoting vacuolar fusion; OSH6 has a paralog, OSH7, that arose from the whole genome duplication +S000033901 CDS YKR003W 11 445381 446727 W 2011-02-03 1996-07-31 +S000118406 ARS ARS1114 ARSXI-448 chromosome 11 11 448020 448254 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000001712 ORF Verified YKR004C ECM9 YKR004C-A chromosome 11 L000003884 11 448036 446799 C 2011-02-03 2003-09-27|1996-07-31 Non-essential protein of unknown function +S000033974 CDS YKR004C 11 447706 446799 C 2011-02-03 2003-09-27 +S000033973 CDS YKR004C 11 448036 447811 C 2011-02-03 2003-09-27|1996-07-31 +S000033975 intron YKR004C 11 447810 447707 C 2011-02-03 2003-09-27 +S000001713 ORF Uncharacterized YKR005C chromosome 11 11 450167 448521 C 2011-02-03 1996-07-31|2007-09-05 Putative protein of unknown function +S000123939 CDS YKR005C 11 449951 448521 C 2011-02-03 2007-09-05 +S000034843 CDS YKR005C 11 450167 450021 C 2011-02-03 1996-07-31|2007-09-05 +S000123938 intron YKR005C 11 450020 449952 C 2011-02-03 2007-09-05 +S000001714 ORF Verified YKR006C MRPL13 mitochondrial 54S ribosomal protein YmL13|YmL13|YK105 chromosome 11 L000001164|L000002526 11 451217 450423 C 2011-02-03 2003-09-22|1996-07-31 Mitochondrial ribosomal protein of the large subunit; not essential for mitochondrial translation +S000034952 CDS YKR006C 11 451217 450423 C 2011-02-03 2003-09-22|1996-07-31 +S000001715 ORF Verified YKR007W MEH1 GSE2|EGO1 chromosome 11 11 451434 451988 W 2011-02-03 1996-07-31 Component of the EGO and GSE complexes; EGO is involved in the regulation of microautophagy and GSE is required for proper sorting of amino acid permease Gap1p; loss results in a defect in vacuolar acidification +S000035149 CDS YKR007W 11 451434 451988 W 2011-02-03 1996-07-31 +S000001716 ORF Verified YKR008W RSC4 chromosome 11 L000004026 11 452201 454078 W 2011-02-03 1996-07-31|2011-02-03 Component of the RSC chromatin remodeling complex; found in close proximity to nucleosomal DNA; displaced from the surface of nucleosomal DNA after chromatin remodeling; acetylated (K25) by Gcn5p, altering replication stress tolerance; contains tandem bromodomains that recognize histone H3 acetylated on K14 (H3K14ac) by Gcn5p +S000036038 CDS YKR008W 11 452201 454078 W 2011-02-03 1996-07-31|2011-02-03 +S000001717 ORF Verified YKR009C FOX2 bifunctional hydroxyacyl-CoA dehydrogenase/enoyl-CoA hydratase FOX2|POX2 chromosome 11 L000000622 11 457054 454352 C 2011-02-03 1996-07-31 3-hydroxyacyl-CoA dehydrogenase and enoyl-CoA hydratase; multifunctional enzyme of the peroxisomal fatty acid beta-oxidation pathway; mutation is functionally complemented by human HSD17B4 +S000036079 CDS YKR009C 11 457054 454352 C 2011-02-03 1996-07-31 +S000007058 long_terminal_repeat YKRCdelta8 chromosome 11 11 458471 458140 C 2011-02-03 2000-05-19 Ty1 LTR +S000006642 tRNA_gene tL(CAA)K chromosome 11 L000003635 11 458557 458670 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000033792 intron tL(CAA)K 11 458595 458626 W 2011-02-03 2000-05-19 +S000033790 noncoding_exon tL(CAA)K 11 458557 458594 W 2011-02-03 2000-05-19 +S000033791 noncoding_exon tL(CAA)K 11 458627 458670 W 2011-02-03 2000-05-19 +S000001718 ORF Verified YKR010C TOF2 chromosome 11 L000004245 11 461239 458924 C 2011-02-03 1996-07-31 Protein required for rDNA silencing and mitotic rDNA condensation; stimulates Cdc14p phosphatase activity and biphasic release to promote rDNA repeat segregation; required for condensin recruitment to the replication fork barrier site; TOF2 has a paralog, NET1, that arose from the whole genome duplication +S000034767 CDS YKR010C 11 461239 458924 C 2011-02-03 1996-07-31 +S000001719 ORF Verified YKR011C TOS5 chromosome 11 11 462696 461635 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; protein abundance increases in response to DNA replication stress +S000035735 CDS YKR011C 11 462696 461635 C 2011-02-03 1996-07-31 +S000130139 ARS ARS1115 ARSXI-463 chromosome 11 11 462699 463742 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001721 ORF Verified YKR013W PRY2 sterol-binding protein|YFW12 chromosome 11 L000003217 11 463959 464948 W 2011-02-03 1996-07-31 Sterol binding protein involved in the export of acetylated sterols; secreted glycoprotein and member of the CAP protein superfamily (cysteine-rich secretory proteins (CRISP), antigen 5, and pathogenesis related 1 proteins); sterol export function is redundant with that of PRY1; may be involved in detoxification of hydrophobic compounds; PRY2 has a paralog, PRY1, that arose from the whole genome duplication +S000037809 CDS YKR013W 11 463959 464948 W 2011-02-03 1996-07-31 +S000001720 ORF Dubious YKR012C chromosome 11 11 464116 463739 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene PRY2 +S000035867 CDS YKR012C 11 464116 463739 C 2011-02-03 1996-07-31|2011-02-03 +S000001722 ORF Verified YKR014C YPT52 Rab family GTPase YPT52 chromosome 11 L000002546 11 466071 465367 C 2011-02-03 1996-07-31 Endosomal Rab family GTPase; required for vacuolar protein sorting, endocytosis and multivesicular body (MVB) biogenesis and sorting; required for localization of the CORVET complex to endosomes; involved in autophagy and ionic stress tolerance; similar to Vps21p and Ypt53p; mammalian Rab5 homolog; protein abundance increases in response to DNA replication stress +S000037843 CDS YKR014C 11 466071 465367 C 2011-02-03 1996-07-31 +S000001723 ORF Uncharacterized YKR015C chromosome 11 11 468667 466961 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000029849 CDS YKR015C 11 468667 466961 C 2011-02-03 1996-07-31 +S000001724 ORF Verified YKR016W MIC60 FCJ1|AIM28|FMP13 chromosome 11 11 469717 471339 W 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; Mic60p is also involved in import of intermembrane space (IMS) proteins, probably by positioning Mia40p relative to the TOM complex to receive incoming proteins; ortholog of mammalian mitofilin +S000030918 CDS YKR016W 11 469717 471339 W 2011-02-03 1996-07-31 +S000001725 ORF Verified YKR017C HEL1 E3 ubiquitin-protein ligase HEL1 chromosome 11 11 473349 471694 C 2011-02-03 1996-07-31 RING finger ubiquitin ligase (E3); involved in ubiquitination and degradation of excess histones; interacts with Ubc4p and Rad53p; null mutant sensitive to hydroxyurea (HU) +S000030959 CDS YKR017C 11 473349 471694 C 2011-02-03 1996-07-31 +S000001726 ORF Verified YKR018C chromosome 11 11 475900 473723 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; protein abundance increases in response to DNA replication stress; YKR018C has a paralog, IML2, that arose from the whole genome duplication +S000031035 CDS YKR018C 11 475900 473723 C 2011-02-03 1996-07-31 +S000001727 ORF Verified YKR019C IRS4 chromosome 11 L000004394 11 478063 476216 C 2011-02-03 1996-07-31 EH domain-containing protein; involved in regulating phosphatidylinositol 4,5-bisphosphate levels and autophagy; Irs4p and Tax4p bind and activate the PtdIns phosphatase Inp51p; Irs4p and Tax4p are involved in localizing Atg17p to the PAS; IRS4 has a paralog, TAX4, that arose from the whole genome duplication +S000031136 CDS YKR019C 11 478063 476216 C 2011-02-03 1996-07-31 +S000001728 ORF Verified YKR020W VPS51 VPS67|API3|WHI6 chromosome 11 11 478338 478832 W 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; links the (VFT/GARP) complex to the SNARE Tlg1p; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p +S000030781 CDS YKR020W 11 478338 478832 W 2011-02-03 1996-07-31 +S000001729 ORF Verified YKR021W ALY1 ART6 chromosome 11 11 479234 481981 W 2011-02-03 1996-07-31|2011-02-03 Alpha arrestin, substrate of calcineurin; controls nutrient-mediated intracellular sorting of permease Gap1p; interacts with AP-1 subunit Apl4p; dephosphorylation of Aly1p required for the endocytosis of Dip5p; may regulate endocytosis of plasma membrane proteins by recruiting ubiquitin ligase Rsp5p to plasma membrane targets; ALY1 has a paralog, ALY2, that arose from the whole genome duplication +S000030869 CDS YKR021W 11 479234 481981 W 2011-02-03 1996-07-31|2011-02-03 +S000001730 ORF Verified YKR022C NTR2 chromosome 11 11 483139 482171 C 2011-02-03 1996-07-31 Essential protein that forms a dimer with Ntr1p; also forms a trimer, with Ntr2p and the DExD/H-box RNA helicase Prp43p, that is involved in spliceosome disassembly +S000031793 CDS YKR022C 11 483139 482171 C 2011-02-03 1996-07-31 +S000001731 ORF Uncharacterized YKR023W chromosome 11 11 483419 485011 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032021 CDS YKR023W 11 483419 485011 W 2011-02-03 1996-07-31 +S000001732 ORF Verified YKR024C DBP7 putative ATP-dependent RNA helicase chromosome 11 L000004205 11 487372 485144 C 2011-02-03 1996-07-31 Putative ATP-dependent RNA helicase of the DEAD-box family; involved in ribosomal biogenesis; required at post-transcriptional step for efficient retrotransposition; essential for growth under anaerobic conditions +S000032100 CDS YKR024C 11 487372 485144 C 2011-02-03 1996-07-31 +S000001733 ORF Verified YKR025W RPC37 DNA-directed RNA polymerase III subunit C37|C37 chromosome 11 11 487770 488618 W 2011-02-03 1996-07-31 RNA polymerase III subunit C37 +S000034103 CDS YKR025W 11 487770 488618 W 2011-02-03 1996-07-31 +S000001734 ORF Verified YKR026C GCN3 translation initiation factor eIF2B subunit alpha|AAS2 chromosome 11 L000000682 11 489655 488738 C 7 2011-02-03 1996-07-31 Alpha subunit of translation initiation factor eIF2B; guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; positive regulator of GCN4 expression; assembles into filaments with Gcd2p, Gcd6p, Gcd7p, and Sui2p as cells approach stationary phase and under cytosolic acidification and starvation conditions; human homolog EIF2B1 can complement yeast null mutant +S000034170 CDS YKR026C 11 489655 488738 C 2011-02-03 1996-07-31 +S000007059 long_terminal_repeat YKRCdelta9 chromosome 11 11 490416 490286 C 2011-02-03 2000-05-19 Ty1 LTR +S000007062 long_terminal_repeat YKRWdelta10 chromosome 11 11 490464 490787 W 2011-02-03 2000-05-19 Ty1 LTR +S000006703 tRNA_gene tR(ACG)K chromosome 11 L000003636 11 490968 491040 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030411 noncoding_exon tR(ACG)K 11 490968 491040 W 2011-02-03 2000-05-19 +S000001735 ORF Verified YKR027W BCH2 FMP50 chromosome 11 11 491364 493661 W 2011-02-03 1996-07-31 Member of the ChAPs (Chs5p-Arf1p-binding proteins) family; part of the exomer complex with Chs5p to mediate export of specific cargo proteins, including Chs3p, from the Golgi to the plasma membrane; BCH2 has a paralog, CHS6, that arose from the whole genome duplication +S000034303 CDS YKR027W 11 491364 493661 W 2011-02-03 1996-07-31 +S000001736 ORF Verified YKR028W SAP190 chromosome 11 L000002600 11 494257 497358 W 2011-02-03 1996-07-31|2011-02-03 Protein that forms a complex with the Sit4p protein phosphatase; required for Sit4p function; member of a family of similar proteins including Sap4p, Sap155p, and Sap185p; SAP190 has a paralog, SAP185, that arose from the whole genome duplication +S000034368 CDS YKR028W 11 494257 497358 W 2011-02-03 1996-07-31|2011-02-03 +S000001737 ORF Verified YKR029C SET3 histone-binding protein SET3 chromosome 11 11 499833 497578 C 2011-02-03 1996-07-31 Defining member of the SET3 histone deacetylase complex; which is a meiosis-specific repressor of sporulation genes; necessary for efficient transcription by RNAPII; one of two yeast proteins that contains both SET and PHD domains; SET3 has a paralog, SET4, that arose from the whole genome duplication +S000035298 CDS YKR029C 11 499833 497578 C 2011-02-03 1996-07-31 +S000001738 ORF Verified YKR030W GMH1 MSG1 chromosome 11 11 500282 501103 W 2011-02-03 1996-07-31 Golgi membrane protein of unknown function; interacts with Gea1p and Gea2p; required for localization of Gea2p; computational analysis suggests a possible role in either cell wall synthesis or protein-vacuolar targeting +S000033925 CDS YKR030W 11 500282 501103 W 2011-02-03 1996-07-31 +S000001739 ORF Verified YKR031C SPO14 phospholipase D|PLD1 chromosome 11 L000002005|L000002946 11 506395 501344 C 18 2011-02-03 1996-07-31 Phospholipase D; catalyzes the hydrolysis of phosphatidylcholine, producing choline and phosphatidic acid; involved in Sec14p-independent secretion; required for meiosis and spore formation; differently regulated in secretion and meiosis; participates in transcription initiation and/or early elongation of specific genes; interacts with "foot domain" of RNA polymerase II; deletion results in abnormal CTD-Ser5 phosphorylation of RNA polymerase II at specific promoter regions +S000034013 CDS YKR031C 11 506395 501344 C 2011-02-03 1996-07-31 +S000001740 ORF Dubious YKR032W chromosome 11 11 506517 506831 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034971 CDS YKR032W 11 506517 506831 W 2011-02-03 1996-07-31 +S000001742 ORF Verified YKR034W DAL80 UGA43 chromosome 11 L000000480 11 506898 507707 W 14 2011-02-03 1996-07-31 Negative regulator of genes in multiple nitrogen degradation pathways; expression is regulated by nitrogen levels and by Gln3p; member of the GATA-binding family, forms homodimers and heterodimers with Gzf3p; DAL80 has a paralog, GZF3, that arose from the whole genome duplication +S000036062 CDS YKR034W 11 506898 507707 W 2011-02-03 1996-07-31 +S000001741 ORF Dubious YKR033C chromosome 11 11 507304 506879 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene DAL80 +S000035067 CDS YKR033C 11 507304 506879 C 2011-02-03 1996-07-31 +S000006435 ORF Verified YKR035W-A DID2 VPL30|VPS46|CHM1|FTI1 chromosome 11 L000004496 11 507939 508553 W 2011-02-03 1999-07-17 Class E protein of the vacuolar protein-sorting (Vps) pathway; binds Vps4p and directs it to dissociate ESCRT-III complexes; forms a functional and physical complex with Ist1p; human ortholog may be altered in breast tumors +S000034954 CDS YKR035W-A 11 507939 508553 W 2011-02-03 1999-07-17 +S000001743 ORF Dubious YKR035C OPI8 chromosome 11 11 508561 507920 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene DID2/YKR035W-A +S000036116 CDS YKR035C 11 508561 507920 C 2011-02-03 1996-07-31 +S000001744 ORF Verified YKR036C CAF4 chromosome 11 L000003417 11 510633 508702 C 2011-02-03 1996-07-31|2006-05-08|2011-02-03 WD40 repeat-containing protein associated with the CCR4-NOT complex; interacts in a Ccr4p-dependent manner with Ssn2p; also interacts with Fis1p, Mdv1p and Dnm1p and plays a role in mitochondrial fission; CAF4 has a paralog, MDV1, that arose from the whole genome duplication +S000036256 CDS YKR036C 11 510633 508702 C 2011-02-03 1996-07-31|2006-05-08|2011-02-03 +S000001745 ORF Verified YKR037C SPC34 chromosome 11 L000004696 11 511797 510910 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; also localized to nuclear side of spindle pole body +S000036356 CDS YKR037C 11 511797 510910 C 2011-02-03 1996-07-31 +S000001746 ORF Verified YKR038C KAE1 tRNA N6-adenosine threonylcarbamoyltransferase chromosome 11 11 513159 511999 C 2011-02-03 2003-09-22|1996-07-31 Highly conserved ATPase of HSP70/DnaK family; essential functional component of the EKC/KEOPS complex, with Bud32p, Cgi121p, Pcc1p, and Gon7p; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription +S000036434 CDS YKR038C 11 513159 511999 C 2011-02-03 2003-09-22|1996-07-31 +S000006540 tRNA_gene tD(GUC)K chromosome 11 L000003639 11 513403 513332 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000037688 noncoding_exon tD(GUC)K 11 513403 513332 C 2011-02-03 2000-05-19 +S000007060 long_terminal_repeat YKRCdelta11 chromosome 11 11 513846 513532 C 2011-02-03 2000-05-19 Ty1 LTR +S000001747 ORF Verified YKR039W GAP1 amino acid permease GAP1 chromosome 11 L000000667 11 515063 516871 W 27 2011-02-03 1996-07-31 General amino acid permease; Gap1p senses the presence of amino acid substrates to regulate localization to the plasma membrane when needed; essential for invasive growth +S000030283 CDS YKR039W 11 515063 516871 W 2011-02-03 1996-07-31 +S000118407 ARS ARS1116 ARSXI-517 chromosome 11 11 517017 517265 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000007061 long_terminal_repeat YKRCdelta12 chromosome 11 11 517784 517453 C 2011-02-03 2000-05-19 Ty1 LTR +S000006516 tRNA_gene tA(AGC)K2 chromosome 11 L000003637 11 517988 518060 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000036249 noncoding_exon tA(AGC)K2 11 517988 518060 W 2011-02-03 2000-05-19 +S000001749 ORF Verified YKR041W chromosome 11 11 518198 518950 W 2011-02-03 1996-07-31 Protein of unknown function; localizes to the mitotic spindle; overexpression of YKR041W affects endocytic protein trafficking +S000030043 CDS YKR041W 11 518198 518950 W 2011-02-03 1996-07-31 +S000001748 ORF Dubious YKR040C chromosome 11 11 518566 518063 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YKR041W +S000029852 CDS YKR040C 11 518566 518063 C 2011-02-03 1996-07-31 +S000001750 ORF Verified YKR042W UTH1 SUN family protein UTH1 chromosome 11 L000002766 11 519527 520624 W 2011-02-03 1996-07-31|2005-11-03 Mitochondrial inner membrane protein; role in mitophagy is disputed; implicated in cell wall biogenesis, the oxidative stress response, life span during starvation, and cell death; SUN family member; UTH1 has a paralog, NCA3, that arose from the whole genome duplication +S000031030 CDS YKR042W 11 519527 520624 W 2011-02-03 1996-07-31|2005-11-03 +S000001751 ORF Verified YKR043C SHB17 sedoheptulose-bisphosphatase chromosome 11 11 521712 520897 C 2011-02-03 1996-07-31 Sedoheptulose bisphosphatase involved in riboneogenesis; dephosphorylates sedoheptulose 1,7-bisphosphate, which is converted via the nonoxidative pentose phosphate pathway to ribose-5-phosphate; facilitates the conversion of glycolytic intermediates to pentose phosphate units; also has fructose 1,6-bisphosphatase activity but this is probably not biologically relevant, since deletion does not affect FBP levels; GFP-fusion protein localizes to the cytoplasm and nucleus +S000031078 CDS YKR043C 11 521712 520897 C 2011-02-03 1996-07-31 +S000001752 ORF Verified YKR044W UIP5 chromosome 11 11 522015 523346 W 2011-02-03 1996-07-31 Protein of unknown function that interacts with Ulp1p; a Ubl (ubiquitin-like protein)-specific protease for Smt3p protein conjugates +S000031276 CDS YKR044W 11 522015 523346 W 2011-02-03 1996-07-31 +S000001753 ORF Uncharacterized YKR045C chromosome 11 11 523969 523418 C 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function; epitope-tagged protein localizes to the cytoplasm +S000032206 CDS YKR045C 11 523969 523418 C 2011-02-03 2003-09-22|1996-07-31 +S000001754 ORF Verified YKR046C PET10 chromosome 11 11 525074 524223 C 2011-02-03 1996-07-31 Protein of unknown function that localizes to lipid particles; localization suggests a role in lipid metabolism; expression pattern suggests a role in respiratory growth; computational analysis of large-scale protein-protein interaction data suggests a role in ATP/ADP exchange +S000032320 CDS YKR046C 11 525074 524223 C 2011-02-03 1996-07-31 +S000001755 ORF Dubious YKR047W chromosome 11 11 525257 525562 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene NAP1 +S000032471 CDS YKR047W 11 525257 525562 W 2011-02-03 1996-07-31 +S000001756 ORF Verified YKR048C NAP1 histone chaperone NAP1 chromosome 11 L000001232 11 526640 525387 C 2011-02-03 1996-07-31 Histone chaperone; involved in histone exchange by removing and replacing histone H2A-H2B dimers or histone variant dimers from assembled nucleosomes; involved in the transport of H2A and H2B histones to the nucleus; required for the regulation of microtubule dynamics during mitosis; interacts with mitotic cyclin Clb2p; controls bud morphogenesis; phosphorylated by CK2; protein abundance increases in response to DNA replication stress +S000034427 CDS YKR048C 11 526640 525387 C 2011-02-03 1996-07-31 +S000001757 ORF Verified YKR049C FMP46 putative redox protein chromosome 11 11 527231 526830 C 2011-02-03 1996-07-31 Putative redox protein containing a thioredoxin fold; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000034545 CDS YKR049C 11 527231 526830 C 2011-02-03 1996-07-31 +S000001758 ORF Verified YKR050W TRK2 RPD2 chromosome 11 L000002335 11 527815 530484 W 15 2011-02-03 1996-07-31 Component of the Trk1p-Trk2p potassium transport system; contributes to K(+) supply and maintenance of plasma-membrane potential; TRK2 has a paralog, TRK1, that arose from the whole genome duplication +S000033289 CDS YKR050W 11 527815 530484 W 2011-02-03 1996-07-31 +S000001759 ORF Uncharacterized YKR051W chromosome 11 11 530946 532202 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000034162 CDS YKR051W 11 530946 532202 W 2011-02-03 1996-07-31 +S000001760 ORF Verified YKR052C MRS4 Fe(2+) transporter chromosome 11 L000001180 11 533464 532550 C 2011-02-03 1996-07-31 Iron transporter of the mitochondrial carrier family; mediates Fe2+ transport across the inner mitochondrial membrane; active under low-iron conditions; may transport other cations; protein abundance increases in response to DNA replication stress; MRS4 has a paralog, MRS3, that arose from the whole genome duplication +S000034228 CDS YKR052C 11 533464 532550 C 2011-02-03 1996-07-31 +S000001761 ORF Verified YKR053C YSR3 sphinganine kinase YSR3|LBP2 chromosome 11 L000004404 11 535281 534067 C 2011-02-03 1996-07-31 Dihydrosphingosine 1-phosphate phosphatase; membrane protein involved in sphingolipid metabolism; YSR3 has a paralog, LCB3, that arose from the whole genome duplication +S000034357 CDS YKR053C 11 535281 534067 C 2011-02-03 1996-07-31 +S000001762 ORF Verified YKR054C DYN1 dynein heavy chain|PAC6|DHC1 chromosome 11 L000000538 11 547925 535647 C 24.6 2011-02-03 1996-07-31 Cytoplasmic heavy chain dynein; microtubule motor protein; member of the AAA+ protein family, required for anaphase spindle elongation; involved in spindle assembly, chromosome movement, and spindle orientation during cell division, targeted to microtubule tips by Pac1p; motility along microtubules inhibited by She1p +S000035346 CDS YKR054C 11 547925 535647 C 2011-02-03 1996-07-31 +S000001763 ORF Verified YKR055W RHO4 Rho family GTPase RHO4 chromosome 11 L000001633 11 548216 549091 W 2011-02-03 1996-07-31 Non-essential small GTPase; member of the Rho/Rac subfamily of Ras-like proteins; likely to be involved in the establishment of cell polarity; has long N-terminal extension that plays an important role in Rho4p function and is shared with Rho4 homologs in other yeasts and filamentous fungi +S000035541 CDS YKR055W 11 548216 549091 W 2011-02-03 1996-07-31 +S000001764 ORF Verified YKR056W TRM2 RNC1|NUD1|NUC2 chromosome 11 L000001652|L000001284 11 549448 551367 W 2011-02-03 2004-02-13|1996-07-31 tRNA methyltransferase; 5-methylates the uridine residue at position 54 of tRNAs and may also have a role in tRNA stabilization or maturation; endo-exonuclease with a role in DNA repair +S000035618 CDS YKR056W 11 549448 551367 W 2011-02-03 2004-02-13|1996-07-31 +S000001765 ORF Verified YKR057W RPS21A eS21|ribosomal 40S subunit protein S21A|S21e|YS25|S26A|S21A|RPS25 chromosome 11 L000001761 11 551657 552242 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S21, no bacterial homolog; RPS21A has a paralog, RPS21B, that arose from the whole genome duplication +S000036538 CDS YKR057W 11 551657 551680 W 2011-02-03 1996-07-31 +S000036539 CDS YKR057W 11 552003 552242 W 2011-02-03 1996-07-31 +S000036540 intron YKR057W 11 551681 552002 W 2011-02-03 1996-07-31 +S000001766 ORF Verified YKR058W GLG1 glycogenin glucosyltransferase GLG1 chromosome 11 L000002878 11 552770 554620 W 2011-02-03 1996-07-31|2005-12-01 Glycogenin glucosyltransferase; self-glucosylating initiator of glycogen synthesis, also glucosylates n-dodecyl-beta-D-maltoside; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole respectively; similar to mammalian glycogenin; GLG1 has a paralog, GLG2, that arose from the whole genome duplication +S000036619 CDS YKR058W 11 552770 554620 W 2011-02-03 1996-07-31|2005-12-01 +S000001767 ORF Verified YKR059W TIF1 translation initiation factor eIF4A|eIF4A chromosome 11 L000002302 11 554987 556174 W 22 2011-02-03 1996-07-31 Translation initiation factor eIF4A; DEA(D/H)-box RNA helicase that couples ATPase activity to RNA binding and unwinding; forms a dumbbell structure of two compact domains connected by a linker; interacts with eIF4G; protein abundance increases in response to DNA replication stress; TIF1 has a paralog, TIF2, that arose from the whole genome duplication +S000036719 CDS YKR059W 11 554987 556174 W 2011-02-03 1996-07-31 +S000001768 ORF Verified YKR060W UTP30 chromosome 11 11 556518 557342 W 2011-02-03 1996-07-31 Putative subunit of U3-containing 90S preribosome complex; complex is involved in production of 18S rRNA and assembly of small ribosomal subunit +S000030161 CDS YKR060W 11 556518 557342 W 2011-02-03 1996-07-31 +S000001769 ORF Verified YKR061W KTR2 mannosyltransferase KTR2 chromosome 11 L000000925 11 557677 558954 W 2011-02-03 1996-07-31 Mannosyltransferase involved in N-linked protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; KTR2 has a paralog, YUR1, that arose from the whole genome duplication +S000030356 CDS YKR061W 11 557677 558954 W 2011-02-03 1996-07-31 +S000006502 snoRNA_gene snR42 SNR42 chromosome 11 L000003409 11 559366 559016 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2975 +S000030613 noncoding_exon snR42 11 559366 559016 C 2011-02-03 2000-05-19 +S000001770 ORF Verified YKR062W TFA2 transcription factor TFIIE subunit TFA2 chromosome 11 L000002596 11 559666 560652 W 2011-02-03 1996-07-31 TFIIE small subunit; involved in RNA polymerase II transcription initiation +S000030483 CDS YKR062W 11 559666 560652 W 2011-02-03 1996-07-31 +S000001771 ORF Verified YKR063C LAS1 rRNA-processing protein LAS1 chromosome 11 L000000931 11 562297 560789 C 2011-02-03 1996-07-31 Endonuclease involved in pre-rRNA processing at both ends of ITS2; functions with Grc3p in a conserved mechanism to modulate rRNA processing and ribosome biogenesis; may coordinate the action of the Rat1p-Rai1p exoRNAse; required for the G1/S cell cycle transition; human ortholog is Las1L; mutants require the SSD1-v allele for viability +S000030551 CDS YKR063C 11 562297 560789 C 2011-02-03 1996-07-31 +S000001772 ORF Verified YKR064W OAF3 chromosome 11 11 562547 565138 W 2011-02-03 1996-07-31 Putative transcriptional repressor with Zn(2)-Cys(6) finger; negatively regulates transcription in response to oleate levels, based on mutant phenotype and localization to oleate-responsive promoters; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; forms nuclear foci upon DNA replication stress +S000031527 CDS YKR064W 11 562547 565138 W 2011-02-03 1996-07-31 +S000001773 ORF Verified YKR065C PAM17 FMP18 chromosome 11 11 565892 565299 C 2011-02-03 1996-07-31 Constituent of the TIM23 complex; proposed alternatively to be a component of the import motor (PAM complex) or to interact with and modulate the core TIM23 (Translocase of the Inner mitochondrial Membrane) complex; protein abundance increases in response to DNA replication stress +S000031607 CDS YKR065C 11 565892 565299 C 2011-02-03 1996-07-31 +S000001774 ORF Verified YKR066C CCP1 cytochrome-c peroxidase chromosome 11 L000000238 11 567198 566113 C 2011-02-03 1996-07-31 Mitochondrial cytochrome-c peroxidase; degrades reactive oxygen species in mitochondria, involved in the response to oxidative stress +S000032588 CDS YKR066C 11 567198 566113 C 2011-02-03 1996-07-31 +S000001775 ORF Verified YKR067W GPT2 bifunctional glycerol-3-phosphate/glycerone-phosphate O-acyltransferase GPT2|GAT1 chromosome 11 11 567918 570149 W 2011-02-03 1996-07-31 Glycerol-3-phosphate/dihydroxyacetone phosphate sn-1 acyltransferase; located in lipid particles and the ER; involved in the stepwise acylation of glycerol-3-phosphate and dihydroxyacetone in lipid biosynthesis; the most conserved motifs and functionally relevant residues are oriented towards the ER lumen +S000032727 CDS YKR067W 11 567918 570149 W 2011-02-03 1996-07-31 +S000001776 ORF Verified YKR068C BET3 TRAPP complex core subunit BET3 chromosome 11 L000004057 11 570909 570328 C 2011-02-03 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factors for the GTPase Ypt1, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); hydrophilic homodimeric protein that acts in conjunction with SNARE proteins in targeting and fusion of ER to Golgi transport vesicles +S000032759 CDS YKR068C 11 570909 570328 C 2011-02-03 1996-07-31 +S000001777 ORF Verified YKR069W MET1 uroporphyrinogen-III C-methyltransferase|MET20 chromosome 11 L000001089 11 571612 573393 W 2011-02-03 1996-07-31 S-adenosyl-L-methionine uroporphyrinogen III transmethylase; involved in the biosynthesis of siroheme, a prosthetic group used by sulfite reductase; required for sulfate assimilation and methionine biosynthesis +S000032921 CDS YKR069W 11 571612 573393 W 2011-02-03 1996-07-31 +S000001778 ORF Uncharacterized YKR070W chromosome 11 11 573574 574632 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033052 CDS YKR070W 11 573574 574632 W 2011-02-03 1996-07-31 +S000001779 ORF Verified YKR071C DRE2 electron carrier DRE2 chromosome 11 11 575980 574934 C 2011-02-03 1996-07-31 Component of the cytosolic Fe-S protein assembly (CIA) machinery; contains an Fe-S cluster that receives electrons from NADPH via the action of Tah18p in an early step in the CIA pathway; ortholog of human Ciapin1; protein abundance increases in response to DNA replication stress; inviability of the null mutant is functionally complemented by human CIAPIN1 +S000033101 CDS YKR071C 11 575980 574934 C 2011-02-03 1996-07-31 +S000001780 ORF Verified YKR072C SIS2 phosphopantothenoylcysteine decarboxylase complex subunit SIS2|HAL3 chromosome 11 L000001899 11 578123 576435 C 57 2011-02-03 1996-07-31 Negative regulatory subunit of protein phosphatase 1 (Ppz1p); involved in coenzyme A biosynthesis; subunit of phosphopantothenoylcysteine decarboxylase (PPCDC: Cab3p, Sis2p, Vhs3p) complex and the CoA-Synthesizing Protein Complex (CoA-SPC: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p); SIS2 has a paralog, VHS3, that arose from the whole genome duplication +S000033861 CDS YKR072C 11 578123 576435 C 2011-02-03 1996-07-31 +S000001781 ORF Dubious YKR073C chromosome 11 11 578507 578187 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033995 CDS YKR073C 11 578507 578187 C 2011-02-03 1996-07-31 +S000006632 tRNA_gene tK(UUU)K chromosome 11 L000003638 11 578965 579060 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034204 intron tK(UUU)K 11 579002 579024 W 2011-02-03 2000-05-19 +S000034202 noncoding_exon tK(UUU)K 11 578965 579001 W 2011-02-03 2000-05-19 +S000034203 noncoding_exon tK(UUU)K 11 579025 579060 W 2011-02-03 2000-05-19 +S000001782 ORF Verified YKR074W AIM29 chromosome 11 11 579209 579676 W 2011-02-03 1996-07-31 Protein of unknown function; epitope-tagged protein localizes to the cytoplasm; YKR074W is not an essential gene; null mutant displays elevated frequency of mitochondrial genome loss +S000034957 CDS YKR074W 11 579209 579676 W 2011-02-03 1996-07-31 +S000028669 ORF Dubious YKR075W-A chromosome 11 11 580212 580481 W 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a protein; completely overlaps the uncharacterized gene YKR075C; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032494 CDS YKR075W-A 11 580212 580481 W 2011-02-03 2003-07-29 +S000001783 ORF Uncharacterized YKR075C chromosome 11 11 580750 579827 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Reg1p; expression regulated by glucose and Rgt1p; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; YKR075C has a paralog, YOR062C, that arose from the whole genome duplication +S000035052 CDS YKR075C 11 580750 579827 C 2011-02-03 1996-07-31 +S000118408 ARS ARS1118 ARSXI-582 chromosome 11 11 581833 582070 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000001784 ORF Verified YKR076W ECM4 S-glutathionyl-(chloro)hydroquinone reductase|GTO2 chromosome 11 L000003880 11 582283 583395 W 2011-02-03 1996-07-31 S-glutathionyl-(chloro)hydroquinone reductase (GS-HQR); glutathione transferase involved in cell-surface biosynthesis and architecture; catalyzes glutathione (GSH)-dependent reduction of GS-trichloro-p-hydroquinone to trichloro-p-hydroquinone; expression upregulated upon exposure to genotoxic agents, such as methyl methanesulfonate, cisplatin and bleomycin; not an essential gene; similar to YGR154C; green fluorescent protein (GFP)-fusion protein localizes to cytoplasm +S000035311 CDS YKR076W 11 582283 583395 W 2011-02-03 1996-07-31 +S000001785 ORF Verified YKR077W MSA2 chromosome 11 11 583653 584744 W 2011-02-03 1996-07-31 Putative transcriptional activator; interacts with G1-specific transcription factor MBF and G1-specific promoters; MSA2 has a paralog, MSA1, that arose from the whole genome duplication +S000036232 CDS YKR077W 11 583653 584744 W 2011-02-03 1996-07-31 +S000001786 ORF Verified YKR078W chromosome 11 11 584952 586709 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; potential Cdc28p substrate; contains a Phox homology (PX) domain and specifically binds phosphatidylinositol 3-phosphate (PtdIns-3-P); YKR078W has a paralog, VPS5, that arose from the whole genome duplication +S000036335 CDS YKR078W 11 584952 586709 W 2011-02-03 1996-07-31 +S000001787 ORF Verified YKR079C TRZ1 tRNase Z chromosome 11 11 589305 586789 C 2011-02-03 1996-07-31 tRNA 3'-end processing endonuclease tRNase Z; also localized to mitochondria and interacts genetically with Rex2 exonuclease; homolog of the human candidate prostate cancer susceptibility gene ELAC2 +S000036383 CDS YKR079C 11 589305 586789 C 2011-02-03 1996-07-31 +S000001788 ORF Verified YKR080W MTD1 methylenetetrahydrofolate dehydrogenase (NAD(+)) chromosome 11 L000001210 11 590395 591357 W 2011-02-03 1996-07-31 NAD-dependent 5,10-methylenetetrahydrafolate dehydrogenase; plays a catalytic role in oxidation of cytoplasmic one-carbon units; expression is regulated by Bas1p and Bas2p, repressed by adenine, and may be induced by inositol and choline +S000029910 CDS YKR080W 11 590395 591357 W 2011-02-03 1996-07-31 +S000001789 ORF Verified YKR081C RPF2 rRNA-binding ribosome biosynthesis protein RPF2 chromosome 11 11 592540 591506 C 2011-02-03 1996-07-31 Essential protein involved in rRNA maturation and ribosomal assembly; involved in the processing of pre-rRNA and the assembly of the 60S ribosomal subunit; interacts with ribosomal protein L11; localizes predominantly to the nucleolus; constituent of 66S pre-ribosomal particles +S000029955 CDS YKR081C 11 592540 591506 C 2011-02-03 1996-07-31 +S000001790 ORF Verified YKR082W NUP133 RAT3 chromosome 11 L000002620 11 592825 596298 W 2011-02-03 1996-07-31 Subunit of Nup84p subcomplex of nuclear pore complex (NPC); contributes to nucleocytoplasmic transport, NPC biogenesis; is involved in establishment of a normal nucleocytoplasmic concentration gradient of GTPase Gsp1p; also plays roles in several processes that may require localization of genes or chromosomes at nuclear periphery, including double-strand break repair, transcription and chromatin silencing; relocalizes to cytosol in response to hypoxia; homolog of human NUP133 +S000030187 CDS YKR082W 11 592825 596298 W 2011-02-03 1996-07-31 +S000001791 ORF Verified YKR083C DAD2 HSK1 chromosome 11 11 596822 596421 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis +S000031089 CDS YKR083C 11 596822 596421 C 2011-02-03 1996-07-31 +S000001792 ORF Verified YKR084C HBS1 ribosome dissociation factor GTPase HBS1 chromosome 11 L000000756 11 598890 597055 C 2011-02-03 1996-07-31 GTPase with similarity to translation release factors; together with binding partner Dom34p, facilitates ribosomal subunit dissociation and peptidyl-tRNA release when translation is stalled, particularly in 3' UTRs; genetically implicated in mRNA no-go decay; HBS1 has a paralog, SKI7, that arose from the whole genome duplication +S000031204 CDS YKR084C 11 598890 597055 C 2011-02-03 1996-07-31 +S000001793 ORF Verified YKR085C MRPL20 mitochondrial 54S ribosomal protein YmL20|YmL20 chromosome 11 L000002527|L000001166 11 599681 599094 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000031317 CDS YKR085C 11 599681 599094 C 2011-02-03 1996-07-31 +S000001794 ORF Verified YKR086W PRP16 DEAH-box RNA helicase PRP16|PRP23|RNA16 chromosome 11 L000001504 11 599857 603072 W 2011-02-03 1996-07-31 DEAH-box RNA helicase involved in second catalytic step of splicing and in exon ligation; exhibits ATP-dependent RNA unwinding activity; mediates the release of Yju2p and Cwc25p in the second step; in the absence of ATP, stabilizes the binding of Cwc25p to the spliceosome in the first catalytic step; missense mutation in human ortholog DHX38 associated with early-onset retinitis pigmentosa +S000032379 CDS YKR086W 11 599857 603072 W 2011-02-03 1996-07-31 +S000001795 ORF Verified YKR087C OMA1 metalloendopeptidase chromosome 11 11 604232 603195 C 2011-02-03 2004-07-23|1996-07-31 Metalloendopeptidase of the mitochondrial inner membrane; important for adaptive responses to various homeostatic insults, preservation of normal mitochondrial function under damage-eliciting conditions, and stability of respiratory supercomplexes; involved in turnover of membrane-embedded proteins; mediates degradation of Cox1p in coa2 mutant cells; zebrafish ortholog has a role in organ development and mouse ortholog is also required for respiratory supercomplex stability +S000032444 CDS YKR087C 11 604232 603195 C 2011-02-03 2004-07-23|1996-07-31 +S000001796 ORF Verified YKR088C TVP38 chromosome 11 11 605418 604405 C 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p; required for asymmetric localization of Kar9p during mitosis; GFP-fusion protein localizes to the cytoplasm in a punctate pattern +S000032545 CDS YKR088C 11 605418 604405 C 2011-02-03 1996-07-31 +S000001797 ORF Verified YKR089C TGL4 STC1 chromosome 11 11 608365 605633 C 2011-02-03 1996-07-31 Multifunctional lipase/hydrolase/phospholipase; triacylglycerol lipase, steryl ester hydrolase, and Ca2+-independent phospholipase A2; catalyzes acyl-CoA dependent acylation of LPA to PA; required with Tgl3p for timely bud formation; phosphorylated and activated by Cdc28p; TGL4 has a paralog, TGL5, that arose from the whole genome duplication +S000032624 CDS YKR089C 11 608365 605633 C 2011-02-03 1996-07-31 +S000001798 ORF Verified YKR090W PXL1 chromosome 11 11 608946 611066 W 2011-02-03 1996-07-31|2011-02-03 Protein that localizes to sites of polarized growth; required for selection and/or maintenance of polarized growth sites, may modulate signaling by the GTPases Cdc42p and Rho1p; contains LIM domains and has similarity to metazoan paxillin; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000033373 CDS YKR090W 11 608946 611066 W 2011-02-03 1996-07-31|2011-02-03 +S000001799 ORF Verified YKR091W SRL3 DNA-binding protein SRL3|WHI7 chromosome 11 L000004671 11 611525 612265 W 2011-02-03 2004-07-23|1996-07-31 GTB motif (G1/S transcription factor binding) containing protein; binds SBF-regulated promoters in hydroxyurea-treated cells; when overexpressed, suppresses the lethality of a rad53 null mutation; potential Cdc28p substrate; SRL3 has a paralog, WHI5, that arose from the whole genome duplication +S000034294 CDS YKR091W 11 611525 612265 W 2011-02-03 2004-07-23|1996-07-31 +S000118409 ARS ARS1120 ARSXI-612 chromosome 11 11 612378 612463 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000001800 ORF Verified YKR092C SRP40 chromosome 11 L000002063 11 613885 612665 C 2011-02-03 1996-07-31 Nucleolar serine-rich protein; role in preribosome assembly or transport; may function as a chaperone of small nucleolar ribonucleoprotein particles (snoRNPs); immunologically and structurally to rat Nopp140 +S000034345 CDS YKR092C 11 613885 612665 C 2011-02-03 1996-07-31 +S000001801 ORF Verified YKR093W PTR2 chromosome 11 L000001527 11 615730 617535 W 2011-02-03 1996-07-31 Integral membrane peptide transporter; mediates transport of di- and tri-peptides; conserved protein that contains 12 transmembrane domains; PTR2 expression is regulated by the N-end rule pathway via repression by Cup9p +S000034474 CDS YKR093W 11 615730 617535 W 2011-02-03 1996-07-31 +S000001802 ORF Verified YKR094C RPL40B eL40|ubiquitin-ribosomal 60S subunit protein L40B fusion protein|L40e|L40B|UB12|CEP52B|UBI2 chromosome 11 L000002412|L000000314 11 618750 617996 C 2011-02-03 1996-07-31|2011-02-03 Ubiquitin-ribosomal 60S subunit protein L40B fusion protein; cleaved to yield ubiquitin and ribosomal protein L40B; ubiquitin may facilitate assembly of the ribosomal protein into ribosomes; homologous to mammalian ribosomal protein L40, no bacterial homolog; RPL40B has a paralog, RPL40A, that arose from the whole genome duplication +S000034523 CDS YKR094C 11 618374 617996 C 2011-02-03 1996-07-31 +S000034522 CDS YKR094C 11 618750 618743 C 2011-02-03 1996-07-31 +S000034524 intron YKR094C 11 618742 618375 C 2011-02-03 1996-07-31|2011-02-03 +S000001803 ORF Verified YKR095W MLP1 MPL1 chromosome 11 L000001141|L000001122 11 619805 625432 W 80.3 2011-02-03 1996-07-31 Myosin-like protein associated with the nuclear envelope; nuclear basket protein that connects the nuclear pore complex with the nuclear interior; involved with Tel1p in telomere length control; involved with Pml1p and Pml39p in nuclear retention of unspliced mRNAs; MLP1 has a paralog, MLP2, that arose from the whole genome duplication +S000035599 CDS YKR095W 11 619805 625432 W 2011-02-03 1996-07-31 +S000028512 ORF Verified YKR095W-A PCC1 chromatin DNA-binding EKC/KEOPS complex subunit PCC1 chromosome 11 11 625864 626205 W 2011-02-03 2004-01-28|2003-07-29 Component of the EKC/KEOPS protein complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; other complex members are Kae1p, Gon7p, Bud32p, and Cgi121p +S000030270 CDS YKR095W-A 11 625864 625901 W 2011-02-03 2004-01-28|2003-07-29 +S000030272 CDS YKR095W-A 11 625977 626205 W 2011-02-03 2004-01-28 +S000030273 intron YKR095W-A 11 625902 625976 W 2011-02-03 2004-01-28|2003-07-29 +S000001804 ORF Verified YKR096W ESL2 chromosome 11 11 626793 630380 W 2011-02-03 1996-07-31 hEST1A/B (SMG5/6)-like protein; contributes to environment-sensing adaptive gene expression responses; Esl2p and Esl1p contain a 14-3-3-like domain and a putative PilT N-terminus ribonuclease domain; interacts with Pex14p; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and cytoplasm; ESL2 has a paralog, ESL1, that arose from the whole genome duplication +S000035688 CDS YKR096W 11 626793 630380 W 2011-02-03 1996-07-31 +S000001805 ORF Verified YKR097W PCK1 phosphoenolpyruvate carboxykinase PCK1|PPC1|JPM2 chromosome 11 L000001350 11 631152 632801 W 73.2 2011-02-03 1996-07-31 Phosphoenolpyruvate carboxykinase; key enzyme in gluconeogenesis, catalyzes early reaction in carbohydrate biosynthesis, glucose represses transcription and accelerates mRNA degradation, regulated by Mcm1p and Cat8p, located in the cytosol +S000036623 CDS YKR097W 11 631152 632801 W 2011-02-03 1996-07-31 +S000001806 ORF Verified YKR098C UBP11 ubiquitin-specific protease UBP11 chromosome 11 L000003171 11 635179 633026 C 2011-02-03 1996-07-31 Ubiquitin-specific protease; cleaves ubiquitin from ubiquitinated proteins; UBP11 has a paralog, UBP7, that arose from the whole genome duplication +S000036658 CDS YKR098C 11 635179 633026 C 2011-02-03 1996-07-31 +S000001807 ORF Verified YKR099W BAS1 chromosome 11 L000000161 11 635851 638286 W 82 2011-02-03 1996-07-31 Myb-related transcription factor; involved in regulating basal and induced expression of genes of the purine and histidine biosynthesis pathways; also involved in regulation of meiotic recombination at specific genes +S000036756 CDS YKR099W 11 635851 638286 W 2011-02-03 1996-07-31 +S000001808 ORF Verified YKR100C SKG1 YKR099C-A chromosome 11 11 639968 638901 C 2011-02-03 2004-02-13|1996-07-31 Transmembrane protein with a role in cell wall polymer composition; localizes on inner surface of plasma membrane at bud and in daughter cell; SKG1 has a paralog, AIM20, that arose from the whole genome duplication +S000033006 CDS YKR100C 11 639968 638901 C 2011-02-03 2004-02-13|1996-07-31 +S000001809 ORF Verified YKR101W SIR1 chromosome 11 L000001894 11 640540 642504 W 84 2011-02-03 1996-07-31|2009-02-20 Protein involved in silencing at mating-type loci HML and HMR; recruitment to silent chromatin requires interactions with Orc1p and with Sir4p, through a common Sir1p domain; binds to centromeric chromatin +S000033721 CDS YKR101W 11 640540 642504 W 2011-02-03 1996-07-31|2009-02-20 +S000118410 ARS ARS1123 ARSXI-642 chromosome 11 11 642727 642973 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000001810 ORF Verified YKR102W FLO10 chromosome 11 L000004081 11 646356 649865 W 2011-02-03 1996-07-31 Member of the FLO family of cell wall flocculation proteins; not expressed in most lab strains; overproduction induces flocculation that can be inhibited by mannose, sucrose, or glucose; overproduction also promotes haploid invasive growth and diploid filamentous growth +S000033847 CDS YKR102W 11 646356 649865 W 2011-02-03 1996-07-31 +S000001811 ORF Verified YKR103W NFT1 putative multidrug transporter NFT1 chromosome 11 11 653080 656736 W 2011-02-03 1996-07-31 Putative transporter of the MRP subfamily; adjacent ORFs YKR103W and YKR104W are merged in different strain backgrounds; MRP stands for multidrug resistance-associated protein +S000033929 CDS YKR103W 11 653080 656736 W 2011-02-03 1996-07-31 +S000001812 ORF Verified YKR104W NFT1 chromosome 11 11 656836 657756 W 2011-02-03 1996-07-31 Putative transporter of the MRP subfamily; contains a stop codon in S288C; adjacent ORFs YKR103W and YKR104W are merged in different strain backgrounds; MRP stands for multidrug resistance-associated protein +S000034837 CDS YKR104W 11 656836 657756 W 2011-02-03 1996-07-31 +S000001813 ORF Verified YKR105C VBA5 basic amino acid transporter chromosome 11 11 660464 658716 C 2011-02-03 1996-07-31 Plasma membrane protein of the Major Facilitator Superfamily (MFS); involved in amino acid uptake and drug sensitivity; VBA5 has a paralog, VBA3, that arose from a segmental duplication +S000034879 CDS YKR105C 11 660464 658716 C 2011-02-03 1996-07-31 +S000001814 ORF Verified YKR106W GEX2 glutathione exchanger chromosome 11 11 661442 663289 W 2011-02-03 1996-07-31 Proton:glutathione antiporter; localized to the vacuolar and plasma membranes; expressed at a very low level; potential role in resistance to oxidative stress and modulation of the PKA pathway; GEX2 has a paralog, GEX1, that arose from a segmental duplication +S000035177 CDS YKR106W 11 661442 663289 W 2011-02-03 1996-07-31 +S000007063 long_terminal_repeat YKRWomega1 chromosome 11 11 665430 665668 W 2011-02-03 2000-05-19 Ty5 LTR +S000028978 telomere TEL11R chromosome 11 11 665904 666816 W 89 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XI; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats +S000028979 telomeric_repeat TEL11R 11 666609 666816 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XI +S000028980 X_element TEL11R 11 665904 666364 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028981 X_element_combinatorial_repeat TEL11R 11 666365 666608 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XI; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000029411 gene_group RDN1 RDN1 chromosome 12 L000001595 12 105 Ribosomal DNA (rDNA); an approximately 1-2 Mb region on the right arm of chr. XII consisting of 100-200 tandem copies of a 9.1 kb repeat which contains the genes for 5S, 5.8S, 25S and 18S rRNAs (represented by the RDN37, RDN25, RDN18, RDN58, and RDN5 loci); a specific histone modification (H3K56ac) regulates RNA polymerase I transcription of the ribosomal DNA +S000028673 ORF Dubious YLL067W-A chromosome 12 12 843 1325 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps YLL067C +S000032519 CDS YLL067W-A 12 843 1325 W 2003-07-29 2003-07-29 +S000003990 ORF Uncharacterized YLL067C Y' element ATP-dependent helicase chromosome 12 12 4301 585 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase +S000034997 CDS YLL067C 12 3915 585 C 1996-07-31 1996-07-31 +S000034996 CDS YLL067C 12 4301 4015 C 1996-07-31 1996-07-31 +S000034998 intron YLL067C 12 4014 3916 C 1996-07-31 1996-07-31 +S000028672 ORF Uncharacterized YLL066W-B chromosome 12 12 5605 5775 W 2003-07-29 2003-07-29 Putative protein of unknown function; overexpression causes a cell cycle delay or arrest +S000032518 CDS YLL066W-B 12 5605 5775 W 2003-07-29 2003-07-29 +S000028671 ORF Dubious YLL066W-A chromosome 12 12 6486 6968 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized ORF YLL066C +S000032517 CDS YLL066W-A 12 6486 6968 W 2003-07-29 2003-07-29 +S000003989 ORF Uncharacterized YLL066C Y' element ATP-dependent helicase chromosome 12 12 9836 6120 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase; YLL066C is not an essential gene +S000034882 CDS YLL066C 12 9450 6120 C 1996-07-31 1996-07-31 +S000034881 CDS YLL066C 12 9836 9550 C 1996-07-31 1996-07-31 +S000034883 intron YLL066C 12 9549 9451 C 1996-07-31 1996-07-31 +S000003988 ORF Dubious YLL065W GIN11 chromosome 12 L000002674 12 11726 12076 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps chromosome XII telomeric element core sequences +S000034819 CDS YLL065W 12 11726 12076 W 1996-07-31 1996-07-31 +S000028910 telomere TEL12L chromosome 12 12 12085 1 C -33 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XII; composed of an X element core sequence, X element combinatorial repeats, and three distinct regions of telomeric repeats separated by two short Y' elements +S000028911 telomeric_repeat TEL12L 12 75 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XII +S000028912 telomeric_repeat TEL12L 12 5723 5662 C 2003-09-09 2003-09-09 Middle stretch of telomeric repeats on the left arm of Chromosome XII +S000028913 telomeric_repeat TEL12L 12 11358 11197 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome XII +S000028914 X_element TEL12L 12 12085 11626 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XII; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YLL065W +S000028915 X_element_combinatorial_repeat TEL12L 12 11625 11359 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000028916 Y_prime_element TEL12L 12 5661 76 C 2003-09-09 2003-09-09 Short telomeric Y' element on the left arm of Chromosome XII; more end-proximal of two two short telomeric Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YLL067C and YLL067W-A +S000028917 Y_prime_element TEL12L 12 11196 5724 C 2003-09-09 2003-09-09 Short Y' element in the left telomere of Chromosome XII; more centromere-proximal of two short Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YLL066C and YLL066W-A +S000003987 ORF Verified YLL064C PAU18 seripauperin PAU18 chromosome 12 12 13445 13083 C 1996-07-31 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; identical to Pau6p +S000034617 CDS YLL064C 12 13445 13083 C 1996-07-31 1996-07-31 +S000003986 ORF Verified YLL063C AYT1 acetyltransferase chromosome 12 L000004544 12 16072 14648 C 1996-07-31 1996-07-31 Acetyltransferase; catalyzes trichothecene 3-O-acetylation, suggesting a possible role in trichothecene biosynthesis +S000033720 CDS YLL063C 12 16072 14648 C 1996-07-31 1996-07-31 +S000003985 ORF Verified YLL062C MHT1 S-adenosylmethionine-homocysteine S-methyltransferase MHT1 chromosome 12 12 17613 16639 C 1996-07-31 1996-07-31 S-methylmethionine-homocysteine methyltransferase; functions along with Sam4p in the conversion of S-adenosylmethionine (AdoMet) to methionine to control the methionine/AdoMet ratio +S000033626 CDS YLL062C 12 17613 16639 C 1996-07-31 1996-07-31 +S000003984 ORF Verified YLL061W MMP1 S-methylmethionine permease MMP1 chromosome 12 L000004869 12 17956 19707 W 1996-07-31 1996-07-31 High-affinity S-methylmethionine permease; required for utilization of S-methylmethionine as a sulfur source; has similarity to S-adenosylmethionine permease Sam3p +S000033583 CDS YLL061W 12 17956 19707 W 1996-07-31 1996-07-31 +S000003983 ORF Verified YLL060C GTT2 glutathione transferase GTT2 chromosome 12 L000004613 12 21839 21138 C 1996-07-31 1996-07-31 Glutathione S-transferase capable of homodimerization; functional overlap with Gtt2p, Grx1p, and Grx2p; protein abundance increases in response to DNA replication stress +S000032819 CDS YLL060C 12 21839 21138 C 1996-07-31 1996-07-31 +S000003982 ORF Dubious YLL059C chromosome 12 12 22980 22474 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032747 CDS YLL059C 12 22980 22474 C 1996-07-31 1996-07-31 +S000003981 ORF Uncharacterized YLL058W cystathionine gamma-synthase chromosome 12 12 23569 25296 W 1996-07-31 1996-07-31 Putative protein of unknown function with similarity to Str2p; Str2p is a cystathionine gamma-synthase important in sulfur metabolism; YLL058W is not an essential gene +S000031898 CDS YLL058W 12 23569 25296 W 1996-07-31 1996-07-31 +S000003980 ORF Verified YLL057C JLP1 sulfonate dioxygenase chromosome 12 12 26994 25756 C 1996-07-31 1996-07-31 Fe(II)-dependent sulfonate/alpha-ketoglutarate dioxygenase; involved in sulfonate catabolism for use as a sulfur source; contains sequence that resembles a J domain (typified by the E. coli DnaJ protein); induced by sulphur starvation +S000031705 CDS YLL057C 12 26994 25756 C 1996-07-31 1996-07-31 +S000003979 ORF Uncharacterized YLL056C chromosome 12 12 28305 27409 C 1996-07-31 1996-07-31 Putative protein of unknown function; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p and genes involved in pleiotropic drug resistance (PDR); expression is induced in cells treated with the mycotoxin patulin; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000031618 CDS YLL056C 12 28305 27409 C 1996-07-31 1996-07-31 +S000003978 ORF Verified YLL055W YCT1 chromosome 12 12 30109 31704 W 1996-07-31 1996-07-31 High-affinity cysteine-specific transporter; has similarity to the Dal5p family of transporters; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YCT1 is not an essential gene +S000031573 CDS YLL055W 12 30109 31704 W 1996-07-31 1996-07-31 +S000130180 ARS ARS1202 chromosome 12 12 30209 31384 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000003977 ORF Uncharacterized YLL054C chromosome 12 12 35204 32673 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function with similarity to Pip2p; an oleate-specific transcriptional activator of peroxisome proliferation; YLL054C is not an essential gene +S000030665 CDS YLL054C 12 35204 32673 C 2011-02-03 1996-07-31|2011-02-03 +S000003976 ORF Uncharacterized YLL053C chromosome 12 12 35961 35503 C 2011-02-03 1996-07-31 Putative protein; in the Sigma 1278B strain background YLL053C is contiguous with AQY2 which encodes an aquaporin +S000030554 CDS YLL053C 12 35961 35503 C 2011-02-03 1996-07-31 +S000003975 ORF Verified YLL052C AQY2 chromosome 12 L000004844 12 36361 35912 C 2011-02-03 1996-07-31 Water channel that mediates water transport across cell membranes; only expressed in proliferating cells; controlled by osmotic signals; may be involved in freeze tolerance; disrupted by a stop codon in many S. cerevisiae strains +S000030412 CDS YLL052C 12 36361 35912 C 2011-02-03 1996-07-31 +S000003974 ORF Verified YLL051C FRE6 putative ferric-chelate reductase chromosome 12 L000003558 12 39471 37333 C 2011-02-03 1996-07-31 Putative ferric reductase with similarity to Fre2p; expression induced by low iron levels +S000037644 CDS YLL051C 12 39471 37333 C 2011-02-03 1996-07-31 +S000003973 ORF Verified YLL050C COF1 cofilin chromosome 12 L000000377 12 40414 39804 C 2011-02-03 1996-07-31 Cofilin, involved in pH-dependent actin filament depolarization; binds both actin monomers and filaments and severs filaments; involved in the selective sorting, export of the secretory cargo from the late golgi; genetically interacts with pmr1; thought to be regulated by phosphorylation at SER4; ubiquitous and essential in eukaryotes +S000037511 CDS YLL050C 12 40221 39804 C 2011-02-03 1996-07-31 +S000037510 CDS YLL050C 12 40414 40401 C 2011-02-03 1996-07-31 +S000037512 intron YLL050C 12 40400 40222 C 2011-02-03 1996-07-31 +S000003972 ORF Verified YLL049W LDB18 chromosome 12 12 40666 41205 W 2011-02-03 1996-07-31 Component of the dynactin complex; dynactin is required for dynein activity; null mutant exhibits defects in nuclear migration and spindle orientation and has reduced affinity for alcian blue dye; has homology to mammalian dynactin subunit p24 +S000037568 CDS YLL049W 12 40666 41205 W 2011-02-03 1996-07-31 +S000003971 ORF Verified YLL048C YBT1 bile acid-transporting ATPase YBT1|BAT1 chromosome 12 L000004345 12 46265 41280 C 2011-02-03 1996-07-31 Transporter of the ATP-binding cassette (ABC) family; involved in bile acid transport; negative regulator of vacuole fusion; regulates release of lumenal Ca2+ stores; similar to mammalian bile transporters; YBT1 has a paralog, VMR1, that arose from the whole genome duplication +S000036801 CDS YLL048C 12 46265 41280 C 2011-02-03 1996-07-31 +S000003970 ORF Dubious YLL047W chromosome 12 12 46672 47055 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene RNP1 +S000036777 CDS YLL047W 12 46672 47055 W 2011-02-03 1996-07-31 +S000003969 ORF Verified YLL046C RNP1 chromosome 12 L000001654 12 47463 46714 C 2011-02-03 1996-07-31 Ribonucleoprotein that contains two RNA recognition motifs (RRM); RNP1 has a paralog, SBP1, that arose from the whole genome duplication +S000036697 CDS YLL046C 12 47463 46714 C 2011-02-03 1996-07-31 +S000003967 ORF Dubious YLL044W chromosome 12 12 48216 48662 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription of both YLL044W and the overlapping gene RPL8B is reduced in the gcr1 null mutant +S000035737 CDS YLL044W 12 48216 48662 W 2011-02-03 1996-07-31 +S000003968 ORF Verified YLL045C RPL8B eL8|ribosomal 60S subunit protein L8B|L8e|rp6|YL5|L8B|L4B|SCL41|KRB1 chromosome 12 L000000911|L000001705 12 48629 47859 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L8B; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; L8 binds to Domain I of 25S and 5.8 S rRNAs; mutation results in decreased amounts of free 60S subunits; homologous to mammalian ribosomal protein L7A, no bacterial homolog; RPL8B has a paralog, RPL8A, that arose from the whole genome duplication +S000036622 CDS YLL045C 12 48629 47859 C 2011-02-03 1996-07-31 +S000003966 ORF Verified YLL043W FPS1 chromosome 12 L000000625 12 49938 51947 W 2011-02-03 1996-07-31 Aquaglyceroporin, plasma membrane channel; involved in efflux of glycerol and xylitol, and in uptake of acetic acid, arsenite, and antimonite; key factor in maintaining redox balance by mediating passive diffusion of glycerol; phosphorylated by Hog1p MAPK under acetate stress; deletion improves xylose fermentation; regulated by Rgc1p and Ask10p, which are regulated by Hog1p phosphorylation under osmotic stress; phosphorylation by Ypk1p required to maintain an open state +S000035628 CDS YLL043W 12 49938 51947 W 2011-02-03 1996-07-31 +S000003965 ORF Verified YLL042C ATG10 E2-like conjugating enzyme|APG10 chromosome 12 L000004785 12 52590 52087 C 2011-02-03 1996-07-31 Conserved E2-like conjugating enzyme; mediates formation of the Atg12p-Atg5p conjugate, which is a critical step in autophagy +S000035508 CDS YLL042C 12 52590 52087 C 2011-02-03 1996-07-31 +S000003964 ORF Verified YLL041C SDH2 succinate dehydrogenase iron-sulfur protein subunit SDH2|SDHB|ACN17 chromosome 12 L000001824 12 53931 53131 C 2011-02-03 1996-07-31 Iron-sulfur protein subunit of succinate dehydrogenase; the complex couples the oxidation of succinate to the transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; other members are Sdh1p, Sdh3p, and Sdh4p +S000034473 CDS YLL041C 12 53931 53131 C 2011-02-03 1996-07-31 +S000003963 ORF Verified YLL040C VPS13 membrane morphogenesis protein VPS13|VPT2|SOI1 chromosome 12 L000003510|L000002967 12 63645 54211 C 2011-02-03 1996-07-31 Protein involved in prospore membrane morphogenesis; peripheral membrane protein that localizes to the prospore membrane and at numerous membrane contact sites; involved in sporulation, vacuolar protein sorting, prospore membrane formation during sporulation, and protein-Golgi retention; required for mitochondrial integrity; contains a PH-like domain; homologous to human CHAC and COH1 which are involved in Chorea-acanthocytosis and Cohen syndrome, respectively +S000034394 CDS YLL040C 12 63645 54211 C 2011-02-03 1996-07-31 +S000003962 ORF Verified YLL039C UBI4 ubiquitin|UB14|SCD2 chromosome 12 L000002414 12 65207 64062 C 2011-02-03 1996-07-31 Ubiquitin; becomes conjugated to proteins, marking them for selective degradation via the ubiquitin-26S proteasome system; essential for the cellular stress response; encoded as a polyubiquitin precursor comprised of 5 head-to-tail repeats; protein abundance increases in response to DNA replication stress +S000033435 CDS YLL039C 12 65207 64062 C 2011-02-03 1996-07-31 +S000003961 ORF Verified YLL038C ENT4 chromosome 12 12 66518 65775 C 2011-02-03 1996-07-31 Protein of unknown function; contains an N-terminal epsin-like domain; proposed to be involved in the trafficking of Arn1p in the absence of ferrichrome +S000033366 CDS YLL038C 12 66518 65775 C 2011-02-03 1996-07-31 +S000003960 ORF Dubious YLL037W chromosome 12 12 66562 66942 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 3' end of essential PRP19 gene encoding an RNA splicing factor +S000033343 CDS YLL037W 12 66562 66942 W 2011-02-03 1996-07-31 +S000003959 ORF Verified YLL036C PRP19 E3 ubiquitin-protein ligase PRP19|PSO4 chromosome 12 L000001506 12 68256 66745 C 2011-02-03 1996-07-31 Splicing factor associated with the spliceosome; contains a U-box, a motif found in a class of ubiquitin ligases, and a WD40 domain; relocalizes to the cytosol in response to hypoxia +S000032580 CDS YLL036C 12 68256 66745 C 2011-02-03 1996-07-31 +S000003958 ORF Verified YLL035W GRC3 polynucleotide 5'-hydroxyl-kinase chromosome 12 12 68580 70478 W 2011-02-03 1996-07-31 Polynucleotide kinase present on rDNA; required for efficient transcription termination by RNA polymerase I; functions with Las1p in a conserved mechanism to modulate rRNA processing and ribosome biogenesis; required for cell growth; mRNA is cell-cycle regulated +S000032549 CDS YLL035W 12 68580 70478 W 2011-02-03 1996-07-31 +S000003957 ORF Verified YLL034C RIX7 putative AAA family ATPase RIX7 chromosome 12 12 73146 70633 C 2011-02-03 1996-07-31 Putative ATPase of the AAA family; required for export of pre-ribosomal large subunits from the nucleus; distributed between the nucleolus, nucleoplasm, and nuclear periphery depending on growth conditions +S000032376 CDS YLL034C 12 73146 70633 C 2011-02-03 1996-07-31 +S000003956 ORF Verified YLL033W IRC19 RRG4|GON2 chromosome 12 12 73409 74101 W 2011-02-03 1996-07-31 Protein of unknown function; YLL033W is not an essential gene but mutant is defective in spore formation; null mutant displays increased levels of spontaneous Rad52p foci +S000032327 CDS YLL033W 12 73409 74101 W 2011-02-03 1996-07-31 +S000003955 ORF Verified YLL032C chromosome 12 12 76747 74270 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YLL032C is not an essential gene +S000031283 CDS YLL032C 12 76747 74270 C 2011-02-03 1996-07-31 +S000003954 ORF Verified YLL031C GPI13 mannose-ethanolamine phosphotransferase GPI13|MPC1 chromosome 12 12 80205 77152 C 2011-02-03 1996-07-31 ER membrane localized phosphoryltransferase; adds phosphoethanolamine onto the third mannose residue of the glycosylphosphatidylinositol (GPI) anchor precursor; similar to human PIG-O protein +S000031131 CDS YLL031C 12 80205 77152 C 2011-02-03 1996-07-31 +S000003953 ORF Dubious YLL030C RRT7 chromosome 12 12 80697 80356 C 2011-02-03 1996-07-31 Protein of unknown function; identified in a screen for mutants with increased levels of rDNA transcription; dubious open reading frame unlikely to encode a protein, based on available experimental and comparative sequence data +S000030186 CDS YLL030C 12 80697 80356 C 2011-02-03 1996-07-31 +S000003952 ORF Verified YLL029W FRA1 RUP2 chromosome 12 12 81461 83710 W 2011-02-03 1996-07-31 Protein involved in negative regulation of iron regulon transcription; forms an iron independent complex with Fra2p, Grx3p, and Grx4p; cytosolic; mutant fails to repress transcription of iron regulon and is defective in spore formation +S000037209 CDS YLL029W 12 81461 83710 W 2011-02-03 1996-07-31 +S000003951 ORF Verified YLL028W TPO1 chromosome 12 12 84804 86564 W 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; recognizes spermine, putrescine, and spermidine; catalyzes uptake of polyamines at alkaline pH and excretion at acidic pH; during oxidative stress exports spermine, spermidine from the cell, which controls timing of expression of stress-responsive genes; phosphorylation enhances activity and sorting to the plasma membrane +S000037134 CDS YLL028W 12 84804 86564 W 2011-02-03 1996-07-31 +S000003950 ORF Verified YLL027W ISA1 Fe-binding Fe/S cluster assembly protein ISA1 chromosome 12 L000004953 12 87403 88155 W 2011-02-03 1996-07-31 Protein required for maturation of mitochondrial [4Fe-4S] proteins; functions in a complex with Isa2p and possibly Iba57p; isa1 deletion causes loss of mitochondrial DNA and respiratory deficiency; depletion reduces growth on nonfermentable carbon sources; functional ortholog of bacterial A-type ISC proteins; human ISCA1 can complement isa1 null mutant +S000036472 CDS YLL027W 12 87403 88155 W 2011-02-03 1996-07-31 +S000003949 ORF Verified YLL026W HSP104 chaperone ATPase HSP104 chromosome 12 L000000823 12 88623 91349 W 2011-02-03 1996-07-31 Disaggregase; heat shock protein that cooperates with Ydj1p (Hsp40) and Ssa1p (Hsp70) to refold and reactivate previously denatured, aggregated proteins; responsive to stresses including: heat, ethanol, and sodium arsenite; involved in [PSI+] propagation; protein becomes more abundant and forms cytoplasmic foci in response to DNA replication stress; potentiated Hsp104p variants decrease TDP-43 proteotoxicity by eliminating its cytoplasmic aggregation +S000036386 CDS YLL026W 12 88623 91349 W 2011-02-03 1996-07-31 +S000118469 ARS ARS1206 ARSXII-91 chromosome 12 12 91419 91660 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178130 ARS_consensus_sequence ARS1206 12 91466 91482 W 2014-11-18 2014-11-18 +S000007064 long_terminal_repeat YLLCdelta1 chromosome 12 12 92381 92050 C 2011-02-03 2000-05-19 Ty1 LTR +S000006683 tRNA_gene tP(UGG)L chromosome 12 L000003645 12 92548 92650 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin +S000036013 intron tP(UGG)L 12 92584 92614 W 2011-02-03 2000-05-19 +S000036011 noncoding_exon tP(UGG)L 12 92548 92583 W 2011-02-03 2000-05-19 +S000036012 noncoding_exon tP(UGG)L 12 92615 92650 W 2011-02-03 2000-05-19 +S000003948 ORF Verified YLL025W PAU17 seripauperin PAU17 chromosome 12 12 94747 95121 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole; YLL025W is not an essential gene +S000036278 CDS YLL025W 12 94747 95121 W 2011-02-03 1996-07-31 +S000003947 ORF Verified YLL024C SSA2 Hsp70 family chaperone SSA2|YG102 chromosome 12 L000002070 12 97485 95566 C 2011-02-03 1996-07-31 HSP70 family ATP-binding protein; involved in protein folding, vacuolar import of proteins; required for ubiquitin-dependent degradation of short-lived proteins; associated with chaperonin-containing T-complex; 98% identical to paralog Ssa1p with distinct functional specificity in propagation of yeast [URE3] prions and vacuolar-mediated degradation of gluconeogenesis enzymes; binds tRNA, has role in tRNA nuclear import during starvation +S000035290 CDS YLL024C 12 97485 95566 C 2011-02-03 1996-07-31 +S000003946 ORF Verified YLL023C POM33 nucleoporin POM33 chromosome 12 12 98836 97997 C 2011-02-03 1996-07-31 Transmembrane nucleoporin; involved in nuclear pore complex (NPC) distribution, assembly or stabilization; highly conserved across species, orthologous to human TMEM33 and paralogous to Per33p; protein abundance increases in response to DNA replication stress +S000035143 CDS YLL023C 12 98836 97997 C 2011-02-03 1996-07-31 +S000003945 ORF Verified YLL022C HIF1 chromosome 12 L000004439 12 100201 99044 C 2011-02-03 1996-07-31 Non-essential component of the HAT-B histone acetyltransferase complex; localized to the nucleus; has a role in telomeric silencing; other members are Hat1p and Hat2p +S000034956 CDS YLL022C 12 100201 99044 C 2011-02-03 1996-07-31 +S000003944 ORF Verified YLL021W SPA2 PPF1|PEA1|FUS6 chromosome 12 L000001989 12 100947 105347 W -28 2011-02-03 1996-07-31 Component of the polarisome; functions in actin cytoskeletal organization during polarized growth; acts as a scaffold for Mkk1p and Mpk1p cell wall integrity signaling components; potential Cdc28p substrate; coding sequence contains length polymorphisms in different strains; SPA2 has a paralog, SPH1, that arose from the whole genome duplication +S000034900 CDS YLL021W 12 100947 105347 W 2011-02-03 1996-07-31 +S000003943 ORF Dubious YLL020C chromosome 12 12 105861 105556 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene KNS1 +S000033932 CDS YLL020C 12 105861 105556 C 2011-02-03 1996-07-31 +S000028670 ORF Dubious YLL019W-A chromosome 12 12 106908 107000 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene KNS1 +S000032516 CDS YLL019W-A 12 106908 107000 W 2011-02-03 2003-07-29 +S000003942 ORF Verified YLL019C KNS1 serine/threonine protein kinase KNS1|L124 chromosome 12 L000000910 12 107899 105686 C -28 2011-02-03 1996-07-31 Protein kinase involved in negative regulation of PolIII transcription; effector kinase of the TOR signaling pathway and phosphorylates Rpc53p to regulate ribosome and tRNA biosynthesis; member of the LAMMER family of protein kinases, which are serine/threonine kinases also capable of phosphorylating tyrosine residues; capable of autophosphorylation +S000035019 CDS YLL019C 12 107899 105686 C 2011-02-03 1996-07-31 +S000007245 ORF Verified YLL018C-A COX19 chromosome 12 L000004848 12 108972 108676 C 2011-02-03 1999-07-17 Protein required for cytochrome c oxidase assembly; located in the cytosol and mitochondrial intermembrane space; putative copper metallochaperone that delivers copper to cytochrome c oxidase; contains twin cysteine-x9-cysteine motifs +S000037730 CDS YLL018C-A 12 108972 108676 C 2011-02-03 1999-07-17 +S000003941 ORF Verified YLL018C DPS1 aspartate--tRNA ligase DPS1|AspRS chromosome 12 L000002834 12 111575 109902 C 2011-02-03 1996-07-31 Aspartyl-tRNA synthetase, primarily cytoplasmic; homodimeric enzyme that catalyzes the specific aspartylation of tRNA(Asp); class II aminoacyl tRNA synthetase; binding to its own mRNA may confer autoregulation; shares five highly conserved amino acids with human that when mutated cause leukoencephalopathy characterized by hypomyelination with brain stem and spinal cord involvement and leg spasticity (HBSL) +S000034907 CDS YLL018C 12 111575 109902 C 2011-02-03 1996-07-31 +S000003940 pseudogene YLL017W Ras family guanine nucleotide exchange factor SDC25|SDC25 chromosome 12 L000002822|L000003262 12 112234 112545 W 2011-02-03 1996-07-31 Non-essential Ras guanine nucleotide exchange factor (GEF); localized to the membrane; expressed in poor nutrient conditions and on nonfermentable carbon sources; contains a stop codon in S288C, full-length gene includes YLL016W; SDC25 has a paralog, CDC25, that arose from the whole genome duplication +S000034831 CDS YLL017W 12 112234 112545 W 2011-02-03 1996-07-31 +S000003939 pseudogene YLL016W SDC25 Ras family guanine nucleotide exchange factor SDC25 chromosome 12 12 112847 115993 W -3 2011-02-03 1996-07-31 Non-essential Ras guanine nucleotide exchange factor (GEF); localized to the membrane; expressed in poor nutrient conditions and on nonfermentable carbon sources; contains a stop codon in S288C, full-length gene includes YLL017W; SDC25 has a paralog, CDC25, that arose from the whole genome duplication +S000032886 CDS YLL016W 12 112847 115993 W 2011-02-03 1996-07-31 +S000003938 ORF Verified YLL015W BPT1 ATP-binding cassette bilirubin transporter BPT1 chromosome 12 12 116432 121111 W 2011-02-03 1996-07-31 ABC type transmembrane transporter of MRP/CFTR family; found in vacuolar membrane, involved in the transport of unconjugated bilirubin and in heavy metal detoxification via glutathione conjugates, along with Ycf1p +S000032769 CDS YLL015W 12 116432 121111 W 2011-02-03 1996-07-31 +S000003937 ORF Verified YLL014W EMC6 chromosome 12 12 121322 121648 W 2011-02-03 1996-07-31 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; homologous to worm F33D4.7/EMC-6, fly CG11781, human TMEM93 +S000032696 CDS YLL014W 12 121322 121648 W 2011-02-03 1996-07-31 +S000003936 ORF Verified YLL013C PUF3 mRNA-binding protein PUF3 chromosome 12 12 124714 122075 C 2011-02-03 1996-07-31 Protein of the mitochondrial outer surface; links the Arp2/3 complex with the mitochore during anterograde mitochondrial movement; also binds to and promotes degradation of mRNAs for select nuclear-encoded mitochondrial proteins +S000031656 CDS YLL013C 12 124714 122075 C 2011-02-03 1996-07-31 +S000003935 ORF Verified YLL012W YEH1 sterol esterase chromosome 12 12 125534 127255 W 2011-02-03 1996-07-31 Steryl ester hydrolase; one of three gene products (Yeh1p, Yeh2p, Tgl1p) responsible for steryl ester hydrolase activity and involved in sterol homeostasis; localized to lipid particle membranes; YEH1 has a paralog, YEH2, that arose from the whole genome duplication +S000031612 CDS YLL012W 12 125534 127255 W 2011-02-03 1996-07-31 +S000003934 ORF Verified YLL011W SOF1 rRNA-processing protein SOF1 chromosome 12 L000001981 12 127523 128992 W 2011-02-03 1996-07-31 Protein required for biogenesis of 40S (small) ribosomal subunit; has similarity to the beta subunit of trimeric G-proteins and the splicing factor Prp4p; essential gene +S000031493 CDS YLL011W 12 127523 128992 W 2011-02-03 1996-07-31 +S000003933 ORF Verified YLL010C PSR1 phosphatase chromosome 12 12 130613 129330 C 2011-02-03 1996-07-31 Plasma membrane associated protein phosphatase; involved in the general stress response; required along with binding partner Whi2p for full activation of STRE-mediated gene expression, possibly through dephosphorylation of Msn2p; PSR1 has a paralog, PSR2, that arose from the whole genome duplication +S000030481 CDS YLL010C 12 130613 129330 C 2011-02-03 1996-07-31 +S000003932 ORF Verified YLL009C COX17 copper metallochaperone COX17 chromosome 12 L000003085 12 131414 131205 C 2011-02-03 1996-07-31 Copper metallochaperone that transfers copper to Sco1p and Cox11p; eventual delivery to cytochrome c oxidase; contains twin cysteine-x9-cysteine motifs; interacts with the MICOS complex, and interaction is promoted by copper ions; human homolog COX17 partially complements yeast null mutant +S000030695 CDS YLL009C 12 131414 131205 C 2011-02-03 1996-07-31 +S000003931 ORF Verified YLL008W DRS1 putative ATP-dependent RNA helicase chromosome 12 L000000525 12 131729 133987 W 2011-02-03 1996-07-31 Nucleolar DEAD-box protein required for ribosome assembly and function; including synthesis of 60S ribosomal subunits; constituent of 66S pre-ribosomal particles +S000030652 CDS YLL008W 12 131729 133987 W 2011-02-03 1996-07-31 +S000003930 ORF Verified YLL007C LMO1 chromosome 12 12 136299 134302 C 2011-02-03 1996-07-31 Homolog of mammalian ELMO (Engulfment and celL MOtility); upstream component for regulation through the small GTPase Rho5p; may form a complex with Dck1p that acts as a GEF for Rho5p; cytoplasmic protein that relocates to mitochondria under oxidative stress; implicated in mitophagy; not an essential protein +S000036717 CDS YLL007C 12 136299 134302 C 2011-02-03 1996-07-31 +S000028560 ORF Uncharacterized YLL006W-A chromosome 12 12 136345 136521 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031266 CDS YLL006W-A 12 136345 136521 W 2011-02-03 2003-07-29 +S000003929 ORF Verified YLL006W MMM1 ERMES complex subunit MMM1|YME6 chromosome 12 L000001124 12 136586 137866 W 2011-02-03 1996-07-31 ER integral membrane protein, ERMES complex subunit; ERMES links the ER to mitochondria and may promote inter-organellar calcium and phospholipid exchange as well as coordinating mitochondrial DNA replication and growth; required for mitophagy; ERMES complex is often co-localized with peroxisomes and with concentrated areas of pyruvate dehydrogenase +S000036667 CDS YLL006W 12 136586 137866 W 2011-02-03 1996-07-31 +S000130181 ARS ARS1207 chromosome 12 12 138185 139164 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000003928 ORF Verified YLL005C SPO75 chromosome 12 S000007654 12 140546 137940 C 2011-02-03 1996-07-31 Meiosis-specific protein of unknown function; required for spore wall formation during sporulation; dispensable for both nuclear divisions during meiosis +S000036535 CDS YLL005C 12 140546 137940 C 2011-02-03 1996-07-31 +S000003927 ORF Verified YLL004W ORC3 origin recognition complex subunit 3 chromosome 12 L000003074 12 141073 142923 W 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing +S000036499 CDS YLL004W 12 141073 142923 W 2011-02-03 1996-07-31 +S000003926 ORF Verified YLL003W SFI1 chromosome 12 L000003991 12 143201 146041 W 2011-02-03 1996-07-31 Centrin (Cdc31p)-binding protein required for SPB duplication; localizes to the half-bridge of the spindle pole body (SPB); required for progression through G(2)-M transition; phosphorylated by Cdc28p-Clb2p and by Cdc5p; dephosphorylated by Cdc14p; has similarity to Xenopus laevis XCAP-C +S000035597 CDS YLL003W 12 143201 146041 W 2011-02-03 1996-07-31 +S000003925 ORF Verified YLL002W RTT109 H3 histone acetyltransferase RTT109|KAT11|REM50|KIM2 chromosome 12 L000003932 12 146291 147601 W 2011-02-03 1996-07-31 Histone acetyltransferase; critical for cell survival in presence of DNA damage during S phase, required for recovery after DSB repair; acetylates H3K56, H3K9; H3K56 acetylation activity required for expression homeostasis, buffering of mRNA synthesis rate against changes in gene dosage during S phase; involved in non-homologous end joining and regulation of Ty1 transposition; prevents hyper-amplification of rDNA; interacts physically with Vps75p +S000035504 CDS YLL002W 12 146291 147601 W 2011-02-03 1996-07-31 +S000003924 ORF Verified YLL001W DNM1 dynamin-related GTPase DNM1 chromosome 12 L000002645 12 147890 150163 W 2011-02-03 1996-07-31 Dynamin-related GTPase involved in mitochondrial organization; required for mitochondrial fission and inheritance; self assembles on the cytoplasmic face of mitochondrial tubules at sites where division will occur; participates in endocytosis and regulates peroxisome fission along with Vps1p; mutants in the human ortholog DNM1L, which mediates mitochondrial fission, peroxisomal division, autophagy, and mitophagy, are associated with slowly progressive infantile encephalopathy +S000035377 CDS YLL001W 12 147890 150163 W 2011-02-03 1996-07-31 +S000006473 centromere CEN12 CEN12 chromosome 12 L000000305 12 150947 150828 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XII centromere +S000077287 centromere_DNA_Element_I CEN12 12 150947 150938 C 2011-02-03 2004-10-08 +S000077288 centromere_DNA_Element_II CEN12 12 150937 150853 C 2011-02-03 2004-10-08 +S000077289 centromere_DNA_Element_III CEN12 12 150852 150828 C 2011-02-03 2004-10-08 +S000114848 ARS ARS1208 ARS1208 ARSXII-151|CEN12 ARS chromosome 12 12 150947 151389 2011-02-03 2006-04-13 Autonomously Replicating Sequence +S000178131 ARS_consensus_sequence ARS1208 12 151078 151094 W 2014-11-18 2014-11-18 +S000003991 ORF Uncharacterized YLR001C chromosome 12 12 153977 151389 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; predicted to be palmitoylated +S000031754 CDS YLR001C 12 153977 151389 C 2011-02-03 1996-07-31 +S000003992 ORF Verified YLR002C NOC3 chromosome 12 12 156334 154343 C 2011-02-03 1996-07-31 Subunit of a nuclear complex with Noc2p and pre-replicative complexes; the Noc2p-Noc3p complex binds to 66S ribosomal precursors to mediate their maturation and intranuclear transport; binds to chromatin at active replication origins, and is required for pre-RC formation and maintenance during DNA replication licensing +S000031944 CDS YLR002C 12 156334 154343 C 2011-02-03 1996-07-31 +S000118470 ARS ARS1209 ARSXII-157 chromosome 12 12 156648 156884 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000003993 ORF Verified YLR003C CMS1 chromosome 12 12 157730 156855 C 2011-02-03 1996-07-31 Putative subunit of the 90S preribosome processome complex; overexpression rescues supressor mutant of mcm10; null mutant is viable; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000032071 CDS YLR003C 12 157730 156855 C 2011-02-03 1996-07-31 +S000003994 ORF Verified YLR004C THI73 chromosome 12 12 159505 157934 C 2011-02-03 1996-07-31 Putative plasma membrane permease; proposed to be involved in carboxylic acid uptake and repressed by thiamine; substrate of Dbf2p/Mob1p kinase; transcription is altered if mitochondrial dysfunction occurs +S000034068 CDS YLR004C 12 159505 157934 C 2011-02-03 1996-07-31 +S000003995 ORF Verified YLR005W SSL1 TFIIH/NER complex subunit SSL1 chromosome 12 L000002085 12 160049 161434 W 2011-02-03 1996-07-31 Subunit of the core form of RNA polymerase transcription factor TFIIH; has both protein kinase and DNA-dependent ATPase/helicase activities; essential for transcription and nucleotide excision repair; interacts with Tfb4p +S000034240 CDS YLR005W 12 160049 161434 W 2011-02-03 1996-07-31 +S000003996 ORF Verified YLR006C SSK1 mitogen-activated protein kinase kinase kinase SSK1 chromosome 12 L000002084 12 163893 161755 C 2011-02-03 1996-07-31 Cytoplasmic phosphorelay intermediate osmosensor and regulator; part of a two-component signal transducer that mediates osmosensing via a phosphorelay mechanism; required for mitophagy; dephosphorylated form is degraded by the ubiquitin-proteasome system; potential Cdc28p substrate +S000034274 CDS YLR006C 12 163893 161755 C 2011-02-03 1996-07-31 +S000003997 ORF Verified YLR007W NSE1 Smc5-Smc6 complex subunit NSE1 chromosome 12 12 164392 165402 W 2011-02-03 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair +S000034350 CDS YLR007W 12 164392 165402 W 2011-02-03 1996-07-31 +S000003998 ORF Verified YLR008C PAM18 TIM14 chromosome 12 12 166083 165577 C 2011-02-03 1996-07-31 Subunit of the import motor (PAM complex); the PAM complex is a component of the Translocase of the Inner Mitochondrial membrane (TIM23 complex); essential J-protein cochaperone that stimulates Ssc1p ATPase activity to drive import; inhibited by Pam16p +S000034382 CDS YLR008C 12 166083 165577 C 2011-02-03 1996-07-31 +S000003999 ORF Verified YLR009W RLP24 ATPase-activating ribosome biosynthesis protein chromosome 12 12 166537 167136 W 2011-02-03 1996-07-31 Essential protein required for ribosomal large subunit biogenesis; associated with pre-60S ribosomal subunits; stimulates the ATPase activity of Afg2p, which is required for release of Rlp24p from the pre-60S particle; has similarity to Rpl24Ap and Rpl24Bp +S000035399 CDS YLR009W 12 166537 167136 W 2011-02-03 1996-07-31 +S000004000 ORF Verified YLR010C TEN1 chromosome 12 12 167802 167320 C 2011-02-03 1996-07-31 Protein that regulates telomeric length; protects telomeric ends in a complex with Cdc13p and Stn1p; similar to human Ten1 which is critical for the telomeric function of the CST (Cdc13p-Stn1p-Ten1p) complex +S000034009 CDS YLR010C 12 167802 167320 C 2011-02-03 1996-07-31 +S000006728 tRNA_gene tS(AGA)L chromosome 12 L000003665 12 168025 167944 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032403 noncoding_exon tS(AGA)L 12 168025 167944 C 2011-02-03 2000-05-19 +S000007079 long_terminal_repeat YLRCsigma1 chromosome 12 12 168380 168043 C 2011-02-03 2000-05-19 Ty3 LTR +S000004001 ORF Verified YLR011W LOT6 flavin-dependent quinone reductase chromosome 12 12 169103 169678 W 2011-02-03 1996-07-31 FMN-dependent NAD(P)H:quinone reductase; role in apoptosis-like cell death; may be involved in quinone detoxification; expression elevated at low temperature; sequesters the Cin5p transcription factor in the cytoplasm in complex with the proteasome under reducing conditions +S000034963 CDS YLR011W 12 169103 169678 W 2011-02-03 1996-07-31 +S000004002 ORF Uncharacterized YLR012C chromosome 12 12 170281 169982 C 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function; YLR012C is not an essential gene +S000035029 CDS YLR012C 12 170281 169982 C 2011-02-03 2003-09-22|1996-07-31 +S000004003 ORF Verified YLR013W GAT3 chromosome 12 S000007451 12 171339 171764 W 2011-02-03 1996-07-31 Protein containing GATA family zinc finger motifs; involved in spore wall assembly; sequence similarity to GAT4, and the double mutant gat3 gat4 exhibits reduced dityrosine fluorescence relative to the single mutants +S000035278 CDS YLR013W 12 171339 171764 W 2011-02-03 1996-07-31 +S000004004 ORF Verified YLR014C PPR1 chromosome 12 L000001475 12 174982 172268 C 8 2011-02-03 1996-07-31 Zinc finger transcription factor; contains a Zn(2)-Cys(6) binuclear cluster domain, positively regulates transcription of URA1, URA3, URA4, and URA10, which are involved in de novo pyrimidine biosynthesis, in response to pyrimidine starvation; activity may be modulated by interaction with Tup1p +S000036111 CDS YLR014C 12 174982 172268 C 2011-02-03 1996-07-31 +S000004005 ORF Verified YLR015W BRE2 CPS60 chromosome 12 12 175227 176744 W 2011-02-03 1996-07-31 Subunit of COMPASS (Set1C) complex; COMPASS methylates Lys4 of histone H3 and functions in silencing at telomeres; has a C-terminal Sdc1 Dpy-30 Interaction (SDI) domain that mediates binding to Sdc1p; similar to trithorax-group protein ASH2L +S000036291 CDS YLR015W 12 175227 176744 W 2011-02-03 1996-07-31 +S000004006 ORF Verified YLR016C PML1 chromosome 12 12 177416 176802 C 2011-02-03 1996-07-31 Subunit of the RES complex; RES complex is required for nuclear retention of unspliced pre-mRNAs; acts in the same pathway as Pml39p and Mlp1p +S000036355 CDS YLR016C 12 177416 176802 C 2011-02-03 1996-07-31 +S000004007 ORF Verified YLR017W MEU1 S-methyl-5-thioadenosine phosphorylase chromosome 12 L000004106 12 177608 178621 W 2011-02-03 1996-07-31 Methylthioadenosine phosphorylase (MTAP); catalyzes the initial step in the methionine salvage pathway; affects polyamine biosynthesis through regulation of ornithine decarboxylase (Spe1p) activity; regulates ADH2 gene expression +S000030114 CDS YLR017W 12 177608 178621 W 2011-02-03 1996-07-31 +S000004008 ORF Verified YLR018C POM34 chromosome 12 12 179606 178707 C 2011-02-03 1996-07-31 Subunit of the transmembrane ring of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport, NPC biogenesis and spindle pole body duplication +S000030160 CDS YLR018C 12 179606 178707 C 2011-02-03 1996-07-31 +S000004009 ORF Verified YLR019W PSR2 putative phosphatase chromosome 12 12 180288 181481 W 2011-02-03 1996-07-31 Plasma membrane phosphatase involved in the general stress response; required with Psr1p and Whi2p for full activation of STRE-mediated gene expression, possibly through dephosphorylation of Msn2p; PSR2 has a paralog, PSR1, that arose from the whole genome duplication +S000030375 CDS YLR019W 12 180288 181481 W 2011-02-03 1996-07-31 +S000004010 ORF Verified YLR020C YEH2 sterol esterase chromosome 12 12 183405 181789 C 2011-02-03 1996-07-31 Steryl ester hydrolase; catalyzes steryl ester hydrolysis at the plasma membrane; involved in sterol metabolism; YEH2 has a paralog, YEH1, that arose from the whole genome duplication +S000029961 CDS YLR020C 12 183405 181789 C 2011-02-03 1996-07-31 +S000004011 ORF Verified YLR021W IRC25 DMP2|PBA3|POC3 chromosome 12 12 183623 184162 W 2011-02-03 1996-07-31 Component of a heterodimeric Poc4p-Irc25p chaperone; involved in assembly of alpha subunits into the 20S proteasome; may regulate formation of proteasome isoforms with alternative subunits under different conditions; upregulates proteasome assembly in response to the unfolded protein response activated by mistargeting of proteins (UPRam) +S000031024 CDS YLR021W 12 183623 184162 W 2011-02-03 1996-07-31 +S000004012 ORF Verified YLR022C SDO1 guanine nucleotide exchange factor SDO1 chromosome 12 S000029721 12 184926 184174 C 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Ria1p; essential protein involved in ribosome maturation; with Ria1p, promotes release of Tif6p from 60S ribosomal subunits in the cytoplasm so that they can assemble with 40S subunits to generate mature ribosomes; ortholog of the human protein (SBDS) responsible for autosomal recessive Shwachman-Bodian-Diamond Syndrome; highly conserved across archaea and eukaryotes +S000031066 CDS YLR022C 12 184926 184174 C 2011-02-03 1996-07-31 +S000004013 ORF Verified YLR023C IZH3 chromosome 12 12 187129 185498 C 2011-02-03 1996-07-31 Membrane protein involved in zinc ion homeostasis; member of the four-protein IZH family, expression induced by zinc deficiency; deletion reduces sensitivity to elevated zinc and shortens lag phase, overexpression reduces Zap1p activity +S000031203 CDS YLR023C 12 187129 185498 C 2011-02-03 1996-07-31 +S000004014 ORF Verified YLR024C UBR2 putative ubiquitin-protein ligase UBR2 chromosome 12 12 193281 187663 C 2011-02-03 1996-07-31|2011-02-03 Cytoplasmic ubiquitin-protein ligase (E3); component of the Mub1p-Ubr2p-Rad6p ubiquitin ligase complex required for the ubiquitination and degradation of Rpn4p; mediates formation of the ternary complex +S000032202 CDS YLR024C 12 193281 187663 C 2011-02-03 1996-07-31|2011-02-03 +S000004015 ORF Verified YLR025W SNF7 ESCRT-III subunit protein SNF7|VPL5|RNS4|VPS32|DID1 chromosome 12 L000001950 12 194452 195174 W 11.4 2011-02-03 1996-07-31 One of four subunits of the ESCRT-III complex; involved in the sorting of transmembrane proteins into the multivesicular body (MVB) pathway; recruited from the cytoplasm to endosomal membranes; ESCRT-III stands for endosomal sorting complex required for transport III +S000032371 CDS YLR025W 12 194452 195174 W 2011-02-03 1996-07-31 +S000004016 ORF Verified YLR026C SED5 t-SNARE syntaxin chromosome 12 L000001861 12 196472 195450 C 2011-02-03 1996-07-31 cis-Golgi t-SNARE syntaxin; required for vesicular transport between the ER and the Golgi complex; binds at least 9 SNARE proteins +S000032400 CDS YLR026C 12 196472 195450 C 2011-02-03 1996-07-31 +S000004017 ORF Verified YLR027C AAT2 aspartate transaminase AAT2|ASP5 chromosome 12 L000000131|L000002677 12 198085 196829 C 17 2011-02-03 2003-09-22|1996-07-31 Cytosolic aspartate aminotransferase involved in nitrogen metabolism; localizes to peroxisomes in oleate-grown cells +S000032507 CDS YLR027C 12 198085 196829 C 2011-02-03 2003-09-22|1996-07-31 +S000007497 snoRNA_gene snR30 SNR30 chromosome 12 L000001968 12 198784 199389 W 2011-02-03 2000-05-19|2007-05-09 H/ACA box small nucleolar RNA (snoRNA); essential gene required for cleavage of 35S primary rRNA transcript to release the precursor to the 18S rRNA +S000036751 noncoding_exon snR30 12 198784 199389 W 2011-02-03 2000-05-19|2007-05-09 +S000004018 ORF Verified YLR028C ADE16 bifunctional phosphoribosylaminoimidazolecarboxamide formyltransferase/IMP cyclohydrolase ADE16 chromosome 12 L000003305 12 201315 199540 C 2011-02-03 1997-07-30|1996-07-31 Enzyme of 'de novo' purine biosynthesis; contains both 5-aminoimidazole-4-carboxamide ribonucleotide transformylase and inosine monophosphate cyclohydrolase activities; ADE16 has a paralog, ADE17, that arose from the whole genome duplication; ade16 ade17 mutants require adenine and histidine +S000034542 CDS YLR028C 12 201315 199540 C 2011-02-03 1997-07-30|1996-07-31 +S000004019 ORF Verified YLR029C RPL15A eL15|ribosomal 60S subunit protein L15A|L15e|rp15R|YL10|L15A|L13A|RPL10A chromosome 12 L000002705|L000001710 12 202590 201976 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L15A; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L15, no bacterial homolog; RPL15A has a paralog, RPL15B, that arose from the whole genome duplication +S000034631 CDS YLR029C 12 202590 201976 C 2011-02-03 1996-07-31 +S000004020 ORF Uncharacterized YLR030W chromosome 12 12 203290 204081 W 2011-02-03 1996-07-31 Putative protein of unknown function; S288C contains an in-frame stop codon between ORFs YLR030W and YLR031W +S000034152 CDS YLR030W 12 203290 204081 W 2011-02-03 1996-07-31 +S000004021 ORF Uncharacterized YLR031W chromosome 12 12 204225 204785 W 2011-02-03 1996-07-31 Putative protein of unknown function; S288C contains an in-frame stop codon between ORFs YLR030W and YLR031W; YLR031W has a paralog, YMR124W, that arose from the whole genome duplication +S000034277 CDS YLR031W 12 204225 204785 W 2011-02-03 1996-07-31 +S000004022 ORF Verified YLR032W RAD5 DNA helicase RAD5|SNM2|REV2 chromosome 12 L000001559 12 204991 208500 W 22 2011-02-03 1996-07-31 DNA helicase/Ubiquitin ligase; involved in error-free DNA damage tolerance (DDT), replication fork regression during postreplication repair by template switching, error-prone translesion synthesis; promotes synthesis of free and PCNA-bound polyubiquitin chains by Ubc13p-Mms2p; forms nuclear foci upon DNA replication stress; associates with native telomeres, cooperates with homologous recombination in senescent cells; human homolog HLTF can complement yeast null mutant +S000034393 CDS YLR032W 12 204991 208500 W 2011-02-03 1996-07-31 +S000004023 ORF Verified YLR033W RSC58 chromosome 12 12 208761 210269 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; RSC functions in transcriptional regulation and elongation, chromosome stability, and establishing sister chromatid cohesion; involved in telomere maintenance +S000035450 CDS YLR033W 12 208761 210269 W 2011-02-03 1996-07-31 +S000004024 ORF Verified YLR034C SMF3 putative divalent metal ion transporter SMF3 chromosome 12 12 211933 210512 C 2011-02-03 1996-07-31|2011-02-03 Putative divalent metal ion transporter involved in iron homeostasis; transcriptionally regulated by metal ions; member of the Nramp family of metal transport proteins; protein abundance increases in response to DNA replication stress +S000035485 CDS YLR034C 12 211933 210512 C 2011-02-03 1996-07-31|2011-02-03 +S000004025 ORF Verified YLR035C MLH2 mismatch repair protein MLH2 chromosome 12 12 214456 212369 C 2011-02-03 1996-07-31 Protein involved in mismatch repair and meiotic recombination; only certain frameshift intermediates are mismatch repair substrates; forms a complex with Mlh1p +S000035575 CDS YLR035C 12 214456 212369 C 2011-02-03 1996-07-31 +S000006524 tRNA_gene tA(UGC)L chromosome 12 L000003664 12 214955 214883 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine +S000034887 noncoding_exon tA(UGC)L 12 214955 214883 C 2011-02-03 2000-05-19 +S000007065 long_terminal_repeat YLRCdelta2 chromosome 12 12 215417 215080 C 2011-02-03 2000-05-19 Ty1 LTR +S000007225 transposable_element_gene YLR035C-A gag-pol fusion protein chromosome 12 12 218907 215440 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); YLR035C-A is part of a mutant retrotransposon +S000034784 CDS YLR035C-A 12 218907 215440 C 2011-02-03 1999-07-17 +S000007066 long_terminal_repeat YLRCdelta3 chromosome 12 12 221005 220668 C 2011-02-03 2000-05-19 Ty1 LTR +S000007083 long_terminal_repeat YLRWdelta4 chromosome 12 12 221006 221266 W 2011-02-03 2000-05-19 Ty1 LTR +S000004026 ORF Uncharacterized YLR036C chromosome 12 12 222132 221521 C 2011-02-03 1996-07-31 Putative protein predicted to have transmembrane domains; interacts with HSP90 by yeast two-hybrid analysis; YLR036C is not an essential protein +S000035633 CDS YLR036C 12 222132 221521 C 2011-02-03 1996-07-31 +S000178132 ARS ARS1210 chromosome 12 12 222220 222676 2014-11-18 2014-11-18 Autonomously replicating sequence +S000004027 ORF Verified YLR037C PAU23 seripauperin PAU23|DAN2 chromosome 12 12 223059 222685 C 2011-02-03 1996-07-31 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; member of the seripauperin multigene family encoded mainly in subtelomeric regions; expressed under anaerobic conditions, completely repressed during aerobic growth +S000036588 CDS YLR037C 12 223059 222685 C 2011-02-03 1996-07-31 +S000004028 ORF Verified YLR038C COX12 cytochrome c oxidase subunit VIb chromosome 12 L000000396 12 225172 224921 C 2011-02-03 1996-07-31 Subunit VIb of cytochrome c oxidase; cytochrome c oxidase is also known as respiratory Complex IV and is the terminal member of the mitochondrial inner membrane electron transport chain; required for assembly of cytochrome c oxidase but not required for activity after assembly; phosphorylated; easily released from the intermembrane space, suggesting a loose association with Complex IV +S000036657 CDS YLR038C 12 225172 224921 C 2011-02-03 1996-07-31 +S000004029 ORF Verified YLR039C RIC1 chromosome 12 L000001638 12 228596 225426 C 2011-02-03 1996-07-31 Protein involved in retrograde transport to the cis-Golgi network; forms heterodimer with Rgp1p that acts as a GTP exchange factor for Ypt6p; involved in transcription of rRNA and ribosomal protein genes +S000036750 CDS YLR039C 12 228596 225426 C 2011-02-03 1996-07-31 +S000004031 ORF Dubious YLR041W chromosome 12 12 229377 229697 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YLR040C +S000030478 CDS YLR041W 12 229377 229697 W 2011-02-03 1996-07-31 +S000004030 ORF Verified YLR040C AFB1 chromosome 12 12 229582 228908 C 2011-02-03 1996-07-31 MATalpha-specific a-factor blocker; contributes to mating efficiency under certain conditions; localizes to the cell wall; predicted to be a GPI-attached protein; upregulated by Mcm1p-Alpha1p transcription factor; partially overlaps the dubious ORF YLR041W +S000030256 CDS YLR040C 12 229582 228908 C 2011-02-03 1996-07-31 +S000004032 ORF Verified YLR042C chromosome 12 12 230451 229966 C 2011-02-03 1996-07-31 Cell wall protein of unknown function; localizes to the cytoplasm; deletion improves xylose fermentation in industrially engineered strains; YLR042C is not an essential gene +S000030545 CDS YLR042C 12 230451 229966 C 2011-02-03 1996-07-31 +S000118471 ARS ARS1211 ARSXII-231 chromosome 12 12 231179 231421 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178133 ARS_consensus_sequence ARS1211 12 231250 231266 W 2014-11-18 2014-11-18 +S000004033 ORF Verified YLR043C TRX1 thioredoxin TRX1|LMA1 chromosome 12 L000002357 12 232013 231702 C -7 2011-02-03 1996-07-31 Cytoplasmic thioredoxin isoenzyme; part of thioredoxin system which protects cells against oxidative and reductive stress; forms LMA1 complex with Pbi2p; acts as a cofactor for Tsa1p; required for ER-Golgi transport and vacuole inheritance; with Trx2p, facilitates mitochondrial import of small Tims Tim9p, Tim10p, Tim13p by maintaining them in reduced form; abundance increases iunder DNA replication stress; TRX1 has a paralog, TRX2, that arose from the whole genome duplication +S000031467 CDS YLR043C 12 232013 231702 C 2011-02-03 1996-07-31 +S000004034 ORF Verified YLR044C PDC1 indolepyruvate decarboxylase 1 chromosome 12 L000001354 12 234081 232390 C -7 2011-02-03 1996-07-31 Major of three pyruvate decarboxylase isozymes; key enzyme in alcoholic fermentation; decarboxylates pyruvate to acetaldehyde; involved in amino acid catabolism; subject to glucose-, ethanol-, and autoregulation; activated by phosphorylation in response to glucose levels; N-terminally propionylated in vivo +S000031581 CDS YLR044C 12 234081 232390 C 2011-02-03 1996-07-31 +S000004035 ORF Verified YLR045C STU2 chromosome 12 L000003019 12 237703 235037 C 2011-02-03 1996-07-31 Microtubule-associated protein (MAP) of the XMAP215/Dis1 family; regulates microtubule dynamics during spindle orientation and metaphase chromosome alignment; interacts with spindle pole body component Spc72p +S000032584 CDS YLR045C 12 237703 235037 C 2011-02-03 1996-07-31 +S000004036 ORF Uncharacterized YLR046C RLA1 chromosome 12 12 238813 238001 C 2011-02-03 1996-07-31 Putative membrane protein; member of the fungal lipid-translocating exporter (LTE) family of proteins; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance; YLR046C has a paralog, RTA1, that arose from the whole genome duplication +S000032679 CDS YLR046C 12 238813 238001 C 2011-02-03 1996-07-31 +S000004037 ORF Verified YLR047C FRE8 putative ferric-chelate reductase chromosome 12 12 241407 239347 C 2011-02-03 1996-07-31 Protein with sequence similarity to iron/copper reductases; involved in iron homeostasis; deletion mutant has iron deficiency/accumulation growth defects; expression increased in the absence of copper-responsive transcription factor Mac1p +S000032758 CDS YLR047C 12 241407 239347 C 2011-02-03 1996-07-31 +S000004038 ORF Verified YLR048W RPS0B uS2|ribosomal 40S subunit protein S0B|S2|S0B|YST2|NAB1B chromosome 12 L000002908 12 242232 243349 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; RPS0B has a paralog, RPS0A, that arose from the whole genome duplication; required for maturation of 18S rRNA along with Rps0Ap; deletion of either RPS0 gene reduces growth rate, deletion of both genes is lethal; homologous to human ribosomal protein SA and bacterial S2 +S000032917 CDS YLR048W 12 242232 242321 W 2011-02-03 1996-07-31 +S000032918 CDS YLR048W 12 242681 243349 W 2011-02-03 1996-07-31 +S000032919 intron YLR048W 12 242322 242680 W 2011-02-03 1996-07-31 +S000004039 ORF Uncharacterized YLR049C chromosome 12 12 245172 243886 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000034828 CDS YLR049C 12 245172 243886 C 2011-02-03 1996-07-31 +S000004040 ORF Uncharacterized YLR050C chromosome 12 12 246072 245587 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YLR050C is not an essential gene +S000033086 CDS YLR050C 12 246072 245587 C 2011-02-03 1996-07-31 +S000004041 ORF Verified YLR051C FCF2 chromosome 12 12 246977 246324 C 2011-02-03 1996-07-31 Nucleolar protein involved in the early steps of 35S rRNA processing; interacts with Faf1p; member of a transcriptionally co-regulated set of genes called the RRB regulon; essential gene +S000033845 CDS YLR051C 12 246977 246324 C 2011-02-03 1996-07-31 +S000004042 ORF Verified YLR052W IES3 chromosome 12 12 247201 247953 W 2011-02-03 1996-07-31 Subunit of the INO80 chromatin remodeling complex +S000034056 CDS YLR052W 12 247201 247953 W 2011-02-03 1996-07-31 +S000004043 ORF Uncharacterized YLR053C chromosome 12 12 248426 248100 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000034893 CDS YLR053C 12 248426 248100 C 2011-02-03 1996-07-31 +S000004044 ORF Verified YLR054C OSW2 chromosome 12 12 250978 248717 C 2011-02-03 2003-09-27|1996-07-31 Protein of unknown function reputedly involved in spore wall assembly +S000035045 CDS YLR054C 12 250860 248717 C 2011-02-03 2003-09-27|1996-07-31 +S000035044 CDS YLR054C 12 250978 250948 C 2011-02-03 2003-09-27 +S000035046 intron YLR054C 12 250947 250861 C 2011-02-03 2003-09-27 +S000004045 ORF Verified YLR055C SPT8 SAGA complex subunit SPT8 chromosome 12 L000002034 12 253080 251272 C 30 2011-02-03 1996-07-31 Subunit of the SAGA transcriptional regulatory complex; not present in SAGA-like complex SLIK/SALSA; required for SAGA-mediated inhibition at some promoters +S000035199 CDS YLR055C 12 253080 251272 C 2011-02-03 1996-07-31 +S000004046 ORF Verified YLR056W ERG3 C-5 sterol desaturase|PSO6|SYR1 chromosome 12 L000000570|L000004043 12 253861 254958 W 2011-02-03 1996-07-31 C-5 sterol desaturase; glycoprotein that catalyzes the introduction of a C-5(6) double bond into episterol, a precursor in ergosterol biosynthesis; transcriptionally down-regulated when ergosterol is in excess; mutants are viable, but cannot grow on non-fermentable carbon sources; substrate of HRD ubiquitin ligase; mutation is functionally complemented by human SC5D +S000036224 CDS YLR056W 12 253861 254958 W 2011-02-03 1996-07-31 +S000004047 ORF Verified YLR057W MNL2 putative mannosidase MNL2 chromosome 12 12 255306 257855 W 2011-02-03 1996-07-31 Putative mannosidase involved in ER-associated protein degradation; localizes to the endoplasmic reticulum; sequence similarity with seven-hairpin glycosidase (GH47) family members, such as Mns1p and Mnl1p, that hydrolyze 1,2-linked alpha-D-mannose residues; non-essential gene +S000036328 CDS YLR057W 12 255306 257855 W 2011-02-03 1996-07-31 +S000004048 ORF Verified YLR058C SHM2 glycine hydroxymethyltransferase SHM2|SHMT2 chromosome 12 L000001882 12 259401 257992 C 2011-02-03 1996-07-31 Cytosolic serine hydroxymethyltransferase; converts serine to glycine plus 5,10 methylenetetrahydrofolate; major isoform involved in generating precursors for purine, pyrimidine, amino acid, and lipid biosynthesis +S000036381 CDS YLR058C 12 259401 257992 C 2011-02-03 1996-07-31 +S000004049 ORF Verified YLR059C REX2 YNT20 chromosome 12 L000003035 12 260547 259738 C 2011-02-03 1996-07-31 3'-5' RNA exonuclease; involved in 3'-end processing of U4 and U5 snRNAs, 5S and 5.8S rRNAs, and RNase P and RNase MRP RNA; localized to mitochondria and null suppresses escape of mtDNA to nucleus in yme1 yme2 mutants; RNase D exonuclease +S000036443 CDS YLR059C 12 260547 259738 C 2011-02-03 1996-07-31 +S000004050 ORF Verified YLR060W FRS1 phenylalanine--tRNA ligase subunit beta chromosome 12 L000000629 12 260979 262766 W 2011-02-03 1996-07-31 Beta subunit of cytoplasmic phenylalanyl-tRNA synthetase; forms a tetramer with Frs2p to generate active enzyme; able to hydrolyze mis-aminoacylated tRNA-Phe, which could contribute to translational quality control +S000030011 CDS YLR060W 12 260979 262766 W 2011-02-03 1996-07-31 +S000004051 ORF Verified YLR061W RPL22A eL22|ribosomal 60S subunit protein L22A|L22e|rp4|l1c|YL31|L22A chromosome 12 L000004460 12 263194 263948 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L22A; required for translation of long 5' UTR of IME1 mRNA and meiotic entry; required for the oxidative stress response, pseudohyphal and invasive growth; homologous to mammalian ribosomal protein L22, no bacterial homolog; RPL22A has a paralog, RPL22B, that arose from the whole genome duplication +S000030138 CDS YLR061W 12 263194 263205 W 2011-02-03 1996-07-31 +S000030139 CDS YLR061W 12 263595 263948 W 2011-02-03 1996-07-31 +S000030140 intron YLR061W 12 263206 263594 W 2011-02-03 1996-07-31 +S000004052 ORF Dubious YLR062C BUD28 chromosome 12 12 263954 263577 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 98% of ORF overlaps the verified gene RPL22A; diploid mutant displays a weak budding pattern phenotype in a systematic assay +S000031086 CDS YLR062C 12 263954 263577 C 2011-02-03 1996-07-31 +S000004053 ORF Verified YLR063W BMT6 25S rRNA (uracil2843-N3)-methyltransferase chromosome 12 12 264157 265254 W 2011-02-03 1996-07-31 Methyltransferase required for m3U2843 methylation of the 25S rRNA; S-adenosylmethionine-dependent; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YLR063W is not an essential gene +S000031280 CDS YLR063W 12 264157 265254 W 2011-02-03 1996-07-31 +S000004054 ORF Verified YLR064W PER33 chromosome 12 12 265456 266277 W 2011-02-03 1996-07-31 Protein that localizes to the endoplasmic reticulum; also associates with the nuclear pore complex; deletion extends chronological lifespan; highly conserved across species, orthologous to human TMEM33 and paralogous to Pom33p; protein abundance increases in response to DNA replication stress +S000031356 CDS YLR064W 12 265456 266277 W 2011-02-03 1996-07-31 +S000004055 ORF Verified YLR065C ENV10 SND2 chromosome 12 12 266918 266373 C 2011-02-03 1996-07-31 Protein involved in SRP-independent targeting of substrates to the ER; component of an alternative ER targeting pathway that has partial functional redundancy with the GET pathway; preference for substrates with downstream transmembrane domains; interacts with Snd1p, Pho88p/Snd3p, and Sec61p-translocon subunits; can compensate for loss of SRP; role in the late endosome-vacuole interface; putative role in secretory protein quality control +S000031430 CDS YLR065C 12 266918 266373 C 2011-02-03 1996-07-31 +S000004056 ORF Verified YLR066W SPC3 signal peptidase complex subunit SPC3 chromosome 12 L000003542|S000029502|L000002875 12 267169 267723 W 2011-02-03 1996-07-31 Subunit of signal peptidase complex; complex catalyzes cleavage of N-terminal signal sequences of proteins targeted to the secretory pathway; homologous to mammalian SPC22/23; other members of the complex are Spc1p, Spc2p, and Sec11p +S000032483 CDS YLR066W 12 267169 267723 W 2011-02-03 1996-07-31 +S000004057 ORF Verified YLR067C PET309 chromosome 12 L000001401 12 270710 267813 C 2011-02-03 1996-07-31 Specific translational activator for the COX1 mRNA; binds to the COX1 mRNA; also influences stability of intron-containing COX1 primary transcripts; localizes to the mitochondrial inner membrane; contains 12 pentatricopeptide repeats (PPRs) +S000032544 CDS YLR067C 12 270710 267813 C 2011-02-03 1996-07-31 +S000004058 ORF Verified YLR068W FYV7 chromosome 12 12 271008 271463 W 2011-02-03 1996-07-31 Essential protein required for maturation of 18S rRNA; required for survival upon exposure to K1 killer toxin +S000032669 CDS YLR068W 12 271008 271463 W 2011-02-03 1996-07-31 +S000004059 ORF Verified YLR069C MEF1 chromosome 12 L000001057 12 273915 271630 C 2011-02-03 1996-07-31 Mitochondrial elongation factor involved in translational elongation +S000033337 CDS YLR069C 12 273915 271630 C 2011-02-03 1996-07-31 +S000004060 ORF Verified YLR070C XYL2 D-xylulose reductase XYL2 chromosome 12 12 275211 274141 C 2011-02-03 1996-07-31 Xylitol dehydrogenase; converts xylitol to D-xylulose; expression induced by xylose, even though this pentose sugar is not well utilized by S. cerevisiae; null mutant has cell wall defect +S000033430 CDS YLR070C 12 275211 274141 C 2011-02-03 1996-07-31 +S000004061 ORF Verified YLR071C RGR1 MED14 chromosome 12 L000001629 12 278626 275378 C 70 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for glucose repression, HO repression, RME1 repression and sporulation +S000034340 CDS YLR071C 12 278626 275378 C 2011-02-03 1996-07-31 +S000004062 ORF Verified YLR072W LAM6 LTC1 chromosome 12 12 278862 280943 W 2011-02-03 1996-07-31 Sterol transporter that transfers sterols between membranes; may regulate and coordinate formation of contact sites between organelles; localizes to ER-mitochondrial contact sites in a Tom70p- and Tom71p-dependent manner; mitochondrial localization requires GRAM domain; also localizes to ER-vacuole contact sites, in a Vac8p-dependent manner; has GRAM and StART-like (VASt) domains; one of six StART-like domain-containing proteins in yeast; conserved across eukaryotes +S000034470 CDS YLR072W 12 278862 280943 W 2011-02-03 1996-07-31 +S000004063 ORF Verified YLR073C RFU1 chromosome 12 12 281621 281019 C 2011-02-03 1996-07-31 Protein that inhibits Doa4p deubiquitinating activity; contributes to ubiquitin homeostasis by regulating the conversion of free ubiquitin chains to ubiquitin monomers by Doa4p; GFP-fusion protein localizes to endosomes +S000034520 CDS YLR073C 12 281621 281019 C 2011-02-03 1996-07-31 +S000004064 ORF Verified YLR074C BUD20 chromosome 12 12 282456 281956 C 2011-02-03 1996-07-31 C2H2-type zinc finger protein required for ribosome assembly; shuttling factor which associates with pre-60S particles in the nucleus, accompanying them to the cytoplasm; cytoplasmic dissociation of Bud20p requires Drg1p; N-terminus harbors a nuclear localization signal (NLS) and a nuclear export signal (NES); cytoplasmic Bud20p is reimported by Kap123-dependent pathway; involved in bud-site selection; diploid mutants display a random budding pattern; similar to human ZNF593 +S000035544 CDS YLR074C 12 282456 281956 C 2011-02-03 1996-07-31 +S000004065 ORF Verified YLR075W RPL10 uL16|ribosomal 60S subunit protein L10|L16|L10|QSR1|GRC5 chromosome 12 L000000727 12 282927 283592 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L10; homologous to mammalian ribosomal protein L10 and bacterial L16; responsible for joining the 40S and 60S subunits; regulates translation initiation; similar to members of the QM gene family; protein abundance increases under DNA replication stress; mutations in human homolog implicated in T-cell acute lymphoblastic leukemia and also autism spectrum disorders (ASD); human RPL10 can complement yeast null mutant +S000035684 CDS YLR075W 12 282927 283592 W 2011-02-03 1996-07-31 +S000004066 ORF Dubious YLR076C chromosome 12 12 283607 283185 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential gene RPL10 which encodes the ribosomal protein L10 +S000035729 CDS YLR076C 12 283607 283185 C 2011-02-03 1996-07-31 +S000004067 ORF Verified YLR077W FMP25 BCA1 chromosome 12 12 283872 285623 W 2011-02-03 1996-07-31 Protein required for assembly of respiratory complex III; mitochondrial inner membrane protein; required for an early step in assembly of respiratory complex III (cytochrome bc1 complex); mRNA is targeted to mitochondria +S000036693 CDS YLR077W 12 283872 285623 W 2011-02-03 1996-07-31 +S000004068 ORF Verified YLR078C BOS1 SEC32 chromosome 12 L000000192 12 286559 285736 C 2011-02-03 1996-07-31 v-SNARE (vesicle specific SNAP receptor); localized to the endoplasmic reticulum membrane and necessary for vesicular transport from the ER to the Golgi; required for efficient nuclear fusion during mating +S000036710 CDS YLR078C 12 286467 285736 C 2011-02-03 1996-07-31 +S000036709 CDS YLR078C 12 286559 286557 C 2011-02-03 1996-07-31 +S000036711 intron YLR078C 12 286556 286468 C 2011-02-03 1996-07-31 +S000004069 ORF Verified YLR079W SIC1 BYC1|cyclin-dependent protein serine/threonine kinase inhibiting protein SIC1|SDB25 chromosome 12 L000001886|L000001822 12 286820 287674 W 2011-02-03 1996-07-31 Cyclin-dependent kinase inhibitor (CKI); inhibitor of Cdc28-Clb kinase complexes that controls G1/S phase transition, preventing premature S phase and ensuring genomic integrity; phosphorylated by Clb5/6-Cdk1 and Cln1/2-Cdk1 kinase which regulate timing of Sic1p degradation; phosphorylation targets Sic1p for SCF(CDC4)-dependent turnover; functional homolog of mammalian Kip1 +S000036800 CDS YLR079W 12 286820 287674 W 2011-02-03 1996-07-31 +S000004070 ORF Verified YLR080W EMP46 chromosome 12 12 287916 289250 W 2011-02-03 1996-07-31 Integral membrane component of ER-derived COPII-coated vesicles; functions in ER to Golgi transport; EMP46 has a paralog, EMP47, that arose from the whole genome duplication +S000037384 CDS YLR080W 12 287916 289250 W 2011-02-03 1996-07-31 +S000118472 ARS ARS1212 ARSXII-289 chromosome 12 12 289315 289444 2014-11-18 2014-11-18|2006-08-30 Late-firing chromosomal replication origin +S000178134 ARS_consensus_sequence ARS1212 12 289422 289406 C 2014-11-18 2014-11-18 +S000004071 ORF Verified YLR081W GAL2 galactose permease GAL2 chromosome 12 L000000659 12 290212 291936 W 44 2011-02-03 1996-07-31 Galactose permease; required for utilization of galactose; also able to transport glucose +S000037506 CDS YLR081W 12 290212 291936 W 2011-02-03 1996-07-31 +S000004072 ORF Verified YLR082C SRL2 chromosome 12 L000004670 12 293572 292394 C 2011-02-03 1996-07-31 Protein of unknown function; overexpression suppresses the lethality caused by a rad53 null mutation +S000037548 CDS YLR082C 12 293572 292394 C 2011-02-03 1996-07-31 +S000004073 ORF Verified YLR083C EMP70 TMN1|p24a chromosome 12 L000000550 12 296094 294091 C 2011-02-03 1996-07-31 Protein with a role in cellular adhesion and filamentous growth; also endosome-to-vacuole sorting; similar to Tmn3p; member of Transmembrane Nine family of proteins with 9 transmembrane segments; EMP70 has a paralog, TMN2, that arose from the whole genome duplication +S000030358 CDS YLR083C 12 296094 294091 C 2011-02-03 1996-07-31 +S000004074 ORF Verified YLR084C RAX2 chromosome 12 12 300251 296589 C 2011-02-03 1996-07-31 N-glycosylated protein; involved in the maintenance of bud site selection during bipolar budding; localization requires Rax1p; RAX2 mRNA stability is regulated by Mpt5p +S000030482 CDS YLR084C 12 300251 296589 C 2011-02-03 1996-07-31 +S000004075 ORF Verified YLR085C ARP6 chromosome 12 L000003435 12 301989 300673 C 2011-02-03 1996-07-31 Actin-related protein that binds nucleosomes; a component of the SWR1 complex, which exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A +S000030596 CDS YLR085C 12 301989 300673 C 2011-02-03 1996-07-31 +S000004076 ORF Verified YLR086W SMC4 condensin subunit SMC4 chromosome 12 L000003472 12 302243 306499 W 2011-02-03 1996-07-31 Subunit of the condensin complex; condensin reorganizes chromosomes during both mitosis and meiosis; forms a subcomplex with Smc2p that has ATP-hydrolyzing and DNA-binding activity, but other condensin subunits are required for chromatin binding; required for tRNA gene clustering at the nucleolus; potential Cdc28p substrate +S000031513 CDS YLR086W 12 302243 306499 W 2011-02-03 1996-07-31 +S000004077 ORF Verified YLR087C CSF1 chromosome 12 12 315731 306855 C 2011-02-03 1996-07-31 Protein required for fermentation at low temperature; plays a role in the maturation of secretory proteins; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000031547 CDS YLR087C 12 315731 306855 C 2011-02-03 1996-07-31 +S000004078 ORF Verified YLR088W GAA1 GPI-anchor transamidase subunit GAA1|END2 chromosome 12 L000000557 12 316107 317951 W 2011-02-03 1996-07-31 Subunit of the GPI:protein transamidase complex; removes the GPI-anchoring signal and attaches GPI (glycosylphosphatidylinositol) to proteins in the ER; human homolog GPAA1 can complement growth defects of yeast thermosensitive mutant at restrictive temperature +S000031702 CDS YLR088W 12 316107 317951 W 2011-02-03 1996-07-31 +S000004079 ORF Verified YLR089C ALT1 alanine transaminase ALT1 chromosome 12 12 320015 318237 C 2011-02-03 1996-07-31 Alanine transaminase (glutamic pyruvic transaminase); involved in alanine biosynthesis and catabolism; TOR1-independent role in determining chronological lifespan; expression is induced in the presence of alanine; repression is mediated by Nrg1p; ALT1 has a paralog, ALT2, that arose from the whole genome duplication; Alt2p is catalytically inactive +S000031709 CDS YLR089C 12 320015 318237 C 2011-02-03 1996-07-31 +S000004080 ORF Verified YLR090W XDJ1 chromosome 12 L000002487 12 320701 322080 W 2011-02-03 1996-07-31 Chaperone with a role in facilitating mitochondrial protein import; ascomycete-specific member of the DnaJ-like family, closely related to Ydj1p; predicted to be C-terminally prenylated; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032708 CDS YLR090W 12 320701 322080 W 2011-02-03 1996-07-31 +S000004081 ORF Verified YLR091W GEP5 RRG5 chromosome 12 12 322297 323178 W 2011-02-03 1996-07-31 Protein of unknown function; required for mitochondrial genome maintenance; detected in highly purified mitochondria in high-throughput studies; null mutant has decreased levels of cardiolipin and phosphatidylethanolamine +S000032790 CDS YLR091W 12 322297 323178 W 2011-02-03 1996-07-31 +S000004082 ORF Verified YLR092W SUL2 sulfate permease chromosome 12 L000003473 12 323544 326225 W 2011-02-03 1996-07-31 High affinity sulfate permease; sulfate uptake is mediated by specific sulfate transporters Sul1p and Sul2p, which control the concentration of endogenous activated sulfate intermediates +S000033523 CDS YLR092W 12 323544 326225 W 2011-02-03 1996-07-31 +S000004083 ORF Verified YLR093C NYV1 MAM2 chromosome 12 L000004690 12 327415 326513 C 2011-02-03 2000-07-14|1996-07-31 v-SNARE component of the vacuolar SNARE complex; involved in vesicle fusion; inhibits ATP-dependent Ca(2+) transport activity of Pmc1p in the vacuolar membrane +S000033559 CDS YLR093C 12 327258 326513 C 2011-02-03 2000-07-14|1996-07-31 +S000033558 CDS YLR093C 12 327415 327400 C 2011-02-03 2000-07-14 +S000033560 intron YLR093C 12 327399 327259 C 2011-02-03 2000-07-14 +S000004084 ORF Verified YLR094C GIS3 chromosome 12 L000004863 12 329238 327730 C 2011-02-03 1996-07-31 Protein of unknown function +S000033649 CDS YLR094C 12 329238 327730 C 2011-02-03 1996-07-31 +S000004085 ORF Verified YLR095C IOC2 chromosome 12 12 332115 329677 C 2011-02-03 1996-07-31 Subunit of the Isw1b complex; exhibits nucleosome-stimulated ATPase activity and acts within coding regions to coordinate transcription elongation with termination and processing; contains a PHD finger motif; other complex members are Isw1p and Ioc4p +S000033765 CDS YLR095C 12 332115 329677 C 2011-02-03 1996-07-31 +S000004086 ORF Verified YLR096W KIN2 serine/threonine protein kinase KIN2 chromosome 12 L000000902 12 332590 336033 W 2011-02-03 1996-07-31 Serine/threonine protein kinase involved in regulation of exocytosis; localizes to the cytoplasmic face of the plasma membrane; KIN2 has a paralog, KIN1, that arose from the whole genome duplication +S000034747 CDS YLR096W 12 332590 336033 W 2011-02-03 1996-07-31 +S000004087 ORF Verified YLR097C HRT3 SCF ubiquitin ligase complex subunit HRT3 chromosome 12 12 337265 336231 C 2011-02-03 1996-07-31 Putative SCF-ubiquitin ligase F-box protein; based on both genetic and physical interactions and sequence similarity; identified in association with Cdc53p, Skp1p and Ubi4 in large and small-scale studies +S000034800 CDS YLR097C 12 337265 336231 C 2011-02-03 1996-07-31 +S000004088 ORF Verified YLR098C CHA4 SIL3|SIL2 chromosome 12 L000002854 12 339473 337527 C 2011-02-03 1996-07-31 DNA binding transcriptional activator; mediates serine/threonine activation of the catabolic L-serine (L-threonine) deaminase (CHA1); Zinc-finger protein with Zn[2]-Cys[6] fungal-type binuclear cluster domain +S000034932 CDS YLR098C 12 339473 337527 C 2011-02-03 1996-07-31 +S000004089 ORF Verified YLR099C ICT1 lysophosphatidic acid acyltransferase ICT1 chromosome 12 12 340928 339744 C 2011-02-03 1996-07-31 Lysophosphatidic acid acyltransferase; responsible for enhanced phospholipid synthesis during organic solvent stress; null displays increased sensitivity to Calcofluor white; highly expressed during organic solvent stress; ICT1 has a paralog, ECM18, that arose from the whole genome duplication; human ABHD5 can complement ict1 null mutant +S000035852 CDS YLR099C 12 340928 339744 C 2011-02-03 1996-07-31 +S000007618 ORF Verified YLR099W-A MIM2 chromosome 12 12 341325 341588 W 2011-02-03 2001-02-26 Mitochondrial protein required for outer membrane protein import; involved in import of the subset of proteins with multiple alpha-helical transmembrane segments, including Ugo1p, Tom20p, and Fzo1p; component of a large protein complex in the outer membrane that includes Mim1p; not essential in W303 strain background +S000037216 CDS YLR099W-A 12 341325 341588 W 2011-02-03 2001-02-26 +S000004090 ORF Verified YLR100W ERG27 3-keto-steroid reductase chromosome 12 12 341810 342853 W 2011-02-03 1996-07-31 3-keto sterol reductase; catalyzes the last of three steps required to remove two C-4 methyl groups from an intermediate in ergosterol biosynthesis; mutants are sterol auxotrophs; mutation is functionally complemented by human HSD17B7 +S000033168 CDS YLR100W 12 341810 342853 W 2011-02-03 1996-07-31 +S000004091 ORF Dubious YLR101C chromosome 12 12 342961 342566 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified, essential ORF ERG27/YLR100W +S000033199 CDS YLR101C 12 342961 342566 C 2011-02-03 1996-07-31 +S000178135 ARS ARS1212.5 chromosome 12 12 343577 344032 2014-11-18 2014-11-18 Strong autonomously replicating sequence +S000178136 ARS_consensus_sequence ARS1212.5 12 343855 343871 W 2014-11-18 2014-11-18 +S000004092 ORF Verified YLR102C APC9 anaphase promoting complex subunit 9 chromosome 12 L000004321 12 343767 342970 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition +S000033261 CDS YLR102C 12 343767 342970 C 2011-02-03 1996-07-31 +S000004093 ORF Verified YLR103C CDC45 DNA replication initiation factor CDC45|SLD4 chromosome 12 L000003380 12 345941 343989 C 2011-02-03 1996-07-31 DNA replication initiation factor; recruited to MCM pre-RC complexes at replication origins; promotes release of MCM from Mcm10p, recruits elongation machinery; binds tightly to ssDNA, which disrupts interaction with the MCM helicase and stalls it during replication stress; mutants in human homolog may cause velocardiofacial and DiGeorge syndromes +S000033319 CDS YLR103C 12 345941 343989 C 2011-02-03 1996-07-31 +S000004094 ORF Uncharacterized YLR104W LCL2 chromosome 12 12 346585 346980 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutant is deficient in cell wall mannosylphosphate and has long chronological lifespan; genetic interactions suggest a role in ER-associated protein degradation (ERAD); SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole +S000034290 CDS YLR104W 12 346585 346980 W 2011-02-03 1996-07-31 +S000004095 ORF Verified YLR105C SEN2 tRNA splicing endonuclease subunit SEN2 chromosome 12 L000001863 12 348180 347047 C 2011-02-03 1996-07-31 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface; Sen2p contains the active site for tRNA 5' splice site cleavage and has similarity to Sen34p and to Archaeal tRNA splicing endonuclease; +S000034355 CDS YLR105C 12 348180 347047 C 2011-02-03 1996-07-31 +S000007313 snoRNA_gene snR79 SNR79 Z9 chromosome 12 L000004807 12 348510 348427 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position C1007 +S000031838 noncoding_exon snR79 12 348510 348427 C 2011-02-03 2000-05-19 +S000004096 ORF Verified YLR106C MDN1 AAA family ATPase midasin|REA1 chromosome 12 S000028419 12 363738 349006 C 2011-02-03 1996-07-31 Huge dynein-related AAA-type ATPase (midasin); forms extended pre-60S particle with the Rix1 complex (Rix1p-Ipi1p-Ipi3p); acts in removal of ribosomal biogenesis factors at successive steps of pre-60S assembly and export from nucleus +S000035344 CDS YLR106C 12 363738 349006 C 2011-02-03 1996-07-31 +S000004097 ORF Verified YLR107W REX3 RNA exonuclease chromosome 12 12 364116 365330 W 2011-02-03 1996-07-31 RNA exonuclease; required for maturation of the RNA component of RNase MRP; functions redundantly with Rnh70p and Rex2p in processing of U5 snRNA and RNase P RNA; member of RNase D family of exonucleases +S000035537 CDS YLR107W 12 364116 365330 W 2011-02-03 1996-07-31 +S000007067 long_terminal_repeat YLRCdelta5 chromosome 12 12 366144 365810 C 2011-02-03 2000-05-19 Ty1 LTR +S000006494 snRNA_gene snR6 SNR6 U6 chromosome 12 L000001961 12 366235 366346 W 2011-02-03 2000-05-19 U6 spliceosomal RNA (U6 snRNA); mediates catalysis of pre-mRNA splicing by the spliceosome; interacts with U4; homology to U6 snRNA, interacts with snr14 +S000034320 noncoding_exon snR6 12 366235 366346 W 2011-02-03 2000-05-19 +S000004098 ORF Verified YLR108C chromosome 12 12 368124 366667 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; YLR108C is not an esssential gene; protein abundance increases in response to DNA replication stress; YLR108C has a paralog, YDR132C, that arose from the whole genome duplication +S000035581 CDS YLR108C 12 368124 366667 C 2011-02-03 1996-07-31 +S000004099 ORF Verified YLR109W AHP1 thioredoxin peroxidase AHP1|cTPxIII chromosome 12 S000007480 12 368781 369311 W 2011-02-03 1996-07-31 Thiol-specific peroxiredoxin; reduces hydroperoxides to protect against oxidative damage; function in vivo requires covalent conjugation to Urm1p +S000036533 CDS YLR109W 12 368781 369311 W 2011-02-03 1996-07-31 +S000004100 ORF Verified YLR110C CCW12 chromosome 12 12 370098 369697 C 2011-02-03 1996-07-31 Cell wall mannoprotein; plays a role in maintenance of newly synthesized areas of cell wall; localizes to periphery of small buds, septum region of larger buds, and shmoo tip; CCW12 has a paralog, YDR134C, that arose from the whole genome duplication +S000037291 CDS YLR110C 12 370098 369697 C 2011-02-03 1996-07-31 +S000004101 ORF Dubious YLR111W chromosome 12 12 370391 370723 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037464 CDS YLR111W 12 370391 370723 W 2011-02-03 1996-07-31 +S000004102 ORF Dubious YLR112W chromosome 12 12 370791 371210 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030153 CDS YLR112W 12 370791 371210 W 2011-02-03 1996-07-31 +S000004103 ORF Verified YLR113W HOG1 mitogen-activated protein kinase HOG1|SSK3 chromosome 12 L000000797 12 371620 372927 W 2011-02-03 1996-07-31 Mitogen-activated protein kinase involved in osmoregulation; controls global reallocation of RNAPII during osmotic shock; mediates recruitment/activation of RNAPII at Hot1p-dependent promoters; binds calmodulin; stimulates antisense transcription to activate CDC28; defines novel S-phase checkpoint with Mrc1p that prevent replication/transcription conflicts; nuclear form represses pseudohyphal growth; autophosphorylates; protein abundance increases under DNA replication stress +S000030351 CDS YLR113W 12 371620 372927 W 2011-02-03 1996-07-31 +S000118473 ARS ARS1213 ARSXII-373 chromosome 12 12 373254 373332 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000007095 long_terminal_repeat YLRWsigma2 chromosome 12 12 373999 374338 W 2011-02-03 2000-05-19 Ty3 LTR +S000006704 tRNA_gene tR(ACG)L chromosome 12 L000003646 12 374355 374427 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030443 noncoding_exon tR(ACG)L 12 374355 374427 W 2011-02-03 2000-05-19 +S000004104 ORF Verified YLR114C AVL9 chromosome 12 S000029049|S000029007 12 377238 374944 C 2011-02-03 1996-07-31 Conserved protein involved in exocytic transport from the Golgi; mutation is synthetically lethal with apl2 vps1 double mutation; member of a protein superfamily with orthologs in diverse organisms; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000030429 CDS YLR114C 12 377238 374944 C 2011-02-03 1996-07-31 +S000004105 ORF Verified YLR115W CFT2 cleavage polyadenylation factor subunit CFT2|YDH1 chromosome 12 L000003599 12 377985 380564 W 2011-02-03 1996-07-31 Subunit of the mRNA cleavage and polyadenlylation factor (CPF); required for pre-mRNA cleavage, polyadenylation and poly(A) site recognition, 43% similarity with the mammalian CPSF-100 protein. +S000031398 CDS YLR115W 12 377985 380564 W 2011-02-03 1996-07-31 +S000004106 ORF Verified YLR116W MSL5 mRNA splicing protein MSL5|BBP chromosome 12 L000004109 12 380822 382252 W 2011-02-03 1996-07-31 Component of commitment complex; which defines first step in splicing pathway; essential protein that interacts with Mud2p and Prp40p, forming a bridge between the intron ends; also involved in nuclear retention of pre-mRNA; relocalizes to the cytosol in response to hypoxia +S000031525 CDS YLR116W 12 380822 382252 W 2011-02-03 1996-07-31 +S000004107 ORF Verified YLR117C CLF1 NTC77|SYF3 chromosome 12 L000004628 12 384534 382471 C 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; homolog of Drosophila crooked neck protein; interacts with U1 snRNP proteins +S000031606 CDS YLR117C 12 384534 382471 C 2011-02-03 1996-07-31 +S000130182 ARS ARS1214 chromosome 12 12 384534 384725 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004108 ORF Verified YLR118C palmitoyl-(protein) hydrolase|APT1 chromosome 12 12 385408 384725 C 2011-02-03 1996-07-31 Acyl-protein thioesterase responsible for depalmitoylation of Gpa1p; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and nucleus and is induced in response to the DNA-damaging agent MMS +S000032586 CDS YLR118C 12 385408 384725 C 2011-02-03 1996-07-31 +S000004109 ORF Verified YLR119W SRN2 ESCRT-I subunit protein SRN2|VPL16|VPS37|SRN10 chromosome 12 L000003103 12 385534 386175 W 2011-02-03 1996-07-31 Component of the ESCRT-I complex; ESCRT-I is involved in ubiquitin-dependent sorting of proteins into the endosome; suppressor of rna1-1 mutation; may be involved in RNA export from nucleus +S000032725 CDS YLR119W 12 385534 386175 W 2011-02-03 1996-07-31 +S000004110 ORF Verified YLR120C YPS1 aspartyl protease|YAP3 chromosome 12 L000002491 12 388220 386511 C 2011-02-03 1996-07-31 Aspartic protease; hyperglycosylated member of the yapsin family of proteases, attached to the plasma membrane via a glycosylphosphatidylinositol (GPI) anchor; involved in nutrient limitation-induced cleavage of the extracellular inhibitory domain of signaling mucin Msb2p, resulting in activation of the filamentous growth MAPK pathway; involved with other yapsins in the cell wall integrity response; role in KEX2-independent processing of the alpha factor precursor +S000032796 CDS YLR120C 12 388220 386511 C 2011-02-03 1996-07-31 +S000028674 ORF Dubious YLR120W-A chromosome 12 12 388672 388773 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YLR121C +S000032521 CDS YLR120W-A 12 388672 388773 W 2011-02-03 2003-07-29 +S000004111 ORF Verified YLR121C YPS3 aspartyl protease|YPS4 chromosome 12 L000004383 12 390270 388744 C 2011-02-03 1996-07-31 Aspartic protease; member of the yapsin family of proteases involved in cell wall growth and maintenance; attached to the plasma membrane via a glycosylphosphatidylinositol (GPI) anchor +S000032903 CDS YLR121C 12 390270 388744 C 2011-02-03 1996-07-31 +S000004112 ORF Dubious YLR122C chromosome 12 12 391331 390954 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR123C +S000033010 CDS YLR122C 12 391331 390954 C 2011-02-03 1996-07-31 +S000004113 ORF Dubious YLR123C chromosome 12 12 391407 391078 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR122C; contains characteristic aminoacyl-tRNA motif +S000033100 CDS YLR123C 12 391407 391078 C 2011-02-03 1996-07-31 +S000004114 ORF Dubious YLR124W chromosome 12 12 391600 391944 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033902 CDS YLR124W 12 391600 391944 W 2011-02-03 1996-07-31 +S000004115 ORF Uncharacterized YLR125W chromosome 12 12 393484 393894 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutant has decreased Ty3 transposition; YLR125W is not an essential gene +S000034058 CDS YLR125W 12 393484 393894 W 2011-02-03 1996-07-31 +S000004116 ORF Verified YLR126C putative amidotransferase chromosome 12 12 395520 394765 C 2011-02-03 1996-07-31 Putative glutamine amidotransferase; has Aft1p-binding motif in the promoter; may be involved in copper and iron homeostasis; YLR126C is not an essential protein; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000034899 CDS YLR126C 12 395520 394765 C 2011-02-03 1996-07-31 +S000004117 ORF Verified YLR127C APC2 anaphase promoting complex subunit 2|TID2|RSI1 chromosome 12 L000003970|L000004348 12 398319 395758 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the catalytic core of the APC/C; has similarity to cullin Cdc53p +S000035048 CDS YLR127C 12 398319 395758 C 2011-02-03 1996-07-31 +S000004118 ORF Verified YLR128W DCN1 NEDD8 ligase DCN1 chromosome 12 12 398530 399433 W 2011-02-03 1996-07-31 Scaffold-type E3 ligase; required for cullin neddylation and ubiquitin ligase activation; contains a ubiquitin-binding domain (UBA) for ubiquitin and Nedd8 (Rub1p) interaction and a PONY domain involved in cullin binding and neddylation +S000035287 CDS YLR128W 12 398530 398532 W 2011-02-03 1996-07-31 +S000035288 CDS YLR128W 12 398627 399433 W 2011-02-03 1996-07-31 +S000035289 intron YLR128W 12 398533 398626 W 2011-02-03 1996-07-31 +S000004119 ORF Verified YLR129W DIP2 snoRNA-binding rRNA-processing protein DIP2|UTP12 chromosome 12 L000003088 12 399657 402488 W 2011-02-03 1996-07-31 Nucleolar protein; specifically associated with the U3 snoRNA, part of the large ribonucleoprotein complex known as the small subunit (SSU) processome, required for 18S rRNA biogenesis, part of the active pre-rRNA processing complex +S000036230 CDS YLR129W 12 399657 402488 W 2011-02-03 1996-07-31 +S000004120 ORF Verified YLR130C ZRT2 low-affinity Zn(2+) transporter ZRT2 chromosome 12 L000004167 12 404062 402794 C 2011-02-03 1996-07-31 Low-affinity zinc transporter of the plasma membrane; transcription is induced under low-zinc conditions by the Zap1p transcription factor +S000037080 CDS YLR130C 12 404062 402794 C 2011-02-03 1996-07-31 +S000004121 ORF Verified YLR131C ACE2 DNA-binding transcription factor ACE2 chromosome 12 L000000020 12 406822 404510 C 2011-02-03 1996-07-31 Transcription factor required for septum destruction after cytokinesis; phosphorylation by Cbk1p blocks nuclear exit during M/G1 transition, causing localization to daughter cell nuclei, and also increases Ace2p activity; phosphorylation by Cdc28p and Pho85p prevents nuclear import during cell cycle phases other than cytokinesis; part of RAM network that regulates cellular polarity and morphogenesis; ACE2 has a paralog, SWI5, that arose from the whole genome duplication +S000037197 CDS YLR131C 12 406822 404510 C 2011-02-03 1996-07-31 +S000004122 ORF Verified YLR132C USB1 phosphoric diester hydrolase chromosome 12 12 408155 407283 C 2011-02-03 1996-07-31 Putative poly(U)-specific 3'-to-5' RNA exonuclease; involved in 3'-end processing of U6 snRNA removing uridines and generating a terminal 2′,3′ cyclic phosphate; essential protein that localizes to the nucleus and mitochondria; overexpression suppresses the respiratory defects of oxa1 and mtf2 mutants; homolog of S.pombe gene, mpn1 and human gene, hUSB1; mutations in hUSB1 are associated with a rare genodermatosis, poikiloderma with neutropenia (OMIM 604173) +S000037305 CDS YLR132C 12 408155 407283 C 2011-02-03 1996-07-31 +S000004123 ORF Verified YLR133W CKI1 bifunctional choline kinase/ethanolamine kinase CKI1 chromosome 12 L000000346 12 408445 410193 W 2011-02-03 1996-07-31 Choline kinase; catalyzes the first step in phosphatidylcholine synthesis via the CDP-choline (Kennedy pathway); exhibits some ethanolamine kinase activity contributing to phosphatidylethanolamine synthesis via the CDP-ethanolamine pathway; CKI1 has a paralog, EKI1, that arose from the whole genome duplication +S000030014 CDS YLR133W 12 408445 410193 W 2011-02-03 1996-07-31 +S000004124 ORF Verified YLR134W PDC5 indolepyruvate decarboxylase 5 chromosome 12 L000001356 12 410723 412414 W 2011-02-03 1996-07-31 Minor isoform of pyruvate decarboxylase; key enzyme in alcoholic fermentation, decarboxylates pyruvate to acetaldehyde, regulation is glucose- and ethanol-dependent, repressed by thiamine, involved in amino acid catabolism +S000030184 CDS YLR134W 12 410723 412414 W 2011-02-03 1996-07-31 +S000118474 ARS ARS1215 ARSXII-413 chromosome 12 12 412686 412893 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000004125 ORF Verified YLR135W SLX4 chromosome 12 12 413281 415527 W 2011-02-03 1996-07-31 Endonuclease involved in processing DNA; acts during recombination, repair; promotes template switching during break-induced replication (BIR), causing non-reciprocal translocations (NRTs); cleaves branched structures in complex with Slx1p; involved in interstrand cross-link repair, Rad1p/Rad10p-dependent removal of 3'-nonhomologous tails during DSBR via single-strand annealing; relative distribution to nuclear foci increases upon DNA replication stress; FANCP-related factor +S000031127 CDS YLR135W 12 413281 415527 W 2011-02-03 1996-07-31 +S000004126 ORF Verified YLR136C TIS11 CTH2 chromosome 12 L000002895 12 416658 415801 C 2011-02-03 1996-07-31 mRNA-binding protein expressed during iron starvation; binds to a sequence element in the 3'-untranslated regions of specific mRNAs to mediate their degradation; involved in iron homeostasis; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; TIS11 has a paralog, CTH1, that arose from the whole genome duplication +S000031183 CDS YLR136C 12 416658 415801 C 2011-02-03 1996-07-31 +S000004127 ORF Verified YLR137W RKM5 S-adenosylmethionine-dependent methyltransferase chromosome 12 12 417006 418109 W 2011-02-03 1996-07-31 Protein lysine methyltransferase; monomethylates Lys-46 of the ribosomal large subunit Rpl1a/Rpl1b; member of the seven beta-strand methyltransferase superfamily; orthologs only found among fungal species +S000031387 CDS YLR137W 12 417006 418109 W 2011-02-03 1996-07-31 +S000004128 ORF Verified YLR138W NHA1 chromosome 12 L000004113 12 418437 421394 W 2011-02-03 1996-07-31 Na+/H+ antiporter; involved in sodium and potassium efflux through the plasma membrane; required for alkali cation tolerance at acidic pH +S000032374 CDS YLR138W 12 418437 421394 W 2011-02-03 1996-07-31 +S000004129 ORF Verified YLR139C SLS1 chromosome 12 L000002656 12 423473 421542 C 2011-02-03 1996-07-31 Mitochondrial membrane protein; coordinates expression of mitochondrially-encoded genes; may facilitate delivery of mRNA to membrane-bound translation machinery +S000032442 CDS YLR139C 12 423473 421542 C 2011-02-03 1996-07-31 +S000004130 ORF Dubious YLR140W chromosome 12 12 423474 423800 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps essential RRN5 gene which encodes a member of the UAF transcription factor involved in transcription of rDNA by RNA polymerase I +S000033242 CDS YLR140W 12 423474 423800 W 2011-02-03 1996-07-31 +S000004131 ORF Verified YLR141W RRN5 chromosome 12 L000003261 12 423683 424774 W 2011-02-03 1996-07-31 Protein involved in transcription of rDNA by RNA polymerase I; transcription factor, member of UAF (upstream activation factor) family along with Rrn9p and Rrn10p +S000033304 CDS YLR141W 12 423683 424774 W 2011-02-03 1996-07-31 +S000004132 ORF Verified YLR142W PUT1 proline dehydrogenase chromosome 12 L000001535 12 425186 426616 W 73 2011-02-03 1996-07-31 Proline oxidase; nuclear-encoded mitochondrial protein involved in utilization of proline as sole nitrogen source; PUT1 transcription is induced by Put3p in the presence of proline and the absence of a preferred nitrogen source +S000033371 CDS YLR142W 12 425186 426616 W 2011-02-03 1996-07-31 +S000006541 tRNA_gene tD(GUC)L1 chromosome 12 L000003647 12 427132 427203 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000031841 noncoding_exon tD(GUC)L1 12 427132 427203 W 2011-02-03 2000-05-19 +S000004133 ORF Verified YLR143W DPH6 diphthine--ammonia ligase chromosome 12 12 427329 429386 W 2011-02-03 1996-07-31 Diphthamide synthetase; catalyzes the last amidation step of diphthamide biosynthesis using ammonium and ATP; evolutionarily conserved in eukaryotes; dph6 mutants exhibit diphthine accumulation and resistance to sordarin, which is indicative of defects in diphthamide formation on EF2; green fluorescent protein (GFP)-tagged protein localizes to the cytoplasm; DPH6/YLR143W is not an essential gene +S000034284 CDS YLR143W 12 427329 429386 W 2011-02-03 1996-07-31 +S000004134 ORF Verified YLR144C ACF2 PCA1|ENG2 chromosome 12 L000004011 12 432016 429677 C 2011-02-03 1996-07-31 Intracellular beta-1,3-endoglucanase; expression is induced during sporulation; may have a role in cortical actin cytoskeleton assembly; protein abundance increases in response to DNA replication stress +S000034344 CDS YLR144C 12 432016 429677 C 2011-02-03 1996-07-31 +S000004135 ORF Verified YLR145W RMP1 chromosome 12 12 432168 432773 W 2011-02-03 1996-07-31 Subunit of RNase MRP; RNase MRP processes pre-rRNA and has a role in cell cycle-regulated degradation of daughter cell-specific mRNAs; unlike most subunits, not shared between RNase MRP and nuclear RNase P +S000034472 CDS YLR145W 12 432168 432773 W 2011-02-03 1996-07-31 +S000004136 ORF Verified YLR146C SPE4 spermine synthase chromosome 12 L000004341 12 433725 432823 C 2011-02-03 1996-07-31 Spermine synthase; required for the biosynthesis of spermine and also involved in biosynthesis of pantothenic acid +S000034521 CDS YLR146C 12 433725 432823 C 2011-02-03 1996-07-31 +S000113566 ORF Uncharacterized YLR146W-A chromosome 12 12 433870 434058 W 2011-02-03 2005-11-17 Putative protein of unknown function +S000113567 CDS YLR146W-A 12 433870 434058 W 2011-02-03 2005-11-17 +S000004137 ORF Verified YLR147C SMD3 mRNA splicing protein SMD3|Sm D3|SLT16 chromosome 12 L000001929 12 434463 434158 C 2011-02-03 1996-07-31 Core Sm protein Sm D3; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm D3 +S000035546 CDS YLR147C 12 434463 434158 C 2011-02-03 1996-07-31 +S000004138 ORF Verified YLR148W PEP3 tethering complex subunit PEP3|VPT18|VPS18|VAM8 chromosome 12 L000001374|L000002473 12 434641 437397 W 91 2011-02-03 1996-07-31 Component of CORVET membrane tethering complex; vacuolar peripheral membrane protein that promotes vesicular docking/fusion reactions in conjunction with SNARE proteins, required for vacuolar biogenesis +S000035686 CDS YLR148W 12 434641 437397 W 2011-02-03 1996-07-31 +S000004139 ORF Verified YLR149C chromosome 12 12 439823 437631 C 2011-02-03 1996-07-31 Protein of unknown function; overexpression causes a cell cycle delay or arrest; null mutation results in a decrease in plasma membrane electron transport; YLR149C is not an essential gene; protein abundance increases in response to DNA replication stress +S000035734 CDS YLR149C 12 439823 437631 C 2011-02-03 1996-07-31 +S000007619 ORF Dubious YLR149C-A chromosome 12 12 440456 440370 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037217 CDS YLR149C-A 12 440456 440370 C 2011-02-03 2001-02-26 +S000004140 ORF Verified YLR150W STM1 MPT4 chromosome 12 L000002574 12 440467 441288 W 2011-02-03 1996-07-31 Protein required for optimal translation under nutrient stress; perturbs association of Yef3p with ribosomes; involved in TOR signaling; binds G4 quadruplex and purine motif triplex nucleic acid; helps maintain telomere structure; protein abundance increases in response to DNA replication stress; serves as a ribosome preservation factor both during quiescence and recovery +S000036485 CDS YLR150W 12 440467 441288 W 2011-02-03 1996-07-31 +S000004141 ORF Verified YLR151C PCD1 8-oxo-dGTP diphosphatase chromosome 12 12 442737 441715 C 2011-02-03 1996-07-31 8-oxo-dGTP diphosphatase; prevents spontaneous mutagenesis via sanitization of oxidized purine nucleoside triphosphates; can also act as peroxisomal pyrophosphatase with specificity for coenzyme A and CoA derivatives, may function to remove potentially toxic oxidized CoA disulfide from peroxisomes to maintain the capacity for beta-oxidation of fatty acids; nudix hydrolase family member; similar E. coli MutT and human, rat and mouse MTH1 +S000036493 CDS YLR151C 12 442737 441715 C 2011-02-03 1996-07-31 +S000004142 ORF Uncharacterized YLR152C chromosome 12 12 444688 442958 C 2011-02-03 1996-07-31 Putative protein of unknown function; YLR152C is not an essential gene +S000036614 CDS YLR152C 12 444688 442958 C 2011-02-03 1996-07-31 +S000004143 ORF Verified YLR153C ACS2 acetate--CoA ligase ACS2 chromosome 12 L000003111 12 447575 445524 C 2011-02-03 1996-07-31 Acetyl-coA synthetase isoform; along with Acs1p, acetyl-coA synthetase isoform is the nuclear source of acetyl-coA for histone acetylation; mutants affect global transcription; required for growth on glucose; expressed under anaerobic conditions +S000036713 CDS YLR153C 12 447575 445524 C 2011-02-03 1996-07-31 +S000004144 ORF Verified YLR154C RNH203 Rnh2C chromosome 12 12 448314 447982 C 2011-02-03 1996-07-31 Ribonuclease H2 subunit; required for RNase H2 activity; role in ribonucleotide excision repair; related to human AGS3 that causes Aicardi-Goutieres syndrome +S000037436 CDS YLR154C 12 448314 447982 C 2011-02-03 1996-07-31 +S000006699 tRNA_gene tQ(UUG)L chromosome 12 L000003663 12 448721 448650 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000032585 noncoding_exon tQ(UUG)L 12 448721 448650 C 2011-02-03 2000-05-19 +S000007084 long_terminal_repeat YLRWdelta6 chromosome 12 12 448842 449028 W 2011-02-03 2000-05-19 Ty1 LTR +S000118475 ARS ARS1216 ARSXII-451 chromosome 12 12 450485 450725 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178137 ARS_consensus_sequence ARS1216 12 450506 450522 W 2014-11-18 2014-11-18 +S000029718 rRNA_gene ETS2-1 ETS2-1 3' ETS chromosome 12 12 451785 451575 C 2011-02-03 2004-03-04 Non-coding region located adjacent to and downstream of RDN25; transcribed as part of the 35S rRNA precursor transcript; contains the primary rRNA transcription termination site at +93 and a secondary termination site between +211 and +250 +S000036854 external_transcribed_spacer_region ETS2-1 12 451785 451575 C 2011-02-03 2004-03-04 +S000028675 ORF Dubious YLR154W-A YLR154W-C chromosome 12 12 452438 452623 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 25S rRNA gene on the opposite strand +S000032525 CDS YLR154W-A 12 452438 452623 W 2011-02-03 2003-07-29 +S000028563 ORF Dubious YLR154W-B chromosome 12 12 454392 454556 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 25S rRNA gene on the opposite strand +S000031269 CDS YLR154W-B 12 454392 454556 W 2011-02-03 2003-07-29 +S000028422 ORF Verified YLR154W-C TAR1 YLR154W-A chromosome 12 S000007646 12 454696 455070 W 2011-02-03 2002-06-20 Protein potentially involved in regulation of respiratory metabolism; located in the mitochondria; interacts genetically with RPO41 and physically with Coq5p; encoded within the 25S rRNA gene on the opposite strand +S000029958 CDS YLR154W-C 12 454696 455070 W 2011-02-03 2002-06-20 +S000006484 rRNA_gene RDN25-1 RDN25-1 26S rRNA|RDN25 chromosome 12 12 455181 451786 C 2011-02-03 2000-05-19 25S ribosomal RNA (25S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript; formed by endonucleolytic cleavage at the C2 site of internal transcribed spacer 2 (ITS2) +S000032318 noncoding_exon RDN25-1 12 455181 451786 C 2011-02-03 2000-05-19 +S000029716 rRNA_gene ITS2-1 ITS2-1 ITS2 chromosome 12 12 455413 455182 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN25; transcribed as part of the 35S rRNA precursor transcript; forms a stem-loop structure that is required for processing of the precursor transcript +S000036852 internal_transcribed_spacer_region ITS2-1 12 455413 455182 C 2011-02-03 2004-03-04 +S000028676 ORF Dubious YLR154W-E chromosome 12 12 455433 455636 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 35S rRNA gene on the opposite strand +S000032527 CDS YLR154W-E 12 455433 455636 W 2011-02-03 2003-07-29 +S000006488 rRNA_gene RDN58-1 RDN58-1 RDN58 chromosome 12 12 455571 455414 C 2011-02-03 2000-05-19 5.8S ribosomal RNA (5.8S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript; 3' end formation involves processing by the exosome complex while 5' end is generated by Kem1p and Rat1p +S000033911 noncoding_exon RDN58-1 12 455571 455414 C 2011-02-03 2000-05-19 +S000028843 ORF Dubious YLR154W-F chromosome 12 12 455883 456023 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; encoded within the 35S rRNA gene on the opposite strand +S000034528 CDS YLR154W-F 12 455883 456023 W 2011-02-03 2003-07-29 +S000029715 rRNA_gene ITS1-1 ITS1-1 ITS1 chromosome 12 12 455932 455572 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN18; transcribed as part of the 35S rRNA precursor transcript; excision during transcript maturation is coupled with processing of the 3' external transcribed spacer (3'ETS) +S000036841 internal_transcribed_spacer_region ITS1-1 12 455932 455572 C 2011-02-03 2004-03-04 +S000006482 rRNA_gene RDN18-1 RDN18-1 RDN18 chromosome 12 12 457732 455933 C 2011-02-03 2000-05-19 18S ribosomal RNA (18S rRNA); component of the small (40S) ribosomal subunit; involved in codon recognition by tRNAs or the release factor eRF1 (Sup45p); encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript +S000033329 noncoding_exon RDN18-1 12 457732 455933 C 2011-02-03 2000-05-19 +S000006486 rRNA_gene RDN37-1 RDN37-1 RDN37 chromosome 12 12 458432 451575 C 2011-02-03 1997-07-30 35S ribosomal RNA (35S rRNA) transcript; encoded by the RDN1 locus; processed into the 25S, 18S and 5.8S rRNAs (represented by the RDN25, RDN18, and RDN58 loci) +S000032929 external_transcribed_spacer_region RDN37-1 12 451785 451575 C 2011-02-03 2000-05-19 +S000032923 external_transcribed_spacer_region RDN37-1 12 458432 457733 C 2011-02-03 2000-05-19 +S000032927 internal_transcribed_spacer_region RDN37-1 12 455413 455182 C 2011-02-03 2000-05-19 +S000032925 internal_transcribed_spacer_region RDN37-1 12 455932 455572 C 2011-02-03 2000-05-19 +S000032928 noncoding_exon RDN37-1 12 455181 451786 C 2011-02-03 2000-05-19 +S000032926 noncoding_exon RDN37-1 12 455571 455414 C 2011-02-03 2000-05-19 +S000032924 noncoding_exon RDN37-1 12 457732 455933 C 2011-02-03 2000-05-19 +S000029717 rRNA_gene ETS1-1 ETS1-1 5' ETS chromosome 12 12 458432 457733 C 2011-02-03 2004-03-04 Non-coding region located immediately upstream of RDN18; transcribed as part of the 35S rRNA precursor transcript; contains an essential U3 snoRNA binding site required for maturation of 18S rRNA +S000036853 external_transcribed_spacer_region ETS1-1 12 458432 457733 C 2011-02-03 2004-03-04 +S000120636 ARS ARS1200-1 ARSXII-459|ARS1216.5|rDNA ARS chromosome 12 12 458991 459097 2011-02-03 2007-02-06 Chromosomal origin of bidirectional DNA replication; an rDNA ARS is presumed to be present in each tandem rDNA repeat, but fewer than one-third of the rDNA ARSs are actually used as replication origins in a given S phase +S000120639 ARS_consensus_sequence ARS1200-1 12 459088 459078 C 2011-02-03 2007-02-06 +S000029329 rRNA_gene NTS2-1 NTS2-1 chromosome 12 L000003944 12 459675 458433 C 2011-02-03 2003-12-09 Nontranscribed region of the rDNA repeat; located between RND5 and the 5'ETS; contains RNA polymerase I termination site +S000032460 non_transcribed_region NTS2-1 12 459675 458433 C 2011-02-03 2003-12-09 +S000006479 rRNA_gene RDN5-1 RDN5-1 MOF9|RDN5 chromosome 12 L000004821|S000029304 12 459676 459796 W 2011-02-03 2000-05-19 5S ribosomal RNA (5S rRNA); only complete sequence of 6 repeated RDN5 alleles; able to support viability when provided as sole form of 5S rRNA; component of the large (60S) ribosomal subunit; localized to the nucleolus via interaction with Rpl5p; may play a role in translational frame fidelity; transcription is mediated by PolIII and activated by TFIIIA and TFIIIE +S000031406 noncoding_exon RDN5-1 12 459676 459796 W 2011-02-03 2000-05-19 +S000029714 rRNA_gene NTS1-2 NTS1-2 NTS1 chromosome 12 12 460711 459797 C 2011-02-03 2004-03-04 Non-transcribed region of the rDNA repeat between the 3' ETS and RDN5; required for rDNA repeat expansion +S000036840 non_transcribed_region NTS1-2 12 460711 459797 C 2011-02-03 2004-03-04 +S000029713 rRNA_gene ETS2-2 ETS2-2 3' ETS chromosome 12 12 460922 460712 C 2011-02-03 2004-03-04 Non-coding region located adjacent to RDN25; transcribed as part of the 35S rRNA precursor transcript; contains the primary rRNA transcription termination site at +93 and a secondary termination site between +211 and +250 +S000036839 external_transcribed_spacer_region ETS2-2 12 460922 460712 C 2011-02-03 2004-03-04 +S000028561 ORF Uncharacterized YLR154C-G chromosome 12 12 462671 462522 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; this ORF is contained within RDN25-2 and RDN37-2 +S000031267 CDS YLR154C-G 12 462671 462522 C 2011-02-03 2003-07-29 +S000006485 rRNA_gene RDN25-2 RDN25-2 26S rRNA|RDN25 chromosome 12 12 464318 460923 C 2011-02-03 2000-05-19 25S ribosomal RNA (25S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript; formed by endonucleolytic cleavage at the C2 site of internal transcribed spacer 2 (ITS2) +S000032336 noncoding_exon RDN25-2 12 464318 460923 C 2011-02-03 2000-05-19 +S000029712 rRNA_gene ITS2-2 ITS2-2 ITS2 chromosome 12 12 464550 464319 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN25; transcribed as part of the 35S rRNA precursor transcript; forms a stem-loop structure required for processing of the precursor transcript +S000036837 internal_transcribed_spacer_region ITS2-2 12 464550 464319 C 2011-02-03 2004-03-04 +S000006489 rRNA_gene RDN58-2 RDN58-2 RDN58 chromosome 12 12 464708 464551 C 2011-02-03 2000-05-19 5.8S ribosomal RNA (5.8S rRNA); component of the large (60S) ribosomal subunit; encoded in the rDNA repeat (RDN1) +S000033912 noncoding_exon RDN58-2 12 464708 464551 C 2011-02-03 2000-05-19 +S000029709 rRNA_gene ITS1-2 ITS1-2 ITS1 chromosome 12 12 465069 464709 C 2011-02-03 2004-03-04 Non-coding region between RDN58 and RDN18; transcribed as part of the 35S rRNA precursor transcript; excision during transcript maturation is coupled with processing of the 3' external transcribed spacer (3' ETS) +S000036833 internal_transcribed_spacer_region ITS1-2 12 465069 464709 C 2011-02-03 2004-03-04 +S000006483 rRNA_gene RDN18-2 RDN18-2 RDN18 chromosome 12 12 466869 465070 C 2011-02-03 2000-05-19 18S ribosomal RNA (18S rRNA); component of the small (40S) ribosomal subunit; involved in codon recognition by tRNAs or the release factor eRF1 (Sup45p); encoded in the rDNA repeat (RDN1) as part of the 35S primary transcript +S000033332 noncoding_exon RDN18-2 12 466869 465070 C 2011-02-03 2000-05-19 +S000006487 rRNA_gene RDN37-2 RDN37-2 RDN37 chromosome 12 12 467569 460712 C 2011-02-03 1997-07-30 35S ribosomal RNA (35S rRNA) transcript; encoded by the RDN1 locus; processed into the 25S, 18S and 5.8S rRNAs (represented by the RDN25, RDN18, and RDN58 loci) +S000032939 external_transcribed_spacer_region RDN37-2 12 460922 460712 C 2011-02-03 2000-05-19 +S000032933 external_transcribed_spacer_region RDN37-2 12 467569 466870 C 2011-02-03 2000-05-19 +S000032937 internal_transcribed_spacer_region RDN37-2 12 464550 464319 C 2011-02-03 2000-05-19 +S000032935 internal_transcribed_spacer_region RDN37-2 12 465069 464709 C 2011-02-03 2000-05-19 +S000032938 noncoding_exon RDN37-2 12 464318 460923 C 2011-02-03 2000-05-19 +S000032936 noncoding_exon RDN37-2 12 464708 464551 C 2011-02-03 2000-05-19 +S000032934 noncoding_exon RDN37-2 12 466869 465070 C 2011-02-03 2000-05-19 +S000029707 rRNA_gene ETS1-2 ETS1-2 5' ETS chromosome 12 12 467569 466870 C 2011-02-03 2004-03-04 Non-coding region located immediately upstream of RDN18; transcribed as part of the 35S rRNA precursor transcript; contains an essential U3 snoRNA binding site required for maturation of 18S rRNA +S000036830 external_transcribed_spacer_region ETS1-2 12 467569 466870 C 2011-02-03 2004-03-04 +S000120655 ARS ARS1200-2 ARSXII-468|rDNA ARS chromosome 12 12 468128 468234 2011-02-03 2007-02-06 Chromosomal origin of bidirectional DNA replication; an rDNA ARS is presumed to be present in each tandem rDNA repeat, but fewer than one-third of the rDNA ARSs are actually used as replication origins in a given S phase +S000120656 ARS_consensus_sequence ARS1200-2 12 468225 468215 C 2011-02-03 2007-02-06 +S000029706 rRNA_gene NTS2-2 NTS2-2 NTS2 chromosome 12 12 468812 467570 C 2011-02-03 2004-03-04 Non-transcribed region of the rDNA repeat; located between RDN5 and the 5' ETS +S000036829 non_transcribed_region NTS2-2 12 468812 467570 C 2011-02-03 2004-03-04 +S000006480 rRNA_gene RDN5-2 RDN5-2 RDN5 chromosome 12 12 468813 468931 W 2011-02-03 1997-07-30 Variant 5S ribosomal rRNA (5S rRNA) gene; located within the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-3, RDN5-4, and RDN5-5 +S000031412 noncoding_exon RDN5-2 12 468813 468931 W 2011-02-03 2000-05-19 +S000028562 ORF Uncharacterized YLR154C-H chromosome 12 12 468958 468827 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; this ORF partially overlaps RDN5-2; YLR154C-H has a paralog, YLR157C-C, that arose from a segmental duplication +S000031268 CDS YLR154C-H 12 468958 468827 C 2011-02-03 2003-07-29 +S000004145 ORF Verified YLR155C ASP3-1 asparaginase ASP3-1|ASP3 chromosome 12 L000000130 12 470405 469317 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-1 has a paralog, ASP3-3, that arose from a segmental duplication +S000037563 CDS YLR155C 12 470405 469317 C 2011-02-03 1996-07-31 +S000004146 ORF Uncharacterized YLR156W chromosome 12 12 472113 472457 W 2011-02-03 1996-07-31 Putative protein of unknown function; exhibits a two-hybrid interaction with Jsn1p in a large-scale analysis; YLR156W has a paralog, YLR159W, that arose from a segmental duplication +S000030409 CDS YLR156W 12 472113 472457 W 2011-02-03 1996-07-31 +S000006481 rRNA_gene RDN5-3 RDN5-3 RDN5 chromosome 12 12 472465 472583 W 2011-02-03 1997-07-30 Variant 5S ribosomal RNA (5S rRNA) gene; located at a site distal to the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-2, RDN5-4, and RDN5-5 +S000031417 noncoding_exon RDN5-3 12 472465 472583 W 2011-02-03 2000-05-19 +S000028564 ORF Uncharacterized YLR156C-A chromosome 12 12 472610 472479 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; partially overlaps RND5-3; YLR156C-A has a paralog, YLR159C-A, that arose from a segmental duplication +S000031270 CDS YLR156C-A 12 472610 472479 C 2011-02-03 2003-07-29 +S000004147 ORF Verified YLR157C ASP3-2 asparaginase ASP3-2|ASP3 chromosome 12 12 474057 472969 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-2 has a paralog, ASP3-4, that arose from a segmental duplication +S000030487 CDS YLR157C 12 474057 472969 C 2011-02-03 1996-07-31 +S000028677 ORF Uncharacterized YLR157W-D YLR157W-A chromosome 12 12 475764 475976 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; YLR157W-D has a paralog, YLR161W, that arose from a segmental duplication +S000032531 CDS YLR157W-D 12 475764 475976 W 2011-02-03 2003-07-29 +S000007068 long_terminal_repeat YLRCdelta7 chromosome 12 12 476310 475976 C 2011-02-03 2000-05-19 Ty1 LTR +S000007374 transposable_element_gene YLR157C-B gag-pol fusion protein chromosome 12 12 481601 476333 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000035905 CDS YLR157C-B 12 480295 476333 C 2011-02-03 1999-07-17 +S000035904 CDS YLR157C-B 12 481601 480297 C 2011-02-03 1999-07-17 +S000035906 plus_1_translational_frameshift YLR157C-B 12 480296 480296 C 2011-02-03 1999-07-17 +S000007373 transposable_element_gene YLR157C-A gag protein chromosome 12 12 481601 480279 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035900 CDS YLR157C-A 12 481601 480279 C 2011-02-03 1999-07-17 +S000028678 ORF Uncharacterized YLR157W-E YLR157W-B|YLR157W-C chromosome 12 12 481873 482037 W 2011-02-03 2003-07-29 Putative protein of unknown function identified by gene-trapping; microarray-based expression analysis, and genome-wide homology searching; partially overlaps a Ty1 element +S000032535 CDS YLR157W-E 12 481873 482037 W 2011-02-03 2003-07-29 +S000007081 LTR_retrotransposon YLRCTy1-1 Ty1 chromosome 12 12 481897 475976 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007069 long_terminal_repeat YLRCdelta8 chromosome 12 12 481897 481563 C 2011-02-03 2000-05-19 Ty1 LTR +S000029708 rRNA_gene RDN5-4 RDN5-4 RDN5 chromosome 12 12 482045 482163 W 2011-02-03 2004-03-04 Variant 5S ribosomal rRNA (5S rRNA) gene; located at a site distal to the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-2, RDN5-3, and RDN5-5 +S000036831 noncoding_exon RDN5-4 12 482045 482163 W 2011-02-03 2004-03-04 +S000028565 ORF Uncharacterized YLR157C-C chromosome 12 12 482190 482059 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; this ORF partially overlaps RDN5-4; YLR157C-C has a paralog, YLR154C-H, that arose from a segmental duplication +S000031271 CDS YLR157C-C 12 482190 482059 C 2011-02-03 2003-07-29 +S000004148 ORF Verified YLR158C ASP3-3 asparaginase ASP3-3|ASP3 chromosome 12 12 483637 482549 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-3 has a paralog, ASP3-1, that arose from a segmental duplication +S000030598 CDS YLR158C 12 483637 482549 C 2011-02-03 1996-07-31 +S000004149 ORF Uncharacterized YLR159W chromosome 12 12 485345 485689 W 2011-02-03 1996-07-31 Putative protein of unknown function; YLR156W, YLR159W, and YLR161W are three identical open reading frames in S288C encoded near the ribosomal DNA region of chromosome 12; YLR159W has a paralog, YLR156W, that arose from a segmental duplication +S000031528 CDS YLR159W 12 485345 485689 W 2011-02-03 1996-07-31 +S000029710 rRNA_gene RDN5-5 RDN5-5 RDN5 chromosome 12 12 485697 485815 W 2011-02-03 2004-03-04 Variant 5S ribosomal rRNA (5S rRNA) gene; located at a site distal to the RDN1 locus; unable to support cell viability when provided as sole source of 5S rRNA; identical in sequence to variant alleles RDN5-2, RDN5-3, and RDN5-4 +S000036834 noncoding_exon RDN5-5 12 485697 485815 W 2011-02-03 2004-03-04 +S000028566 ORF Uncharacterized YLR159C-A chromosome 12 12 485842 485711 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; partially overlaps RND5-5; YLR159C-A has a paralog, YLR156C-A, that arose from a segmental duplication +S000031272 CDS YLR159C-A 12 485842 485711 C 2011-02-03 2003-07-29 +S000004150 ORF Verified YLR160C ASP3-4 asparaginase ASP3-4|ASP3 chromosome 12 12 487289 486201 C 2011-02-03 1996-07-31 Cell-wall L-asparaginase II involved in asparagine catabolism; expression induced during nitrogen starvation; ORF contains a short non-coding RNA that enhances expression of full-length gene; likely arose in via horizontal gene transfer from the wine yeast Wickerhamomyces anomalus or a close relative; reference strain S288C has four copies of ASP3; ASP3-4 has a paralog, ASP3-2, that arose from a segmental duplication +S000031490 CDS YLR160C 12 487289 486201 C 2011-02-03 1996-07-31 +S000004151 ORF Uncharacterized YLR161W chromosome 12 12 488997 489341 W 2011-02-03 1996-07-31 Putative protein of unknown function; YLR156W, YLR159W, and YLR161W are three identical open reading frames in S288C encoded near the ribosomal DNA region of chromosome 12; YLR161W has a paralog, YLR157W-D, that arose from a segmental duplication +S000031592 CDS YLR161W 12 488997 489341 W 2011-02-03 1996-07-31 +S000029711 rRNA_gene RDN5-6 RDN5-6 RDN5 chromosome 12 12 489349 489469 W 2011-02-03 2004-03-04 Variant 5S ribosomal rRNA (5S rRNA) gene; located at a site distal to the RDN1 locus +S000036835 noncoding_exon RDN5-6 12 489349 489469 W 2011-02-03 2004-03-04 +S000004152 ORF Verified YLR162W chromosome 12 12 489573 489929 W 2011-02-03 1996-07-31 Protein of unknown function; overexpression confers resistance to the antimicrobial peptide MiAMP1 and causes growth arrest, apoptosis, and increased sensitivity to cobalt chloride +S000032571 CDS YLR162W 12 489573 489929 W 2011-02-03 1996-07-31 +S000028567 ORF Uncharacterized YLR162W-A RRT15 chromosome 12 12 490406 490594 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology comparisons and RT-PCR; identified in a screen for mutants with decreased levels of rDNA transcription +S000031273 CDS YLR162W-A 12 490406 490594 W 2011-02-03 2003-07-29 +S000028844 ORF Dubious YLR163W-A chromosome 12 12 492812 492925 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034529 CDS YLR163W-A 12 492812 492925 W 2011-02-03 2003-07-29 +S000004153 ORF Verified YLR163C MAS1 MIF1 chromosome 12 L000001026|L000001108 12 493254 491866 C 2011-02-03 1996-07-31 Beta subunit of the mitochondrial processing protease (MPP); essential processing enzyme that cleaves the N-terminal targeting sequences from mitochondrially imported proteins +S000032649 CDS YLR163C 12 493254 491866 C 2011-02-03 1996-07-31 +S000004154 ORF Verified YLR164W SHH4 protein SHH4 chromosome 12 12 493883 494389 W 2011-02-03 1996-07-31 Putative alternate subunit of succinate dehydrogenase (SDH); mitochondrial inner membrane protein; genetic interaction with SDH4 suggests that Shh4p can function as a functional SDH subunit; a fraction copurifies with SDH subunit Sdh3p; expression induced by nitrogen limitation in a GLN3, GAT1-dependent manner; Shh4p has greater similarity to human SDHD (subunit D of SDH, implicated in paraganglioma) than does its paralog Sdh4p +S000032792 CDS YLR164W 12 493883 494389 W 2011-02-03 1996-07-31 +S000004155 ORF Verified YLR165C PUS5 pseudouridine synthase PUS5 chromosome 12 12 495258 494494 C 2011-02-03 1996-07-31 Pseudouridine synthase; catalyzes only the formation of pseudouridine (Psi)-2819 in mitochondrial 21S rRNA; not essential for viability +S000032861 CDS YLR165C 12 495258 494494 C 2011-02-03 1996-07-31 +S000004156 ORF Verified YLR166C SEC10 exocyst subunit SEC10 chromosome 12 L000003428 12 498044 495429 C 2011-02-03 1996-07-31 Essential 100kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion +S000033562 CDS YLR166C 12 498044 495429 C 2011-02-03 1996-07-31 +S000004157 ORF Verified YLR167W RPS31 eS31|ubiquitin-ribosomal 40S subunit protein S31 fusion protein|S31e|UB13|YS24|S37|S31|UBI3|RPS37 chromosome 12 L000001768|L000002413 12 498947 499405 W 2011-02-03 1996-07-31 Fusion protein cleaved to yield ribosomal protein S31 and ubiquitin; ubiquitin may facilitate assembly of the ribosomal protein into ribosomes; interacts genetically with translation factor eIF2B; homologous to mammalian ribosomal protein S27A, no bacterial homolog +S000033714 CDS YLR167W 12 498947 499405 W 2011-02-03 1996-07-31 +S000004158 ORF Verified YLR168C UPS2 GEP1|AIM30|MSF1|MSF1' chromosome 12 12 500270 499578 C 2011-02-03 1996-07-31 Mitochondrial intermembrane space protein; involved in phospholipid metabolism; forms complex with Mdm35p that transfers phosphatidylserine from outer membrane to inner membrane for phosphatidylethanolamine synthesis; null mutant has defects in mitochondrial morphology; similar to Ups1p, Ups3p and to human PRELI; UPS2 has a paralog, UPS3, that arose from the whole genome duplication +S000033771 CDS YLR168C 12 500270 499578 C 2011-02-03 1996-07-31 +S000004159 ORF Dubious YLR169W chromosome 12 12 500335 500688 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034750 CDS YLR169W 12 500335 500688 W 2011-02-03 1996-07-31 +S000004161 ORF Dubious YLR171W chromosome 12 12 500733 501122 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035908 CDS YLR171W 12 500733 501122 W 2011-02-03 1996-07-31 +S000004160 ORF Verified YLR170C APS1 YAP19 chromosome 12 L000002493 12 501049 500579 C 2011-02-03 1996-07-31 Small subunit of the clathrin-associated adaptor complex AP-1; AP-1 is involved in protein sorting at the trans-Golgi network; homolog of the sigma subunit of the mammalian clathrin AP-1 complex +S000035745 CDS YLR170C 12 501049 500579 C 2011-02-03 1996-07-31 +S000004162 ORF Verified YLR172C DPH5 diphthine synthase chromosome 12 L000000523 12 502162 501260 C 2011-02-03 1996-07-31 Methyltransferase required for synthesis of diphthamide; diphthamide is a modified histidine residue of translation elongation factor 2 (Eft1p or Eft2p); not essential for viability; GFP-Dph5p fusion protein localizes to the cytoplasm +S000035977 CDS YLR172C 12 502162 501260 C 2011-02-03 1996-07-31 +S000004163 ORF Uncharacterized YLR173W chromosome 12 12 502421 504247 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000036883 CDS YLR173W 12 502421 504247 W 2011-02-03 1996-07-31 +S000004164 ORF Verified YLR174W IDP2 isocitrate dehydrogenase (NADP(+)) IDP2 chromosome 12 L000002737 12 504591 505829 W 2011-02-03 1996-07-31 Cytosolic NADP-specific isocitrate dehydrogenase; catalyzes oxidation of isocitrate to alpha-ketoglutarate; levels are elevated during growth on non-fermentable carbon sources and reduced during growth on glucose; IDP2 has a paralog, IDP3, that arose from the whole genome duplication +S000036934 CDS YLR174W 12 504591 505829 W 2011-02-03 1996-07-31 +S000004165 ORF Verified YLR175W CBF5 pseudouridine synthase CBF5 chromosome 12 L000000223 12 506134 507585 W 2011-02-03 1996-07-31 Pseudouridine synthase catalytic subunit of box H/ACA snoRNPs; acts on large and small rRNAs, on snRNA U2, and on some mRNAs; mutations in human ortholog dyskerin cause the disorder dyskeratosis congenita; small nucleolar ribonucleoprotein particles are also known as snoRNPs +S000037702 CDS YLR175W 12 506134 507585 W 2011-02-03 1996-07-31 +S000004166 ORF Verified YLR176C RFX1 CRT1 chromosome 12 L000004129 12 510232 507797 C 2011-02-03 1996-07-31 Major transcriptional repressor of DNA-damage-regulated genes; recruits repressors Tup1p and Cyc8p to their promoters; involved in DNA damage and replication checkpoint pathway; similar to a family of mammalian DNA binding RFX1-4 proteins +S000037720 CDS YLR176C 12 510232 507797 C 2011-02-03 1996-07-31 +S000004167 ORF Uncharacterized YLR177W chromosome 12 12 511054 512940 W 2011-02-03 1996-07-31 Putative protein of unknown function; phosphorylated by Dbf2p-Mob1p in vitro; some strains contain microsatellite polymophisms at this locus; not an essential gene; YLR177W has a paralog, PSP1, that arose from the whole genome duplication +S000037859 CDS YLR177W 12 511054 512940 W 2011-02-03 1996-07-31 +S000118476 ARS ARS1217 ARSXII-513 chromosome 12 12 512867 513115 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178138 ARS_consensus_sequence ARS1217 12 513086 513070 C 2014-11-18 2014-11-18 +S000004168 ORF Verified YLR178C TFS1 DKA1 chromosome 12 L000002291 12 513821 513162 C 124 2011-02-03 1996-07-31 Inhibitor of carboxypeptidase Y (Prc1p), and Ras GAP (Ira2p); phosphatidylethanolamine-binding protein (PEBP) family member and ortholog of hPEBP1/RKIP, a natural metastasis suppressor; targets to vacuolar membranes during stationary phase; acetylated by NatB N-terminal acetyltransferase; protein abundance increases in response to DNA replication stress +S000037879 CDS YLR178C 12 513821 513162 C 2011-02-03 1996-07-31 +S000004169 ORF Verified YLR179C chromosome 12 12 514713 514108 C 2011-02-03 1996-07-31 Protein of unknown function with similarity to Tfs1p; transcription is activated by paralogous proteins Yrm1p and Yrr1p along with proteins involved in multidrug resistance; GFP-tagged protein localizes to the cytoplasm and nucleus +S000030817 CDS YLR179C 12 514713 514108 C 2011-02-03 1996-07-31 +S000004170 ORF Verified YLR180W SAM1 methionine adenosyltransferase SAM1|ETH10 chromosome 12 L000001798 12 515262 516410 W 2011-02-03 1996-07-31 S-adenosylmethionine synthetase; catalyzes transfer of the adenosyl group of ATP to the sulfur atom of methionine; SAM1 has a paralog, SAM2, that arose from the whole genome duplication +S000031889 CDS YLR180W 12 515262 516410 W 2011-02-03 1996-07-31 +S000004171 ORF Verified YLR181C VTA1 chromosome 12 12 517670 516678 C 2011-02-03 1996-07-31 Multivesicular body (MVB) protein; involved in endosomal protein sorting; regulates Vps4p activity by promoting its oligomerization; has an N-terminal Vps60- and Did2- binding domain, a linker region, and a C-terminal Vps4p binding domain +S000031945 CDS YLR181C 12 517670 516678 C 2011-02-03 1996-07-31 +S000004172 ORF Verified YLR182W SWI6 transcriptional regulator SWI6|SDS11|PSL8 chromosome 12 L000002254 12 517940 520351 W 2011-02-03 1996-07-31 Transcription cofactor; forms complexes with Swi4p and Mbp1p to regulate transcription at the G1/S transition; involved in meiotic gene expression; also binds Stb1p to regulate transcription at START; cell wall stress induces phosphorylation by Mpk1p, which regulates Swi6p localization; required for the unfolded protein response, independently of its known transcriptional coactivators +S000032961 CDS YLR182W 12 517940 520351 W 2011-02-03 1996-07-31 +S000004173 ORF Verified YLR183C TOS4 chromosome 12 12 522012 520543 C 2011-02-03 1996-07-31 Putative transcription factor, contains Forkhead Associated domain; binds chromatin; involved in expression homeostasis, buffering of mRNA synthesis rate against gene dosage changes during S phase; target of SBF transcription factor; expression is periodic and peaks in G1; involved in DNA replication checkpoint response; interacts with Rpd3 and Set3 histone deacetylase complexes; APCC(Cdh1) substrate; relative distribution to nucleus increases upon DNA replication stress +S000032995 CDS YLR183C 12 522012 520543 C 2011-02-03 1996-07-31 +S000004174 ORF Dubious YLR184W chromosome 12 12 522106 522453 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033139 CDS YLR184W 12 522106 522453 W 2011-02-03 1996-07-31 +S000004175 ORF Verified YLR185W RPL37A eL37|ribosomal 60S subunit protein L37A|L37e|YL35|L43|L37A chromosome 12 L000002884 12 522663 523288 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L37A; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; homologous to mammalian ribosomal protein L37, no bacterial homolog; RPL37A has a paralog, RPL37B, that arose from the whole genome duplication +S000033905 CDS YLR185W 12 522663 522669 W 2011-02-03 1996-07-31 +S000033906 CDS YLR185W 12 523029 523288 W 2011-02-03 1996-07-31 +S000033907 intron YLR185W 12 522670 523028 W 2011-02-03 1996-07-31 +S000004176 ORF Verified YLR186W EMG1 18S rRNA pseudouridine methyltransferase|NEP1 chromosome 12 12 523632 524390 W 2011-02-03 1996-07-31 Methyltransferase for rRNA; methylates pseudouridine 18S rRNA residue 1191; member of the SPOUT methyltransferase family; required for maturation of 18S rRNA and for 40S ribosomal subunit production independent of methyltransferase activity; forms homodimers; human ortholog is mutated in Bowen-Conradi syndrome, and equivalent yeast mutation affects Emg1p dimerization and localization but not methyltransferase activity; human EMG1 complements lethality of null and ts mutant +S000034031 CDS YLR186W 12 523632 524390 W 2011-02-03 1996-07-31 +S000004177 ORF Verified YLR187W SKG3 chromosome 12 12 524865 527945 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery, cytoplasm, bud, and bud neck; potential Cdc28p substrate; similar to Skg4p; relocalizes from bud neck to cytoplasm upon DNA replication stress; SKG3 has a paralog, CAF120, that arose from the whole genome duplication +S000034134 CDS YLR187W 12 524865 527945 W 2011-02-03 1996-07-31 +S000004178 ORF Verified YLR188W MDL1 ATP-binding cassette permease MDL1 chromosome 12 L000001049 12 528300 530387 W 2011-02-03 1996-07-31 Mitochondrial inner membrane half-type ABC transporter; mediates export of peptides generated upon proteolysis of mitochondrial proteins; plays a role in the regulation of cellular resistance to oxidative stress +S000034239 CDS YLR188W 12 528300 530387 W 2011-02-03 1996-07-31 +S000004179 ORF Verified YLR189C ATG26 UGT51 chromosome 12 L000004808 12 534393 530797 C 2011-02-03 1996-07-31 UDP-glucose:sterol glucosyltransferase; conserved enzyme involved in synthesis of sterol glucoside membrane lipids; in contrast to ATG26 from P. pastoris, S. cerevisiae ATG26 is not involved in autophagy +S000035108 CDS YLR189C 12 534393 530797 C 2011-02-03 1996-07-31 +S000004180 ORF Verified YLR190W MMR1 chromosome 12 12 535214 536689 W 2011-02-03 1996-07-31 Phosphorylated protein of the mitochondrial outer membrane; localizes only to mitochondria of the bud; interacts with Myo2p to mediate mitochondrial distribution to buds; mRNA is targeted to the bud via the transport system involving She2p +S000036058 CDS YLR190W 12 535214 536689 W 2011-02-03 1996-07-31 +S000004181 ORF Verified YLR191W PEX13 peroxin PEX13|PAS20 chromosome 12 L000003024 12 537272 538432 W 2011-02-03 1996-07-31 Peroxisomal importomer complex component; integral peroxisomal membrane protein required for docking and translocation of peroxisomal matrix proteins; interacts with the PTS1 signal recognition factor Pex5p and the PTS2 signal recognition factor Pex7p; forms a complex with Pex14p and Pex17p; human homolog PEX13 complements yeast null mutant +S000036199 CDS YLR191W 12 537272 538432 W 2011-02-03 1996-07-31 +S000004182 ORF Verified YLR192C HCR1 translation initiation factor eIF3 core subunit j chromosome 12 S000007439 12 539589 538792 C 2011-02-03 1996-07-31 eIF3j component of translation initiation factor 3 (eIF3); dual function protein involved in translation initiation as a substoichiometric component (eIF3j) of eIF3; required for 20S pre-rRNA processing; required at post-transcriptional step for efficient retrotransposition; absence decreases Ty1 Gag:GFP protein levels; binds eIF3 subunits Rpg1p, Prt1p and 18S rRNA; eIF3 also involved in programmed stop codon read through; human homolog EIF3J can complement yeast hcr1 mutant +S000036241 CDS YLR192C 12 539589 538792 C 2011-02-03 1996-07-31 +S000004183 ORF Verified YLR193C UPS1 chromosome 12 12 540536 540009 C 2011-02-03 1996-07-31 Phosphatidic acid transfer protein; plays a role in phospholipid metabolism by transporting phosphatidic acid from the outer to the inner mitochondrial membrane; localizes to the mitochondrial intermembrane space; null mutant has altered cardiolipin and phosphatidic acid levels; ortholog of human PRELI +S000031730 CDS YLR193C 12 540536 540009 C 2011-02-03 1996-07-31 +S000004184 ORF Verified YLR194C NCW2 chromosome 12 12 541573 540809 C 2011-02-03 1996-07-31 Structural constituent of the cell wall; attached to the plasma membrane by a GPI-anchor; expression is upregulated in response to cell wall stress; null mutant is sensitive to the antifungal agent polyhexamethylene biguanide, resistant to zymolyase treatment and has increased chitin deposition +S000031877 CDS YLR194C 12 541573 540809 C 2011-02-03 1996-07-31 +S000004185 ORF Verified YLR195C NMT1 glycylpeptide N-tetradecanoyltransferase NMT1|CDC72 chromosome 12 L000001259 12 543304 541937 C 142 2011-02-03 1996-07-31 N-myristoyl transferase; catalyzes the cotranslational, covalent attachment of myristic acid to the N-terminal glycine residue of several proteins involved in cellular growth and signal transduction +S000031996 CDS YLR195C 12 543304 541937 C 2011-02-03 1996-07-31 +S000004186 ORF Verified YLR196W PWP1 rRNA-processing protein PWP1 chromosome 12 L000001539 12 543968 545698 W 2011-02-03 1996-07-31 Protein with WD-40 repeats involved in rRNA processing; associates with trans-acting ribosome biogenesis factors; similar to beta-transducin superfamily +S000037527 CDS YLR196W 12 543968 545698 W 2011-02-03 1996-07-31 +S000004187 ORF Verified YLR197W NOP56 snoRNP complex protein NOP56|SIK1 chromosome 12 L000002982 12 546097 547611 W 2011-02-03 1996-07-31 Essential evolutionarily-conserved nucleolar protein; component of the box C/D snoRNP complexes that direct 2'-O-methylation of pre-rRNA during its maturation; overexpression causes spindle orientation defects +S000037605 CDS YLR197W 12 546097 547611 W 2011-02-03 1996-07-31 +S000004188 ORF Dubious YLR198C chromosome 12 12 547645 547286 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SIK1/YLR197W +S000037636 CDS YLR198C 12 547645 547286 C 2011-02-03 1996-07-31 +S000004189 ORF Verified YLR199C PBA1 POC1 chromosome 12 12 548769 547853 C 2011-02-03 2003-09-27|1996-07-31 Protein involved in 20S proteasome assembly; forms a heterodimer with Add66p that binds to proteasome precursors; interaction with Pba1p-Add66p may affect function of the mature proteasome and its role in maintaining respiratory metabolism; similar to human PAC1 constituent of the PAC1-PAC2 complex involved in proteasome assembly +S000030462 CDS YLR199C 12 548677 547853 C 2011-02-03 2003-09-27|1996-07-31 +S000030461 CDS YLR199C 12 548769 548764 C 2011-02-03 2003-09-27 +S000030463 intron YLR199C 12 548763 548678 C 2011-02-03 2003-09-27 +S000004190 ORF Verified YLR200W YKE2 tubulin-binding prefolding complex subunit YKE2|PFD6|GIM1 chromosome 12 L000002791 12 549012 549356 W 2011-02-03 1996-07-31 Subunit of the heterohexameric Gim/prefoldin protein complex; involved in the folding of alpha-tubulin, beta-tubulin, and actin; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation +S000036300 CDS YLR200W 12 549012 549356 W 2011-02-03 1996-07-31 +S000004191 ORF Verified YLR201C COQ9 ubiquinone biosynthesis protein COQ9|FMP53 chromosome 12 12 550293 549511 C 2011-02-03 1996-07-31 Protein required for ubiquinone biosynthesis and respiratory growth; localizes to matrix face of mitochondrial inner membrane in a large complex with ubiquinone biosynthetic enzymes; ubiquinone is also known as coenzyme Q; human homolog COQ9 can complement yeast coq9 null mutant +S000036362 CDS YLR201C 12 550293 549511 C 2011-02-03 1996-07-31 +S000004192 ORF Dubious YLR202C chromosome 12 12 550636 550194 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YLR201C; ORF contains a putative intron +S000037015 CDS YLR202C 12 550458 550194 C 2011-02-03 1996-07-31 +S000037014 CDS YLR202C 12 550636 550575 C 2011-02-03 1996-07-31 +S000037016 intron YLR202C 12 550574 550459 C 2011-02-03 1996-07-31 +S000004193 ORF Verified YLR203C MSS51 chromosome 12 L000001205 12 551960 550650 C 149 2011-02-03 1996-07-31 Specific translational activator for the mitochondrial COX1 mRNA; loosely associated with the matrix face of the mitochondrial inner membrane; localizes to vacuole membrane in response to H2O2; influences both COX1 mRNA translation and Cox1p assembly into cytochrome c oxidase; binds to heme B, which may be a mechanism for sensing oxygen levels in order to regulate cytochrome c oxidase biogenesis +S000037086 CDS YLR203C 12 551960 550650 C 2011-02-03 1996-07-31 +S000004194 ORF Verified YLR204W QRI5 COX24 chromosome 12 L000001551 12 552270 552605 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; required for accumulation of spliced COX1 mRNA; may have an additional role in translation of COX1 mRNA +S000037241 CDS YLR204W 12 552270 552605 W 2011-02-03 1996-07-31 +S000004195 ORF Verified YLR205C HMX1 chromosome 12 12 553677 552724 C 2011-02-03 2004-02-05|1996-07-31 ER localized heme oxygenase; involved in heme degradation during iron starvation and in the oxidative stress response; expression is regulated by AFT1 and oxidative stress; relocates to the perinuclear region in the presence of oxidants +S000037310 CDS YLR205C 12 553677 552724 C 2011-02-03 2004-02-05|1996-07-31 +S000004196 ORF Verified YLR206W ENT2 epsin chromosome 12 12 554578 556419 W 2011-02-03 1996-07-31 Epsin-like protein required for endocytosis and actin patch assembly; functionally redundant with Ent1p; contains clathrin-binding motif at C-terminus; ENT2 has a paralog, ENT1, that arose from the whole genome duplication +S000030027 CDS YLR206W 12 554578 556419 W 2011-02-03 1996-07-31 +S000004197 ORF Verified YLR207W HRD3 ubiquitin ligase complex subunit HRD3 chromosome 12 L000003040 12 556788 559289 W 2011-02-03 1996-07-31 ER membrane protein that plays a central role in ERAD; forms HRD complex with Hrd1p and ER-associated protein degradation (ERAD) determinants that engages in lumen to cytosol communication and coordination of ERAD events +S000030185 CDS YLR207W 12 556788 559289 W 2011-02-03 1996-07-31 +S000004198 ORF Verified YLR208W SEC13 GTPase-activating protein SEC13|ANU3 chromosome 12 L000001838 12 559551 560444 W 2011-02-03 1996-07-31 Structural component of 3 complexes; subunit of the Nup84p nuclear pore subcomplex that contributes to nucleocytoplasmic transport and NPC biogenesis; subunit of the COPII vesicle coat required for ER-to-Golgi transport; subunit of SEACAT, a subcomplex of the coatomer-related, vacuolar-associated SEA complex, that inhibits the TORC1 inhibitory role of SEACIT (Iml1p-Npr2p-Npr3p), a GAP for Gtr1p, thereby resulting in activation of TORC1 signaling; human SEC13 homolog +S000031129 CDS YLR208W 12 559551 560444 W 2011-02-03 1996-07-31 +S000004199 ORF Verified YLR209C PNP1 purine-nucleoside phosphorylase chromosome 12 12 561732 560797 C 2011-02-03 1996-07-31 Purine nucleoside phosphorylase; specifically metabolizes inosine and guanosine nucleosides; involved in the nicotinamide riboside salvage pathway +S000031185 CDS YLR209C 12 561732 560797 C 2011-02-03 1996-07-31 +S000004200 ORF Verified YLR210W CLB4 B-type cyclin CLB4 chromosome 12 L000000352 12 562008 563390 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the G2/M transition; may be involved in DNA replication and spindle assembly; accumulates during S phase and G2, then targeted for ubiquitin-mediated degradation; CLB4 has a paralog, CLB3, that arose from the whole genome duplication +S000032220 CDS YLR210W 12 562008 563390 W 2011-02-03 1996-07-31 +S000004201 ORF Verified YLR211C ATG38 chromosome 12 12 564531 563792 C 2011-02-03 2000-07-14|1996-07-31 Homodimeric subunit of autophagy-specific PtdIns-3-kinase complex I; required for the integrity of the active PtdIns-3-kinase complex I by maintaining an association between Vps15p-Vps34p and Atg14p-Vps30p subcomplexes; localizes to the pre-autophagosomal structure (PAS) in an Atg14p-dependent manner; ATG38 is non-essential but is required for macroautophagy +S000032247 CDS YLR211C 12 564454 563792 C 2011-02-03 2000-07-14|1996-07-31 +S000032246 CDS YLR211C 12 564531 564514 C 2011-02-03 2000-07-14 +S000032248 intron YLR211C 12 564513 564455 C 2011-02-03 2000-07-14 +S000004202 ORF Verified YLR212C TUB4 gamma-tubulin chromosome 12 L000002751 12 566281 564860 C 2011-02-03 1996-07-31 Gamma-tubulin; involved in nucleating microtubules from both the cytoplasmic and nuclear faces of the spindle pole body; protein abundance increases in response to DNA replication stress +S000032353 CDS YLR212C 12 566281 564860 C 2011-02-03 1996-07-31 +S000004203 ORF Verified YLR213C CRR1 putative glycosylase chromosome 12 S000007422 12 567922 566654 C 2011-02-03 1996-07-31 Putative glycoside hydrolase of the spore wall envelope; required for normal spore wall assembly, possibly for cross-linking between the glucan and chitosan layers; expressed during sporulation +S000033218 CDS YLR213C 12 567922 566654 C 2011-02-03 1996-07-31 +S000004204 ORF Verified YLR214W FRE1 ferric/cupric-chelate reductase chromosome 12 L000000626 12 568567 570627 W 2011-02-03 1996-07-31 Ferric reductase and cupric reductase; reduces siderophore-bound iron and oxidized copper prior to uptake by transporters; expression induced by low copper and iron levels +S000033306 CDS YLR214W 12 568567 570627 W 2011-02-03 1996-07-31 +S000004205 ORF Verified YLR215C CDC123 cell proliferation protein CDC123 chromosome 12 12 571858 570776 C 2011-02-03 1996-07-31 Assembly factor for the eIF2 translation initiation factor complex; regulates translational initiation; conserved residues of this ATP-Grasp protein that bind to ATP-Mg2+ in the pombe ortholog are required for complex assembly in budding yeast; interaction with eIF2 subunit Gcd11p facilitates complex assembly and activity; required for the START transition and timely progression through G2; regulated by nutrient availability; human ortholog complements the yeast mutant +S000033348 CDS YLR215C 12 571858 570776 C 2011-02-03 1996-07-31 +S000004207 ORF Dubious YLR217W chromosome 12 12 572909 573232 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CPR6 +S000034392 CDS YLR217W 12 572909 573232 W 2011-02-03 1996-07-31 +S000004206 ORF Verified YLR216C CPR6 peptidylprolyl isomerase CPR6|CYP40 chromosome 12 L000003229 12 573211 572096 C 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; plays a role in determining prion variants; binds to Hsp82p and contributes to chaperone activity; protein abundance increases in response to DNA replication stress +S000033434 CDS YLR216C 12 573211 572096 C 2011-02-03 1996-07-31 +S000004208 ORF Verified YLR218C COA4 CMC3 chromosome 12 12 573918 573466 C 2011-02-03 1996-07-31 Twin Cx(9)C protein involved in cytochrome c oxidase organization; organization includes assembly or stability; localizes to the mitochondrial intermembrane space via the Mia40p-Erv1p system; interacts genetically with CYC1 and with cytochrome c oxidase assembly factors +S000034416 CDS YLR218C 12 573918 573466 C 2011-02-03 1996-07-31 +S000004209 ORF Verified YLR219W MSC3 chromosome 12 12 574151 576337 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery; msc3 mutants are defective in directing meiotic recombination events to homologous chromatids; potential Cdc28p substrate; protein abundance increases in response to DNA replication stress +S000035498 CDS YLR219W 12 574151 576337 W 2011-02-03 1996-07-31 +S000004210 ORF Verified YLR220W CCC1 chromosome 12 L000000234 12 576825 577793 W 2011-02-03 1996-07-31 Vacuolar Fe2+/Mn2+ transporter; suppresses respiratory deficit of yfh1 mutants, which lack the ortholog of mammalian frataxin, by preventing mitochondrial iron accumulation; relative distribution to the vacuole decreases upon DNA replication stress +S000035447 CDS YLR220W 12 576825 577793 W 2011-02-03 1996-07-31 +S000004211 ORF Verified YLR221C RSA3 chromosome 12 12 579024 578362 C 2011-02-03 1996-07-31 Protein with a likely role in ribosomal maturation; required for accumulation of wild-type levels of large (60S) ribosomal subunits; binds to the helicase Dbp6p in pre-60S ribosomal particles in the nucleolus +S000035470 CDS YLR221C 12 579024 578362 C 2011-02-03 1996-07-31 +S000004212 ORF Verified YLR222C UTP13 chromosome 12 12 581771 579318 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA +S000035533 CDS YLR222C 12 581771 579318 C 2011-02-03 1996-07-31 +S000028568 ORF Dubious YLR222C-A chromosome 12 12 582236 582006 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene IFH1 +S000031274 CDS YLR222C-A 12 582236 582006 C 2011-02-03 2003-07-29 +S000004213 ORF Verified YLR223C IFH1 chromosome 12 L000001775 12 585490 582233 C 2011-02-03 1996-07-31 Coactivator, regulates transcription of ribosomal protein (RP) genes; recruited to RP gene promoters during optimal growth conditions via Fhl1p; subunit of CURI, a complex that coordinates RP production and pre-rRNA processing; regulated by acetylation and phosphorylation at different growth states via TORC1 signaling; IFH1 has a paralog, CRF1, that arose from the whole genome duplication +S000036449 CDS YLR223C 12 585490 582233 C 2011-02-03 1996-07-31 +S000004214 ORF Verified YLR224W UCC1 chromosome 12 12 586464 587573 W 2011-02-03 1996-07-31 F-box protein and component of SCF ubiquitin ligase complexes; involved in ubiquitin-dependent protein catabolism; readily monoubiquitinated in vitro by SCF-Ubc4 complexes; SCF-Ucc1 regulates level of Cit2 citrate synthase protein to maintain citrate homeostasis, acts as metabolic switch for glyoxylate cycle; UCC1 transcription is downregulated in cells grown on C2-compounds +S000036572 CDS YLR224W 12 586464 587573 W 2011-02-03 1996-07-31 +S000004215 ORF Uncharacterized YLR225C chromosome 12 12 588918 587695 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; not an essential gene; YLR225C has a paralog, YDR222W, that arose from the whole genome duplication +S000036615 CDS YLR225C 12 588918 587695 C 2011-02-03 1996-07-31 +S000004216 ORF Verified YLR226W BUR2 CST4 chromosome 12 L000002994|L000000205 12 589354 590541 W 2011-02-03 1996-07-31 Cyclin for the Sgv1p (Bur1p) protein kinase; Sgv1p and Bur2p comprise the CDK-cyclin BUR kinase complex which is involved in transcriptional regulation through its phosphorylation of the carboxy-terminal domain (CTD) of the largest subunit of RNA polymerase II (Rpo21p); BUR kinase is also involved in the recruitment of Spt6p to the CTD at the onset of transcription +S000037389 CDS YLR226W 12 589354 590541 W 2011-02-03 1996-07-31 +S000004217 ORF Verified YLR227C ADY4 chromosome 12 S000007652 12 592043 590562 C 2011-02-03 1996-07-31 Structural component of the meiotic outer plaque; outer plaque is a membrane-organizing center that assembles on the cytoplasmic face of the spindle pole body during meiosis II and triggers the formation of the prospore membrane +S000037438 CDS YLR227C 12 592043 590562 C 2011-02-03 1996-07-31 +S000006655 tRNA_gene tL(UAG)L1 chromosome 12 L000003662 12 592619 592519 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000035002 intron tL(UAG)L1 12 592581 592563 C 2011-02-03 2000-05-19 +S000035001 noncoding_exon tL(UAG)L1 12 592562 592519 C 2011-02-03 2000-05-19 +S000035000 noncoding_exon tL(UAG)L1 12 592619 592582 C 2011-02-03 2000-05-19 +S000007070 long_terminal_repeat YLRCdelta9 chromosome 12 12 593035 592706 C 2011-02-03 2000-05-19 Ty1 LTR +S000007085 long_terminal_repeat YLRWdelta10 chromosome 12 12 593145 593478 W 2011-02-03 2000-05-19 Ty1 LTR +S000007098 LTR_retrotransposon YLRWTy1-2 Ty1 chromosome 12 12 593145 599062 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007375 transposable_element_gene YLR227W-A gag protein chromosome 12 12 593438 594760 W 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035724 CDS YLR227W-A 12 593438 594760 W 2011-02-03 1996-07-31 +S000007376 transposable_element_gene YLR227W-B gag-pol fusion protein chromosome 12 12 593438 598706 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000035730 CDS YLR227W-B 12 593438 594742 W 2011-02-03 1999-07-17 +S000035731 CDS YLR227W-B 12 594744 598706 W 2011-02-03 1999-07-17 +S000035732 plus_1_translational_frameshift YLR227W-B 12 594743 594743 W 2011-02-03 1999-07-17 +S000007086 long_terminal_repeat YLRWdelta11 chromosome 12 12 598729 599062 W 2011-02-03 2000-05-19 Ty1 LTR +S000007087 long_terminal_repeat YLRWdelta12 chromosome 12 12 599268 599544 W 2011-02-03 2000-05-19 Ty1 LTR +S000007080 long_terminal_repeat YLRCtau1 chromosome 12 12 599844 599570 C 2011-02-03 2000-05-19 Ty4 LTR +S000004218 ORF Verified YLR228C ECM22 chromosome 12 L000004375 12 602463 600019 C 2011-02-03 1996-07-31 Sterol regulatory element binding protein; regulates transcription of sterol biosynthetic genes upon sterol depletion, after relocating from intracellular membranes to perinuclear foci; redundant activator of filamentation with UPC2, up-regulating the expression of genes involved in filamentous growth; contains Zn[2]-Cys[6] binuclear cluster; ECM22 has a paralog, UPC2, that arose from the whole genome duplication +S000037567 CDS YLR228C 12 602463 600019 C 2011-02-03 1996-07-31 +S000118477 ARS ARS1218 ARSXII-603 chromosome 12 12 603024 603132 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178139 ARS_consensus_sequence ARS1218 12 603110 603094 C 2014-11-18 2014-11-18 +S000004220 ORF Dubious YLR230W chromosome 12 12 604574 604879 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 5' end of essential CDC42/YLR229C gene which encodes a small Rho-like GTPase essential for establishment and maintenance of cell polarity +S000030492 CDS YLR230W 12 604574 604879 W 2011-02-03 1996-07-31 +S000004219 ORF Verified YLR229C CDC42 Rho family GTPase CDC42 chromosome 12 L000000276 12 604787 604212 C 165 2011-02-03 1996-07-31 Small rho-like GTPase; essential for establishment and maintenance of cell polarity; plays a role late in cell fusion via activation of key cell fusion regulator Fus2p; mutants have defects in the organization of actin and septins; human homolog CDC42 can complement yeast cdc42 mutant +S000030359 CDS YLR229C 12 604787 604212 C 2011-02-03 1996-07-31 +S000006614 tRNA_gene tI(UAU)L chromosome 12 L000003661 12 605432 605300 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000035162 intron tI(UAU)L 12 605395 605336 C 2011-02-03 2000-05-19 +S000035161 noncoding_exon tI(UAU)L 12 605335 605300 C 2011-02-03 2000-05-19 +S000035160 noncoding_exon tI(UAU)L 12 605432 605396 C 2011-02-03 2000-05-19 +S000004222 ORF Dubious YLR232W chromosome 12 12 606830 607177 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene BNA5 +S000031460 CDS YLR232W 12 606830 607177 W 2011-02-03 1996-07-31 +S000004221 ORF Verified YLR231C BNA5 kynureninase chromosome 12 12 607119 605758 C 2011-02-03 1996-07-31 Kynureninase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p +S000031316 CDS YLR231C 12 607119 605758 C 2011-02-03 1996-07-31 +S000004223 ORF Verified YLR233C EST1 chromosome 12 L000000588 12 609524 607425 C 2011-02-03 1996-07-31 TLC1 RNA-associated factor involved in telomere length regulation; recruitment subunit of telomerase; has G-quadruplex promoting activity required for telomere elongation; role in activating telomere-bound Est2p-TLC1-RNA; EST1 has a paralog, EBS1, that arose from the whole genome duplication +S000031492 CDS YLR233C 12 609524 607425 C 2011-02-03 1996-07-31 +S000004224 ORF Verified YLR234W TOP3 DNA topoisomerase 3|EDR1 chromosome 12 L000002321 12 609783 611753 W 163 2011-02-03 1996-07-31 DNA Topoisomerase III; conserved protein that functions in a complex with Sgs1p and Rmi1p to relax single-stranded negatively-supercoiled DNA preferentially; DNA catenation/decatenation activity is stimulated by RPA and Sgs1p-Top3p-Rmi1p; involved in telomere stability and regulation of mitotic recombination +S000031598 CDS YLR234W 12 609783 611753 W 2011-02-03 1996-07-31 +S000004225 ORF Dubious YLR235C chromosome 12 12 611930 611532 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORFs TOP3/YLR234W and YLR236C +S000031634 CDS YLR235C 12 611930 611532 C 2011-02-03 1996-07-31 +S000004226 ORF Dubious YLR236C chromosome 12 12 612117 611794 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YLR235C +S000032651 CDS YLR236C 12 612117 611794 C 2011-02-03 1996-07-31 +S000004227 ORF Verified YLR237W THI7 thiamine transporter THI7|THI10 chromosome 12 L000003514 12 612367 614163 W 2011-02-03 1996-07-31 Plasma membrane transporter responsible for the uptake of thiamine; contributes to uptake of 5-aminoimidazole-4-carboxamide-1-beta-D-ribofuranoside (acadesine); member of the major facilitator superfamily of transporters; mutation of human ortholog causes thiamine-responsive megaloblastic anemia +S000032815 CDS YLR237W 12 612367 614163 W 2011-02-03 1996-07-31 +S000004228 ORF Verified YLR238W FAR10 chromosome 12 12 614755 616191 W 2011-02-03 1996-07-31 Protein involved in recovery from arrest in response to pheromone; acts in a cell cycle arrest recovery pathway independent from Far1p; interacts with Far3p, Far7p, Far8p, Far9p, and Far11p; potential Cdc28p substrate; FAR10 has a paralog, VPS64, that arose from the whole genome duplication +S000033527 CDS YLR238W 12 614755 616191 W 2011-02-03 1996-07-31 +S000004229 ORF Verified YLR239C LIP2 lipoyl(octanoyl) transferase LIP2 chromosome 12 12 617318 616332 C 2011-02-03 1996-07-31 Lipoyl ligase; involved in the modification of mitochondrial enzymes by the attachment of lipoic acid groups +S000033564 CDS YLR239C 12 617318 616332 C 2011-02-03 1996-07-31 +S000004230 ORF Verified YLR240W VPS34 phosphatidylinositol 3-kinase VPS34|VPS7|STT8|VPT29|VPL7|PEP15|END12 chromosome 12 L000002476 12 617533 620160 W 2011-02-03 1996-07-31 Phosphatidylinositol (PI) 3-kinase that synthesizes PI-3-phosphate; forms membrane-associated signal transduction complex with Vps15p to regulate protein sorting; activated by the GTP-bound form of Gpa1p; a fraction is localized, with Vps15p, to nuclear pores at nucleus-vacuole junctions and may facilitate transcription elongation for genes positioned at the nuclear periphery +S000034710 CDS YLR240W 12 617533 620160 W 2011-02-03 1996-07-31 +S000004231 ORF Verified YLR241W CSC1 chromosome 12 12 620473 622821 W 2011-02-03 1996-07-31 Calcium permeable gated cation channel; may be involved in detoxification; similar to Arabidopsis CSC1 +S000035645 CDS YLR241W 12 620473 622821 W 2011-02-03 1996-07-31 +S000130183 ARS ARS1219 chromosome 12 12 623198 623861 2011-02-03 2009-05-08 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000004232 ORF Verified YLR242C ARV1 sterol homeostasis protein ARV1 chromosome 12 L000003505 12 623883 622918 C 2011-02-03 1996-07-31 Cortical ER protein; implicated in the membrane insertion of tail-anchored C-terminal single transmembrane domain proteins; may function in transport of glycosylphosphatidylinositol intermediates into the ER lumen; required for normal intracellular sterol distribution; human ARV1, required for normal cholesterol and bile acid homeostasis, can complement yeast arv1 null mutant; human variant causing early onset epileptic encephalopathy is unable to rescue the yeast null +S000035677 CDS YLR242C 12 623883 622918 C 2011-02-03 1996-07-31 +S000004233 ORF Verified YLR243W GPN3 putative signal sequence-binding GTPase GPN3 chromosome 12 12 624203 625021 W 2011-02-03 1996-07-31 Putative GTPase with a role in biogenesis of RNA pol II and polIII; may be involved in assembly of RNA polymerases II and III and in their transport into the nucleus; may have a role in sister chromatid cohesion; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; contains a Gly-Pro-Asn motif in the G domain; similar to Npa3p and Gpn2p +S000035796 CDS YLR243W 12 624203 625021 W 2011-02-03 1996-07-31 +S000004234 ORF Verified YLR244C MAP1 methionine aminopeptidase MAP1 chromosome 12 L000001025 12 626331 625168 C 2011-02-03 1996-07-31 Methionine aminopeptidase; catalyzes the cotranslational removal of N-terminal methionine from nascent polypeptides; function is partially redundant with that of Map2p +S000035829 CDS YLR244C 12 626331 625168 C 2011-02-03 1996-07-31 +S000004235 ORF Verified YLR245C CDD1 cytidine deaminase chromosome 12 L000004644 12 626930 626502 C 2011-02-03 1996-07-31 Cytidine deaminase; catalyzes the modification of cytidine to uridine in vitro but native RNA substrates have not been identified, localizes to both the nucleus and cytoplasm +S000035981 CDS YLR245C 12 626930 626502 C 2011-02-03 1996-07-31 +S000004236 ORF Verified YLR246W ERF2 palmitoyltransferase ERF2 chromosome 12 12 627118 628197 W 2011-02-03 1996-07-31 Subunit of a palmitoyltransferase; this complex adds a palmitoyl lipid moiety to heterolipidated substrates such as Ras1p and Ras2p through a thioester linkage; mutants partially mislocalize Ras2p to the vacuole; palmitoyltransferase is composed of Erf2p and Shr5p +S000036884 CDS YLR246W 12 627118 628197 W 2011-02-03 1996-07-31 +S000006643 tRNA_gene tL(CAA)L chromosome 12 L000003648 12 628383 628497 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000033796 intron tL(CAA)L 12 628421 628453 W 2011-02-03 2000-05-19 +S000033794 noncoding_exon tL(CAA)L 12 628383 628420 W 2011-02-03 2000-05-19 +S000033795 noncoding_exon tL(CAA)L 12 628454 628497 W 2011-02-03 2000-05-19 +S000004237 ORF Verified YLR247C IRC20 E3 ubiquitin-protein ligase IRC20 chromosome 12 12 633354 628684 C 2011-02-03 1996-07-31 E3 ubiquitin ligase and putative helicase; involved in synthesis-dependent strand annealing-mediated homologous recombination; ensures precise end-joining along with Srs2p in the Yku70p/Yku80p/Lig4p-dependent nonhomologous end joining (NHEJ) pathway; localizes to both the mitochondrion and the nucleus; contains a Snf2/Swi2 family ATPase/helicase and a RING finger domain; interacts with Cdc48p and Smt3p; null mutant displays increased levels of spontaneous Rad52p foci +S000036895 CDS YLR247C 12 633354 628684 C 2011-02-03 1996-07-31 +S000004238 ORF Verified YLR248W RCK2 serine/threonine protein kinase RCK2|CMK3|CLK1 chromosome 12 L000001593 12 634252 636084 W 2011-02-03 1996-07-31 Protein kinase involved in response to oxidative and osmotic stress; identified as suppressor of S. pombe cell cycle checkpoint mutations; similar to CaM (calmodulin) kinases; RCK2 has a paralog, RCK1, that arose from the whole genome duplication +S000037704 CDS YLR248W 12 634252 636084 W 2011-02-03 1996-07-31 +S000004239 ORF Verified YLR249W YEF3 translation elongation factor EF-3|EF-3|eEF3|TEF3 chromosome 12 L000002505 12 636780 639914 W 2011-02-03 1996-07-31 Translation elongation factor 3; contains two ABC cassettes; binds and hydrolyzes ATP; YEF3 has a paralog, HEF3, that arose from the whole genome duplication +S000037766 CDS YLR249W 12 636780 639914 W 2011-02-03 1996-07-31 +S000004240 ORF Verified YLR250W SSP120 chromosome 12 L000002091 12 640317 641021 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000030689 CDS YLR250W 12 640317 641021 W 2011-02-03 1996-07-31 +S000004241 ORF Verified YLR251W SYM1 ethanol metabolism protein chromosome 12 12 641464 642057 W 2011-02-03 1996-07-31 Protein required for ethanol metabolism; induced by heat shock and localized to the inner mitochondrial membrane; homologous to mammalian peroxisomal membrane protein Mpv17; human homolog MPV17 is implicated in hepatocerebral mtDNA depletion syndromes (MDDS), and complements yeast null mutant +S000030794 CDS YLR251W 12 641464 642057 W 2011-02-03 1996-07-31 +S000004242 ORF Dubious YLR252W chromosome 12 12 641957 642262 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SYM1, a mitochondrial protein involved in ethanol metabolism +S000030890 CDS YLR252W 12 641957 642262 W 2011-02-03 1996-07-31 +S000004243 ORF Verified YLR253W MCP2 MRX13 chromosome 12 12 642627 644336 W 2011-02-03 1996-07-31 Mitochondrial protein of unknown function involved in lipid homeostasis; associates with mitochondrial ribosome; integral membrane protein that localizes to the mitochondrial inner membrane; involved in mitochondrial morphology; non-essential gene which interacts genetically with MDM10, and other members of the ERMES complex; transcription is periodic during the metabolic cycle; homologous to human aarF domain containing kinase, ADCK1 +S000031890 CDS YLR253W 12 642627 644336 W 2011-02-03 1996-07-31 +S000004244 ORF Verified YLR254C NDL1 chromosome 12 12 644973 644404 C 2011-02-03 1996-07-31 Homolog of nuclear distribution factor NudE; NUDEL; interacts with Pac1p and regulates dynein targeting to microtubule plus ends +S000031972 CDS YLR254C 12 644973 644404 C 2011-02-03 1996-07-31 +S000004245 ORF Dubious YLR255C chromosome 12 12 645953 645600 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032077 CDS YLR255C 12 645953 645600 C 2011-02-03 1996-07-31 +S000004246 ORF Verified YLR256W HAP1 CYP1 chromosome 12 L000002665 12 646415 650923 W 2011-02-03 1996-07-31 Zinc finger transcription factor; involved in the complex regulation of gene expression in response to levels of heme and oxygen; localizes to the mitochondrion as well as to the nucleus; the S288C sequence differs from other strain backgrounds due to a Ty1 insertion in the carboxy terminus +S000033058 CDS YLR256W 12 646415 650923 W 2011-02-03 1996-07-31 +S000007088 long_terminal_repeat YLRWdelta13 chromosome 12 12 650824 651157 W 2011-02-03 2000-05-19 Ty1 LTR +S000007099 LTR_retrotransposon YLRWTy1-3 Ty1 chromosome 12 12 650824 656743 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007377 transposable_element_gene YLR256W-A gag protein chromosome 12 12 651117 652439 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035661 CDS YLR256W-A 12 651117 652439 W 2011-02-03 1999-07-17 +S000007089 long_terminal_repeat YLRWdelta14 chromosome 12 12 656410 656743 W 2011-02-03 2000-05-19 Ty1 LTR +S000006517 tRNA_gene tA(AGC)L chromosome 12 L000003660 12 657006 656934 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032303 noncoding_exon tA(AGC)L 12 657006 656934 C 2011-02-03 2000-05-19 +S000007096 long_terminal_repeat YLRWsigma3 chromosome 12 12 657022 657365 W 2011-02-03 2000-05-19 Ty3 LTR +S000007090 long_terminal_repeat YLRWdelta15 chromosome 12 12 657449 657767 W 2011-02-03 2000-05-19 Ty1 LTR +S000004247 ORF Verified YLR257W chromosome 12 12 658826 659791 W 2011-02-03 1996-07-31 Protein of unknown function; protein abundance increases in response to DNA replication stress +S000033141 CDS YLR257W 12 658826 659791 W 2011-02-03 1996-07-31 +S000118478 ARS ARS1220 ARSXII-660 chromosome 12 12 659884 659935 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178140 ARS_consensus_sequence ARS1220 12 659892 659908 W 2014-11-18 2014-11-18 +S000004248 ORF Verified YLR258W GSY2 glycogen (starch) synthase GSY2 chromosome 12 L000000740 12 660716 662833 W 2011-02-03 1996-07-31 Glycogen synthase; expression induced by glucose limitation, nitrogen starvation, heat shock, and stationary phase; activity regulated by cAMP-dependent, Snf1p and Pho85p kinases as well as by the Gac1p-Glc7p phosphatase; GSY2 has a paralog, GSY1, that arose from the whole genome duplication; relocalizes from cytoplasm to plasma membrane upon DNA replication stress +S000033909 CDS YLR258W 12 660716 662833 W 2011-02-03 1996-07-31 +S000004249 ORF Verified YLR259C HSP60 chaperone ATPase HSP60|MNA2|MIF4|CPN60 chromosome 12 L000000819 12 665002 663284 C 2011-02-03 1996-07-31 Tetradecameric mitochondrial chaperonin; required for ATP-dependent folding of precursor polypeptides and complex assembly; prevents aggregation and mediates protein refolding after heat shock; role in mtDNA transmission; phosphorylated +S000033960 CDS YLR259C 12 665002 663284 C 2011-02-03 1996-07-31 +S000004250 ORF Verified YLR260W LCB5 sphinganine kinase LCB5 chromosome 12 L000004329 12 665844 667907 W 2011-02-03 1996-07-31 Minor sphingoid long-chain base kinase; possibly involved in synthesis of long-chain base phosphates, which function as signaling molecules; LCB5 has a paralog, LCB4, that arose from the whole genome duplication +S000035015 CDS YLR260W 12 665844 667907 W 2011-02-03 1996-07-31 +S000004251 ORF Uncharacterized YLR261C VPS63 chromosome 12 12 668563 668237 C 2011-02-03 1996-07-31 Putative protein of unknown function; not conserved in closely related Saccharomyces species; 98% of ORF overlaps the verified gene YPT6; deletion causes a vacuolar protein sorting defect; decreased levels of protein in enolase deficient mutant +S000035062 CDS YLR261C 12 668563 668237 C 2011-02-03 1996-07-31 +S000004252 ORF Verified YLR262C YPT6 Rab family GTPase YPT6 chromosome 12 L000002896|L000002948 12 668891 668244 C 2011-02-03 1996-07-31 Rab family GTPase; required for endosome-to-Golgii, intra-Golgi retrograde, and retrograde Golgi-to-ER transport; temporarily at the Golgi, dissociating into the cytosol on arrival of the late Golgi GTPase Ypt32p; Golgi-localized form is GTP bound, while cytosolic form is GDP-bound; required for delivery of Atg9p to the phagophore assembly site during autophagy under heat stress, with Ypt6p for starvation induced autophagy and for the CVT pathway; homolog of mammalian Rab6 +S000035164 CDS YLR262C 12 668891 668244 C 2011-02-03 1996-07-31 +S000007246 ORF Verified YLR262C-A TMA7 RBF7 chromosome 12 12 669662 669468 C 2011-02-03 1999-07-17 Protein of unknown that associates with ribosomes; null mutant exhibits translation defects, altered polyribosome profiles, and resistance to the translation inhibitor anisomcyin; protein abundance increases in response to DNA replication stress +S000036510 CDS YLR262C-A 12 669662 669468 C 2011-02-03 1999-07-17 +S000004253 ORF Verified YLR263W RED1 chromosome 12 L000001608 12 670340 672823 W 2011-02-03 1996-07-31 Protein component of the synaptonemal complex axial elements; involved in chromosome segregation during the first meiotic division; critical for coupling checkpoint signaling to SC formation; promotes interhomolog recombination by phosphorylating Hop1p; also interacts with Mec3p and Ddc1p +S000036094 CDS YLR263W 12 670340 672823 W 2011-02-03 1996-07-31 +S000004254 ORF Verified YLR264W RPS28B eS28|ribosomal 40S subunit protein S28B|S28e|YS27|S33B|S28B|RPS33B chromosome 12 L000002744 12 673131 673334 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S28, no bacterial homolog; has an extraribosomal function in autoregulation, in which Rps28Bp binds to a decapping complex via Edc3p, which then binds to RPS28B mRNA leading to its decapping and degradation; RPS28B has a paralog, RPS28A, that arose from the whole genome duplication +S000036202 CDS YLR264W 12 673131 673334 W 2011-02-03 1996-07-31 +S000028808 ORF Uncharacterized YLR264C-A chromosome 12 12 673944 673828 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000033593 CDS YLR264C-A 12 673944 673828 C 2011-02-03 2003-07-29 +S000004255 ORF Verified YLR265C NEJ1 LIF2 chromosome 12 12 675455 674427 C 2011-02-03 1996-07-31 Protein involved in regulation of nonhomologous end joining; interacts with DNA ligase IV components Dnl4p and Lif1p; repressed by MAT heterozygosity; regulates cellular distribution of Lif1p +S000036242 CDS YLR265C 12 675455 674427 C 2011-02-03 1996-07-31 +S000004256 ORF Verified YLR266C PDR8 chromosome 12 12 677724 675619 C 2011-02-03 1996-07-31 Transcription factor; targets include ATP-binding cassette (ABC) transporters, major facilitator superfamily transporters, and other genes involved in the pleiotropic drug resistance (PDR) phenomenon; PDR8 has a paralog, YRR1, that arose from the whole genome duplication +S000031731 CDS YLR266C 12 677724 675619 C 2011-02-03 1996-07-31 +S000004257 ORF Uncharacterized YLR267W BOP2 chromosome 12 L000004722 12 678212 679924 W 2011-02-03 1996-07-31 Protein of unknown function +S000031962 CDS YLR267W 12 678212 679924 W 2011-02-03 1996-07-31 +S000004258 ORF Verified YLR268W SEC22 SNAP receptor SEC22|TS26|TSL26|SLY2 chromosome 12 L000001845|S000029606|L000002362 12 680200 680844 W 2011-02-03 1996-07-31 R-SNARE protein; assembles into SNARE complex with Bet1p, Bos1p and Sed5p; cycles between the ER and Golgi complex; involved in anterograde and retrograde transport between the ER and Golgi; synaptobrevin homolog +S000037429 CDS YLR268W 12 680200 680844 W 2011-02-03 1996-07-31 +S000004260 ORF Verified YLR270W DCS1 5'-(N(7)-methyl 5'-triphosphoguanosine)-(mRNA) diphosphatase|DcpS chromosome 12 12 681186 682238 W 2011-02-03 1996-07-31 Non-essential hydrolase involved in mRNA decapping; activates Xrn1p; may function in a feedback mechanism to regulate deadenylation, contains pyrophosphatase activity and a HIT (histidine triad) motif; acts as inhibitor of neutral trehalase Nth1p; required for growth on glycerol medium; protein abundance increases in response to DNA replication stress; DCS1 has a paralog, DCS2, that arose from the whole genome duplication +S000037138 CDS YLR270W 12 681186 682238 W 2011-02-03 1996-07-31 +S000004259 ORF Dubious YLR269C chromosome 12 12 681216 680866 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037460 CDS YLR269C 12 681216 680866 C 2011-02-03 1996-07-31 +S000004261 ORF Uncharacterized YLR271W CMG1 chromosome 12 12 682737 683561 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus and is induced in response to the DNA-damaging agent MMS +S000037234 CDS YLR271W 12 682737 683561 W 2011-02-03 1996-07-31 +S000004262 ORF Verified YLR272C YCS4 condensin subunit YCS4|LOC7 chromosome 12 12 687202 683672 C 2011-02-03 1996-07-31 Subunit of the condensin complex; required for establishment and maintenance of chromosome condensation, chromosome segregation, chromatin binding of condensin, tRNA gene clustering at the nucleolus, and silencing at the mating type locus; required for replication slow zone (RSZ) breakage following Mec1p inactivation +S000037272 CDS YLR272C 12 687202 683672 C 2011-02-03 1996-07-31 +S000006762 tRNA_gene tV(AAC)L chromosome 12 L000003659 12 687932 687859 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000032966 noncoding_exon tV(AAC)L 12 687932 687859 C 2011-02-03 2000-05-19 +S000007071 long_terminal_repeat YLRCdelta16 chromosome 12 12 688368 688119 C 2011-02-03 2000-05-19 Ty1 LTR +S000007091 long_terminal_repeat YLRWdelta17 chromosome 12 12 688369 688664 W 2011-02-03 2000-05-19 Ty1 LTR +S000004263 ORF Verified YLR273C PIG1 protein phosphatase regulator PIG1 chromosome 12 L000001436 12 691029 689083 C 2011-02-03 1996-07-31 Putative targeting subunit for type-1 protein phosphatase Glc7p; tethers Glc7p to Gsy2p glycogen synthase; PIG1 has a paralog, GAC1, that arose from the whole genome duplication +S000037347 CDS YLR273C 12 691029 689083 C 2011-02-03 1996-07-31 +S000004264 ORF Verified YLR274W MCM5 MCM DNA helicase complex subunit MCM5|CDC46|BOB1 chromosome 12 L000000279 12 691555 693882 W 2011-02-03 1996-07-31 Component of the Mcm2-7 hexameric helicase complex; MCM complex is important for priming origins of DNA replication in G1 and becomes an active ATP-dependent helicase that promotes DNA melting and elongation when activated by Cdc7p-Dbf4p in S-phase +S000030019 CDS YLR274W 12 691555 693882 W 2011-02-03 1996-07-31 +S000004265 ORF Verified YLR275W SMD2 mRNA splicing protein SMD2|Sm D2 chromosome 12 L000004145 12 694378 694800 W 2011-02-03 1996-07-31 Core Sm protein Sm D2; part of heteroheptameric complex (with Smb1p, Smd1p, Smd3p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm D2 +S000030096 CDS YLR275W 12 694378 694382 W 2011-02-03 1996-07-31 +S000030097 CDS YLR275W 12 694473 694800 W 2011-02-03 1996-07-31 +S000030098 intron YLR275W 12 694383 694472 W 2011-02-03 1996-07-31 +S000004266 ORF Verified YLR276C DBP9 ATP-dependent DNA/RNA helicase chromosome 12 L000004249 12 696830 695046 C 2011-02-03 1996-07-31 DEAD-box protein required for 27S rRNA processing; exhibits DNA, RNA and DNA/RNA helicase activities; ATPase activity shows preference for DNA over RNA; DNA helicase activity abolished by mutation in RNA-binding domain +S000030144 CDS YLR276C 12 696830 695046 C 2011-02-03 1996-07-31 +S000004267 ORF Verified YLR277C YSH1 cleavage polyadenylation factor subunit YSH1|BRR5 chromosome 12 L000003344 12 699495 697156 C 2011-02-03 1996-07-31 Endoribonuclease; subunit of the mRNA cleavage and polyadenylation specificity complex; required for 3' processing, splicing, and transcriptional termination of mRNAs and snoRNAs; protein abundance increases in response to DNA replication stress; YSH1 has a paralog, SYC1, that arose from the whole genome duplication +S000030344 CDS YLR277C 12 699495 697156 C 2011-02-03 1996-07-31 +S000004268 ORF Uncharacterized YLR278C chromosome 12 12 704024 699999 C 2011-02-03 1996-07-31 Zinc-cluster protein; GFP-fusion protein localizes to the nucleus; mutant shows moderate growth defect on caffeine; has a prion-domain like fragment that increases frequency of [URE3]; YLR278C is not an essential gene +S000033636 CDS YLR278C 12 704024 699999 C 2011-02-03 1996-07-31 +S000004269 ORF Dubious YLR279W chromosome 12 12 704309 704698 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033857 CDS YLR279W 12 704309 704698 W 2011-02-03 1996-07-31 +S000004270 ORF Dubious YLR280C chromosome 12 12 704833 704483 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033385 CDS YLR280C 12 704833 704483 C 2011-02-03 1996-07-31 +S000004271 ORF Uncharacterized YLR281C chromosome 12 12 704960 704493 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YLR281C is not an essential gene +S000033456 CDS YLR281C 12 704960 704493 C 2011-02-03 1996-07-31 +S000004273 ORF Uncharacterized YLR283W chromosome 12 12 705186 706130 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YLR283W is not an essential gene +S000034433 CDS YLR283W 12 705186 706130 W 2011-02-03 1996-07-31 +S000004272 ORF Dubious YLR282C chromosome 12 12 705412 705071 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion mutation confers an increase in Ty1 transposition +S000033516 CDS YLR282C 12 705412 705071 C 2011-02-03 1996-07-31 +S000004274 ORF Verified YLR284C ECI1 dodecenoyl-CoA isomerase chromosome 12 L000004206 12 707040 706198 C 2011-02-03 1996-07-31 Peroxisomal delta3,delta2-enoyl-CoA isomerase; hexameric protein that converts 3-hexenoyl-CoA to trans-2-hexenoyl-CoA, essential for the beta-oxidation of unsaturated fatty acids, oleate-induced; ECI1 has a paralog, DCI1, that arose from the whole genome duplication +S000034471 CDS YLR284C 12 707040 706198 C 2011-02-03 1996-07-31 +S000004275 ORF Verified YLR285W NNT1 EFM7|S-adenosylmethionine-dependent methyltransferase chromosome 12 12 707360 708145 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent methyltransferase; novel N-terminal protein methyltransferase that trimethylates the N-terminal glycine residue (G2) and also dimethylates lysine (K3) on elongation factor eEF1A (Tef1p/Tef2p); has a role in rDNA silencing and in lifespan determination +S000034643 CDS YLR285W 12 707360 708145 W 2011-02-03 1996-07-31 +S000028569 ORF Uncharacterized YLR285C-A chromosome 12 12 708338 708168 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031275 CDS YLR285C-A 12 708338 708168 C 2011-02-03 2003-07-29 +S000028679 ORF Dubious YLR286W-A chromosome 12 12 708562 708696 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene CTS1 +S000032537 CDS YLR286W-A 12 708562 708696 W 2011-02-03 2003-07-29 +S000004276 ORF Verified YLR286C CTS1 SCW2 chromosome 12 L000000434|S000029435|L000004563 12 710136 708448 C 2011-02-03 1996-07-31 Endochitinase; required for cell separation after mitosis; transcriptional activation during the G1 phase of the cell cycle is mediated by transcription factor Ace2p +S000034680 CDS YLR286C 12 710136 708448 C 2011-02-03 1996-07-31 +S000004277 ORF Uncharacterized YLR287C chromosome 12 12 712058 710991 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YLR287C is not an essential gene +S000035680 CDS YLR287C 12 712058 710991 C 2011-02-03 1996-07-31 +S000004278 ORF Verified YLR287C-A RPS30A eS30|ribosomal 40S subunit protein S30A|S30e|S30A chromosome 12 L000003183 12 713158 712537 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S30, no bacterial homolog; RPS30A has a paralog, RPS30B, that arose from the whole genome duplication +S000030932 CDS YLR287C-A 12 712725 712537 C 2011-02-03 1996-07-31 +S000030931 CDS YLR287C-A 12 713158 713156 C 2011-02-03 1996-07-31 +S000030933 intron YLR287C-A 12 713155 712726 C 2011-02-03 1996-07-31 +S000004279 ORF Verified YLR288C MEC3 PSO9|PIP3 chromosome 12 L000002907 12 714904 713480 C 2011-02-03 1996-07-31 DNA damage and meiotic pachytene checkpoint protein; subunit of a heterotrimeric complex (Rad17p-Mec3p-Ddc1p) that forms a sliding clamp, loaded onto partial duplex DNA by a clamp loader complex; homolog of human and S. pombe Hus1 +S000035804 CDS YLR288C 12 714904 713480 C 2011-02-03 1996-07-31 +S000004280 ORF Verified YLR289W GUF1 GTPase GUF1 chromosome 12 L000002749 12 715089 717026 W 2011-02-03 1996-07-31 Mitochondrial matrix GTPase; associates with mitochondrial ribosomes; important for translation under temperature and nutrient stress; may have a role in translational fidelity; similar to bacterial LepA elongation factor +S000037787 CDS YLR289W 12 715089 717026 W 2011-02-03 1996-07-31 +S000004281 ORF Verified YLR290C COQ11 ubiquinone biosynthesis protein COQ11|MRX2 chromosome 12 12 717978 717145 C 2011-02-03 1996-07-31 Putative oxidoreductase, subunit of Coenzyme Q biosynthetic complexes; required for synthesis of wild-type levels of Coenzyme Q (ubiquinone); member of the short-chain dehydrogenase/reductase (SDR) superfamily; orthologous gene in some other fungi is fused to the COQ10 ortholog +S000036802 CDS YLR290C 12 717978 717145 C 2011-02-03 1996-07-31 +S000004282 ORF Verified YLR291C GCD7 translation initiation factor eIF2B subunit beta chromosome 12 L000000675 12 719462 718317 C 2011-02-03 1996-07-31 Beta subunit of the translation initiation factor eIF2B; the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression; human homolog EIF2B2 can complement yeast mutant, allows growth down-regulation of yeast gene +S000036871 CDS YLR291C 12 719462 718317 C 2011-02-03 1996-07-31 +S000004283 ORF Verified YLR292C SEC72 Sec63 complex subunit SEC72|SIM2|SEC67 chromosome 12 L000001857 12 720370 719789 C 2011-02-03 1996-07-31 Non-essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; other members are Sec63p, Sec62p, and Sec66p +S000037611 CDS YLR292C 12 720370 719789 C 2011-02-03 1996-07-31 +S000130184 ARS ARS1221 chromosome 12 12 720784 721418 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004284 ORF Verified YLR293C GSP1 Ran GTPase GSP1|CST17|CNR1 chromosome 12 L000000736 12 721430 720771 C 2011-02-03 1996-07-31 Ran GTPase; GTP binding protein (mammalian Ranp homolog) involved in the maintenance of nuclear organization, RNA processing and transport; regulated by Srm1p, Rna1p, Yrb1p, Yrb2p, Yrp4p, Yrb30p, Cse1p and Kap95p; GSP1 has a paralog, GSP2, that arose from the whole genome duplication +S000037671 CDS YLR293C 12 721430 720771 C 2011-02-03 1996-07-31 +S000004285 ORF Dubious YLR294C chromosome 12 12 722030 721701 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene ATP14 +S000037718 CDS YLR294C 12 722030 721701 C 2011-02-03 1996-07-31 +S000004286 ORF Verified YLR295C ATP14 F1F0 ATP synthase subunit h chromosome 12 L000003379 12 722373 721999 C 2011-02-03 1996-07-31 Subunit h of the F0 sector of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; protein abundance increases in response to DNA replication stress +S000037778 CDS YLR295C 12 722373 721999 C 2011-02-03 1996-07-31 +S000004287 ORF Dubious YLR296W chromosome 12 12 722978 723304 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030715 CDS YLR296W 12 722978 723304 W 2011-02-03 1996-07-31 +S000004288 ORF Verified YLR297W chromosome 12 12 724044 724433 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; not an essential gene; induced by treatment with 8-methoxypsoralen and UVA irradiation; relocalizes from nucleus to vacuole upon DNA replication stress; YLR297W has a paralog, YOR186W, that arose from the whole genome duplication +S000030831 CDS YLR297W 12 724044 724433 W 2011-02-03 1996-07-31 +S000004289 ORF Verified YLR298C YHC1 U1C|U1-C chromosome 12 L000004161 12 725416 724721 C 2011-02-03 1996-07-31 Component of the U1 snRNP complex required for pre-mRNA splicing; putative ortholog of human U1C protein, which is involved in formation of a complex between U1 snRNP and the pre-mRNA 5' splice site +S000030863 CDS YLR298C 12 725416 724721 C 2011-02-03 1996-07-31 +S000004290 ORF Verified YLR299W ECM38 gamma-glutamyltransferase|CIS2 chromosome 12 L000003905 12 726069 728051 W 2011-02-03 1996-07-31 Gamma-glutamyltranspeptidase; major glutathione-degrading enzyme; involved in detoxification of electrophilic xenobiotics; expression induced mainly by nitrogen starvation +S000031951 CDS YLR299W 12 726069 728051 W 2011-02-03 1996-07-31 +S000028680 ORF Dubious YLR299C-A chromosome 12 12 728003 727911 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene ECM38 +S000032551 CDS YLR299C-A 12 728003 727911 C 2011-02-03 2003-07-29 +S000004291 ORF Verified YLR300W EXG1 glucan 1,3-beta-glucosidase|SCW6|BGL1 chromosome 12 L000000592|S000029437|L000004567 12 728955 730301 W 206 2011-02-03 1996-07-31 Major exo-1,3-beta-glucanase of the cell wall; involved in cell wall beta-glucan assembly; exists as three differentially glycosylated isoenzymes; EXG1 has a paralog, SPR1, that arose from the whole genome duplication +S000030080 CDS YLR300W 12 728955 730301 W 2011-02-03 1996-07-31 +S000004292 ORF Verified YLR301W HRI1 chromosome 12 12 730825 731559 W 2011-02-03 1996-07-31 Protein of unknown function that interacts with Sec72p and Hrr25p +S000030226 CDS YLR301W 12 730825 731559 W 2011-02-03 1996-07-31 +S000007072 long_terminal_repeat YLRCdelta18 chromosome 12 12 732000 731668 C 2011-02-03 2000-05-19 Ty2 LTR +S000006656 tRNA_gene tL(UAG)L2 chromosome 12 L000003649 12 732090 732190 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000035006 intron tL(UAG)L2 12 732128 732146 W 2011-02-03 2000-05-19 +S000035004 noncoding_exon tL(UAG)L2 12 732090 732127 W 2011-02-03 2000-05-19 +S000035005 noncoding_exon tL(UAG)L2 12 732147 732190 W 2011-02-03 2000-05-19 +S000004294 ORF Verified YLR303W MET17 bifunctional cysteine synthase/O-acetylhomoserine aminocarboxypropyltransferase MET17|MET25|MET15 chromosome 12 L000001091|L000001088 12 732542 733876 W 2011-02-03 1996-07-31 O-acetyl homoserine-O-acetyl serine sulfhydrylase; required for Methionine and cysteine biosynthesis +S000030497 CDS YLR303W 12 732542 733876 W 2011-02-03 1996-07-31 +S000004293 ORF Dubious YLR302C chromosome 12 12 732553 732191 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030295 CDS YLR302C 12 732553 732191 C 2011-02-03 1996-07-31 +S000007073 long_terminal_repeat YLRCdelta19 chromosome 12 12 734671 734501 C 2011-02-03 2000-05-19 Ty1 LTR +S000006607 tRNA_gene tI(AAU)L1 chromosome 12 L000003650 12 734802 734875 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000033931 noncoding_exon tI(AAU)L1 12 734802 734875 W 2011-02-03 2000-05-19 +S000004295 ORF Verified YLR304C ACO1 aconitate hydratase ACO1|GLU1 chromosome 12 L000000022 12 737548 735212 C 2011-02-03 1996-07-31 Aconitase; required for the tricarboxylic acid (TCA) cycle and also independently required for mitochondrial genome maintenance; component of the mitochondrial nucleoid; mutation leads to glutamate auxotrophy; human homolog ACO2 can complement yeast null mutant +S000031331 CDS YLR304C 12 737548 735212 C 2011-02-03 1996-07-31 +S000004296 ORF Verified YLR305C STT4 1-phosphatidylinositol 4-kinase STT4 chromosome 12 L000002137 12 743863 738161 C 2011-02-03 1996-07-31 Phosphatidylinositol-4-kinase; functions in the Pkc1p protein kinase pathway; required for normal vacuole morphology, cell wall integrity, and actin cytoskeleton organization +S000031384 CDS YLR305C 12 743863 738161 C 2011-02-03 1996-07-31 +S000004297 ORF Verified YLR306W UBC12 NEDD8-conjugating protein UBC12 chromosome 12 L000003386 12 744151 744851 W 2011-02-03 1996-07-31 Enzyme that mediates the conjugation of Rub1p; a ubiquitin-like protein, to other proteins; related to E2 ubiquitin-conjugating enzymes +S000031518 CDS YLR306W 12 744151 744153 W 2011-02-03 1996-07-31 +S000031519 CDS YLR306W 12 744288 744851 W 2011-02-03 1996-07-31 +S000031520 intron YLR306W 12 744154 744287 W 2011-02-03 1996-07-31 +S000118479 ARS ARS1223 ARSXII-745 chromosome 12 12 744943 745179 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication capacity dependent upon Sum1p +S000178141 ARS_consensus_sequence ARS1223 12 745116 745100 C 2014-11-18 2014-11-18 +S000004298 ORF Verified YLR307W CDA1 chitin deacetylase CDA1 chromosome 12 L000003112 12 745620 746525 W 2011-02-03 1996-07-31 Chitin deacetylase; together with Cda2p involved in the biosynthesis ascospore wall component, chitosan; required for proper rigidity of the ascospore wall +S000031600 CDS YLR307W 12 745620 746525 W 2011-02-03 1996-07-31 +S000028525 ORF Uncharacterized YLR307C-A chromosome 12 12 747111 746848 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000030327 CDS YLR307C-A 12 747111 746848 C 2011-02-03 2003-07-29 +S000004299 ORF Verified YLR308W CDA2 chitin deacetylase CDA2 chromosome 12 L000003113 12 747937 748875 W 2011-02-03 1996-07-31 Chitin deacetylase; together with Cda1p involved in the biosynthesis ascospore wall component, chitosan; required for proper rigidity of the ascospore wall +S000032597 CDS YLR308W 12 747937 748875 W 2011-02-03 1996-07-31 +S000004300 ORF Verified YLR309C IMH1 SYS3 chromosome 12 L000003981 12 751769 749034 C 2011-02-03 1996-07-31|2011-02-03 Protein involved in vesicular transport; mediates transport between an endosomal compartment and the Golgi, contains a Golgi-localization (GRIP) domain that interacts with activated Arl1p-GTP to localize Imh1p to the Golgi +S000032653 CDS YLR309C 12 751769 749034 C 2011-02-03 1996-07-31|2011-02-03 +S000004301 ORF Verified YLR310C CDC25 Ras family guanine nucleotide exchange factor CDC25|CDC25'|CTN1 chromosome 12 L000000264|L000000263 12 756993 752224 C 213 2011-02-03 1996-07-31 Membrane bound guanine nucleotide exchange factor; also known as a GEF or GDP-release factor; indirectly regulates adenylate cyclase through activation of Ras1p and Ras2p by stimulating the exchange of GDP for GTP; required for progression through G1; thermosensitivity of the cdc25-5 mutant is functionally complemented by human RASGRF1 or by a fragment of human SOS1 comprising the CDC25-related catalytic domain +S000032496 CDS YLR310C 12 756993 752224 C 2011-02-03 1996-07-31 +S000004302 ORF Dubious YLR311C chromosome 12 12 757612 757265 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034499 CDS YLR311C 12 757612 757265 C 2011-02-03 1996-07-31 +S000004303 ORF Verified YLR312C ATG39 QNQ1 chromosome 12 12 758833 757637 C 2011-02-03 1996-07-31 Autophagy receptor with a role in degradation of the ER and nucleus; involved specifically in autophagy of perinuclear endoplasmic reticulum in response to nitrogen starvation or rapamycin treatment; localizes to the perinuclear ER +S000034606 CDS YLR312C 12 758833 757637 C 2011-02-03 1996-07-31 +S000004304 ORF Verified YLR312W-A MRPL15 mitochondrial 54S ribosomal protein YmL15|YmL15 chromosome 12 L000002688 12 759480 760241 W 2011-02-03 2001-06-12|1997-07-01|2006-10-03 Mitochondrial ribosomal protein of the large subunit +S000037404 CDS YLR312W-A 12 759480 760241 W 2011-02-03 1997-07-01|2006-10-03 +S000004305 ORF Verified YLR313C SPH1 YLR312C-B chromosome 12 L000004149 12 762342 760750 C 2011-02-03 2004-02-05|1996-07-31|2011-02-03 Protein involved in shmoo formation and bipolar bud site selection; localizes to sites of polarized growth in a cell cycle dependent- and Spa2p-dependent manner, interacts with MAPKKs Mkk1p, Mkk2p, and Ste7p; SPH1 has a paralog, SPA2, that arose from the whole genome duplication +S000034673 CDS YLR313C 12 762342 760750 C 2011-02-03 2004-02-05|1996-07-31|2011-02-03 +S000004306 ORF Verified YLR314C CDC3 septin CDC3 chromosome 12 L000000243 12 764137 762575 C 215 2004-02-05 1996-07-31|2011-02-03 Component of the septin ring that is required for cytokinesis; septins are GTP-binding proteins that assemble with other septins into rod-like complexes that can associate with other rods to form filament polymers; septin rings at the mother-bud neck act as scaffolds for recruiting factors needed for cell division and as barriers to prevent diffusion of specific proteins between mother and daughter cells +S000034752 CDS YLR314C 12 764137 762575 C 2004-02-05 1996-07-31|2011-02-03 +S000004307 ORF Verified YLR315W NKP2 chromosome 12 12 764808 765269 W 2004-02-05 1996-07-31 Central kinetochore protein and subunit of the Ctf19 complex; mutants have elevated rates of chromosome loss; orthologous to fission yeast kinetochore protein cnl2 +S000035712 CDS YLR315W 12 764808 765269 W 2004-02-05 1996-07-31 +S000004309 ORF Dubious YLR317W chromosome 12 12 765655 766089 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; may be part of a bicistronic transcript with NKP2/YLR315W; overlaps the verified ORF TAD3/YLR316C +S000035934 CDS YLR317W 12 765655 766089 W 2004-02-05 1996-07-31 +S000004308 ORF Verified YLR316C TAD3 chromosome 12 S000007486 12 766358 765266 C 2004-02-05 2000-07-22|1996-07-31 Subunit of tRNA-specific adenosine-34 deaminase; forms a heterodimer with Tad2p that converts adenosine to inosine at the wobble position of several tRNAs +S000035749 CDS YLR316C 12 766073 765266 C 2004-02-05 2000-07-22|1996-07-31 +S000035748 CDS YLR316C 12 766181 766130 C 2004-02-05 2000-07-22 +S000035747 CDS YLR316C 12 766358 766250 C 2004-02-05 2000-07-22 +S000035751 intron YLR316C 12 766129 766074 C 2004-02-05 2000-07-22 +S000035750 intron YLR316C 12 766249 766182 C 2004-02-05 2000-07-22 +S000004310 ORF Verified YLR318W EST2 TERT chromosome 12 L000003504 12 766542 769196 W 2004-02-05 1996-07-31|2011-02-03 Reverse transcriptase subunit of the telomerase holoenzyme; essential for telomerase core catalytic activity, involved in other aspects of telomerase assembly and function; mutations in human homolog are associated with aplastic anemia +S000036808 CDS YLR318W 12 766542 769196 W 2004-02-05 1996-07-31|2011-02-03 +S000004311 ORF Verified YLR319C BUD6 AIP3 chromosome 12 L000000071|L000002602 12 771684 769318 C 221 2004-02-05 1996-07-31 Actin- and formin-interacting protein; participates in actin cable assembly and organization as a nucleation-promoting factor (NPF) for formins Bni1p and Bnr1p; a triple helical coiled-coil domain in the C-terminal region interacts with Bni1p; involved in polarized cell growth; isolated as bipolar budding mutant; potential Cdc28p substrate +S000036838 CDS YLR319C 12 771684 769318 C 2004-02-05 1996-07-31 +S000004312 ORF Verified YLR320W MMS22 SLM2 chromosome 12 12 771940 776304 W 2004-02-05 1996-07-31 Subunit of E3 ubiquitin ligase complex involved in replication repair; stabilizes protein components of the replication fork, such as the fork-pausing complex and leading strand polymerase, preventing fork collapse and promoting efficient recovery during replication stress; required for accurate meiotic chromosome segregation +S000036604 CDS YLR320W 12 771940 776304 W 2004-02-05 1996-07-31 +S000004314 ORF Dubious YLR322W VPS65 chromosome 12 12 777628 777942 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 75% of ORF overlaps the verified gene SFH1; deletion causes a vacuolar protein sorting defect and blocks anaerobic growth +S000036774 CDS YLR322W 12 777628 777942 W 2004-02-05 1996-07-31 +S000004313 ORF Verified YLR321C SFH1 chromosome 12 L000003282 12 777864 776584 C 2004-02-05 1996-07-31 Component of the RSC chromatin remodeling complex; essential gene required for cell cycle progression and maintenance of proper ploidy; phosphorylated in the G1 phase of the cell cycle; Snf5p paralog; hSNF5 tumor suppressor ortholog +S000036636 CDS YLR321C 12 777864 776584 C 2004-02-05 1996-07-31 +S000004315 ORF Verified YLR323C CWC24 U2-type spliceosomal complex subunit CWC24 chromosome 12 12 778952 778173 C 2004-02-05 1996-07-31 General splicing factor; required for stable U2 snRNP binding to primary transcripts; essential for the first step of splicing; component of the pre-catalytic spliceosome complex containing Cef1p; similar to S. pombe Cwf24p +S000030574 CDS YLR323C 12 778952 778173 C 2004-02-05 1996-07-31 +S000004316 ORF Verified YLR324W PEX30 peroxisome biogenesis protein chromosome 12 12 779215 780786 W 2004-02-05 1996-07-31 ER-resident protein involved in peroxisomal biogenesis; ER-localized protein that associates with peroxisomes; interacts with Pex29p and reticulons Rtn1p and Yop1p to regulate peroxisome biogenesis from the ER; role in peroxisomal-destined vesicular flow from the ER; partially redundant with Pex31p; may function at a step downstream of steps mediated by Pex28p and Pex29p; PEX30 has a paralog, PEX31, that arose from the whole genome duplication +S000030797 CDS YLR324W 12 779215 780786 W 2004-02-05 1996-07-31 +S000004317 ORF Verified YLR325C RPL38 eL38|ribosomal 60S subunit protein L38|L38e|L38 chromosome 12 L000004468 12 781379 781143 C 2004-02-05 1996-07-31 Ribosomal 60S subunit protein L38; homologous to mammalian ribosomal protein L38, no bacterial homolog +S000030800 CDS YLR325C 12 781379 781143 C 2004-02-05 1996-07-31 +S000004318 ORF Uncharacterized YLR326W chromosome 12 12 782174 782896 W 2004-02-05 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cell periphery; predicted to be palmitoylated +S000031891 CDS YLR326W 12 782174 782896 W 2004-02-05 1996-07-31 +S000004319 ORF Verified YLR327C TMA10 RBF9|SFL2 chromosome 12 12 783387 783127 C 2004-02-05 1996-07-31 Protein of unknown function that associates with ribosomes; protein abundance increases in response to DNA replication stress; TMA10 has a paralog, STF2, that arose from the whole genome duplication +S000031973 CDS YLR327C 12 783387 783127 C 2004-02-05 1996-07-31 +S000006732 tRNA_gene tX(XXX)L tS(GCU)L chromosome 12 L000003651 12 784354 784453 W 2004-02-05 2000-05-19 tRNA of undetermined specificity, predicted by tRNAscan-SE analysis; very similar to serine tRNAs +S000037471 intron tX(XXX)L 12 784390 784409 W 2004-02-05 2000-05-19 +S000037469 noncoding_exon tX(XXX)L 12 784354 784389 W 2004-02-05 2000-05-19 +S000037470 noncoding_exon tX(XXX)L 12 784410 784453 W 2004-02-05 2000-05-19 +S000004320 ORF Verified YLR328W NMA1 nicotinamide-nucleotide adenylyltransferase NMA1 chromosome 12 12 784913 786118 W 2004-02-05 1996-07-31 Nicotinic acid mononucleotide adenylyltransferase; catalyzes the transfer of the adenylyl moiety of ATP to nicotinamide mononucleotide to form NAD; involved in pathways of NAD biosynthesis, including the de novo, NAD(+) salvage, and nicotinamide riboside salvage pathways; homolog of human NMNAT; NMA1 has a paralog, NMA2, that arose from the whole genome duplication +S000032965 CDS YLR328W 12 784913 786118 W 2004-02-05 1996-07-31 +S000004321 ORF Verified YLR329W REC102 chromosome 12 L000001604 12 786442 787333 W 235 2006-01-09 1996-07-31|2006-01-09 Protein involved in early stages of meiotic recombination; required for chromosome synapsis; forms a complex with Rec104p and Spo11p necessary during the initiation of recombination +S000113993 CDS YLR329W 12 786442 786615 W 2006-01-09 2006-01-09 +S000033059 CDS YLR329W 12 786713 787333 W 2006-01-09 1996-07-31|2006-01-09 +S000113994 intron YLR329W 12 786616 786712 W 2006-01-09 2006-01-09 +S000004322 ORF Verified YLR330W CHS5 CAL3 chromosome 12 L000000333 12 787664 789679 W 2004-02-05 1996-07-31 Component of the exomer complex; the exomer which also contains Csh6p, Bch1p, Bch2p, and Bud7, is involved in the export of select proteins, such as chitin synthase Chs3p, from the Golgi to the plasma membrane; interacts selectively with the activated, GTP-bound form of Arf1p; Chs5p is the only protein with a BRCT domain that is not localized to the nucleus +S000032805 CDS YLR330W 12 787664 789679 W 2004-02-05 1996-07-31 +S000004324 ORF Verified YLR332W MID2 KAI1 chromosome 12 L000001107|L000000885 12 790676 791806 W 2004-02-05 1996-07-31 O-glycosylated plasma membrane protein; acts as a sensor for cell wall integrity signaling and activates the pathway; interacts with Rom2p, a guanine nucleotide exchange factor for Rho1p, and with cell integrity pathway protein Zeo1p; MID2 has a paralog, MTL1, that arose from the whole genome duplication +S000034864 CDS YLR332W 12 790676 791806 W 2004-02-05 1996-07-31 +S000004323 ORF Dubious YLR331C JIP3 chromosome 12 12 791046 790669 C 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 98% of ORF overlaps the verified gene MID2 +S000032848 CDS YLR331C 12 791046 790669 C 2004-02-05 1996-07-31 +S000007097 long_terminal_repeat YLRWsigma4 chromosome 12 12 793552 793870 W 2004-02-05 2000-05-19 Ty3 LTR +S000006542 tRNA_gene tD(GUC)L2 chromosome 12 L000003652 12 793918 793989 W 2004-02-05 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000031888 noncoding_exon tD(GUC)L2 12 793918 793989 W 2004-02-05 2000-05-19 +S000118480 ARS ARS1226 ARSXII-794 chromosome 12 12 794100 794231 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178142 ARS_consensus_sequence ARS1226 12 794208 794192 C 2014-11-18 2014-11-18 +S000006452 snoRNA_gene snR61 SNR61 chromosome 12 L000004530 12 794575 794486 C 2004-02-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A1133 +S000030825 noncoding_exon snR61 12 794575 794486 C 2004-02-05 2000-05-19 +S000006446 snoRNA_gene snR55 SNR55 chromosome 12 L000004524 12 794794 794697 C 2004-02-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); predicted to guide 2'-O-methylation of small subunit (SSU) rRNA at position U1269 +S000030741 noncoding_exon snR55 12 794794 794697 C 2004-02-05 2000-05-19 +S000006448 snoRNA_gene snR57 SNR57 chromosome 12 L000004526 12 795024 794937 C 2004-02-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position G1572 +S000030763 noncoding_exon snR57 12 795024 794937 C 2004-02-05 2000-05-19 +S000004325 ORF Verified YLR333C RPS25B eS25|ribosomal 40S subunit protein S25B|S25e|rp45|YS23|S31B|S25B chromosome 12 L000001766 12 795899 795573 C 2004-02-05 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S25, no bacterial homolog; RPS25B has a paralog, RPS25A, that arose from the whole genome duplication +S000034910 CDS YLR333C 12 795899 795573 C 2004-02-05 1996-07-31 +S000122107 five_prime_UTR_intron YLR333C 12 796335 795913 C 2007-04-04 2007-04-04 +S000007092 long_terminal_repeat YLRWdelta20 chromosome 12 12 796899 797088 W 2004-02-05 2000-05-19 Ty1 LTR +S000004326 ORF Dubious YLR334C chromosome 12 12 797078 796698 C 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps a stand-alone long terminal repeat sequence whose presence indicates a retrotransposition event occurred here +S000035063 CDS YLR334C 12 797078 796698 C 2004-02-05 1996-07-31 +S000006559 tRNA_gene tE(UUC)L chromosome 12 L000003653 12 797178 797249 W 2004-02-05 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin +S000036008 noncoding_exon tE(UUC)L 12 797178 797249 W 2004-02-05 2000-05-19 +S000004327 ORF Verified YLR335W NUP2 nucleoporin NUP2 chromosome 12 L000001289 12 797430 799592 W 2004-02-05 1996-07-31 Nucleoporin involved in nucleocytoplasmic transport; binds to either the nucleoplasmic or cytoplasmic faces of the nuclear pore complex depending on Ran-GTP levels; also has a role in chromatin organization +S000035216 CDS YLR335W 12 797430 799592 W 2004-02-05 1996-07-31 +S000004328 ORF Verified YLR336C SGD1 chromosome 12 L000003498 12 802396 799697 C 2004-02-05 1996-07-31 Essential nuclear protein; required for biogenesis of the small ribosomal subunit; has a possible role in the osmoregulatory glycerol response; putative homolog of human NOM1 which is implicated in acute myeloid leukemia +S000035257 CDS YLR336C 12 802396 799697 C 2004-02-05 1996-07-31 +S000004330 ORF Dubious YLR338W OPI9 chromosome 12 12 804346 805203 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF VRP1/YLR337C +S000031689 CDS YLR338W 12 804346 805203 W 2004-02-05 1996-07-31 +S000004329 ORF Verified YLR337C VRP1 YLR337W|MDP2|END5 chromosome 12 L000001055|L000002481 12 805106 802653 C 2004-02-05 1996-07-31 Verprolin, proline-rich actin-associated protein; involved in cytoskeletal organization and cytokinesis; promotes actin nucleation and endocytosis; related to mammalian Wiskott-Aldrich syndrome protein (WASP)-interacting protein (WIP) +S000036142 CDS YLR337C 12 805106 802653 C 2004-02-05 1996-07-31 +S000004332 ORF Verified YLR340W RPP0 uL10|ribosomal protein P0|P0|L10E|A0|RPL10E chromosome 12 L000002669 12 805887 806825 W 2004-02-05 1996-07-31 Conserved ribosomal protein P0 of the ribosomal stalk; involved in interaction between translational elongation factors and the ribosome; phosphorylated on serine 302; homologous to mammalian ribosomal protein LP0 and bacterial L10 +S000036299 CDS YLR340W 12 805887 806825 W 2004-02-05 1996-07-31 +S000004331 ORF Dubious YLR339C chromosome 12 12 806335 805784 C 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential gene RPP0 +S000031733 CDS YLR339C 12 806335 805784 C 2004-02-05 1996-07-31 +S000004333 ORF Verified YLR341W SPO77 chromosome 12 12 807385 808818 W 2004-02-05 1996-07-31 Meiosis-specific protein of unknown function; required for spore wall formation during sporulation and for timely prospore membrane closure along with SPS1; required with Sps1p for phosphorylation and turnover of Ssp1p; dispensable for both nuclear divisions during meiosis +S000036414 CDS YLR341W 12 807385 808818 W 2004-02-05 1996-07-31 +S000004334 ORF Verified YLR342W FKS1 1,3-beta-D-glucan synthase|PBR1|GSC1|ETG1|CWH53|CND1 chromosome 12 L000000445|L000000732 12 809997 815627 W 2004-02-05 1996-07-31 Catalytic subunit of 1,3-beta-D-glucan synthase; functionally redundant with alternate catalytic subunit Gsc2p; binds to regulatory subunit Rho1p; involved in cell wall synthesis and maintenance; localizes to sites of cell wall remodeling; FKS1 has a paralog, GSC2, that arose from the whole genome duplication +S000036475 CDS YLR342W 12 809997 815627 W 2004-02-05 1996-07-31 +S000028571 ORF Uncharacterized YLR342W-A chromosome 12 12 815810 815983 W 2003-07-29 2003-07-29 Putative protein of unknown function +S000031299 CDS YLR342W-A 12 815810 815983 W 2003-07-29 2003-07-29 +S000004335 ORF Verified YLR343W GAS2 1,3-beta-glucanosyltransferase chromosome 12 12 816094 817761 W 2004-02-05 1996-07-31 1,3-beta-glucanosyltransferase; involved with Gas4p in spore wall assembly; has similarity to Gas1p +S000037140 CDS YLR343W 12 816094 817761 W 2004-02-05 1996-07-31 +S000007074 long_terminal_repeat YLRCdelta21 chromosome 12 12 818403 818073 C 2004-02-05 2000-05-19 Ty1 LTR +S000006706 tRNA_gene tR(CCG)L TRR4 chromosome 12 L000003654 12 818609 818680 W 2004-02-05 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; single essential nuclear tRNA gene containing the tDNA-anticodon CCG (presumably CCG in the mature tRNA), decodes CGG codons into arginine, one of 19 nuclear tRNAs for arginine; correct folding and efficient aminoacylation require Lhp1p +S000037079 noncoding_exon tR(CCG)L 12 818609 818680 W 2004-02-05 2000-05-19 +S000004336 ORF Verified YLR344W RPL26A uL24|ribosomal 60S subunit protein L26A|L24|YL33|L33A|L26A chromosome 12 L000004461 12 819312 820142 W 2004-02-05 1996-07-31 Ribosomal 60S subunit protein L26A; binds to 5.8S rRNA; non-essential even when paralog is also deleted; deletion has minimal affections on ribosome biosynthesis; homologous to mammalian ribosomal protein L26 and bacterial L24; RPL26A has a paralog, RPL26B, that arose from the whole genome duplication +S000037238 CDS YLR344W 12 819312 819330 W 2004-02-05 1996-07-31 +S000037239 CDS YLR344W 12 819778 820142 W 2004-02-05 1996-07-31 +S000037240 intron YLR344W 12 819331 819777 W 2004-02-05 1996-07-31 +S000004337 ORF Uncharacterized YLR345W bifunctional fructose-2,6-bisphosphate 2-phosphatase/6-phosphofructo-2-kinase chromosome 12 12 820511 822040 W 2004-02-05 1996-07-31 Similar to 6-phosphofructo-2-kinase enzymes; mRNA expression is repressed by the Rfx1p-Tup1p-Ssn6p repressor complex; YLR345W is not an essential gene +S000037321 CDS YLR345W 12 820511 822040 W 2004-02-05 1996-07-31 +S000004338 ORF Verified YLR346C CIS1 chromosome 12 12 822592 822287 C 2004-02-05 1996-07-31 Protein of unknown function found in mitochondria; expression is regulated by transcription factors involved in pleiotropic drug resistance, Pdr1p and Yrr1p; not an essential gene; YLR346C has a paralog, YGR035C, that arose from the whole genome duplication +S000037348 CDS YLR346C 12 822592 822287 C 2004-02-05 1996-07-31 +S000028681 ORF Dubious YLR347W-A chromosome 12 12 824789 824929 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified ORF KAP95/YLR347C +S000032552 CDS YLR347W-A 12 824789 824929 W 2011-02-03 2003-07-29 +S000004339 ORF Verified YLR347C KAP95 karyopherin beta|RSL1 chromosome 12 L000002781|L000002885 12 826413 823828 C 2011-02-03 1996-07-31 Karyopherin beta; forms a complex with Srp1p/Kap60p; interacts with nucleoporins to mediate nuclear import of NLS-containing cargo proteins via the nuclear pore complex; regulates PC biosynthesis; GDP-to-GTP exchange factor for Gsp1p +S000029972 CDS YLR347C 12 826413 823828 C 2011-02-03 1996-07-31 +S000004341 ORF Dubious YLR349W chromosome 12 12 827521 828027 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified ORF DIC1/YLR348C +S000030302 CDS YLR349W 12 827521 828027 W 2011-02-03 1996-07-31 +S000004340 ORF Verified YLR348C DIC1 chromosome 12 L000004327 12 827873 826977 C 2011-02-03 1996-07-31 Mitochondrial dicarboxylate carrier; integral membrane protein, catalyzes a dicarboxylate-phosphate exchange across the inner mitochondrial membrane, transports cytoplasmic dicarboxylates into the mitochondrial matrix +S000030051 CDS YLR348C 12 827873 826977 C 2011-02-03 1996-07-31 +S000004342 ORF Verified YLR350W ORM2 sphingolipid homeostasis protein ORM2 chromosome 12 12 828730 829380 W 2011-02-03 1996-07-31 Protein that mediates sphingolipid homeostasis; evolutionarily conserved, required for resistance to agents that induce unfolded protein response; Orm1p and Orm2p together control membrane biogenesis by coordinating lipid homeostasis with protein quality control; protein abundance increases in response to DNA replication stress; ORM2 has a paralog, ORM1, that arose from the whole genome duplication +S000032574 CDS YLR350W 12 828730 829380 W 2011-02-03 1996-07-31 +S000004343 ORF Verified YLR351C NIT3 putative hydrolase chromosome 12 L000004213 12 830364 829489 C 2011-02-03 1996-07-31 Nit protein; one of two proteins in S. cerevisiae with similarity to the Nit domain of NitFhit from fly and worm and to the mouse and human Nit protein which interacts with the Fhit tumor suppressor; nitrilase superfamily member +S000032619 CDS YLR351C 12 830364 829489 C 2011-02-03 1996-07-31 +S000004344 ORF Uncharacterized YLR352W chromosome 12 12 831116 833539 W 2011-02-03 1996-07-31 Putative protein of unknown function with similarity to F-box proteins; interacts with Skp1p and Cdc53p; YLR352W is not an essential gene +S000033355 CDS YLR352W 12 831116 833539 W 2011-02-03 1996-07-31 +S000004345 ORF Verified YLR353W BUD8 chromosome 12 L000002759 12 834352 836163 W 2011-02-03 1996-07-31 Protein involved in bud-site selection; diploid mutants display a unipolar budding pattern instead of the wild-type bipolar pattern, and bud at the proximal pole; BUD8 has a paralog, BUD9, that arose from the whole genome duplication +S000033422 CDS YLR353W 12 834352 836163 W 2011-02-03 1996-07-31 +S000004346 ORF Verified YLR354C TAL1 sedoheptulose-7-phosphate:D-glyceraldehyde-3-phosphate transaldolase TAL1 chromosome 12 L000002261 12 837357 836350 C 2011-02-03 1996-07-31 Transaldolase, enzyme in the non-oxidative pentose phosphate pathway; converts sedoheptulose 7-phosphate and glyceraldehyde 3-phosphate to erythrose 4-phosphate and fructose 6-phosphate; TAL1 has a paralog, NQM1, that arose from the whole genome duplication +S000033457 CDS YLR354C 12 837357 836350 C 2011-02-03 1996-07-31 +S000004347 ORF Verified YLR355C ILV5 ketol-acid reductoisomerase chromosome 12 L000000860 12 839253 838066 C 252 2011-02-03 1996-07-31 Acetohydroxyacid reductoisomerase and mtDNA binding protein; involved in branched-chain amino acid biosynthesis and maintenance of wild-type mitochondrial DNA; found in mitochondrial nucleoids +S000033517 CDS YLR355C 12 839253 838066 C 2011-02-03 1996-07-31 +S000004348 ORF Verified YLR356W ATG33 chromosome 12 12 840321 840914 W 2011-02-03 1996-07-31 Mitochondrial mitophagy-specific protein; required primarily for mitophagy induced at post-log phase; not required for other types of selective autophagy or macroautophagy; conserved within fungi, but not in higher eukaryotes; ATG33 has a paralog, SCM4, that arose from the whole genome duplication +S000034434 CDS YLR356W 12 840321 840914 W 2011-02-03 1996-07-31 +S000004349 ORF Verified YLR357W RSC2 chromosome 12 L000004025 12 841331 844000 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; required for expression of mid-late sporulation-specific genes; involved in telomere maintenance; RSC2 has a paralog, RSC1, that arose from the whole genome duplication +S000034579 CDS YLR357W 12 841331 844000 W 2011-02-03 1996-07-31 +S000004350 ORF Uncharacterized YLR358C chromosome 12 12 844050 843487 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; partially overlaps ORF RSC2/YLR357W +S000034588 CDS YLR358C 12 844050 843487 C 2011-02-03 1996-07-31 +S000004351 ORF Verified YLR359W ADE13 adenylosuccinase ADE13|BRA8|BRA1 chromosome 12 L000003938 12 844282 845730 W 2011-02-03 1996-07-31 Adenylosuccinate lyase; catalyzes two steps in the 'de novo' purine nucleotide biosynthetic pathway; expression is repressed by adenine and activated by Bas1p and Pho2p; mutations in human ortholog ADSL cause adenylosuccinase deficiency; human ADSL can complement yeast ADE13 null mutant +S000035650 CDS YLR359W 12 844282 845730 W 2011-02-03 1996-07-31 +S000004352 ORF Verified YLR360W VPS38 VPL17 chromosome 12 L000003511 12 846103 847422 W 2011-02-03 1996-07-31 Part of a Vps34p phosphatidylinositol 3-kinase complex; functions in carboxypeptidase Y (CPY) sorting; binds Vps30p and Vps34p to promote production of phosphatidylinositol 3-phosphate (PtdIns3P) which stimulates kinase activity; required for overflow degradation of misfolded proteins when ERAD is saturated +S000036679 CDS YLR360W 12 846103 847422 W 2011-02-03 1996-07-31 +S000004353 ORF Verified YLR361C DCR2 phosphoprotein phosphatase chromosome 12 12 849124 847388 C 2011-02-03 1996-07-31 Protein phosphatase; involved in downregulation of the unfolded protein response (UPR), at least in part through dephosphorylation of Ire1p; dosage-dependent positive regulator of the G1/S phase transition through control of the timing of START; physically interacts with, dephosphorylates and destabilizes Sic1p; SWAT-GFP and mCherry fusion proteins localize to the vacuole +S000036700 CDS YLR361C 12 849124 847388 C 2011-02-03 1996-07-31 +S000028845 ORF Uncharacterized YLR361C-A chromosome 12 12 849679 849383 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000034530 CDS YLR361C-A 12 849679 849383 C 2011-02-03 2003-07-29 +S000004354 ORF Verified YLR362W STE11 mitogen-activated protein kinase kinase kinase STE11 chromosome 12 L000002118 12 849866 852019 W 244 2011-02-03 1999-07-17|1996-07-31 Signal transducing MEK kinase; involved in pheromone response and pseudohyphal/invasive growth pathways where it phosphorylates Ste7p, and the high osmolarity response pathway, via phosphorylation of Pbs2p; regulated by Ste20p and Ste50p; protein abundance increases in response to DNA replication stress +S000036796 CDS YLR362W 12 849866 852019 W 2011-02-03 1999-07-17|1996-07-31 +S000004355 ORF Verified YLR363C NMD4 chromosome 12 L000002938 12 853151 852495 C 2011-02-03 1996-07-31 Protein that may be involved in nonsense-mediated mRNA decay; interacts with Nam7p, relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000036803 CDS YLR363C 12 853151 852495 C 2011-02-03 1996-07-31 +S000007620 ORF Verified YLR363W-A chromosome 12 12 853461 853718 W 2011-02-03 2001-02-26 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; relocalizes from nucleus to nucleolus upon DNA replication stress +S000037218 CDS YLR363W-A 12 853461 853718 W 2011-02-03 2001-02-26 +S000004356 ORF Verified YLR364W GRX8 glutathione-disulfide reductase GRX8 chromosome 12 12 854062 854391 W 2011-02-03 1996-07-31 Glutaredoxin that employs a dithiol mechanism of catalysis; monomeric; activity is low and null mutation does not affect sensitivity to oxidative stress; GFP-fusion protein localizes to the cytoplasm; expression strongly induced by arsenic +S000037591 CDS YLR364W 12 854062 854391 W 2011-02-03 1996-07-31 +S000004357 ORF Dubious YLR365W chromosome 12 12 855199 855531 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious gene YLR364C-A; YLR365W is not an essential gene +S000037651 CDS YLR365W 12 855199 855531 W 2011-02-03 1996-07-31 +S000004358 ORF Dubious YLR366W chromosome 12 12 855538 855843 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR364C-A +S000037710 CDS YLR366W 12 855538 855843 W 2011-02-03 1996-07-31 +S000028846 ORF Dubious YLR364C-A chromosome 12 12 855645 855523 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YLR366W +S000034531 CDS YLR364C-A 12 855645 855523 C 2011-02-03 2003-07-29 +S000004359 ORF Verified YLR367W RPS22B uS8|ribosomal 40S subunit protein S22B|S8|rp50|YS22|S24B|S22B chromosome 12 L000003030 12 856442 857317 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S15A and bacterial S8; RPS22B has a paralog, RPS22A, that arose from the whole genome duplication +S000037773 CDS YLR367W 12 856442 856574 W 2011-02-03 1996-07-31 +S000037774 CDS YLR367W 12 857058 857317 W 2011-02-03 1996-07-31 +S000122108 five_prime_UTR_intron YLR367W 12 855878 856434 W 2011-02-03 2007-04-04 +S000037775 intron YLR367W 12 856575 857057 W 2011-02-03 1996-07-31 +S000006504 snoRNA_gene snR44 SNR44 chromosome 12 L000003411 12 856710 856920 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U1056 and small subunit (SSU) rRNA at position U106 +S000030616 noncoding_exon snR44 12 856710 856920 W 2011-02-03 2000-05-19 +S000004360 ORF Verified YLR368W MDM30 SCF ubiquitin ligase complex subunit MDM30|DSG1 chromosome 12 12 857540 859336 W 2011-02-03 1996-07-31 F-box component of an SCF ubiquitin protein ligase complex; associates with and is required for Fzo1p ubiquitination and for mitochondria fusion; stimulates nuclear export of specific mRNAs; promotes ubiquitin-mediated degradation of Gal4p in some strains +S000030625 CDS YLR368W 12 857540 859336 W 2011-02-03 1996-07-31 +S000004361 ORF Verified YLR369W SSQ1 Hsp70 family ATPase SSQ1|SSH1|SSC2 chromosome 12 L000004573 12 859552 861525 W 2011-02-03 1996-07-31 Mitochondrial hsp70-type molecular chaperone; required for assembly of iron/sulfur clusters into proteins at a step after cluster synthesis, and for maturation of Yfh1p, which is a homolog of human frataxin implicated in Friedreich's ataxia +S000030742 CDS YLR369W 12 859552 861525 W 2011-02-03 1996-07-31 +S000004362 ORF Verified YLR370C ARC18 chromosome 12 L000004033 12 862254 861718 C 2011-02-03 1996-07-31 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches +S000031542 CDS YLR370C 12 862254 861718 C 2011-02-03 1996-07-31 +S000004363 ORF Verified YLR371W ROM2 Rho family guanine nucleotide exchange factor ROM2 chromosome 12 L000003182 12 862714 866784 W 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Rho1p and Rho2p; mutations are synthetically lethal with mutations in rom1, which also encodes a GEF; Rom2p localization to the bud surface is dependent on Ack1p; ROM2 has a paralog, ROM1, that arose from the whole genome duplication +S000031699 CDS YLR371W 12 862714 866784 W 2011-02-03 1996-07-31 +S000004364 ORF Verified YLR372W ELO3 SUR4|fatty acid elongase ELO3|APA1|VBM1|SRE1 chromosome 12 L000002245 12 867354 868391 W 2011-02-03 1996-07-31 Elongase; involved in fatty acid and sphingolipid biosynthesis; synthesizes very long chain 20-26-carbon fatty acids from C18-CoA primers; involved in regulation of sphingolipid biosynthesis; lethality of the elo2 elo3 double null mutation is functionally complemented by human ELOVL1 and weakly complemented by human ELOVL3 or ELOV7 +S000031801 CDS YLR372W 12 867354 868391 W 2011-02-03 1996-07-31 +S000004365 ORF Verified YLR373C VID22 chromosome 12 12 871367 868662 C 2011-02-03 1996-07-31 Glycosylated integral membrane protein localized to plasma membrane; plays a role in fructose-1,6-bisphosphatase (FBPase) degradation; involved in FBPase transport from the cytosol to Vid (vacuole import and degradation) vesicles; VID22 has a paralog, ENV11, that arose from the whole genome duplication +S000031859 CDS YLR373C 12 871367 868662 C 2011-02-03 1996-07-31 +S000004367 ORF Verified YLR375W STP3 chromosome 12 L000003371 12 871697 872728 W 2011-02-03 1996-07-31 Zinc-finger protein of unknown function; possibly involved in pre-tRNA splicing and in uptake of branched-chain amino acids; STP3 has a paralog, STP4, that arose from the whole genome duplication +S000032922 CDS YLR375W 12 871697 872728 W 2011-02-03 1996-07-31 +S000004366 ORF Dubious YLR374C chromosome 12 12 871842 871453 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF STP3/YLR375W +S000032763 CDS YLR374C 12 871842 871453 C 2011-02-03 1996-07-31 +S000004368 ORF Verified YLR376C PSY3 chromosome 12 12 873554 872826 C 2011-02-03 1996-07-31 Component of Shu complex (aka PCSS complex); Shu complex also includes Shu1, Csm2, Shu2, and promotes error-free DNA repair; promotes Rad51p filament assembly; Shu complex mediates inhibition of Srs2p function; Psy3p and Csm2p contain similar DNA-binding regions which work together to form a single DNA binding site; deletion of PSY3 results in a mutator phenotype; deletion increases sensitivity to anticancer drugs oxaliplatin and cisplatin but not mitomycin C +S000032974 CDS YLR376C 12 873554 872826 C 2011-02-03 1996-07-31 +S000004369 ORF Verified YLR377C FBP1 fructose 1,6-bisphosphate 1-phosphatase|ACN8 chromosome 12 L000000605 12 874792 873746 C 2011-02-03 1996-07-31 Fructose-1,6-bisphosphatase; key regulatory enzyme in the gluconeogenesis pathway, required for glucose metabolism; undergoes either proteasome-mediated or autophagy-mediated degradation depending on growth conditions; glucose starvation results in redistribution to the periplasm; interacts with Vid30p +S000033041 CDS YLR377C 12 874792 873746 C 2011-02-03 1996-07-31 +S000006633 tRNA_gene tK(UUU)L chromosome 12 L000003655 12 875376 875471 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034214 intron tK(UUU)L 12 875413 875435 W 2011-02-03 2000-05-19 +S000034212 noncoding_exon tK(UUU)L 12 875376 875412 W 2011-02-03 2000-05-19 +S000034213 noncoding_exon tK(UUU)L 12 875436 875471 W 2011-02-03 2000-05-19 +S000004371 ORF Dubious YLR379W chromosome 12 12 876922 877296 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential ORF SEC61/YLR378C +S000033877 CDS YLR379W 12 876922 877296 W 2011-02-03 1996-07-31 +S000004370 ORF Verified YLR378C SEC61 translocon subunit SEC61 chromosome 12 L000001852 12 877178 875736 C 2011-02-03 1996-07-31 Conserved ER protein translocation channel; essential subunit of Sec61 complex (Sec61p, Sbh1p, and Sss1p); forms channel for SRP-dependent protein import; with Sec63 complex allows SRP-independent protein import into ER; involved in posttranslational soluble protein import into the ER, ERAD of soluble substrates, and misfolded soluble protein export from the ER +S000033713 CDS YLR378C 12 877178 875736 C 2011-02-03 1996-07-31 +S000004372 ORF Verified YLR380W CSR1 SFH2 chromosome 12 S000007449 12 878282 879508 W 2004-02-05 1996-07-31 Phosphatidylinositol transfer protein; has a potential role in regulating lipid and fatty acid metabolism under heme-depleted conditions; interacts specifically with thioredoxin peroxidase; may have a role in oxidative stress resistance; protein abundance increases in response to DNA replication stress +S000034850 CDS YLR380W 12 878282 879508 W 2004-02-05 1996-07-31 +S000004373 ORF Verified YLR381W CTF3 CHL3 chromosome 12 L000000320 12 879723 881924 W 2004-02-05 1996-07-31 Outer kinetochore protein that forms a complex with Mcm16p and Mcm22p; may bind the kinetochore to spindle microtubules; required for the spindle assembly checkpoint; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-I and fission yeast mis6 +S000034982 CDS YLR381W 12 879723 881924 W 2004-02-05 1996-07-31 +S000004374 ORF Verified YLR382C NAM2 leucine--tRNA ligase NAM2|LeuRS|MSL1 chromosome 12 L000001229 12 884751 882067 C 325 2004-02-05 1996-07-31 Mitochondrial leucyl-tRNA synthetase; also has direct role in splicing of several mitochondrial group I introns; indirectly required for mitochondrial genome maintenance; human homolog LARS2 can complement yeast null mutant, and is implicated in Perrault syndrome +S000035844 CDS YLR382C 12 884751 882067 C 2004-02-05 1996-07-31 +S000004375 ORF Verified YLR383W SMC6 DNA repair protein SMC6|RHC18 chromosome 12 L000004130 12 885288 888632 W 2004-02-05 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; homologous to S. pombe rad18 +S000036068 CDS YLR383W 12 885288 888632 W 2004-02-05 1996-07-31 +S000118987 ARS ARS1238 ARSXII-889|ARS1227.5 chromosome 12 12 888570 888810 2006-10-02 2006-10-02 Autonomously Replicating Sequence +S000178143 ARS_consensus_sequence ARS1238 12 888741 888725 C 2014-11-18 2014-11-18 +S000004376 ORF Verified YLR384C IKI3 Elongator subunit IKI3|KTI7|TOT1|ELP1 chromosome 12 L000003563 12 892900 888851 C 2004-02-05 1996-07-31 Subunit of Elongator complex; Elongator is required for modification of wobble nucleosides in tRNA; maintains structural integrity of Elongator; homolog of human IKAP, mutations in which cause familial dysautonomia (FD) +S000036126 CDS YLR384C 12 892900 888851 C 2004-02-05 1996-07-31 +S000004377 ORF Verified YLR385C SWC7 AWS1 chromosome 12 12 893390 892992 C 2004-02-05 1996-07-31 Protein of unknown function; component of the Swr1p complex that incorporates Htz1p into chromatin +S000036905 CDS YLR385C 12 893390 892992 C 2004-02-05 1996-07-31 +S000004378 ORF Verified YLR386W VAC14 chromosome 12 12 893628 896270 W 2004-02-05 1996-07-31 Enzyme regulator; involved in synthesis of phosphatidylinositol 3,5-bisphosphate, in control of trafficking of some proteins to the vacuole lumen via the MVB, and in maintenance of vacuole size and acidity; binds negative (Fig4p) and positive (Fab1p) regulators of PtdIns(3,5)P(2) to control endolysosome function; similar to mammalian Vac14p +S000037006 CDS YLR386W 12 893628 896270 W 2004-02-05 1996-07-31 +S000004379 ORF Verified YLR387C REH1 chromosome 12 12 897672 896374 C 2004-02-05 1996-07-31 Cytoplasmic 60S subunit biogenesis factor; associates with pre-60S particles; similar to Rei1p and shares partially redundant function in cytoplasmic 60S subunit maturation; contains dispersed C2H2 zinc finger domains +S000037044 CDS YLR387C 12 897672 896374 C 2004-02-05 1996-07-31 +S000004380 ORF Verified YLR388W RPS29A uS14|ribosomal 40S subunit protein S29A|S14|YS29|S36A|S29A|YS29A chromosome 12 L000004482|S000029649|L000002549 12 898651 898821 W 2004-02-05 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S29 and bacterial S14; RPS29A has a paralog, RPS29B, that arose from the whole genome duplication +S000037830 CDS YLR388W 12 898651 898821 W 2004-02-05 1996-07-31 +S000122109 five_prime_UTR_intron YLR388W 12 898158 898645 W 2007-04-04 2007-04-04 +S000006500 snoRNA_gene snR34 SNR34 chromosome 12 L000001972 12 899180 899382 W 2007-05-10 2000-05-19|2007-05-10 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U2826 and U2880 +S000036763 noncoding_exon snR34 12 899180 899382 W 2007-05-10 2000-05-19|2007-05-10 +S000004381 ORF Verified YLR389C STE23 metalloendopeptidase chromosome 12 L000003081 12 902660 899577 C 2004-02-05 2004-02-05|1996-07-31 Metalloprotease; involved in N-terminal processing of pro-a-factor to mature form; expressed in both haploids and diploids; one of two yeast homologs of human insulin-degrading enzyme (hIDE); homolog Axl1p is also involved in processing of pro-a-factor +S000037885 CDS YLR389C 12 902660 899577 C 2004-02-05 2004-02-05|1996-07-31 +S000004382 ORF Verified YLR390W ECM19 chromosome 12 L000003894 12 903066 903404 W 2004-02-05 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000030926 CDS YLR390W 12 903066 903404 W 2004-02-05 1996-07-31 +S000006429 ORF Verified YLR390W-A CCW14 ICWP|YLR391W|SSR1|YLR391W-A chromosome 12 L000004428 12 903724 904440 W 2004-02-05 1997-07-30 Covalently linked cell wall glycoprotein; present in the inner layer of the cell wall +S000037801 CDS YLR390W-A 12 903724 904440 W 2004-02-05 1997-07-30 +S000004384 ORF Verified YLR392C ART10 chromosome 12 12 906305 904749 C 2004-02-05 1996-07-31 Protein of unknown function that contains 2 PY motifs; ubiquinated by Rsp5p; overexpression confers resistance to arsenite; green fluorescent protein (GFP)-fusion protein localizes it to the cytoplasm; non-essential gene +S000031038 CDS YLR392C 12 906305 904749 C 2004-02-05 1996-07-31 +S000004385 ORF Verified YLR393W ATP10 chromosome 12 L000000147 12 907079 907918 W 2004-02-05 1996-07-31 Assembly factor for the F0 sector of mitochondrial F1F0 ATP synthase; mitochondrial inner membrane protein; interacts genetically with ATP6 +S000032047 CDS YLR393W 12 907079 907918 W 2004-02-05 1996-07-31 +S000004386 ORF Verified YLR394W CST9 SUMO ligase CST9|ZIP3 chromosome 12 L000002996 12 907950 909398 W 2004-02-05 1996-07-31 SUMO E3 ligase; required for synaptonemal complex formation; localizes to synapsis initiation sites on meiotic chromosomes; associates with centromeres early in meiosis, then with chromosome axes and finally with double-strand break sites that are engaged in repair by crossovers; potential Cdc28p substrate +S000032126 CDS YLR394W 12 907950 909398 W 2004-02-05 1996-07-31 +S000004387 ORF Verified YLR395C COX8 cytochrome c oxidase subunit VIII chromosome 12 L000000392 12 909965 909729 C 2004-02-05 1996-07-31 Subunit VIII of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain +S000032155 CDS YLR395C 12 909965 909729 C 2004-02-05 1996-07-31 +S000004388 ORF Verified YLR396C VPS33 tethering complex ATP-binding subunit VPS33|VPT33|VPL25|VAM5|SLP1|PEP14|MET27|CLS14 chromosome 12 L000002475 12 912310 910235 C 2004-02-05 1996-07-31 ATP-binding protein that is a subunit of the HOPS and CORVET complexes; essential for protein sorting, vesicle docking, and fusion at the vacuole; binds to SNARE domains +S000032235 CDS YLR396C 12 912310 910235 C 2004-02-05 1996-07-31 +S000004389 ORF Verified YLR397C AFG2 AAA family ATPase AFG2|DRG1 chromosome 12 L000000056 12 914892 912550 C 2004-02-05 1996-07-31 ATPase of the CDC48/PAS1/SEC18 (AAA) family, forms a hexameric complex; is essential for pre-60S maturation and release of several preribosome maturation factors; releases Rlp24p from purified pre-60S particles in vitro; target of the ribosomal biosynthesis inhibitor diazaborine; may be involved in degradation of aberrant mRNAs +S000032306 CDS YLR397C 12 914892 912550 C 2004-02-05 1996-07-31 +S000004390 ORF Verified YLR398C SKI2 SKI complex RNA helicase subunit SKI2 chromosome 12 L000001903 12 919019 915156 C 2004-02-05 1996-07-31 Ski complex component and putative RNA helicase; mediates 3'-5' RNA degradation by the cytoplasmic exosome; null mutants have superkiller phenotype of increased viral dsRNAs and are synthetic lethal with mutations in 5'-3' mRNA decay; mutations in the human ortholog, SKIV2L, causes Syndromic diarrhea/Trichohepatoenteric (SD/THE) syndrome +S000033167 CDS YLR398C 12 919019 915156 C 2004-02-05 1996-07-31 +S000130185 ARS ARS1228 chromosome 12 12 919800 920994 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028682 ORF Dubious YLR399W-A chromosome 12 12 920869 920973 W 2004-02-05 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the characterized ORF BDF1/YLR399C +S000032553 CDS YLR399W-A 12 920869 920973 W 2004-02-05 2003-07-29 +S000004391 ORF Verified YLR399C BDF1 chromatin-binding protein BDF1 chromosome 12 L000000165 12 921596 919536 C 2004-02-05 1996-07-31 Protein involved in transcription initiation; functions at TATA-containing promoters; associates with the basal transcription factor TFIID; contains two bromodomains; corresponds to the C-terminal region of mammalian TAF1; redundant with Bdf2p; BDF1 has a paralog, BDF2, that arose from the whole genome duplication +S000033234 CDS YLR399C 12 921596 919536 C 2004-02-05 1996-07-31 +S000004392 ORF Dubious YLR400W chromosome 12 12 922063 922536 W 2004-02-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031650 CDS YLR400W 12 922063 922536 W 2004-02-05 1996-07-31 +S000004393 ORF Verified YLR401C DUS3 tRNA dihydrouridine synthase DUS3 chromosome 12 12 924448 922442 C 2006-01-09 1996-07-31|2006-01-09 Dihydrouridine synthase; member of a widespread family of conserved proteins including Smm1p, Dus1p, and Dus4p; contains a consensus oleate response element (ORE) in its promoter region; forms nuclear foci upon DNA replication stress +S000031698 CDS YLR401C 12 924448 922442 C 2006-01-09 1996-07-31|2006-01-09 +S000004394 ORF Dubious YLR402W chromosome 12 12 924889 925080 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032705 CDS YLR402W 12 924889 925080 W 2011-02-03 1996-07-31|2011-02-03 +S000004395 ORF Verified YLR403W SFP1 zinc-coordinating transcription factor SFP1|[ISP+]|[ISP(+)] chromosome 12 L000001872 12 925568 927619 W 2011-02-03 1996-07-31 Regulates transcription of ribosomal protein and biogenesis genes; regulates response to nutrients and stress, G2/M transitions during mitotic cell cycle and DNA-damage response, and modulates cell size; regulated by TORC1 and Mrs6p; sequence of zinc finger, ChIP localization data, and protein-binding microarray (PBM) data, and computational analyses suggest it binds DNA directly at highly active RP genes and indirectly through Rap1p at others; can form the [ISP+] prion +S000032808 CDS YLR403W 12 925568 927619 W 2011-02-03 1996-07-31 +S000004396 ORF Verified YLR404W SEI1 seipin|FLD1 chromosome 12 12 928743 929600 W 2011-02-03 1996-07-31 Seipin involved in lipid droplet (LD) assembly; controls lipid particle morphology, number, and size; promotes initiation of LD formation on the ER; ensures that LDs bud from the ER towards the cytosolic side of the membrane; forms a complex with Ldb16p at ER-LD contact sites, stabilizing these sites; null mutants have localized accumulation of phosphatidic acid (PA) marker proteins; BSCL2, human homolog implicated in congenital lipodystrophy, complements yeast null mutant +S000032908 CDS YLR404W 12 928743 929600 W 2011-02-03 1996-07-31 +S000004397 ORF Verified YLR405W DUS4 tRNA dihydrouridine synthase chromosome 12 12 929789 930892 W 2011-02-03 1996-07-31 Dihydrouridine synthase; member of a widespread family of conserved proteins including Smm1p, Dus1p, and Dus3p +S000034865 CDS YLR405W 12 929789 930892 W 2011-02-03 1996-07-31 +S000130186 ARS ARS1230 chromosome 12 12 930891 931064 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004398 ORF Verified YLR406C RPL31B eL31|ribosomal 60S subunit protein L31B|L31e|YL28|L34B|L31B chromosome 12 L000004463 12 931755 931065 C 2011-02-03 1999-07-17|1996-07-31 Ribosomal 60S subunit protein L31B; associates with karyopherin Sxm1p; loss of both Rpl31p and Rpl39p confers lethality; homologous to mammalian ribosomal protein L31, no bacterial homolog; RPL31B has a paralog, RPL31A, that arose from the whole genome duplication +S000034912 CDS YLR406C 12 931349 931065 C 2011-02-03 1999-07-17|1996-07-31 +S000034911 CDS YLR406C 12 931755 931699 C 2011-02-03 1999-07-17|1996-07-31 +S000034913 intron YLR406C 12 931698 931350 C 2011-02-03 1999-07-17|1996-07-31 +S000028683 ORF Uncharacterized YLR406C-A chromosome 12 12 932355 932206 C 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole +S000032554 CDS YLR406C-A 12 932355 932206 C 2011-02-03 2003-07-29 +S000004399 ORF Uncharacterized YLR407W chromosome 12 12 932967 933653 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; null mutant displays elongated buds and a large fraction of budded cells have only one nucleus +S000035114 CDS YLR407W 12 932967 933653 W 2011-02-03 1996-07-31|2011-02-03 +S000004400 ORF Verified YLR408C BLS1 BLB1 chromosome 12 12 934253 933885 C 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; green fluorescent protein (GFP)-fusion protein localizes to the endosome; YLR408C is not an essential gene +S000035167 CDS YLR408C 12 934253 933885 C 2011-02-03 1996-07-31 +S000004401 ORF Verified YLR409C UTP21 rRNA-processing protein UTP21 chromosome 12 12 937233 934414 C 2011-02-03 1996-07-31 Subunit of U3-containing 90S preribosome and SSU processome complexes; involved in production of 18S rRNA and assembly of small ribosomal subunit; synthetic defect with STI1 Hsp90 cochaperone; human homolog linked to glaucoma; Small Subunit processome is also known as SSU processome +S000035261 CDS YLR409C 12 937233 934414 C 2011-02-03 1996-07-31 +S000004402 ORF Verified YLR410W VIP1 inositol polyphosphate kinase VIP1 chromosome 12 L000004547 12 937541 940981 W 2011-02-03 1996-07-31 Inositol hexakisphosphate and inositol heptakisphosphate kinase; inositol heptakisphosphate (IP7) production is important for phosphate signaling; involved in cortical actin cytoskeleton function, and invasive pseudohyphal growth analogous to S. pombe asp1; inositol hexakisphosphate is also known as IP6 +S000035093 CDS YLR410W 12 937541 940981 W 2011-02-03 1996-07-31 +S000007093 long_terminal_repeat YLRWdelta22 chromosome 12 12 941192 941523 W 2011-02-03 2000-05-19 Ty2 LTR +S000007100 LTR_retrotransposon YLRWTy2-1 Ty2 chromosome 12 12 941192 947150 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007379 transposable_element_gene YLR410W-A gag protein chromosome 12 12 941483 942799 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034166 CDS YLR410W-A 12 941483 942799 W 2011-02-03 1999-07-17 +S000007380 transposable_element_gene YLR410W-B gag-pol fusion protein chromosome 12 12 941483 946796 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034173 CDS YLR410W-B 12 941483 942775 W 2011-02-03 1999-07-17 +S000034174 CDS YLR410W-B 12 942777 946796 W 2011-02-03 1999-07-17 +S000034175 plus_1_translational_frameshift YLR410W-B 12 942776 942776 W 2011-02-03 1999-07-17 +S000007094 long_terminal_repeat YLRWdelta23 chromosome 12 12 946819 947150 W 2011-02-03 2000-05-19 Ty2 LTR +S000004403 ORF Verified YLR411W CTR3 high-affinity Cu transporter CTR3 chromosome 12 L000003441 12 947253 947978 W 2011-02-03 1996-07-31 High-affinity copper transporter of the plasma membrane; acts as a trimer; gene is disrupted by a Ty2 transposon insertion in many laboratory strains of S. cerevisiae +S000035281 CDS YLR411W 12 947253 947978 W 2011-02-03 1996-07-31 +S000004404 ORF Verified YLR412W BER1 chromosome 12 S000116954 12 948368 949192 W 2011-02-03 1996-07-31 Protein involved in microtubule-related processes; GFP-fusion protein localizes to the cytoplasm and is induced in response to the DNA-damaging agent MMS; YLR412W is not an essential gene; similar to Arabidopsis SRR1 gene +S000036189 CDS YLR412W 12 948368 949192 W 2011-02-03 1996-07-31 +S000028572 ORF Uncharacterized YLR412C-A chromosome 12 12 950473 950267 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000031300 CDS YLR412C-A 12 950473 950267 C 2011-02-03 2003-07-29 +S000004405 ORF Verified YLR413W INA1 chromosome 12 12 951156 953183 W 2011-02-03 1996-07-31 Protein of unknown function; not an essential gene; YLR413W has a paralog, FAT3, that arose from the whole genome duplication +S000036302 CDS YLR413W 12 951156 953183 W 2011-02-03 1996-07-31 +S000004406 ORF Verified YLR414C PUN1 chromosome 12 12 954144 953353 C 2011-02-03 1996-07-31 Plasma membrane protein with a role in cell wall integrity; co-localizes with Sur7p in punctate membrane patches; null mutant displays decreased thermotolerance; transcription induced upon cell wall damage and metal ion stress +S000036366 CDS YLR414C 12 954144 953353 C 2011-02-03 1996-07-31 +S000004407 ORF Uncharacterized YLR415C chromosome 12 12 954597 954259 C 2011-02-03 1996-07-31 Putative protein of unknown function; YLR415C is not an essential gene +S000036440 CDS YLR415C 12 954597 954259 C 2011-02-03 1996-07-31 +S000004408 ORF Dubious YLR416C chromosome 12 12 954889 954491 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037090 CDS YLR416C 12 954889 954491 C 2011-02-03 1996-07-31 +S000004409 ORF Verified YLR417W VPS36 ESCRT-II subunit protein VPS36|VPL11|VAC3|GRD12 chromosome 12 L000002958 12 955010 956710 W 2011-02-03 1996-07-31 Component of the ESCRT-II complex; contains the GLUE (GRAM Like Ubiquitin binding in EAP45) domain which is involved in interactions with ESCRT-I and ubiquitin-dependent sorting of proteins into the endosome; plays a role in the formation of mutant huntingtin (Htt) aggregates in yeast +S000037244 CDS YLR417W 12 955010 956710 W 2011-02-03 1996-07-31 +S000004410 ORF Verified YLR418C CDC73 chromosome 12 L000002792 12 958095 956914 C 2011-02-03 1996-07-31 Component of the Paf1p complex; binds to and modulates the activity of RNA polymerases I and II; required for expression of certain genes, modification of some histones, and telomere maintenance; involved in transcription elongation as demonstrated by the G-less-based run-on (GLRO) assay; protein abundance increases in response to DNA replication stress; human homolog, parafibromin, is a tumour suppressor linked to breast, renal and gastric cancers +S000037277 CDS YLR418C 12 958095 956914 C 2011-02-03 1996-07-31 +S000004411 ORF Uncharacterized YLR419W putative helicase chromosome 12 12 958428 962735 W 2011-02-03 1996-07-31 Putative helicase with limited sequence similarity to human Rb protein; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YLR419W is not an essential gene +S000037392 CDS YLR419W 12 958428 962735 W 2011-02-03 1996-07-31 +S000006652 tRNA_gene tL(UAA)L chromosome 12 L000003658 12 963055 962972 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000037412 noncoding_exon tL(UAA)L 12 963055 962972 C 2011-02-03 2000-05-19 +S000007075 long_terminal_repeat YLRWdelta24 YLRCdelta24 chromosome 12 12 963230 963545 W 2011-02-03 2000-05-19|2007-04-03 Ty1 LTR +S000004412 ORF Verified YLR420W URA4 dihydroorotase chromosome 12 L000002433 12 963785 964879 W 304 2011-02-03 1996-07-31 Dihydroorotase; catalyzes the third enzymatic step in the de novo biosynthesis of pyrimidines, converting carbamoyl-L-aspartate into dihydroorotate +S000031350 CDS YLR420W 12 963785 964879 W 2011-02-03 1996-07-31 +S000004413 ORF Verified YLR421C RPN13 proteasome regulatory particle lid subunit RPN13 chromosome 12 12 965560 965090 C 2011-02-03 1996-07-31 Subunit of the 19S regulatory particle of the 26S proteasome lid; acts as a ubiquitin receptor for the proteasome; null mutants accumulate ubiquitinated Gcn4p and display decreased 26S proteasome stability; protein abundance increases in response to DNA replication stress +S000031396 CDS YLR421C 12 965560 965090 C 2011-02-03 1996-07-31 +S000004414 ORF Verified YLR422W DCK1 chromosome 12 12 965897 971695 W 2011-02-03 1996-07-31 Dock family protein (Dedicator Of CytoKinesis), homolog of human DOCK1; upstream component for regulation through the small GTPase Rho5p; may form a complex with Lmo1p that acts as a GEF for Rho5p; interacts with Ino4p; cytoplasmic protein that relocates to mitochondria under oxidative stress; implicated in mitophagy; not an essential protein; DOCK proteins act as guanine nucleotide exchange factors +S000032478 CDS YLR422W 12 965897 971695 W 2011-02-03 1996-07-31 +S000004415 ORF Verified YLR423C ATG17 protein kinase regulatory subunit ATG17|APG17 chromosome 12 12 973170 971917 C 2011-02-03 1996-07-31 Scaffold protein responsible for phagophore assembly site organization; regulatory subunit of an autophagy-specific complex that includes Atg1p and Atg13p; stimulates Atg1p kinase activity; human ortholog RB1CC1/FIP200 interacts with p53, which inhibits autophagy in human cells +S000032513 CDS YLR423C 12 973170 971917 C 2011-02-03 1996-07-31 +S000004416 ORF Verified YLR424W SPP382 mRNA splicing protein SPP382|NTR1|CCF8 chromosome 12 12 973395 975521 W 2011-02-03 1996-07-31 Essential protein that forms a dimer with Ntr2p; also forms a trimer, with Ntr2p and Prp43p, that is involved in spliceosome disassembly; found also in a multisubunit complex with the splicing factor Clf1p; suppressor of prp38-1 mutation +S000032667 CDS YLR424W 12 973395 975521 W 2011-02-03 1996-07-31 +S000006672 tRNA_gene tN(GUU)L chromosome 12 L000003657 12 976056 975983 C 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000030743 noncoding_exon tN(GUU)L 12 976056 975983 C 2011-02-03 2000-05-19 +S000007076 long_terminal_repeat YLRCdelta25 chromosome 12 12 976589 976258 C 2011-02-03 2000-05-19 Ty2 LTR +S000007082 LTR_retrotransposon YLRCTy2-2 Ty2 chromosome 12 12 981700 976258 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C +S000007077 long_terminal_repeat YLRCdelta26 chromosome 12 12 981700 981369 C 2011-02-03 2000-05-19 Ty2 LTR +S000004417 ORF Verified YLR425W TUS1 Rho family guanine nucleotide exchange factor TUS1|SOP10 chromosome 12 L000004619|L000004622 12 982894 986817 W 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) that modulates Rho1p activity; involved in the cell integrity signaling pathway; interacts with Rgl1p; localization of Tus1p to the bed neck is regulated by Rgl1p; multicopy suppressor of tor2 mutation and ypk1 ypk2 double mutation; potential Cdc28p substrate +S000033357 CDS YLR425W 12 982894 986817 W 2011-02-03 1996-07-31 +S000004418 ORF Uncharacterized YLR426W TDA5 chromosome 12 12 987062 988113 W 2011-02-03 1996-07-31 Putative protein of unknown function; detected in highly purified mitochondria in high-throughput studies; proposed to be involved in resistance to mechlorethamine and streptozotocin; null mutant sensitive to expression of top1-T722A allele +S000033424 CDS YLR426W 12 987062 987141 W 2011-02-03 1996-07-31 +S000033425 CDS YLR426W 12 987213 988113 W 2011-02-03 1996-07-31 +S000033426 intron YLR426W 12 987142 987212 W 2011-02-03 1996-07-31 +S000004419 ORF Verified YLR427W MAG2 chromosome 12 12 988428 990440 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; induced in response to mycotoxin patulin; ubiquitinated protein similar to the human ring finger motif protein RNF10; predicted to be involved in repair of alkylated DNA due to interaction with MAG1 +S000033509 CDS YLR427W 12 988428 990440 W 2011-02-03 1996-07-31 +S000004421 ORF Verified YLR429W CRN1 chromosome 12 L000004279 12 990777 992732 W 2011-02-03 1996-07-31 Coronin; cortical actin cytoskeletal component that associates with the Arp2p/Arp3p complex to regulate its activity; plays a role in regulation of actin patch assembly +S000034435 CDS YLR429W 12 990777 992732 W 2011-02-03 1996-07-31 +S000004420 ORF Dubious YLR428C chromosome 12 12 990961 990617 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CRN1 +S000033519 CDS YLR428C 12 990961 990617 C 2011-02-03 1996-07-31 +S000004422 ORF Verified YLR430W SEN1 putative DNA/RNA helicase SEN1|NRD2|CIK3 chromosome 12 L000001862 12 993434 1000129 W 2011-02-03 1996-07-31 ATP-dependent 5' to 3' RNA/DNA and DNA helicase; subunit of the exosome-associated Nrd1p complex that mediates 3' end formation of snRNAs, snoRNAs, CUTs and some mRNAs; helicase-independent role in transcription-coupled repair; coordinates replication with transcription, associating with moving forks and preventing errors that occur when forks encounter transcribed regions; homolog of Senataxin, implicated in Ataxia-Oculomotor Apraxia 2 and a dominant form of juvenile ALS +S000035580 CDS YLR430W 12 993434 1000129 W 2011-02-03 1996-07-31 +S000004423 ORF Verified YLR431C ATG23 CVT23 chromosome 12 12 1001703 1000342 C 2011-02-03 1996-07-31 Peripheral membrane protein required for autophagy and CVT; required for cytoplasm-to-vacuole targeting (Cvt) pathway and efficient macroautophagy; cycles between the phagophore assembly site (PAS) and non-PAS locations; forms a complex with Atg9p and Atg27p +S000035614 CDS YLR431C 12 1001703 1000342 C 2011-02-03 1996-07-31 +S000004424 ORF Verified YLR432W IMD3 IMP dehydrogenase IMD3 chromosome 12 12 1002557 1004128 W 2011-02-03 1996-07-31 Inosine monophosphate dehydrogenase; catalyzes the rate-limiting step in the de novo synthesis of GTP; member of a four-gene family in S. cerevisiae, constitutively expressed; IMD3 has a paralog, IMD4, that arose from the whole genome duplication +S000035774 CDS YLR432W 12 1002557 1004128 W 2011-02-03 1996-07-31 +S000004425 ORF Verified YLR433C CNA1 calcineurin catalytic subunit A|CMP1 chromosome 12 L000000370 12 1006008 1004347 C 2011-02-03 1996-07-31 Calcineurin A; one isoform (the other is Cmp2p) of the catalytic subunit of calcineurin, a Ca++/calmodulin-regulated protein phosphatase which regulates Crz1p (a stress-response transcription factor), the other calcineurin subunit is CNB1; regulates the function of Aly1p alpha-arrestin; CNA1 has a paralog, CMP2, that arose from the whole genome duplication +S000036640 CDS YLR433C 12 1006008 1004347 C 2011-02-03 1996-07-31 +S000004427 ORF Verified YLR435W TSR2 chromosome 12 12 1006378 1006995 W 2011-02-03 2003-09-22|1996-07-31 Protein with a potential role in pre-rRNA processing +S000036797 CDS YLR435W 12 1006378 1006995 W 2011-02-03 2003-09-22|1996-07-31 +S000004426 ORF Dubious YLR434C chromosome 12 12 1006408 1006025 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF TSR2/YLR435W +S000036704 CDS YLR434C 12 1006408 1006025 C 2011-02-03 1996-07-31 +S000118481 ARS ARS1232 ARSXII-1007 chromosome 12 12 1007186 1007475 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178144 ARS_consensus_sequence ARS1232 12 1007235 1007251 W 2014-11-18 2014-11-18 +S000004428 ORF Verified YLR436C ECM30 chromosome 12 L000003900 12 1011245 1007421 C 2011-02-03 1996-07-31 Protein of unknown function; may play a role in cell wall biosynthesis, mutants have abormal relative levels of mannose and glucose and have Gap1p sorting and transport defects; (GFP)-fusion protein localizes to the cytoplasm +S000036822 CDS YLR436C 12 1011245 1007421 C 2011-02-03 1996-07-31 +S000004429 ORF Verified YLR437C DIF1 chromosome 12 12 1012023 1011622 C 2011-02-03 1996-07-31 Protein that regulates nuclear localization of Rnr2p and Rnr4p; phosphorylated by Dun1p in response to DNA damage and degraded; N-terminal half shows similarity to S. pombe Spd1 protein; DIF1 has a paralog, SML1, that arose from the whole genome duplication +S000036873 CDS YLR437C 12 1012023 1011622 C 2011-02-03 1996-07-31 +S000004430 ORF Verified YLR438W CAR2 ornithine-oxo-acid transaminase|cargB chromosome 12 L000000217 12 1012501 1013775 W 330 2011-02-03 1996-07-31 L-ornithine transaminase (OTAse); catalyzes the second step of arginine degradation, expression is dually-regulated by allophanate induction and a specific arginine induction process; not nitrogen catabolite repression sensitive; protein abundance increases in response to DNA replication stress; human homolog OAT complements yeast null mutant +S000037652 CDS YLR438W 12 1012501 1013775 W 2011-02-03 1996-07-31 +S000028684 ORF Dubious YLR437C-A chromosome 12 12 1012686 1012459 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CAR2/YLR438W +S000032558 CDS YLR437C-A 12 1012686 1012459 C 2011-02-03 2003-07-29 +S000118482 ARS ARS1233 ARSXII-1014 chromosome 12 12 1013795 1014022 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178145 ARS_consensus_sequence ARS1233 12 1013861 1013845 C 2014-11-18 2014-11-18 +S000006434 ORF Verified YLR438C-A LSM3 U4/U6-U5 snRNP complex subunit LSM3|USS2|SMX4 chromosome 12 L000004507 12 1014178 1013909 C 2011-02-03 1999-07-17 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; protein increases in abundance and relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000037756 CDS YLR438C-A 12 1014178 1013909 C 2011-02-03 1999-07-17 +S000004431 ORF Verified YLR439W MRPL4 mitochondrial 54S ribosomal protein YmL4|YmL4 chromosome 12 L000002523|L000001160 12 1014491 1015450 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; homolog of prokaryotic L29 ribosomal protein; located at the ribosomal tunnel exit +S000037711 CDS YLR439W 12 1014491 1015450 W 2011-02-03 1996-07-31 +S000004432 ORF Verified YLR440C SEC39 DSL3 chromosome 12 12 1017697 1015568 C 2011-02-03 1996-07-31 Component of the Dsl1p tethering complex; this complex interacts with ER SNAREs Sec20p and Use1p; mediates Sey1p-independent homotypic ER fusion; proposed to be involved in protein secretion; localizes to the ER and nuclear envelope +S000030454 CDS YLR440C 12 1017697 1015568 C 2011-02-03 1996-07-31 +S000004433 ORF Verified YLR441C RPS1A eS1|ribosomal 40S subunit protein S1A|S1e|rp10A|S1A|RP10A chromosome 12 L000001664 12 1018908 1018141 C 2011-02-03 1996-07-31 Ribosomal protein 10 (rp10) of the small (40S) subunit; homologous to mammalian ribosomal protein S3A, no bacterial homolog; RPS1A has a paralog, RPS1B, that arose from the whole genome duplication +S000030594 CDS YLR441C 12 1018908 1018141 C 2011-02-03 1996-07-31 +S000004434 ORF Verified YLR442C SIR3 chromatin-silencing protein SIR3|STE8|MAR2|CMT1 chromosome 12 L000001896 12 1022251 1019315 C 337 2011-02-03 1996-07-31 Silencing protein; interacts with Sir2p, Sir4p, and histone H3/H4 tails to establish transcriptionally silent chromatin; required for spreading of silenced chromatin; recruited to chromatin through interaction with Rap1p; C-terminus assumes variant winged helix-turn-helix (wH) fold that mediates homodimerization, which is critical for holo-SIR complex loading; required for telomere hypercluster formation in quiescent yeast cells; has paralog ORC1 from whole genome duplication +S000030676 CDS YLR442C 12 1022251 1019315 C 2011-02-03 1996-07-31 +S000004435 ORF Verified YLR443W ECM7 ZRG15 chromosome 12 L000003882 12 1022625 1023971 W 2011-02-03 1996-07-31 Putative integral membrane protein with a role in calcium uptake; non-essential protein; mutant has cell wall defects and Ca+ uptake deficiencies; transcription is induced under conditions of zinc deficiency +S000031587 CDS YLR443W 12 1022625 1023971 W 2011-02-03 1996-07-31 +S000004436 ORF Dubious YLR444C chromosome 12 12 1023988 1023686 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031628 CDS YLR444C 12 1023988 1023686 C 2011-02-03 1996-07-31 +S000118483 ARS ARS1234 ARSXII-1024 chromosome 12 12 1024026 1024186 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000004437 ORF Verified YLR445W GMC2 chromosome 12 12 1024189 1024837 W 2011-02-03 2004-02-03|1996-07-31 Protein involved in meiotic crossing over; component of the Synaptonemal Complex (SC) along with Ecm11p; required for the efficient loading of the SC transverse filament protein, Zip1p; promotes SUMOylation of Ecm11p; mutants are delayed in meiotic nuclear division and are defective in synaptonemal complex assembly; transcription is regulated by Ume6p and induced in response to alpha factor +S000031804 CDS YLR445W 12 1024189 1024572 W 2011-02-03 2004-02-03|1996-07-31 +S000031805 CDS YLR445W 12 1024655 1024837 W 2011-02-03 2004-02-03 +S000031806 intron YLR445W 12 1024573 1024654 W 2011-02-03 2004-02-03 +S000004438 ORF Uncharacterized YLR446W hexokinase chromosome 12 12 1025214 1026515 W 2011-02-03 1996-07-31 Putative hexokinase; transcript is upregulated during sporulation and the unfolded protein response; YLR446W is not an essential gene +S000031911 CDS YLR446W 12 1025214 1026515 W 2011-02-03 1996-07-31 +S000004439 ORF Verified YLR447C VMA6 H(+)-transporting V0 sector ATPase subunit d chromosome 12 L000002461 12 1027893 1026856 C 2011-02-03 1996-07-31 Subunit d of the V0 integral membrane domain of V-ATPase; part of the electrogenic proton pump found in the endomembrane system; required for V1 domain assembly on the vacuolar membrane; the V0 integral membrane domain of vacuolar H+-ATPase (V-ATPase) has five subunits +S000032768 CDS YLR447C 12 1027893 1026856 C 2011-02-03 1996-07-31 +S000004440 ORF Verified YLR448W RPL6B eL6|ribosomal 60S subunit protein L6B|L6e|rp18|YL16|L6B|L17B chromosome 12 L000001714 12 1028854 1029768 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L6B; binds 5.8S rRNA; homologous to mammalian ribosomal protein L6, no bacterial homolog; RPL6B has a paralog, RPL6A, that arose from the whole genome duplication +S000032930 CDS YLR448W 12 1028854 1028868 W 2011-02-03 1996-07-31 +S000032931 CDS YLR448W 12 1029253 1029768 W 2011-02-03 1996-07-31 +S000032932 intron YLR448W 12 1028869 1029252 W 2011-02-03 1996-07-31 +S000004441 ORF Verified YLR449W FPR4 peptidylprolyl isomerase FPR4 chromosome 12 L000004352 12 1030834 1032012 W 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (PPIase); nuclear proline isomerase; affects expression of multiple genes via its role in nucleosome assembly; catalyzes isomerization of proline residues in histones H3 and H4, which affects lysine methylation of those histones; PPIase domain acts as a transcriptional repressor when tethered to DNA by lexA, and repressor activity is dependent on PPIase activity; contains a nucleoplasmin-like fold and can form pentamers +S000033009 CDS YLR449W 12 1030834 1032012 W 2011-02-03 1996-07-31 +S000004442 ORF Verified YLR450W HMG2 hydroxymethylglutaryl-CoA reductase (NADPH) HMG2 chromosome 12 L000000790 12 1032627 1035764 W 343 2011-02-03 1996-07-31 HMG-CoA reductase; converts HMG-CoA to mevalonate, a rate-limiting step in sterol biosynthesis; one of two isozymes; overproduction induces assembly of peripheral ER membrane arrays and short nuclear-associated membrane stacks; forms foci at nuclear periphery upon DNA replication stress; HMG2 has a paralog, HMG1, that arose from the whole genome duplication; human homolog HMGCR can complement yeast hmg2 mutant +S000033695 CDS YLR450W 12 1032627 1035764 W 2011-02-03 1996-07-31 +S000004443 ORF Verified YLR451W LEU3 leucine-responsive transcriptional regulator LEU3 chromosome 12 L000000944 12 1036093 1038753 W 346 2011-02-03 1996-07-31 Zinc-knuckle transcription factor, repressor and activator; regulates genes involved in branched chain amino acid biosynthesis and ammonia assimilation; acts as a repressor in leucine-replete conditions and as an activator in the presence of alpha-isopropylmalate, an intermediate in leucine biosynthesis that accumulates during leucine starvation +S000033823 CDS YLR451W 12 1036093 1038753 W 2011-02-03 1996-07-31 +S000004444 ORF Verified YLR452C SST2 GTPase-activating protein SST2 chromosome 12 L000002093 12 1041366 1039270 C 344 2011-02-03 1996-07-31 GTPase-activating protein for Gpa1p; regulates desensitization to alpha factor pheromone; also required to prevent receptor-independent signaling of the mating pathway; member of the RGS (regulator of G-protein signaling) family +S000034630 CDS YLR452C 12 1041366 1039270 C 2011-02-03 1996-07-31 +S000004445 ORF Verified YLR453C RIF2 chromosome 12 L000003513 12 1042986 1041799 C 2011-02-03 1996-07-31 Protein that binds to the Rap1p C-terminus; acts synergistically with Rif1p to help control telomere length and establish telomeric silencing; deletion results in telomere elongation; RIF2 has a paralog, ORC4, that arose from the whole genome duplication +S000034787 CDS YLR453C 12 1042986 1041799 C 2011-02-03 1996-07-31 +S000004446 ORF Uncharacterized YLR454W FMP27 chromosome 12 12 1043998 1051884 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000034985 CDS YLR454W 12 1043998 1051884 W 2011-02-03 1996-07-31 +S000006608 tRNA_gene tI(AAU)L2 chromosome 12 L000003656 12 1052144 1052071 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000033933 noncoding_exon tI(AAU)L2 12 1052144 1052071 C 2011-02-03 2000-05-19 +S000007078 long_terminal_repeat YLRCdelta27 chromosome 12 12 1052632 1052303 C 2011-02-03 2000-05-19 Ty1 LTR +S000004447 ORF Verified YLR455W PDP3 chromosome 12 12 1053629 1054543 W 2011-02-03 1996-07-31 Component of the NuA3b histone acetyltransferase complex; regulates interaction between NuA3b and H3K36me3 at the transcribed regions of genes; contains PWWP domain; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO); protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia +S000035931 CDS YLR455W 12 1053629 1054543 W 2011-02-03 1996-07-31 +S000004448 ORF Uncharacterized YLR456W pyridoxal 5'-phosphate synthase chromosome 12 12 1055070 1055684 W 2011-02-03 1996-07-31 Protein of unknown function; predicted to encode a pyridoxal 5'-phosphate synthase based on sequence similarity but purified protein does not possess this activity, nor does it bind flavin mononucleotide (FMN); null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2; YLR456W has a paralog, YPR172W, that arose from the whole genome duplication +S000036078 CDS YLR456W 12 1055070 1055684 W 2011-02-03 1996-07-31 +S000004450 ORF Dubious YLR458W chromosome 12 12 1056455 1056835 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of essential NBP1/YLR457C gene required for mitosis +S000036948 CDS YLR458W 12 1056455 1056835 W 2011-02-03 1996-07-31 +S000004449 ORF Verified YLR457C NBP1 chromosome 12 L000001234 12 1056771 1055812 C 2011-02-03 1996-07-31 Spindle pole body (SPB) component; required for the insertion of the duplication plaque into the nuclear membrane during SPB duplication; essential for bipolar spindle formation; component of the Mps2p-Bbp1p complex; NBP1 has a paralog, YPR174C, that arose from the whole genome duplication +S000036128 CDS YLR457C 12 1056771 1055812 C 2011-02-03 1996-07-31 +S000004451 ORF Verified YLR459W GAB1 GPI-anchor transamidase subunit GAB1|CDC91 chromosome 12 L000000290 12 1057334 1058518 W 2011-02-03 1996-07-31 GPI transamidase subunit; involved in attachment of glycosylphosphatidylinositol (GPI) anchors to proteins; may have a role in recognition of the attachment signal or of the lipid portion of GPI +S000037010 CDS YLR459W 12 1057334 1058518 W 2011-02-03 1996-07-31 +S000178146 ARS ARS1235 chromosome 12 12 1059439 1059923 2014-11-18 2014-11-18 Autonomously replicating sequence +S000178147 ARS_consensus_sequence ARS1235 12 1059718 1059702 C 2014-11-18 2014-11-18 +S000004452 ORF Uncharacterized YLR460C chromosome 12 12 1060887 1059757 C 2011-02-03 1996-07-31 Member of the quinone oxidoreductase family; up-regulated in response to the fungicide mancozeb; possibly up-regulated by iodine +S000037785 CDS YLR460C 12 1060887 1059757 C 2011-02-03 1996-07-31 +S000004453 ORF Verified YLR461W PAU4 seripauperin PAU4 chromosome 12 L000002731 12 1062919 1063281 W 2011-02-03 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme +S000029848 CDS YLR461W 12 1062919 1063281 W 2011-02-03 1996-07-31 +S000028982 telomere TEL12R chromosome 12 12 1064281 1078177 W 350 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XII; composed of an X element core sequence, X element combinatorial repeats, two distinct regions of telomeric repeats, and two long Y' elements +S000028984 telomeric_repeat TEL12R 12 1065031 1065155 W 2011-02-03 2003-09-09 Internal telomeric repeats on the right arm of Chromosome XII +S000028983 telomeric_repeat TEL12R 12 1071646 1071653 W 2011-02-03 2003-09-09 Internal telomeric repeats on the right arm of Chromosome XII +S000028985 X_element TEL12R 12 1064281 1064747 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028986 X_element_combinatorial_repeat TEL12R 12 1064748 1065030 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000028988 Y_prime_element TEL12R 12 1065156 1071645 W 2011-02-03 2003-09-09 Long telomeric Y' element on the right arm of Chromosome XII; more centromere-proximal of two long telomeric Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, 5 ORFs (YLR466W, YLR462W, YLR464W, YLR463C, YLR465C), and part of ORF YLR466C-B +S000028987 Y_prime_element TEL12R 12 1071654 1078177 W 2011-02-03 2003-09-09 Long telomeric Y' element on the right arm of Chromosome XII; more end-proximal of two long telomeric Y' elements; contains an ARS consensus sequence, a region of 36-bp repeats, ORFs YRF1-5/YLR467W and YLR467C-A, and part of ORF YLR466C-B +S000004454 ORF Uncharacterized YLR462W chromosome 12 12 1065956 1066564 W 2011-02-03 1996-07-31 Putative protein of unknown function with similarity to helicases; YLR462W is within the telomere on the right arm of chromosome XII +S000030870 CDS YLR462W 12 1065956 1066564 W 2011-02-03 1996-07-31 +S000004456 ORF Uncharacterized YLR464W chromosome 12 12 1066572 1067501 W 2011-02-03 1996-07-31 Putative protein of unknown function; intron is predicted but not detected experimentally; YLR464W overlaps the verified gene YRF1-4/YLR466W and two dubious ORFs YLR463C and YLR465C +S000031004 CDS YLR464W 12 1066572 1067084 W 2011-02-03 1996-07-31 +S000031005 CDS YLR464W 12 1067364 1067501 W 2011-02-03 1996-07-31 +S000031006 intron YLR464W 12 1067085 1067363 W 2011-02-03 1996-07-31 +S000004455 ORF Dubious YLR463C chromosome 12 12 1066816 1066265 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized ORFs YLR462W and YLR464W +S000030903 CDS YLR463C 12 1066816 1066265 C 2011-02-03 1996-07-31 +S000004458 ORF Verified YLR466W YRF1-4 Y' element ATP-dependent helicase protein 1 copy 4|YRF1 chromosome 12 12 1067087 1071235 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p +S000032053 CDS YLR466W 12 1067087 1071235 W 2011-02-03 1996-07-31 +S000004457 ORF Dubious YLR465C BSC3 chromosome 12 12 1067353 1067045 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 100% of YLR465C overlaps the uncharacterized ORF YLR464W and 86% of YLR465C overlaps the verified gene YRF1-4 +S000031044 CDS YLR465C 12 1067353 1067045 C 2011-02-03 1996-07-31 +S000028685 ORF Dubious YLR466C-A chromosome 12 12 1070869 1070387 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YRF1-4/YLR466W +S000032560 CDS YLR466C-A 12 1070869 1070387 C 2011-02-03 2003-07-29 +S000028686 ORF Dubious YLR466C-B chromosome 12 12 1071710 1071594 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032562 CDS YLR466C-B 12 1071710 1071594 C 2011-02-03 2003-07-29 +S000004459 ORF Verified YLR467W YRF1-5 Y' element ATP-dependent helicase protein 1 copy 5|YRF1 chromosome 12 12 1072508 1077898 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p +S000032127 CDS YLR467W 12 1072508 1077898 W 2011-02-03 1996-07-31 +S000028687 ORF Dubious YLR467C-A chromosome 12 12 1077532 1077050 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YRF1-4/YLR466W +S000032565 CDS YLR467C-A 12 1077532 1077050 C 2011-02-03 2003-07-29 +S000028690 ORF Dubious YML133W-B chromosome 13 13 827 1309 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized ORF YML133C +S000032587 CDS YML133W-B 13 827 1309 W 2003-07-29 2003-07-29 +S000028689 ORF Dubious YML133W-A chromosome 13 13 1610 2185 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized ORF YML133C +S000032568 CDS YML133W-A 13 1610 2185 W 2003-07-29 2003-07-29 +S000004602 ORF Uncharacterized YML133C Y' element ATP-dependent helicase chromosome 13 13 4684 461 C 1996-07-31 1996-07-31 Putative Y' element ATP-dependent helicase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YML133C contains an intron +S000033211 CDS YML133C 13 3791 461 C 1996-07-31 1996-07-31 +S000033210 CDS YML133C 13 4684 3891 C 1996-07-31 1996-07-31 +S000033212 intron YML133C 13 3890 3792 C 1996-07-31 1996-07-31 +S000028918 telomere TEL13L chromosome 13 13 6344 1 C -102 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XIII; composed of an X element core sequence, X element combinatorial repeats, a short region of telomeric repeats, a short Y' element, and a short terminal region of telomeric repeats +S000028919 telomeric_repeat TEL13L 13 51 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XIII +S000028920 telomeric_repeat TEL13L 13 5585 5538 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome XIII +S000028921 X_element TEL13L 13 6344 5875 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XIII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028922 X_element_combinatorial_repeat TEL13L 13 5874 5586 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XIII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000028923 Y_prime_element TEL13L 13 5537 52 C 2003-09-09 2003-09-09 Telomeric short Y' element on the left arm of Chromosome XIII; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YML133C, YML133W-A, YML133W-B) +S000004601 ORF Verified YML132W COS3 chromosome 13 L000004061 13 7244 8383 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000033185 CDS YML132W 13 7244 8383 W 1996-07-31 1996-07-31 +S000004600 ORF Verified YML131W chromosome 13 13 10198 11295 W 2011-02-03 1996-07-31 Protein of unknown function; similar to medium chain dehydrogenase/reductases; expression induced by stresses including osmotic shock, DNA damaging agents, and other chemicals; GFP-fusion protein localizes to the cytoplasm; protein abundance increases in response to DNA replication stress +S000033094 CDS YML131W 13 10198 11295 W 2011-02-03 1996-07-31 +S000004599 ORF Verified YML130C ERO1 ER oxidoreductin chromosome 13 L000004013 13 13174 11483 C 2011-02-03 1996-07-31 Thiol oxidase required for oxidative protein folding in the ER; essential for maintaining ER redox balance; feedback regulated via reduction and oxidation of regulatory bonds; reduced Pdi1p activates Ero1p by direct reduction of Ero1p regulatory bonds; depletion of thiol substrates and accumulation of oxidized Pdi1p results in inactivation of Ero1p by both Pdi1p-mediated oxidation and autonomous oxidation of Ero1p regulatory bonds; ero1-1 mutation complemented by human ERO1L +S000032133 CDS YML130C 13 13174 11483 C 2011-02-03 1996-07-31 +S000004598 ORF Verified YML129C COX14 chromosome 13 L000000398 13 14753 14541 C 2011-02-03 1996-07-31 Mitochondrial cytochrome c oxidase (complex IV) assembly factor; also involved in translational regulation of Cox1p and prevention of Cox1p aggregation before assembly; associates with complex IV assembly intermediates and complex III/complex IV supercomplexes; located in the mitochondrial membrane +S000031027 CDS YML129C 13 14753 14541 C 2011-02-03 1996-07-31 +S000004597 ORF Verified YML128C MSC1 chromosome 13 13 16676 15135 C 2011-02-03 1996-07-31 Protein of unknown function; mutant is defective in directing meiotic recombination events to homologous chromatids; the authentic, non-tagged protein is detected in highly purified mitochondria and is phosphorylated +S000030934 CDS YML128C 13 16676 15135 C 2011-02-03 1996-07-31 +S000004596 ORF Verified YML127W RSC9 chromosome 13 13 17064 18809 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; DNA-binding protein involved in the synthesis of rRNA and in transcriptional repression and activation of genes regulated by the Target of Rapamycin (TOR) pathway +S000030913 CDS YML127W 13 17064 18809 W 2011-02-03 1996-07-31 +S000004595 ORF Verified YML126C ERG13 hydroxymethylglutaryl-CoA synthase|HMGS chromosome 13 L000004090 13 20535 19060 C 2011-02-03 1996-07-31 3-hydroxy-3-methylglutaryl-CoA (HMG-CoA) synthase; catalyzes the formation of HMG-CoA from acetyl-CoA and acetoacetyl-CoA; involved in the second step in mevalonate biosynthesis +S000030789 CDS YML126C 13 20535 19060 C 2011-02-03 1996-07-31 +S000004594 ORF Verified YML125C PGA3 cytochrome-b5 reductase|NQR1 chromosome 13 13 21699 20761 C 2011-02-03 1996-07-31 Putative cytochrome b5 reductase, localized to the plasma membrane; may be involved in regulation of lifespan; required for maturation of Gas1p and Pho8p, proposed to be involved in protein trafficking; PGA3 has a paralog, AIM33, that arose from the whole genome duplication +S000037858 CDS YML125C 13 21699 20761 C 2011-02-03 1996-07-31 +S000004593 ORF Verified YML124C TUB3 alpha-tubulin TUB3 chromosome 13 L000002389 13 23683 22048 C -101 2011-02-03 1996-07-31 Alpha-tubulin; associates with beta-tubulin (Tub2p) to form tubulin dimer, which polymerizes to form microtubules; expressed at lower level than Tub1p; TUB3 has a paralog, TUB1, that arose from the whole genome duplication +S000037763 CDS YML124C 13 23360 22048 C 2011-02-03 1996-07-31 +S000037762 CDS YML124C 13 23683 23659 C 2011-02-03 1996-07-31 +S000037764 intron YML124C 13 23658 23361 C 2011-02-03 1996-07-31 +S000004592 ORF Verified YML123C PHO84 phosphate transporter PHO84|phoT chromosome 13 L000001430 13 25800 24037 C -100.5 2011-02-03 1996-07-31 High-affinity inorganic phosphate (Pi) transporter; also low-affinity manganese transporter; regulated by Pho4p and Spt7p; mutation confers resistance to arsenate; exit from the ER during maturation requires Pho86p; cells overexpressing Pho84p accumulate heavy metals but do not develop symptoms of metal toxicity +S000037701 CDS YML123C 13 25800 24037 C 2011-02-03 1996-07-31 +S000004591 ORF Uncharacterized YML122C chromosome 13 13 26418 26038 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YML122C is not an essential gene +S000036933 CDS YML122C 13 26418 26038 C 2011-02-03 1996-07-31 +S000004590 ORF Verified YML121W GTR1 Rag GTPase GTR1 chromosome 13 L000000742 13 26930 27862 W -99.6 1996-07-31 1996-07-31 Subunit of a TORC1-stimulating GTPase complex; subunit of the heterodimeric Gtr1-Gtr2 GTPase complex that stimulates TORC1 in response to amino acid stimulation; tethered to the vacuolar membrane as part of the EGOC, a complex required for sorting of Gap1p and microautophagy; involved in phosphate transport and telomeric chromatin silencing; activated by the the Iml1p (GAP) subunit of the SEACIT complex; similar to human RagA and RagB +S000036898 CDS YML121W 13 26930 27862 W 1996-07-31 1996-07-31 +S000004589 ORF Verified YML120C NDI1 NADH-ubiquinone reductase (H(+)-translocating) NDI1 chromosome 13 L000001239 13 29807 28266 C 1996-07-31 1996-07-31 NADH:ubiquinone oxidoreductase; transfers electrons from NADH to ubiquinone in respiratory chain but does not pump protons, in contrast to higher eukaryotic multisubunit respiratory complex I; upon apoptotic stress, is activated in mitochondria by N-terminal cleavage, then translocates to cytoplasm to induce apoptosis; homolog of human AIFM2; yeast NDI1 complements several phenotypes of human cell line with mutated MT-ND4, implicated in Leber hereditary optic neuropathy +S000036805 CDS YML120C 13 29807 28266 C 1996-07-31 1996-07-31 +S000004588 ORF Uncharacterized YML119W chromosome 13 13 30611 31684 W 1996-07-31 1996-07-31 Putative protein of unknown function; YML119W is not an essential gene; potential Cdc28p substrate +S000035884 CDS YML119W 13 30611 31684 W 1996-07-31 1996-07-31 +S000118365 ARS ARS1303 ARSXIII-32 chromosome 13 13 31766 31835 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000004587 ORF Verified YML118W NGL3 3'-5' poly(A) RNA exonuclease chromosome 13 13 32334 33851 W 1996-07-31 1996-07-31 3'-5' exonuclease specific for poly-A RNAs; has a domain similar to a magnesium-dependent endonuclease motif in mRNA deadenylase Ccr4p; similar to Ngl1p; NGL3 has a paralog, NGL2, that arose from the whole genome duplication +S000034970 CDS YML118W 13 32334 33851 W 1996-07-31 1996-07-31 +S000004585 ORF Verified YML117W NAB6 chromosome 13 13 34243 37647 W 1996-07-31 1996-07-31 Putative RNA-binding protein; associates with mRNAs encoding cell wall proteins in high-throughput studies; deletion mutants display increased sensitivity to some cell wall disrupting agents; expression negatively regulated by cAMP +S000034816 CDS YML117W 13 34243 37647 W 1996-07-31 1996-07-31 +S000004586 ORF Dubious YML116W-A YML117W-A chromosome 13 13 37472 37774 W 1996-07-31 1996-07-31 Putative protein of unknown function +S000031380 CDS YML116W-A 13 37472 37774 W 1996-07-31 1996-07-31 +S000004584 ORF Verified YML116W ATR1 borate transporter|SNQ1 chromosome 13 L000001956|L000002831 13 38196 39824 W 1996-07-31 1996-07-31 Multidrug efflux pump of the major facilitator superfamily; required for resistance to aminotriazole and 4-nitroquinoline-N-oxide; ATR1 has a paralog, YMR279C, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000034666 CDS YML116W 13 38196 39824 W 1996-07-31 1996-07-31 +S000130187 ARS ARS1304 chromosome 13 13 39824 40187 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000178150 ARS_consensus_sequence ARS1304 13 40149 40133 C 2014-11-18 2014-11-18 +S000004583 ORF Verified YML115C VAN1 LDB13|VRG8|VRG7 chromosome 13 L000002453 13 41794 40187 C 38 1996-07-31 1996-07-31 Component of the mannan polymerase I; complex contains Van1p and Mnn9p and is involved in the first steps of mannan synthesis; mutants are vanadate-resistant +S000033712 CDS YML115C 13 41794 40187 C 1996-07-31 1996-07-31 +S000004582 ORF Verified YML114C TAF8 TafII65|TAF65 chromosome 13 13 43575 42043 C 1996-07-31 1996-07-31 TFIID subunit (65 kDa); involved in RNA polymerase II transcription initiation +S000033619 CDS YML114C 13 43575 42043 C 1996-07-31 1996-07-31 +S000004581 ORF Verified YML113W DAT1 chromosome 13 L000000485 13 44045 44791 W 1996-07-31 1996-07-31 DNA binding protein that recognizes oligo(dA).oligo(dT) tracts; Arg side chain in its N-terminal pentad Gly-Arg-Lys-Pro-Gly repeat is required for DNA-binding; relocalizes to the cytosol in response to hypoxia; not essential for viability +S000033570 CDS YML113W 13 44045 44791 W 1996-07-31 1996-07-31 +S000004580 ORF Verified YML112W CTK3 chromosome 13 L000003012 13 45063 45953 W 1996-07-31 1996-07-31 Gamma subunit of C-terminal domain kinase I; CTDK-I phosphorylates RNA polymerase II subunit Rpo21p to affect transcription and pre-mRNA 3' end processing, and also phosphorylates ribosomal protein Rps2p to increase translational fidelity; protein abundance increases in response to DNA replication stress +S000032868 CDS YML112W 13 45063 45953 W 1996-07-31 1996-07-31 +S000004579 ORF Verified YML111W BUL2 ubiquitin-ubiquitin ligase BUL2 chromosome 13 L000004755 13 46942 49704 W 1996-07-31 1996-07-31 Component of the Rsp5p E3-ubiquitin ligase complex; involved in intracellular amino acid permease sorting, functions in heat shock element mediated gene expression, essential for growth in stress conditions; BUL2 has a paralog, BUL1, that arose from the whole genome duplication +S000032740 CDS YML111W 13 46942 49704 W 1996-07-31 1996-07-31 +S000004578 ORF Verified YML110C COQ5 2-hexaprenyl-6-methoxy-1,4-benzoquinone methyltransferase|DBI56 chromosome 13 L000003398 13 50954 50031 C 1996-07-31 1996-07-31 2-hexaprenyl-6-methoxy-1,4-benzoquinone methyltransferase; involved in ubiquinone (Coenzyme Q) biosynthesis; localizes to the matrix face of the mitochondrial inner membrane in a large complex with other ubiquinone biosynthetic enzymes; respiratory defect of the null mutant is partially complemented by human COQ5 +S000032570 CDS YML110C 13 50954 50031 C 1996-07-31 1996-07-31 +S000004577 ORF Verified YML109W ZDS2 CES4 chromosome 13 L000003287 13 51640 54468 W 1996-07-31 1996-07-31 Protein with a role in regulating Swe1p-dependent polarized growth; involved in maintenance of Cdc55p in the cytoplasm where it promotes mitotic entry; interacts with silencing proteins at the telomere; implicated in the mitotic exit network through regulation of Cdc14p localization; ZDS2 has a paralog, ZDS1, that arose from the whole genome duplication +S000031758 CDS YML109W 13 51640 54468 W 1996-07-31 1996-07-31 +S000004576 ORF Verified YML108W chromosome 13 13 54793 55110 W 1996-07-31 1996-07-31 Protein of unknown function; structure defines a new subfamily of the split beta-alpha-beta sandwiches; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YML108W is not an essential gene; relative distribution to the nucleus increases upon DNA replication stress +S000031668 CDS YML108W 13 54793 55110 W 1996-07-31 1996-07-31 +S000004575 ORF Verified YML107C PML39 chromosome 13 13 56269 55265 C 2003-09-22 2003-09-22|1996-07-31 Protein required for nuclear retention of unspliced pre-mRNAs; required along with Mlp1p and Pml1p; anchored to nuclear pore complex via Mlp1p and Mlp2p; found with the subset of nuclear pores farthest from the nucleolus; may interact with ribosomes +S000031517 CDS YML107C 13 56269 55265 C 2003-09-22 2003-09-22|1996-07-31 +S000004574 ORF Verified YML106W URA5 orotate phosphoribosyltransferase URA5|PYR5 chromosome 13 L000002434 13 56773 57453 W 1996-07-31 1996-07-31 Major orotate phosphoribosyltransferase (OPRTase) isozyme; catalyzes the fifth enzymatic step in de novo biosynthesis of pyrimidines, converting orotate into orotidine-5'-phosphate; URA5 has a paralog, URA10, that arose from the whole genome duplication +S000030709 CDS YML106W 13 56773 57453 W 1996-07-31 1996-07-31 +S000004573 ORF Verified YML105C SEC65 RNA-binding signal recognition particle subunit SEC65 chromosome 13 L000001855 13 58687 57866 C 1996-07-31 1996-07-31 Subunit of the signal recognition particle (SRP); involved in protein targeting to the ER; interacts with Srp54p; homolog of mammalian SRP19 +S000030552 CDS YML105C 13 58687 57866 C 1996-07-31 1996-07-31 +S000004572 ORF Verified YML104C MDM1 chromosome 13 L000001051 13 62322 58939 C 1996-07-31 1996-07-31 PtdIns-3-P binding protein that tethers the ER to vacuoles at NVJs; anchored in the ER membrane at nucleus-vacuole junctions and binds phosphatidylinositol 3-phosphate (PtdIns-3-P) in the vacuolar membrane via its Phox homology (PX) domain; expressed predominantly in late G1 to early S phase of the cell cycle; mutation affects nuclear and mitochondrial transmission to daughter buds; similar to 4 human genes, one of which (SNX14) is associated with neurological disease +S000030408 CDS YML104C 13 62322 58939 C 1996-07-31 1996-07-31 +S000004571 ORF Verified YML103C NUP188 chromosome 13 L000003099 13 67549 62582 C 1996-07-31 1996-07-31 Subunit of the inner ring of the nuclear pore complex (NPC); contributes to NPC organization and nucleocytoplasmic transport; homologous to human NUP188 +S000037631 CDS YML103C 13 67549 62582 C 1996-07-31 1996-07-31 +S000081376 snoRNA_gene snR85 SNR85 chromosome 13 13 67938 67768 C 2006-01-24 2006-01-24 H/ACA box small nucleolar RNA (snoRNA); predicted to guide pseudouridylation of small subunit (SSU) rRNA at position U1181 +S000114174 noncoding_exon snR85 13 67938 67768 C 2006-01-24 2006-01-24 +S000004570 ORF Verified YML102W CAC2 chromosome 13 L000003389 13 68294 69700 W 1996-07-31 1996-07-31 Subunit of chromatin assembly factor I (CAF-1), with Rlf2p and Msi1p; chromatin assembly by CAF-1 is important for multiple processes including silencing at telomeres, mating type loci, and rDNA; maintenance of kinetochore structure, deactivation of the DNA damage checkpoint after DNA repair, chromatin dynamics during transcription; and repression of divergent transcription; relocalizes to the cytosol in response to hypoxia +S000037576 CDS YML102W 13 68294 69700 W 1996-07-31 1996-07-31 +S000004569 ORF Dubious YML101C-A YML102C-A chromosome 13 13 69726 69409 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032439 CDS YML101C-A 13 69726 69409 C 1996-07-31 1996-07-31 +S000004568 ORF Verified YML101C CUE4 chromosome 13 13 70088 69735 C 1996-07-31 1996-07-31 Protein of unknown function; has a CUE domain that binds ubiquitin, which may facilitate intramolecular monoubiquitination; CUE4 has a paralog, CUE1, that arose from the whole genome duplication +S000037386 CDS YML101C 13 70088 69735 C 1996-07-31 1996-07-31 +S000028688 ORF Uncharacterized YML100W-A chromosome 13 13 70138 70311 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032567 CDS YML100W-A 13 70138 70311 W 2003-07-29 2003-07-29 +S000004566 ORF Verified YML100W TSL1 trehalose 6-phosphate synthase/phosphatase complex subunit chromosome 13 L000002361 13 70624 73920 W 1996-07-31 1996-07-31 Large subunit of trehalose 6-phosphate synthase/phosphatase complex; Tps1p-Tps2p complex converts uridine-5'-diphosphoglucose and glucose 6-phosphate to trehalose; contributes to survival to acute lethal heat stress; mutant has aneuploidy tolerance; protein abundance increases in response to DNA replication stress; TSL1 has a paralog, TPS3, that arose from the whole genome duplication +S000036726 CDS YML100W 13 70624 73920 W 1996-07-31 1996-07-31 +S000004567 ORF Dubious YML099W-A YML100W-A chromosome 13 13 74229 74558 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF ARG81/YML099C +S000037139 CDS YML099W-A 13 74229 74558 W 1996-07-31 1996-07-31 +S000004565 ORF Verified YML099C ARG81 ARGRII|ARGR2 chromosome 13 L000000114|L000000113 13 77040 74398 C -63 1996-07-31 1996-07-31 Zinc finger transcription factor involved in arginine-responsive genes; Zn(2)-Cys(6) binuclear cluster domain type; involved in the regulation of arginine-responsive genes; acts with Arg80p and Arg82p +S000032192 CDS YML099C 13 77040 74398 C 1996-07-31 1996-07-31 +S000004564 ORF Verified YML098W TAF13 TafII19|TAF19|FUN81 chromosome 13 L000000650 13 77267 77770 W -63 1996-07-31 1996-07-31 TFIID subunit (19 kDa); involved in RNA polymerase II transcription initiation, similar to histone H4 with atypical histone fold motif of Spt3-like transcription factors +S000032162 CDS YML098W 13 77267 77770 W 1996-07-31 1996-07-31 +S000004563 ORF Verified YML097C VPS9 guanine nucleotide exchange factor VPS9|VPT9|VPL31 chromosome 13 L000002659 13 79690 78335 C 1996-07-31 1996-07-31 Guanine nucleotide exchange factor (GEF) and ubiquitin receptor; involved in vesicle-mediated vacuolar transport, including Golgi-endosome trafficking and sorting through the multivesicular body (MVB); stimulates the intrinsic guanine nucleotide exchange activity of Rab family members (Vps21p/Ypt52p/Ypt53p); partially redundant with GEF MUK1; required for localization of the CORVET complex to endosomes; similar to mammalian ras inhibitors; contains a Ub-interacting CUE domain +S000031138 CDS YML097C 13 79690 78335 C 1996-07-31 1996-07-31 +S000004562 ORF Uncharacterized YML096W putative asparagine synthase chromosome 13 13 79909 81486 W 1996-07-31 1996-07-31 Putative protein with similarity to asparagine synthetases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YML096W is not an essential gene and partially overlaps the verified gene RAD10 +S000031103 CDS YML096W 13 79909 81486 W 1996-07-31 1996-07-31 +S000004560 ORF Verified YML095C RAD10 chromosome 13 L000001563 13 82113 81481 C 48 1996-07-31 1996-07-31 Single-stranded DNA endonuclease (with Rad1p); cleaves single-stranded DNA during nucleotide excision repair and double-strand break repair; subunit of Nucleotide Excision Repair Factor 1 (NEF1); homolog of human ERCC1 protein +S000030965 CDS YML095C 13 82113 81481 C 1996-07-31 1996-07-31 +S000004559 ORF Verified YML094W GIM5 PFD5 chromosome 13 L000004370 13 82275 82849 W 1996-07-31 1996-07-31 Subunit of the heterohexameric cochaperone prefoldin complex; prefoldin binds specifically to cytosolic chaperonin and transfers target proteins to it; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation +S000030920 CDS YML094W 13 82275 82290 W 1996-07-31 1996-07-31 +S000030921 CDS YML094W 13 82374 82849 W 1996-07-31 1996-07-31 +S000030922 intron YML094W 13 82291 82373 W 1996-07-31 1996-07-31 +S000004561 ORF Dubious YML094C-A YML095C-A chromosome 13 13 82620 82219 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene GIM5/YML094W; deletion confers sensitivity to GSAO +S000032030 CDS YML094C-A 13 82620 82219 C 1996-07-31 1996-07-31 +S000004558 ORF Verified YML093W UTP14 chromosome 13 13 83090 85789 W 1996-07-31 1996-07-31 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit +S000029918 CDS YML093W 13 83090 85789 W 1996-07-31 1996-07-31 +S000004557 ORF Verified YML092C PRE8 proteasome core particle subunit alpha 2 chromosome 13 L000002700 13 86739 85987 C 1996-07-31 1996-07-31 Alpha 2 subunit of the 20S proteasome +S000037849 CDS YML092C 13 86739 85987 C 1996-07-31 1996-07-31 +S000004556 ORF Verified YML091C RPM2 ribonuclease P chromosome 13 L000001743 13 90731 87123 C 1996-07-31 1996-07-31 Protein subunit of mitochondrial RNase P; has roles in nuclear transcription, cytoplasmic and mitochondrial RNA processing, and mitochondrial translation; distributed to mitochondria, cytoplasmic processing bodies, and the nucleus +S000036004 CDS YML091C 13 90731 87123 C 1996-07-31 1996-07-31 +S000004555 ORF Dubious YML090W chromosome 13 13 90744 91130 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YML089C; exhibits growth defect on a non-fermentable (respiratory) carbon source +S000035949 CDS YML090W 13 90744 91130 W 1996-07-31 1996-07-31 +S000004554 ORF Dubious YML089C chromosome 13 13 91409 91041 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; expression induced by calcium shortage +S000036274 CDS YML089C 13 91409 91041 C 1996-07-31 1996-07-31 +S000077071 ncRNA_gene ZOD1 ZOD1 chromosome 13 13 91970 92027 W 2014-11-18 2014-11-18 tDNA relic, ancient tDNA for tRNA-Ile; weakly transcribed by RNA polymerase III; located upstream of UFO1; associated with components of the Pol III machinery: Tfc4p, Brf1p, Bdp1, and Rpc34p +S000178148 noncoding_exon ZOD1 13 91970 92027 W 2014-11-18 2014-11-18 +S000004553 ORF Verified YML088W UFO1 SCF ubiquitin ligase complex subunit UFO1 chromosome 13 13 92235 94241 W 1996-07-31 1996-07-31 F-box receptor protein; subunit of the Skp1-Cdc53-F-box receptor (SCF) E3 ubiquitin ligase complex; binds to phosphorylated Ho endonuclease, allowing its ubiquitination by SCF and subsequent degradation +S000036233 CDS YML088W 13 92235 94241 W 1996-07-31 1996-07-31 +S000118366 ARS ARS1305 ARSXIII-94 chromosome 13 13 94217 94463 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000004552 ORF Verified YML087C AIM33 cytochrome-b5 reductase chromosome 13 13 95369 94431 C 1996-07-31 1996-07-31 Protein of unknown function, highly conserved across species; homolog of human CYB5R4; null mutant displays reduced frequency of mitochondrial genome loss; AIM33 has a paralog, PGA3, that arose from the whole genome duplication +S000036086 CDS YML087C 13 95369 94431 C 1996-07-31 1996-07-31 +S000004551 ORF Verified YML086C ALO1 D-arabinono-1,4-lactone oxidase chromosome 13 L000004264 13 97371 95791 C 1996-07-31 1996-07-31 D-Arabinono-1,4-lactone oxidase; catalyzes the final step in biosynthesis of dehydro-D-arabinono-1,4-lactone, which is protective against oxidative stress +S000036007 CDS YML086C 13 97371 95791 C 1996-07-31 1996-07-31 +S000004550 ORF Verified YML085C TUB1 alpha-tubulin TUB1 chromosome 13 L000002387 13 99400 97941 C -62 1996-07-31 1996-07-31 Alpha-tubulin; associates with beta-tubulin (Tub2p) to form tubulin dimer, which polymerizes to form microtubules; relative distribution to nuclear foci increases upon DNA replication stress; TUB1 has a paralog, TUB3, that arose from the whole genome duplication +S000035128 CDS YML085C 13 99259 97941 C 1996-07-31 1996-07-31 +S000035127 CDS YML085C 13 99400 99376 C 1996-07-31 1996-07-31 +S000035129 intron YML085C 13 99375 99260 C 1996-07-31 1996-07-31 +S000004549 ORF Dubious YML084W chromosome 13 13 99489 99797 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035047 CDS YML084W 13 99489 99797 W 1996-07-31 1996-07-31 +S000004548 ORF Verified YML083C chromosome 13 13 101050 99794 C 1996-07-31 1996-07-31 Protein of unknown function; transcriptionally regulated by Upc2p via an upstream sterol response element; strong increase in transcript abundance during anaerobic growth compared to aerobic growth; cells deleted for YML083C do not exhibit growth defects in anerobic or anaerobic conditions +S000034849 CDS YML083C 13 101050 99794 C 1996-07-31 1996-07-31 +S000004547 ORF Uncharacterized YML082W putative cystathionine gamma-synthase chromosome 13 13 101862 103811 W 1996-07-31 1996-07-31 Putative protein predicted to have carbon-sulfur lyase activity; transcriptionally regulated by Upc2p via an upstream sterol response element; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and the cytoplasm; not an essential gene; YML082W has a paralog, STR2, that arose from the whole genome duplication +S000034791 CDS YML082W 13 101862 103811 W 1996-07-31 1996-07-31 +S000007247 ORF Verified YML081C-A ATP18 F1F0 ATP synthase subunit i chromosome 13 L000004548 13 104162 103983 C 1997-07-17 1997-07-17 Subunit of the mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; termed subunit I or subunit j; does not correspond to known ATP synthase subunits in other organisms +S000032427 CDS YML081C-A 13 104162 103983 C 1997-07-17 1997-07-17 +S000004546 ORF Verified YML081W TDA9 AAF1 chromosome 13 13 104777 108532 W 1996-07-31 1996-07-31 Transcription factor that regulates acetate production; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; null mutant is sensitive to expression of the top1-T722A allele; not an essential gene; TDA9 has a paralog, RSF2, that arose from the whole genome duplication +S000033928 CDS YML081W 13 104777 108532 W 1996-07-31 1996-07-31 +S000004545 ORF Verified YML080W DUS1 tRNA dihydrouridine synthase chromosome 13 13 108806 110077 W 1996-07-31 1996-07-31 Dihydrouridine synthase; member of a widespread family of conserved proteins including Smm1p, Dus3p, and Dus4p; modifies pre-tRNA(Phe) at U17 +S000033787 CDS YML080W 13 108806 110077 W 1996-07-31 1996-07-31 +S000004544 ORF Uncharacterized YML079W chromosome 13 13 110247 110852 W 1996-07-31 1996-07-31 Non-essential protein of unknown function; has structural resemblance to plant storage and ligand binding proteins (canavalin, glycinin, auxin binding protein) and to some enzymes (epimerase, germin); localizes to the nucleus and cytoplasm +S000031763 CDS YML079W 13 110247 110852 W 1996-07-31 1996-07-31 +S000004543 ORF Verified YML078W CPR3 peptidylprolyl isomerase CPR3|CYP3 chromosome 13 L000000464|L000000402 13 111002 111550 W 1996-07-31 1996-07-31 Mitochondrial peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; involved in protein refolding after import into mitochondria +S000031645 CDS YML078W 13 111002 111550 W 1996-07-31 1996-07-31 +S000004542 ORF Verified YML077W BET5 TRAPP subunit BET5 chromosome 13 L000004608 13 111865 112344 W 1996-07-31 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factors for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); human homology TRAPPC1 complements yeast null mutant +S000031560 CDS YML077W 13 111865 112344 W 1996-07-31 1996-07-31 +S000004541 ORF Verified YML076C WAR1 chromosome 13 13 115347 112513 C 1996-07-31 1996-07-31 Homodimeric Zn2Cys6 zinc finger transcription factor; binds to a weak acid response element to induce transcription of PDR12 and FUN34, encoding an acid transporter and a putative ammonia transporter, respectively +S000030680 CDS YML076C 13 115347 112513 C 1996-07-31 1996-07-31 +S000004540 ORF Verified YML075C HMG1 hydroxymethylglutaryl-CoA reductase (NADPH) HMG1 chromosome 13 L000000789 13 118898 115734 C -50 1996-07-31 1996-07-31 HMG-CoA reductase; catalyzes conversion of HMG-CoA to mevalonate, which is a rate-limiting step in sterol biosynthesis; one of two isozymes; localizes to nuclear envelope; overproduction induces formation of karmellae; forms foci at nuclear periphery upon DNA replication stress; HMG1 has a paralog, HMG2, that arose from the whole genome duplication; human homolog HMGCR can complement yeast hmg1 mutant +S000030566 CDS YML075C 13 118898 115734 C 1996-07-31 1996-07-31 +S000004539 ORF Verified YML074C FPR3 peptidylprolyl isomerase FPR3|NPI46 chromosome 13 L000001268 13 121324 120089 C 1996-07-31 1996-07-31 Nucleolar peptidyl-prolyl cis-trans isomerase (PPIase); FK506 binding protein; affects expression of multiple genes via its role in nucleosome assembly; phosphorylated by casein kinase II (Cka1p-Cka2p-Ckb1p-Ckb2p) and dephosphorylated by Ptp1p; PPIase domain acts as a transcriptional repressor when tethered to DNA by lexA, and repressor activity is dependent on PPIase activity; FPR3 has a paralog, FPR4, that arose from the whole genome duplication +S000030502 CDS YML074C 13 121324 120089 C 1996-07-31 1996-07-31 +S000004538 ORF Verified YML073C RPL6A eL6|ribosomal 60S subunit protein L6A|L6e|rp18|YL16|L6A|L17A|YL16A chromosome 13 L000004165 13 124172 123227 C 1996-07-31 1996-07-31 Ribosomal 60S subunit protein L6A; N-terminally acetylated; binds 5.8S rRNA; homologous to mammalian ribosomal protein L6, no bacterial homolog; RPL6A has a paralog, RPL6B, that arose from the whole genome duplication +S000037684 CDS YML073C 13 123742 123227 C 1996-07-31 1996-07-31 +S000037683 CDS YML073C 13 124172 124158 C 1996-07-31 1996-07-31 +S000037685 intron YML073C 13 124157 123743 C 1996-07-31 1996-07-31 +S000004537 ORF Verified YML072C TCB3 chromosome 13 13 129367 124730 C 1996-07-31 1996-07-31 Cortical ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to the plasma membrane (PM) and regulate PM phosphatidylinositol-4-phosphate (PI4P) levels by controlling access of Sac1p phosphatase to its substrate PI4P in the PM; localized to the bud via specific mRNA transport; non-tagged protein detected in a phosphorylated state in mitochondria; C-termini of Tcb1p, Tcb2p and Tcb3p interact +S000037588 CDS YML072C 13 129367 124730 C 1996-07-31 1996-07-31 +S000004536 ORF Verified YML071C COG8 Golgi transport complex subunit COG8|DOR1 chromosome 13 13 131572 129749 C 1996-07-31 1996-07-31 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000037526 CDS YML071C 13 131572 129749 C 1996-07-31 1996-07-31 +S000006718 tRNA_gene tR(UCU)M2 chromosome 13 L000003686 13 131896 131825 C 2000-05-19 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000031505 noncoding_exon tR(UCU)M2 13 131896 131825 C 2000-05-19 2000-05-19 +S000007101 long_terminal_repeat YMLCdelta1 chromosome 13 13 132321 131989 C 2000-05-19 2000-05-19 Ty1 LTR +S000004535 ORF Verified YML070W DAK1 dihydroxyacetone kinase chromosome 13 L000004203 13 133475 135229 W 1996-07-31 1996-07-31 Dihydroxyacetone kinase; required for detoxification of dihydroxyacetone (DHA); involved in stress adaptation +S000037490 CDS YML070W 13 133475 135229 W 1996-07-31 1996-07-31 +S000004534 ORF Verified YML069W POB3 FACT complex subunit POB3 chromosome 13 L000003326 13 135500 137158 W 1996-07-31 1996-07-31 Subunit of the heterodimeric FACT complex (Spt16p-Pob3p); FACT associates with chromatin via interaction with Nhp6Ap and Nhp6Bp, and reorganizes nucleosomes to facilitate access to DNA by RNA and DNA polymerases; protein abundance increases in response to DNA replication stress +S000036481 CDS YML069W 13 135500 137158 W 1996-07-31 1996-07-31 +S000118367 ARS ARS1307 ARSXIII-137 chromosome 13 13 137300 137548 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178151 ARS_consensus_sequence ARS1307 13 137321 137337 W 2014-11-18 2014-11-18 +S000004533 ORF Verified YML068W ITT1 chromosome 13 13 137550 138944 W 1996-07-31 1996-07-31 Protein that modulates the efficiency of translation termination; interacts with translation release factors eRF1 (Sup45p) and eRF3 (Sup35p) in vitro, contains a zinc finger domain characteristic of the TRIAD class of proteins +S000036418 CDS YML068W 13 137550 138944 W 1996-07-31 1996-07-31 +S000004532 ORF Verified YML067C ERV41 chromosome 13 13 140214 139063 C 1996-07-31 1996-07-31 Protein localized to COPII-coated vesicles; forms a complex with Erv46p; involved in the membrane fusion stage of transport; has homology to human ERGIC2 (PTX1) protein +S000035439 CDS YML067C 13 140090 139063 C 1996-07-31 1996-07-31 +S000035438 CDS YML067C 13 140214 140184 C 1996-07-31 1996-07-31 +S000035440 intron YML067C 13 140183 140091 C 1996-07-31 1996-07-31 +S000004531 ORF Verified YML066C SMA2 chromosome 13 13 141533 140424 C 1996-07-31 1996-07-31 Meiosis-specific prospore membrane protein; required to produce bending force necessary for proper assembly of the prospore membrane during sporulation +S000035365 CDS YML066C 13 141533 140424 C 1996-07-31 1996-07-31 +S000004530 ORF Verified YML065W ORC1 origin recognition complex subunit 1 chromosome 13 L000003162 13 142210 144954 W 1996-07-31 1996-07-31 Largest subunit of the origin recognition complex; involved in directing DNA replication by binding to replication origins; also involved in transcriptional silencing; exhibits ATPase activity; ORC1 has a paralog, SIR3, that arose from the whole genome duplication +S000035334 CDS YML065W 13 142210 144954 W 1996-07-31 1996-07-31 +S000004529 ORF Verified YML064C TEM1 Ras family GTPase TEM1 chromosome 13 L000002282 13 145876 145139 C 1996-07-31 1996-07-31 GTP-binding protein of the Ras superfamily; involved in termination of M-phase; controls actomyosin and septin dynamics during cytokinesis +S000035202 CDS YML064C 13 145876 145139 C 1996-07-31 1996-07-31 +S000004528 ORF Verified YML063W RPS1B eS1|ribosomal 40S subunit protein S1B|S1e|rp10B|S1B|RP10B|PLC2 chromosome 13 L000001665 13 146482 147249 W 1996-07-31 1996-07-31 Ribosomal protein 10 (rp10) of the small (40S) subunit; homologous to mammalian ribosomal protein S3A, no bacterial homolog; RPS1B has a paralog, RPS1A, that arose from the whole genome duplication +S000035158 CDS YML063W 13 146482 147249 W 1996-07-31 1996-07-31 +S000004527 ORF Verified YML062C MFT1 MFT52 chromosome 13 L000001099 13 148683 147505 C 1996-07-31 1996-07-31 Subunit of the THO complex; THO is a nuclear complex comprised of Hpr1p, Mft1p, Rlr1p, and Thp2p, that is involved in transcription elongation and mitotic recombination; involved in telomere maintenance +S000034129 CDS YML062C 13 148683 147505 C 1996-07-31 1996-07-31 +S000004526 ORF Verified YML061C PIF1 DNA helicase PIF1|TST1 chromosome 13 L000001435 13 151532 148953 C 1996-07-31 1996-07-31 DNA helicase, potent G-quadruplex DNA binder/unwinder; possesses strand annealing activity; promotes DNA synthesis during break-induced replication; important for crossover recombination; translation from different start sites produces mitochondrial and nuclear forms; nuclear form is a catalytic inhibitor of telomerase; mitochondrial form involved in DNA repair and recombination; mutations affect Zn, Fe homeostasis; regulated by Rad53p-dependent phosphorylation in rho0 cells +S000034029 CDS YML061C 13 151532 148953 C 1996-07-31 1996-07-31 +S000004525 ORF Verified YML060W OGG1 8-oxoguanine glycosylase OGG1 chromosome 13 L000003339 13 151871 153001 W 1996-07-31 1996-07-31 Nuclear and mitochondrial glycosylase/lyase; specifically excises 7,8-dihydro-8-oxoguanine residues located opposite cytosine or thymine residues in DNA, repairs oxidative damage to mitochondrial DNA, contributes to UVA resistance +S000033997 CDS YML060W 13 151871 153001 W 1996-07-31 1996-07-31 +S000004524 ORF Verified YML059C NTE1 lysophospholipase chromosome 13 13 158258 153219 C 1996-07-31 1996-07-31 Serine esterase; homolog of human neuropathy target esterase (NTE); Nte1p-mediated phosphatidylcholine turnover influences transcription factor Opi1p localization, affecting transcriptional regulation of phospholipid biosynthesis genes +S000032143 CDS YML059C 13 158258 153219 C 1996-07-31 1996-07-31 +S000007472 ORF Verified YML058W-A HUG1 chromosome 13 L000004561 13 158760 158966 W 1998-11-10 1998-11-10 Ribonucleotide reductase inhibitor; intrinsically disordered protein that binds to and inhibits Rnr2p; involved in the Mec1p-mediated checkpoint pathway; transcription is induced by genotoxic stress and by activation of the Rad53p pathway; protein abundance increases in response to DNA replication stress +S000030950 CDS YML058W-A 13 158760 158966 W 1998-11-10 1998-11-10 +S000178152 ARS ARS1307.5 chromosome 13 13 158887 159277 2014-11-18 2014-11-18 Autonomously replicating sequence +S000178153 ARS_consensus_sequence ARS1307.5 13 159046 159062 W 2014-11-18 2014-11-18 +S000004523 ORF Verified YML058W SML1 ribonucleotide reductase inhibiting protein SML1 chromosome 13 L000004580 13 159383 159697 W 1996-07-31 1996-07-31 Ribonucleotide reductase inhibitor; involved in regulating dNTP production; regulated by Mec1p and Rad53p during DNA damage and S phase; SML1 has a paralog, DIF1, that arose from the whole genome duplication +S000032114 CDS YML058W 13 159383 159697 W 1996-07-31 1996-07-31 +S000004521 ORF Verified YML057W CMP2 calcineurin catalytic subunit A|CNA2 chromosome 13 L000000368 13 160180 161994 W 1996-07-31 1996-07-31 Calcineurin A; one isoform (the other is Cna1p) of the catalytic subunit of calcineurin, a Ca++/calmodulin-regulated protein phosphatase which regulates Crz1p (a stress-response transcription factor), the other calcineurin subunit is CNB1; regulates the function of Aly1p alpha-arrestin; CMP2 has a paralog, CNA1, that arose from the whole genome duplication +S000032034 CDS YML057W 13 160180 161994 W 1996-07-31 1996-07-31 +S000004522 ORF Dubious YML057C-A YML058C-A chromosome 13 13 160412 160023 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene CMP2/YML057W +S000036471 CDS YML057C-A 13 160412 160023 C 1996-07-31 1996-07-31 +S000006445 snoRNA_gene snR54 SNR54 chromosome 13 L000004523 13 163620 163535 C 2000-05-19 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A974 +S000030738 noncoding_exon snR54 13 163620 163535 C 2000-05-19 2000-05-19 +S000004520 ORF Verified YML056C IMD4 IMP dehydrogenase IMD4 chromosome 13 13 164176 162194 C 1996-07-31 1996-07-31 Inosine monophosphate dehydrogenase; catalyzes the rate-limiting step in the de novo synthesis of GTP; member of a four-gene family in S. cerevisiae, constitutively expressed; IMD4 has a paralog, IMD3, that arose from the whole genome duplication +S000031022 CDS YML056C 13 163308 162194 C 1996-07-31 1996-07-31 +S000031021 CDS YML056C 13 164176 163717 C 1996-07-31 1996-07-31 +S000031023 intron YML056C 13 163716 163309 C 1996-07-31 1996-07-31 +S000004519 ORF Verified YML055W SPC2 signal peptidase complex subunit SPC2|SPY1 chromosome 13 L000002874 13 164790 165326 W 1996-07-31 1996-07-31 Subunit of signal peptidase complex; complex catalyzes cleavage of N-terminal signal sequences of proteins targeted to the secretory pathway; homologous to mammalian SPC25; other members of the complex are Spc1p, Spc1p, and Sec11p +S000030975 CDS YML055W 13 164790 165326 W 1996-07-31 1996-07-31 +S000004518 ORF Verified YML054C CYB2 FCB2 chromosome 13 L000000447 13 167308 165533 C -30 1996-07-31 1996-07-31 Cytochrome b2 (L-lactate cytochrome-c oxidoreductase); component of the mitochondrial intermembrane space, required for lactate utilization; expression is repressed by glucose and anaerobic conditions +S000030874 CDS YML054C 13 167308 165533 C 1996-07-31 1996-07-31 +S000028573 ORF Uncharacterized YML054C-A chromosome 13 13 167781 167623 C 2003-07-29 2003-07-29 Putative protein of unknown function +S000031301 CDS YML054C-A 13 167781 167623 C 2003-07-29 2003-07-29 +S000007102 long_terminal_repeat YMLCdelta2 chromosome 13 13 168681 168349 C 2000-05-19 2000-05-19 Ty2 LTR +S000006783 tRNA_gene tY(GUA)M1 SUP5 chromosome 13 L000003666|L000002184 13 168795 168883 W -34 2000-05-19 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000032294 intron tY(GUA)M1 13 168834 168847 W 2000-05-19 2000-05-19 +S000032292 noncoding_exon tY(GUA)M1 13 168795 168833 W 2000-05-19 2000-05-19 +S000032293 noncoding_exon tY(GUA)M1 13 168848 168883 W 2000-05-19 2000-05-19 +S000004517 ORF Uncharacterized YML053C chromosome 13 13 169754 169116 C 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; overexpression causes a cell cycle delay or arrest; YML053C is not an essential gene +S000030788 CDS YML053C 13 169754 169116 C 1996-07-31 1996-07-31 +S000004516 ORF Verified YML052W SUR7 chromosome 13 L000004152 13 170402 171310 W 1996-07-31 1996-07-31 Plasma membrane protein, component of eisosomes; long-lived protein that remains stable in eisosomes of mother cells while other eisosome proteins, Pil1p and Lsp1p, turn over; may function to anchor the eisosome in place; sporulation and plasma membrane sphingolipid content are altered in mutants; localizes to furrow-like invaginations (MCC patches) +S000037898 CDS YML052W 13 170402 171310 W 1996-07-31 1996-07-31 +S000004515 ORF Verified YML051W GAL80 transcription regulator GAL80 chromosome 13 L000000665 13 171594 172901 W -33 1996-07-31 1996-07-31 Transcriptional regulator involved in the repression of GAL genes; involved in the repression of GAL genes in the absence of galactose; inhibits transcriptional activation by Gal4p; inhibition relieved by Gal3p or Gal1p binding +S000037805 CDS YML051W 13 171594 172901 W 1996-07-31 1996-07-31 +S000004514 ORF Verified YML050W AIM32 chromosome 13 13 173139 174074 W 1996-07-31 1996-07-31 Protein of unknown function; null mutant is viable and displays elevated frequency of mitochondrial genome loss +S000037724 CDS YML050W 13 173139 174074 W 1996-07-31 1996-07-31 +S000004513 ORF Verified YML049C RSE1 U2 snRNP complex subunit RSE1 chromosome 13 L000004030 13 178305 174220 C 1996-07-31 1996-07-31 Protein involved in pre-mRNA splicing; component of the pre-spliceosome; associates with U2 snRNA; involved in ER to Golgi transport +S000036229 CDS YML049C 13 178305 174220 C 1996-07-31 1996-07-31 +S000004511 ORF Verified YML048W GSF2 ECM6 chromosome 13 L000003209 13 178426 179637 W 1996-07-31 1996-07-31 Endoplasmic reticulum (ER) localized integral membrane protein; may promote secretion of certain hexose transporters, including Gal2p; involved in glucose-dependent repression +S000036176 CDS YML048W 13 178426 179637 W 1996-07-31 1996-07-31 +S000004512 ORF Dubious YML047W-A YML048W-A chromosome 13 13 179893 180258 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF PRM6/YML047C +S000031724 CDS YML047W-A 13 179893 180258 W 1996-07-31 1996-07-31 +S000004510 ORF Verified YML047C PRM6 pheromone-regulated K(+) transporter PRM6|KCH2 chromosome 13 13 181075 180017 C 1996-07-31 1996-07-31 Potassium transporter that mediates K+ influx; activates high-affinity Ca2+ influx system (HACS) during mating pheromone response; expression up-regulated in response to alpha factor; regulated by Ste12p during mating; localized to sites of polarized growth; member of a fungal-specific gene family; PRM6 has a paralog, KCH1, that arose from the whole genome duplication +S000035933 CDS YML047C 13 181075 180017 C 1996-07-31 1996-07-31 +S000004509 ORF Verified YML046W PRP39 chromosome 13 L000001511 13 181474 183363 W 1996-07-31 1996-07-31 U1 snRNP protein involved in splicing; contains multiple tetriatricopeptide repeats +S000035883 CDS YML046W 13 181474 183363 W 1996-07-31 1996-07-31 +S000118368 ARS ARS1308 ARSXIII-184 chromosome 13 13 183797 183887 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178154 ARS_consensus_sequence ARS1308 13 183874 183858 C 2014-11-18 2014-11-18 +S000006585 tRNA_gene tG(GCC)M chromosome 13 L000003685 13 183968 183898 C 2000-05-19 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000029832 noncoding_exon tG(GCC)M 13 183968 183898 C 2000-05-19 2000-05-19 +S000007103 long_terminal_repeat YMLWdelta3 chromosome 13 13 184170 184501 W 2000-05-19 2000-05-19 Ty1 LTR +S000007107 LTR_retrotransposon YMLWTy1-1 Ty1 chromosome 13 13 184170 190083 W 2000-05-19 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007381 transposable_element_gene YML045W-A gag protein chromosome 13 13 184461 185783 W 1996-07-31 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000036727 CDS YML045W-A 13 184461 185783 W 1996-07-31 1996-07-31 +S000004508 transposable_element_gene YML045W gag-pol fusion protein chromosome 13 13 184461 189729 W 1996-07-31 1999-07-17|1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034966 CDS YML045W 13 184461 185765 W 1999-07-17 1999-07-17|1996-07-31 +S000034967 CDS YML045W 13 185767 189729 W 1999-07-17 1999-07-17|1996-07-31 +S000034968 plus_1_translational_frameshift YML045W 13 185766 185766 W 1999-07-17 1999-07-17|1996-07-31 +S000007104 long_terminal_repeat YMLWdelta4 chromosome 13 13 189752 190083 W 2000-05-19 2000-05-19 Ty1 LTR +S000004507 ORF Verified YML043C RRN11 chromosome 13 L000004133 13 191767 190244 C 1996-07-31 1996-07-31 Component of the core factor (CF) rDNA transcription factor complex; CF is required for transcription of 35S rRNA genes by RNA polymerase I and is composed of Rrn6p, Rrn7p, and Rrn11p +S000033836 CDS YML043C 13 191767 190244 C 1996-07-31 1996-07-31 +S000004506 ORF Verified YML042W CAT2 carnitine O-acetyltransferase CAT2|YCAT chromosome 13 L000000218 13 192788 194800 W 1996-07-31 1996-07-31 Carnitine acetyl-CoA transferase; present in both mitochondria and peroxisomes; transfers activated acetyl groups to carnitine to form acetylcarnitine which can be shuttled across membranes +S000033788 CDS YML042W 13 192788 194800 W 1996-07-31 1996-07-31 +S000004505 ORF Verified YML041C VPS71 SWC6 chromosome 13 13 195755 194913 C 1996-07-31 1996-07-31 Nucleosome-binding component of the SWR1 complex; SWR1 exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; required for vacuolar protein sorting +S000033617 CDS YML041C 13 195755 194913 C 1996-07-31 1996-07-31 +S000006684 tRNA_gene tP(UGG)M SUF7 chromosome 13 L000002155|L000003684 13 196170 196068 C -32 2000-05-19 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons +S000036019 intron tP(UGG)M 13 196134 196104 C 2000-05-19 2000-05-19 +S000036018 noncoding_exon tP(UGG)M 13 196103 196068 C 2000-05-19 2000-05-19 +S000036017 noncoding_exon tP(UGG)M 13 196170 196135 C 2000-05-19 2000-05-19 +S000007105 long_terminal_repeat YMLWdelta5 chromosome 13 13 196332 196668 W 2000-05-19 2000-05-19 Ty1 LTR +S000007108 LTR_retrotransposon YMLWTy1-2 Ty1 chromosome 13 13 196332 202234 W 2000-05-19 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000004504 transposable_element_gene YML040W gag protein chromosome 13 13 196628 197950 W 1996-07-31 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000033569 CDS YML040W 13 196628 197950 W 1996-07-31 1996-07-31 +S000004503 transposable_element_gene YML039W gag-pol fusion protein chromosome 13 S000029016 13 196628 201896 W 1996-07-31 1999-07-17|1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032892 CDS YML039W 13 196628 197932 W 1999-07-17 1999-07-17|1996-07-31 +S000032893 CDS YML039W 13 197934 201896 W 1999-07-17 1999-07-17|1996-07-31 +S000032894 plus_1_translational_frameshift YML039W 13 197933 197933 W 1999-07-17 1999-07-17|1996-07-31 +S000007106 long_terminal_repeat YMLWdelta6 chromosome 13 13 201919 202234 W 2000-05-19 2000-05-19 Ty1 LTR +S000004502 ORF Verified YML038C YMD8 chromosome 13 13 204103 202775 C 1996-07-31 1996-07-31 Putative nucleotide sugar transporter; has similarity to Vrg4p +S000032731 CDS YML038C 13 204103 202775 C 1996-07-31 1996-07-31 +S000004501 ORF Uncharacterized YML037C chromosome 13 13 205408 204386 C 1996-07-31 1996-07-31 Putative protein of unknown function; has some characteristics of a transcriptional activator; may be a target of Dbf2p-Mob1p kinase; GFP-fusion protein co-localizes with clathrin-coated vesicles; YML037C is not an essential gene +S000031852 CDS YML037C 13 205408 204386 C 1996-07-31 1996-07-31 +S000004500 ORF Verified YML036W CGI121 chromosome 13 13 205642 206293 W 2007-07-10 1996-07-31|2007-07-10 Component of the EKC/KEOPS complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; Cgi121p is dispensable for tRNA modification; other complex members are Bud32p, Kae1p, Pcc1p, and Gon7p +S000031755 CDS YML036W 13 205642 206097 W 2007-07-10 1996-07-31|2007-07-10 +S000123281 CDS YML036W 13 206204 206293 W 2007-07-10 2007-07-10 +S000123280 intron YML036W 13 206098 206203 W 2007-07-10 2007-07-10 +S000004498 ORF Verified YML035C AMD1 AMP deaminase|AMD3 chromosome 13 L000000082|L000002678 13 208860 206428 C 1996-07-31 1996-07-31 AMP deaminase; tetrameric enzyme that catalyzes the deamination of AMP to form IMP and ammonia; thought to be involved in regulation of intracellular purine (adenine, guanine, and inosine) nucleotide pools +S000031615 CDS YML035C 13 208860 206428 C 1996-07-31 1996-07-31 +S000004497 ORF Verified YML034W SRC1 HEH1|YML033W chromosome 13 S000004496 13 209525 212155 W 1998-11-10 1998-11-10|1996-07-31 Inner nuclear membrane protein; highly enriched at telomeres and subtelomeric regions; functions in regulation of subtelomeric genes and is linked to TREX (transcription export) factors; SRC1 produces 2 splice variant proteins with different functions; alternative splicing of SRC1 pre-mRNA is promoted by Hub1p; mutant has aneuploidy tolerance; SEC1 has a paralog, HEH2, that arose from the whole genome duplication +S000031569 CDS YML034W 13 209525 211444 W 1998-11-10 1998-11-10|1996-07-31 +S000031570 CDS YML034W 13 211571 212155 W 1998-11-10 1998-11-10 +S000031571 intron YML034W 13 211445 211570 W 1998-11-10 1998-11-10 +S000004499 ORF Dubious YML034C-A YML035C-A chromosome 13 13 209826 209428 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SRC1/YML034W +S000031984 CDS YML034C-A 13 209826 209428 C 1996-07-31 1996-07-31 +S000004494 ORF Verified YML032C RAD52 recombinase RAD52 chromosome 13 L000001572 13 213930 212515 C -18 2003-01-07 2003-01-07|1996-07-31 Protein that stimulates strand exchange; stimulates strand exchange by facilitating Rad51p binding to single-stranded DNA; anneals complementary single-stranded DNA; involved in the repair of double-strand breaks in DNA during vegetative growth and meiosis and UV induced sister chromatid recombination +S000030550 CDS YML032C 13 213930 212515 C 2003-01-07 2003-01-07|1996-07-31 +S000004493 ORF Verified YML031W NDC1 chromosome 13 L000001237 13 214189 216156 W -18 1996-07-31 1996-07-31 Subunit of the transmembrane ring of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport, NPC biogenesis and spindle pole body duplication; homologous to human NDC1 +S000030507 CDS YML031W 13 214189 216156 W 1996-07-31 1996-07-31 +S000028809 ORF Dubious YML031C-A YML032C-A chromosome 13 S000004495 13 214421 214086 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF NDC1/YML031W +S000033595 CDS YML031C-A 13 214421 214086 C 2003-07-29 2003-07-29 +S000004492 ORF Verified YML030W RCF1 AIM31 chromosome 13 13 216435 216914 W 1996-07-31 1996-07-31 Cytochrome c oxidase subunit; required for assembly of the Complex III-Complex IV supercomplex, and for assembly of Cox13p and Rcf2p into cytochrome c oxidase; similar to Rcf2p, and either Rcf1p or Rcf2p is required for late-stage assembly of the Cox12p and Cox13p subunits and for cytochrome c oxidase activity; required for growth under hypoxic conditions; member of the hypoxia induced gene family; C. elegans and human orthologs are functional in yeast +S000030362 CDS YML030W 13 216435 216914 W 1996-07-31 1996-07-31 +S000004491 ORF Verified YML029W USA1 chromosome 13 L000003225 13 217362 219878 W 1996-07-31 1996-07-31 Scaffold subunit of the Hrd1p ubiquitin ligase; also promotes ligase oligomerization; involved in ER-associated protein degradation (ERAD); interacts with the U1 snRNP-specific protein, Snp1p +S000037625 CDS YML029W 13 217362 219878 W 1996-07-31 1996-07-31 +S000004490 ORF Verified YML028W TSA1 thioredoxin peroxidase TSA1|cTPxI|TPX1|ZRG14 chromosome 13 L000002365 13 220138 220728 W 1996-07-31 1996-07-31 Thioredoxin peroxidase; acts as both ribosome-associated and free cytoplasmic antioxidant; self-associates to form high-molecular weight chaperone complex under oxidative stress; chaperone activity essential for growth in zinc deficiency; required for telomere length maintenance; binds and modulates Cdc19p activity; protein abundance increases, forms cytoplasmic foci during DNA replication stress; TSA1 has a paralog, TSA2, that arose from the whole genome duplication +S000037561 CDS YML028W 13 220138 220728 W 1996-07-31 1996-07-31 +S000004489 ORF Verified YML027W YOX1 chromosome 13 L000002540 13 221406 222563 W 1996-07-31 1996-07-31 Homeobox transcriptional repressor; binds to Mcm1p and to early cell cycle boxes (ECBs) in the promoters of cell cycle-regulated genes expressed in M/G1 phase; expression is cell cycle-regulated; phosphorylated by Cdc28p; relocalizes from nucleus to cytoplasm upon DNA replication stress; YOX1 has a paralog, YHP1, that arose from the whole genome duplication +S000036828 CDS YML027W 13 221406 222563 W 1996-07-31 1996-07-31 +S000004488 ORF Verified YML026C RPS18B uS13|ribosomal 40S subunit protein S18B|S18B|S13 chromosome 13 L000004481 13 223828 222987 C 1996-07-31 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S18 and bacterial S13; RPS18B has a paralog, RPS18A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000036754 CDS YML026C 13 223380 222987 C 1996-07-31 1996-07-31 +S000036753 CDS YML026C 13 223828 223782 C 1996-07-31 1996-07-31 +S000036755 intron YML026C 13 223781 223381 C 1996-07-31 1996-07-31 +S000004487 ORF Verified YML025C YML6 mitochondrial 54S ribosomal protein YmL6 chromosome 13 13 225365 224406 C 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the large subunit; has similarity to E. coli L4 ribosomal protein and human mitoribosomal MRP-L4 protein; essential for viability, unlike most other mitoribosomal proteins +S000036690 CDS YML025C 13 225239 224406 C 1996-07-31 1996-07-31 +S000036689 CDS YML025C 13 225365 225339 C 1996-07-31 1996-07-31 +S000036691 intron YML025C 13 225338 225240 C 1996-07-31 1996-07-31 +S000004486 ORF Verified YML024W RPS17A eS17|ribosomal 40S subunit protein S17A|S17e|rp51A|S17A|RPL51A|RP51A chromosome 13 L000001740|L000004479|L000001669 13 225889 226697 W 1996-07-31 1996-07-31 Ribosomal protein 51 (rp51) of the small (40s) subunit; homologous to mammalian ribosomal protein S17, no bacterial homolog; RPS17A has a paralog, RPS17B, that arose from the whole genome duplication +S000036659 CDS YML024W 13 225889 225891 W 1996-07-31 1996-07-31 +S000036660 CDS YML024W 13 226290 226697 W 1996-07-31 1996-07-31 +S000036661 intron YML024W 13 225892 226289 W 1996-07-31 1996-07-31 +S000004485 ORF Verified YML023C NSE5 Smc5-Smc6 complex subunit NSE5 chromosome 13 13 228664 226994 C 1996-07-31 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair +S000035667 CDS YML023C 13 228664 226994 C 1996-07-31 1996-07-31 +S000004484 ORF Verified YML022W APT1 adenine phosphoribosyltransferase APT1 chromosome 13 L000002641 13 228937 229500 W 1996-07-31 1996-07-31 Adenine phosphoribosyltransferase; catalyzes the formation of AMP from adenine and 5-phosphoribosylpyrophosphate; involved in the salvage pathway of purine nucleotide biosynthesis; APT1 has a paralog, APT2, that arose from the whole genome duplication +S000035625 CDS YML022W 13 228937 229500 W 1996-07-31 1996-07-31 +S000004483 ORF Verified YML021C UNG1 uracil-DNA glycosylase chromosome 13 L000002428 13 230813 229734 C -16 1996-07-31 1996-07-31 Uracil-DNA glycosylase; required for repair of uracil in DNA formed by spontaneous cytosine deamination; efficiently excises uracil from single-stranded DNA in vivo; not required for strand-specific mismatch repair; cell-cycle regulated, expressed in late G1; localizes to mitochondria and nucleus +S000035496 CDS YML021C 13 230813 229734 C 1996-07-31 1996-07-31 +S000004482 ORF Uncharacterized YML020W chromosome 13 13 231149 233143 W 1996-07-31 1996-07-31 Putative protein of unknown function +S000034551 CDS YML020W 13 231149 233143 W 1996-07-31 1996-07-31 +S000004481 ORF Verified YML019W OST6 dolichyl-diphosphooligosaccharide--protein glycotransferase chromosome 13 L000004224 13 233457 234455 W 1996-07-31 1996-07-31 Subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins; similar to and partially functionally redundant with Ost3p +S000033544 CDS YML019W 13 233457 234455 W 1996-07-31 1996-07-31 +S000004480 ORF Verified YML018C chromosome 13 13 235952 234771 C 1996-07-31 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the membrane of the vacuole; physical interaction with Atg27p suggests a possible role in autophagy; YML018C is not an essential gene; relative distribution to the vacuolar membrane decreases upon DNA replication stress; YML018C has a paralog, THI74, that arose from the whole genome duplication +S000033433 CDS YML018C 13 235952 234771 C 1996-07-31 1996-07-31 +S000004479 ORF Verified YML017W PSP2 MRS15 chromosome 13 L000002882 13 236588 238731 W 2004-01-30 2004-01-30|1996-07-31|1999-07-17 Asn rich cytoplasmic protein that contains RGG motifs; high-copy suppressor of group II intron-splicing defects of a mutation in MRS2 and of a conditional mutation in POL1 (DNA polymerase alpha); possible role in mitochondrial mRNA splicing +S000033400 CDS YML017W 13 236588 236591 W 2004-01-30 2004-01-30|1999-07-17|1996-07-31 +S000033401 CDS YML017W 13 236954 238731 W 2004-01-30 2004-01-30 +S000033402 intron YML017W 13 236592 236953 W 2004-01-30 2004-01-30 +S000004478 ORF Verified YML016C PPZ1 salt homeostasis regulator chromosome 13 L000001478 13 241536 239458 C 1996-07-31 1996-07-31 Serine/threonine protein phosphatase Z, isoform of Ppz2p; involved in regulation of potassium transport, which affects osmotic stability, cell cycle progression, and halotolerance +S000032668 CDS YML016C 13 241536 239458 C 1996-07-31 1996-07-31 +S000004477 ORF Verified YML015C TAF11 TafII40|TAF40 chromosome 13 L000003461 13 243029 241989 C 1996-07-31 1996-07-31 TFIID subunit (40 kDa); involved in RNA polymerase II transcription initiation, similar to histone H3 with atypical histone fold motif of Spt3-like transcription factors +S000032578 CDS YML015C 13 243029 241989 C 1996-07-31 1996-07-31 +S000004476 ORF Verified YML014W TRM9 tRNA (carboxymethyluridine(34)-5-O)-methyltransferase|KTI1 chromosome 13 S000028426 13 243225 244064 W 1996-07-31 1996-07-31 tRNA methyltransferase; catalyzes modification of wobble bases in tRNA anticodons to 2, 5-methoxycarbonylmethyluridine and 5-methoxycarbonylmethyl-2-thiouridine; may act as part of a complex with Trm112p; deletion mutation increases translational infidelity, including amino acid misincorporation and -1 frameshifting, and also confers resistance to zymocin; null mutant displays activation of stress responses +S000032547 CDS YML014W 13 243225 244064 W 1996-07-31 1996-07-31 +S000004475 ORF Verified YML013W UBX2 SEL1 chromosome 13 13 244149 245903 W 1996-07-31 1996-07-31 Bridging factor involved in ER-associated protein degradation (ERAD); bridges the cytosolic Cdc48p-Npl1p-Ufd1p ATPase complex and the membrane associated Ssm4p and Hrd1p ubiquitin ligase complexes; contains a UBX (ubiquitin regulatory X) domain and a ubiquitin-associated (UBA) domain; redistributes from the ER to lipid droplets during the diauxic shift and stationary phase; required for the maintenance of lipid homeostasis +S000032448 CDS YML013W 13 244149 245903 W 1996-07-31 1996-07-31 +S000004474 ORF Dubious YML012C-A YML013C-A chromosome 13 13 245914 245537 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SEL1 +S000037094 CDS YML012C-A 13 245914 245537 C 1996-07-31 1996-07-31 +S000004473 ORF Verified YML012W ERV25 chromosome 13 L000004076 13 246116 246751 W 1996-07-31 1996-07-31 Member of the p24 family involved in ER to Golgi transport; role in misfolded protein quality control; forms a heterotrimeric complex with Erp1, Erp2p, and Emp24, +S000031434 CDS YML012W 13 246116 246751 W 1996-07-31 1996-07-31 +S000004472 ORF Verified YML011C RAD33 chromosome 13 13 247428 246895 C 1996-07-31 1996-07-31 Protein involved in nucleotide excision repair; green fluorescent protein (GFP)-fusion protein localizes to the nucleus +S000031265 CDS YML011C 13 247428 246895 C 1996-07-31 1996-07-31 +S000004470 ORF Verified YML010W SPT5 transcription elongation factor SPT5 chromosome 13 L000002031 13 247677 250868 W -5 1996-07-31 1996-07-31 Spt4p/5p (DSIF) transcription elongation factor complex subunit; the Spt4/5 complex binds to ssRNA in a sequence-specific manner, and in concert with RNAP I and II has multiple roles regulating transcriptional elongation, RNA processing, quality control, and transcription-coupled repair; interacts with DNA upstream of RNAPII and the non-template strand of the transcription bubble; Spt5p is the only transcription elongation factor conserved in all domains of life +S000031213 CDS YML010W 13 247677 250868 W 1996-07-31 1996-07-31 +S000004471 ORF Dubious YML009W-B YML010W-A chromosome 13 13 250435 250911 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion mutation confers an increase in Ty1 transposition +S000032788 CDS YML009W-B 13 250435 250911 W 1996-07-31 1996-07-31 +S000004469 ORF Dubious YML009C-A YML010W-B|YML010C-B chromosome 13 13 251001 250675 C 1997-07-01 1997-07-01 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORFs SPT5/YML010W and YML009W-B +S000031473 CDS YML009C-A 13 251001 250675 C 1997-07-01 1997-07-01 +S000004468 ORF Verified YML009C MRPL39 mitochondrial 54S ribosomal protein YmL39|YmL39 chromosome 13 L000002695 13 251516 251304 C 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000037268 CDS YML009C 13 251516 251304 C 1996-07-31 1996-07-31 +S000004467 ORF Verified YML008C ERG6 sterol 24-C-methyltransferase|VID1|SED6|LIS1|ISE1 chromosome 13 L000000572|S000029637|L000003110 13 252990 251839 C 2 1996-07-31 1996-07-31 Delta(24)-sterol C-methyltransferase; converts zymosterol to fecosterol in the ergosterol biosynthetic pathway by methylating position C-24; localized to lipid particles, the plasma membrane-associated endoplasmic reticulum, and the mitochondrial outer membrane +S000037178 CDS YML008C 13 252990 251839 C 1996-07-31 1996-07-31 +S000007621 ORF Uncharacterized YML007C-A chromosome 13 13 253272 253162 C 2001-02-26 2001-02-26 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria +S000037219 CDS YML007C-A 13 253272 253162 C 2001-02-26 2001-02-26 +S000004466 ORF Verified YML007W YAP1 PDR4|DNA-binding transcription factor YAP1|SNQ3|PAR1 chromosome 13 L000001364 13 253848 255800 W -8 1996-07-31 1996-07-31 Basic leucine zipper (bZIP) transcription factor; required for oxidative stress tolerance; activated by H2O2 through the multistep formation of disulfide bonds and transit from the cytoplasm to the nucleus; Yap1p is degraded in the nucleus after the oxidative stress has passed; mediates resistance to cadmium; relative distribution to the nucleus increases upon DNA replication stress; YAP1 has a paralog, CAD1, that arose from the whole genome duplication +S000037132 CDS YML007W 13 253848 255800 W 1996-07-31 1996-07-31 +S000004465 ORF Verified YML006C GIS4 chromosome 13 L000004864 13 258416 256092 C 1996-07-31 1996-07-31 CAAX box containing protein of unknown function; proposed to be involved in the RAS/cAMP signaling pathway +S000036417 CDS YML006C 13 258416 256092 C 1996-07-31 1996-07-31 +S000006729 tRNA_gene tS(AGA)M chromosome 13 L000003683 13 259239 259158 C 2000-05-19 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032411 noncoding_exon tS(AGA)M 13 259239 259158 C 2000-05-19 2000-05-19 +S000004464 ORF Verified YML005W TRM12 TYW2 chromosome 13 13 260221 261609 W 1996-07-31 1996-07-31 S-adenosylmethionine-dependent methyltransferase; required for wybutosine formation in phenylalanine-accepting tRNA; member of the seven beta-strand family +S000036385 CDS YML005W 13 260221 261609 W 1996-07-31 1996-07-31 +S000004463 ORF Verified YML004C GLO1 lactoylglutathione lyase GLO1 chromosome 13 L000000712 13 262685 261705 C 1996-07-31 1996-07-31 Monomeric glyoxalase I; catalyzes the detoxification of methylglyoxal (a by-product of glycolysis) via condensation with glutathione to produce S-D-lactoylglutathione; expression regulated by methylglyoxal levels and osmotic stress +S000036221 CDS YML004C 13 262685 261705 C 1996-07-31 1996-07-31 +S000118369 ARS ARS1309 ARSXIII-263 chromosome 13 13 263063 263296 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178155 ARS_consensus_sequence ARS1309 13 263126 263142 W 2014-11-18 2014-11-18 +S000004462 ORF Uncharacterized YML003W chromosome 13 13 263483 264355 W 1996-07-31 1996-07-31 Putative protein of unknown function +S000036178 CDS YML003W 13 263483 264355 W 1996-07-31 1996-07-31 +S000004461 ORF Uncharacterized YML002W chromosome 13 13 264541 266754 W 1996-07-31 1996-07-31 Putative protein of unknown function; expression induced by heat and by calcium shortage +S000035235 CDS YML002W 13 264541 266754 W 1996-07-31 1996-07-31 +S000004460 ORF Verified YML001W YPT7 Rab family GTPase YPT7|VAM4|AST4 chromosome 13 L000002544 13 267174 267800 W 1996-07-31 1996-07-31 Rab family GTPase; GTP-binding protein of the rab family; required for homotypic fusion event in vacuole inheritance, for endosome-endosome fusion; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs); interacts with the cargo selection/retromer complex for retrograde sorting; similar to mammalian Rab7 +S000035058 CDS YML001W 13 267174 267800 W 1996-07-31 1996-07-31 +S000006474 centromere CEN13 CEN13 chromosome 13 L000000306 13 268031 268149 W 0 2004-10-08 2000-05-19|2004-10-08 Chromosome XIII centromere +S000077278 centromere_DNA_Element_I CEN13 13 268031 268040 W 2004-10-05 2004-10-05 +S000077279 centromere_DNA_Element_II CEN13 13 268041 268124 W 2004-10-05 2004-10-05 +S000077280 centromere_DNA_Element_III CEN13 13 268125 268149 W 2004-10-05 2004-10-05 +S000004603 ORF Verified YMR001C CDC5 polo kinase CDC5|PKX2|MSD2 chromosome 13 L000000245 13 271136 269019 C -14 1996-07-31 1996-07-31 Polo-like kinase; controls targeting and activation of Rho1p at cell division site via Rho1p guanine nucleotide exchange factors; regulates Spc72p; also functions in adaptation to DNA damage during meiosis; regulates the shape of the nucleus and expansion of the nuclear envelope during mitosis; similar to Xenopus Plx1 and S. pombe Plo1p; human homologs PLK1, PLK3 can each complement yeast cdc5 thermosensitive mutants +S000031052 CDS YMR001C 13 271136 269019 C 1996-07-31 1996-07-31 +S000028691 ORF Uncharacterized YMR001C-A chromosome 13 13 271577 271347 C 2003-07-29 2003-07-29 Putative protein of unknown function +S000032590 CDS YMR001C-A 13 271577 271347 C 2003-07-29 2003-07-29 +S000004604 ORF Verified YMR002W MIX17 MIC17 chromosome 13 13 272193 272663 W 1996-07-31 1996-07-31 Mitochondrial intermembrane space protein; required for normal oxygen consumption; contains twin cysteine-x9-cysteine motifs; protein abundance increases in response to DNA replication stress +S000031255 CDS YMR002W 13 272193 272663 W 1996-07-31 1996-07-31 +S000004605 ORF Verified YMR003W AIM34 chromosome 13 13 273118 273714 W 1996-07-31 1996-07-31 Protein of unknown function; GFP-fusion protein localizes to the mitochondria; null mutant is viable and displays reduced frequency of mitochondrial genome loss +S000032255 CDS YMR003W 13 273118 273714 W 1996-07-31 1996-07-31 +S000004606 ORF Verified YMR004W MVP1 chromosome 13 L000001221 13 274017 275552 W 1996-07-31 1996-07-31 Protein required for sorting proteins to the vacuole; Mvp1p and Vps1p act in concert to promote membrane traffic to the vacuole; participates in transcription initiation and/or early elongation of specific genes; interacts with "foot domain" of RNA polymerase II; deletion results in abnormal CTD-Ser5 phosphorylation of RNA polymerase II at specific promoter regions; protein abundance increases in response to DNA replication stress +S000032360 CDS YMR004W 13 274017 275552 W 1996-07-31 1996-07-31 +S000004607 ORF Verified YMR005W TAF4 TafII48|MPT1|TSG2|TAF48 chromosome 13 L000001144 13 276045 277211 W 1996-07-31 1996-07-31 TFIID subunit (48 kDa); involved in RNA polymerase II transcription initiation; potential Cdc28p substrate +S000032443 CDS YMR005W 13 276045 277211 W 1996-07-31 1996-07-31 +S000004608 ORF Verified YMR006C PLB2 lysophospholipase chromosome 13 L000004866 13 279681 277561 C 1996-07-31 1996-07-31 Phospholipase B (lysophospholipase) involved in lipid metabolism; displays transacylase activity in vitro; overproduction confers resistance to lysophosphatidylcholine +S000032499 CDS YMR006C 13 279681 277561 C 1996-07-31 1996-07-31 +S000004609 ORF Uncharacterized YMR007W chromosome 13 13 279960 280340 W 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR007W is not an essential gene +S000034599 CDS YMR007W 13 279960 280340 W 1996-07-31 1996-07-31 +S000004610 ORF Verified YMR008C PLB1 lysophospholipase chromosome 13 L000001447 13 282584 280590 C 1996-07-31 1996-07-31 Phospholipase B (lysophospholipase) involved in lipid metabolism; required for efficient acyl chain remodeling of newly synthesized phosphatidylethanolamine-derived phosphatidylcholine; required for deacylation of phosphatidylcholine and phosphatidylethanolamine but not phosphatidylinositol; PLB1 has a paralog, PLB3, that arose from the whole genome duplication +S000034626 CDS YMR008C 13 282584 280590 C 1996-07-31 1996-07-31 +S000004611 ORF Verified YMR009W ADI1 acireductone dioxygenase (Ni2+-requiring) chromosome 13 13 284102 284641 W 2011-02-03 1996-07-31 Acireductone dioxygenease involved in methionine salvage pathway; transcribed as polycistronic mRNA with YMR010W and regulated post-transcriptionally by RNase III (Rnt1p) cleavage; ADI1 mRNA is induced in heat shock conditions; human ortholog ADI1 can complement yeast adi1 mutant +S000034714 CDS YMR009W 13 284102 284641 W 2011-02-03 1996-07-31 +S000004612 ORF Verified YMR010W ANY1 chromosome 13 13 285100 286317 W 2011-02-03 1996-07-31 Putative protein of unknown function; null allele suppresses the lethality of neo1 and dop1 null alleles, as well as the growth defect of a mon2 null allele, and the cold sensitivity of a drs2 null; proposed function as a phospholipid scramblase that reduces membrane asymmetry; PQ loop family member; localizes to the cytoplasm and endoplasmic reticulum in HTP studies; non-essential gene +S000034268 CDS YMR010W 13 285100 286317 W 2011-02-03 1996-07-31 +S000118370 ARS ARS1310 ARSXIII-287 chromosome 13 13 286835 286951 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000004613 ORF Verified YMR011W HXT2 hexose transporter HXT2 chromosome 13 L000000836 13 288079 289704 W 2011-02-03 1996-07-31 High-affinity glucose transporter of the major facilitator superfamily; expression is induced by low levels of glucose and repressed by high levels of glucose +S000034391 CDS YMR011W 13 288079 289704 W 2011-02-03 1996-07-31 +S000007117 long_terminal_repeat YMRCtau1 chromosome 13 13 290224 290049 C 2011-02-03 2000-05-19 Ty4 LTR +S000006560 tRNA_gene tE(UUC)M chromosome 13 L000003667 13 290801 290872 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000036015 noncoding_exon tE(UUC)M 13 290801 290872 W 2011-02-03 2000-05-19 +S000004614 ORF Verified YMR012W CLU1 translation initiation factor 3 subunit CLU1|TIF31 chromosome 13 L000003531 13 291134 294967 W 2011-02-03 1996-07-31 Subunit of the eukaryotic translation initiation factor 3 (eIF3); component of unknown function; deletion causes defects in mitochondrial organization but not in growth or translation initiation; can rescue cytokinesis and mitochondrial organization defects of the Dictyostelium cluA- mutant; eIF3 is also involved in programmed stop codon readthrough +S000035421 CDS YMR012W 13 291134 294967 W 2011-02-03 1996-07-31 +S000028847 ORF Dubious YMR013C-A chromosome 13 13 296620 296471 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF SEC59/YML013C +S000034532 CDS YMR013C-A 13 296620 296471 C 2011-02-03 2003-07-29 +S000004615 ORF Verified YMR013C SEC59 dolichol kinase chromosome 13 L000001851 13 296738 295179 C 3 2011-02-03 1996-07-31 Dolichol kinase; catalyzes the terminal step in dolichyl monophosphate (Dol-P) biosynthesis; required for viability and for normal rates of lipid intermediate synthesis and protein N-glycosylation +S000035477 CDS YMR013C 13 296738 295179 C 2011-02-03 1996-07-31 +S000007312 snoRNA_gene snR78 SNR78 Z8 chromosome 13 L000004806 13 297278 297364 W 2011-02-03 2000-05-19|2007-05-08 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2421 +S000031835 noncoding_exon snR78 13 297278 297364 W 2011-02-03 2000-05-19|2007-05-08 +S000007311 snoRNA_gene snR77 SNR77 Z7 chromosome 13 L000004805 13 297506 297593 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position U578 +S000031791 noncoding_exon snR77 13 297506 297593 W 2011-02-03 2000-05-19 +S000007310 snoRNA_gene snR76 SNR76 Z6 chromosome 13 L000004804 13 297725 297833 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2197 +S000031789 noncoding_exon snR76 13 297725 297833 W 2011-02-03 2000-05-19 +S000007309 snoRNA_gene snR75 SNR75 Z5 chromosome 13 L000004803 13 297918 298006 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G2288 +S000031787 noncoding_exon snR75 13 297918 298006 W 2011-02-03 2000-05-19 +S000007308 snoRNA_gene snR74 SNR74 Z4 chromosome 13 L000004802 13 298138 298225 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A28 +S000031786 noncoding_exon snR74 13 298138 298225 W 2011-02-03 2000-05-19 +S000007307 snoRNA_gene snR73 SNR73 Z3 chromosome 13 L000004801 13 298307 298412 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C2959 +S000031785 noncoding_exon snR73 13 298307 298412 W 2011-02-03 2000-05-19 +S000007622 ORF Dubious YMR013W-A chromosome 13 13 298311 298391 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the characterized snoRNA gene snR73 +S000037220 CDS YMR013W-A 13 298311 298391 W 2011-02-03 2001-02-26 +S000007306 snoRNA_gene snR72 SNR72 Z2 chromosome 13 L000004800 13 298554 298651 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A876 +S000031784 noncoding_exon snR72 13 298554 298651 W 2011-02-03 2000-05-19 +S000004616 ORF Verified YMR014W BUD22 chromosome 13 13 298868 300427 W 2011-02-03 1996-07-31 Protein required for rRNA maturation and ribosomal subunit biogenesis; required for 18S rRNA maturation; also required for small ribosomal subunit biogenesis; cosediments with pre-ribosomal particles; mutation decreases efficiency of +1 Ty1 frameshifting and transposition, and affects budding pattern +S000035607 CDS YMR014W 13 298868 300427 W 2011-02-03 1996-07-31 +S000004617 ORF Verified YMR015C ERG5 C-22 sterol desaturase|CYP61 chromosome 13 L000003978 13 302485 300869 C 2011-02-03 1996-07-31 C-22 sterol desaturase; a cytochrome P450 enzyme that catalyzes the formation of the C-22(23) double bond in the sterol side chain in ergosterol biosynthesis; may be a target of azole antifungal drugs +S000035627 CDS YMR015C 13 302485 300869 C 2011-02-03 1996-07-31 +S000004618 ORF Verified YMR016C SOK2 chromosome 13 L000004147 13 305593 303236 C 2011-02-03 1996-07-31 Nuclear protein that negatively regulates pseudohyphal differentiation; plays a regulatory role in the cyclic AMP (cAMP)-dependent protein kinase (PKA) signal transduction pathway; relocalizes to the cytosol in response to hypoxia; SOK2 has a paralog, PHD1, that arose from the whole genome duplication +S000036571 CDS YMR016C 13 305593 303236 C 2011-02-03 1996-07-31 +S000004619 ORF Verified YMR017W SPO20 DBI9 chromosome 13 L000003397 13 307489 308682 W 2011-02-03 1996-07-31 Meiosis-specific subunit of the t-SNARE complex; required for prospore membrane formation during sporulation; similar to but not functionally redundant with Sec9p; binds to phosphatidic acid; SNAP-25 homolog +S000036703 CDS YMR017W 13 307489 308682 W 2011-02-03 1996-07-31 +S000004620 ORF Uncharacterized YMR018W PEX9 chromosome 13 13 310208 311752 W 2011-02-03 1996-07-31 Putative protein of unknown function with similarity to human PEX5Rp; transcription increases during colony development similar to genes involved in peroxisome biogenesis; YMR018W is not an essential gene; PEX5Rp is also known as peroxin protein 5 related protein +S000030567 CDS YMR018W 13 310208 311752 W 2011-02-03 1996-07-31 +S000004621 ORF Verified YMR019W STB4 chromosome 13 L000003367 13 312156 315005 W 2011-02-03 1996-07-31 Putative transcription factor; contains a Zn(II)2Cys6 zinc finger domain characteristic of DNA-binding proteins; computational analysis suggests a role in regulation of expression of genes encoding transporters; binds Sin3p in a two-hybrid assay; +S000030693 CDS YMR019W 13 312156 315005 W 2011-02-03 1996-07-31 +S000004622 ORF Verified YMR020W FMS1 polyamine oxidase chromosome 13 L000003091 13 315377 316903 W 2011-02-03 1996-07-31 Polyamine oxidase; converts spermine to spermidine, which is required for the essential hypusination modification of translation factor eIF-5A; also involved in pantothenic acid biosynthesis +S000030473 CDS YMR020W 13 315377 316903 W 2011-02-03 1996-07-31 +S000004623 ORF Verified YMR021C MAC1 CUA1 chromosome 13 L000000973|L000001035 13 318418 317165 C 2011-02-03 1996-07-31 Copper-sensing transcription factor; involved in regulation of genes required for high affinity copper transport; required for regulation of yeast copper genes in response to DNA-damaging agents; undergoes changes in redox state in response to changing levels of copper or MMS +S000030536 CDS YMR021C 13 318418 317165 C 2011-02-03 1996-07-31 +S000004624 ORF Verified YMR022W UBC7 E2 ubiquitin-conjugating protein UBC7|DER2|QRI8 chromosome 13 L000001552 13 318680 319177 W 2011-02-03 1996-07-31 Ubiquitin conjugating enzyme; involved in the ER-associated protein degradation (ERAD) pathway and in the inner nuclear membrane-associated degradation (INMAD) pathway; requires Cue1p for recruitment to the ER membrane; proposed to be involved in chromatin assembly +S000031503 CDS YMR022W 13 318680 319177 W 2011-02-03 1996-07-31 +S000004625 ORF Verified YMR023C MSS1 PET53 chromosome 13 L000001201 13 321017 319437 C 2011-02-03 1996-07-31 Mitochondrial protein; forms a heterodimer complex with Mto1p that performs the 5-carboxymethylaminomethyl modification of the wobble uridine base in mitochondrial tRNAs; similar to human GTPBP3 +S000031572 CDS YMR023C 13 321017 319437 C 2011-02-03 1996-07-31 +S000006518 tRNA_gene tA(AGC)M1 chromosome 13 L000003682 13 321219 321147 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000036429 noncoding_exon tA(AGC)M1 13 321219 321147 C 2011-02-03 2000-05-19 +S000004626 ORF Verified YMR024W MRPL3 mitochondrial 54S ribosomal protein YmL3|YmL3 chromosome 13 L000002683 13 321875 323047 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; located in close proximity to the polypeptide exit channel of the ribosome; mutations in human homolog MRPL44 cause childhood cardiomyopathy; human MRPL44 deficiency results in inefficient assembly of the mitochondrial ribosome, and in tissue-specific respiratory chain deficiency, manifesting as either Complex I+Complex IV or Complex IV deficiency, depending on a cell type +S000032636 CDS YMR024W 13 321875 323047 W 2011-02-03 1996-07-31 +S000004627 ORF Verified YMR025W CSI1 chromosome 13 S000028416 13 323300 324187 W 2011-02-03 1996-07-31 Subunit of the Cop9 signalosome; which is required for deneddylation, or removal of the ubiquitin-like protein Rub1p from Cdc53p (cullin); involved in adaptation to pheromone signaling; functional equivalent of canonical Csn6 subunit of the COP9 signalosome +S000032707 CDS YMR025W 13 323300 324187 W 2011-02-03 1996-07-31 +S000004628 ORF Verified YMR026C PEX12 ubiquitin-protein ligase peroxin 12|PAS11 chromosome 13 L000004223|L000003964 13 325435 324236 C 2011-02-03 1996-07-31 C3HC4-type RING-finger peroxin and E3 ubiquitin ligase; required for peroxisome biogenesis and peroxisomal matrix protein import; forms translocation subcomplex with Pex2p and Pex10p; mutations in human homolog cause peroxisomal disorder +S000032743 CDS YMR026C 13 325435 324236 C 2011-02-03 1996-07-31 +S000004629 ORF Verified YMR027W putative methyltransferase chromosome 13 L000004444 13 325877 327289 W 2011-02-03 1996-07-31 A metal-dependent phosphatase, part of the DUF89 protein family; dephosphorylates fructose-1-phosphate; human ortholog, C6orf211 is involved in response to DNA damage; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and cytoplasm; YMR027W is not an essential gene +S000032910 CDS YMR027W 13 325877 327289 W 2011-02-03 1996-07-31 +S000004630 ORF Verified YMR028W TAP42 chromosome 13 L000002599 13 327482 328582 W 2011-02-03 1996-07-31 Essential protein involved in the TOR signaling pathway; physically associates with the protein phosphatase 2A and the SIT4 protein phosphatase catalytic subunits +S000034867 CDS YMR028W 13 327482 328582 W 2011-02-03 1996-07-31 +S000004631 ORF Verified YMR029C FAR8 chromosome 13 13 330231 328660 C 2011-02-03 1996-07-31 Protein involved in recovery from arrest in response to pheromone; acts in a cell cycle arrest recovery pathway independent from Far1p; interacts with Far3p, Far7p, Far9p, Far10p, and Far11p +S000034915 CDS YMR029C 13 330231 328660 C 2011-02-03 1996-07-31 +S000004632 ORF Verified YMR030W RSF1 chromosome 13 13 330793 331923 W 2011-02-03 1996-07-31 Protein required for respiratory growth; localized to both the nucleus and mitochondrion; may interact with transcription factors to mediate the transition to respiratory growth and activate transcription of nuclear and mitochondrial genes +S000033894 CDS YMR030W 13 330793 331923 W 2011-02-03 1996-07-31 +S000004634 ORF Dubious YMR031W-A chromosome 13 13 334709 335035 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant displays shortened telomeres; partially overlaps the uncharacterized ORF YMR031C +S000036523 CDS YMR031W-A 13 334709 335035 W 2011-02-03 1996-07-31 +S000004633 ORF Verified YMR031C EIS1 chromosome 13 13 334743 332212 C 2011-02-03 1996-07-31 Component of the eisosome required for proper eisosome assembly; similar to Uso1p; authentic, non-tagged protein is detected in a phosphorylated state in highly purified mitochondria in high-throughput studies; protein increases in abundance and relocalizes from plasma membrane to cytoplasm upon DNA replication stress; EIS1 has a paralog, YKL050C, that arose from the whole genome duplication +S000033984 CDS YMR031C 13 334743 332212 C 2011-02-03 1996-07-31 +S000004635 ORF Verified YMR032W HOF1 formin-binding protein HOF1|CYK2 chromosome 13 L000004406 13 335298 337307 W 2011-02-03 1996-07-31 Protein that regulates actin cytoskeleton organization; required for cytokinesis, actin cable organization, and secretory vesicle trafficking; localized to bud neck; phosphorylated by Dbf2p; regulates actomyosin ring dynamics and septin localization; contains an SH3 domain; N terminus controls cell size and levels of actin cables, while C terminus controls actin cable organization via direct regulation of the formin Bnr1p +S000034951 CDS YMR032W 13 335298 337307 W 2011-02-03 1996-07-31 +S000028574 ORF Uncharacterized YMR030W-A chromosome 13 13 337313 337603 W 2011-02-03 2003-07-29 Putative protein of unknown function; mCherry fusion protein localizes to the cytosol +S000031303 CDS YMR030W-A 13 337313 337603 W 2011-02-03 2003-07-29 +S000004636 ORF Verified YMR033W ARP9 RSC12|SWP59 chromosome 13 L000003438 13 337788 339277 W 2011-02-03 1996-07-31 Component of both the SWI/SNF and RSC chromatin remodeling complexes; actin-related protein involved in transcriptional regulation +S000035135 CDS YMR033W 13 337788 337817 W 2011-02-03 1996-07-31 +S000035136 CDS YMR033W 13 337904 339277 W 2011-02-03 1996-07-31 +S000035137 intron YMR033W 13 337818 337903 W 2011-02-03 1996-07-31 +S000004637 ORF Verified YMR034C RCH1 chromosome 13 13 340722 339418 C 2011-02-03 1996-07-31 Putative transporter; localizes to the plasma membrane in response to high levels of extracellular calcium; member of the SLC10 carrier family; identified in a transposon mutagenesis screen as a gene involved in azole resistance; YMR034C is not an essential gene +S000035192 CDS YMR034C 13 340722 339418 C 2011-02-03 1996-07-31 +S000004638 ORF Verified YMR035W IMP2 endopeptidase catalytic subunit chromosome 13 L000002836 13 341142 341675 W 2011-02-03 1996-07-31 Catalytic subunit of mitochondrial inner membrane peptidase complex; required for maturation of mitochondrial proteins of the intermembrane space; complex contains two catalytic subunits (Imp1p and Imp2p that differ in substrate specificity), and Som1p +S000036191 CDS YMR035W 13 341142 341675 W 2011-02-03 1996-07-31 +S000004639 ORF Verified YMR036C MIH1 putative tyrosine protein phosphatase MIH1 chromosome 13 L000001111 13 343520 341856 C 2011-02-03 1996-07-31 Protein tyrosine phosphatase involved in cell cycle control; regulates the phosphorylation state of Cdc28p; homolog of S. pombe cdc25 +S000036273 CDS YMR036C 13 343520 341856 C 2011-02-03 1996-07-31 +S000004640 ORF Verified YMR037C MSN2 stress-responsive transcriptional activator MSN2 chromosome 13 L000001198 13 346517 344403 C 2011-02-03 1996-07-31 Stress-responsive transcriptional activator; activated in stochastic pulses of nuclear localization in response to various stress conditions; binds DNA at stress response elements of responsive genes; relative distribution to nucleus increases upon DNA replication stress +S000036377 CDS YMR037C 13 346517 344403 C 2011-02-03 1996-07-31 +S000004641 ORF Verified YMR038C CCS1 copper chaperone CCS1|LYS7|CCS chromosome 13 L000000968 13 348260 347511 C 30 2011-02-03 1996-07-31 Copper chaperone for superoxide dismutase Sod1p; involved in oxidative stress protection; Met-X-Cys-X2-Cys motif within N-terminus is involved in insertion of copper into Sod1p under conditions of copper deprivation; required for regulation of yeast copper genes in response to DNA-damaging agents; protein abundance increases in response to DNA replication stress; human homolog CCS can complement yeast ccs1 null mutant +S000036442 CDS YMR038C 13 348260 347511 C 2011-02-03 1996-07-31 +S000004642 ORF Verified YMR039C SUB1 chromatin-binding transcription coactivator SUB1|TSP1 chromosome 13 L000003936 13 349522 348644 C 2011-02-03 1996-07-31 Transcriptional regulator; facilitates elongation through factors that modify RNAP II; role in peroxide resistance involving Rad2p; role in nonhomologous end-joining (NHEJ) of ds breaks in plasmid DNA, but not chromosomal DNA; role in the hyperosmotic stress response through polymerase recruitment at RNAP II and RNAP III genes; negatively regulates sporulation; protein abundance increases in response to DNA replication stress; functionally complemented by human SUB1 (PC4) +S000037092 CDS YMR039C 13 349522 348644 C 2011-02-03 1996-07-31 +S000004643 ORF Verified YMR040W YET2 chromosome 13 13 350381 350863 W 2011-02-03 1996-07-31 Protein of unknown function that may interact with ribosomes; based on co-purification experiments; homolog of human BAP31 protein; YET2 has a paralog, YET1, that arose from the whole genome duplication +S000030127 CDS YMR040W 13 350381 350863 W 2011-02-03 1996-07-31 +S000004644 ORF Verified YMR041C ARA2 D-arabinose 1-dehydrogenase (NAD(P)(+)) ARA2 chromosome 13 13 351973 350966 C 2011-02-03 1996-07-31 NAD-dependent arabinose dehydrogenase; involved in biosynthesis of dehydro-D-arabinono-1,4-lactone; similar to plant L-galactose dehydrogenase +S000030237 CDS YMR041C 13 351973 350966 C 2011-02-03 1996-07-31 +S000006568 tRNA_gene tF(GAA)M chromosome 13 L000003668 13 352280 352370 W 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035417 intron tF(GAA)M 13 352317 352334 W 2011-02-03 2000-05-19 +S000035415 noncoding_exon tF(GAA)M 13 352280 352316 W 2011-02-03 2000-05-19 +S000035416 noncoding_exon tF(GAA)M 13 352335 352370 W 2011-02-03 2000-05-19 +S000004645 ORF Verified YMR042W ARG80 ARGRI|ARGR1 chromosome 13 L000000112 13 352603 353136 W 36 2011-02-03 1996-07-31 Transcription factor involved in regulating arginine-responsive genes; acts with Arg81p and Arg82p +S000031259 CDS YMR042W 13 352603 353136 W 2011-02-03 1996-07-31 +S000004646 ORF Verified YMR043W MCM1 transcription factor MCM1|FUN80 chromosome 13 L000001037 13 353871 354731 W 35 2011-02-03 1996-07-31 Transcription factor; involved in cell-type-specific transcription and pheromone response; plays a central role in the formation of both repressor and activator complexes; relocalizes to the cytosol in response to hypoxia +S000031354 CDS YMR043W 13 353871 354731 W 2011-02-03 1996-07-31 +S000004647 ORF Verified YMR044W IOC4 chromosome 13 13 355384 356811 W 2011-02-03 1996-07-31 Member of a complex (Isw1b) with Isw1p and Ioc2p; interacts directly with H3K36me3 nucleosomes through its PWWP domain to recruit the Isw1b complex to open reading frames in a Set2p-dependent manner; Isw1b exhibits nucleosome-stimulated ATPase activity and acts within coding regions to coordinate transcription elongation with termination and processing +S000032363 CDS YMR044W 13 355384 356811 W 2011-02-03 1996-07-31 +S000007109 long_terminal_repeat YMRCdelta7 chromosome 13 13 357336 357005 C 2011-02-03 2000-05-19 Ty1 LTR +S000004648 transposable_element_gene YMR045C gag-pol fusion protein chromosome 13 13 362627 357359 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032431 CDS YMR045C 13 361321 357359 C 2011-02-03 1999-07-17|1996-07-31 +S000032430 CDS YMR045C 13 362627 361323 C 2011-02-03 1999-07-17|1996-07-31 +S000032432 plus_1_translational_frameshift YMR045C 13 361322 361322 C 2011-02-03 1999-07-17|1996-07-31 +S000004649 transposable_element_gene YMR046C gag protein chromosome 13 13 362627 361305 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000032514 CDS YMR046C 13 362627 361305 C 2011-02-03 1996-07-31 +S000007248 ORF Dubious YMR046W-A chromosome 13 13 362702 362830 W 2011-02-03 1997-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033646 CDS YMR046W-A 13 362702 362830 W 2011-02-03 1997-07-17 +S000007119 LTR_retrotransposon YMRCTy1-3 Ty1 chromosome 13 13 362918 357005 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007110 long_terminal_repeat YMRCdelta8 chromosome 13 13 362918 362587 C 2011-02-03 2000-05-19 Ty1 LTR +S000006599 tRNA_gene tH(GUG)M chromosome 13 L000003669 13 363064 363135 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000033895 noncoding_exon tH(GUG)M 13 363064 363135 W 2011-02-03 2000-05-19 +S000004650 ORF Verified YMR047C NUP116 FG-nucleoporin NUP116|NSP116 chromosome 13 L000001293 13 366705 363364 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier; forms a stable association with Nup82p, Gle2p and two other FG-nucleoporins (Nsp1p and Nup159p); NUP116 has a paralog, NUP100, that arose from the whole genome duplication +S000032621 CDS YMR047C 13 366705 363364 C 2011-02-03 1996-07-31 +S000004651 ORF Verified YMR048W CSM3 chromosome 13 13 366981 367934 W 2011-02-03 1996-07-31 Replication fork associated factor; required for stable replication fork pausing; component of the DNA replication checkpoint pathway; required for accurate chromosome segregation during meiosis; forms nuclear foci upon DNA replication stress +S000033358 CDS YMR048W 13 366981 367934 W 2011-02-03 1996-07-31 +S000004652 ORF Verified YMR049C ERB1 chromosome 13 13 370517 368094 C 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; forms a complex with Nop7p and Ytm1p that is required for maturation of the large ribosomal subunit; required for maturation of the 25S and 5.8S ribosomal RNAs; homologous to mammalian Bop1 +S000033387 CDS YMR049C 13 370517 368094 C 2011-02-03 1996-07-31 +S000118371 ARS ARS1312 ARSXIII-371 chromosome 13 13 371001 371105 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178156 ARS_consensus_sequence ARS1312 13 371019 371035 W 2014-11-18 2014-11-18 +S000006763 tRNA_gene tV(AAC)M1 chromosome 13 L000003681 13 372518 372445 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000030017 noncoding_exon tV(AAC)M1 13 372518 372445 C 2011-02-03 2000-05-19 +S000007111 long_terminal_repeat YMRCdelta9 chromosome 13 13 373034 372697 C 2011-02-03 2000-05-19 Ty1 LTR +S000004653 transposable_element_gene YMR050C gag-pol fusion protein chromosome 13 13 378325 373057 C 2011-02-03 1999-07-17|1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034328 CDS YMR050C 13 377019 373057 C 2011-02-03 1999-07-17|1996-07-31 +S000034327 CDS YMR050C 13 378325 377021 C 2011-02-03 1999-07-17|1996-07-31 +S000034329 plus_1_translational_frameshift YMR050C 13 377020 377020 C 2011-02-03 1999-07-17|1996-07-31 +S000004654 transposable_element_gene YMR051C gag protein chromosome 13 13 378325 377003 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034409 CDS YMR051C 13 378325 377003 C 2011-02-03 1996-07-31 +S000007120 LTR_retrotransposon YMRCTy1-4 Ty1 chromosome 13 13 378622 372697 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007112 long_terminal_repeat YMRCdelta10 chromosome 13 13 378622 378285 C 2011-02-03 2000-05-19 Ty1 LTR +S000007113 long_terminal_repeat YMRCdelta11 chromosome 13 13 379061 378727 C 2011-02-03 2000-05-19 Ty1 LTR +S000007121 long_terminal_repeat YMRWdelta12 chromosome 13 13 379072 379198 W 2011-02-03 2000-05-19 Ty1 LTR +S000006775 tRNA_gene tW(CCA)M chromosome 13 L000003680 13 379408 379303 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis +S000034112 intron tW(CCA)M 13 379372 379339 C 2011-02-03 2000-05-19 +S000034111 noncoding_exon tW(CCA)M 13 379338 379303 C 2011-02-03 2000-05-19 +S000034110 noncoding_exon tW(CCA)M 13 379408 379373 C 2011-02-03 2000-05-19 +S000004656 ORF Verified YMR052W FAR3 chromosome 13 L000002919 13 379586 380200 W 2011-02-03 1996-07-31 Protein of unknown function; involved in recovery from cell cycle arrest in response to pheromone, in a Far1p-independent pathway; interacts with Far7p, Far8p, Far9p, Far10p, and Far11p; localizes to the endoplasmic reticulum; protein abundance increases in response to DNA replication stress +S000035481 CDS YMR052W 13 379586 380200 W 2011-02-03 1996-07-31 +S000004655 ORF Dubious YMR052C-A chromosome 13 13 380434 380069 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036215 CDS YMR052C-A 13 380434 380069 C 2011-02-03 1996-07-31 +S000004657 ORF Verified YMR053C STB2 chromosome 13 L000002108 13 382898 380346 C 2011-02-03 1996-07-31 Protein that interacts with Sin3p in a two-hybrid assay; part of a large protein complex with Sin3p and Stb1p; STB2 has a paralog, STB6, that arose from the whole genome duplication +S000035527 CDS YMR053C 13 382898 380346 C 2011-02-03 1996-07-31 +S000004658 ORF Verified YMR054W STV1 H(+)-transporting V0 sector ATPase subunit a chromosome 13 L000002139 13 383303 385975 W 2011-02-03 1996-07-31 Subunit a of the vacuolar-ATPase V0 domain; one of two isoforms (Stv1p and Vph1p); Stv1p is located in V-ATPase complexes of the Golgi and endosomes while Vph1p is located in V-ATPase complexes of the vacuole +S000035660 CDS YMR054W 13 383303 385975 W 2011-02-03 1996-07-31 +S000004659 ORF Verified YMR055C BUB2 PAC7 chromosome 13 L000000197 13 387021 386101 C 2011-02-03 1996-07-31 Mitotic exit network regulator; forms GTPase-activating Bfa1p-Bub2p complex that binds Tem1p and spindle pole bodies, blocks cell cycle progression before anaphase in response to spindle and kinetochore damage +S000035699 CDS YMR055C 13 387021 386101 C 2011-02-03 1996-07-31 +S000004660 ORF Verified YMR056C AAC1 ADP/ATP carrier protein AAC1 chromosome 13 L000000003 13 388244 387315 C 2011-02-03 1996-07-31 Mitochondrial inner membrane ADP/ATP translocator; exchanges cytosolic ADP for mitochondrially synthesized ATP; phosphorylated; Aac1p is a minor isoform while Pet9p is the major ADP/ATP translocator; relocalizes from mitochondrion to cytoplasm upon DNA replication stress +S000036642 CDS YMR056C 13 388244 387315 C 2011-02-03 1996-07-31 +S000004661 ORF Dubious YMR057C chromosome 13 13 388730 388359 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF AAC1 +S000036707 CDS YMR057C 13 388730 388359 C 2011-02-03 1996-07-31 +S000004662 ORF Verified YMR058W FET3 ferroxidase FET3 chromosome 13 L000000610 13 388822 390732 W 2011-02-03 1996-07-31 Ferro-O2-oxidoreductase; multicopper oxidase that oxidizes ferrous (Fe2+) to ferric iron (Fe3+) for subsequent cellular uptake by transmembrane permease Ftr1p; required for high-affinity iron uptake and involved in mediating resistance to copper ion toxicity, belongs to class of integral membrane multicopper oxidases; protein abundance increases in response to DNA replication stress +S000036798 CDS YMR058W 13 388822 390732 W 2011-02-03 1996-07-31 +S000004663 ORF Verified YMR059W SEN15 chromosome 13 L000003972 13 391099 391485 W 2011-02-03 1996-07-31|2006-05-10 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface +S000036866 CDS YMR059W 13 391099 391485 W 2011-02-03 1996-07-31|2006-05-10 +S000004664 ORF Verified YMR060C SAM37 SAM complex subunit SAM37|TOM37|PET3027|MAS37 chromosome 13 L000002841|L000003251 13 392515 391532 C 2011-02-03 1996-07-31 Component of the Sorting and Assembly Machinery (SAM) complex; the SAM (or TOB) complex is located in the mitochondrial outer membrane; binds precursors of beta-barrel proteins and facilitates their outer membrane insertion; contributes to SAM complex stability +S000037417 CDS YMR060C 13 392515 391532 C 2011-02-03 1996-07-31 +S000004665 ORF Verified YMR061W RNA14 cleavage polyadenylation factor subunit RNA14 chromosome 13 L000001650 13 392755 394788 W 2011-02-03 1996-07-31 Component of the cleavage and polyadenylation factor I (CF I); CF 1, composed of the CF 1A complex (Rna14p, Rna15p, Clp1p, Pcf11p) and Hrp1, is involved in cleavage and polyadenylation of mRNA 3' ends; bridges interaction between Rna15p and Hrp1p in the CF I complex; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay; required for gene looping and maintenance of genome stability; relocalizes to the cytosol in response to hypoxia +S000037628 CDS YMR061W 13 392755 394788 W 2011-02-03 1996-07-31 +S000004666 ORF Verified YMR062C ARG7 glutamate N-acetyltransferase|ECM40 chromosome 13 L000003528 13 396379 395054 C 2011-02-03 1996-07-31 Mitochondrial ornithine acetyltransferase; catalyzes the fifth step in arginine biosynthesis; also possesses acetylglutamate synthase activity, regenerates acetylglutamate while forming ornithine +S000037657 CDS YMR062C 13 396379 395054 C 2011-02-03 1996-07-31 +S000004667 ORF Verified YMR063W RIM9 chromosome 13 L000003427 13 397077 397796 W 2011-02-03 1996-07-31 Plasma membrane protein of unknown function; involved in the proteolytic activation of Rim101p in response to alkaline pH; interacts with Rim21p and Dfg16p to form a pH-sensing complex in the Rim101 pathway and is required to maintain Rim21p levels; has similarity to A. nidulans PalI; +S000030541 CDS YMR063W 13 397077 397796 W 2011-02-03 1996-07-31 +S000004668 ORF Verified YMR064W AEP1 NCA1 chromosome 13 L000000053 13 397903 399459 W 2011-02-03 1996-07-31 Protein required for expression of the mitochondrial OLI1 gene; mitochondrial OLI1 gene encodes subunit 9 of F1-F0 ATP synthase +S000030637 CDS YMR064W 13 397903 399459 W 2011-02-03 1996-07-31 +S000004669 ORF Verified YMR065W KAR5 FIG3 chromosome 13 L000003315 13 399702 401216 W 2011-02-03 1996-07-31 Protein required for nuclear membrane fusion during karyogamy; localizes to the membrane with a soluble portion in the endoplasmic reticulum lumen, may form a complex with Jem1p and Kar2p; similar to zebrafish Brambleberry protein; expression of the gene is regulated by pheromone +S000031502 CDS YMR065W 13 399702 401216 W 2011-02-03 1996-07-31 +S000004670 ORF Verified YMR066W SOV1 chromosome 13 L000004620 13 401541 404237 W 2011-02-03 1996-07-31 Mitochondrial protein of unknown function +S000031589 CDS YMR066W 13 401541 404237 W 2011-02-03 1996-07-31 +S000004671 ORF Verified YMR067C UBX4 CUI1 chromosome 13 13 405573 404323 C 2011-02-03 1996-07-31 UBX domain-containing protein that interacts with Cdc48p; involved in degradation of polyubiquitinated proteins via the ERAD (ER-associated degradation) pathway; modulates the Cdc48p-Nplp-Ufd1p AAA ATPase complex during its role in delivery of misfolded proteins to the proteasome; protein abundance increases in response to DNA replication stress +S000031655 CDS YMR067C 13 405573 404323 C 2011-02-03 1996-07-31 +S000004672 ORF Verified YMR068W AVO2 chromosome 13 13 406304 407584 W 2011-02-03 1996-07-31 Component of a complex containing the Tor2p kinase and other proteins; complex may have a role in regulation of cell growth +S000031807 CDS YMR068W 13 406304 407584 W 2011-02-03 1996-07-31 +S000004673 ORF Verified YMR069W NAT4 NAA40 chromosome 13 13 407709 408566 W 2011-02-03 1996-07-31 N alpha-acetyl-transferase; involved in acetylation of the N-terminal residues of histones H4 and H2A +S000032728 CDS YMR069W 13 407709 408566 W 2011-02-03 1996-07-31 +S000004674 ORF Verified YMR070W MOT3 [MOT3]|[MOT3+]|ROX7 chromosome 13 L000002675 13 409154 410626 W 43 2011-02-03 1996-07-31 Transcriptional repressor, activator; role in cellular adjustment to osmotic stress including modulation of mating efficiency; involved in repression of subset of hypoxic genes by Rox1p, repression of several DAN/TIR genes during aerobic growth, ergosterol biosynthetic genes in response to hyperosmotic stress; contributes to recruitment of Tup1p-Cyc8p general repressor to promoters; relocalizes to cytosol under hypoxia; forms [MOT3+] prion under anaerobic conditions +S000032777 CDS YMR070W 13 409154 410626 W 2011-02-03 1996-07-31 +S000004675 ORF Verified YMR071C TVP18 chromosome 13 13 411265 410762 C 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p; may interact with ribosomes, based on co-purification experiments; may have a role in intracellular sterol transport +S000032836 CDS YMR071C 13 411265 410762 C 2011-02-03 1996-07-31 +S000004676 ORF Verified YMR072W ABF2 DNA-binding protein ABF2|mtTFA|HM|p19 chromosome 13 L000000012 13 411569 412120 W 2011-02-03 1996-07-31 Mitochondrial DNA-binding protein; involved in mitochondrial DNA replication and recombination, member of HMG1 DNA-binding protein family; activity may be regulated by protein kinase A phosphorylation; ABF2 has a paralog, IXR1, that arose from the whole genome duplication; human homolog TFAM can complement yeast abf2 mutant, rescuing the loss-of-mitochondrial DNA phenotype in a yeast abf2 strain +S000033599 CDS YMR072W 13 411569 412120 W 2011-02-03 1996-07-31 +S000004677 ORF Verified YMR073C IRC21 chromosome 13 13 412873 412268 C 2011-02-03 1996-07-31 Protein of unknown function; may be involved in resistance to carboplatin and cisplatin; null mutant displays increase in spontaneous Rad52p foci; contains a lipid-binding domain and binds cardiolipin in a large-scale study +S000033642 CDS YMR073C 13 412873 412268 C 2011-02-03 1996-07-31 +S000004678 ORF Verified YMR074C SDD2 chromosome 13 13 413473 413036 C 2011-02-03 1996-07-31 Protein with homology to human PDCD5; PDCD5 is involved in programmed cell death; N-terminal region forms a conserved triple-helix bundle structure; overproduction suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P; overexpression promotes H2O2-induced apoptosis; YMR074C is not an essential gene; protein abundance increases in response to DNA replication stress +S000033760 CDS YMR074C 13 413473 413036 C 2011-02-03 1996-07-31 +S000004680 ORF Verified YMR075W RCO1 chromosome 13 13 413982 416036 W 2011-02-03 1996-07-31 Essential component of the Rpd3S histone deacetylase complex; interacts with Eaf3p +S000034738 CDS YMR075W 13 413982 416036 W 2011-02-03 1996-07-31 +S000004679 ORF Dubious YMR075C-A chromosome 13 13 416053 415688 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF RCO1/YMR075W +S000033031 CDS YMR075C-A 13 416053 415688 C 2011-02-03 1996-07-31 +S000004681 ORF Verified YMR076C PDS5 chromosome 13 L000003047 13 420029 416196 C 2011-02-03 1996-07-31 Cohesion maintenance factor; involved in sister chromatid condensation and cohesion; colocalizes with cohesin on chromosomes; performs its cohesin maintenance function in pre-anaphase cells by protecting the integrity of the cohesion complex; also required during meiosis; relocalizes to the cytosol in response to hypoxia +S000034790 CDS YMR076C 13 420029 416196 C 2011-02-03 1996-07-31 +S000006764 tRNA_gene tV(AAC)M2 chromosome 13 L000003679 13 420661 420588 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000030020 noncoding_exon tV(AAC)M2 13 420661 420588 C 2011-02-03 2000-05-19 +S000004682 ORF Verified YMR077C VPS20 ESCRT-III subunit protein VPS20|VPL10|VPT20|CHM6 chromosome 13 13 422149 421484 C 2011-02-03 1996-07-31 Myristoylated subunit of the ESCRT-III complex; the endosomal sorting complex required for transport of transmembrane proteins into the multivesicular body pathway to the lysosomal/vacuolar lumen; cytoplasmic protein recruited to endosomal membranes +S000034931 CDS YMR077C 13 422149 421484 C 2011-02-03 1996-07-31 +S000004683 ORF Verified YMR078C CTF18 CHL12 chromosome 13 L000000431|L000000325 13 424728 422503 C 2011-02-03 1996-07-31 Subunit of a complex with Ctf8p; shares some subunits with Replication Factor C and is required for sister chromatid cohesion; may have overlapping functions with Rad24p in the DNA damage replication checkpoint +S000035849 CDS YMR078C 13 424728 422503 C 2011-02-03 1996-07-31 +S000004684 ORF Verified YMR079W SEC14 phosphatidylinositol/phosphatidylcholine transfer protein SEC14|PIT1 chromosome 13 L000001839 13 424989 426059 W 2011-02-03 1996-07-31 Phosphatidylinositol/phosphatidylcholine transfer protein; involved in regulating PtdIns, PtdCho, and ceramide metabolism, products of which regulate intracellular transport and UPR; has a role in localization of lipid raft proteins; functionally homologous to mammalian PITPs; SEC14 has a paralog, YKL091C, that arose from the whole genome duplication +S000036083 CDS YMR079W 13 424989 424997 W 2011-02-03 1996-07-31 +S000036084 CDS YMR079W 13 425154 426059 W 2011-02-03 1996-07-31 +S000036085 intron YMR079W 13 424998 425153 W 2011-02-03 1996-07-31 +S000004685 ORF Verified YMR080C NAM7 SUT2|ATP-dependent RNA helicase NAM7|SUP113|UPF1|MOF4|IFS2 chromosome 13 L000002429|S000029550|L000002232 13 429627 426712 C 60 2011-02-03 1996-07-31 ATP-dependent RNA helicase of the SFI superfamily; involved in nonsense mediated mRNA decay; required for efficient translation termination at nonsense codons and targeting of NMD substrates to P-bodies; binds to the small ribosomal subunit via an interaction with Rps26; forms cytoplasmic foci upon DNA replication stress +S000036887 CDS YMR080C 13 429627 426712 C 2011-02-03 1996-07-31 +S000004686 ORF Verified YMR081C ISF1 MBR3 chromosome 13 L000001034 13 431095 430079 C 2011-02-03 1996-07-31 Serine-rich, hydrophilic protein; overexpression suppresses growth defects of hap2, hap3, and hap4 mutants; expression is under glucose control; cotranscribed with NAM7 in a cyp1 mutant; ISF1 has a paralog, MBR1, that arose from the whole genome duplication +S000036954 CDS YMR081C 13 431095 430079 C 2011-02-03 1996-07-31 +S000004687 ORF Uncharacterized YMR082C chromosome 13 13 432125 431769 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR082C is not an essential gene +S000037719 CDS YMR082C 13 432125 431769 C 2011-02-03 1996-07-31 +S000004688 ORF Verified YMR083W ADH3 alcohol dehydrogenase ADH3 chromosome 13 L000000043 13 434788 435915 W 45 2011-02-03 1996-07-31 Mitochondrial alcohol dehydrogenase isozyme III; involved in the shuttling of mitochondrial NADH to the cytosol under anaerobic conditions and ethanol production +S000037845 CDS YMR083W 13 434788 435915 W 2011-02-03 1996-07-31 +S000004689 ORF Uncharacterized YMR084W putative glutamine--fructose-6-phosphate transaminase chromosome 13 13 436628 437416 W 2011-02-03 1996-07-31 Putative protein of unknown function; YMR084W and adjacent ORF YMR085W are merged in related strains, and together are paralogous to glutamine-fructose-6-phosphate amidotransferase GFA1 +S000030786 CDS YMR084W 13 436628 437416 W 2011-02-03 1996-07-31 +S000004690 ORF Uncharacterized YMR085W chromosome 13 13 437491 438789 W 2011-02-03 1996-07-31 Putative protein of unknown function; YMR085W and adjacent ORF YMR084W are merged in related strains, and together are paralogous to glutamine-fructose-6-phosphate amidotransferase GFA1 +S000030871 CDS YMR085W 13 437491 438789 W 2011-02-03 1996-07-31 +S000004692 ORF Verified YMR086W SEG1 chromosome 13 13 439208 442090 W 2011-02-03 1996-07-31 Component of eisosome required for proper eisosome assembly; precedes Pil1p/Lsp1p during eisosome formation, controls eisosome length and shape; diffusely distributed, forms heterogeneous patches at plasma membrane in small buds, also found in medium and large buds; expression repressed by cAMP; similar to A. gossypii SEG gene and to S. pombe Sle1p, important for generating eisosomes; SEG1 has a paralog, SEG2, that arose from the whole genome duplication +S000030930 CDS YMR086W 13 439208 442090 W 2011-02-03 1996-07-31 +S000004691 ORF Dubious YMR086C-A chromosome 13 13 442364 442026 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037663 CDS YMR086C-A 13 442364 442026 C 2011-02-03 1996-07-31 +S000004693 ORF Verified YMR087W putative ADP-ribose 1''-phosphate phosphatase chromosome 13 S000154613 13 442527 443381 W 2011-02-03 1996-07-31 Putative ADP-ribose-1''-monophosphatase; converts ADP-ribose-1''-monophosphate to ADP-ribose; may have a role in tRNA splicing; contains an A1pp domain +S000031010 CDS YMR087W 13 442527 443381 W 2011-02-03 1996-07-31 +S000004694 ORF Verified YMR088C VBA1 chromosome 13 13 445102 443414 C 2011-02-03 1996-07-31 Permease of basic amino acids in the vacuolar membrane +S000031056 CDS YMR088C 13 445102 443414 C 2011-02-03 1996-07-31 +S000004695 ORF Verified YMR089C YTA12 m-AAA protease subunit YTA12|RCA1 chromosome 13 L000001591|L000002564 13 448086 445609 C 2011-02-03 1996-07-31 Mitochondrial inner membrane m-AAA protease component; mediates degradation of misfolded or unassembled proteins; also required for correct assembly of mitochondrial enzyme complexes; overexpression of human AFG3L2 complements respiratory defect of yeast afg3 yta12 double null mutation, but overexpression of disease-associated AFG3L2 variants does not; expression of both human SPG7 (paraplegin) and AFG3L2 complements yeast yta12 afg3 double mutation +S000032008 CDS YMR089C 13 448086 445609 C 2011-02-03 1996-07-31 +S000004696 ORF Uncharacterized YMR090W chromosome 13 13 449245 449928 W 2011-02-03 1996-07-31 Putative protein of unknown function; similar to DTDP-glucose 4,6-dehydratases; GFP-fusion protein localizes to the cytoplasm; up-regulated in response to the fungicide mancozeb; not essential for viability +S000033126 CDS YMR090W 13 449245 449928 W 2011-02-03 1996-07-31 +S000004697 ORF Verified YMR091C NPL6 RSC7 chromosome 13 L000001272 13 451365 450058 C 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; interacts with Rsc3p, Rsc30p, Ldb7p, and Htl1p to form a module important for a broad range of RSC functions +S000033161 CDS YMR091C 13 451365 450058 C 2011-02-03 1996-07-31 +S000004698 ORF Verified YMR092C AIP1 chromosome 13 L000000069 13 453479 451632 C 2011-02-03 1996-07-31 Actin cortical patch component; interacts with the actin depolymerizing factor cofilin; inhibits elongation of aged ADP-actin filaments decorated with cofilin to maintain a high level of assembly-competent actin species; required to restrict cofilin localization to cortical patches; putative regulator of cytokinesis; contains WD repeats; protein increases in abundance and relocalizes from cytoplasm to plasma membrane upon DNA replication stress +S000033958 CDS YMR092C 13 453479 451632 C 2011-02-03 1996-07-31 +S000004699 ORF Verified YMR093W UTP15 snoRNA-binding rRNA-processing protein UTP15 chromosome 13 13 454015 455556 W 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA +S000034125 CDS YMR093W 13 454015 455556 W 2011-02-03 1996-07-31 +S000004700 ORF Verified YMR094W CTF13 CBF3C chromosome 13 L000000429 13 455825 457261 W 2011-02-03 1996-07-31 Subunit of the CBF3 complex; CBF3 binds to the CDE III element of centromeres, bending the DNA upon binding, and may be involved in sister chromatid cohesion during mitosis +S000034211 CDS YMR094W 13 455825 457261 W 2011-02-03 1996-07-31 +S000004701 ORF Verified YMR095C SNO1 putative pyridoxal 5'-phosphate synthase chromosome 13 L000003451 13 457959 457285 C 2011-02-03 1996-07-31 Protein of unconfirmed function; involved in pyridoxine metabolism; expression is induced during stationary phase; forms a putative glutamine amidotransferase complex with Snz1p, with Sno1p serving as the glutaminase +S000035105 CDS YMR095C 13 457959 457285 C 2011-02-03 1996-07-31 +S000004702 ORF Verified YMR096W SNZ1 pyridoxine biosynthesis protein SNZ1 chromosome 13 L000002575 13 458408 459301 W 2011-02-03 1996-07-31 Protein involved in vitamin B6 biosynthesis; member of a stationary phase-induced gene family; coregulated with SNO1; interacts with Sno1p and with Yhr198p, perhaps as a multiprotein complex containing other Snz and Sno proteins +S000035303 CDS YMR096W 13 458408 459301 W 2011-02-03 1996-07-31 +S000004703 ORF Verified YMR097C MTG1 putative GTPase MTG1 chromosome 13 13 460527 459424 C 2011-02-03 1996-07-31 Putative GTPase peripheral to the mitochondrial inner membrane; essential for respiratory competence, likely functions in assembly of the large ribosomal subunit, has homologs in plants and animals +S000035321 CDS YMR097C 13 460527 459424 C 2011-02-03 1996-07-31 +S000004704 ORF Verified YMR098C ATP25 LRC4 chromosome 13 13 462609 460771 C 2011-02-03 1996-07-31 Mitochondrial protein required for the stability of Oli1p (Atp9p) mRNA; also required for the Oli1p ring formation; YMR098C is not an essential gene +S000035398 CDS YMR098C 13 462609 460771 C 2011-02-03 1996-07-31 +S000007114 long_terminal_repeat YMRCdelta13 chromosome 13 13 463461 463128 C 2011-02-03 2000-05-19 Ty1 LTR +S000006543 tRNA_gene tD(GUC)M chromosome 13 L000003670 13 463554 463625 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030421 noncoding_exon tD(GUC)M 13 463554 463625 W 2011-02-03 2000-05-19 +S000004705 ORF Verified YMR099C glucose-6-phosphate 1-epimerase chromosome 13 13 464827 463934 C 2011-02-03 1996-07-31 Glucose-6-phosphate 1-epimerase (hexose-6-phosphate mutarotase); likely involved in carbohydrate metabolism; GFP-fusion protein localizes to both the nucleus and cytoplasm and is induced in response to the DNA-damaging agent MMS +S000035458 CDS YMR099C 13 464827 463934 C 2011-02-03 1996-07-31 +S000004706 ORF Verified YMR100W MUB1 chromosome 13 L000004359 13 466300 468162 W 2011-02-03 1996-07-31 MYND domain-containing protein; component of the Mub1p-Ubr2p-Rad6p ubiquitin ligase complex, required for ubiquitination and degradation of Rpn4p; interacts with Ubr2p (E3) and indirectly with Rad6p (E2); short-lived protein degraded in a Ubr2p/Rad6p dependent manner; proposed to function as both a partner and substrate of the Ubr2p/Rad6p ubiquitin ligase; similar to the A. nidulans samB gene +S000032955 CDS YMR100W 13 466300 468162 W 2011-02-03 1996-07-31 +S000118372 ARS ARS1316 ARSXIII-468 chromosome 13 13 468179 468469 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178157 ARS_consensus_sequence ARS1316 13 468236 468252 W 2014-11-18 2014-11-18 +S000004707 ORF Verified YMR101C SRT1 ditrans,polycis-polyprenyl diphosphate synthase chromosome 13 L000004878 13 469476 468445 C 2011-02-03 1996-07-31 Forms the dehydrodolichyl diphosphate syntase (DDS) complex with NUS1; involved in synthesis of long-chain dolichols (19-22 isoprene units; as opposed to Rer2p which synthesizes shorter-chain dolichols); localizes to lipid bodies; transcription is induced during stationary phase +S000032988 CDS YMR101C 13 469476 468445 C 2011-02-03 1996-07-31 +S000004708 ORF Uncharacterized YMR102C chromosome 13 13 472352 469848 C 2011-02-03 1996-07-31 Protein of unknown function; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance; mutant shows increased resistance to azoles; not an essential gene; YMR102C has a paralog, DGR2, that arose from the whole genome duplication +S000033083 CDS YMR102C 13 472352 469848 C 2011-02-03 1996-07-31 +S000004709 ORF Uncharacterized YMR103C chromosome 13 13 473264 472902 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR103C is not an essential gene +S000033841 CDS YMR103C 13 473264 472902 C 2011-02-03 1996-07-31 +S000004710 ORF Verified YMR104C YPK2 putative protein kinase YPK2|YKR2 chromosome 13 L000002542 13 475453 473420 C 2011-02-03 1996-07-31 Protein kinase similar to S/T protein kinase Ypk1p; functionally redundant with YPK1 at the genetic level; participates in a signaling pathway required for optimal cell wall integrity; involved in the TORC-dependent phosphorylation of ribosomal proteins Rps6a/b (S6); human homolog SGK2 can complement a ypk1 ypk2 double mutant +S000033988 CDS YMR104C 13 475453 473420 C 2011-02-03 1996-07-31 +S000004711 ORF Verified YMR105C PGM2 phosphoglucomutase PGM2|GAL5 chromosome 13 L000001413 13 477606 475897 C 2011-02-03 1996-07-31 Phosphoglucomutase; catalyzes the conversion from glucose-1-phosphate to glucose-6-phosphate, which is a key step in hexose metabolism; functions as the acceptor for a Glc-phosphotransferase; protein abundance increases in response to DNA replication stress; PGM2 has a paralog, PGM1, that arose from the whole genome duplication +S000034889 CDS YMR105C 13 477606 475897 C 2011-02-03 1996-07-31 +S000130188 ARS ARS1317 chromosome 13 13 477606 478301 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028692 ORF Uncharacterized YMR105W-A chromosome 13 13 478064 478258 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000032592 CDS YMR105W-A 13 478064 478258 W 2011-02-03 2003-07-29 +S000004712 ORF Verified YMR106C YKU80 ATP-dependent DNA helicase YKU80|HDF2 chromosome 13 L000004089 13 480190 478301 C 2011-02-03 1996-07-31 Subunit of telomeric Ku complex (Yku70p-Yku80p); involved in telomere length maintenance, structure and telomere position effect; required for localization of telomerase ribonucleoprotein via interaction with TLC1 guide RNA; relocates to sites of double-strand cleavage to promote nonhomologous end joining during DSB repair; colocalizes with quiescent cell telomere hyperclusters +S000035040 CDS YMR106C 13 480190 478301 C 2011-02-03 1996-07-31 +S000006627 tRNA_gene tK(CUU)M chromosome 13 L000003678 13 480693 480621 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000036046 noncoding_exon tK(CUU)M 13 480693 480621 C 2011-02-03 2000-05-19 +S000007115 long_terminal_repeat YMRCdelta14 chromosome 13 13 481547 481214 C 2011-02-03 2000-05-19 Ty1 LTR +S000007122 long_terminal_repeat YMRWdelta15 chromosome 13 13 481571 481808 W 2011-02-03 2000-05-19 Ty1 LTR +S000004713 ORF Verified YMR107W SPG4 chromosome 13 13 483014 483361 W 2011-02-03 1996-07-31 Protein required for high temperature survival during stationary phase; not required for growth on nonfermentable carbon sources +S000035284 CDS YMR107W 13 483014 483361 W 2011-02-03 1996-07-31 +S000004714 ORF Verified YMR108W ILV2 acetolactate synthase catalytic subunit|THI1|SMR1 chromosome 13 L000002296|L000002515|L000000858 13 484084 486147 W 66 2011-02-03 1996-07-31 Acetolactate synthase; catalyses the first common step in isoleucine and valine biosynthesis and is the target of several classes of inhibitors, localizes to the mitochondria; expression of the gene is under general amino acid control +S000036218 CDS YMR108W 13 484084 486147 W 2011-02-03 1996-07-31 +S000004715 ORF Verified YMR109W MYO5 myosin 5 chromosome 13 L000002935 13 486587 490246 W 2011-02-03 1996-07-31 One of two type I myosin motors; contains proline-rich tail homology 2 (TH2) and SH3 domains; MYO5 deletion has little effect on growth, but myo3 myo5 double deletion causes severe defects in growth and actin cytoskeleton organization; MYO5 has a paralog, MYO3, that arose from the whole genome duplication +S000036305 CDS YMR109W 13 486587 490246 W 2011-02-03 1996-07-31 +S000004716 ORF Verified YMR110C HFD1 hexadecenal dehydrogenase chromosome 13 13 491992 490394 C 2011-02-03 1996-07-31 Dehydrogenase involved in ubiquinone and sphingolipid metabolism; oxidizes 4-hydroxybenzaldehyde into 4-hydroxybenzoic acid in ubiquinone biosynthesis; converts hexadecenal to hexadecenoic acid in sphingosine 1-phosphate breakdown pathway; located in the mitochondrial outer membrane and also in lipid particles; human homolog ALDH3A2, a fatty aldehyde dehydrogenase (FALDH) mutated in neurocutaneous disorder Sjogren-Larsson syndrome, can complement yeast hfd1 mutant +S000037194 CDS YMR110C 13 491992 490394 C 2011-02-03 1996-07-31 +S000004717 ORF Verified YMR111C chromosome 13 13 493792 492404 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; YMR111C is not an essential gene; forms nuclear foci upon DNA replication stress +S000037278 CDS YMR111C 13 493792 492404 C 2011-02-03 1996-07-31 +S000004718 ORF Verified YMR112C MED11 chromosome 13 L000004634 13 494495 494100 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential protein +S000029941 CDS YMR112C 13 494495 494100 C 2011-02-03 1996-07-31 +S000004719 ORF Verified YMR113W FOL3 dihydrofolate synthase chromosome 13 13 494999 496282 W 2011-02-03 1996-07-31 Dihydrofolate synthetase, involved in folic acid biosynthesis; catalyzes conversion of dihydropteroate to dihydrofolate in folate coenzyme biosynthesis; FOL3 has a paralog, RMA1, that arose from the whole genome duplication +S000030131 CDS YMR113W 13 494999 496282 W 2011-02-03 1996-07-31 +S000004720 ORF Verified YMR114C putative peptide hydrolase chromosome 13 13 497449 496343 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and cytoplasm; YMR114C is not an essential gene +S000030240 CDS YMR114C 13 497449 496343 C 2011-02-03 1996-07-31 +S000004721 ORF Verified YMR115W MGR3 FMP24 chromosome 13 13 497704 499209 W 2011-02-03 1996-07-31 Subunit of the mitochondrial (mt) i-AAA protease supercomplex; i-AAA degrades misfolded mitochondrial proteins; forms a subcomplex with Mgr1p that binds to substrates to facilitate proteolysis; required for growth of cells lacking mtDNA +S000031261 CDS YMR115W 13 497704 499209 W 2011-02-03 1996-07-31 +S000007501 snoRNA_gene snR24 SNR24 U24 chromosome 13 L000002911 13 500072 499984 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); commonly referred to as U24; guides 2'-O-methylation of large subunit (LSU) rRNA at positions C1437, C1449, and C1450 +S000036664 noncoding_exon snR24 13 500072 499984 C 2011-02-03 2000-05-19 +S000004722 ORF Verified YMR116C ASC1 RACK1|guanine nucleotide-binding protein subunit beta|ASU9|NAD1|CPC2 chromosome 13 L000003529|L000000135|S000029045 13 500688 499456 C 2011-02-03 1996-07-31 G-protein beta subunit and guanine dissociation inhibitor for Gpa2p; ortholog of RACK1 that inhibits translation; core component of the small (40S) ribosomal subunit; required to prevent frameshifting at ribosomes stalled at repeated CGA codons; regulates P-body formation induced by replication stress; represses Gcn4p in the absence of amino acid starvation +S000031294 CDS YMR116C 13 499878 499456 C 2011-02-03 1996-07-31 +S000031293 CDS YMR116C 13 500688 500152 C 2011-02-03 1996-07-31 +S000031295 intron YMR116C 13 500151 499879 C 2011-02-03 1996-07-31 +S000004723 ORF Verified YMR117C SPC24 kinetochore-associated Ndc80 complex subunit SPC24 chromosome 13 L000004694 13 501891 501250 C 2011-02-03 1996-07-31 Component of the kinetochore-associated Ndc80 complex; involved in chromosome segregation, spindle checkpoint activity, and kinetochore clustering; evolutionarily conserved; other members include Ndc80p, Nuf2p, Spc24p, and Spc25p +S000031427 CDS YMR117C 13 501891 501250 C 2011-02-03 1996-07-31 +S000004724 ORF Uncharacterized YMR118C SHH3 protein SHH3 chromosome 13 13 502734 502144 C 2011-02-03 1996-07-31 Putative mitochondrial inner membrane protein of unknown function; although similar to paralogous Sdh3p, Shh3p is not a stoichiometric subunit of either succinate dehydrogenase or of the TIM22 translocase; SHH3 has a paralog, SDH3, that arose from the whole genome duplication +S000032434 CDS YMR118C 13 502734 502144 C 2011-02-03 1996-07-31 +S000007123 long_terminal_repeat YMRWdelta16 chromosome 13 13 503192 503389 W 2011-02-03 2000-05-19 Ty1 LTR +S000130189 ARS ARS1319 chromosome 13 13 503389 503771 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000007128 long_terminal_repeat YMRWtau2 chromosome 13 13 503771 504141 W 2011-02-03 2000-05-19 Ty4 LTR +S000007124 long_terminal_repeat YMRWdelta17 chromosome 13 13 504346 504677 W 2011-02-03 2000-05-19 Ty1 LTR +S000006644 tRNA_gene tL(CAA)M chromosome 13 L000003671 13 504895 505008 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000033800 intron tL(CAA)M 13 504933 504964 W 2011-02-03 2000-05-19 +S000033798 noncoding_exon tL(CAA)M 13 504895 504932 W 2011-02-03 2000-05-19 +S000033799 noncoding_exon tL(CAA)M 13 504965 505008 W 2011-02-03 2000-05-19 +S000004725 ORF Verified YMR119W ASI1 putative ubiquitin-protein ligase ASI1 chromosome 13 13 505333 507207 W 2011-02-03 1996-07-31 Subunit of the inner nuclear membrane Asi ubiquitin ligase complex; the Asi complex targets both misfolded proteins of the inner nuclear membrane-associated degradation (INMAD) pathway and regulators of sterol biosynthesis for ubiquitin-mediated degradation; acts with Asi2p and Asi3p to ensure the fidelity of SPS-sensor signaling by targeting latent unprocessed forms of Stp1p and Stp2p, maintaining the repressed state of gene expression in the absence of inducing amino acids +S000032577 CDS YMR119W 13 505333 507207 W 2011-02-03 1996-07-31 +S000004726 ORF Dubious YMR119W-A chromosome 13 13 506996 507370 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 3' end of ORF ASI1/YMR119W +S000037793 CDS YMR119W-A 13 506996 507370 W 2011-02-03 1996-07-31 +S000004727 ORF Verified YMR120C ADE17 bifunctional phosphoribosylaminoimidazolecarboxamide formyltransferase/IMP cyclohydrolase ADE17 chromosome 13 L000003306 13 509280 507502 C 2011-02-03 1996-07-31 Enzyme of 'de novo' purine biosynthesis; contains both 5-aminoimidazole-4-carboxamide ribonucleotide transformylase and inosine monophosphate cyclohydrolase activities; ADE17 has a paralog, ADE16, that arose from the whole genome duplication; ade16 ade17 mutants require adenine and histidine +S000033275 CDS YMR120C 13 509280 507502 C 2011-02-03 1996-07-31 +S000004728 ORF Verified YMR121C RPL15B eL15|ribosomal 60S subunit protein L15B|L15e|rp15R|YL10|L15B|L13B chromosome 13 L000004456 13 510348 509734 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L15B; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L15, no bacterial homolog; RPL15B has a paralog, RPL15A, that arose from the whole genome duplication; relocalizes from nucleus to nucleolus upon DNA replication stress +S000033342 CDS YMR121C 13 510348 509734 C 2011-02-03 1996-07-31 +S000004729 ORF Uncharacterized YMR122C chromosome 13 13 511075 510701 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR122C is not an essential gene +S000033409 CDS YMR122C 13 511075 510701 C 2011-02-03 1996-07-31 +S000007524 ORF Uncharacterized YMR122W-A chromosome 13 13 511315 511569 W 2011-02-03 2000-07-14 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and endoplasmic reticulum +S000037063 CDS YMR122W-A 13 511315 511569 W 2011-02-03 2000-07-14 +S000004730 ORF Verified YMR123W PKR1 chromosome 13 13 513593 513961 W 2011-02-03 1996-07-31 V-ATPase assembly factor; functions with other V-ATPase assembly factors in the ER to efficiently assemble the V-ATPase membrane sector (V0); protein abundance increases in response to DNA replication stress +S000034386 CDS YMR123W 13 513593 513961 W 2011-02-03 1996-07-31 +S000004731 ORF Verified YMR124W EPO1 chromosome 13 13 514456 517287 W 2011-02-03 1996-07-31 Protein involved in septin-ER tethering; interacts with ER membrane protein, Scs2p, and Shs1p, a septin ring component, at bud neck to create ER diffusion barrier; GFP-fusion protein localizes to the cell periphery, cytoplasm, bud, and bud neck; interacts with Crm1p in two-hybrid assay; YMR124W has a paralog, YLR031W, that arose from the whole genome duplication +S000034454 CDS YMR124W 13 514456 517287 W 2011-02-03 1996-07-31 +S000004732 ORF Verified YMR125W STO1 SUT1|CBP80|GCR3|CBC1 chromosome 13 L000002131 13 517539 520446 W 87 2011-02-03 1999-11-17|1996-07-31 Large subunit of the nuclear mRNA cap-binding protein complex; interacts with Npl3p to carry nuclear poly(A)+ mRNA to cytoplasm; also involved in nuclear mRNA degradation and telomere maintenance; orthologous to mammalian CBP80 +S000035482 CDS YMR125W 13 517539 517563 W 2011-02-03 1999-11-17|1996-07-31 +S000035483 CDS YMR125W 13 517886 520446 W 2011-02-03 1999-11-17 +S000035484 intron YMR125W 13 517564 517885 W 2011-02-03 1999-11-17 +S000004733 ORF Uncharacterized YMR126C DLT1 chromosome 13 13 521789 520761 C 2011-02-03 1996-07-31 Protein of unknown function; mutant sensitive to 6-azauracil (6AU) and mycophenolic acid (MPA) +S000035540 CDS YMR126C 13 521789 520761 C 2011-02-03 1996-07-31 +S000004734 ORF Verified YMR127C SAS2 KAT8 chromosome 13 L000001802 13 523345 522329 C 2011-02-03 1996-07-31 Histone acetyltransferase (HAT) catalytic subunit of the SAS complex; acetylates free histones and nucleosomes and regulates transcriptional silencing; member of the MYSTacetyltransferase family; other members are Sas4p and Sas5p +S000035616 CDS YMR127C 13 523345 522329 C 2011-02-03 1996-07-31 +S000004735 ORF Verified YMR128W ECM16 ATP-dependent RNA helicase ECM16|DHR1 chromosome 13 L000003891 13 523696 527499 W 2011-02-03 1996-07-31 Essential DEAH-box ATP-dependent RNA helicase specific to U3 snoRNP; predominantly nucleolar in distribution; required for 18S rRNA synthesis +S000035779 CDS YMR128W 13 523696 527499 W 2011-02-03 1996-07-31 +S000004736 ORF Verified YMR129W POM152 chromosome 13 L000001464 13 527804 531817 W 2011-02-03 1996-07-31 Glycoprotein subunit of transmembrane ring of nuclear pore complex; contributes to nucleocytoplasmic transport, nuclear pore complex (NPC) biogenesis and spindle pole body duplication; homologous to human NUP210 +S000036687 CDS YMR129W 13 527804 531817 W 2011-02-03 1996-07-31 +S000004737 ORF Uncharacterized YMR130W chromosome 13 13 532119 533027 W 2011-02-03 1996-07-31 Putative protein of unknown function; YMR130W is not an essential gene +S000036551 CDS YMR130W 13 532119 533027 W 2011-02-03 1996-07-31 +S000004738 ORF Verified YMR131C RRB1 ribosome biosynthesis protein RRB1 chromosome 13 13 534698 533163 C 2011-02-03 1996-07-31 Specific chaperone for ribosomal protein Rpl3p; binds to nascent Rpl3p during translation; essential gene +S000036599 CDS YMR131C 13 534698 533163 C 2011-02-03 1996-07-31 +S000004739 ORF Uncharacterized YMR132C JLP2 chromosome 13 13 535570 534944 C 2011-02-03 1996-07-31 Protein of unknown function; contains sequence that closely resembles a J domain (typified by the E. coli DnaJ protein) +S000036706 CDS YMR132C 13 535570 534944 C 2011-02-03 1996-07-31 +S000118373 ARS ARS1320 ARSXIII-536 chromosome 13 13 535597 535844 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178158 ARS_consensus_sequence ARS1320 13 535770 535754 C 2014-11-18 2014-11-18 +S000004740 ORF Verified YMR133W REC114 chromosome 13 L000001607 13 536207 537609 W 91 2011-02-03 1999-07-17|1996-07-31 Protein involved in early stages of meiotic recombination; possibly involved in the coordination of recombination and meiotic division; mutations lead to premature initiation of the first meiotic division +S000037485 CDS YMR133W 13 536207 537448 W 2011-02-03 1999-07-17|1996-07-31 +S000037486 CDS YMR133W 13 537565 537609 W 2011-02-03 1999-07-17 +S000037487 intron YMR133W 13 537449 537564 W 2011-02-03 1999-07-17 +S000004741 ORF Verified YMR134W ERG29 chromosome 13 13 537838 538551 W 2011-02-03 1996-07-31 Protein of unknown function involved in ergosterol biosynthesis; conditional mutants produce less ergosterol, display impaired oxygen consumption, respiratory growth, mitochondrial iron utilization, and are more sensitive to oxidative stress; mutant bm-8 has a growth defect on iron-limited medium that is complemented by overexpression of Yfh1p; protein localizes to the cytoplasm, ER and nuclear envelope; highly conserved in ascomycetes +S000037629 CDS YMR134W 13 537838 538551 W 2011-02-03 1996-07-31 +S000004743 ORF Dubious YMR135W-A chromosome 13 13 539911 540444 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036832 CDS YMR135W-A 13 539911 540444 W 2011-02-03 1996-07-31 +S000004742 ORF Verified YMR135C GID8 glucose-induced degradation complex subunit GID8|DCR1 chromosome 13 13 540056 538689 C 2011-02-03 1996-07-31 Subunit of GID Complex, binds strongly to central component Vid30p; GID Complex is involved in proteasome-dependent catabolite inactivation of fructose-1,6-bisphosphatase; recruits Rmd5p, Fyv10 and Vid28p to GID Complex; contains LisH, CTLH, and CRA domains that mediate binding to Vid30p (LisH) and Rmd5p and Vid28p (CTLH and CRA); dosage-dependent regulator of START +S000030355 CDS YMR135C 13 540056 538689 C 2011-02-03 1996-07-31 +S000004744 ORF Verified YMR136W GAT2 chromosome 13 S000007443 13 541199 542881 W 2011-02-03 1996-07-31 Protein containing GATA family zinc finger motifs; similar to Gln3p and Dal80p; expression repressed by leucine +S000030544 CDS YMR136W 13 541199 542881 W 2011-02-03 1996-07-31 +S000130190 ARS ARS1321 chromosome 13 13 542881 542978 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004745 ORF Verified YMR137C PSO2 SNM1 chromosome 13 L000001953 13 544963 542978 C 2011-02-03 1996-07-31 Nuclease required for DNA single- and double-strand break repair; acts at a post-incision step in repair of breaks that result from interstrand cross-links produced by a variety of mono- and bi-functional psoralen derivatives; induced by UV-irradiation; forms nuclear foci upon DNA replication stress +S000030595 CDS YMR137C 13 544963 542978 C 2011-02-03 1996-07-31 +S000004746 ORF Verified YMR138W CIN4 Arf family GTPase CIN4|UGX1|GTP1 chromosome 13 L000000338 13 545155 545730 W 86 2011-02-03 1996-07-31 GTP-binding protein involved in beta-tubulin (Tub2p) folding; isolated as mutant with increased chromosome loss and sensitivity to benomyl; regulated by the GTPase-activating protein, Cin2p, the human retinitis pigmentosa 2 (RP2) homolog +S000031508 CDS YMR138W 13 545155 545730 W 2011-02-03 1996-07-31 +S000004747 ORF Verified YMR139W RIM11 serine/threonine protein kinase RIM11|MDS1|GSK3 chromosome 13 L000001056 13 546125 547237 W 2011-02-03 1996-07-31 Protein kinase; required for signal transduction during entry into meiosis; promotes the formation of the Ime1p-Ume6p complex by phosphorylating Ime1p and Ume6p; shares similarity with mammalian glycogen synthase kinase 3-beta; protein abundance increases in response to DNA replication stress; RIM11 has a paralog, MRK1, that arose from the whole genome duplication +S000031611 CDS YMR139W 13 546125 547237 W 2011-02-03 1996-07-31 +S000004748 ORF Verified YMR140W SIP5 chromosome 13 13 547714 549183 W 2011-02-03 1996-07-31 Protein of unknown function; interacts with both the Reg1p/Glc7p phosphatase and the Snf1p kinase; forms cytoplasmic foci upon DNA replication stress +S000031580 CDS YMR140W 13 547714 549183 W 2011-02-03 1996-07-31 +S000004749 ORF Uncharacterized YMR141C chromosome 13 13 550044 549736 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR141C is not an essential gene +S000031632 CDS YMR141C 13 550044 549736 C 2011-02-03 1996-07-31 +S000028575 ORF Dubious YMR141W-A chromosome 13 13 550911 551135 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene RPL13B/YMR142C +S000031304 CDS YMR141W-A 13 550911 551135 W 2011-02-03 2003-07-29 +S000004750 ORF Verified YMR142C RPL13B eL13|ribosomal 60S subunit protein L13B|L13e|L13B chromosome 13 L000004455 13 551207 550206 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L13B; not essential for viability; homologous to mammalian ribosomal protein L13, no bacterial homolog; RPL13B has a paralog, RPL13A, that arose from the whole genome duplication +S000032639 CDS YMR142C 13 550801 550206 C 2011-02-03 1996-07-31 +S000032638 CDS YMR142C 13 551207 551204 C 2011-02-03 1996-07-31 +S000032640 intron YMR142C 13 551203 550802 C 2011-02-03 1996-07-31 +S000004751 ORF Verified YMR143W RPS16A uS9|ribosomal 40S subunit protein S16A|S9|rp61R|S16A chromosome 13 L000004477 13 551928 552903 W 2011-02-03 2000-07-22|1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S16 and bacterial S9; RPS16A has a paralog, RPS16B, that arose from the whole genome duplication +S000032779 CDS YMR143W 13 551928 551951 W 2011-02-03 2000-07-22|1996-07-31 +S000032780 CDS YMR143W 13 552496 552903 W 2011-02-03 1996-07-31 +S000032781 intron YMR143W 13 551952 552495 W 2011-02-03 2000-07-22|1996-07-31 +S000004752 ORF Uncharacterized YMR144W FDO1 chromosome 13 13 553362 554390 W 2011-02-03 1996-07-31 Protein involved in directionality of mating type switching; acts with Fkh1p to control which donor mating-type locus is inserted into MAT locus during mating type switching; localized to the nucleus; not an essential gene +S000033505 CDS YMR144W 13 553362 554390 W 2011-02-03 1996-07-31 +S000130191 ARS ARS1322 chromosome 13 13 553422 554331 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004753 ORF Verified YMR145C NDE1 NADH-ubiquinone reductase (H(+)-translocating) NDE1|NDH1 chromosome 13 13 556475 554793 C 2011-02-03 1996-07-31 Mitochondrial external NADH dehydrogenase; type II NAD(P)H:quinone oxidoreductase that catalyzes the oxidation of cytosolic NADH; Nde1p and Nde2p provide cytosolic NADH to the mitochondrial respiratory chain; NDE1 has a paralog, NDE2, that arose from the whole genome duplication +S000033554 CDS YMR145C 13 556475 554793 C 2011-02-03 1996-07-31 +S000004754 ORF Verified YMR146C TIF34 translation initiation factor eIF3 subunit i chromosome 13 L000003329 13 558524 557481 C 2011-02-03 1996-07-31 eIF3i subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; essential for translation; stimulates rate of ribosomal scanning during translation reinitiation; eIF3 is also involved in programmed stop codon readthrough +S000033644 CDS YMR146C 13 558524 557481 C 2011-02-03 1996-07-31 +S000004755 ORF Uncharacterized YMR147W chromosome 13 13 559199 559870 W 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cell periphery +S000033833 CDS YMR147W 13 559199 559870 W 2011-02-03 1996-07-31 +S000004756 ORF Verified YMR148W OSW5 chromosome 13 13 560366 560812 W 2011-02-03 1996-07-31 Protein of unknown function with possible role in spore wall assembly; predicted to contain an N-terminal transmembrane domain; osw5 null mutant spores exhibit increased spore wall permeability and sensitivity to beta-glucanase digestion +S000034741 CDS YMR148W 13 560366 560812 W 2011-02-03 1996-07-31 +S000004757 ORF Verified YMR149W SWP1 dolichyl-diphosphooligosaccharide-protein glycotransferase chromosome 13 L000002255 13 560996 561856 W 2011-02-03 1996-07-31 Delta subunit of the oligosaccharyl transferase glycoprotein complex; complex is required for N-linked glycosylation of proteins in the endoplasmic reticulum +S000034875 CDS YMR149W 13 560996 561856 W 2011-02-03 1996-07-31 +S000004759 ORF Dubious YMR151W YIM2 chromosome 13 L000002672 13 562506 562943 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 5% of ORF overlaps the verified gene IMP1 +S000036792 CDS YMR151W 13 562506 562943 W 2011-02-03 1996-07-31 +S000004758 ORF Verified YMR150C IMP1 endopeptidase catalytic subunit IMP1|PET-TS2858 chromosome 13 L000000864 13 562528 561956 C 92 2011-02-03 1996-07-31 Catalytic subunit of mitochondrial inner membrane peptidase complex; required for maturation of mitochondrial proteins of the intermembrane space; complex contains two catalytic subunits (Imp1p and Imp2p that differ in substrate specificty) and Som1p +S000035827 CDS YMR150C 13 562528 561956 C 2011-02-03 1996-07-31 +S000004760 ORF Verified YMR152W YIM1 chromosome 13 L000002671 13 563096 564193 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays sensitivity to DNA damaging agents; may have a role in lipid metabolism, based on localization to lipid droplets; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress +S000036879 CDS YMR152W 13 563096 564193 W 2011-02-03 1996-07-31 +S000004762 ORF Verified YMR153W NUP53 FG-nucleoporin NUP53 chromosome 13 13 564435 565862 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of nuclear pore complex (NPC); also part of the NPC nuclear basket; contributes directly to nucleocytoplasmic transport; involved in regulation of transcription and mitosis; induces membrane tubulation, which may contribute to nuclear pore assembly; NUP53 has a paralog, ASM4, that arose from the whole genome duplication +S000036930 CDS YMR153W 13 564435 565862 W 2011-02-03 1996-07-31 +S000004761 ORF Dubious YMR153C-A chromosome 13 13 565909 565574 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 3' end of verified gene NUP53/YMR153W +S000036598 CDS YMR153C-A 13 565909 565574 C 2011-02-03 1996-07-31 +S000004763 ORF Verified YMR154C RIM13 CPL1 chromosome 13 L000004172 13 568182 565999 C 2011-02-03 1996-07-31 Calpain-like cysteine protease; involved in proteolytic activation of Rim101p in response to alkaline pH; localizes to punctate structures in alkaline conditions and in vps4 mutant; has similarity to A. nidulans palB +S000036955 CDS YMR154C 13 568182 565999 C 2011-02-03 1996-07-31 +S000004764 ORF Uncharacterized YMR155W chromosome 13 13 568551 570194 W 2011-02-03 1996-07-31 Putative protein of unknown function; identified as interacting with Hsp82p in a high-throughput two-hybrid screen +S000037749 CDS YMR155W 13 568551 570194 W 2011-02-03 1996-07-31 +S000004765 ORF Verified YMR156C TPP1 polynucleotide 3'-phosphatase chromosome 13 13 571016 570300 C 2011-02-03 1996-07-31 DNA 3'-phosphatase; functions in repair of endogenous damage of double-stranded DNA, activity is specific for removal of 3' phosphates at strand breaks; similar to the l-2-haloacid dehalogenase superfamily; homolog of human polynucleotide kinase/3'-phosphatase +S000037789 CDS YMR156C 13 571016 570300 C 2011-02-03 1996-07-31 +S000004766 ORF Verified YMR157C AIM36 FMP39 chromosome 13 13 572044 571277 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays reduced respiratory growth and elevated frequency of mitochondrial genome loss; the authentic, non-tagged protein is detected in purified mitochondria in high-throughput studies +S000037876 CDS YMR157C 13 572044 571277 C 2011-02-03 1996-07-31 +S000004767 ORF Verified YMR158W MRPS8 mitochondrial 37S ribosomal protein MRPS8 chromosome 13 13 572248 572715 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000030873 CDS YMR158W 13 572248 572715 W 2011-02-03 1996-07-31 +S000006664 tRNA_gene tM(CAU)M EMT4 chromosome 13 L000003677|L000000554 13 572955 572883 C 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis +S000034574 noncoding_exon tM(CAU)M 13 572955 572883 C 2011-02-03 2000-05-19 +S000007249 ORF Uncharacterized YMR158C-A YMR158C-B chromosome 13 13 573331 573194 C 2011-02-03 1997-07-17 Putative protein of unknown function; may contain a lipid attachment site; YMR158C-A is not an essential gene +S000030986 CDS YMR158C-A 13 573331 573194 C 2011-02-03 1997-07-17 +S000007116 long_terminal_repeat YMRCdelta18 chromosome 13 13 573338 573112 C 2011-02-03 2000-05-19 Ty1 LTR +S000004768 ORF Dubious YMR158W-B YMR158W-A chromosome 13 13 574471 574791 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene ATG16/YMR159C +S000034209 CDS YMR158W-B 13 574471 574791 W 2011-02-03 1996-07-31 +S000004769 ORF Verified YMR159C ATG16 APG15|APG16|CVT11|SAP18 chromosome 13 L000004135|L000004762|S000029036|L000004787 13 574928 574476 C 2011-02-03 1996-07-31 Conserved protein involved in autophagy; interacts with Atg12p-Atg5p conjugates to form Atg12p-Atg5p-Atg16p multimers, which binds to membranes and localizes to the pre-autophagosomal structure and are required for autophagy; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000030904 CDS YMR159C 13 574928 574476 C 2011-02-03 1996-07-31 +S000004770 ORF Verified YMR160W chromosome 13 13 575066 577516 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the membrane of the vacuole; mutant has enhanced sensitivity to overexpression of mutant huntingtin; YMR160W is not an essential gene; relative distribution within the vacuolar membrane changes upon DNA replication stress +S000032016 CDS YMR160W 13 575066 577516 W 2011-02-03 1996-07-31 +S000004771 ORF Verified YMR161W HLJ1 type I HSP40 co-chaperone HLJ1 chromosome 13 L000002962 13 577718 578392 W 2011-02-03 1996-07-31 Co-chaperone for Hsp40p; anchored in the ER membrane; with its homolog Ydj1p promotes ER-associated protein degradation (ERAD) of integral membrane substrates; similar to E. coli DnaJ +S000032125 CDS YMR161W 13 577718 578392 W 2011-02-03 1996-07-31 +S000004772 ORF Verified YMR162C DNF3 aminophospholipid-translocating P4-type ATPase DNF3 chromosome 13 13 583921 578951 C 2011-02-03 1996-07-31 Trans-golgi network aminophospholipid translocase (flippase); type 4 P-type ATPase; involved in phospholipid translocation, contributing to the maintenance of membrane lipid asymmetry in post-Golgi secretory vesicles; role in protein trafficking between the Golgi and endosomal system; localizes to the trans-Golgi network; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone +S000032992 CDS YMR162C 13 583921 578951 C 2011-02-03 1996-07-31 +S000004773 ORF Verified YMR163C INP2 chromosome 13 13 586388 584271 C 2011-02-03 1996-07-31 Peroxisome-specific receptor important for peroxisome inheritance; co-fractionates with peroxisome membranes and co-localizes with peroxisomes in vivo; physically interacts with the myosin V motor Myo2p; INP2 is not an essential gene +S000033087 CDS YMR163C 13 586388 584271 C 2011-02-03 1996-07-31 +S000006765 tRNA_gene tV(AAC)M3 chromosome 13 L000003676 13 586709 586636 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000030039 noncoding_exon tV(AAC)M3 13 586709 586636 C 2011-02-03 2000-05-19 +S000004774 ORF Verified YMR164C MSS11 chromosome 13 L000003920 13 589550 587274 C 2011-02-03 1996-07-31 Transcription factor; involved in regulation of invasive growth and starch degradation; controls the activation of FLO11 and STA2 in response to nutritional signals; forms a heterodimer with Flo8p that interacts with the Swi/Snf complex during transcriptional activation of FLO1, FLO11, and STA1 +S000033162 CDS YMR164C 13 589550 587274 C 2011-02-03 1996-07-31 +S000004775 ORF Verified YMR165C PAH1 phosphatidate phosphatase PAH1|SMP2 chromosome 13 L000001934 13 592628 590040 C 2011-02-03 1996-07-31 Mg2+-dependent phosphatidate (PA) phosphatase; dephosphorylates PA to yield diacylglycerol; regulates phospholipid synthesis, nuclear/ER membrane growth, lipid droplet formation, triacylglycerol synthesis, vacuolar homeostasis and cell wall integrity; phosphorylated by Pho85p/Pho80p, Cdc28p/Cyclin B, PKA, PKC, and CKII, regulating activity, localization, and proteosomal degradation; homolog of mammalian lipins 1 and 2; human homologs LPIN1, LPIN2, LPIN3 complement the null +S000033959 CDS YMR165C 13 592628 590040 C 2011-02-03 1996-07-31 +S000004776 ORF Verified YMR166C MME1 chromosome 13 13 594473 593367 C 2011-02-03 1996-07-31 Transporter of the mitochondrial inner membrane that exports magnesium; involved in mitochondrial Mg2+ homeostasis; has similarity to human mitochondrial ATP-Mg/Pi carriers +S000034071 CDS YMR166C 13 594473 593367 C 2011-02-03 1996-07-31 +S000004777 ORF Verified YMR167W MLH1 mismatch repair ATPase MLH1|PMS2 chromosome 13 L000001121 13 594886 597195 W 2011-02-03 1996-07-31 Protein required for mismatch repair in mitosis and meiosis; also required for crossing over during meiosis; forms a complex with Pms1p and Msh2p-Msh3p during mismatch repair; human homolog is associated with hereditary non-polyposis colon cancer +S000034230 CDS YMR167W 13 594886 597195 W 2011-02-03 1996-07-31 +S000004778 ORF Verified YMR168C CEP3 CSL1|CBF3B|CBF3 chromosome 13 L000000312|L000000222 13 599158 597332 C 2011-02-03 1996-07-31 Essential kinetochore protein; component of the CBF3 complex that binds the CDEIII region of the centromere; contains an N-terminal Zn2Cys6 type zinc finger domain, a C-terminal acidic domain, and a putative coiled coil dimerization domain +S000035106 CDS YMR168C 13 599158 597332 C 2011-02-03 1996-07-31 +S000004779 ORF Verified YMR169C ALD3 aldehyde dehydrogenase (NAD(+)) ALD3 chromosome 13 L000002992 13 600872 599352 C 2011-02-03 1996-07-31 Cytoplasmic aldehyde dehydrogenase; involved in beta-alanine synthesis; uses NAD+ as the preferred coenzyme; very similar to Ald2p; expression is induced by stress and repressed by glucose +S000035214 CDS YMR169C 13 600872 599352 C 2011-02-03 1996-07-31 +S000004780 ORF Verified YMR170C ALD2 aldehyde dehydrogenase (NAD(+)) ALD2 chromosome 13 L000003120|L000002991 13 603082 601562 C 2011-02-03 1996-07-31 Cytoplasmic aldehyde dehydrogenase; involved in ethanol oxidation and beta-alanine biosynthesis; uses NAD+ as the preferred coenzyme; expression is stress induced and glucose repressed; very similar to Ald3p +S000036140 CDS YMR170C 13 603082 601562 C 2011-02-03 1996-07-31 +S000004781 ORF Verified YMR171C EAR1 chromosome 13 13 605520 603868 C 2011-02-03 1996-07-31 Specificity factor required for Rsp5p-dependent ubiquitination; also required for sorting of specific cargo proteins at the multivesicular body; mRNA is targeted to the bud via the mRNA transport system involving She2p +S000036240 CDS YMR171C 13 605520 603868 C 2011-02-03 1996-07-31 +S000004783 ORF Verified YMR172W HOT1 chromosome 13 L000004957 13 605981 608140 W 2011-02-03 1996-07-31 Transcription factor for glycerol biosynthetic genes; required for the transient induction of glycerol biosynthetic genes GPD1 and GPP2 in response to high osmolarity; targets Hog1p to osmostress responsive promoters; has similarity to Msn1p and Gcr1p +S000031822 CDS YMR172W 13 605981 608140 W 2011-02-03 1996-07-31 +S000004782 ORF Dubious YMR172C-A chromosome 13 13 608211 607828 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 3' end of ORF HOT1/YMR172W +S000034962 CDS YMR172C-A 13 608211 607828 C 2011-02-03 1996-07-31 +S000004784 ORF Verified YMR173W DDR48 DNA damage-responsive protein 48|FSP chromosome 13 L000000498 13 608689 609981 W 2011-02-03 1996-07-31 DNA damage-responsive protein; expression is increased in response to heat-shock stress or treatments that produce DNA lesions; contains multiple repeats of the amino acid sequence NNNDSYGS; protein abundance increases in response to DNA replication stress +S000031955 CDS YMR173W 13 608689 609981 W 2011-02-03 1996-07-31 +S000004785 ORF Dubious YMR173W-A chromosome 13 13 608897 610081 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene DDR48/YML173W +S000030427 CDS YMR173W-A 13 608897 610081 W 2011-02-03 1996-07-31 +S000004786 ORF Verified YMR174C PAI3 IA3 chromosome 13 L000001332 13 610365 610159 C 2011-02-03 1996-07-31 Cytoplasmic proteinase A (Pep4p) inhibitor; dependent on Pbs2p and Hog1p protein kinases for osmotic induction; intrinsically unstructured, N-terminal half becomes ordered in the active site of proteinase A upon contact +S000031994 CDS YMR174C 13 610365 610159 C 2011-02-03 1996-07-31 +S000004787 ORF Verified YMR175W SIP18 chromosome 13 L000002670 13 611016 611255 W 2011-02-03 1996-07-31 Phospholipid-binding hydrophilin; essential to overcome desiccation-rehydration process; expression is induced by osmotic stress; SIP18 has a paralog, GRE1, that arose from the whole genome duplication +S000037525 CDS YMR175W 13 611016 611255 W 2011-02-03 1996-07-31 +S000118374 ARS ARS1323 ARSXIII-611 chromosome 13 13 611275 611489 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178159 ARS_consensus_sequence ARS1323 13 611317 611333 W 2014-11-18 2014-11-18 +S000028848 ORF Uncharacterized YMR175W-A chromosome 13 13 611314 611508 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000034535 CDS YMR175W-A 13 611314 611508 W 2011-02-03 2003-07-29 +S000004788 ORF Verified YMR176W ECM5 chromosome 13 L000003881 13 611740 615975 W 2011-02-03 1996-07-31 Subunit of the Snt2C complex; physically associates with Snt2p and Rpd3p; along with Snt2p, recruits Rpd3p to a small number of promoters; also colocalizes with Snt2p, independently of Rpd3p, to promoters of stress response genes in response to oxidative stress; contains ATP/GTP-binding site motif A; null mutant exhibits increased cellular volume, large drooping buds with elongated necks; relative distribution to the nucleus increases upon DNA replication stress +S000037587 CDS YMR176W 13 611740 615975 W 2011-02-03 1996-07-31 +S000004789 ORF Verified YMR177W MMT1 MFT1 chromosome 13 L000004107 13 616566 618098 W 2011-02-03 1996-07-31 Putative metal transporter involved in mitochondrial iron accumulation; MMT1 has a paralog, MMT2, that arose from the whole genome duplication +S000037682 CDS YMR177W 13 616566 618098 W 2011-02-03 1996-07-31 +S000004790 ORF Verified YMR178W chromosome 13 13 618479 619303 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and nucleus; YMR178W is not an essential gene; protein abundance increases in response to DNA replication stress +S000030501 CDS YMR178W 13 618479 619303 W 2011-02-03 1996-07-31 +S000004791 ORF Verified YMR179W SPT21 chromosome 13 L000002040 13 619858 622134 W 2011-02-03 1996-07-31 Protein with a role in transcriptional silencing; required for normal transcription at several loci including HTA2-HTB2 and HHF2-HHT2, but not required at the other histone loci; functionally related to Spt10p; localizes to nuclear foci that become diffuse upon DNA replication stress +S000030565 CDS YMR179W 13 619858 622134 W 2011-02-03 1996-07-31 +S000004792 ORF Verified YMR180C CTL1 polynucleotide 5'-phosphatase|CTH1 chromosome 13 S000007412 13 623213 622251 C 2011-02-03 1996-07-31 RNA 5'-triphosphatase, localizes to both the nucleus and cytoplasm; CTL1 has a paralog, CET1, that arose from the whole genome duplication +S000037398 CDS YMR180C 13 623213 622251 C 2011-02-03 1996-07-31 +S000004793 ORF Uncharacterized YMR181C chromosome 13 13 624080 623616 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA transcribed as part of a bicistronic transcript with a predicted transcriptional repressor RGM1/YMR182C; mRNA is destroyed by nonsense-mediated decay (NMD); not an essential gene; YMR181C has a paralog, YPL229W, that arose from the whole genome duplication +S000030034 CDS YMR181C 13 624080 623616 C 2011-02-03 1996-07-31 +S000004794 ORF Verified YMR182C RGM1 chromosome 13 L000001627 13 625167 624532 C 2011-02-03 1996-07-31 Putative zinc finger DNA binding transcription factor; contains two N-terminal C2H2 zinc fingers and C-terminal proline rich domain; overproduction impairs cell growth and induces expression of genes involved in monosaccharide catabolism and aldehyde metabolism; regulates expression of of Y' telomeric elements and subtelomeric COS genes; relocalizes to the cytosol in response to hypoxia; RGM1 has a paralog, USV1, that arose from the whole genome duplication +S000030142 CDS YMR182C 13 625167 624532 C 2011-02-03 1996-07-31 +S000028693 ORF Uncharacterized YMR182W-A chromosome 13 13 625811 625897 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000032593 CDS YMR182W-A 13 625811 625897 W 2011-02-03 2003-07-29 +S000028468 snoRNA_gene snR83 SNR83 RUF3 chromosome 13 13 626349 626654 W 2011-02-03 2004-04-01 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at positions U1290 and U1415 +S000030105 noncoding_exon snR83 13 626349 626654 W 2011-02-03 2004-04-01 +S000004795 ORF Verified YMR183C SSO2 syntaxin chromosome 13 L000002090 13 627808 626921 C 2011-02-03 1996-07-31 Plasma membrane t-SNARE; involved in fusion of secretory vesicles at the plasma membrane; syntaxin homolog that is functionally redundant with Sso1p; SSO2 has a paralog, SSO1, that arose from the whole genome duplication +S000030342 CDS YMR183C 13 627808 626921 C 2011-02-03 1996-07-31 +S000004796 ORF Verified YMR184W ADD37 chromosome 13 13 628189 628785 W 2011-02-03 1996-07-31 Protein of unknown function; involved in ER-associated protein degradation; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and is induced in response to the DNA-damaging agent MMS; YMR184W is not an essential gene; protein abundance increases in response to DNA replication stress +S000033702 CDS YMR184W 13 628189 628785 W 2011-02-03 1996-07-31 +S000004797 ORF Verified YMR185W RTP1 chromosome 13 13 629025 631970 W 2011-02-03 1996-07-31 Protein required for the nuclear import and biogenesis of RNA pol II; conflicting evidence on whether null mutant is viable with elongated buds, or inviable; interacts with Rpb2, Rpb3, Nup116p, Nup100p and components of the R2TP complex (Rvb1p, Rvb2p, Pih1p); similar to human TMCO7 gene +S000033842 CDS YMR185W 13 629025 631970 W 2011-02-03 1996-07-31 +S000004798 ORF Verified YMR186W HSC82 Hsp90 family chaperone HSC82|HSP90 chromosome 13 L000000813 13 632355 634472 W 2011-02-03 1996-07-31 Cytoplasmic chaperone of the Hsp90 family; plays a role in determining prion variants; redundant in function and nearly identical with Hsp82p, and together they are essential; expressed constitutively at 10-fold higher basal levels than HSP82 and induced 2-3 fold by heat shock; contains two acid-rich unstructured regions that promote the solubility of chaperone-substrate complexes; HSC82 has a paralog, HSP82, that arose from the whole genome duplication +S000033979 CDS YMR186W 13 632355 634472 W 2011-02-03 1996-07-31 +S000118375 ARS ARS1324 ARSXIII-635 chromosome 13 13 634501 634588 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000004799 ORF Uncharacterized YMR187C chromosome 13 13 635984 634689 C 2011-02-03 1996-07-31 Putative protein of unknown function; YMR187C is not an essential gene +S000033992 CDS YMR187C 13 635984 634689 C 2011-02-03 1996-07-31 +S000004800 ORF Verified YMR188C MRPS17 mitochondrial 37S ribosomal protein MRPS17 chromosome 13 13 637004 636291 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000034878 CDS YMR188C 13 637004 636291 C 2011-02-03 1996-07-31 +S000004801 ORF Verified YMR189W GCV2 glycine decarboxylase subunit P|GSD2 chromosome 13 L000000734 13 637500 640604 W 2011-02-03 1996-07-31 P subunit of the mitochondrial glycine decarboxylase complex; glycine decarboxylase is required for the catabolism of glycine to 5,10-methylene-THF; expression is regulated by levels of 5,10-methylene-THF in the cytoplasm +S000035091 CDS YMR189W 13 637500 640604 W 2011-02-03 1996-07-31 +S000004802 ORF Verified YMR190C SGS1 ATP-dependent DNA helicase SGS1 chromosome 13 L000001877 13 645258 640915 C 115.6 2011-02-03 1996-07-31 RecQ family nucleolar DNA helicase; role in genome integrity maintenance, chromosome synapsis, meiotic joint molecule/crossover formation; stimulates activity of Top3p; rapidly lost in response to rapamycin in Rrd1p-dependent manner; forms nuclear foci upon DNA replication stress; yeast SGS1 complements mutations in human homolog BLM implicated in Bloom syndrome; also similar to human WRN implicated in Werner syndrome; human BLM and WRN can each complement yeast null mutant +S000034467 CDS YMR190C 13 645258 640915 C 2011-02-03 1996-07-31 +S000004803 ORF Verified YMR191W SPG5 chromosome 13 13 645656 646777 W 2011-02-03 2003-09-22|1996-07-31 Protein required for proteasome assembly during quiescence; binds to base of the proteasome regulartory particle; required for survival at high temperature during stationary phase; not required for growth on nonfermentable carbon sources +S000034638 CDS YMR191W 13 645656 646777 W 2011-02-03 2003-09-22|1996-07-31 +S000004804 ORF Verified YMR192W GYL1 APP2 chromosome 13 13 647118 649280 W 2011-02-03 1996-07-31 Putative GTPase activating protein (GAP) with a role in exocytosis; stimulates Gyp5p GAP activity on Ypt1p, colocalizes with Gyp5p at sites of polarized growth; interacts with Gyp5p, Rvs161p, and Rvs167p; involved in recruiting Rvs167p to the bud tip during polarized growth; increases in abundance and relocalizes from bud neck to cytoplasm upon DNA replication stress; GYL1 has a paralog, GYP5, that arose from the whole genome duplication +S000034769 CDS YMR192W 13 647118 649280 W 2011-02-03 1996-07-31 +S000118376 ARS ARS1325 ARSXIII-649 chromosome 13 13 649309 649552 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178160 ARS_consensus_sequence ARS1325 13 649361 649377 W 2014-11-18 2014-11-18 +S000004806 ORF Verified YMR193W MRPL24 mitochondrial 54S ribosomal protein YmL24/YmL14|YmL14|YmL24|MRPL14 chromosome 13 L000002690 13 650036 650812 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; two mitochondrial ribosomal proteins, YmL14 and YmL24, have been assigned to the same gene +S000035736 CDS YMR193W 13 650036 650812 W 2011-02-03 1996-07-31 +S000004807 ORF Verified YMR194W RPL36A eL36|ribosomal 60S subunit protein L36A|L36e|YL39|L39|L36A|RPL39B chromosome 13 L000004467|L000003236 13 651145 651910 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L36A; N-terminally acetylated; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L36, no bacterial homolog; RPL36A has a paralog, RPL36B, that arose from the whole genome duplication +S000035869 CDS YMR194W 13 651145 651160 W 2011-02-03 1996-07-31 +S000035870 CDS YMR194W 13 651624 651910 W 2011-02-03 1996-07-31 +S000035871 intron YMR194W 13 651161 651623 W 2011-02-03 1996-07-31 +S000004805 ORF Dubious YMR193C-A chromosome 13 13 651458 651072 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035259 CDS YMR193C-A 13 651458 651072 C 2011-02-03 1996-07-31 +S000007293 snoRNA_gene snR11 SNR11 chromosome 13 L000004943|L000002848 13 652275 652532 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2416 +S000036590 noncoding_exon snR11 13 652275 652532 W 2011-02-03 2000-05-19 +S000028514 ORF Verified YMR194C-B CMC4 chromosome 13 13 652887 652594 C 2011-02-03 2003-07-29 Protein that localizes to the mitochondrial intermembrane space; localizes via the Mia40p-Erv1p system; contains twin cysteine-x(9)-cysteine motifs +S000030281 CDS YMR194C-B 13 652775 652594 C 2011-02-03 2003-07-29 +S000030280 CDS YMR194C-B 13 652887 652848 C 2011-02-03 2003-07-29 +S000030282 intron YMR194C-B 13 652847 652776 C 2011-02-03 2003-07-29 +S000007250 ORF Dubious YMR194C-A chromosome 13 13 653136 652912 C 2011-02-03 1997-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037816 CDS YMR194C-A 13 653136 652912 C 2011-02-03 1997-07-17 +S000004808 ORF Verified YMR195W ICY1 chromosome 13 S000007527 13 654034 654417 W 2011-02-03 1996-07-31 Protein of unknown function; required for viability in rich media of cells lacking mitochondrial DNA; mutants have an invasive growth defect with elongated morphology; induced by amino acid starvation; ICY1 has a paralog, ICY2, that arose from the whole genome duplication +S000036003 CDS YMR195W 13 654034 654417 W 2011-02-03 1996-07-31 +S000004809 ORF Uncharacterized YMR196W chromosome 13 13 655076 658342 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YMR196W is not an essential gene +S000037847 CDS YMR196W 13 655076 658342 W 2011-02-03 1996-07-31 +S000004810 ORF Verified YMR197C VTI1 v-SNARE protein VTI1 chromosome 13 L000003598 13 659198 658545 C 2011-02-03 1996-07-31 Protein involved in cis-Golgi membrane traffic; v-SNARE that interacts with two t-SNARES, Sed5p and Pep12p; required for multiple vacuolar sorting pathways; human homolog VTI1A can complement yeast null mutant +S000037881 CDS YMR197C 13 659198 658545 C 2011-02-03 1996-07-31 +S000004811 ORF Verified YMR198W CIK1 chromosome 13 L000000335 13 659745 661529 W 2011-02-03 1996-07-31 Kinesin-associated protein; required for both karyogamy and mitotic spindle organization, interacts stably and specifically with Kar3p and may function to target this kinesin to a specific cellular role; locus encodes a long and short transcript with differing functions; CIK1 has a paralog, VIK1, that arose from the whole genome duplication +S000029971 CDS YMR198W 13 659745 661529 W 2011-02-03 1996-07-31 +S000004812 ORF Verified YMR199W CLN1 cyclin CLN1 chromosome 13 L000000357 13 662644 664284 W 2011-02-03 1996-07-31 G1 cyclin involved in regulation of the cell cycle; activates Cdc28p kinase to promote the G1 to S phase transition; late G1 specific expression depends on transcription factor complexes, MBF (Swi6p-Mbp1p) and SBF (Swi6p-Swi4p); CLN1 has a paralog, CLN2, that arose from the whole genome duplication; cell cycle arrest phenotype of the cln1 cln2 cln3 triple null mutant is complemented by any of human cyclins CCNA2, CCNB1, CCNC, CCND1, or CCNE1 +S000030961 CDS YMR199W 13 662644 664284 W 2011-02-03 1996-07-31 +S000004813 ORF Verified YMR200W ROT1 chromosome 13 L000003404 13 664752 665522 W 2011-02-03 1996-07-31 Molecular chaperone involved in protein folding in ER; mutation causes defects in cell wall synthesis and lysis of autophagic bodies, suppresses tor2 mutations, and is synthetically lethal with kar2-1 and with rot2 mutations; involved in N-linked glycosylation and O-mannosylation; transmembrane helix Ser250 is essential for Rot1p to interact with other membrane components and exert its functional role, avoiding exposure of Ser H-bonding group at lipid-exposed surface +S000035501 CDS YMR200W 13 664752 665522 W 2011-02-03 1996-07-31 +S000004814 ORF Verified YMR201C RAD14 chromosome 13 L000001564 13 667044 665845 C 2011-02-03 1996-07-31 Protein that recognizes and binds damaged DNA during NER; subunit of Nucleotide Excision Repair Factor 1 (NEF1); contains zinc finger motif; homolog of human XPA protein; NER stands for nucleotide excision repair +S000035530 CDS YMR201C 13 666933 665845 C 2011-02-03 1996-07-31 +S000035529 CDS YMR201C 13 667044 667018 C 2011-02-03 1996-07-31 +S000035531 intron YMR201C 13 667017 666934 C 2011-02-03 1996-07-31 +S000178149 matrix_attachment_site ETC5 ETC5 chromosome 13 13 667324 667346 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; located within ncRNA RNA170 which lies between divergently transcribed genes RAD14 and ERG2 +S000114171 ncRNA_gene RNA170 RNA170 chromosome 13 S000077076 13 667456 667288 C 2011-02-03 2006-01-23 RNA polymerase III transcribed RNA of unknown function; conserved in other yeast species +S000114172 noncoding_exon RNA170 13 667456 667288 C 2011-02-03 2006-01-23 +S000004815 ORF Verified YMR202W ERG2 C-8 sterol isomerase ERG2|END11 chromosome 13 L000000569|L000004560 13 667537 668205 W 2011-02-03 1996-07-31 C-8 sterol isomerase; catalyzes isomerization of delta-8 double bond to delta-7 position at an intermediate step in ergosterol biosynthesis; transcriptionally down-regulated when ergosterol is in excess; mutation is functionally complemented by human EBP +S000036484 CDS YMR202W 13 667537 668205 W 2011-02-03 1996-07-31 +S000004816 ORF Verified YMR203W TOM40 MOM38|ISP42 chromosome 13 L000000878 13 668492 669655 W 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; constitutes the core element of the protein conducting pore; pre-Tom40p is phosphorylated by PKA, which impairs its import into mitochondria under non-respiratory conditions +S000036557 CDS YMR203W 13 668492 669655 W 2011-02-03 1996-07-31 +S000004817 ORF Verified YMR204C INP1 chromosome 13 13 671325 670063 C 2011-02-03 1996-07-31 Peripheral membrane protein of peroxisomes; involved in peroxisomal inheritance; recruitment to peroxisomes is mediated by interaction with Pex3p at the peroxisomal membrane +S000036611 CDS YMR204C 13 671325 670063 C 2011-02-03 1996-07-31 +S000004818 ORF Verified YMR205C PFK2 6-phosphofructokinase subunit beta chromosome 13 L000001405 13 674766 671887 C 132 2011-02-03 1996-07-31 Beta subunit of heterooctameric phosphofructokinase; involved in glycolysis; indispensable for anaerobic growth; activated by fructose-2,6-bisphosphate and AMP; mutation inhibits glucose induction of cell cycle-related genes +S000036708 CDS YMR205C 13 674766 671887 C 2011-02-03 1996-07-31 +S000004819 ORF Uncharacterized YMR206W chromosome 13 13 675896 676837 W 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential gene; YMR206W has a paralog, YNR014W, that arose from the whole genome duplication +S000037504 CDS YMR206W 13 675896 676837 W 2011-02-03 1996-07-31 +S000004820 ORF Verified YMR207C HFA1 acetyl-CoA carboxylase HFA1 chromosome 13 L000000769 13 683564 677193 C 2011-02-03 1996-07-31 Mitochondrial acetyl-coenzyme A carboxylase; catalyzes production of malonyl-CoA in mitochondrial fatty acid biosynthesis; relocalizes from mitochondrion to cytoplasm upon DNA replication stress; genetic and comparative analysis suggests that translation begins at a non-canonical (Ile) start codon at -372 relative to the annotated start codon +S000037547 CDS YMR207C 13 683564 677193 C 2011-02-03 1996-07-31 +S000004821 ORF Verified YMR208W ERG12 mevalonate kinase|RAR1 chromosome 13 L000000578 13 684467 685798 W 176 2011-02-03 1996-07-31 Mevalonate kinase; acts in the biosynthesis of isoprenoids and sterols, including ergosterol, from mevalonate; human MVK functionally complements the lethality of the erg12 null mutation +S000030406 CDS YMR208W 13 684467 685798 W 2011-02-03 1996-07-31 +S000004822 ORF Uncharacterized YMR209C chromosome 13 13 687284 685911 C 2011-02-03 1996-07-31 Putative S-adenosylmethionine-dependent methyltransferase; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; YMR209C is not an essential gene +S000030480 CDS YMR209C 13 687284 685911 C 2011-02-03 1996-07-31 +S000004823 ORF Verified YMR210W MGL2 putative carboxylic ester hydrolase chromosome 13 13 687516 688865 W 2011-02-03 1996-07-31 Monoacylglycerol lipase; palmitoyl monoacylglycerol is the preferred substrate; role in triacylglycerol catabolism; minor role in medium-chain fatty acid ethyl ester biosynthesis; contains an alpha/beta hydrolase domain and a typical lipase motif; has similarity to acyltransferases, Eeb1p and Eht1p, and human ABHD1 +S000031343 CDS YMR210W 13 687516 688865 W 2011-02-03 1996-07-31 +S000004824 ORF Verified YMR211W DML1 chromosome 13 13 689083 690510 W 2011-02-03 1996-07-31 Essential protein involved in mtDNA inheritance; may also function in the partitioning of the mitochondrial organelle or in the segregation of chromosomes, exhibits regions similar to members of a GTPase family +S000031451 CDS YMR211W 13 689083 690510 W 2011-02-03 1996-07-31 +S000004825 ORF Verified YMR212C EFR3 chromosome 13 13 693043 690695 C 2011-02-03 1996-07-31 Protein required for Stt4-containing PI kinase complex localization; required for Stt4-containing phosphoinositide (PI) kinase patch assembly at the plasma membrane; recruited to the plasma membrane via a conserved basic patch near its N-terminus; exhibits synthetic lethal genetic interactions with PHO85; has sequence similarity to the Drosophila rolling blackout (RBO) gene +S000031486 CDS YMR212C 13 693043 690695 C 2011-02-03 1996-07-31 +S000004826 ORF Verified YMR213W CEF1 NTC85 chromosome 13 L000004270 13 693381 695153 W 2011-02-03 1996-07-31 Essential splicing factor; associated with Prp19p and the spliceosome, contains an N-terminal c-Myb DNA binding motif necessary for cell viability but not for Prp19p association, evolutionarily conserved and homologous to S. pombe Cdc5p +S000031586 CDS YMR213W 13 693381 695153 W 2011-02-03 1996-07-31 +S000004827 ORF Verified YMR214W SCJ1 chromosome 13 L000001811 13 695350 696483 W 2011-02-03 2003-09-22|1996-07-31 One of several homologs of bacterial chaperone DnaJ; located in the ER lumen where it cooperates with Kar2p to mediate maturation of proteins +S000032566 CDS YMR214W 13 695350 696483 W 2011-02-03 2003-09-22|1996-07-31 +S000004828 ORF Verified YMR215W GAS3 putative 1,3-beta-glucanosyltransferase chromosome 13 13 696796 698370 W 2011-02-03 1996-07-31 Putative 1,3-beta-glucanosyltransferase; has similarity go other GAS family members; low abundance, possibly inactive member of the GAS family of GPI-containing proteins; localizes to the cell wall; mRNA induced during sporulation +S000032695 CDS YMR215W 13 696796 698370 W 2011-02-03 1996-07-31 +S000004829 ORF Verified YMR216C SKY1 serine/threonine protein kinase SKY1 chromosome 13 L000003941 13 701039 698811 C 2011-02-03 1996-07-31 SR protein kinase (SRPK); involved in regulating proteins involved in mRNA metabolism and cation homeostasis; similar to human SRPK1 +S000032724 CDS YMR216C 13 701039 698811 C 2011-02-03 1996-07-31 +S000004830 ORF Verified YMR217W GUA1 GMP synthase (glutamine-hydrolyzing) chromosome 13 L000000744 13 701790 703367 W 2011-02-03 1996-07-31 GMP synthase; highly conserved enzyme that catalyzes the second step in the biosynthesis of GMP from inosine 5'-phosphate (IMP); transcription is not subject to regulation by guanine but is negatively regulated by nutrient starvation; reduction-of-function mutation gua1-G388D causes changes in cellular guanine nucleotide pools, defects in general protein synthesis, and impaired translation of GCN4 mRNA +S000033507 CDS YMR217W 13 701790 703367 W 2011-02-03 1996-07-31 +S000004831 ORF Verified YMR218C TRS130 transport protein particle complex II subunit TRS130 chromosome 13 S000007468 13 706887 703579 C 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic +S000033556 CDS YMR218C 13 706887 703579 C 2011-02-03 1996-07-31 +S000004832 ORF Verified YMR219W ESC1 chromosome 13 L000004422 13 707133 712109 W 2011-02-03 1996-07-31 Protein involved in telomeric silencing; required for quiescent cell telomere hypercluster localization at nuclear membrane vicinity; interacts with PAD4-domain of Sir4p +S000033701 CDS YMR219W 13 707133 712109 W 2011-02-03 1996-07-31 +S000004833 ORF Verified YMR220W ERG8 phosphomevalonate kinase chromosome 13 L000000574 13 712316 713671 W 2011-02-03 1996-07-31 Phosphomevalonate kinase; an essential cytosolic enzyme that acts in the biosynthesis of isoprenoids and sterols, including ergosterol, from mevalonate +S000035642 CDS YMR220W 13 712316 713671 W 2011-02-03 1996-07-31 +S000004834 ORF Uncharacterized YMR221C FMP42 chromosome 13 13 715445 713931 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; physical interaction with Atg27p suggests a possible role in autophagy +S000035674 CDS YMR221C 13 715445 713931 C 2011-02-03 1996-07-31 +S000004835 ORF Verified YMR222C FSH2 putative serine hydrolase chromosome 13 13 716309 715638 C 2011-02-03 1996-07-31 Putative serine hydrolase that localizes to the cytoplasm; sequence is similar to S. cerevisiae Fsh1p and Fsh3p and the human candidate tumor suppressor OVCA2 +S000035719 CDS YMR222C 13 716309 715638 C 2011-02-03 1996-07-31 +S000004836 ORF Verified YMR223W UBP8 ubiquitin-specific protease UBP8 chromosome 13 L000004587 13 716715 718130 W 2011-02-03 1996-07-31 Ubiquitin-specific protease component of the SAGA acetylation complex; required for SAGA (Spt-Ada-Gcn5-Acetyltransferase)-mediated deubiquitination of histone H2B +S000035903 CDS YMR223W 13 716715 718130 W 2011-02-03 1996-07-31 +S000004837 ORF Verified YMR224C MRE11 MRX complex nuclease subunit|NGS1|XRS4|RAD58 chromosome 13 L000004732|L000001149|L000004275 13 720653 718575 C 2011-02-03 1996-07-31 Nuclease subunit of the MRX complex with Rad50p and Xrs2p; complex functions in repair of DNA double-strand breaks and in telomere stability; Mre11p associates with Ser/Thr-rich ORFs in premeiotic phase; nuclease activity required for MRX function; widely conserved; forms nuclear foci upon DNA replication stress +S000035950 CDS YMR224C 13 720653 718575 C 2011-02-03 1996-07-31 +S000004838 ORF Verified YMR225C MRPL44 mitochondrial 54S ribosomal protein YmL44|YmL44|YMR44 chromosome 13 L000002534 13 721403 720960 C 158 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; protein abundance increases in response to DNA replication stress +S000036820 CDS YMR225C 13 721198 720960 C 2011-02-03 1996-07-31 +S000036819 CDS YMR225C 13 721403 721346 C 2011-02-03 1996-07-31 +S000036821 intron YMR225C 13 721345 721199 C 2011-02-03 1996-07-31 +S000004839 ORF Verified YMR226C oxidoreductase|TMA29 chromosome 13 13 722396 721593 C 2011-02-03 1996-07-31 NADP(+)-dependent serine dehydrogenase and carbonyl reductase; acts on serine, L-allo-threonine, and other 3-hydroxy acids; green fluorescent protein fusion protein localizes to the cytoplasm and nucleus; may interact with ribosomes, based on co-purification experiments +S000036891 CDS YMR226C 13 722396 721593 C 2011-02-03 1996-07-31 +S000004840 ORF Verified YMR227C TAF7 TafII67|TAF67 chromosome 13 L000003463 13 724385 722613 C 2011-02-03 1996-07-31 TFIID subunit (67 kDa); involved in RNA polymerase II transcription initiation +S000036956 CDS YMR227C 13 724385 722613 C 2011-02-03 1996-07-31 +S000004841 ORF Verified YMR228W MTF1 RNA polymerase specificity factor chromosome 13 L000001211 13 724626 725651 W 157.9 2011-02-03 1996-07-31 Mitochondrial RNA polymerase specificity factor; has structural similarity to S-adenosylmethionine-dependent methyltransferases and functional similarity to bacterial sigma-factors; Mtf1p interacts with and stabilizes the Rpo41p-promoter complex, enhancing DNA bending and melting to facilitate pre-initiation open complex formation +S000037761 CDS YMR228W 13 724626 725651 W 2011-02-03 1996-07-31 +S000004842 ORF Verified YMR229C RRP5 chromosome 13 L000003232 13 731123 725934 C 2011-02-03 1996-07-31 RNA binding protein involved in synthesis of 18S and 5.8S rRNAs; component of ribosomal small subunit (SSU) processome and 90S preribosome; required for pre-rRNA packaging and compaction of processome into dense terminal balls; part of Mak21p-Noc2p-Rrp5p module that associates with nascent pre-rRNA during transcription with role in biogenesis of large ribosomal subunit; binds single stranded tracts of U's; relocalizes from nucleolus to nucleus upon DNA replication stress +S000037792 CDS YMR229C 13 731123 725934 C 2011-02-03 1996-07-31 +S000004843 ORF Verified YMR230W RPS10B eS10|ribosomal 40S subunit protein S10B|S10e|S10B chromosome 13 L000004476 13 732414 733141 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S10, no bacterial homolog; RPS10B has a paralog, RPS10A, that arose from the whole genome duplication; mutations in the human homolog associated with Diamond-Blackfan anemia +S000030773 CDS YMR230W 13 732414 732465 W 2011-02-03 1996-07-31 +S000030774 CDS YMR230W 13 732876 733141 W 2011-02-03 1996-07-31 +S000030775 intron YMR230W 13 732466 732875 W 2011-02-03 1996-07-31 +S000028576 ORF Uncharacterized YMR230W-A chromosome 13 13 733268 733456 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000031309 CDS YMR230W-A 13 733268 733456 W 2011-02-03 2003-07-29 +S000004844 ORF Verified YMR231W PEP5 tethering complex subunit PEP5|VPT11|VPS11|VPL9|VAM1|END1 chromosome 13 L000001376|L000002957 13 733545 736634 W 152 2011-02-03 1996-07-31 Histone E3 ligase, component of CORVET membrane tethering complex; peripheral vacuolar membrane protein required for protein trafficking and vacuole biogenesis; interacts with Pep7p; involved in ubiquitination and degradation of excess histones +S000030876 CDS YMR231W 13 733545 736634 W 2011-02-03 1996-07-31 +S000004845 ORF Verified YMR232W FUS2 chromosome 13 L000000654 13 736926 738959 W 160 2011-02-03 1996-07-31 Cell fusion regulator; cytoplasmic protein localized to shmoo tip; required for alignment of parental nuclei before nuclear fusion during mating; contains a Dbl-homology domain; binds specifically with activated Cdc42p +S000031887 CDS YMR232W 13 736926 738959 W 2011-02-03 1996-07-31 +S000004846 ORF Verified YMR233W TRI1 chromosome 13 13 739185 739865 W 2011-02-03 1996-07-31 Non-essential sumoylated protein of unknown function; similar to components of human SWI/SNF complex including SMRD3; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm, nucleus and nucleolus; TRI1 has a paralog, UAF30, that arose from the whole genome duplication +S000032018 CDS YMR233W 13 739185 739865 W 2011-02-03 1996-07-31 +S000004847 ORF Verified YMR234W RNH1 RNA-DNA hybrid ribonuclease chromosome 13 L000001653 13 740266 741312 W 160 2011-02-03 1996-07-31 Ribonuclease H1; able to bind double-stranded RNAs and RNA-DNA hybrids; associates with RNAse polymerase I. +S000032129 CDS YMR234W 13 740266 741312 W 2011-02-03 1996-07-31 +S000004848 ORF Verified YMR235C RNA1 GTPase-activating protein RNA1 chromosome 13 L000001649 13 742735 741512 C 159 2011-02-03 1996-07-31 GTPase activating protein (GAP) for Gsp1p; involved in nuclear transport +S000032993 CDS YMR235C 13 742735 741512 C 2011-02-03 1996-07-31 +S000004849 ORF Verified YMR236W TAF9 chromatin modification protein|TafII17|TAF17 chromosome 13 L000003459 13 742971 743444 W 2011-02-03 1996-07-31 Subunit (17 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification, similar to histone H3 +S000033137 CDS YMR236W 13 742971 743444 W 2011-02-03 1996-07-31 +S000004850 ORF Verified YMR237W BCH1 exomer complex subunit chromosome 13 13 743749 745923 W 2011-02-03 1996-07-31 Member of the ChAPs family (Chs5p-Arf1p-binding proteins); members include Bch1p, Bch2p, Bud7p, and Chs6p; ChAPs family proteins form the exomer complex with Chs5p to mediate export of specific cargo proteins from the Golgi to the plasma membrane; interacts selectively with the activated, GTP-bound form of Arf1p; may interact with ribosomes; protein abundance increases and forms cytoplasmic foci in response to DNA replication stress +S000033208 CDS YMR237W 13 743749 745923 W 2011-02-03 1996-07-31 +S000004851 ORF Verified YMR238W DFG5 putative mannan endo-1,6-alpha-mannosidase chromosome 13 L000004072 13 746353 747729 W 2011-02-03 1996-07-31 Putative mannosidase; essential glycosylphosphatidylinositol (GPI)-anchored membrane protein required for cell wall biogenesis in bud formation, involved in filamentous growth, homologous to Dcw1p +S000034028 CDS YMR238W 13 746353 747729 W 2011-02-03 1996-07-31 +S000006717 tRNA_gene tR(UCU)M1 chromosome 13 L000003675 13 747963 747892 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000031501 noncoding_exon tR(UCU)M1 13 747963 747892 C 2011-02-03 2000-05-19 +S000004852 ORF Verified YMR239C RNT1 ribonuclease III chromosome 13 L000002844 13 749677 748262 C 2011-02-03 1996-07-31 Nuclear dsRNA-specific ribonuclease (RNase III); involved in rDNA transcription, rRNA processing and U2 snRNA 3' end formation by cleavage of a stem-loop structure at the 3' end of U2 snRNA; involved in polyadenylation-independent transcription termination; involved in the cell wall stress response, regulating the degradation of cell wall integrity and morphogenesis checkpoint genes +S000034074 CDS YMR239C 13 749677 748262 C 2011-02-03 1996-07-31 +S000004853 ORF Verified YMR240C CUS1 U2 snRNP complex subunit CUS1 chromosome 13 L000002833 13 751240 749930 C 2011-02-03 1996-07-31 Protein required for assembly of U2 snRNP into the spliceosome; forms a complex with Hsh49p and Hsh155p +S000035059 CDS YMR240C 13 751240 749930 C 2011-02-03 1996-07-31 +S000004854 ORF Verified YMR241W YHM2 chromosome 13 L000004516 13 751961 752905 W 2011-02-03 1996-07-31 Citrate and oxoglutarate carrier protein; exports citrate from and imports oxoglutarate into the mitochondrion, causing net export of NADPH reducing equivalents; also associates with mt nucleoids and has a role in replication and segregation of the mt genome +S000035206 CDS YMR241W 13 751961 752905 W 2011-02-03 1996-07-31 +S000004855 ORF Verified YMR242C RPL20A eL20|ribosomal 60S subunit protein L20A|L20e|L20A|L18A|RPL18A2 chromosome 13 L000004458|L000003149 13 754220 753225 C 2011-02-03 2003-09-27|1996-07-31|2007-07-10 Ribosomal 60S subunit protein L20A; homologous to mammalian ribosomal protein L18A, no bacterial homolog; RPL20A has a paralog, RPL20B, that arose from the whole genome duplication +S000035252 CDS YMR242C 13 753742 753225 C 2011-02-03 2003-09-27 +S000035251 CDS YMR242C 13 754220 754220 C 2011-02-03 2003-09-27|1996-07-31|2007-07-10 +S000035253 intron YMR242C 13 754219 753743 C 2011-02-03 2003-09-27|2007-07-10 +S000028694 ORF Uncharacterized YMR242W-A chromosome 13 13 754297 754386 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000032596 CDS YMR242W-A 13 754297 754386 W 2011-02-03 2003-07-29 +S000004856 ORF Verified YMR243C ZRC1 Zn(2+) transporter ZRC1|OSR1 chromosome 13 L000002570 13 756166 754838 C 2011-02-03 1996-07-31 Vacuolar membrane zinc transporter; transports zinc from cytosol to vacuole for storage; also has role in resistance to zinc shock resulting from sudden influx of zinc into cytoplasm; human ortholog SLC30A10 functions as a Mn transporter and mutations in SLC30A10 cause neurotoxic accumulation of Mn in liver and brain; ZRC1 has a paralog, COT1, that arose from the whole genome duplication +S000036141 CDS YMR243C 13 756166 754838 C 2011-02-03 1996-07-31 +S000004858 ORF Uncharacterized YMR244W chromosome 13 13 757250 758317 W 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole +S000031680 CDS YMR244W 13 757250 758317 W 2011-02-03 1996-07-31 +S000118377 ARS ARS1327 ARSXIII-758 chromosome 13 13 758224 758471 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178161 ARS_consensus_sequence ARS1327 13 758417 758401 C 2014-11-18 2014-11-18 +S000004859 ORF Dubious YMR245W chromosome 13 13 758563 759183 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031825 CDS YMR245W 13 758563 759183 W 2011-02-03 1996-07-31 +S000004857 ORF Verified YMR244C-A COA6 chromosome 13 13 758831 758517 C 2011-02-03 1996-07-31 Protein involved in cytochrome c oxidase (Complex IV) assembly; involved in delivery of copper to Complex IV; also required for efficient formation of respiratory supercomplexes comprised of Complexes III and IV; localizes to the mitochondrial intermembrane space; ortholog implicated in cardiac defects in zebrafish and human; transcription is induced in response to the DNA-damaging agent MMS; protein abundance increases in response to DNA replication stress +S000035790 CDS YMR244C-A 13 758831 758517 C 2011-02-03 1996-07-31 +S000004860 ORF Verified YMR246W FAA4 long-chain fatty acid-CoA ligase FAA4 chromosome 13 L000002647 13 759807 761891 W 2011-02-03 1996-07-31 Long chain fatty acyl-CoA synthetase; activates fatty acids with a preference for C12:0-C16:0 chain lengths; role in the competitive import of long-chain fatty acids and sphingoid long-chain bases; role in stationary phase survival; localizes to lipid particles and the plasma membrane; role in sphingolipid-to-glycerolipid metabolism; forms cytoplasmic foci upon replication stress; faa1 faa4 double null complemented by any of human ACSBG1, ACSL1, 3, 4, 5, 6, SLC27A2, or 4 +S000031958 CDS YMR246W 13 759807 761891 W 2011-02-03 1996-07-31 +S000119075 snoRNA_gene snR86 SNR86 chromosome 13 13 763113 762110 C 2011-02-03 2006-10-05 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2314 +S000119077 noncoding_exon snR86 13 763113 762110 C 2011-02-03 2006-10-05 +S000004861 ORF Verified YMR247C RKR1 ubiquitin-protein ligase RKR1|LTN1 chromosome 13 13 768039 763351 C 2011-02-03 1996-07-31 RING domain E3 ubiquitin ligase; involved in ubiquitin-mediated degradation of non-stop proteins and translationally stalled ER membrane proteins; component of ribosome-bound RQC (ribosome quality control) complex; degrades products of mRNAs lacking a termination codon regardless of a poly(A) tail; functional connections to chromatin modification; homolog of mouse Listerin, mutations in which reported to cause neurodegeneration +S000031995 CDS YMR247C 13 768039 763351 C 2011-02-03 1996-07-31 +S000006519 tRNA_gene tA(AGC)M2 chromosome 13 L000003674 13 768441 768369 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000036431 noncoding_exon tA(AGC)M2 13 768441 768369 C 2011-02-03 2000-05-19 +S000007125 long_terminal_repeat YMRWdelta19 chromosome 13 13 768548 768879 W 2011-02-03 2000-05-19 Ty2 LTR +S000028849 ORF Uncharacterized YMR247W-A chromosome 13 13 769283 769426 W 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole +S000034536 CDS YMR247W-A 13 769283 769426 W 2011-02-03 2003-07-29 +S000004862 ORF Verified YMR250W GAD1 glutamate decarboxylase GAD1 chromosome 13 S000007509 13 770801 772558 W 2011-02-03 1996-07-31 Glutamate decarboxylase; converts glutamate into gamma-aminobutyric acid (GABA) during glutamate catabolism; involved in response to oxidative stress +S000037211 CDS YMR250W 13 770801 772558 W 2011-02-03 1996-07-31 +S000118378 ARS ARS1328 ARSXIII-773 chromosome 13 13 772631 772879 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000004863 ORF Verified YMR251W GTO3 omega-class glutathione transferase chromosome 13 13 772915 774015 W 2011-02-03 1996-07-31 Omega class glutathione transferase; putative cytosolic localization +S000037313 CDS YMR251W 13 772915 774015 W 2011-02-03 1996-07-31 +S000004864 ORF Verified YMR251W-A HOR7 chromosome 13 L000003980 13 774752 774931 W 2011-02-03 1996-07-31 Protein of unknown function; overexpression suppresses Ca2+ sensitivity of mutants lacking inositol phosphorylceramide mannosyltransferases Csg1p and Csh1p; transcription is induced under hyperosmotic stress and repressed by alpha factor; HOR7 has a paralog, DDR2, that arose from the whole genome duplication +S000035256 CDS YMR251W-A 13 774752 774931 W 2011-02-03 1996-07-31 +S000004865 ORF Uncharacterized YMR252C chromosome 13 13 775719 775315 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YMR252C is not an essential gene +S000037324 CDS YMR252C 13 775719 775315 C 2011-02-03 1996-07-31 +S000004866 ORF Uncharacterized YMR253C chromosome 13 13 777190 775946 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; YMR253C is not an essential gene +S000037399 CDS YMR253C 13 777190 775946 C 2011-02-03 1996-07-31 +S000004867 ORF Dubious YMR254C chromosome 13 13 777923 777615 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030036 CDS YMR254C 13 777923 777615 C 2011-02-03 1996-07-31 +S000004868 ORF Verified YMR255W GFD1 chromosome 13 L000004632 13 778001 778567 W 2011-02-03 1996-07-31 Coiled-coiled protein of unknown function; identified as a high-copy suppressor of a dbp5 mutation; protein abundance increases in response to DNA replication stress +S000030249 CDS YMR255W 13 778001 778567 W 2011-02-03 1996-07-31 +S000004869 ORF Verified YMR256C COX7 cytochrome c oxidase subunit VII chromosome 13 L000000391 13 779127 778945 C 2011-02-03 1996-07-31 Subunit VII of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain +S000030343 CDS YMR256C 13 779127 778945 C 2011-02-03 1996-07-31 +S000004870 ORF Verified YMR257C PET111 chromosome 13 L000001393 13 782031 779629 C 177 2011-02-03 1996-07-31 Mitochondrial translational activator specific for the COX2 mRNA; located in the mitochondrial inner membrane +S000033634 CDS YMR257C 13 782031 779629 C 2011-02-03 1996-07-31 +S000004871 ORF Verified YMR258C ROY1 chromosome 13 13 784281 782620 C 2011-02-03 1996-07-31 GTPase inhibitor with similarity to F-box proteins; inhibits Ypt52p GTPase activity by preventing Ypt52p from binding GTP; involved in regulating intracellular trafficking; physically interacts with Skp1p +S000033770 CDS YMR258C 13 784281 782620 C 2011-02-03 1996-07-31 +S000004872 ORF Verified YMR259C TRM732 tRNA methylation protein TRM732 chromosome 13 13 788883 784621 C 2011-02-03 1996-07-31 Protein involved in 2'-O-methylation of C32 of substrate tRNAs; interacts with 2'-O-ribose methyltransferase Trm7p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; non-essential gene; yeast null mutant can be functionally complemented by human THADA, mutations in which have been implicated in epithelial thyroid adenomas, type 2 diabetes, and polycystic ovary syndrome (PCOS) +S000033886 CDS YMR259C 13 788883 784621 C 2011-02-03 1996-07-31 +S000004873 ORF Verified YMR260C TIF11 chromosome 13 L000002306 13 789839 789378 C 2011-02-03 1996-07-31 Translation initiation factor eIF1A; essential protein that forms a complex with Sui1p (eIF1) and the 40S ribosomal subunit and scans for the start codon; C-terminus associates with Fun12p (eIF5B); N terminus interacts with eIF2 and eIF3 +S000033454 CDS YMR260C 13 789839 789378 C 2011-02-03 1996-07-31 +S000004874 ORF Verified YMR261C TPS3 trehalose 6-phosphate synthase/phosphatase complex subunit chromosome 13 L000002718 13 793369 790205 C 2011-02-03 1996-07-31 Regulatory subunit of trehalose-6-phosphate synthase/phosphatase; involved in synthesis of storage carbohydrate trehalose; expression is induced by stress conditions and repressed by the Ras-cAMP pathway; TPS3 has a paralog, TSL1, that arose from the whole genome duplication +S000033514 CDS YMR261C 13 793369 790205 C 2011-02-03 1996-07-31 +S000004875 ORF Uncharacterized YMR262W putative endodeoxyribonuclease chromosome 13 13 793726 794667 W 2011-02-03 1996-07-31|2011-02-03 Protein of unknown function; interacts weakly with Knr4p; YMR262W is not an essential gene +S000033607 CDS YMR262W 13 793726 794667 W 2011-02-03 1996-07-31|2011-02-03 +S000004876 ORF Verified YMR263W SAP30 chromosome 13 13 794919 795524 W 2011-02-03 1996-07-31 Component of Rpd3L histone deacetylase complex; involved in silencing at telomeres, rDNA, and silent mating-type loci; involved in telomere maintenance +S000034555 CDS YMR263W 13 794919 795524 W 2011-02-03 1996-07-31 +S000004877 ORF Verified YMR264W CUE1 KIS4 chromosome 13 L000003518 13 795805 796416 W 2011-02-03 1996-07-31 Ubiquitin-binding protein; ER membrane protein that recruits and integrates the ubiquitin-conjugating enzyme Ubc7p into ER membrane-bound ubiquitin ligase complexes that function in the ER-associated degradation (ERAD) pathway for misfolded proteins; contains a CUE domain that binds ubiquitin to facilitate intramolecular monoubiquitination and to promote diubiquitin elongation, facilitating polyubiquitin chain formation +S000034641 CDS YMR264W 13 795805 796416 W 2011-02-03 1996-07-31 +S000004878 ORF Uncharacterized YMR265C chromosome 13 13 797925 796540 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000034679 CDS YMR265C 13 797925 796540 C 2011-02-03 1996-07-31 +S000004879 ORF Verified YMR266W RSN1 chromosome 13 13 798518 801379 W 2011-02-03 1996-07-31 Membrane protein of unknown function; overexpression suppresses NaCl sensitivity of sro7 mutant cells by restoring sodium pump (Ena1p) localization to the plasma membrane +S000035756 CDS YMR266W 13 798518 801379 W 2011-02-03 1996-07-31 +S000004880 ORF Verified YMR267W PPA2 inorganic diphosphatase PPA2|IPP2 chromosome 13 L000001469 13 801772 802704 W 2011-02-03 1996-07-31 Mitochondrial inorganic pyrophosphatase; required for mitochondrial function and possibly involved in energy generation from inorganic pyrophosphate; human ortholog, PPA2, functionally complements the null mutant; mutations in human PPA2 cause a mitochondrial disease resulting in sudden unexpected cardiac arrest in infants +S000035874 CDS YMR267W 13 801772 802704 W 2011-02-03 1996-07-31 +S000004881 ORF Verified YMR268C PRP24 U6 snRNP complex subunit PRP24 chromosome 13 L000002842 13 804222 802888 C 2011-02-03 1996-07-31 Splicing factor that reanneals snRNPs during spliceosome recycling; reanneals U4 and U6 snRNPs +S000035917 CDS YMR268C 13 804222 802888 C 2011-02-03 1996-07-31 +S000004882 ORF Verified YMR269W TMA23 YMR268W-A chromosome 13 13 804456 805091 W 2011-02-03 2004-02-27|1996-07-31 Nucleolar protein implicated in ribosome biogenesis; deletion extends chronological lifespan +S000037848 CDS YMR269W 13 804456 805091 W 2011-02-03 2004-02-27|1996-07-31 +S000118379 ARS ARS1329 ARSXIII-805 chromosome 13 13 805152 805282 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178162 ARS_consensus_sequence ARS1329 13 805162 805178 W 2014-11-18 2014-11-18 +S000004883 ORF Verified YMR270C RRN9 chromosome 13 L000003278 13 806423 805326 C 2011-02-03 1996-07-31 Protein involved in promoting high level transcription of rDNA; subunit of UAF (upstream activation factor) for RNA polymerase I +S000036870 CDS YMR270C 13 806423 805326 C 2011-02-03 1996-07-31 +S000004884 ORF Verified YMR271C URA10 orotate phosphoribosyltransferase URA10 chromosome 13 L000002438 13 807548 806865 C 2011-02-03 1996-07-31 Minor orotate phosphoribosyltransferase (OPRTase) isozyme; catalyzes the fifth enzymatic step in the de novo biosynthesis of pyrimidines, converting orotate into orotidine-5'-phosphate; URA10 has a paralog, URA5, that arose from the whole genome duplication +S000037601 CDS YMR271C 13 807548 806865 C 2011-02-03 1996-07-31 +S000006690 tRNA_gene tQ(CUG)M CDC65 SUP60|SUP70|DNA33 chromosome 13 L000000287|L000003673 13 808317 808246 C 187 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; can mutate to cause constitutive pseudohyphal growth in homozygous diploids; required for localization of transcription factor Gln3p to the nucleus in response to nitrogen starvation or rapamycin treatment +S000036125 noncoding_exon tQ(CUG)M 13 808317 808246 C 2011-02-03 2000-05-19 +S000007118 long_terminal_repeat YMRCtau3 chromosome 13 13 808906 808537 C 2011-02-03 2000-05-19 Ty4 LTR +S000007126 long_terminal_repeat YMRWdelta20 chromosome 13 13 809000 809233 W 2011-02-03 2000-05-19 Ty1 LTR +S000028695 ORF Dubious YMR272W-A chromosome 13 13 810466 810579 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SCS7/YMR272C +S000032602 CDS YMR272W-A 13 810466 810579 W 2011-02-03 2003-07-29 +S000004885 ORF Verified YMR272C SCS7 fatty acid alpha-hydroxylase|FAH1 chromosome 13 L000004408 13 810777 809623 C 2011-02-03 1996-07-31 Sphingolipid alpha-hydroxylase; functions in the alpha-hydroxylation of sphingolipid-associated very long chain fatty acids, has both cytochrome b5-like and hydroxylase/desaturase domains, not essential for growth +S000037670 CDS YMR272C 13 810777 809623 C 2011-02-03 1996-07-31 +S000028696 ORF Uncharacterized YMR272W-B chromosome 13 13 811089 811196 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole +S000032604 CDS YMR272W-B 13 811089 811196 W 2011-02-03 2003-07-29 +S000004886 ORF Verified YMR273C ZDS1 OSS1|NRC1|CKM1|CES1 chromosome 13 L000002813 13 813980 811233 C 2011-02-03 1996-07-31 Protein with a role in regulating Swe1p-dependent polarized growth; involved in maintaining Cdc55p in the cytoplasm where it promotes mitotic entry; involved in mitotic exit through Cdc14p regulation; interacts with silencing proteins at telomeres; has a role in Bcy1p localization; implicated in mRNA nuclear export; ZDS1 has a paralog, ZDS2, that arose from the whole genome duplication +S000037717 CDS YMR273C 13 813980 811233 C 2011-02-03 1996-07-31 +S000004887 ORF Verified YMR274C RCE1 CAAX prenyl protease chromosome 13 L000004125 13 815311 814364 C 2011-02-03 1996-07-31 Type II CAAX prenyl protease; involved in the proteolysis and maturation of Ras and the a-factor mating pheromone +S000037777 CDS YMR274C 13 815311 814364 C 2011-02-03 1996-07-31 +S000118380 ARS ARS1330 ARSXIII-815 chromosome 13 13 815342 815567 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178163 ARS_consensus_sequence ARS1330 13 815391 815407 W 2014-11-18 2014-11-18 +S000004888 ORF Verified YMR275C BUL1 ubiquitin-ubiquitin ligase BUL1|SMM2|RDS1|DAG1 chromosome 13 L000002733 13 818581 815651 C 2011-02-03 1996-07-31 Ubiquitin-binding component of the Rsp5p E3-ubiquitin ligase complex; disruption causes temperature-sensitive growth, overexpression causes missorting of amino acid permeases; BUL1 has a paralog, BUL2, that arose from the whole genome duplication +S000030633 CDS YMR275C 13 818581 815651 C 2011-02-03 1996-07-31 +S000004889 ORF Verified YMR276W DSK2 chromosome 13 L000002646 13 818827 819948 W 2011-02-03 1996-07-31 Nuclear-enriched ubiquitin-like polyubiquitin-binding protein; required for spindle pole body (SPB) duplication and for transit through the G2/M phase of the cell cycle; involved in proteolysis; interacts with the proteasome; protein abundance increases in response to DNA replication stress +S000030830 CDS YMR276W 13 818827 819948 W 2011-02-03 1996-07-31 +S000004890 ORF Verified YMR277W FCP1 protein serine/threonine phosphatase chromosome 13 L000003350 13 820256 822454 W 2011-02-03 1996-07-31 Carboxy-terminal domain (CTD) phosphatase; essential for dephosphorylation of the repeated C-terminal domain of the RNA polymerase II large subunit (Rpo21p); relocalizes to the cytosol in response to hypoxia +S000031799 CDS YMR277W 13 820256 822454 W 2011-02-03 1996-07-31 +S000004891 ORF Verified YMR278W PRM15 PGM3|phosphoribomutase PRM15 chromosome 13 13 822763 824631 W 2011-02-03 1996-07-31 Phosphoribomutase; catalyzes interconversion of ribose-1-phosphate and ribose-5-phosphate; has some phosphoglucomutase activity but primary activity in vivo is phosphoribomutase; contributes to ribose recycling in the pentose phosphate pathway; transcription induced in response to stress; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; non-essential +S000031949 CDS YMR278W 13 822763 824631 W 2011-02-03 1996-07-31 +S000004892 ORF Verified YMR279C chromosome 13 13 826351 824729 C 2011-02-03 1996-07-31 Putative boron transporter involved in boron efflux and resistance; overexpression mutant but not null mutant displays boron tolerance phenotype; identified as a heat-induced gene in a high-throughout screen; YMR279C is not an essential gene; YMR279C has a paralog, ATR1, that arose from the whole genome duplication +S000031988 CDS YMR279C 13 826351 824729 C 2011-02-03 1996-07-31 +S000004893 ORF Verified YMR280C CAT8 DNA-binding transcription factor CAT8|MSP8|DIL1 chromosome 13 L000000220 13 831329 827028 C 2011-02-03 1996-07-31 Zinc cluster transcriptional activator; necessary for derepression of a variety of genes under non-fermentative growth conditions, active after diauxic shift, binds carbon source responsive elements; relative distribution to the nucleus increases upon DNA replication stress +S000032751 CDS YMR280C 13 831329 827028 C 2011-02-03 1996-07-31 +S000004894 ORF Verified YMR281W GPI12 N-acetylglucosaminylphosphatidylinositol deacetylase chromosome 13 L000004952 13 832339 833253 W 2011-02-03 1996-07-31 ER membrane protein involved in the second step of GPI anchor assembly; the second step is the de-N-acetylation of the N-acetylglucosaminylphosphatidylinositol intermediate; functional homolog of human PIG-Lp; GPI stands for glycosylphosphatidylinositol +S000032913 CDS YMR281W 13 832339 833253 W 2011-02-03 1996-07-31 +S000004895 ORF Verified YMR282C AEP2 ATP13 chromosome 13 L000000054 13 835098 833356 C 2011-02-03 1996-07-31 Mitochondrial protein; likely involved in translation of the mitochondrial OLI1 mRNA; exhibits genetic interaction with the OLI1 mRNA 5'-untranslated leader +S000032972 CDS YMR282C 13 835098 833356 C 2011-02-03 1996-07-31 +S000004896 ORF Verified YMR283C RIT1 tRNA A64-2'-O-ribosylphosphate transferase chromosome 13 L000001645 13 836867 835326 C 2011-02-03 1996-07-31 Initiator methionine 2'-O-ribosyl phosphate transferase; modifies the initiator methionine tRNA at position 64 to distinguish it from elongator methionine tRNA +S000033039 CDS YMR283C 13 836867 835326 C 2011-02-03 1996-07-31 +S000007127 long_terminal_repeat YMRWdelta21 chromosome 13 13 837450 837764 W 2011-02-03 2000-05-19 Ty1 LTR +S000130192 ARS ARS1331 chromosome 13 13 837764 837928 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006784 tRNA_gene tY(GUA)M2 SUP8 chromosome 13 L000003672|L000002187 13 837928 838016 W 193 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000032300 intron tY(GUA)M2 13 837967 837980 W 2011-02-03 2000-05-19 +S000032298 noncoding_exon tY(GUA)M2 13 837928 837966 W 2011-02-03 2000-05-19 +S000032299 noncoding_exon tY(GUA)M2 13 837981 838016 W 2011-02-03 2000-05-19 +S000004897 ORF Verified YMR284W YKU70 ATP-dependent DNA helicase YKU70|KU70|NES24|HDF1 chromosome 13 L000000759 13 838187 839995 W 2011-02-03 1996-07-31 Subunit of the telomeric Ku complex (Yku70p-Yku80p); involved in telomere length maintenance, structure and telomere position effect; required for localization of telomerase ribonucleoprotein to nucleus via interaction with the TLC1 guide RNA; relocates to sites of double-strand cleavage to promote nonhomologous end joining during DSB repair +S000033764 CDS YMR284W 13 838187 839995 W 2011-02-03 1996-07-31 +S000004898 ORF Verified YMR285C NGL2 RNA exonuclease chromosome 13 13 841691 840144 C 2011-02-03 1996-07-31 Protein involved in 5.8S rRNA processing; Ccr4p-like RNase required for correct 3'-end formation of 5.8S rRNA at site E; similar to Ngl1p; NGL2 has a paralog, NGL3, that arose from the whole genome duplication +S000033818 CDS YMR285C 13 841691 840144 C 2011-02-03 1996-07-31 +S000004899 ORF Verified YMR286W MRPL33 mitochondrial 54S ribosomal protein YmL33|YmL33 chromosome 13 L000002530|L000001170 13 841942 842202 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000034015 CDS YMR286W 13 841942 842202 W 2011-02-03 1996-07-31 +S000004900 ORF Verified YMR287C DSS1 MSU1 chromosome 13 L000001208 13 845345 842436 C 2011-02-03 1996-07-31 3'-5' exoribonuclease; component of the mitochondrial degradosome along with the ATP-dependent RNA helicase Suv3p; the degradosome associates with the ribosome and mediates turnover of aberrant or unprocessed RNAs +S000034048 CDS YMR287C 13 845345 842436 C 2011-02-03 1996-07-31 +S000004901 ORF Verified YMR288W HSH155 U2 snRNP complex subunit HSH155 chromosome 13 13 845571 848486 W 2011-02-03 1996-07-31 U2-snRNP associated splicing factor; forms extensive associations with the branch site-3' splice site-3' exon region upon prespliceosome formation; similarity to the mammalian U2 snRNP-associated splicing factor SAP155 +S000035070 CDS YMR288W 13 845571 848486 W 2011-02-03 1996-07-31 +S000004902 ORF Verified YMR289W ABZ2 aminodeoxychorismate lyase ABZ2 chromosome 13 13 848685 849809 W 2011-02-03 1996-07-31 Aminodeoxychorismate lyase (4-amino-4-deoxychorismate lyase); catalyzes the third step in para-aminobenzoic acid biosynthesis; involved in folic acid biosynthesis +S000035264 CDS YMR289W 13 848685 849809 W 2011-02-03 1996-07-31 +S000004904 ORF Dubious YMR290W-A chromosome 13 13 851422 851769 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of essential HAS1/YMR290C gene which encodes an ATP-dependent RNA helicase +S000037856 CDS YMR290W-A 13 851422 851769 W 2011-02-03 1996-07-31|2011-02-03 +S000004903 ORF Verified YMR290C HAS1 ATP-dependent RNA helicase HAS1 chromosome 13 L000004179 13 851591 850074 C 2011-02-03 1996-07-31 ATP-dependent RNA helicase; involved in the biogenesis of 40S and 60S ribosome subunits; localizes to both the nuclear periphery and nucleolus; highly enriched in nuclear pore complex fractions; constituent of 66S pre-ribosomal particles +S000036112 CDS YMR290C 13 851591 850074 C 2011-02-03 1996-07-31 +S000004905 ORF Verified YMR291W TDA1 protein kinase TDA1 chromosome 13 13 852630 854390 W 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; null mutant is sensitive to expression of the top1-T722A allele; not an essential gene; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000036939 CDS YMR291W 13 852630 854390 W 2011-02-03 1996-07-31 +S000004906 ORF Verified YMR292W GOT1 chromosome 13 L000004951 13 854795 855293 W 2011-02-03 1996-07-31 Homodimeric protein that is packaged into COPII vesicles; cycles between the ER and Golgi; involved in secretory transport but not directly required for aspects of transport assayed in vitro; may influence membrane composition +S000037002 CDS YMR292W 13 854795 854816 W 2011-02-03 1996-07-31 +S000037003 CDS YMR292W 13 854899 855293 W 2011-02-03 1996-07-31 +S000037004 intron YMR292W 13 854817 854898 W 2011-02-03 1996-07-31 +S000004907 ORF Verified YMR293C HER2 QRS1|glutamyl-tRNA(Gln) amidotransferase subunit HER2|RRG6|GEP6|LRC6 chromosome 13 S000124020 13 856793 855399 C 2011-02-03 1996-07-31 Subunit of the trimeric GatFAB AmidoTransferase(AdT) complex; involved in the formation of Q-tRNAQ; required for remodeling of ER caused by Hmg2p overexpression; similar to bacterial GatA glutamyl-tRNA amidotransferase +S000037041 CDS YMR293C 13 856793 855399 C 2011-02-03 1996-07-31 +S000004908 ORF Verified YMR294W JNM1 PAC3|INS1 chromosome 13 L000000884 13 856966 858087 W 2011-02-03 1996-07-31 Component of the yeast dynactin complex; consisting of Nip100p, Jnm1p, and Arp1p; required for proper nuclear migration and spindle partitioning during mitotic anaphase B +S000037827 CDS YMR294W 13 856966 858087 W 2011-02-03 1996-07-31 +S000004909 ORF Dubious YMR294W-A chromosome 13 13 858209 858568 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; substantially overlaps YMR295C; deletion causes sensitivity to unfolded protein response-inducing agents +S000031101 CDS YMR294W-A 13 858209 858568 W 2011-02-03 1996-07-31 +S000004910 ORF Verified YMR295C IBI2 chromosome 13 13 858890 858297 C 2011-02-03 1996-07-31 Protein of unknown function that associates with ribosomes; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and bud; not an essential gene; protein abundance increases in response to DNA replication stress; YMR295C has a paralog, YGR273C, that arose from the whole genome duplication +S000037861 CDS YMR295C 13 858890 858297 C 2011-02-03 1996-07-31 +S000004911 ORF Verified YMR296C LCB1 serine C-palmitoyltransferase LCB1|TSC2|END8 chromosome 13 L000000934 13 860891 859215 C 2011-02-03 1996-07-31 Component of serine palmitoyltransferase; responsible along with Lcb2p for the first committed step in sphingolipid synthesis, which is the condensation of serine with palmitoyl-CoA to form 3-ketosphinganine +S000029901 CDS YMR296C 13 860891 859215 C 2011-02-03 1996-07-31 +S000004912 ORF Verified YMR297W PRC1 CPY1|carboxypeptidase C PRC1|CPY|LBC1 chromosome 13 L000001481 13 861922 863520 W 210 2011-02-03 1996-07-31 Vacuolar carboxypeptidase Y (proteinase C, CPY); broad-specificity C-terminal exopeptidase involved in non-specific protein degradation in the vacuole; member of the serine carboxypeptidase family +S000030979 CDS YMR297W 13 861922 863520 W 2011-02-03 1996-07-31 +S000004913 ORF Verified YMR298W LIP1 sphingosine N-acyltransferase subunit LIP1 chromosome 13 13 863819 864271 W 2011-02-03 1996-07-31 Ceramide synthase subunit; single-span ER membrane protein associated with Lag1p and Lac1p and required for ceramide synthase activity, null mutant grows extremely slowly and is defective in ceramide synthesis +S000031080 CDS YMR298W 13 863819 864271 W 2011-02-03 1996-07-31 +S000004914 ORF Verified YMR299C DYN3 dynein light intermediate chain chromosome 13 13 865350 864412 C 2011-02-03 1996-07-31|2011-02-03 Dynein light intermediate chain (LIC); localizes with dynein, null mutant is defective in nuclear migration +S000031115 CDS YMR299C 13 865350 864412 C 2011-02-03 1996-07-31|2011-02-03 +S000004915 ORF Verified YMR300C ADE4 amidophosphoribosyltransferase chromosome 13 L000000034 13 867091 865559 C 213 2011-02-03 1996-07-31 Phosphoribosylpyrophosphate amidotransferase (PRPPAT); catalyzes first step of the 'de novo' purine nucleotide biosynthetic pathway; also known as amidophosphoribosyltransferase +S000036627 CDS YMR300C 13 867091 865559 C 2011-02-03 1996-07-31 +S000004916 ORF Verified YMR301C ATM1 ATP-binding cassette Fe/S cluster precursor transporter ATM1 chromosome 13 L000000140 13 869627 867555 C 2011-02-03 1996-07-31 Mitochondrial inner membrane ATP-binding cassette (ABC) transporter; exports mitochondrially synthesized precursors of iron-sulfur (Fe/S) clusters to the cytosol; human homolog ABCB7 can complement yeast null mutant +S000036724 CDS YMR301C 13 869627 867555 C 2011-02-03 1996-07-31 +S000004917 ORF Verified YMR302C YME2 PRP12|RNA12 chromosome 13 L000001503 13 872625 870073 C 2011-02-03 1996-07-31 Integral inner mitochondrial membrane protein; role in maintaining mitochondrial nucleoid structure and number; mutants exhibit an increased rate of mitochondrial DNA escape; shows some sequence similarity to exonucleases +S000030571 CDS YMR302C 13 872625 870073 C 2011-02-03 1996-07-31 +S000004918 ORF Verified YMR303C ADH2 alcohol dehydrogenase ADH2|ADR2 chromosome 13 L000000042|L000000051 13 874337 873291 C 216 2011-02-03 1996-07-31 Glucose-repressible alcohol dehydrogenase II; catalyzes the conversion of ethanol to acetaldehyde; involved in the production of certain carboxylate esters; regulated by ADR1 +S000030697 CDS YMR303C 13 874337 873291 C 2011-02-03 1996-07-31 +S000004920 ORF Verified YMR304W UBP15 ubiquitin-specific protease UBP15 chromosome 13 L000004589 13 874987 878679 W 2011-02-03 1996-07-31 Ubiquitin-specific protease involved in protein deubiquitination; forms a complex with AAA peroxins Pex1p and Pex6p; deubiquitinates mono- and polyubiquitinated forms of Pex5p; deubiquitinates Clb5p, counteracting APC activity, and facilitating both Clb5p accumulation and S phase entry; physically interacts with anaphase-promoting complex/cyclosome (APC/C) activator, Cdh1p; catalytic activity regulated by an N-terminal TRAF-like domain and and C-terminal sequences +S000030883 CDS YMR304W 13 874987 878679 W 2011-02-03 1996-07-31 +S000004919 ORF Dubious YMR304C-A chromosome 13 13 879130 878780 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps 3' end of verified ORF SCW10/YMR305C +S000037462 CDS YMR304C-A 13 879130 878780 C 2011-02-03 1996-07-31 +S000004921 ORF Verified YMR305C SCW10 putative family 17 glucosidase chromosome 13 13 880232 879063 C 2011-02-03 1996-07-31 Cell wall protein with similarity to glucanases; may play a role in conjugation during mating based on mutant phenotype and its regulation by Ste12p; SWC10 has a paralog, SCW4, that arose from the whole genome duplication +S000031740 CDS YMR305C 13 880232 879063 C 2011-02-03 1996-07-31 +S000004923 ORF Verified YMR306W FKS3 putative 1,3-beta-D-glucan synthase chromosome 13 L000004080 13 881159 886516 W 2011-02-03 1996-07-31 Protein involved in spore wall assembly; has similarity to 1,3-beta-D-glucan synthase catalytic subunits Fks1p and Gsc2p; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032042 CDS YMR306W 13 881159 886516 W 2011-02-03 1996-07-31 +S000004922 ORF Dubious YMR306C-A chromosome 13 13 886572 886183 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 3' end of ORF FKS3/YMR306W +S000034582 CDS YMR306C-A 13 886572 886183 C 2011-02-03 1996-07-31 +S000004924 ORF Verified YMR307W GAS1 1,3-beta-glucanosyltransferase GAS1|GGP1|CWH52 chromosome 13 L000000669 13 887003 888682 W 2011-02-03 1997-07-17 Beta-1,3-glucanosyltransferase; required for cell wall assembly and also has a role in transcriptional silencing; localizes to cell surface via a glycosylphosphatidylinositol (GPI) anchor; also found at nuclear periphery; genetic interactions with histone H3 lysine acetyltransferases GCN5 and SAS3 indicate previously unsuspected functions for Gas1 in DNA damage response and cell cycle regulation +S000032131 CDS YMR307W 13 887003 888682 W 2011-02-03 1997-07-17 +S000028578 ORF Dubious YMR307C-A chromosome 13 13 887925 887731 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene GAS1/YMR307W +S000031312 CDS YMR307C-A 13 887925 887731 C 2011-02-03 2003-07-29 +S000004925 ORF Verified YMR308C PSE1 KAP121 chromosome 13 L000001519 13 892221 888952 C 2011-02-03 1996-07-31 Karyopherin/importin that interacts with the nuclear pore complex; acts as the nuclear import receptor for specific proteins, including Pdr1p, Yap1p, Ste12p, and Aft1p +S000032994 CDS YMR308C 13 892221 888952 C 2011-02-03 1996-07-31 +S000004926 ORF Verified YMR309C NIP1 translation initiation factor eIF3 core subunit c chromosome 13 L000001252 13 895426 892988 C 2011-02-03 1996-07-31 eIF3c subunit of the eukaryotic translation initiation factor 3 (eIF3); involved in the assembly of preinitiation complex and start codon selection; eIF3 is also involved in programmed stop codon readthrough +S000033088 CDS YMR309C 13 895426 892988 C 2011-02-03 1996-07-31 +S000004927 ORF Uncharacterized YMR310C putative methyltransferase chromosome 13 13 896669 895716 C 2011-02-03 1996-07-31 Putative methyltransferase; predicted to be involved in ribosome biogenesis; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; not an essential gene; YMR310C has a paralog, YGR283C, that arose from the whole genome duplication +S000032818 CDS YMR310C 13 896669 895716 C 2011-02-03 1996-07-31 +S000004928 ORF Verified YMR311C GLC8 chromosome 13 L000000707 13 897603 896914 C 2011-02-03 1996-07-31 Regulatory subunit of protein phosphatase 1 (Glc7p); involved in glycogen metabolism and chromosome segregation; proposed to regulate Glc7p activity via conformational alteration; ortholog of the mammalian protein phosphatase inhibitor 2; protein abundance increases in response to DNA replication stress +S000034823 CDS YMR311C 13 897603 896914 C 2011-02-03 1996-07-31 +S000118381 ARS ARS1332 ARSXIII-898 chromosome 13 13 897935 897985 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178164 ARS_consensus_sequence ARS1332 13 897977 897961 C 2014-11-18 2014-11-18 +S000004929 ORF Verified YMR312W ELP6 Elongator subunit ELP6|KTI4|TOT6|HAP3 chromosome 13 13 898405 899226 W 2011-02-03 1996-07-31 Subunit of hexameric RecA-like ATPase Elp456 Elongator subcomplex; which is required for modification of wobble nucleosides in tRNA; required for Elongator structural integrity +S000035014 CDS YMR312W 13 898405 899226 W 2011-02-03 1996-07-31 +S000004930 ORF Verified YMR313C TGL3 bifunctional triglyceride lipase/lysophosphatidylethanolamine acyltransferase chromosome 13 13 901307 899379 C 2011-02-03 1996-07-31 Bifunctional triacylglycerol lipase and LPE acyltransferase; major lipid particle-localized triacylglycerol (TAG) lipase; catalyzes acylation of lysophosphatidylethanolamine (LPE), a function which is essential for sporulation; protein level and stability of Tgl3p are markedly reduced in the absence of lipid droplets; required with Tgl4p for timely bud formation +S000035060 CDS YMR313C 13 901307 899379 C 2011-02-03 1996-07-31 +S000004931 ORF Verified YMR314W PRE5 proteasome core particle subunit alpha 6 chromosome 13 L000001487 13 901709 902413 W 2011-02-03 1996-07-31 Alpha 6 subunit of the 20S proteasome; protein abundance increases in response to DNA replication stress +S000035211 CDS YMR314W 13 901709 902413 W 2011-02-03 1996-07-31 +S000004932 ORF Verified YMR315W chromosome 13 13 902800 903849 W 2011-02-03 1996-07-31 Protein with NADP(H) oxidoreductase activity; transcription is regulated by Stb5p in response to NADPH depletion induced by diamide; promoter contains a putative Stb5p binding site; protein abundance increases in response to DNA replication stress +S000036057 CDS YMR315W 13 902800 903849 W 2011-02-03 1996-07-31 +S000028697 ORF Uncharacterized YMR315W-A chromosome 13 13 904286 904393 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000032606 CDS YMR315W-A 13 904286 904393 W 2011-02-03 2003-07-29 +S000004935 ORF Verified YMR316W DIA1 chromosome 13 13 904825 905835 W 2011-02-03 1996-07-31 Protein of unknown function; involved in invasive and pseudohyphal growth; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000036198 CDS YMR316W 13 904825 905835 W 2011-02-03 1996-07-31 +S000004933 ORF Uncharacterized YMR316C-A chromosome 13 13 905973 905662 C 2011-02-03 1996-07-31 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; mRNA identified as translated by ribosome profiling data; overlaps the verified gene DIA1/YMR316W +S000036747 CDS YMR316C-A 13 905973 905662 C 2011-02-03 1996-07-31 +S000004936 ORF Uncharacterized YMR317W chromosome 13 13 907364 910786 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; has some similarity to sialidase from Trypanosoma; YMR317W is not an essential gene +S000031682 CDS YMR317W 13 907364 910786 W 2011-02-03 1996-07-31|2011-02-03 +S000004934 ORF Dubious YMR316C-B chromosome 13 13 907629 907321 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps 5' end of ORF YMR317W +S000036748 CDS YMR316C-B 13 907629 907321 C 2011-02-03 1996-07-31 +S000004937 ORF Verified YMR318C ADH6 NADP-dependent alcohol dehydrogenase|ADHVI chromosome 13 13 912143 911061 C 2011-02-03 1996-07-31 NADPH-dependent medium chain alcohol dehydrogenase; has broad substrate specificity; member of the cinnamyl family of alcohol dehydrogenases; may be involved in fusel alcohol synthesis or in aldehyde tolerance; protein abundance increases in response to DNA replication stress +S000031726 CDS YMR318C 13 912143 911061 C 2011-02-03 1996-07-31 +S000004938 ORF Verified YMR319C FET4 chromosome 13 L000000611 13 914538 912880 C 2011-02-03 1996-07-31 Low-affinity Fe(II) transporter of the plasma membrane +S000031875 CDS YMR319C 13 914538 912880 C 2011-02-03 1996-07-31 +S000004939 ORF Uncharacterized YMR320W chromosome 13 13 916746 917051 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YMR320W is not an essential gene +S000036413 CDS YMR320W 13 916746 917051 W 2011-02-03 1996-07-31 +S000004940 ORF Uncharacterized YMR321C chromosome 13 13 917896 917579 C 2011-02-03 1996-07-31 Putative protein of unknown function; proposed to be a palmitoylated membrane protein; YMR321C has a paralog, SAM4, that arose from a single-locus duplication +S000036437 CDS YMR321C 13 917896 917579 C 2011-02-03 1996-07-31 +S000130193 ARS ARS1333 chromosome 13 13 917896 918366 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004941 ORF Verified YMR322C SNO4 glutathione-independent methylglyoxalase family protein|HSP34 chromosome 13 13 919079 918366 C 2011-02-03 1996-07-31 Possible chaperone and cysteine protease; required for transcriptional reprogramming during the diauxic shift and for survival in stationary phase; similar to bacterial Hsp31 and yeast Hsp31p, Hsp32p, and Hsp33p; DJ-1/ThiJ/PfpI superfamily member; predicted involvement in pyridoxine metabolism; induced by mild heat stress and copper deprivation +S000037082 CDS YMR322C 13 919079 918366 C 2011-02-03 1996-07-31 +S000004942 ORF Verified YMR323W ERR3 phosphopyruvate hydratase ERR3 chromosome 13 13 920088 921401 W 2011-02-03 1996-07-31 Enolase, a phosphopyruvate hydratase; catalyzes the conversion of 2-phosphoglycerate to phosphoenolpyruvate; complements the growth defect of an ENO1 ENO2 double mutant in glucose +S000037230 CDS YMR323W 13 920088 921401 W 2011-02-03 1996-07-31 +S000004943 ORF Dubious YMR324C chromosome 13 13 922444 922202 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription is AZF1 dependent in glycerol-lactate medium and SLT2 dependent in response to the lipid hydroperoxides +S000037270 CDS YMR324C 13 922444 922202 C 2011-02-03 1996-07-31 +S000004944 ORF Verified YMR325W PAU19 seripauperin PAU19 chromosome 13 13 922641 923015 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions +S000037375 CDS YMR325W 13 922641 923015 W 2011-02-03 1996-07-31 +S000130194 ARS ARS1335 chromosome 13 13 923015 923494 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028989 telomere TEL13R chromosome 13 13 923541 924431 W 219 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XIII; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats +S000028990 telomeric_repeat TEL13R 13 924307 924431 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XIII +S000028991 X_element TEL13R 13 923541 924005 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XIII; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YMR326C +S000028992 X_element_combinatorial_repeat TEL13R 13 924006 924306 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XIII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000004945 ORF Dubious YMR326C chromosome 13 13 923802 923494 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the telomere on the right arm of chromosome 13 +S000037400 CDS YMR326C 13 923802 923494 C 2011-02-03 1996-07-31 +S000028704 ORF Dubious YNL339W-B chromosome 14 14 734 1216 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032643 CDS YNL339W-B 14 734 1216 W 2003-07-29 2003-07-29 +S000028703 ORF Dubious YNL339W-A chromosome 14 14 1517 2092 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032637 CDS YNL339W-A 14 1517 2092 W 2003-07-29 2003-07-29 +S000005283 ORF Verified YNL339C YRF1-6 Y' element ATP-dependent helicase protein 1 copy 6|YRF1 chromosome 14 14 6098 371 C 1996-07-31 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p +S000031358 CDS YNL339C 14 5931 371 C 1996-07-31 1996-07-31 +S000031357 CDS YNL339C 14 6098 6080 C 1996-07-31 1996-07-31 +S000031359 intron YNL339C 14 6079 5932 C 1996-07-31 1996-07-31 +S000005282 ORF Dubious YNL338W chromosome 14 14 6561 6719 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps TEL14L-XC, which is a telomeric X element core sequence on the left arm of chromosome XIV +S000030505 CDS YNL338W 14 6561 6719 W 1996-07-31 1996-07-31 +S000005281 ORF Dubious YNL337W chromosome 14 14 7165 7419 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030361 CDS YNL337W 14 7165 7419 W 1996-07-31 1996-07-31 +S000028924 telomere TEL14L chromosome 14 14 7428 1 C -238 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XIV; composed of an X element core sequence, X element combinatorial repeats, a short stretch of telomeric repeats, and a long Y' element +S000028925 telomeric_repeat TEL14L 14 6691 6618 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome XIV; spans ORF YNL338W +S000028926 X_element TEL14L 14 7428 6964 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XIV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YNL337W +S000028927 X_element_combinatorial_repeat TEL14L 14 6963 6692 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XIV; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000028928 Y_prime_element TEL14L 14 6617 1 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome XIV; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YRF1-6/YNL339C, YNL339W-A, YNL339W-B) +S000005280 ORF Verified YNL336W COS1 chromosome 14 L000004060 14 8330 9475 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000030202 CDS YNL336W 14 8330 9475 W 1996-07-31 1996-07-31 +S000005279 ORF Verified YNL335W DDI3 cyanamide hydratase chromosome 14 14 11452 12129 W 1996-07-31 1996-07-31 Cyanamide hydratase that detoxifies cyanamide; member of the HD domain metalloprotein superfamily; expression is induced over 100-fold by cyanamide and by SN2-type DNA alkylating agents such as MMS and DMA; induction decreased in rad6 and rad18 mutants; gene and protein are identical to DDI2 and Ddi2p +S000037479 CDS YNL335W 14 11452 12129 W 1996-07-31 1996-07-31 +S000005278 ORF Verified YNL334C SNO2 putative pyridoxal 5'-phosphate synthase chromosome 14 L000003452 14 12876 12208 C 1996-07-31 1996-07-31 Protein of unknown function; nearly identical to Sno3p; expression is induced before the diauxic shift and also in the absence of thiamin +S000037293 CDS YNL334C 14 12876 12208 C 1996-07-31 1996-07-31 +S000005277 ORF Verified YNL333W SNZ2 pyridoxine biosynthesis protein SNZ2 chromosome 14 L000002576 14 13267 14163 W 1996-07-31 1996-07-31 Member of a stationary phase-induced gene family; transcription of SNZ2 is induced prior to diauxic shift, and also in the absence of thiamin in a Thi2p-dependent manner; forms a coregulated gene pair with SNO2; interacts with Thi11p +S000037255 CDS YNL333W 14 13267 14163 W 1996-07-31 1996-07-31 +S000005276 ORF Verified YNL332W THI12 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 14 L000003223 14 14832 15854 W 1996-07-31 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP +S000036570 CDS YNL332W 14 14832 15854 W 1996-07-31 1996-07-31 +S000005275 ORF Verified YNL331C AAD14 putative aryl-alcohol dehydrogenase chromosome 14 L000004676 14 17248 16118 C 1996-07-31 1996-07-31 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family +S000036424 CDS YNL331C 14 17248 16118 C 1996-07-31 1996-07-31 +S000005274 ORF Verified YNL330C RPD3 histone deacetylase RPD3|MOF6|SDS6|SDI2|REC3 chromosome 14 L000001696|L000001603 14 19302 18001 C -237 1996-07-31 1996-07-31 Histone deacetylase, component of both the Rpd3S and Rpd3L complexes; regulates transcription, silencing, autophagy and other processes by influencing chromatin remodeling; forms at least two different complexes which have distinct functions and members; Rpd3(L) recruitment to the subtelomeric region is regulated by interaction with the arginine methyltransferase, Hmt1p +S000036315 CDS YNL330C 14 19302 18001 C 1996-07-31 1996-07-31 +S000005273 ORF Verified YNL329C PEX6 AAA family ATPase peroxin 6|PAS8 chromosome 14 L000001341 14 22633 19541 C 1996-07-31 1996-07-31 AAA-peroxin; heterodimerizes with AAA-peroxin Pex1p and participates in the recycling of peroxisomal signal receptor Pex5p from the peroxisomal membrane to the cystosol; mutations in human PEX6 can lead to severe peroxisomal disorders and early death +S000034361 CDS YNL329C 14 22633 19541 C 1996-07-31 1996-07-31 +S000005272 ORF Verified YNL328C MDJ2 chromosome 14 L000004357 14 23274 22834 C 1996-07-31 1996-07-31 Constituent of the mitochondrial import motor; associated with the presequence translocase; function overlaps with that of Pam18p; stimulates the ATPase activity of Ssc1p to drive mitochondrial import; contains a J domain +S000034238 CDS YNL328C 14 23274 22834 C 1996-07-31 1996-07-31 +S000005271 ORF Verified YNL327W EGT2 chromosome 14 L000004074 14 24048 27173 W 2011-02-03 1996-07-31|2011-02-03 Glycosylphosphatidylinositol (GPI)-anchored cell wall endoglucanase; required for proper cell separation after cytokinesis; expression is activated by Swi5p and tightly regulated in a cell cycle-dependent manner +S000034184 CDS YNL327W 14 24048 27173 W 2011-02-03 1996-07-31|2011-02-03 +S000005270 ORF Verified YNL326C PFA3 palmitoyltransferase PFA3 chromosome 14 14 28347 27337 C 2011-02-03 1996-07-31 Palmitoyltransferase for Vac8p; required for vacuolar membrane fusion; contains an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain; autoacylates; required for vacuolar integrity under stress conditions +S000033265 CDS YNL326C 14 28347 27337 C 2011-02-03 1996-07-31 +S000118382 ARS ARS1405 ARSXIV-29 chromosome 14 14 28469 28700 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178165 ARS_consensus_sequence ARS1405 14 28654 28638 C 2014-11-18 2014-11-18 +S000005268 ORF Dubious YNL324W chromosome 14 14 31050 31445 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033183 CDS YNL324W 14 31050 31445 W 2011-02-03 1996-07-31 +S000005269 ORF Verified YNL325C FIG4 phosphatidylinositol-3,5-bisphosphate 5-phosphatase chromosome 14 L000003583 14 31378 28739 C 2011-02-03 1996-07-31 Phosphatidylinositol 3,5-bisphosphate (PtdIns[3,5]P) phosphatase; required for efficient mating and response to osmotic shock; physically associates with and regulated by Vac14p; contains a SAC1-like domain; homologous to human FIG4, which is associated with CMT4J, a form of Charcot-Marie-Tooth disorder +S000033213 CDS YNL325C 14 31378 28739 C 2011-02-03 1996-07-31 +S000005267 ORF Verified YNL323W LEM3 ROS3|BRE3 chromosome 14 14 31944 33188 W 2011-02-03 1996-07-31 Membrane protein of the plasma membrane and ER; interacts specifically in vivo with the phospholipid translocase (flippase) Dnf1p; involved in translocation of phospholipids and alkylphosphocholine drugs across the plasma membrane; null mutant requires tryptophan due to mislocalization of tryptophan permease Tat2p +S000033125 CDS YNL323W 14 31944 33188 W 2011-02-03 1996-07-31 +S000005266 ORF Verified YNL322C KRE1 chromosome 14 L000000912 14 34235 33294 C -235 2011-02-03 1996-07-31 Cell wall glycoprotein involved in beta-glucan assembly; serves as a K1 killer toxin membrane receptor +S000032211 CDS YNL322C 14 34235 33294 C 2011-02-03 1996-07-31 +S000005265 ORF Verified YNL321W VNX1 chromosome 14 14 34696 37422 W 2011-02-03 1996-07-31 Calcium/H+ antiporter localized to the endoplasmic reticulum membrane; member of the calcium exchanger (CAX) family; potential Cdc28p substrate +S000032167 CDS YNL321W 14 34696 37422 W 2011-02-03 1996-07-31 +S000005264 ORF Uncharacterized YNL320W chromosome 14 14 37700 38554 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032112 CDS YNL320W 14 37700 38554 W 2011-02-03 1996-07-31 +S000005263 ORF Dubious YNL319W chromosome 14 14 38642 39082 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene HXT14 +S000031153 CDS YNL319W 14 38642 39082 W 2011-02-03 1996-07-31 +S000005262 ORF Verified YNL318C HXT14 chromosome 14 L000002762 14 40329 38707 C 2011-02-03 1996-07-31 Protein with similarity to hexose transporter family members; expression is induced in low glucose and repressed in high glucose; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000030981 CDS YNL318C 14 40329 38707 C 2011-02-03 1996-07-31 +S000005261 ORF Verified YNL317W PFS2 cleavage polyadenylation factor subunit PFS2 chromosome 14 14 40619 42016 W 2011-02-03 1996-07-31 Integral subunit of the pre-mRNA CPF complex; the cleavage and polyadenylation factor (CPF) complex plays an essential role in mRNA 3'-end formation by bridging different processing factors and thereby promoting the assembly of the processing complex +S000030052 CDS YNL317W 14 40619 42016 W 2011-02-03 1996-07-31 +S000005260 ORF Verified YNL316C PHA2 prephenate dehydratase PHA2 chromosome 14 L000001414 14 43075 42071 C -227 2011-02-03 2003-09-22|1996-07-31 Prephenate dehydratase; catalyzes the conversion of prephanate to phenylpyruvate, which is a step in the phenylalanine biosynthesis pathway +S000029856 CDS YNL316C 14 43075 42071 C 2011-02-03 2003-09-22|1996-07-31 +S000005259 ORF Verified YNL315C ATP11 chromosome 14 L000000148 14 44280 43324 C 2011-02-03 1996-07-31 Molecular chaperone; required for the assembly of alpha and beta subunits into the F1 sector of mitochondrial F1F0 ATP synthase; N-terminally propionylated in vivo +S000037828 CDS YNL315C 14 44280 43324 C 2011-02-03 1996-07-31 +S000005258 ORF Verified YNL314W DAL82 DURM chromosome 14 L000000482 14 44447 45214 W 2011-02-03 1996-07-31 Positive regulator of allophanate inducible genes; binds a dodecanucleotide sequence upstream of all genes that are induced by allophanate; contains an UISALL DNA-binding, a transcriptional activation, and a coiled-coil domain +S000037152 CDS YNL314W 14 44447 45214 W 2011-02-03 1996-07-31 +S000005257 ORF Verified YNL313C EMW1 tetratricopeptide repeat-containing protein EMW1 chromosome 14 14 48022 45308 C 2011-02-03 1996-07-31 Essential conserved protein with a role in cell wall integrity; contains six TPR (tetratricopeptide repeat) domains clustered in the C-terminal region; conditional mutant is suppressed by overexpression of GFA1; protein abundance increases in response to DNA replication stress +S000037005 CDS YNL313C 14 48022 45308 C 2011-02-03 1996-07-31 +S000005256 ORF Verified YNL312W RFA2 RPA32|RPA2|BUF1 chromosome 14 L000000203|L000001621 14 48287 49216 W 2011-02-03 1996-07-31 Subunit of heterotrimeric Replication Protein A (RPA); RPA is a highly conserved single-stranded DNA binding protein involved in DNA replication, repair, and recombination; RPA protects against inappropriate telomere recombination, and upon telomere uncapping, prevents cell proliferation by a checkpoint-independent pathway; in concert with Sgs1p-Top2p-Rmi1p, stimulates DNA catenation/decatenation activity of Top3p; protein abundance increases in response to DNA replication s +S000036978 CDS YNL312W 14 48287 48293 W 2011-02-03 1996-07-31 +S000036979 CDS YNL312W 14 48402 49216 W 2011-02-03 1996-07-31 +S000036980 intron YNL312W 14 48294 48401 W 2011-02-03 1996-07-31 +S000005255 ORF Verified YNL311C SKP2 putative SCF ubiquitin ligase complex subunit SKP2 chromosome 14 14 51688 49397 C 2011-02-03 1996-07-31 F-box protein of unknown function; predicted to be part of an SCF ubiquitin protease complex; involved in regulating protein levels of sulfur metabolism enzymes; may interact with ribosomes, based on co-purification experiments +S000036212 CDS YNL311C 14 51688 49397 C 2011-02-03 1996-07-31 +S000005254 ORF Verified YNL310C ZIM17 HEP1|TIM15|FMP28 chromosome 14 14 52431 51907 C 2011-02-03 1996-07-31|2006-05-10 Protein co-chaperone with a zinc finger motif; essential for protein import into mitochondria; may act with Pam18p to facilitate recognition and folding of imported proteins by Ssc1p (mtHSP70) in the mitochondrial matrix; required for the maintenance of Ssc1p solubility and assists in the functional interaction of Ssc1p with substrate proteins +S000036042 CDS YNL310C 14 52431 51907 C 2011-02-03 1996-07-31|2006-05-10 +S000005253 ORF Verified YNL309W STB1 chromosome 14 L000002107 14 52662 53924 W 2011-02-03 2003-09-22|1996-07-31 Protein with role in regulation of MBF-specific transcription at Start; phosphorylated by Cln-Cdc28p kinases in vitro; unphosphorylated form binds Swi6p, which is required for Stb1p function; expression is cell-cycle regulated; STB1 has a paralog, YOL131W, that arose from the whole genome duplication +S000035181 CDS YNL309W 14 52662 53924 W 2011-02-03 2003-09-22|1996-07-31 +S000005252 ORF Verified YNL308C KRI1 chromosome 14 S000007481 14 55897 54122 C 2011-02-03 1996-07-31 Essential nucleolar protein required for 40S ribosome biogenesis; associate with snR30; physically and functionally interacts with Krr1p +S000034918 CDS YNL308C 14 55897 54122 C 2011-02-03 1996-07-31 +S000005251 ORF Verified YNL307C MCK1 serine/threonine/tyrosine protein kinase MCK1|CMS1|YPK1 chromosome 14 L000001036|S000029094|L000000369 14 57573 56446 C 1996-07-31 1996-07-31 Dual-specificity ser/thr and tyrosine protein kinase; roles in chromosome segregation, meiotic entry, genome stability, phosphorylation-dependent protein degradation (Rcn1p and Cdc6p), inhibition of protein kinase A, transcriptional regulation, inhibition of RNA pol III, calcium stress and inhibition of Clb2p-Cdc28p after nuclear division; MCK1 has a paralog, YGK3, that arose from the whole genome duplication +S000034016 CDS YNL307C 14 57573 56446 C 1996-07-31 1996-07-31 +S000005250 ORF Verified YNL306W MRPS18 mitochondrial 37S ribosomal protein YmS18|YmS18 chromosome 14 14 58155 58808 W 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the small subunit; essential for viability, unlike most other mitoribosomal proteins +S000033967 CDS YNL306W 14 58155 58808 W 1996-07-31 1996-07-31 +S000005249 ORF Verified YNL305C BXI1 YBH3 chromosome 14 14 59791 58898 C 1996-07-31 1996-07-31 Protein involved in apoptosis; variously described as containing a BCL-2 homology (BH3) domain or as a member of the BAX inhibitor family; reported to promote apoptosis under some conditions and to inhibit it in others; localizes to ER and vacuole; may link the unfolded protein response to apoptosis via regulation of calcium-mediated signaling; translocates to mitochondria under apoptosis-inducing conditions in a process involving Mir1p and Cor1p +S000033769 CDS YNL305C 14 59791 58898 C 1996-07-31 1996-07-31 +S000005248 ORF Verified YNL304W YPT11 Rab family GTPase YPT11 chromosome 14 14 60297 61550 W 2005-11-07 1996-07-31|2005-11-07 Rab GTPase; Myo2p-binding protein implicated in mother-to-bud transport of cortical endoplasmic reticulum (ER), late Golgi, and mitochondria during cell division; function is regulated at multiple levels; abundance of active Ypt11p forms is controlled by phosphorylation status and degradation; normally a low-abundance protein whose ER localization is only detected when protein is highly over expressed +S000033723 CDS YNL304W 14 60297 61550 W 2005-11-07 1996-07-31|2005-11-07 +S000005247 ORF Dubious YNL303W chromosome 14 14 61510 61857 W 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033069 CDS YNL303W 14 61510 61857 W 2005-11-07 1996-07-31 +S000118383 ARS ARS1406 ARSXIV-62 chromosome 14 14 61599 61895 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178166 ARS_consensus_sequence ARS1406 14 61694 61710 W 2014-11-18 2014-11-18 +S000005246 ORF Verified YNL302C RPS19B eS19|ribosomal 40S subunit protein S19B|S19e|rp55B|YS16B|S19B|S16aB|RP55B chromosome 14 L000002703|L000002725 14 62943 61958 C 2005-11-07 1996-07-31 Protein component of the small (40S) ribosomal subunit; required for assembly and maturation of pre-40 S particles; homologous to mammalian ribosomal protein S19, no bacterial homolog; mutations in human RPS19 are associated with Diamond Blackfan anemia; RPS19B has a paralog, RPS19A, that arose from the whole genome duplication +S000032915 CDS YNL302C 14 62372 61958 C 2005-11-07 1996-07-31 +S000032914 CDS YNL302C 14 62943 62924 C 2005-11-07 1996-07-31 +S000032916 intron YNL302C 14 62923 62373 C 2005-11-07 1996-07-31 +S000005245 ORF Verified YNL301C RPL18B eL18|ribosomal 60S subunit protein L18B|L18e|rp28B|L18B|RP28B chromosome 14 L000002702 14 64562 63570 C 2005-11-07 1996-07-31 Ribosomal 60S subunit protein L18B; homologous to mammalian ribosomal protein L18, no bacterial homolog; RPL18B has a paralog, RPL18A, that arose from the whole genome duplication +S000032846 CDS YNL301C 14 64018 63570 C 2005-11-07 1996-07-31 +S000032845 CDS YNL301C 14 64562 64451 C 2005-11-07 1996-07-31 +S000032847 intron YNL301C 14 64450 64019 C 2005-11-07 1996-07-31 +S000005244 ORF Uncharacterized YNL300W TOS6 chromosome 14 14 65744 66052 W 2005-11-07 1996-07-31 Glycosylphosphatidylinositol-dependent cell wall protein; expression is periodic and decreases in respone to ergosterol perturbation or upon entry into stationary phase; depletion increases resistance to lactic acid +S000032776 CDS YNL300W 14 65744 66052 W 2005-11-07 1996-07-31 +S000005243 ORF Verified YNL299W TRF5 non-canonical poly(A) polymerase TRF5 chromosome 14 L000003385 14 66517 68445 W 2005-11-07 1996-07-31|2005-11-03 Non-canonical poly(A) polymerase; involved in nuclear RNA degradation as a component of the TRAMP complex; catalyzes polyadenylation of hypomodified tRNAs, and snoRNA and rRNA precursors; overlapping but non-redundant functions with Pap2p +S000035690 CDS YNL299W 14 66517 68445 W 2005-11-07 1996-07-31|2005-11-03 +S000005242 ORF Verified YNL298W CLA4 serine/threonine protein kinase CLA4|ERC10 chromosome 14 L000000564|L000002643 14 68915 71443 W 2005-11-07 1996-07-31 Cdc42p-activated signal transducing kinase; member of the PAK (p21-activated kinase) family, along with Ste20p and Skm1p; involved in septin ring assembly, vacuole inheritance, cytokinesis, sterol uptake regulation; phosphorylates Cdc3p and Cdc10p; CLA4 has a paralog, SKM1, that arose from the whole genome duplication +S000035601 CDS YNL298W 14 68915 71443 W 2005-11-07 1996-07-31 +S000005240 ORF Dubious YNL296W chromosome 14 14 76273 76587 W 2005-11-07 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; deletion adversely affects sporulation; deletion mutant exhibits synthetic phenotype under expression of mutant huntingtin fragment, but gene does not have human ortholog +S000034476 CDS YNL296W 14 76273 76587 W 2005-11-07 1996-07-31 +S000005241 ORF Verified YNL297C MON2 YSL2 chromosome 14 14 76583 71673 C 2005-11-07 1996-07-31 Protein with a role in endocytosis and vacuole integrity; peripheral membrane protein; interacts with and negatively regulates Arl1p; localizes to the endosome; member of the Sec7p family of proteins +S000034548 CDS YNL297C 14 76583 71673 C 2005-11-07 1996-07-31 +S000005239 ORF Uncharacterized YNL295W MRX6 chromosome 14 14 76946 78520 W 2005-11-07 1996-07-31 Protein that associates with mitochondrial ribosome +S000034395 CDS YNL295W 14 76946 78520 W 2005-11-07 1996-07-31 +S000005238 ORF Verified YNL294C RIM21 PAL2 chromosome 14 14 80260 78659 C 2005-11-07 1996-07-31 pH sensor molecule, component of the RIM101 pathway; has a role in cell wall construction and alkaline pH response; is glycosylated and phosphorylated; interacts with Dfg16p and Rim9p to form a pH-sensing complex; localization to the plasma membrane is dependent on Dfg16p and Rim9p; has similarity to A. nidulans PalH +S000033436 CDS YNL294C 14 80260 78659 C 2005-11-07 1996-07-31 +S000005237 ORF Verified YNL293W MSB3 Rab GTPase-activating protein MSB3|GYP3 chromosome 14 L000003918 14 80640 82541 W 2005-11-07 1996-07-31 Rab GTPase-activating protein; regulates endocytosis via inactivation of Vps21p at endosomes and vacuole fusion via inactivation of Ypt7p at vacuoles; also acts on Ypt52p and Sec4p; localizes to plasma membrane, sites of polarized growth; relocalizes from bud neck to cytoplasm upon DNA replication stress; similar to TBC-domain Tre2 oncogene; MSB3 has a paralog, MSB4, that arose from the whole genome duplication; human homolog USP6NL can complement yeast msb3 msb4 double null +S000033388 CDS YNL293W 14 80640 82541 W 2005-11-07 1996-07-31 +S000005236 ORF Verified YNL292W PUS4 pseudouridine synthase PUS4 chromosome 14 L000003347 14 82806 84017 W 2005-11-07 1996-07-31 Pseudouridine synthase; catalyzes only the formation of pseudouridine-55 (Psi55), a highly conserved tRNA modification, in mitochondrial and cytoplasmic tRNAs; also responsible for pseudouracil modification of some mRNAs; PUS4 overexpression leads to translational derepression of GCN4 (Gcd- phenotype) +S000033311 CDS YNL292W 14 82806 84017 W 2005-11-07 1996-07-31 +S000005235 ORF Verified YNL291C MID1 chromosome 14 L000002584 14 85815 84169 C 2005-11-07 1996-07-31 N-glycosylated integral membrane protein of the ER and plasma membrane; functions as a stretch-activated Ca2+-permeable cation channel required for Ca2+ influx stimulated by pheromone; interacts with Cch1p; forms an oligomer +S000033221 CDS YNL291C 14 85815 84169 C 2005-11-07 1996-07-31 +S000005234 ORF Verified YNL290W RFC3 replication factor C subunit 3 chromosome 14 L000001624 14 86218 87240 W 2005-11-07 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); which is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon; relocalizes to the cytosol in response to hypoxia +S000032410 CDS YNL290W 14 86218 87240 W 2005-11-07 1996-07-31 +S000005233 ORF Verified YNL289W PCL1 HCS26 chromosome 14 L000002783 14 87897 88736 W 2005-11-07 1996-07-31 Cyclin, interacts with cyclin-dependent kinase Pho85p; member of the Pcl1,2-like subfamily, involved in the regulation of polarized growth and morphogenesis and progression through the cell cycle; is ubiquitinated by Dma1p; phosphorylation by Pho85p targets it for degradation; localizes to sites of polarized cell growth +S000032399 CDS YNL289W 14 87897 88736 W 2005-11-07 1996-07-31 +S000007304 snoRNA_gene snR40 SNR40 chromosome 14 L000003055 14 89210 89306 W 2005-11-07 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U898 and small subunit (SSU) rRNA at position G1271 +S000030610 noncoding_exon snR40 14 89210 89306 W 2005-11-07 2000-05-19 +S000118384 ARS ARS1407 ARSXIV-90 chromosome 14 14 89531 89804 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178167 ARS_consensus_sequence ARS1407 14 89755 89739 C 2014-11-18 2014-11-18 +S000005232 ORF Verified YNL288W CAF40 CCR4-NOT core subunit CAF40 chromosome 14 14 90303 91424 W 2005-11-07 1996-07-31 Component of the CCR4-NOT transcriptional complex; evolutionarily conserved; involved in controlling mRNA initiation, elongation, and degradation; binds Cdc39p +S000031389 CDS YNL288W 14 90303 91424 W 2005-11-07 1996-07-31 +S000005231 ORF Verified YNL287W SEC21 coatomer subunit gamma chromosome 14 L000001844 14 91994 94801 W 2005-11-07 1996-07-31 Gamma subunit of coatomer; coatomer is a heptameric protein complex that together with Arf1p forms the COPI coat; involved in ER to Golgi transport of selective cargo +S000031285 CDS YNL287W 14 91994 94801 W 2005-11-07 1996-07-31 +S000005230 ORF Verified YNL286W CUS2 U2 snRNP complex subunit CUS2 chromosome 14 L000003273 14 95223 96080 W 2005-11-07 1996-07-31 Putative checkpoint factor in transcription; binds to U2 snRNA and Prp11p; regulates toggling of the U2 snRNA stem II region between different structures; contains two RNA recognition motifs (RRMs) +S000031155 CDS YNL286W 14 95223 96080 W 2005-11-07 1996-07-31 +S000005229 ORF Dubious YNL285W chromosome 14 14 96173 96544 W 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030192 CDS YNL285W 14 96173 96544 W 2005-11-07 1996-07-31 +S000130140 ARS ARS1409 chromosome 14 14 96247 96463 2009-05-06 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006591 tRNA_gene tG(UCC)N SUF6 chromosome 14 L000003700|L000002154 14 96312 96241 C -192 2005-11-07 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000037566 noncoding_exon tG(UCC)N 14 96312 96241 C 2005-11-07 2000-05-19 +S000007140 long_terminal_repeat YNLWtau1 chromosome 14 14 96451 96609 W 2005-11-07 2000-05-19 Ty4 LTR +S000007129 long_terminal_repeat YNLCdelta1 chromosome 14 14 96941 96610 C 2005-11-07 2000-05-19 Ty1 LTR +S000007387 transposable_element_gene YNL284C-B gag-pol fusion protein chromosome 14 S000029017 14 102232 96964 C 2005-11-07 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000031728 CDS YNL284C-B 14 100926 96964 C 2005-11-07 1999-07-17 +S000031727 CDS YNL284C-B 14 102232 100928 C 2005-11-07 1999-07-17 +S000031729 plus_1_translational_frameshift YNL284C-B 14 100927 100927 C 2005-11-07 1999-07-17 +S000007386 transposable_element_gene YNL284C-A gag protein chromosome 14 14 102232 100910 C 2005-11-07 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000031717 CDS YNL284C-A 14 102232 100910 C 2005-11-07 1999-07-17 +S000007134 LTR_retrotransposon YNLCTy1-1 Ty1 chromosome 14 14 102523 96610 C 2005-11-07 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007130 long_terminal_repeat YNLCdelta2 chromosome 14 14 102523 102192 C 2005-11-07 2000-05-19 Ty1 LTR +S000007133 long_terminal_repeat YNLCsigma1 chromosome 14 14 102700 102632 C 2005-11-07 2000-05-19 Ty3 LTR +S000006673 tRNA_gene tN(GUU)N1 chromosome 14 L000003687 14 102716 102789 W 2005-11-07 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000035559 noncoding_exon tN(GUU)N1 14 102716 102789 W 2005-11-07 2000-05-19 +S000005228 ORF Verified YNL284C MRPL10 mitochondrial 54S ribosomal protein YmL10/YmL18|YmL10|YmL18|MRPL18 chromosome 14 L000002689|S000029308|L000002685 14 104102 103134 C 2005-11-07 1996-07-31 Mitochondrial ribosomal protein of the large subunit; appears as two protein spots (YmL10 and YmL18) on two-dimensional SDS gels +S000029964 CDS YNL284C 14 104102 103134 C 2005-11-07 1996-07-31 +S000006744 tRNA_gene tT(AGU)N1 chromosome 14 L000003688 14 104805 104877 W 2005-11-07 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000037414 noncoding_exon tT(AGU)N1 14 104805 104877 W 2005-11-07 2000-05-19 +S000005227 ORF Verified YNL283C WSC2 STA3 chromosome 14 L000004217 14 106695 105184 C 2005-11-07 1996-07-31 Sensor-transducer of the stress-activated PKC1-MPK1 signaling pathway; involved in maintenance of cell wall integrity and recovery from heat shock; required for the arrest of secretion response; WSC2 has a paralog, WSC3, that arose from the whole genome duplication +S000037312 CDS YNL283C 14 106695 105184 C 2005-11-07 1996-07-31 +S000005226 ORF Verified YNL282W POP3 chromosome 14 L000004338 14 107687 108274 W 2005-11-07 1996-07-31 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; relocalizes to the cytosol in response to hypoxia +S000037263 CDS YNL282W 14 107687 108274 W 2005-11-07 1996-07-31 +S000005225 ORF Verified YNL281W HCH1 chromosome 14 L000004817 14 108467 108928 W 2005-11-07 1996-07-31 Heat shock protein regulator; binds to Hsp90p and may stimulate ATPase activity; originally identified as a high-copy number suppressor of a HSP90 loss-of-function mutation; role in regulating Hsp90 inhibitor drug sensitivity; GFP-fusion protein localizes to the cytoplasm and nucleus; protein abundance increases in response to DNA replication stress +S000037163 CDS YNL281W 14 108467 108928 W 2005-11-07 1996-07-31 +S000005224 ORF Verified YNL280C ERG24 delta(14)-sterol reductase chromosome 14 L000000580 14 110411 109095 C 2005-11-07 1996-07-31 C-14 sterol reductase; acts in ergosterol biosynthesis; mutants accumulate the abnormal sterol ignosterol (ergosta-8,14 dienol), and are viable under anaerobic growth conditions but inviable on rich medium under aerobic conditions +S000037018 CDS YNL280C 14 110411 109095 C 2005-11-07 1996-07-31 +S000005223 ORF Verified YNL279W PRM1 pheromone-regulated protein PRM1 chromosome 14 14 110917 112902 W 2005-11-07 1996-07-31 Pheromone-regulated multispanning membrane protein; involved in membrane fusion during mating; predicted to have 5 transmembrane segments and a coiled coil domain; localizes to the shmoo tip; regulated by Ste12p +S000035312 CDS YNL279W 14 110917 112902 W 2005-11-07 1996-07-31 +S000005222 ORF Verified YNL278W CAF120 chromosome 14 14 113271 116453 W 2005-11-07 1996-07-31 Part of the CCR4-NOT transcriptional regulatory complex; involved in controlling mRNA initiation, elongation, and degradation; contains a PH-like domain; CAF120 has a paralog, SKG3, that arose from the whole genome duplication +S000035145 CDS YNL278W 14 113271 116453 W 2005-11-07 1996-07-31 +S000028852 ORF Uncharacterized YNL277W-A chromosome 14 14 116679 116867 W 2005-11-07 2003-07-29 Putative protein of unknown function +S000034565 CDS YNL277W-A 14 116679 116867 W 2005-11-07 2003-07-29 +S000005221 ORF Verified YNL277W MET2 homoserine O-acetyltransferase chromosome 14 L000001077 14 117349 118809 W -187 2005-11-07 1996-07-31 L-homoserine-O-acetyltransferase; catalyzes the conversion of homoserine to O-acetyl homoserine which is the first step of the methionine biosynthetic pathway +S000034987 CDS YNL277W 14 117349 118809 W 2005-11-07 1996-07-31 +S000005220 ORF Dubious YNL276C chromosome 14 14 118826 118431 C 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene MET2/YNL277W +S000033996 CDS YNL276C 14 118826 118431 C 2005-11-07 1996-07-31 +S000005219 ORF Verified YNL275W BOR1 chromosome 14 14 119268 120998 W 2005-11-07 1996-07-31 Boron efflux transporter of the plasma membrane; binds HCO3-, I-, Br-, NO3- and Cl-; has similarity to the characterized boron efflux transporter A. thaliana BOR1 +S000033936 CDS YNL275W 14 119268 120998 W 2005-11-07 1996-07-31 +S000005218 ORF Verified YNL274C GOR1 glyoxylate reductase chromosome 14 14 122170 121118 C 2005-11-07 1996-07-31 Glyoxylate reductase; null mutation results in increased biomass after diauxic shift; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress +S000033106 CDS YNL274C 14 122170 121118 C 2005-11-07 1996-07-31 +S000005217 ORF Verified YNL273W TOF1 chromosome 14 L000004244 14 122883 126599 W 2005-11-07 1996-07-31 Subunit of a replication-pausing checkpoint complex; Tof1p-Mrc1p-Csm3p acts at the stalled replication fork to promote sister chromatid cohesion after DNA damage, facilitating gap repair of damaged DNA; interacts with the MCM helicase; relocalizes to the cytosol in response to hypoxia +S000033053 CDS YNL273W 14 122883 126599 W 2005-11-07 1996-07-31 +S000130141 ARS ARS1410 chromosome 14 14 126599 126805 2009-05-06 2009-05-06 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000005216 ORF Verified YNL272C SEC2 guanine nucleotide exchange factor SEC2 chromosome 14 L000001828 14 129084 126805 C -176 2005-11-07 1996-07-31 Guanyl-nucleotide exchange factor for the small G-protein Sec4p; essential for post-Golgi vesicle transport and for autophagy; associates with the exocyst, via exocyst subunit Sec15p, on secretory vesicles +S000032904 CDS YNL272C 14 129084 126805 C 2005-11-07 1996-07-31 +S000005215 ORF Verified YNL271C BNI1 formin BNI1|SHE5|PPF3 chromosome 14 L000000190 14 135383 129522 C 2011-02-03 1996-07-31|2011-02-03 Formin; polarisome component; nucleates the formation of linear actin filaments, involved in cell processes such as budding and mitotic spindle orientation which require the formation of polarized actin cables; recruited to the division site in a Glc7p/Ref2p dependent manner following release of Bnr1p; functionally redundant with BNR1 +S000032829 CDS YNL271C 14 135383 129522 C 2011-02-03 1996-07-31|2011-02-03 +S000005214 ORF Verified YNL270C ALP1 arginine permease ALP1|APL1 chromosome 14 L000000080 14 137661 135940 C 2011-02-03 1996-07-31 Arginine transporter; expression is normally very low and it is unclear what conditions would induce significant expression; ALP1 has a paralog, CAN1, that arose from the whole genome duplication +S000031915 CDS YNL270C 14 137661 135940 C 2011-02-03 1996-07-31 +S000005213 ORF Verified YNL269W BSC4 chromosome 14 14 137699 138094 W 2011-02-03 1996-07-31 Protein of unknown function; protein-coding gene that evolved de novo via a series of point mutations in noncoding sequence; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; readthrough is increased upon depletion of Sup35p; may be involved in DNA repair pathway during stationary phase and contribute to robustness of cells when shifted to a nutrient-poor environment +S000032644 CDS YNL269W 14 137699 138094 W 2011-02-03 1996-07-31 +S000005212 ORF Verified YNL268W LYP1 lysine permease chromosome 14 L000000963 14 138550 140385 W 2011-02-03 1996-07-31 Lysine permease; one of three amino acid permeases (Alp1p, Can1p, Lyp1p) responsible for uptake of cationic amino acids +S000031660 CDS YNL268W 14 138550 140385 W 2011-02-03 1996-07-31 +S000005211 ORF Verified YNL267W PIK1 1-phosphatidylinositol 4-kinase|PIK120|PIK41 chromosome 14 L000001439|L000001438 14 140878 144078 W 2011-02-03 1996-07-31 Phosphatidylinositol 4-kinase; catalyzes first step in the biosynthesis of phosphatidylinositol-4,5-biphosphate; may control cytokinesis through the actin cytoskeleton; may control nonselective autophagy and mitophagy through trafficking of Atg9p +S000031530 CDS YNL267W 14 140878 144078 W 2011-02-03 1996-07-31 +S000005210 ORF Dubious YNL266W chromosome 14 14 144245 144664 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF IST1/YNL265C +S000031404 CDS YNL266W 14 144245 144664 W 2011-02-03 1996-07-31 +S000005209 ORF Verified YNL265C IST1 chromosome 14 14 145281 144280 C 2011-02-03 1996-07-31 Protein with positive role in the multivesicular body sorting pathway; functions and forms a complex with Did2p; recruitment to endosomes is mediated by the Vps2p-Vps24p subcomplex of ESCRT-III; also interacts with Vps4p +S000030432 CDS YNL265C 14 145149 144280 C 2011-02-03 1996-07-31 +S000030431 CDS YNL265C 14 145281 145255 C 2011-02-03 1996-07-31 +S000030433 intron YNL265C 14 145254 145150 C 2011-02-03 1996-07-31 +S000005208 ORF Verified YNL264C PDR17 phosphatidylinositol transporter|SFH4|ISS1 chromosome 14 L000004780 14 146615 145563 C 2011-02-03 1996-07-31 Phosphatidylinositol transfer protein (PITP); downregulates Plb1p-mediated turnover of phosphatidylcholine; forms a complex with Psd2p which appears essential for maintenance of vacuolar PE levels; found in the cytosol and microsomes; homologous to Pdr16p; deletion affects phospholipid composition +S000030276 CDS YNL264C 14 146615 145563 C 2011-02-03 1996-07-31 +S000005207 ORF Verified YNL263C YIF1 chromosome 14 L000004141|L000003364 14 147840 146896 C 2011-02-03 1996-07-31 Integral membrane protein; required for the fusion of ER-derived COPII transport vesicles with the Golgi; interacts with Yip1p and Yos1p; localizes to the Golgi, the ER, and COPII vesicles; homolog of human YIPF3 +S000037532 CDS YNL263C 14 147840 146896 C 2011-02-03 1996-07-31 +S000005206 ORF Verified YNL262W POL2 DNA polymerase epsilon catalytic subunit|DUN2 chromosome 14 L000001461 14 148212 154880 W -170 2011-02-03 1996-07-31 Catalytic subunit of DNA polymerase (II) epsilon; a chromosomal DNA replication polymerase that exhibits processivity and proofreading exonuclease activity; participates in leading-strand synthesis during DNA replication; also involved in DNA synthesis during DNA repair; interacts extensively with Mrc1p +S000037477 CDS YNL262W 14 148212 154880 W 2011-02-03 1996-07-31 +S000005205 ORF Verified YNL261W ORC5 origin recognition complex subunit 5 chromosome 14 L000002814 14 155100 156539 W 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing +S000037358 CDS YNL261W 14 155100 156539 W 2011-02-03 1996-07-31 +S000005204 ORF Verified YNL260C LTO1 ribosome biosynthesis protein LTO1 chromosome 14 14 157455 156859 C 2011-02-03 1996-07-31 Essential protein that forms a complex with Rli1p and Yae1p; ortholog of human ORAOV1, which is overexpressed in solid tumors; inviability of null mutant under standard conditions is complemented by overexpression of ORAOV1; essential for growth under standard (aerobic) conditions but not under anaerobic conditions; may have a role in protection of ribosomal assembly and function from damage due to reactive oxygen species +S000036594 CDS YNL260C 14 157455 156859 C 2011-02-03 1996-07-31 +S000005203 ORF Verified YNL259C ATX1 copper metallochaperone ATX1 chromosome 14 L000000155 14 157865 157644 C 2011-02-03 1996-07-31 Cytosolic copper metallochaperone; transports copper to the secretory vesicle copper transporter Ccc2p for eventual insertion into Fet3p, which is a multicopper oxidase required for high-affinity iron uptake; human homolog ATOX1 can complement yeast atx1 mutant; overexpression of human ATOX1 suppresses lysine auxotrophy of the yeast sod1 null mutant, as does overexpression of yeast ATX1 +S000035583 CDS YNL259C 14 157865 157644 C 2011-02-03 1996-07-31 +S000005202 ORF Verified YNL258C DSL1 RNS1 chromosome 14 L000004950 14 160373 158109 C 2011-02-03 1996-07-31 Peripheral membrane protein needed for Golgi-to-ER retrograde traffic; mediates Sey1p-independent homotypic ER fusion; forms Dsl1 tethering complex with Sec39p and Tip20p that forms a stable complex with ER SNAREs Sec20p, Ufe1p and Use1p and is functionally conserved from yeast to mammalian cells; component of the ER target site that interacts with coatomer; interacts with different subunits of COPI vesicle coat; interacts with Cin5p; homolog of fly and human ZW10 gene +S000035489 CDS YNL258C 14 160373 158109 C 2011-02-03 1996-07-31 +S000005201 ORF Verified YNL257C SIP3 LAM3 chromosome 14 L000001892 14 164320 160631 C 2011-02-03 1996-07-31 Putative sterol transfer protein; has a probable role in retrograde transport of sterols from the plasma membrane to the ER; co-localizes to puncta in the cortical ER with Ysp2p; contains GRAM, StART-like (VASt) and two PH-like domains; one of 6 StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes; previously identified as a transcription cofactor that interacts with DNA-bound Snf1p +S000035355 CDS YNL257C 14 164320 160631 C 2011-02-03 1996-07-31 +S000005200 ORF Verified YNL256W FOL1 trifunctional dihydropteroate synthetase/dihydrohydroxymethylpterin pyrophosphokinase/dihydroneopterin aldolase FOL1 chromosome 14 L000000620 14 164623 167097 W -170 2011-02-03 2003-09-22|1996-07-31 Multifunctional enzyme of the folic acid biosynthesis pathway; has dihydropteroate synthetase, dihydro-6-hydroxymethylpterin pyrophosphokinase, and dihydroneopterin aldolase activities +S000034407 CDS YNL256W 14 164623 167097 W 2011-02-03 2003-09-22|1996-07-31 +S000005199 ORF Verified YNL255C GIS2 mRNA-binding translational activator GIS2 chromosome 14 L000004862 14 167790 167329 C 2011-02-03 1996-07-31 Translational activator for mRNAs with internal ribosome entry sites; associates with polysomes and binds to a specific subset of mRNAs; localizes to RNA processing bodies (P bodies) and to stress granules; may have a role in translation regulation under stress conditions; ortholog of human ZNF9/CNBP, a gene involved in myotonic dystrophy type 2 +S000034231 CDS YNL255C 14 167790 167329 C 2011-02-03 1996-07-31 +S000005198 ORF Verified YNL254C RTC4 chromosome 14 14 169248 168043 C 2011-02-03 1996-07-31 Protein of unknown function; null mutation suppresses cdc13-1 temperature sensitivity; (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000034113 CDS YNL254C 14 169248 168043 C 2011-02-03 1996-07-31 +S000077373 ARS ARS1411 ARSXIV-170 chromosome 14 14 169675 169753 2014-11-18 2014-11-18|2004-10-18|2006-09-07 ARS activated in late S phase +S000178168 ARS_consensus_sequence ARS1411 14 169748 169732 C 2014-11-18 2014-11-18 +S000005197 ORF Verified YNL253W TEX1 chromosome 14 14 170018 171286 W 2011-02-03 1996-07-31 Protein involved in mRNA export; component of the transcription export (TREX) complex +S000033293 CDS YNL253W 14 170018 171286 W 2011-02-03 1996-07-31 +S000005196 ORF Verified YNL252C MRPL17 mitochondrial 54S ribosomal protein YmL17/YmL30|YmL17|YmL30|MRPL30 chromosome 14 L000001703|L000002266|L000002692 14 172286 171441 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000033203 CDS YNL252C 14 172286 171441 C 2011-02-03 1996-07-31 +S000005195 ORF Verified YNL251C NRD1 Nrd1 complex RNA-binding subunit chromosome 14 L000002862 14 174315 172588 C 2011-02-03 1996-07-31 RNA-binding subunit of Nrd1 complex; complex interacts with exosome to mediate 3'-end formation of some mRNAs, snRNAs, snoRNAs, and CUTs; interacts with CTD of RNA pol II large subunit Rpo21p at phosphorylated Ser5 to direct transcription termination of non-polyadenylated transcripts; H3K4 trimethylation of transcribed regions by Set1p enhances recruitment of Nrd1p to those sites; role in regulation of mitochondrial abundance and cell size +S000033151 CDS YNL251C 14 174315 172588 C 2011-02-03 1996-07-31 +S000005194 ORF Verified YNL250W RAD50 MRX complex DNA-binding subunit chromosome 14 L000001570 14 175410 179348 W -170 2011-02-03 1996-07-31 Subunit of MRX complex with Mre11p and Xrs2p; complex is involved in processing double-strand DNA breaks in vegetative cells, initiation of meiotic DSBs, telomere maintenance, and nonhomologous end joining; forms nuclear foci upon DNA replication stress +S000033124 CDS YNL250W 14 175410 179348 W 2011-02-03 1996-07-31 +S000005193 ORF Verified YNL249C MPA43 chromosome 14 L000003096 14 181022 179394 C 2011-02-03 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032322 CDS YNL249C 14 181022 179394 C 2011-02-03 1996-07-31 +S000005192 ORF Verified YNL248C RPA49 DNA-directed RNA polymerase I subunit RPA49|A49 chromosome 14 L000001673 14 182608 181361 C 2011-02-03 1996-07-31 RNA polymerase I subunit A49; essential for nucleolar assembly and for high polymerase loading rate; required for nucleolar localization of Rpa34p +S000032212 CDS YNL248C 14 182608 181361 C 2011-02-03 1996-07-31 +S000005191 ORF Verified YNL247W cysteine--tRNA ligase chromosome 14 14 182875 185178 W 2011-02-03 1996-07-31 Cysteinyl-tRNA synthetase; may interact with ribosomes, based on co-purification experiments; human gene CARS allows growth of the yeast haploid null mutant after sporulation of a heterozygous diploid +S000031279 CDS YNL247W 14 182875 185178 W 2011-02-03 1996-07-31 +S000005190 ORF Verified YNL246W VPS75 chromosome 14 14 185460 186349 W 2011-02-03 1996-07-31 NAP family histone chaperone; binds to histones and Rtt109p, stimulating histone acetyltransferase activity; possesses nucleosome assembly activity in vitro; proposed role in vacuolar protein sorting and in double-strand break repair; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia +S000031149 CDS YNL246W 14 185460 185491 W 2011-02-03 1996-07-31 +S000031150 CDS YNL246W 14 185587 186349 W 2011-02-03 1996-07-31 +S000031151 intron YNL246W 14 185492 185586 W 2011-02-03 1996-07-31 +S000005189 ORF Verified YNL245C CWC25 U2-type spliceosomal complex subunit CWC25 chromosome 14 14 186885 186346 C 2011-02-03 1996-07-31 Splicing factor required for the first step of pre-mRNA splicing; binding to the spliceosome requires Prp2p and Yju2p; heat-stable protein; has similarity to S. pombe Cwf25p +S000030978 CDS YNL245C 14 186885 186346 C 2011-02-03 1996-07-31 +S000005188 ORF Verified YNL244C SUI1 translation initiation factor eIF1|RFR1|MOF2 chromosome 14 L000002177 14 187496 187170 C -171 2011-02-03 1996-07-31 Translation initiation factor eIF1; component of a complex involved in recognition of the initiator codon; modulates translation accuracy at the initiation phase +S000029973 CDS YNL244C 14 187496 187170 C 2011-02-03 1996-07-31 +S000005187 ORF Verified YNL243W SLA2 MOP2|END4 chromosome 14 L000001913|L000002421 14 188051 190957 W 2011-02-03 1996-07-31|2011-02-03 Adaptor protein that links actin to clathrin and endocytosis; involved in membrane cytoskeleton assembly and cell polarization; present in the actin cortical patch of the emerging bud tip; dimer in vivo +S000029929 CDS YNL243W 14 188051 190957 W 2011-02-03 1996-07-31|2011-02-03 +S000005186 ORF Verified YNL242W ATG2 APG2|AUT8|SPO72 chromosome 14 L000004782 14 191324 196102 W 2011-02-03 1996-07-31 Peripheral membrane protein required for autophagic vesicle formation; also required for vesicle formation during pexophagy and the cytoplasm-to-vaucole targeting (Cvt) pathway; involved in Atg9p cycling between the phagophore assembly site and mitochondria; contains an APT1 domain that binds phosphatidylinositol-3-phosphate; essential for cell cycle progression from G2/M to G1 under nitrogen starvation; forms cytoplasmic foci upon DNA replication stress +S000037889 CDS YNL242W 14 191324 196102 W 2011-02-03 1996-07-31 +S000077374 ARS ARS1412 ARSXIV-196 chromosome 14 14 196134 196232 2014-11-18 2014-11-18|2004-10-18|2006-09-07 ARS activated in late S phase +S000005185 ORF Verified YNL241C ZWF1 glucose-6-phosphate dehydrogenase|POS10|MET19 chromosome 14 L000002572 14 197943 196426 C -153 2011-02-03 1996-07-31 Glucose-6-phosphate dehydrogenase (G6PD); catalyzes the first step of the pentose phosphate pathway; involved in adapting to oxidative stress; protein abundance increases in response to DNA replication stress; homolog of human G6PD which is deficient in patients with hemolytic anemia; human G6PD can complement yeast zwf1 null mutant +S000037074 CDS YNL241C 14 197943 196426 C 2011-02-03 1996-07-31 +S000005184 ORF Verified YNL240C NAR1 chromosome 14 14 199977 198502 C 2011-02-03 1996-07-31 Subunit of the cytosolic iron-sulfur (FeS) protein assembly machinery; required for maturation of cytosolic and nuclear FeS proteins and for normal resistance to oxidative stress; deficiency results in shortened lifespan and sensitivity to paraquat; homologous to human Narf +S000037001 CDS YNL240C 14 199977 198502 C 2011-02-03 1996-07-31 +S000005183 ORF Verified YNL239W LAP3 bleomycin hydrolase|YCP1|GAL6|BLH1 chromosome 14 L000002502|L000000929 14 200569 201933 W -152 2011-02-03 2003-01-07|1996-07-31 Cysteine aminopeptidase with homocysteine-thiolactonase activity; protects cells against homocysteine toxicity; has bleomycin hydrolase activity in vitro; transcription is regulated by galactose via Gal4p; orthologous to human BLMH +S000036318 CDS YNL239W 14 200569 201933 W 2011-02-03 2003-01-07|1996-07-31 +S000005182 ORF Verified YNL238W KEX2 kexin KEX2|yscF|SRB1|VMA45|QDS1 chromosome 14 L000000896 14 202428 204872 W -147 2011-02-03 1996-07-31 Kexin, a subtilisin-like protease (proprotein convertase); a calcium-dependent serine protease involved in the activation of proproteins of the secretory pathway +S000036210 CDS YNL238W 14 202428 204872 W 2011-02-03 1996-07-31 +S000005181 ORF Verified YNL237W YTP1 chromosome 14 L000003036 14 205188 206567 W 2011-02-03 1996-07-31 Probable type-III integral membrane protein of unknown function; has regions of similarity to mitochondrial electron transport proteins +S000036063 CDS YNL237W 14 205188 206567 W 2011-02-03 1996-07-31 +S000005180 ORF Verified YNL236W SIN4 SSX3|MED16|RYE1|TSF3|SSN4|SSF5|SDI3|GAL22|BEL2 chromosome 14 L000001888|S000029516|L000002099 14 206930 209854 W -145 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; contributes to both postive and negative transcriptional regulation; dispensible for basal transcription +S000035179 CDS YNL236W 14 206930 209854 W 2011-02-03 1996-07-31 +S000005179 ORF Dubious YNL235C chromosome 14 14 209979 209548 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SIN4/YNL236W, a subunit of the mediator complex +S000034886 CDS YNL235C 14 209979 209548 C 2011-02-03 1996-07-31 +S000005178 ORF Verified YNL234W chromosome 14 14 210233 211513 W 2011-02-03 1996-07-31 Protein of unknown function with similarity to globins; has a functional heme-binding domain; mutant has aneuploidy tolerance; transcription induced by stress conditions; may be involved in glucose signaling or metabolism; regulated by Rgt1 +S000034841 CDS YNL234W 14 210233 211513 W 2011-02-03 1996-07-31 +S000005177 ORF Verified YNL233W BNI4 chromosome 14 L000003517 14 211922 214600 W 2011-02-03 1996-07-31 Targeting subunit for Glc7p protein phosphatase; localized to the bud neck, required for localization of chitin synthase III to the bud neck via interaction with the chitin synthase III regulatory subunit Skt5p; phosphorylation by Slt2p and Kss1p involved in regulating Bni4p in septum assembly +S000033930 CDS YNL233W 14 211922 214600 W 2011-02-03 1996-07-31 +S000005176 ORF Verified YNL232W CSL4 exosome non-catalytic core subunit CSL4|SKI4 chromosome 14 L000001905|L000004677 14 214923 215801 W 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; predicted to contain an S1 RNA binding domain; human homolog EXOSC1 partially complements yeast csl4 null mutant, and can complement inviability of strain in which expression of CSL4 is repressed +S000033848 CDS YNL232W 14 214923 215801 W 2011-02-03 1996-07-31 +S000005175 ORF Verified YNL231C PDR16 phosphatidylinositol transporter|SFH3 chromosome 14 L000004779 14 217042 215987 C 2011-02-03 1996-07-31 Phosphatidylinositol transfer protein (PITP); controlled by the multiple drug resistance regulator Pdr1p; localizes to lipid particles and microsomes; controls levels of various lipids, may regulate lipid synthesis; homologous to Pdr17p; protein abundance increases in response to DNA replication stress +S000033675 CDS YNL231C 14 217042 215987 C 2011-02-03 1996-07-31 +S000005174 ORF Verified YNL230C ELA1 elongin A chromosome 14 L000004956 14 218662 217523 C 2011-02-03 1996-07-31 Elongin A; F-box protein that forms a heterodimer with Elc1p and is required for ubiquitin-dependent degradation of the RNA Polymerase II subunit Rpo21p; subunit of the Elongin-Cullin-Socs (ECS) ligase complex +S000033008 CDS YNL230C 14 218662 217523 C 2011-02-03 1996-07-31 +S000005173 ORF Verified YNL229C URE2 [URE3] chromosome 14 L000002439 14 220201 219137 C -142 2011-02-03 1996-07-31 Nitrogen catabolite repression transcriptional regulator; inhibits GLN3 transcription in good nitrogen source; role in sequestering Gln3p and Gat1p to the cytoplasm; has glutathione peroxidase activity and can mutate to acquire GST activity; self-assembly under limited nitrogen conditions creates [URE3] prion and releases catabolite repression +S000034177 CDS YNL229C 14 220201 219137 C 2011-02-03 1996-07-31 +S000005172 ORF Dubious YNL228W chromosome 14 14 220645 221421 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF YNL227C/JJJ1 +S000034107 CDS YNL228W 14 220645 221421 W 2011-02-03 1996-07-31 +S000005170 ORF Dubious YNL226W chromosome 14 14 222239 222649 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene JJJ1/YNL227C +S000032023 CDS YNL226W 14 222239 222649 W 2011-02-03 1996-07-31 +S000005171 ORF Verified YNL227C JJJ1 chromosome 14 14 222431 220659 C 2011-02-03 1996-07-31 Co-chaperone that stimulates the ATPase activity of Ssa1p; required for a late step of ribosome biogenesis; associated with the cytosolic large ribosomal subunit; contains a J-domain; mutation causes defects in fluid-phase endocytosis +S000032103 CDS YNL227C 14 222431 220659 C 2011-02-03 1996-07-31 +S000005169 ORF Verified YNL225C CNM67 chromosome 14 L000004012 14 224469 222724 C 2011-02-03 1996-07-31 Component of the spindle pole body outer plaque; required for spindle orientation and mitotic nuclear migration; CNM67 has a paralog, ADY3, that arose from the whole genome duplication +S000031798 CDS YNL225C 14 224469 222724 C 2011-02-03 1996-07-31 +S000005168 ORF Verified YNL224C SQS1 PFA1 chromosome 14 14 227099 224796 C 2011-02-03 1996-07-31 Protein that stimulates the ATPase and helicase activities of Prp43p; acts with Prp43p to stimulate 18s rRNA maturation by Nob1p; overexpression antagonizes the suppression of splicing defects by spp382 mutants; component of pre-ribosomal particles; relocalizes from nucleus to nucleolus upon DNA replication stress +S000030829 CDS YNL224C 14 227099 224796 C 2011-02-03 1996-07-31 +S000005167 ORF Verified YNL223W ATG4 cysteine protease ATG4|AUT2|APG4 chromosome 14 L000004606|L000004784 14 227370 228854 W 2011-02-03 2003-09-22|1996-07-31 Conserved cysteine protease required for autophagy; cleaves Atg8p to a form required for autophagosome and Cvt vesicle generation +S000030783 CDS YNL223W 14 227370 228854 W 2011-02-03 2003-09-22|1996-07-31 +S000005166 ORF Verified YNL222W SSU72 RNA polymerase II subunit A C-terminal domain phosphatase chromosome 14 L000003154 14 229094 229714 W 2011-02-03 1996-07-31 Phosphatase and transcription/RNA-processing factor; associates with TFIIB and cleavage/polyadenylation factor Pta1p; exhibits phosphatase activity on serine-5 and serine-7 of the RNA polymerase II C-terminal domain; affects start site selection and transcriptional read through in vivo +S000030662 CDS YNL222W 14 229094 229714 W 2011-02-03 1996-07-31 +S000007295 snRNA_gene snR19 SNR19 U1 chromosome 14 L000001967 14 230672 230105 C 2011-02-03 2004-04-02 U1 spliceosomal RNA (U1 snRNA); snRNA U1 homolog +S000036596 noncoding_exon snR19 14 230672 230105 C 2011-02-03 2004-04-02 +S000005165 ORF Verified YNL221C POP1 ribonuclease P/MRP protein subunit POP1 chromosome 14 L000002587 14 233695 231068 C 2011-02-03 1996-07-31 Subunit of RNase MRP, nuclear RNase P and telomerase complexes; RNase MRP cleaves pre-rRNA, nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs, while telomerase replenishes telomeric DNA; binds to the RPR1 RNA subunit in RNase P +S000037760 CDS YNL221C 14 233695 231068 C 2011-02-03 1996-07-31 +S000005164 ORF Verified YNL220W ADE12 adenylosuccinate synthase|BRA9 chromosome 14 L000000039 14 234413 235714 W -151 2011-02-03 1996-07-31 Adenylosuccinate synthase; catalyzes the first step in synthesis of adenosine monophosphate from inosine 5'monophosphate during purine nucleotide biosynthesis; exhibits binding to single-stranded autonomously replicating (ARS) core sequence +S000037738 CDS YNL220W 14 234413 235714 W 2011-02-03 1996-07-31 +S000005163 ORF Verified YNL219C ALG9 dolichyl-P-Man:Man(6)GlcNAc(2)-PP-dolichol alpha-1,2-mannosyltransferase chromosome 14 L000003394 14 237663 235996 C 2011-02-03 1996-07-31 Mannosyltransferase, involved in N-linked glycosylation; catalyzes the transfer of both the seventh mannose residue on B-arm and ninth mannose residue on the C-arm from Dol-P-Man to lipid-linked oligosaccharides; human homolog ALG9 can complement yeast null mutant; mutation of human homolog causes type 1 congenital disorders of glycosylation +S000029975 CDS YNL219C 14 237663 235996 C 2011-02-03 1996-07-31 +S000005162 ORF Verified YNL218W MGS1 ssDNA-dependent ATPase MGS1 chromosome 14 14 238238 240001 W 2011-02-03 1996-07-31 Protein with DNA-dependent ATPase and ssDNA annealing activities; involved in maintenance of genome; interacts functionally with DNA polymerase delta; homolog of human Werner helicase interacting protein (WHIP); forms nuclear foci upon DNA replication stress +S000029915 CDS YNL218W 14 238238 240001 W 2011-02-03 1996-07-31 +S000005161 ORF Uncharacterized YNL217W putative serine/threonine-protein phosphatase chromosome 14 14 240331 241311 W 2011-02-03 1996-07-31 Putative protein of unknown function; weak sequence similarity to bis (5'-nucleotidyl)-tetraphosphatases; (GFP)-fusion protein localizes to the vacuole; null mutant is highly sensitive to azaserine and resistant to sodium-O-vandate +S000037905 CDS YNL217W 14 240331 241311 W 2011-02-03 1996-07-31 +S000005160 ORF Verified YNL216W RAP1 DNA-binding transcription factor RAP1|TUF1|TBA1|GRF1 chromosome 14 L000001581 14 241689 244172 W -148 2011-02-03 1996-07-31 Essential DNA-binding transcription regulator that binds many loci; involved in transcription activation, repression, chromatin silencing, telomere length maintenance; relocalizes to cytosol under hypoxia; conserved protein with N-terminal BRCT domain, central region with homology to Myb DNA binding domain, and C-terminal Rap1-specific protein-interaction domain (RCT domain); recruits Sir complex to telomeric DNA; present in quiescent cell telomere hyperclusters +S000037812 CDS YNL216W 14 241689 244172 W 2011-02-03 1996-07-31 +S000005159 ORF Verified YNL215W IES2 chromosome 14 14 244468 245430 W 2011-02-03 1996-07-31 Protein that associates with the INO80 chromatin remodeling complex; associates with the INO80 complex under low-salt conditions; essential for growth under anaerobic conditions; protein abundance increases in response to DNA replication stress +S000035947 CDS YNL215W 14 244468 245430 W 2011-02-03 1996-07-31 +S000005158 ORF Verified YNL214W PEX17 PAS9 chromosome 14 L000003963 14 245617 246216 W 2011-02-03 1996-07-31 Membrane peroxin of the peroxisomal importomer complex; complex facilitates the import of peroxisomal matrix proteins; required for peroxisome biogenesis +S000035811 CDS YNL214W 14 245617 246216 W 2011-02-03 1996-07-31 +S000005157 ORF Verified YNL213C RRG9 chromosome 14 14 247104 246460 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant lacks mitochondrial DNA and cannot grow on glycerol; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000034770 CDS YNL213C 14 247104 246460 C 2011-02-03 1996-07-31 +S000005156 ORF Verified YNL212W VID27 chromosome 14 14 247461 249809 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; possibly involved in vacuolar protein degradation; not essential for proteasome-dependent degradation of fructose-1,6-bisphosphatase (FBPase); null mutants exhibit normal growth; contains two PH-like domains +S000034713 CDS YNL212W 14 247461 249809 W 2011-02-03 1996-07-31 +S000005155 ORF Uncharacterized YNL211C MRX7 chromosome 14 14 250315 250055 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YNL211C is not an essential gene +S000034553 CDS YNL211C 14 250315 250055 C 2011-02-03 1996-07-31 +S000077375 ARS ARS1413 chromosome 14 14 250315 250931 2011-02-03 2004-10-18 Strong origin of replication activated in late S phase +S000005154 ORF Verified YNL210W MER1 chromosome 14 L000001074 14 250931 251743 W -138 2011-02-03 1996-07-31 mRNA-binding protein required for meiosis-specific mRNA splicing; required for chromosome pairing and meiotic recombination; Mer1p regulon embraces four essential meiotic pre-mRNAs: REC107, HFM1, AMA1 and SPO22 +S000034504 CDS YNL210W 14 250931 251743 W 2011-02-03 1996-07-31 +S000005153 ORF Verified YNL209W SSB2 Hsp70 family ATPase SSB2|YG103 chromosome 14 L000002715 14 252059 253900 W 2011-02-03 1996-07-31 Cytoplasmic ATPase that is a ribosome-associated molecular chaperone; functions with J-protein partner Zuo1p; may be involved in the folding of newly-synthesized polypeptide chains; member of the HSP70 family; SSB2 has a paralog, SSB1, that arose from the whole genome duplication +S000035043 CDS YNL209W 14 252059 253900 W 2011-02-03 1996-07-31 +S000005152 ORF Verified YNL208W chromosome 14 14 254418 255017 W 2011-02-03 2004-02-19|1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; authentic, non-tagged protein is detected in purified mitochondria in high-throughput studies; potential orthologs found in other fungi +S000034895 CDS YNL208W 14 254418 255017 W 2011-02-03 2004-02-19|1996-07-31 +S000005151 ORF Verified YNL207W RIO2 protein kinase RIO2 chromosome 14 14 255353 256630 W 2011-02-03 1996-07-31 Essential serine kinase involved in the processing of 20S pre-rRNA; involved in the processing of the 20S pre-rRNA into mature 18S rRNA; has similarity to Rio1p +S000034789 CDS YNL207W 14 255353 256630 W 2011-02-03 1996-07-31 +S000005150 ORF Verified YNL206C RTT106 chromosome 14 14 258155 256788 C 2011-02-03 1996-07-31 Histone chaperone; involved in regulation of chromatin structure in both transcribed and silenced chromosomal regions; affects transcriptional elongation; has a role in regulation of Ty1 transposition; interacts physically and functionally with Chromatin Assembly Factor-1 (CAF-1) +S000033853 CDS YNL206C 14 258155 256788 C 2011-02-03 1996-07-31 +S000005149 ORF Dubious YNL205C chromosome 14 14 258577 258155 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033703 CDS YNL205C 14 258577 258155 C 2011-02-03 1996-07-31 +S000005148 ORF Verified YNL204C SPS18 SPX18 chromosome 14 L000002042 14 259277 258375 C 2011-02-03 1996-07-31 Protein of unknown function, contains a putative zinc-binding domain; expressed during sporulation; SPS18 has a paralog, GCS1, that arose from the whole genome duplication +S000030383 CDS YNL204C 14 259277 258375 C 2011-02-03 1996-07-31 +S000005146 ORF Verified YNL202W SPS19 SPX19 chromosome 14 L000002043 14 259578 260456 W 2011-02-03 1996-07-31|2006-05-10 Peroxisomal 2,4-dienoyl-CoA reductase; auxiliary enzyme of fatty acid beta-oxidation; homodimeric enzyme required for growth and sporulation on petroselineate medium; expression induced during late sporulation and in the presence of oleate +S000030188 CDS YNL202W 14 259578 260456 W 2011-02-03 1996-07-31|2006-05-10 +S000005147 ORF Dubious YNL203C chromosome 14 14 260050 259439 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030248 CDS YNL203C 14 260050 259439 C 2011-02-03 1996-07-31 +S000005145 ORF Verified YNL201C PSY2 chromosome 14 14 263203 260627 C 2011-02-03 1996-07-31 Subunit of protein phosphatase PP4 complex; Pph3p and Psy2p form the active complex, Psy4p may provide additional substrate specificity; regulates recovery from the DNA damage checkpoint, the gene conversion- and single-strand annealing-mediated pathways of meiotic double-strand break repair and efficient Non-Homologous End-Joining (NHEJ) pathway; Pph3p and Psy2p localize to foci on meiotic chromosomes; putative homolog of mammalian R3 +S000030016 CDS YNL201C 14 263203 260627 C 2011-02-03 1996-07-31 +S000005144 ORF Verified YNL200C NNR1 NADHX epimerase chromosome 14 14 264453 263713 C 2011-02-03 1996-07-31 NADHX epimerase; catalyzes isomerization of (R)- and (S)-NADHX; homologous to AIBP in mammals and the N- terminal domain of YjeF in E.coli; enzyme is widespread in eukaryotes, prokaryotes and archaea; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000037373 CDS YNL200C 14 264453 263713 C 2011-02-03 1996-07-31 +S000005143 ORF Verified YNL199C GCR2 chromosome 14 L000000691 14 266530 264926 C 2011-02-03 1996-07-31 Transcriptional activator of genes involved in glycolysis; interacts and functions with the DNA-binding protein Gcr1p +S000032854 CDS YNL199C 14 266530 264926 C 2011-02-03 1996-07-31 +S000005142 ORF Dubious YNL198C chromosome 14 14 266816 266514 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032762 CDS YNL198C 14 266816 266514 C 2011-02-03 1996-07-31 +S000005141 ORF Verified YNL197C WHI3 mRNA-binding protein WHI3 chromosome 14 L000002486 14 269593 267608 C 2011-02-03 1996-07-31 RNA binding protein that sequesters CLN3 mRNA in cytoplasmic foci; regulates genes involved in the cell cycle, sister chromatid cohesion, and stress response; acts as a cytoplasmic retention factor for Cdc28p and associated cyclins; regulates cell fate and dose-dependently regulates the critical cell size required for passage through Start; Tpk1p (PKA) mediated phosphorylation (S568) inhibits Whi3p function, decreasing its interaction with CLN3 mRNA; regulates ploidy +S000032683 CDS YNL197C 14 269593 267608 C 2011-02-03 1996-07-31 +S000005140 ORF Verified YNL196C SLZ1 chromosome 14 L000004192 14 271171 270275 C 2011-02-03 1996-07-31 Sporulation-specific protein with a leucine zipper motif; subunit of the MIS complex which controls mRNA methylation during during the induction of sporulation +S000032589 CDS YNL196C 14 271171 270275 C 2011-02-03 1996-07-31 +S000005139 ORF Uncharacterized YNL195C chromosome 14 14 272308 271523 C 2011-02-03 2004-02-18|1996-07-31 Protein of unknown function; shares a promoter with YNL194C; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YNL195C has a paralog, HBT1, that arose from the whole genome duplication +S000031608 CDS YNL195C 14 272308 271523 C 2011-02-03 2004-02-18|1996-07-31 +S000005138 ORF Verified YNL194C chromosome 14 14 273615 272710 C 2011-02-03 1996-07-31 Integral membrane protein; required for sporulation and plasma membrane sphingolipid content; similar to SUR7; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; GFP-fusion protein is more abundant at MCCs (membrane compartment occupied by Can1) in the presence of glycerol and oleate; YNL194C has a paralog, FMP45, that arose from the whole genome duplication +S000031471 CDS YNL194C 14 273615 272710 C 2011-02-03 1996-07-31 +S000005137 ORF Uncharacterized YNL193W chromosome 14 14 274368 276044 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; exhibits a two-hybrid interaction with Yhr151cp in a large-scale analysis +S000031402 CDS YNL193W 14 274368 276044 W 2011-02-03 1996-07-31|2011-02-03 +S000005136 ORF Verified YNL192W CHS1 chitin synthase CHS1|USA4 chromosome 14 L000000329 14 276502 279897 W 2011-02-03 1996-07-31|2011-02-03 Chitin synthase I; requires activation from zymogenic form in order to catalyze the transfer of N-acetylglucosamine (GlcNAc) to chitin; required for repairing the chitin septum during cytokinesis; transcription activated by mating factor +S000030484 CDS YNL192W 14 276502 279897 W 2011-02-03 1996-07-31|2011-02-03 +S000077376 ARS ARS1414 ARSXIV-280 chromosome 14 14 279982 280071 2014-11-18 2014-11-18|2004-10-18|2006-09-07 ARS activated in mid-S phase +S000178169 ARS_consensus_sequence ARS1414 14 280063 280047 C 2014-11-18 2014-11-18 +S000005135 ORF Verified YNL191W DUG3 glutamine amidotransferase subunit DUG3 chromosome 14 14 280432 281505 W 2011-02-03 1996-07-31 Component of glutamine amidotransferase (GATase II); forms a complex with Dug2p to degrade glutathione (GSH) and other peptides containing a gamma-glu-X bond in an alternative pathway to GSH degradation by gamma-glutamyl transpeptidase (Ecm38p) +S000030357 CDS YNL191W 14 280432 281505 W 2011-02-03 1996-07-31 +S000005134 ORF Verified YNL190W chromosome 14 14 282395 283009 W 2011-02-03 1996-07-31 Hydrophilin essential in desiccation-rehydration process; cell wall protein; contains a putative GPI-attachment site +S000030164 CDS YNL190W 14 282395 283009 W 2011-02-03 1996-07-31 +S000005133 ORF Verified YNL189W SRP1 karyopherin alpha|SCM1|KAP60 chromosome 14 L000002755|L000002780 14 284260 285888 W 2011-02-03 1996-07-31 Karyopherin alpha homolog; forms a dimer with karyopherin beta Kap95p to mediate import of nuclear proteins, binds the nuclear localization signal of the substrate during import; involved in cotranslational protein degradation; binds ribosome-bound nascent polypeptides; Srp1p and Sts1p couple proteasomes to nascent polypeptides emerging from the ribosome for cotranslational degradation +S000036720 CDS YNL189W 14 284260 285888 W 2011-02-03 1996-07-31 +S000005132 ORF Verified YNL188W KAR1 chromosome 14 L000000886 14 286308 287609 W -208 2011-02-03 1996-07-31 Protein involved in karyogamy and spindle pole body duplication; involved in karyogamy during mating; involved in spindle pole body duplication during mitosis; localizes to the half-bridge of the spindle pole body; interacts with Spc72p during karyogamy; also interacts with Cdc31p; essential gene +S000036621 CDS YNL188W 14 286308 287609 W 2011-02-03 1996-07-31 +S000005131 ORF Verified YNL187W SWT21 chromosome 14 14 287994 289067 W 2011-02-03 1996-07-31 Protein involved in mRNA splicing; contains a consensus nuclear export signal (NES) sequence similar to the consensus sequence recognized by Crm1p; interacts genetically with Prp40p and Tgs1p; contains WD40 repeats +S000036547 CDS YNL187W 14 287994 289067 W 2011-02-03 1996-07-31 +S000005130 ORF Verified YNL186W UBP10 ubiquitin-specific protease UBP10|DOT4 chromosome 14 L000004391|L000004588 14 289498 291876 W 2011-02-03 1996-07-31|2011-02-03 Ubiquitin-specific protease, deubiquitinates Ub-protein moieties; interacts with proteins that function in rRNA production and ribosome biogenesis via its intrinsically disordered regions; stabilizes Rpa190p by deubiquitination; controls PCNA deubiquitylation; may regulate silencing by acting on Sir4p; involved in posttranscriptionally regulating Gap1p, possibly other transporters; localized to the nucleolus; null mutant phenotypes are functionally complemented by human USP36 +S000035619 CDS YNL186W 14 289498 291876 W 2011-02-03 1996-07-31|2011-02-03 +S000005129 ORF Verified YNL185C MRPL19 mitochondrial 54S ribosomal protein YmL19|YmL19 chromosome 14 14 292669 292193 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000035486 CDS YNL185C 14 292669 292193 C 2011-02-03 1996-07-31 +S000005128 ORF Uncharacterized YNL184C chromosome 14 14 292883 292557 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels +S000035350 CDS YNL184C 14 292883 292557 C 2011-02-03 1996-07-31 +S000005127 ORF Verified YNL183C NPR1 serine/threonine protein kinase NPR1 chromosome 14 L000001273 14 295509 293137 C 2011-02-03 1996-07-31 Protein kinase; stabilizes several plasma membrane amino acid transporters by antagonizing their ubiquitin-mediated degradation; phosphorylates Aly2p; negatively regulates Ldb19p-mediated endocytosis through phosphorylation of Ldb19p, which prevents its association with the plasma membrane; Npr1p activity is negatively regulated via phosphorylation by the TOR complex; NPR1 has a paralog, PRR2, that arose from the whole genome duplication +S000034359 CDS YNL183C 14 295509 293137 C 2011-02-03 1996-07-31 +S000005126 ORF Verified YNL182C IPI3 chromatin-binding/pre-rRNA-processing protein IPI3 chromosome 14 14 297627 295960 C 2011-02-03 1996-07-31 Component of the Rix1 complex and pre-replicative complexes (pre-RCs); required for processing of ITS2 sequences from 35S pre-rRNA; component of the pre-60S ribosomal particle with the dynein-related AAA-type ATPase Mdn1p; required for pre-RC formation and maintenance during DNA replication licensing; highly conserved protein which contains several WD40 motifs; IPI3 is an essential gene; other members include Rix1p, Ipi1p, and Ipi3p +S000034229 CDS YNL182C 14 297627 295960 C 2011-02-03 1996-07-31 +S000005125 ORF Uncharacterized YNL181W PBR1 putative oxidoreductase chromosome 14 14 298335 299558 W 2011-02-03 1996-07-31|2011-02-03 Putative oxidoreductase; required for cell viability +S000034164 CDS YNL181W 14 298335 299558 W 2011-02-03 1996-07-31|2011-02-03 +S000005124 ORF Verified YNL180C RHO5 Rho family GTPase RHO5|YNS0 chromosome 14 L000004798 14 300649 299654 C 2011-02-03 1998-11-10|1996-07-31 Non-essential small GTPase of the Rho/Rac family of Ras-like proteins; RAC1 ortholog; regulated by phosphorylation and ubiquitination; likely involved in protein kinase C (Pkc1p)-dependent signal transduction pathway that controls cell integrity +S000033264 CDS YNL180C 14 300649 299654 C 2011-02-03 1998-11-10|1996-07-31 +S000005123 ORF Dubious YNL179C SRF6 chromosome 14 14 301103 300666 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion in cyr1 mutant results in loss of stress resistance +S000034571 CDS YNL179C 14 301103 300666 C 2011-02-03 1996-07-31 +S000005122 ORF Verified YNL178W RPS3 uS3|ribosomal 40S subunit protein S3|rp13|YS3|S3|SUF14 chromosome 14 L000002161|L000001749 14 302680 303402 W -125 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; has apurinic/apyrimidinic (AP) endonuclease activity; essential for viability; nascent Rps3p is bound by specific chaperone Yar1p during translation; homologous to mammalian ribosomal protein S3 and bacterial S3 +S000034489 CDS YNL178W 14 302680 303402 W 2011-02-03 1996-07-31 +S000005121 ORF Verified YNL177C MRPL22 mitochondrial 54S ribosomal protein YmL22|YmL22 chromosome 14 14 304615 303686 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial ribosomal protein of the large subunit +S000032401 CDS YNL177C 14 304615 303686 C 2011-02-03 1996-07-31|2011-02-03 +S000005120 ORF Verified YNL176C TDA7 chromosome 14 14 306980 305070 C 2011-02-03 1996-07-31|2011-02-03 Cell cycle-regulated gene of unknown function; promoter bound by Fkh2p; null mutant is sensitive to expression of the top1-T722A allele; TDA7 has a paralog, YDL211C, that arose from the whole genome duplication +S000032321 CDS YNL176C 14 306980 305070 C 2011-02-03 1996-07-31|2011-02-03 +S000005118 ORF Dubious YNL174W chromosome 14 14 308074 308646 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene NOP13/YNL175C +S000031277 CDS YNL174W 14 308074 308646 W 2011-02-03 1996-07-31 +S000005119 ORF Verified YNL175C NOP13 chromosome 14 14 308612 307401 C 2011-02-03 1996-07-31|2011-02-03 Nucleolar protein found in preribosomal complexes; contains an RNA recognition motif (RRM); relative distribution to the nucleolus increases upon DNA replication stress +S000032207 CDS YNL175C 14 308612 307401 C 2011-02-03 1996-07-31|2011-02-03 +S000005117 ORF Verified YNL173C MDG1 chromosome 14 L000001044 14 310057 308957 C 2011-02-03 1996-07-31 Plasma membrane protein; involved in G-protein mediated pheromone signaling pathway; overproduction suppresses bem1 mutations; MDG1 has a paralog, CRP1, that arose from the whole genome duplication +S000031079 CDS YNL173C 14 310057 308957 C 2011-02-03 1996-07-31 +S000005116 ORF Verified YNL172W APC1 anaphase promoting complex subunit 1 chromosome 14 L000004053 14 310636 315882 W 2011-02-03 1996-07-31|2011-02-03 Largest subunit of the Anaphase-Promoting Complex/Cyclosome; APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the platform domain of the APC/C, based on structural analysis; localizes to nuclear foci that become diffuse upon DNA replication stress +S000031033 CDS YNL172W 14 310636 315882 W 2011-02-03 1996-07-31|2011-02-03 +S000005114 ORF Dubious YNL170W chromosome 14 14 315978 316373 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029916 CDS YNL170W 14 315978 316373 W 2011-02-03 1996-07-31 +S000005115 ORF Dubious YNL171C chromosome 14 14 315997 315629 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029970 CDS YNL171C 14 315997 315629 C 2011-02-03 1996-07-31 +S000005113 ORF Verified YNL169C PSD1 phosphatidylserine decarboxylase 1 chromosome 14 L000001518 14 317671 316169 C 2011-02-03 1996-07-31 Phosphatidylserine decarboxylase of the mitochondrial inner membrane; converts phosphatidylserine to phosphatidylethanolamine; regulates mitochondrial fusion and morphology by affecting lipid mixing in the mitochondrial membrane and by influencing the ratio of long to short forms of Mgm1p; partly exposed to the mitochondrial intermembrane space; autocatalytically processed +S000030171 CDS YNL169C 14 317671 316169 C 2011-02-03 1996-07-31 +S000005112 ORF Uncharacterized YNL168C FMP41 chromosome 14 14 318809 318030 C 2011-02-03 1996-07-31 Putative protein of unknown function; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000036435 CDS YNL168C 14 318809 318030 C 2011-02-03 1996-07-31 +S000005111 ORF Verified YNL167C SKO1 ACR1 chromosome 14 L000001909 14 321359 319416 C -110 2011-02-03 1996-07-31 Basic leucine zipper transcription factor of the ATF/CREB family; forms a complex with Tup1p and Cyc8p to both activate and repress transcription; cytosolic and nuclear protein involved in osmotic and oxidative stress responses +S000036358 CDS YNL167C 14 321359 319416 C 2011-02-03 1996-07-31 +S000118385 ARS ARS1415 ARSXIV-322 chromosome 14 14 321921 322213 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178170 ARS_consensus_sequence ARS1415 14 322000 322016 W 2014-11-18 2014-11-18 +S000005110 ORF Verified YNL166C BNI5 chromosome 14 14 323565 322219 C 2011-02-03 1996-07-31 Linker protein responsible for recruitment of myosin to the bud neck; interacts with the C-terminal extensions of septins Cdc11p and Shs1p and binds Myo1p to promote cytokinesis +S000036259 CDS YNL166C 14 323565 322219 C 2011-02-03 1996-07-31 +S000005109 ORF Uncharacterized YNL165W chromosome 14 14 323832 325052 W 2011-02-03 1996-07-31 Putative protein of unknown function; YNL165W is not an essential gene +S000036209 CDS YNL165W 14 323832 325052 W 2011-02-03 1996-07-31 +S000130142 ARS ARS1416 chromosome 14 14 325054 325267 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000005108 ORF Verified YNL164C IBD2 chromosome 14 14 326320 325265 C 2011-02-03 1996-07-31 Component of the BUB2-dependent spindle checkpoint pathway; interacts with Bfa1p and functions upstream of Bub2p and Bfa1p +S000035227 CDS YNL164C 14 326320 325265 C 2011-02-03 1996-07-31 +S000005107 ORF Verified YNL163C RIA1 GTPase RIA1|EFL1 chromosome 14 14 330073 326741 C 2011-02-03 1996-07-31 Cytoplasmic GTPase/eEF2-like factor involved in ribosomal biogenesis; with Sdo1p, a guanine nucleotide exchange factor (GEF), promotes release of Tif6p from 60S ribosomal subunits in the cytoplasm so that they can assemble with 40S subunits to generate mature ribosomes; required for quality control check of newly made large ribosomal subunits before they are released into the pool of translating ribosomes +S000035069 CDS YNL163C 14 330073 326741 C 2011-02-03 1996-07-31 +S000007624 ORF Uncharacterized YNL162W-A chromosome 14 14 330329 330547 W 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology +S000037222 CDS YNL162W-A 14 330329 330547 W 2011-02-03 2001-02-26 +S000005106 ORF Verified YNL162W RPL42A eL42|ribosomal 60S subunit protein L42A|L44e|YL27|L42A|L41A chromosome 14 L000001731 14 331322 332154 W 2011-02-03 1999-11-17|1996-07-31 Ribosomal 60S subunit protein L42A; homologous to mammalian ribosomal protein L36A, no bacterial homolog; RPL42A has a paralog, RPL42B, that arose from the whole genome duplication +S000034972 CDS YNL162W 14 331322 331325 W 2011-02-03 1996-07-31 +S000034973 CDS YNL162W 14 331838 332154 W 2011-02-03 1999-11-17|1996-07-31 +S000034974 intron YNL162W 14 331326 331837 W 2011-02-03 1999-11-17|1996-07-31 +S000005105 ORF Verified YNL161W CBK1 serine/threonine protein kinase CBK1 chromosome 14 L000004609 14 332597 334867 W 2011-02-03 1996-07-31 Serine/threonine protein kinase of the the RAM signaling network; Ndr/LATS family member; binds regulatory subunit Mob2p; involved in regulation of cellular morphogenesis, polarized growth, and septum destruction; phosphorylation by Cbk1p regulates localization and activity of Ace2p transcription factor and Ssd1p translational repressor; Cbk1p activity is regulated by both phosphorylation and specific localization; relocalizes to cytoplasm upon DNA replication stress +S000034836 CDS YNL161W 14 332597 334867 W 2011-02-03 1996-07-31 +S000005104 ORF Verified YNL160W YGP1 chromosome 14 L000002509 14 336545 337609 W 2011-02-03 1996-07-31 Cell wall-related secretory glycoprotein; induced by nutrient deprivation-associated growth arrest and upon entry into stationary phase; may be involved in adaptation prior to stationary phase entry; YGP1 has a paralog, SPS100, that arose from the whole genome duplication +S000033927 CDS YNL160W 14 336545 337609 W 2011-02-03 1996-07-31 +S000005103 ORF Verified YNL159C ASI2 chromosome 14 14 339347 338478 C 2011-02-03 1996-07-31 Subunit of the inner nuclear membrane Asi ubiquitin ligase complex; the Asi complex targets both misfolded proteins of the inner nuclear membrane-associated degradation (INMAD) pathway and inner for ubiquitin-mediated degradation; acts with Asi1p and Asi3p to ensure the fidelity of SPS-sensor signaling by targeting latent unprocessed forms of Stp1p and Stp2p, maintaining the repressed state of gene expression in the absence of inducing amino acids +S000035302 CDS YNL159C 14 339347 338478 C 2011-02-03 1996-07-31 +S000005102 ORF Verified YNL158W PGA1 chromosome 14 14 339612 340208 W 2011-02-03 1996-07-31 Essential component of GPI-mannosyltransferase II; complex is responsible for second mannose addition to GPI precursors as a partner of Gpi18p; required for maturation of Gas1p and Pho8p; has synthetic genetic interactions with secretory pathway genes +S000034371 CDS YNL158W 14 339612 340208 W 2011-02-03 1996-07-31 +S000005101 ORF Verified YNL157W IGO1 phosphatase regulator chromosome 14 14 340352 340858 W 2011-02-03 1996-07-31 Protein required for initiation of G0 program; prevents degradation of nutrient-regulated mRNAs via the 5'-3' mRNA decay pathway; phosphorylated by Rim15p; GFP protein localizes to the cytoplasm and nucleus; IGO1 has a paralog, IGO2, that arose from the whole genome duplication +S000034306 CDS YNL157W 14 340352 340858 W 2011-02-03 1996-07-31 +S000005100 ORF Verified YNL156C NSG2 chromosome 14 14 341968 341069 C 2011-02-03 1996-07-31 Protein involved in regulation of sterol biosynthesis; specifically stabilizes Hmg2p, one of two HMG-CoA isoenzymes that catalyze the rate-limiting step in sterol biosynthesis; homolog of mammalian INSIG proteins; NSG2 has a paralog, NSG1, that arose from the whole genome duplication +S000034171 CDS YNL156C 14 341968 341069 C 2011-02-03 1996-07-31 +S000005099 ORF Verified YNL155W CUZ1 chromosome 14 14 342516 343340 W 2011-02-03 1996-07-31 Protein with a role in the ubiquitin-proteasome pathway; interacts with ubiquitinated protein, Cdc48p and the proteasomal regulatory particle; may protect cells from trivalent metalloid induced proteotoxicity; contains a PACE promoter element and is co-regulated with proteasome subunit genes; AN1-type zinc finger protein, with DHHC and ubiquitin-like domains (UBL); ortholog of ZFAND1, a human gene linked to cancer; protein abundance increases under DNA replication stress +S000034106 CDS YNL155W 14 342516 343340 W 2011-02-03 1996-07-31 +S000005098 ORF Verified YNL154C YCK2 serine/threonine protein kinase YCK2 chromosome 14 L000002501 14 345276 343636 C 2011-02-03 1996-07-31 Palmitoylated plasma membrane-bound casein kinase I (CK1) isoform; shares redundant functions with Yck1p in morphogenesis, proper septin assembly, endocytic trafficking, and glucose sensing; stabilized by Sod1p binding in the presence of glucose and oxygen, causing glucose repression of respiratory metabolism; involved in the phosphorylation and regulation of glucose sensor Rgt2p; YCK2 has a paralog, YCK1, that arose from the whole genome duplication +S000032102 CDS YNL154C 14 345276 343636 C 2011-02-03 1996-07-31 +S000005097 ORF Verified YNL153C GIM3 tubulin-binding prefolding complex subunit GIM3|PFD4 chromosome 14 L000004369 14 346058 345669 C 2011-02-03 1996-07-31 Subunit of the heterohexameric cochaperone prefoldin complex; prefoldin binds specifically to cytosolic chaperonin and transfers target proteins to it; prefoldin complex also localizes to chromatin of actively transcribed genes in the nucleus and facilitates transcriptional elongation +S000031948 CDS YNL153C 14 346058 345669 C 2011-02-03 1996-07-31 +S000005096 ORF Verified YNL152W INN1 chromosome 14 14 346313 347542 W 2011-02-03 1996-07-31 Essential protein that associates with contractile actomyosin ring; required for ingression of the plasma membrane into the bud neck during cytokinesis; C2 domain, a membrane targeting module, is required for function; activates chitin synthase activity of Chs2p during cytokinesis +S000031853 CDS YNL152W 14 346313 347542 W 2011-02-03 1996-07-31 +S000005095 ORF Verified YNL151C RPC31 DNA-directed RNA polymerase III subunit C31|C31|RPC8|ACP2 chromosome 14 L000001688 14 348521 347766 C -237 2011-02-03 1996-07-31 RNA polymerase III subunit C31 +S000030811 CDS YNL151C 14 348521 347766 C 2011-02-03 1996-07-31 +S000005094 ORF Dubious YNL150W chromosome 14 14 349251 349658 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; extensive overlap with PGA2/YNL149C, an uncharacterized gene with a proposed role in protein trafficking +S000030782 CDS YNL150W 14 349251 349658 W 2011-02-03 1996-07-31 +S000005093 ORF Verified YNL149C PGA2 chromosome 14 14 349756 349367 C 2011-02-03 1996-07-31 Essential protein required for maturation of Gas1p and Pho8p; involved in protein trafficking; GFP-fusion protein localizes to the ER and YFP-fusion protein to the nuclear envelope-ER network; null mutants have a cell separation defect +S000031137 CDS YNL149C 14 349756 349367 C 2011-02-03 1996-07-31 +S000005092 ORF Verified YNL148C ALF1 chromosome 14 L000003527 14 350671 349907 C 2011-02-03 1996-07-31 Alpha-tubulin folding protein; similar to mammalian cofactor B; Alf1p-GFP localizes to cytoplasmic microtubules; required for the folding of alpha-tubulin and may play an additional role in microtubule maintenance +S000031037 CDS YNL148C 14 350671 349907 C 2011-02-03 1996-07-31 +S000005091 ORF Verified YNL147W LSM7 Sm-like protein LSM7 chromosome 14 L000004686 14 350940 351383 W 2011-02-03 1996-07-31|2007-09-06 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; protein abundance increases and forms cytoplasmic foci in response to DNA replication stress +S000031001 CDS YNL147W 14 350940 350957 W 2011-02-03 1996-07-31 +S000031002 CDS YNL147W 14 351054 351383 W 2011-02-03 1996-07-31|2007-09-06 +S000031003 intron YNL147W 14 350958 351053 W 2011-02-03 1996-07-31|2007-09-06 +S000028851 ORF Uncharacterized YNL146C-A chromosome 14 14 351580 351386 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000034564 CDS YNL146C-A 14 351580 351386 C 2011-02-03 2003-07-29 +S000005090 ORF Uncharacterized YNL146W chromosome 14 14 351715 352017 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YNL146W is not an essential gene +S000030919 CDS YNL146W 14 351715 352017 W 2011-02-03 1996-07-31 +S000005089 ORF Verified YNL145W MFA2 mating pheromone a chromosome 14 L000001097 14 352414 352530 W -107.4 2011-02-03 1996-07-31 Mating pheromone a-factor; made by a cells; interacts with alpha cells to induce cell cycle arrest and other responses leading to mating; biogenesis involves C-terminal modification, N-terminal proteolysis, and export; also encoded by MFA1 +S000029912 CDS YNL145W 14 352414 352530 W 2011-02-03 1996-07-31 +S000028702 ORF Dubious YNL144W-A chromosome 14 14 353061 353144 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YNL144C +S000032635 CDS YNL144W-A 14 353061 353144 W 2011-02-03 2003-07-29 +S000005088 ORF Uncharacterized YNL144C chromosome 14 14 355042 352820 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-tagged protein is detected in highly purified mitochondria in high-throughput studies; contains a PH domain and binds phosphatidylinositols and phosphatidylethanolamine in a large-scale study; YNL144C has a paralog, YHR131C, that arose from the whole genome duplication +S000037844 CDS YNL144C 14 355042 352820 C 2011-02-03 1996-07-31 +S000005087 ORF Uncharacterized YNL143C chromosome 14 14 357186 356794 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels +S000036002 CDS YNL143C 14 357186 356794 C 2011-02-03 1996-07-31 +S000005086 ORF Verified YNL142W MEP2 ammonium permease MEP2 chromosome 14 L000002583 14 357453 358952 W 2011-02-03 1996-07-31 Ammonium permease involved in regulation of pseudohyphal growth; belongs to a ubiquitous family of cytoplasmic membrane proteins that transport only ammonium (NH4+); expression is under the nitrogen catabolite repression regulation +S000035924 CDS YNL142W 14 357453 358952 W 2011-02-03 1996-07-31 +S000005085 ORF Verified YNL141W AAH1 adenine deaminase chromosome 14 L000004289 14 359596 360639 W 2011-02-03 1996-07-31 Adenine deaminase (adenine aminohydrolase); converts adenine to hypoxanthine; involved in purine salvage; transcriptionally regulated by nutrient levels and growth phase; Aah1p degraded upon entry into quiescence via SCF and the proteasome +S000035807 CDS YNL141W 14 359596 360639 W 2011-02-03 1996-07-31 +S000005084 ORF Uncharacterized YNL140C chromosome 14 14 361486 360917 C 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; partially overlaps THO2/YNL139C +S000034768 CDS YNL140C 14 361486 360917 C 2011-02-03 1996-07-31 +S000005083 ORF Verified YNL139C THO2 RLR1|LDB5|ZRG13 chromosome 14 L000002589 14 365717 360924 C 2011-02-03 1996-07-31 Subunit of the THO complex; THO is required for efficient transcription elongation and involved in transcriptional elongation-associated recombination; required for LacZ RNA expression from certain plasmids +S000036082 CDS YNL139C 14 365717 360924 C 2011-02-03 1996-07-31 +S000028509 ORF Verified YNL138W-A YSF3 U2 snRNP complex subunit YSF3|RCP10 chromosome 14 14 366033 366412 W 2011-02-03 2003-07-29 Component of the SF3b subcomplex of the U2 snRNP; essential protein required for splicing and for assembly of SF3b +S000030223 CDS YNL138W-A 14 366033 366035 W 2011-02-03 2003-07-29 +S000030224 CDS YNL138W-A 14 366158 366412 W 2011-02-03 2003-07-29 +S000030225 intron YNL138W-A 14 366036 366157 W 2011-02-03 2003-07-29 +S000005082 ORF Verified YNL138W SRV2 adenylate cyclase-binding protein|CAP chromosome 14 L000002068 14 366741 368321 W -101 2011-02-03 1996-07-31 CAP (cyclase-associated protein); N-terminus binds adenylate cyclase and facilitates activation by RAS; N-terminus forms novel hexameric star-shaped shuriken structures that directly catalyze cofilin-mediated severing of actin filaments; C-terminus binds and recycles cofilin bound, ADP-actin monomers, facilitating regulation of actin dynamics and cell morphogenesis; N- and C-termini can function as physically separate proteins; mCAP1 is the mouse homolog +S000036041 CDS YNL138W 14 366741 368321 W 2011-02-03 1996-07-31 +S000005081 ORF Verified YNL137C NAM9 mitochondrial 37S ribosomal protein NAM9|MNA6 chromosome 14 L000001231 14 370055 368595 C 2011-02-03 1996-07-31 Mitochondrial ribosomal component of the small subunit +S000035090 CDS YNL137C 14 370055 368595 C 2011-02-03 1996-07-31 +S000005080 ORF Verified YNL136W EAF7 chromosome 14 14 370368 371645 W 2011-02-03 1996-07-31 Subunit of the NuA4 histone acetyltransferase complex; NuA4 acetylates the N-terminal tails of histones H4 and H2A +S000035041 CDS YNL136W 14 370368 371645 W 2011-02-03 1996-07-31 +S000005079 ORF Verified YNL135C FPR1 peptidylprolyl isomerase FPR1|RBP1|FKB1 chromosome 14 L000000623 14 372226 371882 C -105 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (PPIase); binds to the drugs FK506 and rapamycin; also binds to the nonhistone chromatin binding protein Hmo1p and may regulate its assembly or function; N-terminally propionylated in vivo; mutation is functionally complemented by human FKBP1A +S000034848 CDS YNL135C 14 372226 371882 C 2011-02-03 1996-07-31 +S000005078 ORF Verified YNL134C chromosome 14 14 373581 372451 C 2011-02-03 1996-07-31 NADH-dependent aldehyde reductase, involved in detoxification of furfural; expression is up-regulated in the presence of furfural and 5-hydroxymethylfurfural, which are compounds generated during lignocellulosic biomass pre-treatment; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and nucleus; protein abundance increases in response to DNA replication stress +S000033976 CDS YNL134C 14 373581 372451 C 2011-02-03 1996-07-31 +S000005077 ORF Verified YNL133C FYV6 chromosome 14 14 374692 374171 C 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin; proposed to regulate double-strand break repair via non-homologous end-joining +S000033840 CDS YNL133C 14 374692 374171 C 2011-02-03 1996-07-31 +S000006569 tRNA_gene tF(GAA)N chromosome 14 L000003689 14 374869 374959 W 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035429 intron tF(GAA)N 14 374906 374923 W 2011-02-03 2000-05-19 +S000035427 noncoding_exon tF(GAA)N 14 374869 374905 W 2011-02-03 2000-05-19 +S000035428 noncoding_exon tF(GAA)N 14 374924 374959 W 2011-02-03 2000-05-19 +S000005076 ORF Verified YNL132W KRE33 ribosome biosynthesis protein KRE33|RRA1 chromosome 14 14 375321 378491 W 2011-02-03 1996-07-31 Protein required for biogenesis of the small ribosomal subunit; heterozygous mutant shows haploinsufficiency in K1 killer toxin resistance; essential gene; NAT10, the human homolog, implicated in several types of cancer and premature aging. +S000033781 CDS YNL132W 14 375321 378491 W 2011-02-03 1996-07-31 +S000005075 ORF Verified YNL131W TOM22 MOM22|MAS22|MAS17 chromosome 14 L000002582 14 378767 379225 W 2011-02-03 1996-07-31 Component of the TOM (Translocase of Outer Membrane) complex; responsible for initial import of mitochondrially directed proteins; mediates interaction between TOM and TIM complexes and acts as a receptor for precursor proteins +S000033651 CDS YNL131W 14 378767 379225 W 2011-02-03 1996-07-31 +S000005074 ORF Verified YNL130C CPT1 diacylglycerol cholinephosphotransferase chromosome 14 L000000404 14 380831 379558 C 2011-02-03 2004-02-03|1996-07-31 Cholinephosphotransferase; required for phosphatidylcholine biosynthesis and for inositol-dependent regulation of EPT1 transcription; CPT1 has a paralog, EPT1, that arose from the whole genome duplication +S000030245 CDS YNL130C 14 380689 379558 C 2011-02-03 1996-07-31 +S000030243 CDS YNL130C 14 380831 380782 C 2011-02-03 2004-02-03|1996-07-31 +S000030246 intron YNL130C 14 380781 380690 C 2011-02-03 2004-02-03|1996-07-31 +S000028579 ORF Uncharacterized YNL130C-A DGR1 chromosome 14 14 381391 381245 C 2011-02-03 2003-07-29 Protein of unknown function; dgr1 null mutant is resistant to 2-deoxy-D-glucose +S000031313 CDS YNL130C-A 14 381391 381245 C 2011-02-03 2003-07-29 +S000005073 ORF Verified YNL129W NRK1 ribosylnicotinamide kinase chromosome 14 S000029011|S000029327 14 381480 382202 W 2011-02-03 1996-07-31 Nicotinamide riboside kinase; catalyzes the phosphorylation of nicotinamide riboside and nicotinic acid riboside in salvage pathways for NAD+ biosynthesis +S000031557 CDS YNL129W 14 381480 382202 W 2011-02-03 1996-07-31 +S000005072 ORF Verified YNL128W TEP1 putative phosphatidylinositol-3,4,5-trisphosphate 3-phosphatase chromosome 14 L000003922 14 382359 383663 W 2011-02-03 1996-07-31|2011-02-03 PTEN homolog with no demonstrated inositol lipid phosphatase activity; plays a role in normal sporulation; homolog of human tumor suppressor gene PTEN/MMAC1/TEP1 and fission yeast ptn1 +S000030721 CDS YNL128W 14 382359 383663 W 2011-02-03 1996-07-31|2011-02-03 +S000005071 ORF Verified YNL127W FAR11 chromosome 14 14 383987 386848 W 2011-02-03 1996-07-31 Protein involved in recovery from cell cycle arrest; acts in response to pheromone; also involved in regulation of intra-S DNA damage checkpoint and autophagy; is essential for dephosphorylation of Atg13p; interacts with Far3p, Far7p, Far8p, Far9p, Far10p and with the phosphatases Pph21p, Pph22p and Pph3p; has similarity to the N- and C-termini of N. crassa HAM-2; similar to human Fam40A and Fam40B +S000030640 CDS YNL127W 14 383987 386848 W 2011-02-03 1996-07-31 +S000005070 ORF Verified YNL126W SPC98 chromosome 14 L000003430 14 387227 389767 W 2011-02-03 1996-07-31 Component of the microtubule-nucleating Tub4p (gamma-tubulin) complex; interacts with Spc110p at the spindle pole body (SPB) inner plaque and with Spc72p at the SPB outer plaque +S000030533 CDS YNL126W 14 387227 389767 W 2011-02-03 1996-07-31 +S000005069 ORF Verified YNL125C ESBP6 MCH3 chromosome 14 L000004077 14 392167 390146 C 2011-02-03 1996-07-31 Protein with similarity to monocarboxylate permeases; appears not to be involved in transport of monocarboxylates such as lactate, pyruvate or acetate across the plasma membrane +S000037681 CDS YNL125C 14 392167 390146 C 2011-02-03 1996-07-31 +S000005068 ORF Verified YNL124W NAF1 RNA-binding snoRNP assembly protein chromosome 14 14 392892 394370 W 2011-02-03 1996-07-31 RNA-binding protein required for the assembly of box H/ACA snoRNPs; thus required for pre-rRNA processing; forms a complex with Shq1p and interacts with H/ACA snoRNP components Nhp2p and Cbf5p; similar to Gar1p +S000037659 CDS YNL124W 14 392892 394370 W 2011-02-03 1996-07-31 +S000005067 ORF Verified YNL123W NMA111 YNM3 chromosome 14 14 394685 397678 W 2011-02-03 1996-07-31 Serine protease and general molecular chaperone; involved in response to heat stress and promotion of apoptosis; may contribute to lipid homeostasis; sequence similarity to the mammalian Omi/HtrA2 family of serine proteases +S000037577 CDS YNL123W 14 394685 397678 W 2011-02-03 1996-07-31 +S000005066 ORF Verified YNL122C chromosome 14 14 398370 398023 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; homologous to bacterial L35 and human MRPL35 ribosomal proteins +S000037427 CDS YNL122C 14 398370 398023 C 2011-02-03 1996-07-31 +S000005065 ORF Verified YNL121C TOM70 protein channel TOM70|OMP1|MOM72|MAS70 chromosome 14 L000001030|L000003141 14 400537 398684 C 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; involved in the recognition and initial import steps for all mitochondrially directed proteins; acts as a receptor for incoming precursor proteins; TOM70 has a paralog, TOM71, that arose from the whole genome duplication +S000031934 CDS YNL121C 14 400537 398684 C 2011-02-03 1996-07-31 +S000005063 ORF Verified YNL119W NCS2 TUC2 chromosome 14 14 401040 402521 W 2011-02-03 1996-07-31 Protein required for uridine thiolation of Lys(UUU) and Glu(UUC) tRNAs; required for the thiolation of uridine at the wobble position of Lys(UUU) and Glu(UUC) tRNAs; has a role in urmylation and in invasive and pseudohyphal growth; inhibits replication of Brome mosaic virus in S. cerevisiae +S000036308 CDS YNL119W 14 401040 402521 W 2011-02-03 1996-07-31 +S000005064 ORF Dubious YNL120C chromosome 14 14 401518 401033 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion enhances replication of Brome mosaic virus in S. cerevisiae, but likely due to effects on the overlapping gene +S000031820 CDS YNL120C 14 401518 401033 C 2011-02-03 1996-07-31 +S000005062 ORF Verified YNL118C DCP2 decapping enzyme complex catalytic subunit|PSU1 chromosome 14 L000002866 14 405564 402652 C 2011-02-03 1996-07-31 Catalytic subunit of Dcp1p-Dcp2p decapping enzyme complex; removes 5' cap structure from mRNAs prior to their degradation; also enters nucleus and positively regulates transcription initiation; nudix hydrolase family member; forms cytoplasmic foci upon DNA replication stress; human homolog DCP2 complements yeast dcp2 thermosensitive mutant +S000035360 CDS YNL118C 14 405564 402652 C 2011-02-03 1996-07-31 +S000005061 ORF Verified YNL117W MLS1 malate synthase MLS1 chromosome 14 L000001123 14 406358 408022 W 2011-02-03 1996-07-31 Malate synthase, enzyme of the glyoxylate cycle; involved in utilization of non-fermentable carbon sources; expression is subject to carbon catabolite repression; localizes in peroxisomes during growth on oleic acid, otherwise cytosolic; can accept butyryl-CoA as acyl-CoA donor in addition to traditional substrate acetyl-CoA +S000035332 CDS YNL117W 14 406358 408022 W 2011-02-03 1996-07-31 +S000005060 ORF Verified YNL116W DMA2 ubiquitin-conjugating protein DMA2|CHF2 chromosome 14 S000029720 14 408341 409909 W 2011-02-03 1996-07-31 Ubiquitin-protein ligase (E3); controls septin dynamics and spindle position checkpoint (SPOC) with ligase Dma1p by regulating recruitment of Elm1p to bud neck; regulates levels of eIF2 subunit Gcd11p, as well as abundance, localization, and ubiquitination of Cdk inhibitory kinase Swe1p; ortholog of human RNF8, similar to human Chfr; contains FHA and RING finger domains; DMA2 has a paralog, DMA1, that arose from the whole genome duplication +S000035249 CDS YNL116W 14 408341 409909 W 2011-02-03 1996-07-31 +S000005059 ORF Uncharacterized YNL115C chromosome 14 14 412053 410119 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YNL115C is not an essential gene +S000034227 CDS YNL115C 14 412053 410119 C 2011-02-03 1996-07-31 +S000118386 ARS ARS1417 ARSXIV-412 chromosome 14 14 412267 412496 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000005057 ORF Verified YNL113W RPC19 DNA-directed RNA polymerase core subunit RPC19|AC19 chromosome 14 L000001687 14 412771 413199 W 2011-02-03 1996-07-31 RNA polymerase subunit AC19; common to RNA polymerases I and III +S000034093 CDS YNL113W 14 412771 413199 W 2011-02-03 1996-07-31 +S000005058 ORF Dubious YNL114C chromosome 14 14 413055 412684 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF RPC19/YNL113W, an RNA polymerase subunit +S000034126 CDS YNL114C 14 413055 412684 C 2011-02-03 1996-07-31 +S000005056 ORF Verified YNL112W DBP2 DEAD-box ATP-dependent RNA helicase DBP2 chromosome 14 L000000493 14 413639 416281 W 2011-02-03 1996-07-31 ATP-dependent RNA helicase of the DEAD-box protein family; has strong preference for dsRNA; interacts with YRA1; required for assembly of Yra1p, Nab2p and Mex67p onto mRNA and formation of nuclear mRNP; involved in mRNA decay and rRNA processing; may be involved in suppression of transcription from cryptic initiation sites +S000033962 CDS YNL112W 14 413639 414911 W 2011-02-03 1996-07-31 +S000033963 CDS YNL112W 14 415914 416281 W 2011-02-03 1996-07-31 +S000033964 intron YNL112W 14 414912 415913 W 2011-02-03 1996-07-31 +S000005055 ORF Verified YNL111C CYB5 chromosome 14 L000002498 14 417302 416940 C 2011-02-03 1996-07-31 Cytochrome b5; involved in the sterol and lipid biosynthesis pathways; acts as an electron donor to support sterol C5-6 desaturation +S000033131 CDS YNL111C 14 417302 416940 C 2011-02-03 1996-07-31 +S000005054 ORF Verified YNL110C NOP15 rRNA-binding ribosome biosynthesis protein NOP15 chromosome 14 14 418488 417826 C 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; involved in 60S ribosomal subunit biogenesis; localizes to both nucleolus and cytoplasm +S000033055 CDS YNL110C 14 418488 417826 C 2011-02-03 1996-07-31 +S000005053 ORF Dubious YNL109W chromosome 14 14 418964 419509 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YNL108C +S000032014 CDS YNL109W 14 418964 419509 W 2011-02-03 1996-07-31 +S000005052 ORF Verified YNL108C HUF chromosome 14 14 419826 419014 C 2011-02-03 1996-07-31 Protein phosphatase; similar to prokaryotic phosphotransfer enzymes; null mutant shows alterations in glucose metabolism; GFP-fusion protein localizes to the cytoplasm and nucleus; YNL108C has a paralog, TFC7, that arose from the whole genome duplication +S000031012 CDS YNL108C 14 419826 419014 C 2011-02-03 1996-07-31 +S000005051 ORF Verified YNL107W YAF9 chromosome 14 S000007495 14 420098 420778 W 2011-02-03 1996-07-31 Subunit of NuA4 histone H4 acetyltransferase and SWR1 complexes; may function to antagonize silencing near telomeres; interacts directly with Swc4p; has homology to human leukemogenic protein AF9; contains a YEATS domain +S000030966 CDS YNL107W 14 420098 420778 W 2011-02-03 1996-07-31 +S000005049 ORF Dubious YNL105W RRT16 chromosome 14 14 424155 424583 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene INP52; identified in a screen for mutants with decreased levels of rDNA transcription +S000030822 CDS YNL105W 14 424155 424583 W 2011-02-03 1996-07-31 +S000005050 ORF Verified YNL106C INP52 phosphatidylinositol-3-/phosphoinositide 5-phosphatase INP52|SJL2 chromosome 14 L000003985 14 424495 420944 C 2011-02-03 1996-07-31 Polyphosphatidylinositol phosphatase; dephosphorylates a number of phosphatidylinositol phosphates (PtdInsPs, PIPs) to PI; involved in endocytosis; hyperosmotic stress causes translocation to actin patches; synaptojanin-like protein with a Sac1 domain; INP52 has a paralog, INP53, that arose from the whole genome duplication +S000030872 CDS YNL106C 14 424495 420944 C 2011-02-03 1996-07-31 +S000028701 ORF Dubious YNL103W-A chromosome 14 14 426719 426808 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene MET4/YNL104C +S000032634 CDS YNL103W-A 14 426719 426808 W 2011-02-03 2003-07-29 +S000005048 ORF Verified YNL104C LEU4 2-isopropylmalate synthase LEU4 chromosome 14 L000000945 14 426754 424895 C -76 2011-02-03 1996-07-31 Alpha-isopropylmalate synthase (2-isopropylmalate synthase); the main isozyme responsible for the first step in the leucine biosynthesis pathway; LEU4 has a paralog, LEU9, that arose from the whole genome duplication +S000037846 CDS YNL104C 14 426754 424895 C 2011-02-03 1996-07-31 +S000005047 ORF Verified YNL103W MET4 chromosome 14 L000001079 14 427735 429753 W -76 2011-02-03 1996-07-31|2006-11-09 Leucine-zipper transcriptional activator; responsible for regulation of sulfur amino acid pathway; requires different combinations of auxiliary factors Cbf1p, Met28p, Met31p and Met32p; feedforward loop exists in the regulation of genes controlled by Met4p and Met32p; can be ubiquitinated by ubiquitin ligase SCF-Met30p, is either degraded or maintained in an inactive state; regulates degradation of its own DNA-binding cofactors by targeting them to SCF-Met30p +S000037804 CDS YNL103W 14 427735 429753 W 2011-02-03 1996-07-31|2006-11-09 +S000005046 ORF Verified YNL102W POL1 DNA-directed DNA polymerase alpha catalytic subunit POL1|HPR3|CRT5|CDC17 chromosome 14 L000000257 14 430087 434493 W -74 2011-02-03 1996-07-31 Catalytic subunit of the DNA polymerase I alpha-primase complex; required for the initiation of DNA replication during mitotic DNA synthesis and premeiotic DNA synthesis +S000037722 CDS YNL102W 14 430087 434493 W 2011-02-03 1996-07-31 +S000005045 ORF Verified YNL101W AVT4 chromosome 14 14 434999 437140 W 2011-02-03 1996-07-31 Vacuolar transporter; exports large neutral amino acids from the vacuole; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs) +S000036962 CDS YNL101W 14 434999 437140 W 2011-02-03 1996-07-31 +S000005044 ORF Verified YNL100W MIC27 AIM37|MCS27 chromosome 14 14 437613 438317 W 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; forms a subcomplex with Mic10p and Mic12p whose assembly and stability requires cardiolipin +S000036897 CDS YNL100W 14 437613 438317 W 2011-02-03 1996-07-31 +S000005043 ORF Verified YNL099C OCA1 putative tyrosine protein phosphatase OCA1 chromosome 14 14 439283 438567 C 2011-02-03 1996-07-31 Putative protein tyrosine phosphatase; required for cell cycle arrest in response to oxidative damage of DNA +S000031337 CDS YNL099C 14 439283 438567 C 2011-02-03 1996-07-31 +S000005042 ORF Verified YNL098C RAS2 Ras family GTPase RAS2|TSL7|GLC5|CYR3|CTN5 chromosome 14 L000001583 14 440570 439602 C -71.5 2011-02-03 1996-07-31 GTP-binding protein; regulates nitrogen starvation response, sporulation, and filamentous growth; farnesylation and palmitoylation required for activity and localization to plasma membrane; homolog of mammalian Ras proto-oncogenes; RAS2 has a paralog, RAS1, that arose from the whole genome duplication +S000030460 CDS YNL098C 14 440570 439602 C 2011-02-03 1996-07-31 +S000028699 ORF Uncharacterized YNL097C-B YNL097C-A chromosome 14 14 440919 440797 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000032611 CDS YNL097C-B 14 440919 440797 C 2011-02-03 2003-07-29 +S000028700 ORF Dubious YNL097W-A chromosome 14 14 441431 441586 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene PHO23/YNL097C +S000032629 CDS YNL097W-A 14 441431 441586 W 2011-02-03 2003-07-29 +S000005041 ORF Verified YNL097C PHO23 chromosome 14 L000004300 14 442358 441366 C 2011-02-03 1996-07-31 Component of the Rpd3L histone deacetylase complex; involved in transcriptional regulation of PHO5; affects termination of snoRNAs and cryptic unstable transcripts (CUTs); C-terminus shares significant sequence identity with the human candidate tumor suppressor p33-ING1 and its isoform ING3 +S000030326 CDS YNL097C 14 442358 441366 C 2011-02-03 1996-07-31 +S000006645 tRNA_gene tL(CAA)N chromosome 14 L000003690 14 443006 443119 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000033817 intron tL(CAA)N 14 443044 443075 W 2011-02-03 2000-05-19 +S000033815 noncoding_exon tL(CAA)N 14 443006 443043 W 2011-02-03 2000-05-19 +S000033816 noncoding_exon tL(CAA)N 14 443076 443119 W 2011-02-03 2000-05-19 +S000005040 ORF Verified YNL096C RPS7B eS7|ribosomal 40S subunit protein S7B|S7e|rp30|S7B chromosome 14 L000004473 14 444315 443398 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; interacts with Kti11p; deletion causes hypersensitivity to zymocin; homologous to mammalian ribosomal protein S7, no bacterial homolog; RPS7B has a paralog, RPS7A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000030167 CDS YNL096C 14 443826 443398 C 2011-02-03 1996-07-31 +S000030166 CDS YNL096C 14 444315 444172 C 2011-02-03 1996-07-31 +S000030168 intron YNL096C 14 444171 443827 C 2011-02-03 1996-07-31 +S000005039 ORF Uncharacterized YNL095C chromosome 14 14 446840 444912 C 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to contain a transmembrane domain; not an essential gene; YNL095C has a paralog, ECM3, that arose from the whole genome duplication +S000036433 CDS YNL095C 14 446840 444912 C 2011-02-03 1996-07-31 +S000005038 ORF Verified YNL094W APP1 phosphatidate phosphatase APP1 chromosome 14 14 447611 449374 W 2011-02-03 1996-07-31 Phosphatidate phosphatase, converts phosphatidate to diacylglycerol; App1p, Pah1p, Dpp1p, and Lpp1p are responsible for all the phosphatidate phosphatase activity; component of cortical actin patches; interacts with components of endocytic pathway +S000036404 CDS YNL094W 14 447611 449374 W 2011-02-03 1996-07-31 +S000118387 ARS ARS1419 ARSXIV-450 chromosome 14 14 449429 449588 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178171 ARS_consensus_sequence ARS1419 14 449534 449518 C 2014-11-18 2014-11-18 +S000005037 ORF Verified YNL093W YPT53 Rab family GTPase YPT53 chromosome 14 L000002547 14 449868 450530 W 2011-02-03 1996-07-31 Stress-induced Rab family GTPase; required for vacuolar protein sorting and endocytosis; involved in ionic stress tolerance; similar to Vps21p and Ypt52p; functional homolog of Vps21p; mammalian Rab5 homolog; YPT53 has a paralog, VPS21, that arose from the whole genome duplication +S000036317 CDS YNL093W 14 449868 450530 W 2011-02-03 1996-07-31 +S000005036 ORF Verified YNL092W S-adenosylmethionine-dependent methyltransferase chromosome 14 14 450871 452073 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent protein methyltransferase; capable of automethylation; member of the seven beta-strand family; YNL092W is not an essential gene +S000036208 CDS YNL092W 14 450871 452073 W 2011-02-03 1996-07-31 +S000005035 ORF Verified YNL091W NST1 chromosome 14 14 452408 456130 W 2011-02-03 1996-07-31 Protein of unknown function; mediates sensitivity to salt stress; interacts physically with the splicing factor Msl1p and also displays genetic interaction with MSL1 +S000036061 CDS YNL091W 14 452408 456130 W 2011-02-03 1996-07-31 +S000005034 ORF Verified YNL090W RHO2 Rho family GTPase RHO2 chromosome 14 L000001631 14 456565 457143 W 2011-02-03 1996-07-31 Non-essential small GTPase of the Rho/Rac family of Ras-like proteins; involved in the establishment of cell polarity and in microtubule assembly +S000035133 CDS YNL090W 14 456565 457143 W 2011-02-03 1996-07-31 +S000005033 ORF Dubious YNL089C chromosome 14 14 457169 456693 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; almost completely overlaps YNL090W/RHO2 which encodes a small GTPase of the Rho/Rac subfamily of Ras-like proteins +S000035490 CDS YNL089C 14 457169 456693 C 2011-02-03 1996-07-31 +S000005032 ORF Verified YNL088W TOP2 DNA topoisomerase 2|TRF3|TOR3 chromosome 14 L000002320 14 457704 461990 W -70 2011-02-03 1996-07-31 Topoisomerase II; relieves torsional strain in DNA by cleaving and re-sealing phosphodiester backbone of both positively and negatively supercoiled DNA; cleaves complementary strands; localizes to axial cores in meiosis; required for replication slow zone (RSZ) breakage following Mec1p inactivation; human homolog TOP2A implicated in cancers, and can complement yeast null mutant +S000035464 CDS YNL088W 14 457704 461990 W 2011-02-03 1996-07-31 +S000005031 ORF Verified YNL087W TCB2 tricalbin chromosome 14 14 462411 465947 W 2011-02-03 1996-07-31 ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to plasma membrane (PM) and regulate PM phosphatidylinositol-4-phosphate (PI4P) levels by controlling access of Sac1p phosphatase to its substrate PI4P in the PM; contains 3 calcium and lipid binding domains; mRNA is targeted to bud; TCB2 has a paralog, TCB1, that arose from the whole genome duplication +S000035400 CDS YNL087W 14 462411 465947 W 2011-02-03 1996-07-31 +S000005030 ORF Verified YNL086W SNN1 BLS1 chromosome 14 14 466334 466642 W 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Msb3p; green fluorescent protein (GFP)-fusion protein localizes to endosomes +S000035333 CDS YNL086W 14 466334 466642 W 2011-02-03 1996-07-31 +S000005029 ORF Verified YNL085W MKT1 chromosome 14 L000001120 14 467131 469623 W -69 2011-02-03 1996-07-31 Protein similar to nucleases that forms a complex with Pbp1p; complex may mediate posttranscriptional regulation of HO; involved in propagation of M2 dsRNA satellite of L-A virus; allelic variation affects mitochondrial genome stability, drug resistance, and more; forms cytoplasmic foci upon DNA replication stress; localization to P-bodies under ethanol stress differs between strains +S000034367 CDS YNL085W 14 467131 469623 W 2011-02-03 1996-07-31 +S000005028 ORF Verified YNL084C END3 chromosome 14 L000000558 14 471102 470053 C 2011-02-03 1996-07-31 EH domain-containing protein involved in endocytosis; actin cytoskeletal organization and cell wall morphogenesis; forms a complex with Sla1p and Pan1p +S000034279 CDS YNL084C 14 471102 470053 C 2011-02-03 1996-07-31 +S000005027 ORF Verified YNL083W SAL1 Ca(2+)-binding ATP:ADP antiporter SAL1 chromosome 14 14 471377 472861 W 2011-02-03 2004-02-18|2010-01-05|1996-07-31 ADP/ATP transporter; member of the Ca2+-binding subfamily of mitochondrial carriers, with two EF-hand motifs; transport activity of either Sal1p or Pet9p is critical for viability; polymorphic in different S. cerevisiae strains +S000034242 CDS YNL083W 14 471377 472861 W 2011-02-03 2004-02-18|2010-01-05|1996-07-31 +S000005026 ORF Verified YNL082W PMS1 ATP-binding mismatch repair protein chromosome 14 L000001457 14 473391 476012 W -66 2011-02-03 2004-04-21|1996-07-31 ATP-binding protein required for mismatch repair; required for both mitosis and meiosis; functions as a heterodimer with Mlh1p; binds double- and single-stranded DNA via its N-terminal domain, similar to E. coli MutL +S000034101 CDS YNL082W 14 473391 476012 W 2011-02-03 2004-04-21|1996-07-31 +S000005025 ORF Verified YNL081C SWS2 putative mitochondrial 37S ribosomal protein SWS2 chromosome 14 14 476619 476188 C 2011-02-03 1996-07-31 Putative mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S13 ribosomal protein; participates in controlling sporulation efficiency; localizes to vacuole in response to H2O2 +S000032072 CDS YNL081C 14 476619 476188 C 2011-02-03 1996-07-31 +S000005024 ORF Verified YNL080C EOS1 chromosome 14 14 478032 476932 C 2011-02-03 1996-07-31 Protein involved in N-glycosylation; deletion mutation confers sensitivity to exidative stress and shows synthetic lethality with mutations in the spindle checkpoint genes BUB3 and MAD1; YNL080C is not an essential gene +S000031947 CDS YNL080C 14 478032 476932 C 2011-02-03 1996-07-31 +S000005023 ORF Verified YNL079C TPM1 tropomyosin TPM1 chromosome 14 L000002328 14 479165 478566 C 2011-02-03 1996-07-31 Major isoform of tropomyosin; binds to and stabilizes actin cables and filaments, which direct polarized cell growth and the distribution of several organelles; acetylated by the NatB complex and acetylated form binds actin most efficiently; TPM1 has a paralog, TPM2, that arose from the whole genome duplication +S000032271 CDS YNL079C 14 479165 478566 C 2011-02-03 1996-07-31 +S000005022 ORF Verified YNL078W NIS1 JIP1 chromosome 14 14 479768 480991 W 2011-02-03 1996-07-31 Protein localized in the bud neck at G2/M phase; physically interacts with septins; possibly involved in a mitotic signaling network +S000032241 CDS YNL078W 14 479768 480991 W 2011-02-03 1996-07-31 +S000005021 ORF Verified YNL077W APJ1 chromosome 14 14 481391 482977 W 2011-02-03 1996-07-31 Chaperone with a role in SUMO-mediated protein degradation; member of the DnaJ-like family; conserved across eukaryotes; overexpression interferes with propagation of the [Psi+] prion; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; forms nuclear foci upon DNA replication stress +S000032158 CDS YNL077W 14 481391 482977 W 2011-02-03 1996-07-31 +S000005020 ORF Verified YNL076W MKS1 LYS80 chromosome 14 L000001119 14 483556 485310 W 2011-02-03 1996-07-31 Pleiotropic negative transcriptional regulator; involved in Ras-CAMP and lysine biosynthetic pathways and nitrogen regulation; involved in retrograde (RTG) mitochondria-to-nucleus signaling +S000031187 CDS YNL076W 14 483556 485310 W 2011-02-03 1996-07-31 +S000005019 ORF Verified YNL075W IMP4 snoRNA-binding rRNA-processing protein IMP4 chromosome 14 S000007424 14 485607 486479 W 2011-02-03 1996-07-31 Component of the SSU processome; SSU processome is required for pre-18S rRNA processing; interacts with Mpp10p; member of a superfamily of proteins that contain a sigma(70)-like motif and associate with RNAs +S000031099 CDS YNL075W 14 485607 486479 W 2011-02-03 1996-07-31 +S000005018 ORF Verified YNL074C MLF3 YMK1 chromosome 14 L000004166 14 488124 486766 C 2011-02-03 1996-07-31 Serine-rich protein of unknown function; predicted to be palmitoylated; overproduction suppresses growth inhibition caused by exposure to immunosuppressant leflunomide; MLF3 has a paralog, VHS2, that arose from the whole genome duplication +S000030955 CDS YNL074C 14 488124 486766 C 2011-02-03 1996-07-31 +S000005017 ORF Verified YNL073W MSK1 lysine--tRNA ligase MSK1 chromosome 14 L000001195 14 488386 490116 W 2011-02-03 1996-07-31 Mitochondrial lysine-tRNA synthetase; required for import of both aminoacylated and deacylated forms of tRNA(Lys) into mitochondria and for aminoacylation of mitochondrially encoded tRNA(Lys) +S000030916 CDS YNL073W 14 488386 490116 W 2011-02-03 1996-07-31 +S000005016 ORF Verified YNL072W RNH201 ribonuclease H2 catalytic subunit RNH201|Rnh2A|RNH35 chromosome 14 L000004047 14 490317 491240 W 2011-02-03 1996-07-31 Ribonuclease H2 catalytic subunit; removes RNA primers during Okazaki fragment synthesis and errant ribonucleotides misincorporated during DNA replication; role in ribonucleotide excision repair; homolog of RNAse HI; related to human AGS4 which causes Aicardi-Goutieres syndrome +S000029909 CDS YNL072W 14 490317 491240 W 2011-02-03 1996-07-31 +S000005015 ORF Verified YNL071W LAT1 dihydrolipoyllysine-residue acetyltransferase|PDA2|ODP2 chromosome 14 L000000932|L000003242 14 491523 492971 W 2011-02-03 1996-07-31 Dihydrolipoamide acetyltransferase component (E2) of the PDC; the pyruvate dehydrogenase complex (PDC) catalyzes the oxidative decarboxylation of pyruvate to acetyl-CoA +S000037903 CDS YNL071W 14 491523 492971 W 2011-02-03 1996-07-31 +S000005014 ORF Verified YNL070W TOM7 YOK22|MOM7 chromosome 14 L000003250 14 493366 493548 W 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; promotes assembly and stability of the TOM complex +S000037807 CDS YNL070W 14 493366 493548 W 2011-02-03 1996-07-31 +S000005013 ORF Verified YNL069C RPL16B uL13|ribosomal 60S subunit protein L16B|L13|rp23|YL15|L21B|L16B|RP23 chromosome 14 L000003244 14 495001 493956 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L16B; N-terminally acetylated, binds 5.8 S rRNA; transcriptionally regulated by Rap1p; homologous to mammalian ribosomal protein L13A and bacterial L13; RPL16B has a paralog, RPL16A, that arose from the whole genome duplication +S000036374 CDS YNL069C 14 494524 493956 C 2011-02-03 1996-07-31 +S000036373 CDS YNL069C 14 495001 494974 C 2011-02-03 1996-07-31 +S000036375 intron YNL069C 14 494973 494525 C 2011-02-03 1996-07-31 +S000005012 ORF Verified YNL068C FKH2 forkhead family transcription factor FKH2 chromosome 14 L000002608 14 498289 495701 C 2011-02-03 1996-07-31 Forkhead family transcription factor; rate-limiting activator of replication origins; evolutionarily conserved regulator of lifespan; binds multiple chromosomal elements with distinct specificities, cell cycle dynamics; positively regulates transcriptional elongation; facilitates clustering, activation of early-firing replication origins; negative role in chromatin silencing at HML and HMR; major role in expression of G2/M phase genes; relocalizes to cytosol under hypoxia +S000036272 CDS YNL068C 14 498289 495701 C 2011-02-03 1996-07-31 +S000007623 ORF Dubious YNL067W-A YNL067W-B chromosome 14 14 498538 498684 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037221 CDS YNL067W-A 14 498538 498684 W 2011-02-03 2001-02-26 +S000118388 ARS ARS1420 ARSXIV-499 chromosome 14 14 498970 499154 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178172 ARS_consensus_sequence ARS1420 14 499037 499053 W 2014-11-18 2014-11-18 +S000028810 ORF Uncharacterized YNL067W-B YNL067W-A chromosome 14 14 499417 499557 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000033610 CDS YNL067W-B 14 499417 499557 W 2011-02-03 2003-07-29 +S000005011 ORF Verified YNL067W RPL9B uS4|uL6|ribosomal 60S subunit protein L9B|L6|rp24|YL11|L9B|L8B chromosome 14 L000003165 14 499681 500256 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L9B; homologous to mammalian ribosomal protein L9 and bacterial L6; RPL9B has a paralog, RPL9A, that arose from a single-locus duplication +S000036228 CDS YNL067W 14 499681 500256 W 2011-02-03 1996-07-31 +S000005010 ORF Verified YNL066W SUN4 putative glucosidase SUN4|SCW3 chromosome 14 L000004564|L000004151 14 501515 502777 W 2011-02-03 1996-07-31 Cell wall protein related to glucanases; possibly involved in cell wall septation; member of the SUN family; SUN4 has a paralog, SIM1, that arose from the whole genome duplication +S000036134 CDS YNL066W 14 501515 502777 W 2011-02-03 1996-07-31 +S000122110 five_prime_UTR_intron YNL066W 14 501157 501502 W 2011-02-03 2007-04-04 +S000005009 ORF Verified YNL065W AQR1 chromosome 14 14 503724 505484 W 2011-02-03 1996-07-31 Plasma membrane transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; confers resistance to short-chain monocarboxylic acids and quinidine; involved in the excretion of excess amino acids; AQR1 has a paralog, QDR1, that arose from the whole genome duplication; relocalizes from plasma membrane to cytoplasm upon DNA replication stress +S000036037 CDS YNL065W 14 503724 505484 W 2011-02-03 1996-07-31 +S000005008 ORF Verified YNL064C YDJ1 MAB3|type I HSP40 co-chaperone YDJ1|HSP40|MAS5 chromosome 14 L000002503|L000003567|S000029274 14 507097 505868 C 2011-02-03 1996-07-31 Type I HSP40 co-chaperone; involved in regulation of HSP90 and HSP70 functions; acts as an adaptor that helps Rsp5p recognize cytosolic misfolded proteins for ubiquitination after heat shock; critical for determining cell size at Start as a function of growth rate; involved in protein translocation across membranes; member of the DnaJ family; chimeric protein in which human p58IPK J domain replaces yeast Ydj1p J domain can complement yeast ydj1 mutant +S000035088 CDS YNL064C 14 507097 505868 C 2011-02-03 1996-07-31 +S000005007 ORF Verified YNL063W MTQ1 S-adenosylmethionine-dependent methyltransferase chromosome 14 14 507758 508702 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent methyltransferase; methylates translational release factor Mrf1p; similar to E.coli PrmC; is not an essential gene +S000035039 CDS YNL063W 14 507758 508702 W 2011-02-03 1996-07-31 +S000005006 ORF Verified YNL062C GCD10 tRNA 1-methyladenosine methyltransferase subunit GCD10|TRM6 chromosome 14 L000000676 14 510212 508776 C 2011-02-03 1996-07-31 Subunit of tRNA (1-methyladenosine) methyltransferase with Gcd14p; required for the modification of the adenine at position 58 in tRNAs, especially tRNAi-Met; first identified as a negative regulator of GCN4 expression +S000034822 CDS YNL062C 14 510212 508776 C 2011-02-03 1996-07-31 +S000005005 ORF Verified YNL061W NOP2 rRNA (cytosine-C5-)-methyltransferase NOP2|YNA1 chromosome 14 L000002535 14 510540 512396 W 2011-02-03 1996-07-31 rRNA m5C methyltransferase; methylates cytosine at position 2870 of 25S rRNA; has an essential function independent of rRNA methylation; contains seven beta-strand methyltransferase motif; essential for processing and maturation of 27S pre-rRNA and large ribosomal subunit biogenesis; localized to the nucleolus; constituent of 66S pre-ribosomal particles; rRNA methylation defect and lethality are functionally complemented by human NOP2, a gene upregulated in cancer +S000034786 CDS YNL061W 14 510540 512396 W 2011-02-03 1996-07-31 +S000005004 ORF Verified YNL059C ARP5 chromosome 14 L000003434 14 514935 512668 C 2011-02-03 1997-01-28 Nuclear actin-related protein involved in chromatin remodeling; component of chromatin-remodeling enzyme complexes; promotes nucleosome shifts in the 3 prime direction +S000031814 CDS YNL059C 14 514935 512668 C 2011-02-03 1997-01-28 +S000005002 ORF Dubious YNL057W chromosome 14 14 516403 516735 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031644 CDS YNL057W 14 516403 516735 W 2011-02-03 1997-01-28 +S000005003 ORF Uncharacterized YNL058C chromosome 14 14 516713 515763 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to vacuole; not an essential gene; YNL058C has a paralog, PRM5, that arose from the whole genome duplication +S000031675 CDS YNL058C 14 516713 515763 C 2011-02-03 1997-01-28 +S000005001 ORF Verified YNL056W OCA2 chromosome 14 14 517249 517842 W 2011-02-03 1997-01-28 Protein of unknown function; similar to predicted tyrosine phosphatases Oca1p and Siw14p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YNL056W is not an essential gene +S000031555 CDS YNL056W 14 517249 517842 W 2011-02-03 1997-01-28 +S000005000 ORF Verified YNL055C POR1 porin POR1|VDAC|YVDAC1|OMP2 chromosome 14 L000001302 14 518845 517994 C 2011-02-03 1997-01-28 Mitochondrial porin (voltage-dependent anion channel); outer membrane protein required for maintenance of mitochondrial osmotic stability and mitochondrial membrane permeability; couples the glutathione pools of the intermembrane space (IMS) and the cytosol; interacts with Om45 and Om14 in the outer membrane; phosphorylated; protein abundance increases in response to DNA replication stress +S000030679 CDS YNL055C 14 518845 517994 C 2011-02-03 1997-01-28 +S000007136 long_terminal_repeat YNLWdelta3 chromosome 14 14 519163 519496 W 2011-02-03 2000-05-19 Ty1 LTR +S000007142 LTR_retrotransposon YNLWTy1-2 Ty1 chromosome 14 14 519163 525062 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006544 tRNA_gene tD(GUC)N chromosome 14 L000003699 14 519169 519099 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030423 noncoding_exon tD(GUC)N 14 519169 519099 C 2011-02-03 2000-05-19 +S000007384 transposable_element_gene YNL054W-A gag protein chromosome 14 14 519456 520778 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000033062 CDS YNL054W-A 14 519456 520778 W 2011-02-03 1999-07-17 +S000007385 transposable_element_gene YNL054W-B gag-pol fusion protein chromosome 14 14 519456 524706 W 2011-02-03 1999-07-17 TyB Gag-Pol protein; proteolytically processed to make the Gag, reverse transcriptase (RT), protease (PR), and integrase (IN) proteins that are required for retrotransposition +S000033063 CDS YNL054W-B 14 519456 520760 W 2011-02-03 1999-07-17 +S000033064 CDS YNL054W-B 14 520762 524706 W 2011-02-03 1999-07-17 +S000033065 plus_1_translational_frameshift YNL054W-B 14 520761 520761 W 2011-02-03 1999-07-17 +S000007137 long_terminal_repeat YNLWdelta4 chromosome 14 14 524729 525062 W 2011-02-03 2000-05-19 Ty1 LTR +S000004999 ORF Verified YNL054W VAC7 chromosome 14 L000004051 14 526086 529583 W 2011-02-03 1997-01-28 Integral vacuolar membrane protein; involved in vacuole inheritance and morphology; activates Fab1p kinase activity under basal conditions and also after hyperosmotic shock +S000030639 CDS YNL054W 14 526086 529583 W 2011-02-03 1997-01-28 +S000004998 ORF Verified YNL053W MSG5 tyrosine/serine/threonine protein phosphatase MSG5 chromosome 14 L000001188 14 529942 531411 W 2011-02-03 1997-01-28 Dual-specificity protein phosphatase; exists in 2 isoforms; required for maintenance of a low level of signaling through the cell integrity pathway, adaptive response to pheromone; regulates and is regulated by Slt2p; dephosphorylates Fus3p; MSG5 has a paralog, SDP1, that arose from the whole genome duplication +S000030532 CDS YNL053W 14 529942 531411 W 2011-02-03 1997-01-28 +S000004997 ORF Verified YNL052W COX5A cytochrome c oxidase subunit Va chromosome 14 L000000388|L000000387 14 531725 532186 W 2011-02-03 1997-01-28 Subunit Va of cytochrome c oxidase; cytochrome c oxidase is the terminal member of the mitochondrial inner membrane electron transport chain; Cox5Ap is predominantly expressed during aerobic growth while its isoform Vb (Cox5Bp) is expressed during anaerobic growth; COX5A has a paralog, COX5B, that arose from the whole genome duplication +S000030467 CDS YNL052W 14 531725 532186 W 2011-02-03 1997-01-28 +S000004996 ORF Verified YNL051W COG5 Golgi transport complex subunit COG5|COD4|API4 chromosome 14 14 532659 533870 W 2011-02-03 1997-01-28 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000037658 CDS YNL051W 14 532659 533870 W 2011-02-03 1997-01-28 +S000004995 ORF Uncharacterized YNL050C chromosome 14 14 534982 534079 C 2011-02-03 1997-01-28 Putative protein of unknown function; YNL050c is not an essential gene +S000037523 CDS YNL050C 14 534874 534079 C 2011-02-03 1997-01-28 +S000037522 CDS YNL050C 14 534982 534966 C 2011-02-03 1997-01-28 +S000037524 intron YNL050C 14 534965 534875 C 2011-02-03 1997-01-28 +S000004994 ORF Verified YNL049C SFB2 COPII subunit SFB2|ISS1 chromosome 14 L000004658 14 537911 535281 C 2011-02-03 1997-01-28 Component of the Sec23p-Sfb2p heterodimer of the COPII vesicle coat; required for cargo selection during vesicle formation in ER to Golgi transport; homologous to Sfb3p; SFB2 has a paralog, SEC24, that arose from the whole genome duplication +S000036531 CDS YNL049C 14 537911 535281 C 2011-02-03 1997-01-28 +S000004993 ORF Verified YNL048W ALG11 alpha-1,2-mannosyltransferase ALG11 chromosome 14 L000003378 14 538173 539819 W 2011-02-03 1997-01-28 Alpha-1,2-mannosyltransferase; catalyzes sequential addition of the two terminal alpha 1,2-mannose residues to the Man5GlcNAc2-PP-dolichol intermediate during asparagine-linked glycosylation in the ER +S000036480 CDS YNL048W 14 538173 539819 W 2011-02-03 1997-01-28 +S000004992 ORF Verified YNL047C SLM2 phosphatidylinositol 4,5-bisphosphate-binding protein|LIT1 chromosome 14 14 541881 539911 C 2011-02-03 1997-01-28 Phosphoinositide PI4,5P(2) binding protein, forms a complex with Slm1p; acts downstream of Mss4p in a pathway regulating actin cytoskeleton organization in response to stress; TORC2 complex substrate and effector; SLM2 has a paralog, SLM1, that arose from the whole genome duplication +S000036346 CDS YNL047C 14 541881 539911 C 2011-02-03 1997-01-28 +S000004991 ORF Uncharacterized YNL046W chromosome 14 14 542304 542822 W 2011-02-03 1997-01-28 Putative protein of unknown function; expression depends on Swi5p; GFP-fusion protein localizes to the endoplasmic reticulum; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) +S000036307 CDS YNL046W 14 542304 542822 W 2011-02-03 1997-01-28 +S000004990 ORF Verified YNL045W LAP2 bifunctional aminopeptidase/epoxide hydrolase chromosome 14 14 542963 544978 W 2011-02-03 1997-01-28 Leucyl aminopeptidase yscIV with epoxide hydrolase activity; metalloenzyme containing one zinc atom; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; also known as leukotriene A4 hydrolase +S000035413 CDS YNL045W 14 542963 544978 W 2011-02-03 1997-01-28 +S000004989 ORF Verified YNL044W YIP3 chromosome 14 L000003269 14 545268 545877 W 2011-02-03 1999-11-17|1997-01-28 Protein localized to COPII vesicles; proposed to be involved in ER to Golgi transport; interacts with members of the Rab GTPase family and Yip1p; also interacts with Rtn1p +S000035328 CDS YNL044W 14 545268 545291 W 2011-02-03 1999-11-17 +S000035329 CDS YNL044W 14 545371 545877 W 2011-02-03 1999-11-17|1997-01-28 +S000035330 intron YNL044W 14 545292 545370 W 2011-02-03 1999-11-17 +S000004988 ORF Dubious YNL043C chromosome 14 14 545909 545589 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YIP3/YNL044W +S000035201 CDS YNL043C 14 545909 545589 C 2011-02-03 1997-01-28 +S000118389 ARS ARS1421 ARSXIV-546 chromosome 14 14 546072 546170 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178173 ARS_consensus_sequence ARS1421 14 546146 546130 C 2014-11-18 2014-11-18 +S000007138 long_terminal_repeat YNLWsigma2 chromosome 14 14 546423 546714 W 2011-02-03 2000-05-19 Ty3 LTR +S000007139 long_terminal_repeat YNLWsigma3 chromosome 14 14 546738 547077 W 2011-02-03 2000-05-19 Ty3 LTR +S000006685 tRNA_gene tP(UGG)N1 chromosome 14 L000003691 14 547094 547196 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin +S000030970 intron tP(UGG)N1 14 547130 547160 W 2011-02-03 2000-05-19 +S000030968 noncoding_exon tP(UGG)N1 14 547094 547129 W 2011-02-03 2000-05-19 +S000030969 noncoding_exon tP(UGG)N1 14 547161 547196 W 2011-02-03 2000-05-19 +S000028850 ORF Uncharacterized YNL042W-B chromosome 14 14 547113 547370 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000034563 CDS YNL042W-B 14 547113 547370 W 2011-02-03 2003-07-29 +S000004987 ORF Verified YNL042W BOP3 chromosome 14 L000004723 14 548100 549290 W 2011-02-03 1997-01-28 Protein of unknown function; potential Cdc28p substrate; overproduction confers resistance to methylmercury +S000035157 CDS YNL042W 14 548100 549290 W 2011-02-03 1997-01-28 +S000004986 ORF Verified YNL041C COG6 Golgi transport complex subunit COG6|SEC37|COD2 chromosome 14 14 551987 549468 C 2011-02-03 1997-01-28 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000034122 CDS YNL041C 14 551987 549468 C 2011-02-03 1997-01-28 +S000004985 ORF Verified YNL040W putative alanine--tRNA ligase chromosome 14 14 553380 554750 W 2011-02-03 1997-01-28 Protein of unknown function; has strong similarity to alanyl-tRNA synthases from Eubacteria; null mutant displays decreased translation rate and increased readthrough of premature stop codons; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YNL040W is not an essential gene +S000034091 CDS YNL040W 14 553380 554750 W 2011-02-03 1997-01-28 +S000004984 ORF Verified YNL039W BDP1 transcription factor TFIIIB subunit BDP1|TFC7|TFIIIB90|TFC5 chromosome 14 L000003032 14 555048 556832 W 2011-02-03 1997-01-28 Essential subunit of RNA polymerase III transcription factor (TFIIIB); TFIIIB is involved in transcription of genes encoding tRNAs, 5S rRNA, U6 snRNA, and other small RNAs +S000032264 CDS YNL039W 14 555048 556832 W 2011-02-03 1997-01-28 +S000004983 ORF Verified YNL038W GPI15 phosphatidylinositol N-acetylglucosaminyltransferase GPI15 chromosome 14 14 557020 557783 W 2011-02-03 2003-09-27|1997-01-28 Protein involved in the synthesis of GlcNAc-PI; GlcNAc-PI is the first intermediate in the synthesis of glycosylphosphatidylinositol (GPI) anchors; homologous to the human PIG-H protein; GlcNAc-PI stands for N-acetylglucosaminyl phosphatidylinositol +S000032181 CDS YNL038W 14 557020 557610 W 2011-02-03 2003-09-27|1997-01-28 +S000032182 CDS YNL038W 14 557685 557783 W 2011-02-03 2003-09-27 +S000032183 intron YNL038W 14 557611 557684 W 2011-02-03 2003-09-27 +S000004982 ORF Verified YNL037C IDH1 isocitrate dehydrogenase (NAD(+)) IDH1 chromosome 14 L000000849 14 559002 557920 C 2011-02-03 1997-01-28 Subunit of mitochondrial NAD(+)-dependent isocitrate dehydrogenase; complex catalyzes the oxidation of isocitrate to alpha-ketoglutarate in the TCA cycle +S000032073 CDS YNL037C 14 559002 557920 C 2011-02-03 1997-01-28 +S000004981 ORF Verified YNL036W NCE103 carbonate dehydratase NCE103|NCE3 chromosome 14 L000003213 14 559814 560479 W 2011-02-03 1997-01-28 Carbonic anhydrase; metalloenzyme that catalyzes CO2 hydration to bicarbonate, which is an important metabolic substrate, and protons; not expressed under conditions of high CO2, such as inside a growing colony, but transcription is induced in response to low CO2 levels, such as on the colony surface in ambient air; poorly transcribed under aerobic conditions and at an undetectable level under anaerobic conditions; abundance increases in response to DNA replication stress +S000032012 CDS YNL036W 14 559814 560479 W 2011-02-03 1997-01-28 +S000006745 tRNA_gene tT(AGU)N2 chromosome 14 L000003698 14 560765 560693 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000037431 noncoding_exon tT(AGU)N2 14 560765 560693 C 2011-02-03 2000-05-19 +S000118390 ARS ARS1422 ARSXIV-561 chromosome 14 14 561111 561388 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178174 ARS_consensus_sequence ARS1422 14 561327 561311 C 2014-11-18 2014-11-18 +S000007141 long_terminal_repeat YNLWtau2 chromosome 14 14 561607 561977 W 2011-02-03 2000-05-19 Ty4 LTR +S000007131 long_terminal_repeat YNLCdelta5 chromosome 14 14 562364 562033 C 2011-02-03 2000-05-19 Ty2 LTR +S000007135 LTR_retrotransposon YNLCTy2-1 Ty2 chromosome 14 14 567660 562364 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C +S000007132 long_terminal_repeat YNLCdelta6 chromosome 14 14 567992 567660 C 2011-02-03 2000-05-19 Ty2 LTR +S000006686 tRNA_gene tP(UGG)N2 chromosome 14 L000003692 14 568115 568217 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin +S000030974 intron tP(UGG)N2 14 568151 568181 W 2011-02-03 2000-05-19 +S000030972 noncoding_exon tP(UGG)N2 14 568115 568150 W 2011-02-03 2000-05-19 +S000030973 noncoding_exon tP(UGG)N2 14 568182 568217 W 2011-02-03 2000-05-19 +S000130143 ARS ARS1423 chromosome 14 14 568219 568524 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004980 ORF Verified YNL035C chromosome 14 14 569691 568522 C 2011-02-03 1997-01-28 Nuclear protein of unknown function; relocalizes to the cytosol in response to hypoxia; contains WD-40 domains; not an essential gene; protein abundance increases in response to DNA replication stress +S000031007 CDS YNL035C 14 569691 568522 C 2011-02-03 1997-01-28 +S000006609 tRNA_gene tI(AAU)N1 chromosome 14 L000003697 14 569940 569867 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000034901 noncoding_exon tI(AAU)N1 14 569940 569867 C 2011-02-03 2000-05-19 +S000004979 ORF Uncharacterized YNL034W chromosome 14 14 570477 572315 W 2011-02-03 1997-01-28 Putative protein of unknown function; not an essential gene; YNL034W has a paralog, YNL018C, that arose from a segmental duplication +S000030964 CDS YNL034W 14 570477 572315 W 2011-02-03 1997-01-28 +S000004978 ORF Uncharacterized YNL033W chromosome 14 14 572999 573853 W 2011-02-03 1997-01-28 Putative protein of unknown function; YNL033W has a paralog, YNL019C, that arose from a segmental duplication +S000030908 CDS YNL033W 14 572999 573853 W 2011-02-03 1997-01-28 +S000004977 ORF Verified YNL032W SIW14 putative tyrosine protein phosphatase SIW14|OCA3 chromosome 14 L000004216 14 574506 575351 W 2011-02-03 1997-01-28 Tyrosine phosphatase involved in actin organization and endocytosis; localized to the cytoplasm +S000030820 CDS YNL032W 14 574506 575351 W 2011-02-03 1997-01-28 +S000004976 ORF Verified YNL031C HHT2 histone H3 chromosome 14 L000000773 14 576050 575640 C 2011-02-03 1997-01-28 Histone H3; core histone protein required for chromatin assembly, part of heterochromatin-mediated telomeric and HM silencing; one of two identical histone H3 proteins (see HHT1); regulated by acetylation, methylation, and phosphorylation; H3K14 acetylation plays an important role in the unfolding of strongly positioned nucleosomes during repair of UV damage +S000037842 CDS YNL031C 14 576050 575640 C 2011-02-03 1997-01-28 +S000004975 ORF Verified YNL030W HHF2 histone H4 chromosome 14 L000000771 14 576727 577038 W 2011-02-03 1997-01-28 Histone H4; core histone protein required for chromatin assembly and chromosome function; one of two identical histone proteins (see also HHF1); contributes to telomeric silencing; N-terminal domain involved in maintaining genomic integrity +S000037800 CDS YNL030W 14 576727 577038 W 2011-02-03 1997-01-28 +S000004973 ORF Dubious YNL028W chromosome 14 14 578679 578996 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036923 CDS YNL028W 14 578679 578996 W 2011-02-03 1997-01-28 +S000004974 ORF Verified YNL029C KTR5 putative mannosyltransferase chromosome 14 L000004099 14 578773 577205 C 2011-02-03 1997-01-28 Putative mannosyltransferase involved in protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; KTR5 has a paralog, KTR7, that arose from the whole genome duplication +S000036950 CDS YNL029C 14 578773 577205 C 2011-02-03 1997-01-28 +S000004972 ORF Verified YNL027W CRZ1 DNA-binding transcription factor CRZ1|TCN1|HAL8 chromosome 14 L000004202 14 579580 581616 W 2011-02-03 1997-01-28 Transcription factor, activates transcription of stress response genes; nuclear localization is positively regulated by calcineurin-mediated dephosphorylation; rapidly localizes to the nucleus under blue light stress; can be activated in stochastic pulses of nuclear localization in response to calcium +S000036172 CDS YNL027W 14 579580 581616 W 2011-02-03 1997-01-28 +S000004971 ORF Verified YNL026W SAM50 SAM complex subunit SAM50|TOB55|OMP85 chromosome 14 14 581920 583374 W 2011-02-03 1997-01-28 Component of the Sorting and Assembly Machinery (SAM) complex; the SAM (or TOB) complex is located in the mitochondrial outer membrane; the complex binds precursors of beta-barrel proteins and facilitates their outer membrane insertion; homologous to bacterial Omp85 +S000035990 CDS YNL026W 14 581920 583374 W 2011-02-03 1997-01-28 +S000004970 ORF Verified YNL025C SSN8 cyclin-dependent protein serine/threonine kinase regulator SSN8|CNC1|CycC|RYE2|UME3|SRB11|NUT9|GIG3 chromosome 14 L000002796 14 585291 584320 C 2011-02-03 1997-01-28 Cyclin-like component of the RNA polymerase II holoenzyme; involved in phosphorylation of the RNA polymerase II C-terminal domain; forms a kinase-cyclin pair in the RNAPII holoenzyme with Ssn3p; required for both entry into and execution of the meiotic program; involved in glucose repression and telomere maintenance; cyclin homolog 35% identical to human cyclin C +S000034989 CDS YNL025C 14 585291 584320 C 2011-02-03 1997-01-28 +S000007436 snoRNA_gene NME1 NME1 RRP2 chromosome 14 L000001258 14 585587 585926 W 2011-02-03 2000-05-19 RNA component of RNase MRP; RNase MRP cleaves pre-rRNA and has a role in cell cycle-regulated degradation of daughter cell-specific mRNAs; human ortholog is implicated in cartilage-hair hypoplasia (CHH) +S000032302 noncoding_exon NME1 14 585587 585926 W 2011-02-03 2000-05-19 +S000006457 snoRNA_gene snR66 SNR66 chromosome 14 L000004535 14 586090 586175 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2417 +S000030852 noncoding_exon snR66 14 586090 586175 W 2011-02-03 2000-05-19 +S000028698 ORF Verified YNL024C-A KSH1 chromosome 14 14 586820 586602 C 2011-02-03 2003-07-29 Essential protein suggested to function early in the secretory pathway; inviability is suppressed by overexpression of Golgi protein Tvp23p; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and cytosol respectively; ortholog of human Kish +S000032608 CDS YNL024C-A 14 586820 586602 C 2011-02-03 2003-07-29 +S000004969 ORF Uncharacterized YNL024C EFM6 putative protein-lysine N-methyltransferase chromosome 14 14 587847 587107 C 2011-02-03 1997-01-28 Putative S-adenosylmethionine-dependent lysine methyltransferase; responsible for modifying Lys-390 in translational elongation factor EF-1 alpha (eEF1A); has seven beta-strand methyltransferase motif; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000034856 CDS YNL024C 14 587847 587107 C 2011-02-03 1997-01-28 +S000004968 ORF Verified YNL023C FAP1 chromosome 14 L000004577 14 591160 588263 C 2011-02-03 1997-01-28 Protein that binds to Fpr1p; confers rapamycin resistance by competing with rapamycin for Fpr1p binding; accumulates in the nucleus upon treatment of cells with rapamycin; has similarity to D. melanogaster shuttle craft and human NFX1 +S000034736 CDS YNL023C 14 591160 588263 C 2011-02-03 1997-01-28 +S000004967 ORF Verified YNL022C RCM1 rRNA (cytosine-C5-)-methyltransferase RCM1 chromosome 14 14 592899 591427 C 2011-02-03 1997-01-28 rRNA m5C methyltransferase; methylates cytosine at position 2278 of 25S rRNA while Nop2p methylates cytosine at position 2870; contains seven beta-strand methyltransferase motif; localized to the nucleolus; interacts with Trm112p; homolog of NSUN5A, a human gene which is deleted in Williams-Beuren Syndrome +S000033831 CDS YNL022C 14 592899 591427 C 2011-02-03 1997-01-28 +S000004966 ORF Verified YNL021W HDA1 histone deacetylase HDA1 chromosome 14 L000004088 14 593227 595347 W 2011-02-03 1997-01-28 Putative catalytic subunit of a class II histone deacetylase complex; role in azole resistance via Hsp90p, and in the heat shock response; Hda1p interacts with the Hda2p-Hda3p subcomplex to form an active tetramer; deletion increases histone H2B, H3 and H4 acetylation; other members of the HDA1 histone deacetylase complex are Hda2p and Hda3p +S000033782 CDS YNL021W 14 593227 595347 W 2011-02-03 1997-01-28 +S000004965 ORF Verified YNL020C ARK1 serine/threonine protein kinase ARK1 chromosome 14 L000004430 14 597539 595623 C 2011-02-03 1997-01-28 Serine/threonine protein kinase; involved in regulation of the cortical actin cytoskeleton; involved in control of endocytosis; ARK1 has a paralog, PRK1, that arose from the whole genome duplication +S000033598 CDS YNL020C 14 597539 595623 C 2011-02-03 1997-01-28 +S000004964 ORF Uncharacterized YNL019C chromosome 14 14 599230 598376 C 2011-02-03 1997-01-28 Putative protein of unknown function; expression induced during heat stress; YNL019C has a paralog, YNL033W, that arose from a segmental duplication +S000032941 CDS YNL019C 14 599230 598376 C 2011-02-03 1997-01-28 +S000004963 ORF Uncharacterized YNL018C chromosome 14 14 601774 599936 C 2011-02-03 1997-01-28 Putative protein of unknown function; YNL018C has a paralog, YNL034W, that arose from a segmental duplication +S000032852 CDS YNL018C 14 601774 599936 C 2011-02-03 1997-01-28 +S000006610 tRNA_gene tI(AAU)N2 chromosome 14 L000003693 14 602312 602385 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000034903 noncoding_exon tI(AAU)N2 14 602312 602385 W 2011-02-03 2000-05-19 +S000004962 ORF Dubious YNL017C chromosome 14 14 602476 602138 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the tRNA ORF tI(AAU)N2 +S000031913 CDS YNL017C 14 602476 602138 C 2011-02-03 1997-01-28 +S000004961 ORF Verified YNL016W PUB1 RNP1 chromosome 14 L000001529 14 602907 604268 W 2011-02-03 1997-01-28 Poly (A)+ RNA-binding protein; abundant mRNP-component protein that binds mRNA and is required for stability of many mRNAs; component of glucose deprivation induced stress granules, involved in P-body-dependent granule assembly; implicated in regulation of translation; carries Q/N-rich domain at C- terminus, identified as candidate prion; human homolog Tia1 is critical for normal synaptic plasticity; protein abundance increases in response to DNA replication stress +S000031862 CDS YNL016W 14 602907 604268 W 2011-02-03 1997-01-28 +S000004960 ORF Verified YNL015W PBI2 IB2|I2B|LMA1 chromosome 14 L000001344 14 605384 605611 W 2011-02-03 1997-01-28 Cytosolic inhibitor of vacuolar proteinase B (PRB1); required for efficient vacuole inheritance; with thioredoxin forms protein complex LMA1, which assists in priming SNARE molecules and promotes vacuole fusion; protein abundance increases in response to DNA replication stress +S000031753 CDS YNL015W 14 605384 605611 W 2011-02-03 1997-01-28 +S000004959 ORF Verified YNL014W HEF3 translation elongation factor EF-3|ZRG7 chromosome 14 14 606319 609453 W 2011-02-03 1997-01-28 Translational elongation factor EF-3; member of the ABC superfamily; stimulates EF-1 alpha-dependent binding of aminoacyl-tRNA by the ribosome; normally expressed in zinc deficient cells; HEF3 has a paralog, YEF3, that arose from the whole genome duplication +S000031664 CDS YNL014W 14 606319 609453 W 2011-02-03 1997-01-28 +S000004958 ORF Dubious YNL013C chromosome 14 14 609510 609133 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF HEF3/YNL014W +S000031500 CDS YNL013C 14 609510 609133 C 2011-02-03 1997-01-28 +S000118391 ARS ARS1424 ARSXIV-610 chromosome 14 14 609520 609607 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178175 ARS_consensus_sequence ARS1424 14 609532 609548 W 2014-11-18 2014-11-18 +S000004957 ORF Verified YNL012W SPO1 putative carboxylic ester hydrolase chromosome 14 L000001999 14 609686 611665 W -1 2011-02-03 2000-07-14|1997-01-28 Meiosis-specific prospore protein; required for meiotic spindle pole body duplication and separation; required to produce bending force necessary for proper prospore membrane assembly during sporulation; has similarity to phospholipase B +S000030704 CDS YNL012W 14 609686 609790 W 2011-02-03 2000-07-14 +S000030705 CDS YNL012W 14 609875 611665 W 2011-02-03 2000-07-14|1997-01-28 +S000030706 intron YNL012W 14 609791 609874 W 2011-02-03 2000-07-14 +S000004956 ORF Uncharacterized YNL011C chromosome 14 14 613170 611836 C 2011-02-03 1997-01-28 Putative protein of unknown function; YNL011C is not an essential gene +S000030538 CDS YNL011C 14 613170 611836 C 2011-02-03 1997-01-28 +S000004955 ORF Uncharacterized YNL010W putative phosphoric monoester hydrolase chromosome 14 14 613635 614360 W 2011-02-03 1997-01-28 Putative protein of unknown function; similar to phosphoserine phosphatases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; homozygous diploid mutant shows an increase in glycogen accumulation +S000030490 CDS YNL010W 14 613635 614360 W 2011-02-03 1997-01-28 +S000004954 ORF Verified YNL009W IDP3 isocitrate dehydrogenase (NADP(+)) IDP3 chromosome 14 L000003946 14 614821 616083 W 2011-02-03 1997-01-28 Peroxisomal NADP-dependent isocitrate dehydrogenase; catalyzes oxidation of isocitrate to alpha-ketoglutarate with the formation of NADP(H+), required for growth on unsaturated fatty acids; IDP3 has a paralog, IDP2, that arose from the whole genome duplication +S000037693 CDS YNL009W 14 614821 616083 W 2011-02-03 1997-01-28 +S000130144 ARS ARS1425 chromosome 14 14 616311 617125 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000004953 ORF Verified YNL008C ASI3 putative ubiquitin-protein ligase ASI3 chromosome 14 14 618241 616211 C 2011-02-03 1997-01-28|2011-02-03 Subunit of the inner nuclear membrane Asi ubiquitin ligase complex; Asi complex targets both misfolded proteins of the inner nuclear membrane-associated degradation (INMAD) pathway and regulators of sterol biosynthesis for ubiquitin-mediated degradation; acts with Asi1p and Asi2p to ensure the fidelity of SPS-sensor signaling by targeting latent unprocessed forms of Stp1p and Stp2p, maintaining the repressed state of gene expression in the absence of inducing amino acids +S000037593 CDS YNL008C 14 618241 616211 C 2011-02-03 1997-01-28|2011-02-03 +S000004952 ORF Verified YNL007C SIS1 type II HSP40 co-chaperone SIS1 chromosome 14 L000001898 14 619565 618507 C 3 2011-02-03 1997-01-28 Type II HSP40 co-chaperone that interacts with the HSP70 protein Ssa1p; shuttles between cytosol and nucleus; mediates delivery of misfolded proteins into the nucleus for degradation; involved in proteasomal degradation of misfolded cytosolic proteins; protein abundance increases in response to DNA replication stress; polyQ aggregates sequester Sis1p and interfere with clearance of misfolded proteins; similar to bacterial DnaJ proteins and mammalian DnaJB1 +S000036851 CDS YNL007C 14 619565 618507 C 2011-02-03 1997-01-28 +S000004951 ORF Verified YNL006W LST8 TOR complex subunit LST8 chromosome 14 L000004356 14 620067 620978 W 2011-02-03 1997-01-28 Protein required for the transport of Gap1p; required for the transport of amino acid permease Gap1p from the Golgi to the cell surface; component of the TOR signaling pathway; associates with both Tor1p and Tor2p; contains a WD-repeat +S000036826 CDS YNL006W 14 620067 620978 W 2011-02-03 1997-01-28 +S000004950 ORF Verified YNL005C MRP7 mitochondrial 54S ribosomal protein YmL2|YmL2|MRPL2 chromosome 14 L000002682|S000029309|L000001155|L000003239 14 622428 621313 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit +S000036741 CDS YNL005C 14 622428 621313 C 2011-02-03 1997-01-28 +S000004949 ORF Verified YNL004W HRB1 mRNA-binding protein|TOM34 chromosome 14 L000002318 14 622915 624621 W 2011-02-03 1997-01-28|2007-07-09 Poly(A+) RNA-binding protein; key surveillance factor for the selective export of spliced mRNAs from the nucleus to the cytoplasm; preference for intron-containing genes; similar to Npl3p; HRB1 has a paralog, GBP2, that arose from the whole genome duplication +S000036718 CDS YNL004W 14 622915 622944 W 2011-02-03 1997-01-28|2007-07-09 +S000123273 CDS YNL004W 14 623287 624621 W 2011-02-03 2007-07-09 +S000123272 intron YNL004W 14 622945 623286 W 2011-02-03 2007-07-09 +S000004948 ORF Verified YNL003C PET8 SAM5 chromosome 14 L000001385 14 625829 624975 C 3 2011-02-03 1997-01-28 S-adenosylmethionine transporter of the mitochondrial inner membrane; member of the mitochondrial carrier family; required for biotin biosynthesis and respiratory growth +S000035777 CDS YNL003C 14 625829 624975 C 2011-02-03 1997-01-28 +S000004947 ORF Verified YNL002C RLP7 RPL7 chromosome 14 L000001647 14 627142 626174 C 2011-02-03 1997-01-28 Nucleolar protein similar to large ribosomal subunit L7 proteins; constituent of 66S pre-ribosomal particles; plays an essential role in processing of precursors to the large ribosomal subunit RNAs; binds junction of ITS2 and ITS2-proximal stem between the 3' end of 5.8S rRNA and the 5' end of 25S rRNA +S000035659 CDS YNL002C 14 627142 626174 C 2011-02-03 1997-01-28 +S000004946 ORF Verified YNL001W DOM34 ribosome dissociation factor DOM34 chromosome 14 L000000517 14 627456 628616 W 2011-02-03 1997-01-28 Protein that facilitates ribosomal subunit dissociation; Dom34-Hbs1 complex and Rli1p have roles in dissociating inactive ribosomes to facilitate translation restart, particularly ribosomes stalled in 3' UTRs; required for RNA cleavage in no-go decay, but reports conflict on endonuclease activity; Pelota ortholog; protein abundance increases in response to DNA replication stress; DOM34 has a paralog, YCL001W-B, that arose from the whole genome duplication +S000035621 CDS YNL001W 14 627456 628616 W 2011-02-03 1997-01-28 +S000006475 centromere CEN14 CEN14 chromosome 14 L000000307 14 628758 628875 W 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XIV centromere +S000077302 centromere_DNA_Element_I CEN14 14 628758 628767 W 2011-02-03 2004-10-08 +S000077303 centromere_DNA_Element_II CEN14 14 628768 628850 W 2011-02-03 2004-10-08 +S000077304 centromere_DNA_Element_III CEN14 14 628851 628875 W 2011-02-03 2004-10-08 +S000005284 ORF Verified YNR001C CIT1 citrate (Si)-synthase CIT1|LYS6|CS1 chromosome 14 L000000341 14 631061 629622 C 2011-02-03 1997-01-28 Citrate synthase; catalyzes the condensation of acetyl coenzyme A and oxaloacetate to form citrate; the rate-limiting enzyme of the TCA cycle; nuclear encoded mitochondrial protein; CIT1 has a paralog, CIT2, that arose from the whole genome duplication +S000031441 CDS YNR001C 14 631061 629622 C 2011-02-03 1997-01-28 +S000007625 ORF Dubious YNR001W-A chromosome 14 14 631263 631481 W 2011-02-03 2001-02-26 Dubious open reading frame unlikely to encode a functional protein; identified by homology +S000037252 CDS YNR001W-A 14 631263 631481 W 2011-02-03 2001-02-26 +S000006679 tRNA_gene tP(AGG)N SUF10 chromosome 14 L000002158|L000003696 14 631917 631846 C -3 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in proline codons +S000033281 noncoding_exon tP(AGG)N 14 631917 631846 C 2011-02-03 2000-05-19 +S000007143 long_terminal_repeat YNRCdelta7 chromosome 14 14 632114 631998 C 2011-02-03 2000-05-19 Ty1 LTR +S000007146 long_terminal_repeat YNRCtau3 chromosome 14 14 632489 632119 C 2011-02-03 2000-05-19 Ty4 LTR +S000006674 tRNA_gene tN(GUU)N2 chromosome 14 L000003694 14 632599 632672 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000035574 noncoding_exon tN(GUU)N2 14 632599 632672 W 2011-02-03 2000-05-19 +S000005285 ORF Verified YNR002C ATO2 putative ammonium permease ATO2|FUN34 chromosome 14 L000000647 14 633856 633008 C 2011-02-03 1997-01-28 Putative transmembrane protein involved in export of ammonia; ammonia is a starvation signal that promotes cell death in aging colonies; phosphorylated in mitochondria; member of the TC 9.B.33 YaaH family; homolog of Y. lipolytica Gpr1p; ATO2 has a paralog, ADY2, that arose from the whole genome duplication +S000031565 CDS YNR002C 14 633856 633008 C 2011-02-03 1997-01-28 +S000028705 ORF Dubious YNR003W-A chromosome 14 14 634420 634518 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene RPC34/YNR003C +S000032645 CDS YNR003W-A 14 634420 634518 W 2011-02-03 2003-07-29 +S000005286 ORF Verified YNR003C RPC34 DNA-directed RNA polymerase III subunit C34|C34 chromosome 14 L000001689 14 635297 634344 C 3 2011-02-03 1997-01-28 RNA polymerase III subunit C34; interacts with TFIIIB70 and is a key determinant in pol III recruitment by the preinitiation complex +S000031697 CDS YNR003C 14 635297 634344 C 2011-02-03 1997-01-28 +S000118392 ARS ARS1426 ARSXIV-636 chromosome 14 14 635664 635904 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178176 ARS_consensus_sequence ARS1426 14 635831 635815 C 2014-11-18 2014-11-18 +S000005287 ORF Verified YNR004W SWM2 chromosome 14 14 635943 636383 W 2011-02-03 1997-01-28 Protein with a role in snRNA and snoRNA cap trimethylation; interacts with Tgs1p and shows similar phenotypes; required for trimethylation of the caps of spliceosomal snRNAs and the U3 snoRNA, and for efficient 3' end processing of U3 snoRNA; may act as a specificity factor for Tgs1p +S000032703 CDS YNR004W 14 635943 636383 W 2011-02-03 1997-01-28 +S000005289 ORF Verified YNR006W VPS27 ESCRT-0 subunit protein VPS27|DID7|VPT27|VPL23|SSV17|GRD11 chromosome 14 L000002790 14 636986 638854 W 2011-02-03 1997-01-28 Endosomal protein that forms a complex with Hse1p; required for recycling Golgi proteins, forming lumenal membranes and sorting ubiquitinated proteins destined for degradation; has Ubiquitin Interaction Motifs which bind ubiquitin (Ubi4p) +S000032897 CDS YNR006W 14 636986 638854 W 2011-02-03 1997-01-28 +S000005288 ORF Dubious YNR005C chromosome 14 14 637335 636931 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032733 CDS YNR005C 14 637335 636931 C 2011-02-03 1997-01-28 +S000005290 ORF Verified YNR007C ATG3 AUT1|APG3 chromosome 14 L000004056|L000004783 14 640114 639182 C 2011-02-03 1997-01-28 E2-like enzyme; involved in autophagy and cytoplasm-to-vacuole targeting (Cvt) pathway; plays a role in formation of Atg8p-phosphatidylethanolamine conjugates, which are involved in membrane dynamics during autophagy and Cvt; interaction with Atg8p regulated by acetylation by NuA4 histone acetyltransferase Esa1p while attenuation of Atg3 acetylation is mediated by histone deacetylase Rpd3p; Atg12p-Atg5p conjugate enhances E2 activity of Atg3p by rearranging its catalytic site +S000034825 CDS YNR007C 14 640114 639182 C 2011-02-03 1997-01-28 +S000005291 ORF Verified YNR008W LRO1 phospholipid:diacylglycerol acyltransferase chromosome 14 S000007453 14 640396 642381 W 2011-02-03 1997-01-28 Acyltransferase that catalyzes diacylglycerol esterification; one of several acyltransferases that contribute to triglyceride synthesis; Lro1p and Dga1p can O-acylate ceramides; putative homolog of human lecithin cholesterol acyltransferase +S000035018 CDS YNR008W 14 640396 642381 W 2011-02-03 1997-01-28 +S000005292 ORF Verified YNR009W NRM1 chromosome 14 S000080164 14 642690 643439 W 2011-02-03 1997-01-28 Transcriptional co-repressor of MBF-regulated gene expression; Nrm1p associates stably with promoters via MCB binding factor (MBF) to repress transcription upon exit from G1 phase +S000035110 CDS YNR009W 14 642690 643439 W 2011-02-03 1997-01-28 +S000005293 ORF Verified YNR010W CSE2 MED9 chromosome 14 L000000426 14 643744 644193 W 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; component of the Middle domain of mediator; required for regulation of RNA polymerase II activity; relocalizes to the cytosol in response to hypoxia +S000034052 CDS YNR010W 14 643744 644193 W 2011-02-03 1997-01-28 +S000005294 ORF Verified YNR011C PRP2 DEAH-box RNA-dependent ATPase PRP2|RNA2 chromosome 14 L000001495 14 646950 644320 C 8 2011-02-03 1997-01-28 RNA-dependent DExD/H-box ATPase; required for activation of spliceosome before first transesterification step in RNA splicing; implicated in rearranging and proofreading snRNA structure in catalytic activation of spliceosome; ortholog of human protein DHX16 +S000034087 CDS YNR011C 14 646950 644320 C 2011-02-03 1997-01-28 +S000005295 ORF Verified YNR012W URK1 uridine kinase URK1 chromosome 14 L000002440 14 647432 648937 W 2011-02-03 1997-01-28 Uridine/cytidine kinase; component of the pyrimidine ribonucleotide salvage pathway that converts uridine into UMP and cytidine into CMP; involved in the pyrimidine deoxyribonucleotide salvage pathway, converting deoxycytidine into dCMP +S000035092 CDS YNR012W 14 647432 648937 W 2011-02-03 1997-01-28 +S000005296 ORF Verified YNR013C PHO91 chromosome 14 14 651712 649028 C 2011-02-03 1997-01-28 Low-affinity vacuolar phosphate transporter; exports phosphate from the vacuolar lumen to the cytosol; regulates phosphate and polyphosphate metabolism; acts upstream of Pho81p in regulation of the PHO pathway; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs); deletion of pho84, pho87, pho89, pho90, and pho91 causes synthetic lethality; transcription independent of Pi and Pho4p activity; overexpression results in vigorous growth +S000035190 CDS YNR013C 14 651712 649028 C 2011-02-03 1997-01-28 +S000005297 ORF Uncharacterized YNR014W chromosome 14 14 652465 653103 W 2011-02-03 1997-01-28 Putative protein of unknown function; expression is cell-cycle regulated, Azf1p-dependent, and heat-inducible; YNR014W has a paralog, YMR206W, that arose from the whole genome duplication +S000036187 CDS YNR014W 14 652465 653103 W 2011-02-03 1997-01-28 +S000005298 ORF Verified YNR015W SMM1 DUS2 chromosome 14 L000003407 14 653387 654541 W 2011-02-03 1997-01-28 Dihydrouridine synthase; member of a family of dihydrouridine synthases including Dus1p, Smm1p, Dus3p, and Dus4p; modifies uridine residues at position 20 of cytoplasmic tRNAs +S000036301 CDS YNR015W 14 653387 654541 W 2011-02-03 1997-01-28 +S000005299 ORF Verified YNR016C ACC1 acetyl-CoA carboxylase ACC1|MTR7|FAS3|ABP2 chromosome 14 L000000017|L000000014|L000000603 14 661374 654673 C 2011-02-03 1997-01-28 Acetyl-CoA carboxylase, biotin containing enzyme; catalyzes carboxylation of cytosolic acetyl-CoA to form malonyl-CoA and regulates histone acetylation by regulating the availablity of acetyl-CoA; required for de novo biosynthesis of long-chain fatty acids; ACC1 has a paralog, HFA1, that arose from the whole genome duplication +S000036342 CDS YNR016C 14 661374 654673 C 2011-02-03 1997-01-28 +S000005300 ORF Verified YNR017W TIM23 protein transporter TIM23|MAS6|MPI3|MIM23 chromosome 14 L000001140|L000001028 14 662913 663581 W 2011-02-03 1997-01-28 Essential component of the TIM23 complex; involved in protein import into mitochondrial matrix and inner membrane; with Tim17p, contributes to architecture and function of the import channel; TIM23 complex is short for the translocase of the inner mitochondrial membrane +S000036476 CDS YNR017W 14 662913 663581 W 2011-02-03 1997-01-28 +S000005301 ORF Verified YNR018W RCF2 AIM38 chromosome 14 14 664270 664944 W 2011-02-03 1997-01-28 Cytochrome c oxidase subunit; has a role in assembly of respiratory supercomplexes; similar to Rcf1p, and either Rcf1p or Rcf2p is required for late-stage assembly of the Cox12p and Cox13p subunits and for cytochrome c oxidase activity; associates with the cytochrome c oxidase - cytochrome bc1 supercomplex; null mutant accumulates reactive oxygen species; member of the conserved hypoxia induced gene family; C. elegans homolog is functional in yeast +S000037162 CDS YNR018W 14 664270 664944 W 2011-02-03 1997-01-28 +S000005302 ORF Verified YNR019W ARE2 sterol acyltransferase|SAT1 chromosome 14 L000003220|L000002769 14 665339 667267 W 2011-02-03 1997-01-28 Acyl-CoA:sterol acyltransferase; endoplasmic reticulum enzyme that contributes the major sterol esterification activity in the presence of oxygen; ARE2 has a paralog, ARE1, that arose from the whole genome duplication +S000037242 CDS YNR019W 14 665339 667267 W 2011-02-03 1997-01-28 +S000005303 ORF Verified YNR020C ATP23 putative metalloprotease chromosome 14 14 668222 667410 C 2011-02-03 1997-01-28 Putative metalloprotease of the mitochondrial inner membrane; required for processing of Atp6p; has an additional role in assembly of the F0 sector of the F1F0 ATP synthase complex; substrate of the Mia40p-Erv1p disulfide relay system, and folding is assisted by Mia40p +S000030232 CDS YNR020C 14 668222 667410 C 2011-02-03 1997-01-28 +S000005304 ORF Uncharacterized YNR021W chromosome 14 14 668377 669591 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YNR021W is not an essential gene +S000031253 CDS YNR021W 14 668377 669591 W 2011-02-03 1997-01-28 +S000005305 ORF Verified YNR022C MRPL50 mitochondrial 54S ribosomal protein MRPL50 chromosome 14 14 670193 669774 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; not essential for mitochondrial translation +S000031291 CDS YNR022C 14 670193 669774 C 2011-02-03 1997-01-28 +S000005306 ORF Verified YNR023W SNF12 SWP73 chromosome 14 L000003408 14 670418 672118 W 2011-02-03 1997-01-28 73 kDa subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; relocates to the cytosol under hypoxic conditions; deletion mutants are temperature-sensitive; SNF12 has a paralog, RSC6, that arose from the whole genome duplication +S000032359 CDS YNR023W 14 670418 672118 W 2011-02-03 1997-01-28 +S000005307 ORF Verified YNR024W MPP6 chromosome 14 14 672409 672969 W 2011-02-03 1997-01-28 Nuclear exosome-associated RNA binding protein; involved in surveillance of pre-rRNAs and pre-mRNAs, and the degradation of cryptic non-coding RNAs (ncRNA); copurifies with ribosomes; relocalizes to the cytosol in response to hypoxia +S000032477 CDS YNR024W 14 672409 672969 W 2011-02-03 1997-01-28 +S000005308 ORF Dubious YNR025C chromosome 14 14 673061 672702 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion reduces expression of PIS1 gene encoding phosphatidylinositol synthase +S000032509 CDS YNR025C 14 673061 672702 C 2011-02-03 1997-01-28 +S000005309 ORF Verified YNR026C SEC12 Sar family guanine nucleotide exchange factor SEC12|SED2 chromosome 14 L000001837 14 674689 673274 C 2011-02-03 1997-01-28 Guanine nucleotide exchange factor (GEF); activates Sar1p by catalyzing the exchange of GDP for GTP; required for the initiation of COPII vesicle formation in ER to Golgi transport; glycosylated integral membrane protein of the ER; SEC12 has a paralog, SED4, that arose from the whole genome duplication +S000032620 CDS YNR026C 14 674689 673274 C 2011-02-03 1997-01-28 +S000005310 ORF Verified YNR027W BUD17 putative pyridoxal kinase BUD17 chromosome 14 14 674923 675876 W 2011-02-03 1997-01-28 Putative pyridoxal kinase; a key enzyme in vitamin B6 metabolism; involved in bud-site selection; diploid mutants display a random rather than a bipolar budding pattern; similarity to yeast BUD16 and human pyridoxal kinase (PDXK) +S000033356 CDS YNR027W 14 674923 675876 W 2011-02-03 1997-01-28 +S000005311 ORF Verified YNR028W CPR8 peptidylprolyl isomerase family protein CPR8 chromosome 14 L000004349 14 676177 677103 W 2011-02-03 1997-01-28 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; potential role in the secretory pathway; CPR8 has a paralog, CPR4, that arose from the whole genome duplication +S000033423 CDS YNR028W 14 676177 677103 W 2011-02-03 1997-01-28 +S000005312 ORF Uncharacterized YNR029C chromosome 14 14 678488 677199 C 2011-02-03 1997-01-28 Putative protein of unknown function; deletion confers reduced fitness in saline +S000033458 CDS YNR029C 14 678488 677199 C 2011-02-03 1997-01-28 +S000005313 ORF Verified YNR030W ALG12 dolichyl-P-Man:Man(7)GlcNAc(2)-PP-dolichol alpha-1,6-mannosyltransferase|ECM39 chromosome 14 L000003906 14 678799 680454 W 2011-02-03 1997-01-28 Alpha-1,6-mannosyltransferase localized to the ER; responsible for addition of alpha-1,6 mannose to dolichol-linked Man7GlcNAc2; acts in the dolichol pathway for N-glycosylation; human homolog ALG12 complements yeast null mutant +S000034448 CDS YNR030W 14 678799 680454 W 2011-02-03 1997-01-28 +S000005314 ORF Verified YNR031C SSK2 mitogen-activated protein kinase kinase kinase SSK2 chromosome 14 L000002826 14 685433 680694 C 2011-02-03 1997-01-28 MAP kinase kinase kinase of HOG1 mitogen-activated signaling pathway; interacts with Ssk1p, leading to autophosphorylation and activation of Ssk2p which phosphorylates Pbs2p; also mediates actin cytoskeleton recovery from osmotic stress; a HOG-independent function of Ssk2p mediates the calcium-sensitive phenotype of the ptp2 msg5 double disruptant; SSK2 has a paralog, SSK22, that arose from the whole genome duplication +S000034513 CDS YNR031C 14 685433 680694 C 2011-02-03 1997-01-28 +S000005315 ORF Verified YNR032W PPG1 putative serine/threonine-protein kinase PPG1 chromosome 14 L000001470 14 686010 687116 W 2011-02-03 1997-01-28 Putative serine/threonine protein phosphatase; putative phosphatase of the type 2A-like phosphatase family, required for glycogen accumulation; interacts with Tap42p, which binds to and regulates other protein phosphatases +S000035579 CDS YNR032W 14 686010 687116 W 2011-02-03 1997-01-28 +S000007251 ORF Verified YNR032C-A HUB1 ubiquitin-like protein HUB1 chromosome 14 14 687464 687243 C 2011-02-03 1999-07-17 Ubiquitin-like protein modifier; promotes alternative splicing of SRC1 pre-mRNA; binds non-covalently to the HIND domain of Snu66, may function in modification of Sph1p and Hbt1p, functionally complemented by the human or S. pombe ortholog; mechanism of Hub1p adduct formation not yet clear +S000030977 CDS YNR032C-A 14 687464 687243 C 2011-02-03 1999-07-17 +S000005316 ORF Verified YNR033W ABZ1 4-amino-4-deoxychorismate synthase chromosome 14 L000000015 14 687635 689998 W 2011-02-03 1997-01-28 Para-aminobenzoate (PABA) synthase; has similarity to Escherichia coli PABA synthase components PabA and PabB; required for the synthesis of para-aminobenzoic acid, an important intermediate for folate and ubiquinone Q biosynthesis; protein abundance increases in response to DNA replication stress +S000035655 CDS YNR033W 14 687635 689998 W 2011-02-03 1997-01-28 +S000005317 ORF Verified YNR034W SOL1 chromosome 14 L000003102 14 690321 691286 W 2011-02-03 1997-01-28 Protein with a possible role in tRNA export; shows similarity to 6-phosphogluconolactonase non-catalytic domains but does not exhibit this enzymatic activity; homologous to Sol3p and Sol4p; SOL1 has a paralog, SOL2, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000035772 CDS YNR034W 14 690321 691286 W 2011-02-03 1997-01-28 +S000118393 ARS ARS1427 ARSXIV-692 chromosome 14 14 691486 691730 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178177 ARS_consensus_sequence ARS1427 14 691678 691662 C 2014-11-18 2014-11-18 +S000007525 ORF Verified YNR034W-A EGO4 chromosome 14 14 692561 692857 W 2011-02-03 2000-07-14 Protein of unknown function; expression is regulated by Msn2p/Msn4p; YNR034W-A has a paralog, YCR075W-A, that arose from the whole genome duplication +S000037062 CDS YNR034W-A 14 692561 692857 W 2011-02-03 2000-07-14 +S000005318 ORF Verified YNR035C ARC35 END9 chromosome 14 L000004558|L000004035 14 694047 693019 C 2011-02-03 1997-01-28 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches; required for cortical localization of calmodulin +S000036635 CDS YNR035C 14 694047 693019 C 2011-02-03 1997-01-28 +S000005319 ORF Verified YNR036C MRPS12 putative mitochondrial 37S ribosomal protein MRPS12 chromosome 14 14 694822 694361 C 2011-02-03 1997-01-28 Mitochondrial protein; may interact with ribosomes based on co-purification experiments; similar to E. coli and human mitochondrial S12 ribosomal proteins +S000036702 CDS YNR036C 14 694822 694361 C 2011-02-03 1997-01-28 +S000005320 ORF Verified YNR037C RSM19 mitochondrial 37S ribosomal protein RSM19 chromosome 14 14 695327 695052 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S19 ribosomal protein +S000036762 CDS YNR037C 14 695327 695052 C 2011-02-03 1997-01-28 +S000005321 ORF Verified YNR038W DBP6 putative ATP-dependent RNA helicase DBP6 chromosome 14 L000003940 14 695595 697484 W 2011-02-03 1997-01-28 Essential protein involved in ribosome biogenesis; putative ATP-dependent RNA helicase of the DEAD-box protein family; human homolog DDX51 complements yeast dbp6 mutant +S000036850 CDS YNR038W 14 695595 697484 W 2011-02-03 1997-01-28 +S000005322 ORF Verified YNR039C ZRG17 Zn(2+) transporter ZRG17 chromosome 14 S000007519 14 699431 697614 C 2011-02-03 1997-01-28 Endoplasmic reticulum zinc transporter; part of a heterodimeric transporter with Msc2p that transfers zinc from the cytosol to the ER lumen; member of the cation diffusion facilitator family of efflux pumps; zinc-regulated directly through Zap1p; transcription induced under conditions of zinc deficiency +S000036872 CDS YNR039C 14 699431 697614 C 2011-02-03 1997-01-28 +S000005323 ORF Uncharacterized YNR040W chromosome 14 14 699690 700460 W 2011-02-03 1997-01-28 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000037624 CDS YNR040W 14 699690 700460 W 2011-02-03 1997-01-28 +S000005325 ORF Dubious YNR042W chromosome 14 14 701238 701666 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene COQ2 +S000030522 CDS YNR042W 14 701238 701666 W 2011-02-03 1997-01-28 +S000005324 ORF Verified YNR041C COQ2 4-hydroxybenzoate octaprenyltransferase chromosome 14 L000000379 14 701659 700541 C 2011-02-03 1997-01-28 Para hydroxybenzoate polyprenyl transferase; catalyzes the second step in ubiquinone (coenzyme Q) biosynthesis; human COQ2, mutations in which are implicated in an increased risk of mutiple-system atrophy, can complement a yeast coq2 null mutant +S000037655 CDS YNR041C 14 701659 700541 C 2011-02-03 1997-01-28 +S000005326 ORF Verified YNR043W MVD1 diphosphomevalonate decarboxylase MVD1|ERG19 chromosome 14 L000003136 14 701895 703085 W 2011-02-03 1997-01-28 Mevalonate pyrophosphate decarboxylase; essential enzyme involved in the biosynthesis of isoprenoids and sterols, including ergosterol; acts as a homodimer +S000030635 CDS YNR043W 14 701895 703085 W 2011-02-03 1997-01-28 +S000005327 ORF Verified YNR044W AGA1 chromosome 14 L000000061 14 703699 705876 W 42 2011-02-03 1997-01-28 Anchorage subunit of a-agglutinin of a-cells; highly O-glycosylated protein with N-terminal secretion signal and C-terminal signal for addition of GPI anchor to cell wall, linked to adhesion subunit Aga2p via two disulfide bonds; AGA1 has a paralog, FIG2, that arose from the whole genome duplication +S000031496 CDS YNR044W 14 703699 705876 W 2011-02-03 1997-01-28 +S000005328 ORF Verified YNR045W PET494 chromosome 14 L000001402 14 706139 707608 W 42 2011-02-03 1997-01-28 Mitochondrial translational activator specific for the COX3 mRNA; acts together with Pet54p and Pet122p; located in the mitochondrial inner membrane +S000031585 CDS YNR045W 14 706139 707608 W 2011-02-03 1997-01-28 +S000005329 ORF Verified YNR046W TRM112 RNA methylation protein TRM112 chromosome 14 S000079653 14 707788 708195 W 2011-02-03 1997-01-28 Protein involved in methylation of tRNA, rRNA, and translation factors; also involved in ribosome biogenesis; subunit of tRNA methyltransferase (MTase) complexes in combination with Trm9p and Trm11p; N7-methylates G1575 of 18S rRNA as complex with Bud23p; subunit of complex with Mtq2p that methylates Sup45p (eRF1) in the ternary complex eRF1-eRF3-GTP; relative distribution to the nucleus increases upon DNA replication stress; functional homolog of human TRMT112 +S000031700 CDS YNR046W 14 707788 708195 W 2011-02-03 1997-01-28 +S000005330 ORF Verified YNR047W FPK1 serine/threonine protein kinase FPK1 chromosome 14 14 708523 711204 W 2011-02-03 1997-01-28 Ser/Thr protein kinase; phosphorylates several aminophospholipid translocase family members, regulating phospholipid translocation and membrane asymmetry; phosphorylates and inhibits upstream inhibitory kinase, Ypk1p; localizes to the cytoplasm, early endosome/TGN compartments and thplasma membrane; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone; FPK1 has a paralog, KIN82, that arose from the whole genome duplication +S000031803 CDS YNR047W 14 708523 711204 W 2011-02-03 1997-01-28 +S000005331 ORF Verified YNR048W putative aminophospholipid translocase regulatory protein|CRF1 chromosome 14 14 711630 712811 W 2011-02-03 1997-01-28 Potential noncatalytic subunit for phospholipid translocase Dnf3p; YNR048W has a paralog, CDC50, that arose from the whole genome duplication +S000031910 CDS YNR048W 14 711630 712811 W 2011-02-03 1997-01-28 +S000005332 ORF Verified YNR049C MSO1 chromosome 14 L000003070 14 713655 713023 C 2011-02-03 1997-01-28 Lipid-interacting protein in SNARE complex assembly machinery; acts at late step in secretion; interacts with membranes through two distinct binding sites; shows genetic and physical interactions with Sec1p; required for prospore membrane formation during sporulation; N-terminus closely associates with plasma membrane, C-terminus colocalizes with Sec4p on intracellular membranes; relocalizes from bud neck to nucleus upon DNA replication stress +S000032764 CDS YNR049C 14 713655 713023 C 2011-02-03 1997-01-28 +S000005333 ORF Verified YNR050C LYS9 saccharopine dehydrogenase (NADP+, L-glutamate-forming)|LYS13 chromosome 14 L000000969 14 715388 714048 C 44 2011-02-03 1997-01-28 Saccharopine dehydrogenase (NADP+, L-glutamate-forming); catalyzes the formation of saccharopine from alpha-aminoadipate 6-semialdehyde, the seventh step in lysine biosynthesis pathway; exhibits genetic and physical interactions with TRM112 +S000032832 CDS YNR050C 14 715388 714048 C 2011-02-03 1997-01-28 +S000007460 snoRNA_gene snR49 SNR49 chromosome 14 14 716120 716284 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U990 and small subunit (SSU) rRNA at positions U120, U211, and U302 +S000030653 noncoding_exon snR49 14 716120 716284 W 2011-02-03 2000-05-19 +S000005334 ORF Verified YNR051C BRE5 chromosome 14 14 718327 716780 C 2011-02-03 1997-01-28 Ubiquitin protease cofactor; forms deubiquitination complex with Ubp3p that coregulates anterograde and retrograde transport between the endoplasmic reticulum and Golgi compartments; null is sensitive to brefeldin A +S000033539 CDS YNR051C 14 718327 716780 C 2011-02-03 1997-01-28 +S000005335 ORF Verified YNR052C POP2 CCR4-NOT core DEDD family RNase subunit POP2|CAF1 chromosome 14 L000001465 14 720647 719346 C 2011-02-03 1997-01-28 RNase of the DEDD superfamily; subunit of the Ccr4-Not complex that mediates 3' to 5' mRNA deadenylation +S000033632 CDS YNR052C 14 720647 719346 C 2011-02-03 1997-01-28 +S000029463 snoRNA_gene snR191 SNR191 chromosome 14 S000028465 14 722211 721938 C 2011-02-03 2003-12-09 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U2258 and U2260; encoded within the intron of NOG2/YNR053C +S000034351 noncoding_exon snR191 14 722211 721938 C 2011-02-03 2003-12-09 +S000005336 ORF Verified YNR053C NOG2 putative GTPase NOG2|NUG2 chromosome 14 14 723112 721120 C 2011-02-03 1997-01-28|2011-02-03 Putative GTPase; associates with pre-60S ribosomal subunits in the nucleolus and is required for their nuclear export and maturation; recruited by ribosomal proteins L17, L35, and L37 to assembling ribosomes after 27SB pre-rRNA is generated, immediately preceding removal of ITS2 +S000033758 CDS YNR053C 14 721770 721120 C 2011-02-03 1997-01-28 +S000033757 CDS YNR053C 14 723112 722303 C 2011-02-03 1997-01-28 +S000033759 intron YNR053C 14 722302 721771 C 2011-02-03 1997-01-28|2011-02-03 +S000005337 ORF Verified YNR054C ESF2 RNA-binding ATPase activator ESF2|ABT1 chromosome 14 14 724306 723356 C 2011-02-03 1997-01-28 Essential nucleolar protein involved in pre-18S rRNA processing; binds to RNA and stimulates ATPase activity of Dbp8; involved in assembly of the small subunit (SSU) processome +S000034628 CDS YNR054C 14 724306 723356 C 2011-02-03 1997-01-28 +S000006653 tRNA_gene tL(UAA)N chromosome 14 L000003695 14 726217 726134 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000037416 noncoding_exon tL(UAA)N 14 726217 726134 C 2011-02-03 2000-05-19 +S000007147 long_terminal_repeat YNRWsigma4 chromosome 14 14 726234 726574 W 2011-02-03 2000-05-19 Ty3 LTR +S000007144 long_terminal_repeat YNRCdelta8 chromosome 14 14 726945 726614 C 2011-02-03 2000-05-19 Ty1 LTR +S000007145 long_terminal_repeat YNRCdelta9 chromosome 14 14 727661 727363 C 2011-02-03 2000-05-19 Ty1 LTR +S000005338 ORF Verified YNR055C HOL1 chromosome 14 L000000798 14 730186 728426 C 48 2011-02-03 1997-01-28 Putative transporter in the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; mutations in membrane-spanning domains permit cation and histidinol uptake +S000034785 CDS YNR055C 14 730186 728426 C 2011-02-03 1997-01-28 +S000005339 ORF Verified YNR056C BIO5 chromosome 14 L000003530 14 733303 731618 C 2011-02-03 1997-01-28 Putative transmembrane protein involved in the biotin biosynthesis; responsible for uptake of 7-keto 8-aminopelargonic acid; BIO5 is in a cluster of 3 genes (BIO3, BIO4, and BIO5) that mediate biotin synthesis +S000034927 CDS YNR056C 14 733303 731618 C 2011-02-03 1997-01-28 +S000005340 ORF Verified YNR057C BIO4 dethiobiotin synthase chromosome 14 L000003307 14 734069 733356 C 2011-02-03 1997-01-28 Dethiobiotin synthetase; catalyzes the third step in the biotin biosynthesis pathway; BIO4 is in a cluster of 3 genes (BIO3, BIO4, and BIO5) that mediate biotin synthesis; BIO3 and BIO4 were acquired by horizontal gene transfer (HGT) from bacteria; expression appears to be repressed at low iron levels +S000035846 CDS YNR057C 14 734069 733356 C 2011-02-03 1997-01-28 +S000005341 ORF Verified YNR058W BIO3 adenosylmethionine-8-amino-7-oxononanoate transaminase chromosome 14 L000003176 14 734291 735733 W 2011-02-03 1997-01-28 7,8-diamino-pelargonic acid aminotransferase (DAPA); catalyzes the second step in the biotin biosynthesis pathway; BIO3 is in a cluster of 3 genes (BIO3, BIO4, and BIO5) that mediate biotin synthesis; BIO3 and BIO4 were acquired by horizontal gene transfer (HGT) from bacteria +S000036073 CDS YNR058W 14 734291 735733 W 2011-02-03 1997-01-28 +S000005342 ORF Verified YNR059W MNT4 putative alpha-1,3-mannosyltransferase chromosome 14 14 736803 738545 W 2011-02-03 1997-01-28 Putative alpha-1,3-mannosyltransferase; not required for protein O-glycosylation; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000036222 CDS YNR059W 14 736803 738545 W 2011-02-03 1997-01-28 +S000005343 ORF Verified YNR060W FRE4 ferric-chelate reductase chromosome 14 L000003556 14 739951 742110 W 2011-02-03 1997-01-28 Ferric reductase; reduces a specific subset of siderophore-bound iron prior to uptake by transporters; expression induced by low iron levels +S000036976 CDS YNR060W 14 739951 742110 W 2011-02-03 1997-01-28 +S000005344 ORF Verified YNR061C chromosome 14 14 743540 742881 C 2011-02-03 1997-01-28 Protein of unknown function; relocalizes from vacuole to cytoplasm upon DNA replication stress +S000037708 CDS YNR061C 14 743540 742881 C 2011-02-03 1997-01-28 +S000005345 ORF Uncharacterized YNR062C chromosome 14 14 745343 744360 C 2011-02-03 1997-01-28 Putative membrane protein of unknown function +S000037784 CDS YNR062C 14 745343 744360 C 2011-02-03 1997-01-28 +S000005346 ORF Uncharacterized YNR063W chromosome 14 14 746943 748766 W 2011-02-03 1997-01-28 Putative zinc-cluster protein of unknown function +S000029847 CDS YNR063W 14 746943 748766 W 2011-02-03 1997-01-28 +S000005347 ORF Verified YNR064C epoxide hydrolase chromosome 14 14 750008 749136 C 2011-02-03 1997-01-28 Epoxide hydrolase; member of the alpha/beta hydrolase fold family; may have a role in detoxification of epoxides +S000030815 CDS YNR064C 14 750008 749136 C 2011-02-03 1997-01-28 +S000005348 ORF Uncharacterized YNR065C YSN1 chromosome 14 14 753700 750350 C 2011-02-03 1997-01-28 Protein of unknown function; protein-protein interactions suggest a possible role in actin patch formation; YNR065C is not an essential gene +S000030902 CDS YNR065C 14 753700 750350 C 2011-02-03 1997-01-28 +S000005349 ORF Uncharacterized YNR066C chromosome 14 14 755035 753725 C 2011-02-03 1997-01-28 Putative membrane-localized protein of unknown function +S000030952 CDS YNR066C 14 755035 753725 C 2011-02-03 1997-01-28 +S000005350 ORF Verified YNR067C DSE4 endo-1,3(4)-beta-glucanase|ENG1 chromosome 14 14 759099 755746 C 2011-02-03 1997-01-28 Daughter cell-specific secreted protein with similarity to glucanases; degrades cell wall from the daughter side causing daughter to separate from mother +S000031043 CDS YNR067C 14 759099 755746 C 2011-02-03 1997-01-28 +S000005351 ORF Uncharacterized YNR068C BUL3 chromosome 14 14 760885 760067 C 2011-02-03 1997-01-28 Putative protein of unknown function; exhibits homology to C-terminal end of Bul1p; expressed as a readthrough product of BSC5, the readthrough locus being termed BUL3; the BUL3 readthrough product is involved in ubiquitin-mediated sorting of plasma membrane proteins and interacts with WW domains of Rsp5p in vitro, but in a functionally different way than the non-readthrough form +S000032003 CDS YNR068C 14 760885 760067 C 2011-02-03 1997-01-28 +S000005352 ORF Verified YNR069C BSC5 BUL3 chromosome 14 14 762592 761123 C 2011-02-03 1997-01-28 Protein of unknown function; shows homology with N-terminal end of Bul1p; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; readthrough expression includes YNR068C and the locus for this readthrough is termed BUL3; Bul3p is involved in ubiquitin-mediated sorting of plasma membrane proteins; readthrough and shortened forms of Bul3p interact with Rsp5p differently in vitro +S000032095 CDS YNR069C 14 762592 761123 C 2011-02-03 1997-01-28 +S000005353 ORF Verified YNR070W PDR18 ATP-binding cassette multidrug transporter PDR18 chromosome 14 14 765375 769376 W 2011-02-03 1997-01-28|2011-02-03 Putative transporter of the ATP-binding cassette (ABC) family; role in plasma membrane sterol incorporation; implicated in pleiotropic drug resistance; provides resistance to ethanol stress and contributes to a decreased intracellular accumulation of ethanol; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033201 CDS YNR070W 14 765375 769376 W 2011-02-03 1997-01-28|2011-02-03 +S000005354 ORF Uncharacterized YNR071C aldose 1-epimerase superfamily protein chromosome 14 14 771468 770440 C 2011-02-03 1997-01-28 Putative aldose 1-epimerase +S000033956 CDS YNR071C 14 771468 770440 C 2011-02-03 1997-01-28 +S000005355 ORF Verified YNR072W HXT17 HLT4|hexose transporter HXT17 chromosome 14 L000003265 14 772657 774351 W 2011-02-03 1997-01-28 Putative transmembrane polyol transporter; supports growth on and uptake of mannitol and sorbitol with moderate affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; induced by raffinose and galactose at pH 7.7 versus pH 4.7, repressed by high levels of glucose; HXT17 has a paralog, HXT13, that arose from a segmental duplication +S000034105 CDS YNR072W 14 772657 774351 W 2011-02-03 1997-01-28 +S000005356 ORF Verified YNR073C MAN2 putative mannitol dehydrogenase chromosome 14 14 776300 774792 C 2011-02-03 1997-01-28 Mannitol dehydrogenase; MAN2 has a paralog, DSF1, that arose from a segmental duplication +S000034161 CDS YNR073C 14 776300 774792 C 2011-02-03 1997-01-28 +S000005357 ORF Verified YNR074C AIF1 CPD1 chromosome 14 14 778738 777602 C 2011-02-03 1997-01-28 Mitochondrial cell death effector; translocates to the nucleus in response to apoptotic stimuli, homolog of mammalian Apoptosis-Inducing Factor, putative reductase +S000035101 CDS YNR074C 14 778738 777602 C 2011-02-03 1997-01-28 +S000005358 ORF Verified YNR075W COS10 chromosome 14 L000004068 14 779916 781040 W 2011-02-03 1997-01-28 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000035300 CDS YNR075W 14 779916 781040 W 2011-02-03 1997-01-28 +S000028706 ORF Uncharacterized YNR075C-A chromosome 14 14 781603 781511 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032648 CDS YNR075C-A 14 781603 781511 C 2011-02-03 2003-07-29 +S000005359 ORF Verified YNR076W PAU6 seripauperin PAU6 chromosome 14 L000002880 14 781918 782280 W 2011-02-03 1997-01-28 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme; identical to Pau18p +S000035359 CDS YNR076W 14 781918 782280 W 2011-02-03 1997-01-28 +S000028993 telomere TEL14R chromosome 14 14 783278 784333 W 54 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XIV; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats +S000028994 telomeric_repeat TEL14R 14 784038 784333 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XIV +S000028995 X_element TEL14R 14 783278 783740 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XIV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YNR077C +S000028996 X_element_combinatorial_repeat TEL14R 14 783741 784037 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XIV; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000005360 ORF Uncharacterized YNR077C chromosome 14 14 783541 783287 C 2011-02-03 1997-01-28 Protein of unknown function, abundance changes with carbon source +S000035391 CDS YNR077C 14 783541 783287 C 2011-02-03 1997-01-28 +S000028709 ORF Uncharacterized YOL166W-A chromosome 15 15 585 740 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032654 CDS YOL166W-A 15 585 740 W 2003-07-29 2003-07-29 +S000028929 telomere TEL15L chromosome 15 15 847 1 C -132 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XV; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats +S000028930 telomeric_repeat TEL15L 15 117 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome XV +S000028931 X_element TEL15L 15 847 389 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YOL166W-A +S000028932 X_element_combinatorial_repeat TEL15L 15 388 118 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XV; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000005526 ORF Dubious YOL166C chromosome 15 15 1338 1000 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036497 CDS YOL166C 15 1338 1000 C 1996-07-31 1996-07-31 +S000005525 ORF Verified YOL165C AAD15 putative aryl-alcohol dehydrogenase chromosome 15 L000004640 15 2078 1647 C 1996-07-31 1996-07-31 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; AAD15 has a paralog, AAD3, that arose from a segmental duplication; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family +S000035578 CDS YOL165C 15 2078 1647 C 1996-07-31 1996-07-31 +S000007148 long_terminal_repeat YOLCdelta1 chromosome 15 15 3223 2894 C 2000-05-19 2000-05-19 Ty1 LTR +S000007160 long_terminal_repeat YOLWtau1 chromosome 15 15 3809 3986 W 2000-05-19 2000-05-19 Ty4 LTR +S000028580 ORF Uncharacterized YOL164W-A chromosome 15 15 4130 4312 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031327 CDS YOL164W-A 15 4130 4312 W 2003-07-29 2003-07-29 +S000005524 ORF Verified YOL164W BDS1 sulfuric ester hydrolase chromosome 15 15 6175 8115 W 1996-07-31 1996-07-31 Bacterially-derived sulfatase; required for use of alkyl- and aryl-sulfates as sulfur sources +S000035536 CDS YOL164W 15 6175 8115 W 1996-07-31 1996-07-31 +S000005523 ORF Uncharacterized YOL163W chromosome 15 15 9597 10106 W 2011-02-03 1996-07-31 Putative protein of unknown function; member of the Dal5p subfamily of the major facilitator family +S000035451 CDS YOL163W 15 9597 10106 W 2011-02-03 1996-07-31 +S000005522 ORF Uncharacterized YOL162W chromosome 15 15 10119 10766 W 2011-02-03 1996-07-31 Putative protein of unknown function; member of the Dal5p subfamily of the major facilitator family +S000034399 CDS YOL162W 15 10119 10766 W 2011-02-03 1996-07-31 +S000005521 ORF Verified YOL161C PAU20 seripauperin PAU20 chromosome 15 15 11911 11549 C 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole; expression induced by low temperature and also by anaerobic conditions; induced during alcoholic fermentation +S000034226 CDS YOL161C 15 11911 11549 C 2011-02-03 1996-07-31 +S000005520 ORF Dubious YOL160W chromosome 15 15 14313 14654 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034155 CDS YOL160W 15 14313 14654 W 2011-02-03 1996-07-31 +S000007627 ORF Verified YOL159C-A chromosome 15 15 15505 15233 C 2011-02-03 2001-02-26 Protein of unknown function; overexpression affects endocytic protein trafficking; identified by sequence comparison with hemiascomycetous yeast species +S000037257 CDS YOL159C-A 15 15505 15233 C 2011-02-03 2001-02-26 +S000005519 ORF Verified YOL159C CSS3 chromosome 15 15 17796 17281 C 2011-02-03 1996-07-31 Protein of unknown function, secreted when constitutively expressed; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cell periphery, SWAT-GFP fusion also localizes to the extracellular region, and mCherry fusion also localizes to the vacuole; deletion mutants are viable and have elevated levels of Ty1 retrotransposition and Ty1 cDNA +S000034633 CDS YOL159C 15 17796 17281 C 2011-02-03 1996-07-31 +S000007149 long_terminal_repeat YOLCdelta2 chromosome 15 15 18561 18302 C 2011-02-03 2000-05-19 Ty1 LTR +S000005518 ORF Verified YOL158C ENB1 ARN4 chromosome 15 15 21311 19491 C 2011-02-03 1996-07-31 Endosomal ferric enterobactin transporter; expressed under conditions of iron deprivation; member of the major facilitator superfamily; expression is regulated by Rcs1p and affected by chloroquine treatment +S000034544 CDS YOL158C 15 21311 19491 C 2011-02-03 1996-07-31 +S000005517 ORF Verified YOL157C IMA2 oligo-1,6-glucosidase IMA2 chromosome 15 15 24294 22525 C 2011-02-03 1996-07-31 Isomaltase (alpha-1,6-glucosidase/alpha-methylglucosidase); preferred specificity for isomaltose, alpha-methylglucoside, and palatinose, but also exhibits alpha-1,2 glucosidase activity on sucrose and kojibiose, and can cleave the 1,3-alpha linkage of nigerose and turanose and the alpha-1,5 linkage of leucrose in vitro; not required for isomaltose utilization, but Ima2p overexpression allows the ima1 null mutant to grow on isomaltose +S000034426 CDS YOL157C 15 24294 22525 C 2011-02-03 1996-07-31 +S000005516 ORF Verified YOL156W HXT11 hexose transporter HXT11|LGT3 chromosome 15 L000000947 15 25273 26976 W 2011-02-03 1996-07-31 Hexose transporter; capable of transporting a broad range of substrates including: glucose, fructose, mannose and galactose; polyol transporter that supports the growth on and uptake of xylitol with low affinity when overexpressed in a strain deleted for hexose family members; nearly identical in sequence to Hxt9p; has similarity to major facilitator superfamily (MFS) transporters; involved in pleiotropic drug resistance +S000032470 CDS YOL156W 15 25273 26976 W 2011-02-03 1996-07-31 +S000028855 ORF Uncharacterized YOL155W-A chromosome 15 15 27084 27218 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034568 CDS YOL155W-A 15 27084 27218 W 2011-02-03 2003-07-29 +S000005515 ORF Verified YOL155C HPF1 mannoprotein chromosome 15 15 31606 28703 C 2011-02-03 1996-07-31 Haze-protective mannoprotein; reduces the particle size of aggregated proteins in white wines +S000032305 CDS YOL155C 15 31606 28703 C 2011-02-03 1996-07-31 +S000005514 ORF Verified YOL154W ZPS1 chromosome 15 15 34658 35407 W 2011-02-03 1996-07-31 Putative GPI-anchored protein; transcription is induced under low-zinc conditions, as mediated by the Zap1p transcription factor, and at alkaline pH +S000032261 CDS YOL154W 15 34658 35407 W 2011-02-03 1996-07-31 +S000118995 ARS ARS1531 ARSXV-36|ARS1506.5 chromosome 15 15 35669 35904 2011-02-03 2006-10-02|2011-02-03 Autonomously Replicating Sequence +S000178178 ARS_consensus_sequence ARS1531 15 35713 35729 W 2014-11-18 2014-11-18 +S000005513 blocked_reading_frame YOL153C chromosome 15 15 38567 36822 C 2011-02-03 1996-07-31 Blocked reading frame, contains two in-frame stops in translation; this ORF is conserved, without the stops, in Saccharomyces paradoxus, S. mikatae, and S. bayanus; RNA sequencing data indicate the presence of a transcription unit at this reading frame +S000031205 CDS YOL153C 15 38567 36822 C 2011-02-03 1996-07-31 +S000005512 ORF Verified YOL152W FRE7 putative ferric-chelate reductase chromosome 15 L000003559 15 40748 42610 W 2011-02-03 1996-07-31|2006-01-05 Putative ferric reductase with similarity to Fre2p; expression induced by low copper levels +S000031126 CDS YOL152W 15 40748 42610 W 2011-02-03 1996-07-31|2006-01-05 +S000005511 ORF Verified YOL151W GRE2 methylglyoxal reductase (NADPH-dependent) GRE2 chromosome 15 L000004177 15 43694 44722 W 2011-02-03 1996-07-31 3-methylbutanal reductase and NADPH-dependent methylglyoxal reductase; stress induced (osmotic, ionic, oxidative, heat shock and heavy metals); regulated by the HOG pathway; restores resistance to glycolaldehyde by coupling reduction of glycolaldehyde to ethylene glycol and oxidation of NADPH to NADP+; protein abundance increases in response to DNA replication stress; methylglyoxal reductase (NADPH-dependent) is also known as D-lactaldehyde dehydrogenase +S000031026 CDS YOL151W 15 43694 44722 W 2011-02-03 1996-07-31 +S000005510 ORF Dubious YOL150C chromosome 15 15 44784 44473 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029963 CDS YOL150C 15 44784 44473 C 2011-02-03 1996-07-31 +S000005509 ORF Verified YOL149W DCP1 MRT2 chromosome 15 L000002960|L000003045|S000029311 15 44938 45633 W 2011-02-03 1996-07-31 Subunit of the Dcp1p-Dcp2p decapping enzyme complex; decapping complex removes the 5' cap structure from mRNAs prior to their degradation; enhances the activity of catalytic subunit Dcp2p; regulated by DEAD box protein Dhh1p; forms cytoplasmic foci upon DNA replication stress +S000030376 CDS YOL149W 15 44938 45633 W 2011-02-03 1996-07-31 +S000005508 ORF Verified YOL148C SPT20 ADA5 chromosome 15 L000002593 15 47574 45760 C 2011-02-03 1996-07-31 Subunit of the SAGA transcriptional regulatory complex; involved in maintaining the integrity of the complex; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay +S000030163 CDS YOL148C 15 47574 45760 C 2011-02-03 1996-07-31 +S000005507 ORF Verified YOL147C PEX11 PMP27|PMP24 chromosome 15 L000002650|L000004117 15 48643 47933 C 2011-02-03 1996-07-31 Peroxisomal protein required for medium-chain fatty acid oxidation; also required for peroxisome proliferation, possibly by inducing membrane curvature; localization regulated by phosphorylation; transcription regulated by Adr1p and Pip2p-Oaf1p +S000036432 CDS YOL147C 15 48643 47933 C 2011-02-03 1996-07-31 +S000005506 ORF Verified YOL146W PSF3 DNA replication protein PSF3 chromosome 15 15 48864 49448 W 2011-02-03 2003-09-22|1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery +S000036403 CDS YOL146W 15 48864 49448 W 2011-02-03 2003-09-22|1996-07-31 +S000005505 ORF Verified YOL145C CTR9 CDP1 chromosome 15 L000003477 15 52788 49555 C 2011-02-03 1996-07-31|2011-02-03 Component of the Paf1p complex involved in transcription elongation; binds to and modulates the activity of RNA polymerases I and II; required for expression of a subset of genes, including cyclin genes; involved in SER3 repression by helping to maintain SRG1 transcription-dependent nucleosome occupancy; contains TPR repeats +S000036252 CDS YOL145C 15 52788 49555 C 2011-02-03 1996-07-31|2011-02-03 +S000005504 ORF Verified YOL144W NOP8 chromosome 15 L000004849 15 53098 54552 W 2011-02-03 1996-07-31 Nucleolar protein required for 60S ribosomal subunit biogenesis +S000036206 CDS YOL144W 15 53098 54552 W 2011-02-03 1996-07-31 +S000005503 ORF Verified YOL143C RIB4 lumazine synthase RIB4 chromosome 15 L000003027 15 55104 54595 C 2011-02-03 1996-07-31 Lumazine synthase (DMRL synthase); catalyzes synthesis of immediate precursor to riboflavin; DMRL synthase stands for 6,7-dimethyl-8-ribityllumazine synthase +S000035226 CDS YOL143C 15 55104 54595 C 2011-02-03 1996-07-31 +S000005502 ORF Verified YOL142W RRP40 exosome non-catalytic core subunit RRP40|MTR14 chromosome 15 L000004799 15 55558 56280 W 2011-02-03 1996-07-31|2011-02-03 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; predicted to contain both S1 and KH RNA binding domains; has similarity to human hRrp40p (EXOSC3) +S000035132 CDS YOL142W 15 55558 56280 W 2011-02-03 1996-07-31|2011-02-03 +S000005501 ORF Verified YOL141W PPM2 tRNA methyltransferase PPM2|TYW4 chromosome 15 15 56452 58539 W 2011-02-03 1996-07-31|2011-02-03 AdoMet-dependent tRNA methyltransferase; also involved in methoxycarbonylation; required for the synthesis of wybutosine (yW), a modified guanosine found at the 3'-position adjacent to the anticodon of phe-tRNA; similarity to Ppm1p +S000034965 CDS YOL141W 15 56452 58539 W 2011-02-03 1996-07-31|2011-02-03 +S000077073 matrix_attachment_site ETC2 ETC2 chromosome 15 15 58541 58563 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; remains predominantly localized to the nuclear periphery throughout cell cycle; located between PPM2 and ARG8 +S000005500 ORF Verified YOL140W ARG8 acetylornithine transaminase chromosome 15 L000000111 15 58759 60030 W -130 2006-01-05 1996-07-31 Acetylornithine aminotransferase; catalyzes the fourth step in the biosynthesis of the arginine precursor ornithine +S000034835 CDS YOL140W 15 58759 60030 W 2006-01-05 1996-07-31 +S000005499 ORF Verified YOL139C CDC33 translation initiation factor eIF4E|eIF4E|TIF45 chromosome 15 L000000270 15 61024 60383 C 2006-01-05 1996-07-31 mRNA cap binding protein and translation initiation factor eIF4E; the eIF4E-cap complex is responsible for mediating cap-dependent mRNA translation via interactions with translation initiation factor eIF4G (Tif4631p or Tif4632p); protein abundance increases in response to DNA replication stress; mutants are defective for adhesion and pseudohyphal growth; human homolog EIF4E can complement yeast cdc33 null mutant +S000035358 CDS YOL139C 15 61024 60383 C 2006-01-05 1996-07-31 +S000005498 ORF Verified YOL138C RTC1 SEA2 chromosome 15 15 65350 61325 C 2006-01-05 1996-07-31|2011-02-03 Subunit of SEACAT, a subcomplex of the SEA complex; Rtc1p, along with Mtc5p and Sea4p, redundantly inhibit the TORC1 inhibitory role of the Iml1p/SEACIT (Iml1p-Npr2p-Npr3p) subcomplex, a GAP for GTPase Gtr1p (EGOC subunit) in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; has N-terminal WD-40 repeats and a C-terminal RING motif; null suppresses cdc13-1 +S000035295 CDS YOL138C 15 65350 61325 C 2006-01-05 1996-07-31|2011-02-03 +S000005497 ORF Verified YOL137W BSC6 chromosome 15 15 65621 67114 W 2006-01-05 1996-07-31 Protein of unknown function with 8 putative transmembrane segments; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression +S000034363 CDS YOL137W 15 65621 67114 W 2006-01-05 1996-07-31 +S000005496 ORF Verified YOL136C PFK27 6-phosphofructo-2-kinase|PFK-2 chromosome 15 L000003077 15 68754 67561 C 2006-01-05 1996-07-31 6-phosphofructo-2-kinase; catalyzes synthesis of fructose-2,6-bisphosphate; inhibited by phosphoenolpyruvate and sn-glycerol 3-phosphate, expression induced by glucose and sucrose, transcriptional regulation involves protein kinase A +S000034276 CDS YOL136C 15 68754 67561 C 2006-01-05 1996-07-31 +S000005495 ORF Verified YOL135C MED7 mediator complex subunit MED7 chromosome 15 L000003916 15 70044 69376 C 2006-01-05 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation +S000034163 CDS YOL135C 15 70044 69376 C 2006-01-05 1996-07-31 +S000005493 ORF Verified YOL133W HRT1 SCF ubiquitin ligase complex subunit HRT1|HRT2|ROC1|RBX1 chromosome 15 L000004443 15 70325 70690 W 2006-01-05 1996-07-31 RING-H2 domain core subunit of multiple ubiquitin ligase complexes; subunit of Skp1-Cullin-F-box (SCF) that tethers the Cdc34p (E2) and Cdc53p (cullin) SCF subunits, and is required for degradation of Gic2p, Far1p, Sic1p and Cln2p; subunit of the Rtt101p-Mms1p-Mms22p ubiquitin ligase that stabilizes replication forks after DNA lesions; subunit of the Cul3p-Elc1p-Ela1p ubiquitin ligase involved in Rpb1p degradation as part of transcription-coupled repair +S000032132 CDS YOL133W 15 70325 70690 W 2006-01-05 1996-07-31 +S000005494 ORF Dubious YOL134C chromosome 15 15 70545 70156 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps HRT1, a verified gene that encodes an SCF ubiquitin ligase subunit +S000034069 CDS YOL134C 15 70545 70156 C 2006-01-05 1996-07-31 +S000005492 ORF Verified YOL132W GAS4 1,3-beta-glucanosyltransferase chromosome 15 15 71300 72715 W 2006-01-05 1996-07-31 1,3-beta-glucanosyltransferase; involved with Gas2p in spore wall assembly; has similarity to Gas1p; localizes to the cell wall +S000032019 CDS YOL132W 15 71300 72715 W 2006-01-05 1996-07-31 +S000118484 ARS ARS1507 ARSXV-73 chromosome 15 15 72683 72753 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178179 ARS_consensus_sequence ARS1507 15 72687 72703 W 2014-11-18 2014-11-18 +S000005491 ORF Uncharacterized YOL131W chromosome 15 15 73031 73357 W 2006-01-05 1996-07-31 Putative protein of unknown function; YOL131W has a paralog, STB1, that arose from the whole genome duplication +S000031851 CDS YOL131W 15 73031 73357 W 2006-01-05 1996-07-31 +S000005490 ORF Verified YOL130W ALR1 Mg(2+) transporter ALR1|SWC3 chromosome 15 L000002887 15 74400 76979 W 2006-01-05 1996-07-31 Plasma membrane Mg(2+) transporter; expression and turnover are regulated by Mg(2+) concentration; overexpression confers increased tolerance to Al(3+) and Ga(3+) ions; magnesium transport defect of the null mutant is functionally complemented by either of the human genes MAGT1 and TUSC3 that are not orthologous to ALR1 +S000030868 CDS YOL130W 15 74400 76979 W 2006-01-05 1996-07-31 +S000005489 ORF Verified YOL129W VPS68 chromosome 15 15 77560 78114 W 2006-01-05 1996-07-31 Vacuolar membrane protein of unknown function; involved in vacuolar protein sorting; also detected in the mitochondria +S000032156 CDS YOL129W 15 77560 78114 W 2006-01-05 1996-07-31 +S000005488 ORF Verified YOL128C YGK3 serine/threonine protein kinase YGK3 chromosome 15 15 79479 78352 C 2006-01-05 1996-07-31 Protein kinase related to mammalian GSK-3 glycogen synthase kinases; GSK-3 homologs (Mck1p, Rim11p, Mrk1p, Ygk3p) are involved in control of Msn2p-dependent transcription of stress responsive genes and in protein degradation; YGK3 has a paralog, MCK1, that arose from the whole genome duplication +S000031135 CDS YOL128C 15 79479 78352 C 2006-01-05 1996-07-31 +S000005487 ORF Verified YOL127W RPL25 uL23|ribosomal 60S subunit protein L25|L23|rpl6L|YL25|L25 chromosome 15 L000001722 15 80348 81190 W 2006-01-05 1996-07-31 Ribosomal 60S subunit protein L25; primary rRNA-binding ribosomal protein component of large ribosomal subunit; binds to 25S rRNA via a conserved C-terminal motif; homologous to mammalian ribosomal protein L23A and bacterial L23 +S000031095 CDS YOL127W 15 80348 80360 W 2006-01-05 1996-07-31 +S000031096 CDS YOL127W 15 80775 81190 W 2006-01-05 1996-07-31 +S000031097 intron YOL127W 15 80361 80774 W 2006-01-05 1996-07-31 +S000005486 ORF Verified YOL126C MDH2 malate dehydrogenase MDH2 chromosome 15 L000001046 15 82920 81787 C 2006-10-06 1996-07-31|2006-10-06 Cytoplasmic malate dehydrogenase; one of three isozymes that catalyze interconversion of malate and oxaloacetate; involved in the glyoxylate cycle and gluconeogenesis during growth on two-carbon compounds; interacts with Pck1p and Fbp1 +S000030943 CDS YOL126C 15 82920 81787 C 2006-10-06 1996-07-31|2006-10-06 +S000005485 ORF Verified YOL125W TRM13 tRNA:m4X modification enzyme chromosome 15 15 83834 85264 W 2006-01-05 1996-07-31|2011-02-03 2'-O-methyltransferase; responsible for modification of tRNA at position 4; C-terminal domain has similarity to Rossmann-fold (RFM) superfamily of RNA methyltransferases +S000030912 CDS YOL125W 15 83834 85264 W 2006-01-05 1996-07-31|2011-02-03 +S000118485 ARS ARS1508 ARSXV-85 chromosome 15 15 85270 85361 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178180 ARS_consensus_sequence ARS1508 15 85360 85344 C 2014-11-18 2014-11-18 +S000005484 ORF Verified YOL124C TRM11 tRNA (guanine-N2-)-methyltransferase chromosome 15 S000029604|S000028498 15 86757 85456 C 2006-01-05 1996-07-31 Catalytic subunit of adoMet-dependent tRNA methyltransferase complex; required for the methylation of the guanosine nucleotide at position 10 (m2G10) in tRNAs; contains a THUMP domain and a methyltransferase domain; another complex member is Trm112p +S000029846 CDS YOL124C 15 86757 85456 C 2006-01-05 1996-07-31 +S000005483 ORF Verified YOL123W HRP1 NAB5|NAB4 chromosome 15 L000003337|L000003022|L000003015 15 87844 89448 W 2006-01-05 1996-07-31 Subunit of cleavage factor I; cleavage factor I is a five-subunit complex required for the cleavage and polyadenylation of pre-mRNA 3' ends; RRM-containing heteronuclear RNA binding protein and hnRNPA/B family member that binds to poly (A) signal sequences; required for genome stability +S000037901 CDS YOL123W 15 87844 89448 W 2006-01-05 1996-07-31 +S000005482 ORF Verified YOL122C SMF1 divalent metal ion transporter SMF1|SBS1 chromosome 15 L000001931 15 91419 89692 C 2006-01-05 1996-07-31 Divalent metal ion transporter; broad specificity for di-valent and tri-valent metals; post-translationally regulated by levels of metal ions; member of the Nramp family of metal transport proteins +S000036001 CDS YOL122C 15 91419 89692 C 2006-01-05 1996-07-31 +S000005481 ORF Verified YOL121C RPS19A eS19|ribosomal 40S subunit protein S19A|S19e|rp55a|YS16A|S19A|S16aA chromosome 15 L000003299 15 92850 92026 C 2006-01-05 1996-07-31 Protein component of the small (40S) ribosomal subunit; required for assembly and maturation of pre-40 S particles; homologous to mammalian ribosomal protein S19, no bacterial homolog; mutations in human RPS19 are associated with Diamond Blackfan anemia; RPS19A has a paralog, RPS19B, that arose from the whole genome duplication +S000035838 CDS YOL121C 15 92440 92026 C 2006-01-05 1996-07-31 +S000035837 CDS YOL121C 15 92850 92831 C 2006-01-05 1996-07-31 +S000035839 intron YOL121C 15 92830 92441 C 2006-01-05 1996-07-31 +S000005480 ORF Verified YOL120C RPL18A eL18|ribosomal 60S subunit protein L18A|L18e|rp28A|L18A|RP28A chromosome 15 L000001668 15 94402 93395 C 2006-01-05 1996-07-31 Ribosomal 60S subunit protein L18A; intron of RPL18A pre-mRNA forms stem-loop structures that are a target for Rnt1p cleavage leading to degradation; homologous to mammalian ribosomal protein L18, no bacterial homolog; RPL18A has a paralog, RPL18B, that arose from the whole genome duplication +S000035727 CDS YOL120C 15 93843 93395 C 2006-01-05 1996-07-31 +S000035726 CDS YOL120C 15 94402 94291 C 2006-01-05 1996-07-31 +S000035728 intron YOL120C 15 94290 93844 C 2006-01-05 1996-07-31 +S000005479 ORF Verified YOL119C MCH4 chromosome 15 15 96361 94856 C 2006-01-05 1996-07-31 Protein with similarity to mammalian monocarboxylate permeases; monocarboxylate permeases are involved in transport of monocarboxylic acids across the plasma membrane but mutant is not deficient in monocarboxylate transport +S000036182 CDS YOL119C 15 96361 94856 C 2006-01-05 1996-07-31 +S000005478 ORF Dubious YOL118C chromosome 15 15 96916 96608 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036070 CDS YOL118C 15 96916 96608 C 2006-01-05 1996-07-31 +S000005477 ORF Verified YOL117W RRI2 CSN10 chromosome 15 S000007579 15 97551 99488 W 2006-01-05 1996-07-31 Subunit of the COP9 signalosome (CSN) complex; this complex cleaves the ubiquitin-like protein Nedd8 from SCF ubiquitin ligases; plays a role in the mating pheromone response +S000036034 CDS YOL117W 15 97551 99488 W 2006-01-05 1996-07-31 +S000005476 ORF Verified YOL116W MSN1 PHD2|MSS10|HRB382|FUP1 chromosome 15 L000001197 15 99809 100957 W 2006-01-05 1996-07-31 Transcriptional activator; involved in regulation of invertase and glucoamylase expression, invasive growth and pseudohyphal differentiation, iron uptake, chromium accumulation, and response to osmotic stress; localizes to the nucleus; relative distribution to the nucleus increases upon DNA replication stress +S000035148 CDS YOL116W 15 99809 100957 W 2006-01-05 1996-07-31 +S000005475 ORF Verified YOL115W PAP2 non-canonical poly(A) polymerase PAP2|TRF4 chromosome 15 L000002953 15 101475 103229 W 2006-01-05 1996-07-31 Non-canonical poly(A) polymerase; involved in nuclear RNA degradation as a component of TRAMP; catalyzes polyadenylation of hypomodified tRNAs, and snoRNA and rRNA precursors; required for mRNA surveillance and maintenance of genome integrity, serving as a link between RNA and DNA metabolism; overlapping but non-redundant functions with Trf5p; relocalizes to cytosol in response to hypoxia +S000035037 CDS YOL115W 15 101475 103229 W 2006-01-05 1996-07-31 +S000005474 ORF Verified YOL114C PTH4 chromosome 15 15 103925 103317 C 2006-01-05 1996-07-31 Protein similar to the human peptidyl-tRNA hydrolase gene ICT1; associates with mitochondrial large subunit; may function in translation termination; YOL114C is not an essential gene +S000034821 CDS YOL114C 15 103925 103317 C 2006-01-05 1996-07-31 +S000005473 ORF Verified YOL113W SKM1 putative serine/threonine protein kinase SKM1 chromosome 15 L000004142 15 104326 106293 W 2006-01-05 1996-07-31 Member of the PAK family of serine/threonine protein kinases; similar to Ste20p; involved in down-regulation of sterol uptake; proposed to be a downstream effector of Cdc42p during polarized growth; SKM1 has a paralog, CLA4, that arose from the whole genome duplication +S000034781 CDS YOL113W 15 104326 106293 W 2006-01-05 1996-07-31 +S000005472 ORF Verified YOL112W MSB4 Rab GTPase-activating protein MSB4 chromosome 15 L000003919 15 106710 108188 W 2006-01-05 1996-07-31 GTPase-activating protein of the Ras superfamily; acts primarily on Sec4p, localizes to the bud site and bud tip; msb3 msb4 double mutation causes defects in secretion and actin organization; similar to the TBC-domain Tre2 oncogene; MSB4 has a paralog, MSB3, that arose from the whole genome duplication; human homolog USP6NL can complement yeast msb3 msb4 double null mutant +S000033897 CDS YOL112W 15 106710 108188 W 2006-01-05 1996-07-31 +S000005471 ORF Verified YOL111C MDY2 GET5|TMA24 chromosome 15 15 108896 108258 C 2006-01-05 1996-07-31 Protein involved in inserting tail-anchored proteins into ER membranes; forms a complex with Get4p; required for efficient mating; involved in shmoo formation and nuclear migration in the pre-zygote; associates with ribosomes +S000033697 CDS YOL111C 15 108896 108258 C 2006-01-05 1996-07-31 +S000005470 ORF Verified YOL110W SHR5 ERF4 chromosome 15 L000002592 15 109176 109889 W 2006-01-05 1996-07-31 Palmitoyltransferase subunit; this complex adds a palmitoyl lipid moiety to heterolipidated substrates such as Ras1p and Ras2p through a thioester linkage; palmitoylation is required for Ras2p membrane localization; Palmitoyltransferase is composed of Shr5p and Erf2 +S000033648 CDS YOL110W 15 109176 109889 W 2006-01-05 1996-07-31 +S000005469 ORF Verified YOL109W ZEO1 chromosome 15 L000003927 15 110297 110638 W 2006-01-05 1996-07-31 Peripheral membrane protein of the plasma membrane; interacts with Mid2p; regulates the cell integrity pathway mediated by Pkc1p and Slt2p; the authentic protein is detected in a phosphorylated state in highly purified mitochondria +S000031643 CDS YOL109W 15 110297 110638 W 2006-01-05 1996-07-31 +S000006592 tRNA_gene tG(UCC)O SUF1 chromosome 15 L000002149|L000003720 15 111033 110962 C -110 2006-01-05 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000037569 noncoding_exon tG(UCC)O 15 111033 110962 C 2006-01-05 2000-05-19 +S000005468 ORF Verified YOL108C INO4 chromosome 15 L000000869 15 111886 111431 C 2006-01-05 1996-07-31 Transcription factor involved in phospholipid synthesis; required for derepression of inositol-choline-regulated genes involved in phospholipid synthesis; forms a complex, with Ino2p, that binds the inositol-choline-responsive element through a basic helix-loop-helix domain +S000030752 CDS YOL108C 15 111886 111431 C 2006-01-05 1996-07-31 +S000005467 ORF Uncharacterized YOL107W chromosome 15 15 112102 113130 W 2006-01-05 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and colocalizes in a punctate pattern with the early golgi/COPI vesicles; YOL107W is not an essential protein +S000030688 CDS YOL107W 15 112102 113130 W 2006-01-05 1996-07-31 +S000005466 ORF Dubious YOL106W chromosome 15 15 113226 113579 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030608 CDS YOL106W 15 113226 113579 W 2006-01-05 1996-07-31 +S000007150 long_terminal_repeat YOLCdelta3 chromosome 15 15 113626 113294 C 2006-01-05 2000-05-19 Ty1 LTR +S000006746 tRNA_gene tT(AGU)O1 chromosome 15 L000003701 15 113802 113874 W 2006-01-05 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000037533 noncoding_exon tT(AGU)O1 15 113802 113874 W 2006-01-05 2000-05-19 +S000118486 ARS ARS1509 ARSXV-114 chromosome 15 15 113885 113983 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178181 ARS_consensus_sequence ARS1509 15 113894 113910 W 2014-11-18 2014-11-18 +S000005465 ORF Verified YOL105C WSC3 chromosome 15 L000004218 15 115808 114138 C 2006-01-05 1996-07-31 Sensor-transducer of the stress-activated PKC1-MPK1 signaling pathway; involved in maintenance of cell wall integrity; involved in response to heat shock and other stressors; regulates 1,3-beta-glucan synthesis; WSC3 has a paralog, WSC2, that arose from the whole genome duplication +S000030500 CDS YOL105C 15 115808 114138 C 2006-01-05 1996-07-31 +S000005464 ORF Verified YOL104C NDJ1 TAM1 chromosome 15 L000003266|L000003597 15 117454 116396 C 2006-01-05 1996-07-31 Protein that regulates meiotic SPB cohesion and telomere clustering; localizes to both spindle pole bodies (SPBs) and telomeres; required for bouquet formation, effective homolog pairing, ordered cross-over distribution, sister chromatid cohesion at meiotic telomeres, chromosomal segregation and telomere-led rapid prophase movement +S000037679 CDS YOL104C 15 117454 116396 C 2006-01-05 1996-07-31 +S000007154 long_terminal_repeat YOLWdelta4 chromosome 15 15 117703 118040 W 2006-01-05 2000-05-19 Ty1 LTR +S000007161 LTR_retrotransposon YOLWTy1-1 Ty1 chromosome 15 15 117703 123628 W 2006-01-05 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007349 transposable_element_gene YOL103W-A gag protein chromosome 15 15 118000 119322 W 2006-01-05 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000030410 CDS YOL103W-A 15 118000 119322 W 2006-01-05 1999-07-17 +S000007350 transposable_element_gene YOL103W-B gag-pol fusion protein chromosome 15 S000029018 15 118000 123268 W 2006-01-05 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000030418 CDS YOL103W-B 15 118000 119304 W 2006-01-05 1999-07-17 +S000030419 CDS YOL103W-B 15 119306 123268 W 2006-01-05 1999-07-17 +S000030420 plus_1_translational_frameshift YOL103W-B 15 119305 119305 W 2006-01-05 1999-07-17 +S000007155 long_terminal_repeat YOLWdelta5 chromosome 15 15 123291 123628 W 2006-01-05 2000-05-19 Ty1 LTR +S000005463 ORF Verified YOL103W ITR2 myo-inositol transporter ITR2|HRB612 chromosome 15 L000000880 15 124001 125830 W 2006-01-05 2003-09-22|1996-07-31 Myo-inositol transporter; member of the sugar transporter superfamily; expressed constitutively; ITR2 has a paralog, ITR1, that arose from the whole genome duplication +S000037640 CDS YOL103W 15 124001 125830 W 2006-01-05 2003-09-22|1996-07-31 +S000005462 ORF Verified YOL102C TPT1 tRNA 2'-phosphotransferase chromosome 15 L000003433 15 126689 125997 C 2006-01-05 1996-07-31 tRNA 2'-phosphotransferase that catalyzes final step in tRNA splicing: the transfer of the 2'-PO(4) from the splice junction to NAD(+) to form ADP-ribose 1''-2''cyclic phosphate and nicotinamide +S000037519 CDS YOL102C 15 126689 125997 C 2006-01-05 1996-07-31 +S000005461 ORF Verified YOL101C IZH4 chromosome 15 15 127920 126982 C 2006-01-05 1996-07-31 Membrane protein involved in zinc ion homeostasis; member of the four-protein IZH family; expression induced by fatty acids and altered zinc levels; deletion reduces sensitivity to excess zinc; possible role in sterol metabolism; protein increases in abundance and relocalizes from nucleus to ER upon DNA replication stress; IZH4 has a paralog, IZH1, that arose from the whole genome duplication +S000037425 CDS YOL101C 15 127920 126982 C 2006-01-05 1996-07-31 +S000005460 ORF Verified YOL100W PKH2 serine/threonine protein kinase PKH2 chromosome 15 L000004617 15 129237 132482 W 2006-01-05 1996-07-31 Serine/threonine protein kinase; involved in sphingolipid-mediated signaling pathway that controls endocytosis; activates Ypk1p and Ykr2p, components of signaling cascade required for maintenance of cell wall integrity; contains a PH-like domain; redundant with Pkh1p; PKH2 has a paralog, PKH1, that arose from the whole genome duplication +S000032002 CDS YOL100W 15 129237 132482 W 2006-01-05 1996-07-31 +S000005459 ORF Dubious YOL099C chromosome 15 15 132508 132017 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene PKH2/YOL100W; may interact with ribosomes +S000030816 CDS YOL099C 15 132508 132017 C 2006-01-05 1996-07-31 +S000005458 ORF Verified YOL098C SDD3 chromosome 15 15 135838 132725 C 2006-01-05 1996-07-31 Putative metalloprotease; overproduction suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P +S000030730 CDS YOL098C 15 135838 132725 C 2006-01-05 1996-07-31 +S000006449 snoRNA_gene snR58 SNR58 chromosome 15 L000004527 15 136183 136088 C 2006-01-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position C663 +S000030765 noncoding_exon snR58 15 136183 136088 C 2006-01-05 2000-05-19 +S000028854 ORF Uncharacterized YOL097W-A chromosome 15 15 136220 136405 W 2006-01-05 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034567 CDS YOL097W-A 15 136220 136405 W 2006-01-05 2003-07-29 +S000005457 ORF Verified YOL097C WRS1 tryptophan--tRNA ligase WRS1|HRE342 chromosome 15 L000003253 15 137825 136527 C 2006-01-05 1996-07-31 Cytoplasmic tryptophanyl-tRNA synthetase; aminoacylates tryptophanyl-tRNA; human homolog WARS can complement yeast null mutant +S000030577 CDS YOL097C 15 137825 136527 C 2006-01-05 1996-07-31 +S000005456 ORF Verified YOL096C COQ3 hexaprenyldihydroxybenzoate methyltransferase chromosome 15 L000000380 15 139045 138107 C 2006-01-05 2003-09-22|1996-07-31 O-methyltransferase; catalyzes two different O-methylation steps in ubiquinone (Coenzyme Q) biosynthesis; component of a mitochondrial ubiquinone-synthesizing complex; phosphoprotein +S000036749 CDS YOL096C 15 139045 138107 C 2006-01-05 2003-09-22|1996-07-31 +S000005455 ORF Verified YOL095C HMI1 ATP-dependent 3'-5' DNA helicase chromosome 15 L000004614 15 141347 139227 C 2006-01-05 1996-07-31 Mitochondrial inner membrane localized ATP-dependent DNA helicase; required for the maintenance of the mitochondrial genome; not required for mitochondrial transcription; has homology to E. coli helicase uvrD +S000036656 CDS YOL095C 15 141347 139227 C 2006-01-05 1996-07-31 +S000005454 ORF Verified YOL094C RFC4 replication factor C subunit 4 chromosome 15 L000001625 15 142555 141584 C 2006-01-05 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); which is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon; relocalizes to the cytosol in response to hypoxia +S000036576 CDS YOL094C 15 142555 141584 C 2006-01-05 1996-07-31 +S000005453 ORF Verified YOL093W TRM10 tRNA (guanine(9)-N(1))-methyltransferase chromosome 15 15 142815 143696 W 2006-01-05 1996-07-31 tRNA methyltransferase; methylates the N-1 position of guanine at position 9 in tRNAs; protein abundance increases in response to DNA replication stress; member of the SPOUT (SpoU-TrmD) methyltransferase family; human ortholog TRMT10A plays a role in the pathogenesis of microcephaly and early onset diabetes; an 18-mer originates from the TRM10 locus; genetic analysis shows the 18-mer is the translation regulator +S000036530 CDS YOL093W 15 142815 143696 W 2006-01-05 1996-07-31 +S000005452 ORF Verified YOL092W YPQ1 cationic amino acid transporter chromosome 15 15 144204 145130 W 2006-01-05 1996-07-31 Putative vacuolar membrane transporter for cationic amino acids; likely contributes to amino acid homeostasis by exporting cationic amino acids from the vacuole; member of the PQ-loop family, with seven transmembrane domains; similar to mammalian PQLC2 vacuolar transporter; YPQ1 has a paralog, RTC2, that arose from the whole genome duplication +S000035613 CDS YOL092W 15 144204 145130 W 2006-01-05 1996-07-31 +S000005451 ORF Verified YOL091W SPO21 MPC70 chromosome 15 L000004853 15 145334 147163 W 2006-01-05 1996-07-31 Component of the meiotic outer plaque of the spindle pole body; involved in modifying the meiotic outer plaque that is required prior to prospore membrane formation; SPO21 has a paralog, YSW1, that arose from the whole genome duplication +S000035535 CDS YOL091W 15 145334 147163 W 2006-01-05 1996-07-31 +S000005450 ORF Verified YOL090W MSH2 mismatch repair ATPase MSH2|PMS5 chromosome 15 L000001190 15 147382 150276 W -83.8 2006-01-05 1996-07-31 Protein that binds to DNA mismatches; forms heterodimers with Msh3p and Msh6p that bind to DNA mismatches to initiate the mismatch repair process; contains a Walker ATP-binding motif required for repair activity and involved in interstrand cross-link repair; Msh2p-Msh6p binds to and hydrolyzes ATP +S000035449 CDS YOL090W 15 147382 150276 W 2006-01-05 1996-07-31 +S000005449 ORF Verified YOL089C HAL9 chromosome 15 L000004704 15 153490 150398 C 2006-01-05 1996-07-31 Putative transcription factor containing a zinc finger; overexpression increases salt tolerance through increased expression of the ENA1 (Na+/Li+ extrusion pump) gene while gene disruption decreases both salt tolerance and ENA1 expression; HAL9 has a paralog, TBS1, that arose from the whole genome duplication +S000035681 CDS YOL089C 15 153490 150398 C 2006-01-05 1996-07-31 +S000005448 ORF Verified YOL088C MPD2 protein disulfide isomerase MPD2 chromosome 15 L000004182 15 154745 153912 C 2006-01-05 1996-07-31 Member of the protein disulfide isomerase (PDI) family; exhibits chaperone activity; overexpression suppresses the lethality of a pdi1 deletion but does not complement all Pdi1p functions; undergoes oxidation by Ero1p +S000034755 CDS YOL088C 15 154745 153912 C 2006-01-05 1996-07-31 +S000005447 ORF Verified YOL087C DUF1 chromosome 15 15 158637 155287 C 2006-01-05 1996-07-31 Ubiquitin-binding protein of unknown function; contains one WD40 repeat in a beta-propeller fold; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; homolog of human WDR48/UAF1, which is involved in regulating the Fanconi anemia pathway; deletion mutant is sensitive to various chemicals including phenanthroline, sanguinarine, and nordihydroguaiaretic acid +S000034693 CDS YOL087C 15 158637 155287 C 2006-01-05 1996-07-31 +S000007626 ORF Verified YOL086W-A MHF1 chromosome 15 15 159173 159445 W 2006-01-05 2001-02-26 Component of the heterotetrameric MHF histone-fold complex; in humans the MHF complex interacts with both DNA and Mph1p ortholog FANCM, a Fanconi anemia complementation group protein, to stabilize and remodel blocked replication forks and repair damaged DNA; mhf1 srs2 double mutants are MMS hypersensitive; ortholog of human centromere constitutive-associated network (CCAN) subunit CENP-S, also known as MHF1 +S000037254 CDS YOL086W-A 15 159173 159445 W 2006-01-05 2001-02-26 +S000005446 ORF Verified YOL086C ADH1 alcohol dehydrogenase ADH1|ADC1 chromosome 15 L000000041 15 160594 159548 C -86 2006-01-05 1996-07-31 Alcohol dehydrogenase; fermentative isozyme active as homo- or heterotetramers; required for the reduction of acetaldehyde to ethanol, the last step in the glycolytic pathway; ADH1 has a paralog, ADH5, that arose from the whole genome duplication +S000034629 CDS YOL086C 15 160594 159548 C 2006-01-05 1996-07-31 +S000028708 ORF Dubious YOL085W-A chromosome 15 15 161579 161791 W 2006-01-05 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YOL085C +S000032652 CDS YOL085W-A 15 161579 161791 W 2006-01-05 2003-07-29 +S000005445 ORF Uncharacterized YOL085C chromosome 15 15 162014 161673 C 2006-01-05 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOL085C is not an essential gene; partially overlaps dubious ORF YOL085W-A +S000034541 CDS YOL085C 15 162014 161673 C 2006-01-05 1996-07-31 +S000005444 ORF Verified YOL084W PHM7 chromosome 15 15 162356 165331 W 2006-01-05 1996-07-31 Protein of unknown function; expression is regulated by phosphate levels; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and vacuole; protein abundance increases in response to DNA replication stress +S000034487 CDS YOL084W 15 162356 165331 W 2006-01-05 1996-07-31 +S000005443 ORF Verified YOL083W ATG34 ATG19-B chromosome 15 15 165714 166952 W 2006-01-05 1996-07-31 Receptor protein involved in selective autophagy during starvation; specifically involved in the transport of cargo protein alpha-mannosidase (Ams1p); Atg19p paralog +S000032467 CDS YOL083W 15 165714 166952 W 2006-01-05 1996-07-31 +S000028853 ORF Dubious YOL083C-A chromosome 15 15 166601 166461 C 2006-01-05 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry +S000034566 CDS YOL083C-A 15 166601 166461 C 2006-01-05 2003-07-29 +S000118487 ARS ARS1510 ARSXV-167 chromosome 15 15 166976 167221 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178182 ARS_consensus_sequence ARS1510 15 167002 167018 W 2014-11-18 2014-11-18 +S000005442 ORF Verified YOL082W ATG19 CVT19 chromosome 15 15 168727 169974 W 2006-01-05 1996-07-31 Receptor protein for the cytoplasm-to-vacuole targeting (Cvt) pathway; delivers cargo proteins aminopeptidase I (Ape1p) and alpha-mannosidase (Ams1p) to the phagophore assembly site for packaging into Cvt vesicles; interaction with Atg19p during the Cvt pathway requires phosphorylation by Hrr25p +S000032367 CDS YOL082W 15 168727 169974 W 2006-01-05 1996-07-31 +S000005441 ORF Verified YOL081W IRA2 Ras GTPase activating protein IRA2|GLC4|CCS1 chromosome 15 L000000874 15 171070 180309 W -72 2006-01-05 1996-07-31 GTPase-activating protein; negatively regulates RAS by converting it from the GTP- to the GDP-bound inactive form, required for reducing cAMP levels under nutrient limiting conditions; IRA2 has a paralog, IRA1, that arose from the whole genome duplication; defects in human homolog NF1 are associated with neurofibromatosis +S000032260 CDS YOL081W 15 171070 180309 W 2006-01-05 1996-07-31 +S000005439 ORF Dubious YOL079W chromosome 15 15 181057 181455 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031476 CDS YOL079W 15 181057 181455 W 2006-01-05 1996-07-31 +S000005440 ORF Verified YOL080C REX4 putative 3'-5' exonuclease chromosome 15 15 181427 180558 C 2006-01-05 1996-07-31 Putative RNA exonuclease; possibly involved in pre-rRNA processing and ribosome assembly +S000031202 CDS YOL080C 15 181427 180558 C 2006-01-05 1996-07-31 +S000005438 ORF Verified YOL078W AVO1 chromosome 15 15 181682 185212 W 2006-01-05 1996-07-31 Component of a membrane-bound complex containing the Tor2p kinase; contains Tor2p kinase and other proteins; may have a role in regulation of cell growth +S000031371 CDS YOL078W 15 181682 185212 W 2006-01-05 1996-07-31 +S000007339 ORF Verified YOL077W-A ATP19 F1F0 ATP synthase subunit k chromosome 15 15 185438 185644 W 2006-01-05 1999-07-17 Subunit k of the mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; associated only with the dimeric form of ATP synthase +S000031206 CDS YOL077W-A 15 185438 185644 W 2006-01-05 1999-07-17 +S000005437 ORF Verified YOL077C BRX1 chromosome 15 15 186723 185848 C 2006-01-05 1996-07-31|2011-02-03 Nucleolar protein; constituent of 66S pre-ribosomal particles; depletion leads to defects in rRNA processing and a block in the assembly of large ribosomal subunits; possesses a sigma(70)-like RNA-binding motif +S000030456 CDS YOL077C 15 186723 185848 C 2006-01-05 1996-07-31|2011-02-03 +S000005436 ORF Verified YOL076W MDM20 NAA25|DEC1 chromosome 15 L000002975 15 187024 189414 W 2006-01-05 1996-07-31 Non-catalytic subunit of the NatB N-terminal acetyltransferase; NatB catalyzes N-acetylation of proteins with specific N-terminal sequences; involved in mitochondrial inheritance and actin assembly +S000030374 CDS YOL076W 15 187024 189414 W 2006-01-05 1996-07-31 +S000005435 ORF Verified YOL075C chromosome 15 15 193542 189658 C 2006-01-05 1999-07-17|1996-07-31|2011-02-03 Putative ABC transporter +S000030157 CDS YOL075C 15 193542 189658 C 2006-01-05 1999-07-17|1996-07-31|2011-02-03 +S000005434 ORF Verified YOL073C DSC2 chromosome 15 15 194800 193832 C 2006-01-05 1996-07-31 Multi-transmembrane subunit of the DSC ubiquitin ligase complex; similar in sequence to rhomboid pseudoproteases Der1p and UBAC2 that function in ERAD; ortholog of fission yeast dsc2 +S000036354 CDS YOL073C 15 194800 193832 C 2006-01-05 1996-07-31 +S000005433 ORF Verified YOL072W THP1 BUD29 chromosome 15 15 194970 196337 W 2006-01-05 1996-07-31 Nuclear pore-associated protein; component of TREX-2 complex (Sac3p-Thp1p-Sus1p-Cdc31p) involved in transcription elongation and mRNA export from the nucleus; involved in post-transcriptional tethering of active genes to the nuclear periphery and to non-nascent mRNP; contains a PAM domain implicated in protein-protein binding +S000036289 CDS YOL072W 15 194970 196337 W 2006-01-05 1996-07-31 +S000005432 ORF Verified YOL071W SDH5 EMI5|succinate dehydrogenase assembly factor SDH5 chromosome 15 15 196507 196995 W 2006-01-05 1996-07-31 Protein required for flavinylation of Sdh1p; binds to Sdh1p and promotes FAD cofactor attachment, which is necessary for succinate dehydrogenase (SDH) complex assembly and activity; mutations in human ortholog PGL2 are associated with neuroendocrine tumors (paraganglioma) +S000036205 CDS YOL071W 15 196507 196995 W 2006-01-05 1996-07-31 +S000005431 ORF Verified YOL070C NBA1 chromosome 15 15 198725 197220 C 2006-01-05 1996-07-31 Protein of unknown function; localizes to the bud neck and cytoplasm; interacts with Nap1p; may interact with ribosomes, based on co-purification experiments; potential Cdc28p substrate +S000035224 CDS YOL070C 15 198725 197220 C 2006-01-05 1996-07-31 +S000005430 ORF Verified YOL069W NUF2 kinetochore-associated Ndc80 complex subunit NUF2 chromosome 15 L000001286 15 198942 200297 W 2006-01-05 1996-07-31 Component of the kinetochore-associated Ndc80 complex; involved in chromosome segregation, spindle checkpoint activity, and kinetochore clustering; evolutionarily conserved; other members include Ndc80p, Nuf2p, Spc24p, and Spc25p +S000035586 CDS YOL069W 15 198942 200297 W 2006-01-05 1996-07-31 +S000005429 ORF Verified YOL068C HST1 histone deacetylase HST1 chromosome 15 L000000826 15 201879 200368 C 2006-01-05 1996-07-31 NAD(+)-dependent histone deacetylase; essential subunit of the Sum1p/Rfm1p/Hst1p complex required for ORC-dependent silencing and meiotic repression; non-essential subunit of the Set3C deacetylase complex; involved in telomere maintenance; HST1 has a paralog, SIR2, that arose from the whole genome duplication +S000035472 CDS YOL068C 15 201879 200368 C 2006-01-05 1996-07-31 +S000005428 ORF Verified YOL067C RTG1 chromosome 15 L000001783 15 202518 201985 C 2006-01-05 1996-07-31 Transcription factor (bHLH) involved in interorganelle communication; contributes to communication between mitochondria, peroxisomes, and nucleus; target of Hog1p; activated in stochastic pulses of nuclear localization +S000035434 CDS YOL067C 15 202518 201985 C 2006-01-05 1996-07-31 +S000005427 ORF Verified YOL066C RIB2 bifunctional DRAP deaminase/tRNA pseudouridine synthase RIB2|PUS8 chromosome 15 L000003026 15 204471 202696 C 2006-01-05 1996-07-31 Bifunctional DRAP deaminase tRNA:pseudouridine synthase; the deaminase catalyzes the third step in riboflavin biosynthesis and the synthase catalyzes formation of pseudouridine at position 32 in cytoplasmic tRNAs; RIB2 has a paralog, PUS9, that arose from the whole genome duplication +S000035357 CDS YOL066C 15 204471 202696 C 2006-01-05 1996-07-31 +S000005426 ORF Verified YOL065C INP54 phosphoinositide 5-phosphatase INP54 chromosome 15 L000004299 15 205885 204731 C 2006-01-05 1996-07-31 Phosphatidylinositol 4,5-bisphosphate 5-phosphatase; role in secretion; localizes to the endoplasmic reticulum via the C-terminal tail; lacks the Sac1 domain and proline-rich region found in the other 3 INP proteins +S000034381 CDS YOL065C 15 205885 204731 C 2006-01-05 1996-07-31 +S000005425 ORF Verified YOL064C MET22 3'(2'),5'-bisphosphate nucleotidase|HAL2 chromosome 15 L000001090 15 207176 206103 C 2006-01-05 1996-07-31 Bisphosphate-3'-nucleotidase; involved in salt tolerance and methionine biogenesis; dephosphorylates 3'-phosphoadenosine-5'-phosphate and 3'-phosphoadenosine-5'-phosphosulfate, intermediates of the sulfate assimilation pathway; human homolog BPNT1 complements yeast null mutant +S000034318 CDS YOL064C 15 207176 206103 C 2006-01-05 1996-07-31 +S000005424 ORF Verified YOL063C CRT10 HUS1 chromosome 15 15 210265 207392 C 2006-01-05 1996-07-31 Protein involved in transcriptional regulation of RNR2 and RNR3; expression of the gene is induced by DNA damage and null mutations confer increased resistance to hydroxyurea; N-terminal region has a leucine repeat and a WD40 repeat +S000034270 CDS YOL063C 15 210265 207392 C 2006-01-05 1996-07-31 +S000005423 ORF Verified YOL062C APM4 AMP1 chromosome 15 L000003288 15 211995 210520 C 2006-01-05 1996-07-31 Cargo-binding mu subunit of AP-2; AP-2 is a heterotetrameric endocytic cargo-binding adaptor that facilitates uptake of membrane proteins during clathrin-mediated endocytosis; Apm4p is required for AP-2 function and localization, and binds cell wall stress receptor Mid2p; AP-2 is required for cell polarity responses to pheromone, nutritional status and cell wall damage in S. cerevisiae, and for hyphal growth in C. albicans; AP-2 complex is conserved in mammals +S000034160 CDS YOL062C 15 211995 210520 C 2006-01-05 1996-07-31 +S000005422 ORF Verified YOL061W PRS5 ribose phosphate diphosphokinase subunit PRS5 chromosome 15 L000004120 15 212244 213734 W 2006-01-05 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase; synthesizes PRPP, which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes; forms cytoplasmic foci upon DNA replication stress +S000034100 CDS YOL061W 15 212244 213734 W 2006-01-05 1996-07-31 +S000005421 ORF Verified YOL060C MAM3 chromosome 15 15 216137 214017 C 2006-01-05 1996-07-31 Protein required for normal mitochondrial morphology; has similarity to hemolysins +S000032070 CDS YOL060C 15 216137 214017 C 2006-01-05 1996-07-31 +S000005420 ORF Verified YOL059W GPD2 glycerol-3-phosphate dehydrogenase (NAD(+)) GPD2|GPD3 chromosome 15 L000000723|L000003160 15 217126 218448 W 2006-01-05 1996-07-31 NAD-dependent glycerol 3-phosphate dehydrogenase; expression is controlled by an oxygen-independent signaling pathway required to regulate metabolism under anoxic conditions; located in cytosol and mitochondria; constitutively active but is inactivated via phosphorylation by energy-stress responsive kinase SNF1; GPD2 has a paralog, GPD1, that arose from the whole genome duplication +S000032438 CDS YOL059W 15 217126 218448 W 2006-01-05 1996-07-31 +S000005419 ORF Verified YOL058W ARG1 argininosuccinate synthase|ARG10 chromosome 15 L000000107 15 219211 220473 W -56 2011-02-03 1996-07-31|2011-02-03 Arginosuccinate synthetase; catalyzes the formation of L-argininosuccinate from citrulline and L-aspartate in the arginine biosynthesis pathway; potential Cdc28p substrate +S000032317 CDS YOL058W 15 219211 220473 W 2011-02-03 1996-07-31|2011-02-03 +S000005418 ORF Verified YOL057W dipeptidyl-peptidase III chromosome 15 15 220767 222902 W 2011-02-03 1996-07-31 Dipeptidyl-peptidase III; cleaves dipeptides from the amino terminus of target proteins; highly active on synthetic substrate Arg-Arg-2-naphthylamide; mammalian ortholog may be a biomarker for some cancers +S000032234 CDS YOL057W 15 220767 222902 W 2011-02-03 1996-07-31 +S000005417 ORF Verified YOL056W GPM3 phosphoglycerate mutase family protein GPM3 chromosome 15 L000002980 15 223268 224179 W 2011-02-03 1996-07-31 Homolog of Gpm1p phosphoglycerate mutase; converts 3-phosphoglycerate to 2-phosphoglycerate in glycolysis; may be non-functional; GPM3 has a paralog, GPM2, that arose from the whole genome duplication +S000032154 CDS YOL056W 15 223268 224179 W 2011-02-03 1996-07-31 +S000005416 ORF Verified YOL055C THI20 trifunctional hydroxymethylpyrimidine kinase/phosphomethylpyrimidine kinase/thiaminase chromosome 15 15 226075 224420 C 2011-02-03 1996-07-31 Trifunctional enzyme of thiamine biosynthesis, degradation and salvage; has hydroxymethylpyrimidine (HMP) kinase, HMP-phosphate (HMP-P) kinase and thiaminase activities; member of a gene family with THI21 and THI22; HMP and HMP-P kinase activity redundant with Thi21p +S000031133 CDS YOL055C 15 226075 224420 C 2011-02-03 1996-07-31 +S000006586 tRNA_gene tG(GCC)O1 chromosome 15 L000003719 15 226681 226611 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000031599 noncoding_exon tG(GCC)O1 15 226681 226611 C 2011-02-03 2000-05-19 +S000007158 long_terminal_repeat YOLWsigma1 chromosome 15 15 226696 227037 W 2011-02-03 2000-05-19 Ty3 LTR +S000007156 long_terminal_repeat YOLWdelta6 chromosome 15 15 227096 227293 W 2011-02-03 2000-05-19 Ty1 LTR +S000007151 long_terminal_repeat YOLCdelta7 chromosome 15 15 228178 227851 C 2011-02-03 2000-05-19 Ty1 LTR +S000006675 tRNA_gene tN(GUU)O1 chromosome 15 L000003702 15 228331 228404 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000035637 noncoding_exon tN(GUU)O1 15 228331 228404 W 2011-02-03 2000-05-19 +S000005415 ORF Verified YOL054W PSH1 ubiquitin-protein ligase PSH1 chromosome 15 15 228614 229834 W 2011-02-03 1996-07-31 E3 ubiquitin ligase targeting centromere-binding protein Cse4p; mediates polyubiquitination and degradation of histone H3 variant Cse4p, preventing its mislocalization to euchromatin independent of Slx5p; ubiquitination of Cse4p may be antagonized by Scm3p +S000031092 CDS YOL054W 15 228614 229834 W 2011-02-03 1996-07-31 +S000005414 ORF Verified YOL053W AIM39 chromosome 15 15 230085 231272 W 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays elevated frequency of mitochondrial genome loss +S000030999 CDS YOL053W 15 230085 231272 W 2011-02-03 1996-07-31 +S000005413 ORF Verified YOL052C-A DDR2 YOL053C-A|DDRA2 chromosome 15 L000003478 15 231755 231570 C 2011-02-03 1996-07-31 Multi-stress response protein; expression is activated by a variety of xenobiotic agents and environmental or physiological stresses; DDR2 has a paralog, HOR7, that arose from the whole genome duplication +S000035236 CDS YOL052C-A 15 231755 231570 C 2011-02-03 1996-07-31 +S000005412 ORF Verified YOL052C SPE2 adenosylmethionine decarboxylase SPE2 chromosome 15 L000001994 15 233636 232446 C -58 2011-02-03 1996-07-31 S-adenosylmethionine decarboxylase; required for the biosynthesis of spermidine and spermine; cells lacking Spe2p require spermine or spermidine for growth in the presence of oxygen but not when grown anaerobically +S000029956 CDS YOL052C 15 233636 232446 C 2011-02-03 1996-07-31 +S000081375 snoRNA_gene snR81 SNR81 chromosome 15 15 234346 234546 W 2011-02-03 2006-01-24 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U1052, constitutive pseudouridylation of U2 snRNA (LSR1) at position 42, and stress-induced U2 pseudouridylation at position 93 +S000114173 noncoding_exon snR81 15 234346 234546 W 2011-02-03 2006-01-24 +S000005411 ORF Verified YOL051W GAL11 MED15|ABE1|SPT13|SDS4|RAR3 chromosome 15 L000000664 15 234940 238185 W -53 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; affects transcription by acting as target of activators and repressors; forms part of the tail domain of mediator +S000029897 CDS YOL051W 15 234940 238185 W 2011-02-03 1996-07-31 +S000005410 ORF Dubious YOL050C chromosome 15 15 238202 237882 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps verified gene GAL11; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) +S000037840 CDS YOL050C 15 238202 237882 C 2011-02-03 1996-07-31 +S000005409 ORF Verified YOL049W GSH2 glutathione synthase chromosome 15 L000003548 15 238619 240094 W 2011-02-03 1996-07-31 Glutathione synthetase; catalyzes the ATP-dependent synthesis of glutathione (GSH) from gamma-glutamylcysteine and glycine; induced by oxidative stress and heat shock +S000037056 CDS YOL049W 15 238619 240094 W 2011-02-03 1996-07-31 +S000005408 ORF Verified YOL048C RRT8 chromosome 15 15 241310 240204 C 2011-02-03 2003-09-27|1996-07-31 Protein involved in spore wall assembly; shares similarity with Lds1p and Lds2p and a strain mutant for all 3 genes exhibits reduced dityrosine fluorescence relative to the single mutants; identified in a screen for mutants with increased levels of rDNA transcription; green fluorescent protein (GFP)-fusion protein localizes to lipid particles; protein abundance increases in response to DNA replication stress +S000036368 CDS YOL048C 15 240947 240204 C 2011-02-03 2003-09-27 +S000036367 CDS YOL048C 15 241310 241026 C 2011-02-03 2003-09-27|1996-07-31 +S000036369 intron YOL048C 15 241025 240948 C 2011-02-03 2003-09-27 +S000005407 ORF Verified YOL047C LDS2 chromosome 15 15 242747 241614 C 2011-02-03 2000-07-14|1996-07-31 Protein Involved in spore wall assembly; localizes to lipid droplets found on or outside of the prospore membrane; shares similarity with Lds1p and Rrt8p, and a strain mutant for all 3 genes exhibits reduced dityrosine fluorescence relative to the single mutants; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000036270 CDS YOL047C 15 242441 241614 C 2011-02-03 2000-07-14|1996-07-31 +S000036269 CDS YOL047C 15 242747 242505 C 2011-02-03 2000-07-14|1996-07-31 +S000036271 intron YOL047C 15 242504 242442 C 2011-02-03 2000-07-14|1996-07-31 +S000005405 ORF Verified YOL045W PSK2 serine/threonine protein kinase PSK2 chromosome 15 15 243497 246802 W 2011-02-03 1996-07-31 PAS-domain containing serine/threonine protein kinase; regulates sugar flux and translation in response to an unknown metabolite by phosphorylating Ugp1p and Gsy2p (sugar flux) and Caf20p, Tif11p and Sro9p (translation); PSK2 has a paralog, PSK1, that arose from the whole genome duplication +S000036127 CDS YOL045W 15 243497 246802 W 2011-02-03 1996-07-31 +S000005406 ORF Dubious YOL046C chromosome 15 15 244140 243466 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene PSK2/YOL045W +S000036179 CDS YOL046C 15 244140 243466 C 2011-02-03 1996-07-31 +S000005404 ORF Verified YOL044W PEX15 PAS21 chromosome 15 L000003971 15 247150 248301 W 2011-02-03 1996-07-31 Tail-anchored type II integral peroxisomal membrane protein; required for peroxisome biogenesis; cells lacking Pex15p mislocalize peroxisomal matrix proteins to cytosol; overexpression results in impaired peroxisome assembly +S000036032 CDS YOL044W 15 247150 248301 W 2011-02-03 1996-07-31 +S000005403 ORF Verified YOL043C NTG2 bifunctional N-glycosylase/AP lyase NTG2|SCR2 chromosome 15 L000004115 15 249534 248392 C 2011-02-03 1996-07-31 DNA N-glycosylase and apurinic/apyrimidinic (AP) lyase; involved in base excision repair, localizes to the nucleus; sumoylated; NTG2 has a paralog, NTG1, that arose from the whole genome duplication +S000035085 CDS YOL043C 15 249534 248392 C 2011-02-03 1996-07-31 +S000005402 ORF Verified YOL042W NGL1 RNA exonuclease chromosome 15 15 249825 250916 W 2011-02-03 1996-07-31 Putative endonuclease; has a domain similar to a magnesium-dependent endonuclease motif in mRNA deadenylase Ccr4p; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000035032 CDS YOL042W 15 249825 250916 W 2011-02-03 1996-07-31 +S000005401 ORF Verified YOL041C NOP12 chromosome 15 S000007491 15 252646 251267 C 2011-02-03 1996-07-31 Nucleolar protein involved in pre-25S rRNA processing; also involved in biogenesis of large 60S ribosomal subunit; contains an RNA recognition motif (RRM); binds to Ebp2; similar to Nop13p and Nsr1p +S000034818 CDS YOL041C 15 252646 251267 C 2011-02-03 1996-07-31 +S000005400 ORF Verified YOL040C RPS15 uS19|ribosomal 40S subunit protein S15|S19|rp52|S21|S15|RPS21 chromosome 15 L000002709|L000001759 15 253577 253149 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S15 and bacterial S19 +S000033943 CDS YOL040C 15 253577 253149 C 2011-02-03 1996-07-31 +S000005399 ORF Verified YOL039W RPP2A P2A|ribosomal protein P2A|RPLA2|RPL44 chromosome 15 L000001733|L000001735|L000002820 15 254297 254617 W 2011-02-03 1996-07-31 Ribosomal protein P2 alpha; a component of the ribosomal stalk, which is involved in the interaction between translational elongation factors and the ribosome; free (non-ribosomal) P2 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; regulates the accumulation of P1 (Rpp1Ap and Rpp1Bp) in the cytoplasm +S000032787 CDS YOL039W 15 254297 254617 W 2011-02-03 1996-07-31 +S000028812 ORF Uncharacterized YOL038C-A chromosome 15 15 255021 254926 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE analysis +S000033612 CDS YOL038C-A 15 255021 254926 C 2011-02-03 2003-07-29 +S000005398 ORF Verified YOL038W PRE6 proteasome core particle subunit alpha 4 chromosome 15 L000001488 15 255337 256101 W 2011-02-03 1996-07-31 Alpha 4 subunit of the 20S proteasome; may replace alpha 3 subunit (Pre9p) under stress conditions to create a more active proteasomal isoform; GFP-fusion protein relocates from cytosol to the mitochondrial surface upon oxidative stress +S000031873 CDS YOL038W 15 255337 256101 W 2011-02-03 1996-07-31 +S000005396 ORF Uncharacterized YOL036W chromosome 15 15 256745 259030 W 2011-02-03 1996-07-31 Protein of unknown function; potential Cdc28p substrate; YOL036W has a paralog, YIR016W, that arose from the whole genome duplication +S000031637 CDS YOL036W 15 256745 259030 W 2011-02-03 1996-07-31 +S000005397 ORF Dubious YOL037C chromosome 15 15 257019 256666 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOL036W +S000031673 CDS YOL037C 15 257019 256666 C 2011-02-03 1996-07-31 +S000005395 ORF Dubious YOL035C chromosome 15 15 259105 258803 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030751 CDS YOL035C 15 259105 258803 C 2011-02-03 1996-07-31 +S000006441 snoRNA_gene snR50 SNR50 chromosome 15 L000004519 15 259489 259578 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G867 +S000030731 noncoding_exon snR50 15 259489 259578 W 2011-02-03 2000-05-19 +S000005394 ORF Verified YOL034W SMC5 DNA repair ATPase SMC5 chromosome 15 15 259923 263204 W 2011-02-03 1996-07-31 Subunit of the SMC5-SMC6 complex; the SMC5-SMC6 complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; binds single-stranded DNA and has ATPase activity; supports nucleolar function; S. pombe homolog forms a heterodimer with S. pombe Rad18p that is involved in DNA repair +S000030687 CDS YOL034W 15 259923 263204 W 2011-02-03 1996-07-31 +S000005393 ORF Verified YOL033W MSE1 glutamate--tRNA ligase MSE1 chromosome 15 L000002617 15 263475 265085 W 2011-02-03 1996-07-31 Mitochondrial glutamyl-tRNA synthetase; predicted to be palmitoylated +S000030607 CDS YOL033W 15 263475 265085 W 2011-02-03 1996-07-31 +S000005392 ORF Verified YOL032W OPI10 chromosome 15 15 265429 266169 W 2011-02-03 1996-07-31 Protein with a possible role in phospholipid biosynthesis; null mutant displays an inositol-excreting phenotype that is suppressed by exogenous choline; protein abundance increases in response to DNA replication stress +S000030531 CDS YOL032W 15 265429 266169 W 2011-02-03 1996-07-31 +S000005391 ORF Verified YOL031C SIL1 SLS1 chromosome 15 15 267529 266264 C 2011-02-03 1996-07-31 Nucleotide exchange factor for the ER lumenal Hsp70 chaperone Kar2p; required for protein translocation into the endoplasmic reticulum (ER); homolog of Yarrowia lipolytica SLS1; GrpE-like protein +S000037678 CDS YOL031C 15 267529 266264 C 2011-02-03 1996-07-31 +S000005390 ORF Verified YOL030W GAS5 1,3-beta-glucanosyltransferase chromosome 15 15 268187 269641 W 2011-02-03 1996-07-31 1,3-beta-glucanosyltransferase; has similarity to Gas1p; localizes to the cell wall +S000037638 CDS YOL030W 15 268187 269641 W 2011-02-03 1996-07-31 +S000005389 ORF Uncharacterized YOL029C chromosome 15 15 270420 269815 C 2011-02-03 1996-07-31 Putative protein of unknown function; identified as interacting with Hsc82p and Hsp82p in high-throughput two-hybrid screens +S000036601 CDS YOL029C 15 270420 269815 C 2011-02-03 1996-07-31 +S000005388 ORF Verified YOL028C YAP7 chromosome 15 L000004347 15 271370 270633 C 2011-02-03 1996-07-31 Putative basic leucine zipper (bZIP) transcription factor; YAP7 has a paralog, YAP5, that arose from the whole genome duplication +S000036521 CDS YOL028C 15 271370 270633 C 2011-02-03 1996-07-31 +S000005387 ORF Verified YOL027C MDM38 ribosome-binding protein MDM38|MKH1 chromosome 15 15 273724 272003 C 2011-02-03 1996-07-31 Mitochondrial protein; forms a complex with Mba1p to facilitate recruitment of mRNA-specific translational activators to ribosomes; roles in protein export and K+/H+ exchange; human ortholog Letm1 implicated in Wolf-Hirschhorn syndrome +S000036426 CDS YOL027C 15 273724 272003 C 2011-02-03 1996-07-31 +S000005386 ORF Verified YOL026C MIM1 TOM13 chromosome 15 15 274353 274012 C 2011-02-03 1996-07-31 Mitochondrial protein required for outer membrane protein import; cooperates with Tom70p to import the subset of proteins with multiple alpha-helical transmembrane segments, including Ugo1p, Tom20p, and others; present in a complex with Mim2p in the outer membrane that may create a local environment to facilitate membrane insertion of substrate proteins; also has a role in assembly of Tom20p into the TOM complex +S000036344 CDS YOL026C 15 274353 274012 C 2011-02-03 1996-07-31 +S000006733 tRNA_gene tS(GCU)O chromosome 15 L000003703 15 274673 274773 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000037500 intron tS(GCU)O 15 274710 274728 W 2011-02-03 2000-05-19 +S000037498 noncoding_exon tS(GCU)O 15 274673 274709 W 2011-02-03 2000-05-19 +S000037499 noncoding_exon tS(GCU)O 15 274729 274773 W 2011-02-03 2000-05-19 +S000005385 ORF Verified YOL025W LAG2 ECM36 chromosome 15 L000003402 15 274957 276939 W 2011-02-03 1996-07-31|1997-07-27 Protein that negatively regulates the SCF E3-ubiquitin ligase; regulates by interacting with and preventing neddyation of the cullin subunit, Cdc53p; longevity determinant that is preferentially expressed in young cells; similar to mammalian Cand1 +S000035469 CDS YOL025W 15 274957 276939 W 2011-02-03 1997-07-27|1996-07-31 +S000005384 ORF Uncharacterized YOL024W chromosome 15 15 277086 277604 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to have thiol-disulfide oxidoreductase active site; YOL024W has a paralog, IGD1, that arose from the whole genome duplication +S000035404 CDS YOL024W 15 277086 277604 W 2011-02-03 1996-07-31 +S000118488 ARS ARS1511 ARSXV-278 chromosome 15 15 277530 277778 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication capacity dependent upon Sum1p +S000178183 ARS_consensus_sequence ARS1511 15 277733 277717 C 2014-11-18 2014-11-18 +S000005383 ORF Verified YOL023W IFM1 translation initiation factor 2 chromosome 15 L000000854 15 278056 280086 W 2011-02-03 1996-07-31 Mitochondrial translation initiation factor 2 +S000035326 CDS YOL023W 15 278056 280086 W 2011-02-03 1996-07-31 +S000005382 ORF Verified YOL022C TSR4 chromosome 15 15 281498 280272 C 2011-02-03 1996-07-31|2011-02-03 Cytoplasmic protein required for correct processing of 20S pre-rRNA; protein required for processing of the 20S pre-rRNA at site D to generate mature 18S rRNA; essential gene in S288C background but not in CEN.PK2 +S000035200 CDS YOL022C 15 281498 280272 C 2011-02-03 1996-07-31|2011-02-03 +S000006587 tRNA_gene tG(GCC)O2 SUF17 chromosome 15 L000002164|L000003704 15 282164 282234 W -53 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000031601 noncoding_exon tG(GCC)O2 15 282164 282234 W 2011-02-03 2000-05-19 +S000005381 ORF Verified YOL021C DIS3 exosome catalytic subunit DIS3|MTR17|RRP44 chromosome 15 L000003486 15 285426 282421 C 2011-02-03 1996-07-31 Exosome core complex catalytic subunit; has both endonuclease and 3'-5' exonuclease activity; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; role in degradation of tRNAs; similar to E. coli RNase R and to human DIS3, which partially complements dis3-81 heat sensitivity; mutations in Dis3p analogous to human mutations implicated in multiple myeloma impair exosome function; protein abundance increases under to DNA replication stress +S000034208 CDS YOL021C 15 285426 282421 C 2011-02-03 1996-07-31 +S000005380 ORF Verified YOL020W TAT2 aromatic amino acid transmembrane transporter TAT2|TAP2|SCM2|SAB2|LTG3 chromosome 15 L000002263|L000000956|L000001813 15 286172 287950 W 2011-02-03 1996-07-31 High affinity tryptophan and tyrosine permease; overexpression confers FK506 and FTY720 resistance +S000034169 CDS YOL020W 15 286172 287950 W 2011-02-03 1996-07-31 +S000006785 tRNA_gene tY(GUA)O SUP3 chromosome 15 L000003705|L000002182 15 288192 288280 W -16 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000034708 intron tY(GUA)O 15 288231 288244 W 2011-02-03 2000-05-19 +S000034706 noncoding_exon tY(GUA)O 15 288192 288230 W 2011-02-03 2000-05-19 +S000034707 noncoding_exon tY(GUA)O 15 288245 288280 W 2011-02-03 2000-05-19 +S000028707 ORF Uncharacterized YOL019W-A chromosome 15 15 288420 288572 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032650 CDS YOL019W-A 15 288420 288572 W 2011-02-03 2003-07-29 +S000005379 ORF Uncharacterized YOL019W TOS7 chromosome 15 15 288898 290553 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and vacuole; YOL019W has a paralog, DCV1, that arose from the whole genome duplication +S000033133 CDS YOL019W 15 288898 290553 W 2011-02-03 1996-07-31 +S000005378 ORF Verified YOL018C TLG2 chromosome 15 L000004228 15 292074 290881 C 2011-02-03 1996-07-31 Syntaxin-like t-SNARE; forms a complex with Tlg1p and Vti1p and mediates fusion of endosome-derived vesicles with the late Golgi; required along with VPS45 for an early step of the constitutive CVT pathway; interactions with Vps45 prevents Tlg2p degradation, and facilitates t-SNARE complex formation; homologous to mammalian SNARE protein syntaxin 16 (Sx16) +S000032218 CDS YOL018C 15 292074 290881 C 2011-02-03 1996-07-31 +S000005377 ORF Verified YOL017W ESC8 chromosome 15 15 292529 294673 W 2011-02-03 1996-07-31 Protein involved in telomeric and mating-type locus silencing; interacts with Sir2p and also interacts with Gal11p, which is a component of the RNA pol II mediator complex; ESC8 has a paralog, IOC3, that arose from the whole genome duplication +S000032174 CDS YOL017W 15 292529 294673 W 2011-02-03 1996-07-31 +S000005376 ORF Verified YOL016C CMK2 calmodulin-dependent protein kinase CMK2 chromosome 15 L000000367 15 296120 294777 C 2011-02-03 1996-07-31 Calmodulin-dependent protein kinase; may play a role in stress response, many CA++/calmodulan dependent phosphorylation substrates demonstrated in vitro, amino acid sequence similar to mammalian Cam Kinase II; CMK2 has a paralog, CMK1, that arose from the whole genome duplication +S000032049 CDS YOL016C 15 296120 294777 C 2011-02-03 1996-07-31 +S000005375 ORF Verified YOL015W IRC10 chromosome 15 15 297078 298838 W 2011-02-03 1996-07-31 Protein of unknown function; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane during meiosis II; null mutant displays increased levels of spontaneous Rad52p foci +S000032011 CDS YOL015W 15 297078 298838 W 2011-02-03 1996-07-31 +S000005374 ORF Uncharacterized YOL014W chromosome 15 15 299693 300067 W 2011-02-03 1996-07-31 Putative protein of unknown function; mCherry fusion protein localizes to the cytosol and nucleus +S000031065 CDS YOL014W 15 299693 300067 W 2011-02-03 1996-07-31 +S000007252 ORF Dubious YOL013W-B YOL013W-A chromosome 15 15 300690 300980 W 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the long terminal repeat (LTR) of a Ty1 element +S000033838 CDS YOL013W-B 15 300690 300980 W 2011-02-03 1999-07-17 +S000007152 long_terminal_repeat YOLCdelta8 chromosome 15 15 301021 300683 C 2011-02-03 2000-05-19 Ty1 LTR +S000028811 ORF Uncharacterized YOL013W-A YOL013W-B chromosome 15 15 301047 301238 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE +S000033611 CDS YOL013W-A 15 301047 301238 W 2011-02-03 2003-07-29 +S000006687 tRNA_gene tP(UGG)O1 chromosome 15 L000003706 15 301097 301198 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin +S000031042 intron tP(UGG)O1 15 301133 301162 W 2011-02-03 2000-05-19 +S000031040 noncoding_exon tP(UGG)O1 15 301097 301132 W 2011-02-03 2000-05-19 +S000031041 noncoding_exon tP(UGG)O1 15 301163 301198 W 2011-02-03 2000-05-19 +S000005373 ORF Verified YOL013C HRD1 E3 ubiquitin-protein ligase HRD1|DER3 chromosome 15 L000002963 15 303035 301380 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase involved in ER-associated degradation (ERAD) of misfolded proteins; upon autoubiquitination triggers retrotranslocation of misfolded proteins to cytosol for degradation; genetically linked to the unfolded protein response (UPR); regulated through association with Hrd3p; contains an H2 ring finger; likely plays a general role in targeting proteins that persistently associate with and potentially obstruct the ER-localized translocon +S000030928 CDS YOL013C 15 303035 301380 C 2011-02-03 1996-07-31 +S000005372 ORF Verified YOL012C HTZ1 histone H2AZ|H2AZ|H2A.F/Z|HTA3 chromosome 15 L000003930|L000004094 15 303983 303579 C 2011-02-03 1996-07-31 Histone variant H2AZ; exchanged for histone H2A in nucleosomes by the SWR1 complex; involved in transcriptional regulation through prevention of the spread of silent heterochromatin; Htz1p-containing nucleosomes facilitate RNA Pol II passage by affecting correct assembly and modification status of RNA Pol II elongation complexes and by favoring efficient nucleosome remodeling +S000030851 CDS YOL012C 15 303983 303579 C 2011-02-03 1996-07-31 +S000005371 ORF Verified YOL011W PLB3 lysophospholipase chromosome 15 S000007426 15 305349 307409 W 2011-02-03 1996-07-31 Phospholipase B (lysophospholipase) involved in lipid metabolism; hydrolyzes phosphatidylinositol and phosphatidylserine and displays transacylase activity in vitro; PLB3 has a paralog, PLB1, that arose from the whole genome duplication +S000030818 CDS YOL011W 15 305349 307409 W 2011-02-03 1996-07-31 +S000005370 ORF Verified YOL010W RCL1 rRNA-processing endoribonuclease chromosome 15 15 307938 309041 W 2011-02-03 1996-07-31 Endonuclease that cleaves pre-rRNA at site A2 for 18S rRNA biogenesis; subunit of U3-containing 90S preribosome processome complex involved in small ribosomal subunit assembly; stimulates Bms1p GTPase and U3 binding activity; similar to RNA cyclase-like proteins but no cyclase activity detected +S000037888 CDS YOL010W 15 307938 309041 W 2011-02-03 1996-07-31 +S000130135 ARS ARS1512 ARSXV-309 chromosome 15 15 309359 309925 2011-02-03 2009-05-05 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000005369 ORF Verified YOL009C MDM12 ERMES complex subunit MDM12 chromosome 15 L000002933 15 310139 309324 C 2011-02-03 1996-07-31 Mitochondrial outer membrane protein, ERMES complex subunit; required for transmission of mitochondria to daughter cells; required for mitophagy; may influence import and assembly of outer membrane beta-barrel proteins; ERMES complex is often co-localized with peroxisomes and with concentrated areas of pyruvate dehydrogenase +S000037008 CDS YOL009C 15 310139 309324 C 2011-02-03 1996-07-31 +S000005368 ORF Verified YOL008W COQ10 ubiquinone-binding protein COQ10 chromosome 15 15 310312 310935 W 2011-02-03 1996-07-31 Coenzyme Q (ubiquinone) binding protein; functions in the delivery of Q6 to its proper location for electron transport during respiration; START domain protein with homologs in bacteria and eukaryotes; respiratory growth defect of the null mutant is functionally complemented by human COQ10A +S000036984 CDS YOL008W 15 310312 310935 W 2011-02-03 1996-07-31 +S000005367 ORF Verified YOL007C CSI2 chromosome 15 L000004387 15 312367 311342 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)- fusion protein localizes to the mother side of the bud neck and the vacuole; YOL007C is not an essential gene +S000036219 CDS YOL007C 15 312367 311342 C 2011-02-03 1996-07-31 +S000005366 ORF Verified YOL006C TOP1 DNA topoisomerase 1|MAK17|MAK1 chromosome 15 L000002319 15 315387 313078 C 3 2011-02-03 1996-07-31 Topoisomerase I; nuclear enzyme that relieves torsional strain in DNA by cleaving and re-sealing the phosphodiester backbone; relaxes both positively and negatively supercoiled DNA; functions in replication, transcription, and recombination; role in processing ribonucleoside monophosphates in genomic DNA into irreversible single-strand breaks; enzymatic activity and interaction with Nsr1p are negatively regulated by polyphosphorylation +S000036071 CDS YOL006C 15 315387 313078 C 2011-02-03 1996-07-31 +S000005365 ORF Verified YOL005C RPB11 DNA-directed RNA polymerase II core subunit RPB11|B12.5 chromosome 15 L000001685 15 316175 315813 C 2011-02-03 1996-07-31 RNA polymerase II subunit B12.5; part of central core; similar to Rpc19p and bacterial alpha subunit +S000035928 CDS YOL005C 15 316175 315813 C 2011-02-03 1996-07-31 +S000005364 ORF Verified YOL004W SIN3 transcriptional regulator SIN3|UME4|SDS16|SDI1|RPD1|GAM2|CPE1 chromosome 15 L000001695 15 316938 321548 W 1 2011-02-03 1996-07-31 Component of both the Rpd3S and Rpd3L histone deacetylase complexes; involved in transcriptional repression and activation of diverse processes, including mating-type switching and meiosis; involved in the maintenance of chromosomal integrity +S000035863 CDS YOL004W 15 316938 321548 W 2011-02-03 1996-07-31 +S000005363 ORF Verified YOL003C PFA4 palmitoyltransferase PFA4 chromosome 15 15 322994 321858 C 2011-02-03 1996-07-31 Palmitoyltransferase with autoacylation activity; required for palmitoylation of amino acid permeases containing a C-terminal Phe-Trp-Cys site; required for modification of Chs3p; member of the DHHC family of putative palmitoyltransferases +S000034853 CDS YOL003C 15 322994 321858 C 2011-02-03 1996-07-31 +S000005362 ORF Verified YOL002C IZH2 PAQR-type receptor|PHO36 chromosome 15 15 324364 323411 C 2011-02-03 2003-01-09|1996-07-31 Plasma membrane receptor for plant antifungal osmotin; involved in zinc ion homeostasis, apoptosis; negatively regulates ZRT1 and other functionally divergent genes through CCCTC promoter motif (IzRE); modulates FET3 activity in iron-independent manner; affects gene expression by influencing balance of competition between Msn2p/Msn4p and Nrg1p/Nrg2p for binding to IzRE; transcription regulated by Zap1p, zinc, fatty acid levels; homolog of mammalian adiponectin receptor +S000034704 CDS YOL002C 15 324364 323411 C 2011-02-03 2003-01-09|1996-07-31 +S000005361 ORF Verified YOL001W PHO80 phoR|VAC5|TUP7|AGS3 chromosome 15 L000001426 15 325249 326130 W -1 2011-02-03 1996-07-31 Cyclin; interacts with cyclin-dependent kinase Pho85p; regulates the response to nutrient levels and environmental conditions, including the response to phosphate limitation and stress-dependent calcium signaling +S000034656 CDS YOL001W 15 325249 326130 W 2011-02-03 1996-07-31 +S000006476 centromere CEN15 CEN15 chromosome 15 L000000308 15 326702 326584 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome XV centromere +S000077290 centromere_DNA_Element_I CEN15 15 326702 326693 C 2011-02-03 2004-10-08 +S000077291 centromere_DNA_Element_II CEN15 15 326692 326609 C 2011-02-03 2004-10-08 +S000077292 centromere_DNA_Element_III CEN15 15 326608 326584 C 2011-02-03 2004-10-08 +S000005527 ORF Verified YOR001W RRP6 exosome nuclease subunit RRP6 chromosome 15 L000003540 15 326832 329033 W 2011-02-03 1996-07-31 Nuclear exosome exonuclease component; has 3'-5' exonuclease activity that is regulated by Lrp1p; involved in RNA processing, maturation, surveillance, degradation, tethering, and export; role in sn/snoRNAs precursor degradation; forms a stable heterodimer with Lrp1p; has similarity to E. coli RNase D and to human PM-Sc1 100 (EXOSC10); mutant displays reduced transcription elongation in the G-less-based +S000031325 CDS YOR001W 15 326832 329033 W 2011-02-03 1996-07-31 +S000005528 ORF Verified YOR002W ALG6 dolichyl-P-Glc:Man(9)GlcNAc(2)-PP-dolichol alpha-1,3-glucosyltransferase chromosome 15 L000003977 15 329417 331051 W 2011-02-03 1996-07-31 Alpha 1,3 glucosyltransferase; involved in transfer of oligosaccharides from dolichyl pyrophosphate to asparagine residues of proteins during N-linked protein glycosylation; C998T transition in human ortholog ALG6 causes carbohydrate-deficient glycoprotein syndrome type-Ic; wild-type human ortholog ALG6 can partially complement yeast alg6 mutant +S000032338 CDS YOR002W 15 329417 331051 W 2011-02-03 1996-07-31 +S000005529 ORF Verified YOR003W YSP3 putative subtilisin-like protease YSP3 chromosome 15 L000002552 15 331455 332891 W 2011-02-03 1996-07-31 Putative precursor of the subtilisin-like protease III; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YSP3 has a paralog, PRB1, that arose from the whole genome duplication +S000032469 CDS YOR003W 15 331455 332891 W 2011-02-03 1996-07-31 +S000005530 ORF Verified YOR004W UTP23 rRNA-binding ribosome biosynthesis protein UTP23 chromosome 15 15 333592 334356 W 2011-02-03 1996-07-31 Component of the small subunit processome; involved in 40S ribosomal subunit biogenesis; interacts with snR30 and is required for dissociation of snR30 from large pre-ribosomal particles; has homology to PINc domain protein Fcf1p, although the PINc domain of Utp23p is not required for function; essential protein +S000032573 CDS YOR004W 15 333592 334356 W 2011-02-03 1996-07-31 +S000005531 ORF Verified YOR005C DNL4 DNA ligase (ATP) DNL4|LIG4 chromosome 15 L000003479 15 337343 334509 C 2011-02-03 1996-07-31 DNA ligase required for nonhomologous end-joining (NHEJ); forms stable heterodimer with required cofactor Lif1p, interacts with Nej1p; involved in meiosis, not essential for vegetative growth; mutations in human ortholog lead to ligase IV syndrome and Dubowitz syndrome +S000032618 CDS YOR005C 15 337343 334509 C 2011-02-03 1996-07-31 +S000118489 ARS ARS1513 ARSXV-337 chromosome 15 15 337424 337491 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000005532 ORF Verified YOR006C TSR3 chromosome 15 15 338621 337680 C 2011-02-03 1996-07-31 Protein required for 20S pre-rRNA processing; involved in processing of the 20S pre-rRNA at site D to generate mature 18S rRNA; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus; relative distribution to the nucleus increases upon DNA replication stress +S000033336 CDS YOR006C 15 338621 337680 C 2011-02-03 1996-07-31 +S000005533 ORF Verified YOR007C SGT2 chromosome 15 L000004506 15 339978 338938 C 2011-02-03 1996-07-31 Glutamine-rich cytoplasmic cochaperone; serves as a scaffold bringing together Get4, Get5p, and other TRC complex members that are required to mediate posttranslational insertion of tail-anchored proteins into the ER membrane; interacts with the prion domain of Sup35p; amyloid sensor; plays a role in targeting chaperones to prion aggregates; similar to human cochaperone SGT; forms cytoplasmic foci upon DNA replication stress +S000033384 CDS YOR007C 15 339978 338938 C 2011-02-03 1996-07-31 +S000006705 tRNA_gene tR(ACG)O chromosome 15 L000003718 15 340371 340299 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030451 noncoding_exon tR(ACG)O 15 340371 340299 C 2011-02-03 2000-05-19 +S000007153 long_terminal_repeat YORCdelta9 YOLCdelta9 chromosome 15 15 340898 340598 C 2011-02-03 2000-05-19 Ty1 LTR +S000005534 ORF Verified YOR008C SLG1 WSC1|HCS77 chromosome 15 L000003080 15 342414 341278 C 2011-02-03 1996-07-31 Sensor-transducer of the stress-activated PKC1-MPK1 kinase pathway; involved in maintenance of cell wall integrity; required for mitophagy; involved in organization of the actin cytoskeleton; secretory pathway Wsc1p is required for the arrest of secretion response +S000033455 CDS YOR008C 15 342414 341278 C 2011-02-03 1996-07-31 +S000006431 ORF Uncharacterized YOR008C-A chromosome 15 L000003931 15 343081 342857 C 2011-02-03 1999-07-17 Putative protein of unknown function; includes a potential transmembrane domain; deletion results in slightly lengthened telomeres; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000034860 CDS YOR008C-A 15 343081 342857 C 2011-02-03 1999-07-17 +S000007628 ORF Dubious YOR008W-B chromosome 15 15 343929 344030 W 2006-01-05 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037258 CDS YOR008W-B 15 343929 344030 W 2006-01-05 2001-02-26 +S000005535 ORF Verified YOR009W TIR4 chromosome 15 15 344335 345798 W 2006-01-05 1996-07-31 Cell wall mannoprotein; expressed under anaerobic conditions and required for anaerobic growth; transcription is also induced by cold shock; member of the Srp1p/Tip1p family of serine-alanine-rich proteins +S000033574 CDS YOR009W 15 344335 345798 W 2006-01-05 1996-07-31 +S000005536 ORF Verified YOR010C TIR2 putative GPI-anchored mannoprotein|SRP2 chromosome 15 L000002312 15 346950 346195 C 2006-01-05 1996-07-31 Putative cell wall mannoprotein; member of the Srp1p/Tip1p family of serine-alanine-rich proteins; transcription is induced by cold shock and anaerobiosis; TIR2 has a paralog, TIR3, that arose from the whole genome duplication +S000034479 CDS YOR010C 15 346950 346195 C 2006-01-05 1996-07-31 +S000005537 ORF Verified YOR011W AUS1 ATP-binding cassette sterol transporter AUS1 chromosome 15 15 349679 353863 W 2006-01-05 1996-07-31 Plasma membrane sterol transporter of the ATP-binding cassette family; required, along with Pdr11p, for uptake of exogenous sterols and their incorporation into the plasma membrane; activity is stimulated by phosphatidylserine; sterol uptake is required for anaerobic growth because sterol biosynthesis requires oxygen; AUS1 has a paralog, PDR11, that arose from the whole genome duplication +S000035557 CDS YOR011W 15 349679 353863 W 2006-01-05 1996-07-31 +S000006747 tRNA_gene tT(AGU)O2 chromosome 15 L000003717 15 354113 354041 C 2006-01-05 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000037535 noncoding_exon tT(AGU)O2 15 354113 354041 C 2006-01-05 2000-05-19 +S000007159 long_terminal_repeat YORWsigma2 YOLWsigma2 chromosome 15 15 354128 354466 W 2006-01-05 2000-05-19 Ty3 LTR +S000007157 long_terminal_repeat YORWdelta10 YOLWdelta10 chromosome 15 15 354681 354958 W 2006-01-05 2000-05-19 Ty1 LTR +S000028581 ORF Uncharacterized YOR011W-A chromosome 15 15 355652 355858 W 2006-01-05 2003-07-29 Putative protein of unknown function +S000031328 CDS YOR011W-A 15 355652 355858 W 2006-01-05 2003-07-29 +S000005538 ORF Uncharacterized YOR012W chromosome 15 15 356543 356956 W 2006-01-05 1996-07-31 Putative protein of unknown function +S000035636 CDS YOR012W 15 356543 356956 W 2006-01-05 1996-07-31 +S000005539 ORF Dubious YOR013W IRC11 chromosome 15 15 356751 357221 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YOR012C; null mutant displays increased levels of spontaneous Rad52 foci +S000035766 CDS YOR013W 15 356751 357221 W 2006-01-05 1996-07-31 +S000005540 ORF Verified YOR014W RTS1 protein phosphatase 2A regulatory subunit RTS1|SCS1 chromosome 15 L000001786 15 357674 359947 W 2006-01-05 1996-07-31 B-type regulatory subunit of protein phosphatase 2A (PP2A); Rts1p and Cdc55p are alternative regulatory subunits for PP2A catalytic subunits, Pph21p and Pph22p; PP2A-Rts1p protects cohesin when recruited by Sgo1p to the pericentromere; highly enriched at centromeres in the absence of Cdc55p; required for maintenance of septin ring organization during cytokinesis, for ring disassembly in G1 and for dephosphorylation of septin, Shs1p; homolog of the mammalian B' subunit of PP2A +S000036675 CDS YOR014W 15 357674 359947 W 2006-01-05 1996-07-31 +S000005541 ORF Uncharacterized YOR015W chromosome 15 15 359993 360352 W 2006-01-05 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOR015W is not an essential gene +S000036735 CDS YOR015W 15 359993 360352 W 2006-01-05 1996-07-31 +S000005542 ORF Verified YOR016C ERP4 chromosome 15 L000004681 15 361084 360461 C 2006-01-05 1996-07-31 Member of the p24 family involved in ER to Golgi transport; similar to Emp24p and Erv25p; ERP4 has a paralog, ERP2, that arose from the whole genome duplication +S000036758 CDS YOR016C 15 361084 360461 C 2006-01-05 1996-07-31 +S000005543 ORF Verified YOR017W PET127 chromosome 15 L000001399 15 361412 363814 W 5.5 2006-01-05 1996-07-31 Protein with a role in 5'-end processing of mitochondrial RNAs; located in the mitochondrial membrane +S000036848 CDS YOR017W 15 361412 363814 W 2006-01-05 1996-07-31 +S000005544 ORF Verified YOR018W ROD1 ART4 chromosome 15 L000003079 15 364369 366882 W 2006-01-05 1996-07-31 Alpha-arrestin involved in ubiquitin-dependent endocytosis; activating dephosphorylation relays glucose signaling to transporter endocytosis; calcineurin dephosphorylation is required for Rsp5p-dependent internalization of agonist-occupied Ste2p, as part of signal desensitization; recruits Rsp5p to Ste2p via its 2 PPXY motifs; protein abundance increases in response to DNA replication stress; ROD1 has a paralog, ROG3, that arose from the whole genome duplication +S000037590 CDS YOR018W 15 364369 366882 W 2006-01-05 1996-07-31 +S000005545 ORF Verified YOR019W chromosome 15 15 368127 370319 W 2006-01-05 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; YOR019W has a paralog, JIP4, that arose from the whole genome duplication +S000037647 CDS YOR019W 15 368127 370319 W 2006-01-05 1996-07-31 +S000005546 ORF Verified YOR020C HSP10 CPN10 chromosome 15 L000000815 15 370844 370524 C 2006-01-05 1996-07-31 Mitochondrial matrix co-chaperonin; inhibits the ATPase activity of Hsp60p, a mitochondrial chaperonin; involved in protein folding and sorting in the mitochondria; 10 kD heat shock protein with similarity to E. coli groES +S000037650 CDS YOR020C 15 370844 370524 C 2006-01-05 1996-07-31 +S000028526 ORF Uncharacterized YOR020W-A chromosome 15 15 371685 371957 W 2006-01-05 2003-07-29 Putative protein of unknown function; conserved in A. gossypii; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000030330 CDS YOR020W-A 15 371685 371957 W 2006-01-05 2003-07-29 +S000005547 ORF Verified YOR021C SFM1 protein-arginine N-methyltransferase SFM1 chromosome 15 15 373439 372798 C 2006-01-05 1996-07-31 SPOUT methyltransferase; catalyzes omega-monomethylation of Rps3p on Arg-146; not an essential gene; predicted to be involved in rRNA processing and ribosome biogenesis and in biopolymer catabolism +S000030445 CDS YOR021C 15 373439 372798 C 2006-01-05 1996-07-31 +S000005548 ORF Verified YOR022C DDL1 putative carboxylic ester hydrolase chromosome 15 15 375857 373710 C 2006-01-05 1996-07-31 DDHD domain-containing phospholipase A1; mitochondrial matrix enzyme with sn-1-specific activity, hydrolyzing cardiolipin, PE, PC, PG and PA; implicated in remodeling of mitochondrial phospholipids; antagonistically regulated by Aft1p and Aft2p; in humans, mutations in DDHD1 and DDHD2 genes cause specific types of hereditary spastic paraplegia, while DDL1-defective yeast share similar phenotypes such as mitochondrial dysfunction and defects in lipid metabolism +S000030587 CDS YOR022C 15 375857 373710 C 2006-01-05 1996-07-31 +S000005549 ORF Verified YOR023C AHC1 chromosome 15 15 377712 376012 C 2006-01-05 1996-07-31 Subunit of the Ada histone acetyltransferase complex; required for structural integrity of the complex; Ahc2p and Ahc1p are unique to the ADA complex and not shared with the related SAGA and SLIK complexes; Ahc2p may tether Ahc1p to the complex +S000030673 CDS YOR023C 15 377712 376012 C 2006-01-05 1996-07-31 +S000005550 ORF Dubious YOR024W IRC12 chromosome 15 15 377847 378170 W 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031578 CDS YOR024W 15 377847 378170 W 2006-01-05 1996-07-31 +S000005551 ORF Verified YOR025W HST3 NAD-dependent histone deacetylase HST3 chromosome 15 L000003042 15 378219 379562 W 2006-01-05 1996-07-31 Member of the Sir2 family of NAD(+)-dependent protein deacetylases; involved along with Hst4p in telomeric silencing, cell cycle progression, radiation resistance, genomic stability and short-chain fatty acid metabolism +S000031696 CDS YOR025W 15 378219 379562 W 2006-01-05 1996-07-31 +S000005552 ORF Verified YOR026W BUB3 PAC9 chromosome 15 L000000198 15 379781 380806 W 2006-01-05 1996-07-31 Kinetochore checkpoint WD40 repeat protein; localizes to kinetochores during prophase and metaphase, delays anaphase in the presence of unattached kinetochores; forms complexes with Mad1p-Bub1p and with Cdc20p, binds Mad2p and Mad3p; functions at kinetochore to activate APC/C-Cdc20p for normal mitotic progression +S000031797 CDS YOR026W 15 379781 380806 W 2006-01-05 1996-07-31 +S000005553 ORF Verified YOR027W STI1 Hsp90 cochaperone STI1 chromosome 15 L000002129 15 381053 382822 W 2006-01-05 1996-07-31 Hsp90 cochaperone; regulates spatial organization of amyloid-like proteins in the cytosol, thereby buffering the proteotoxicity caused by amyloid-like proteins; interacts with the Ssa group of the cytosolic Hsp70 chaperones and activates Ssa1p ATPase activity; interacts with Hsp90 chaperones and inhibits their ATPase activity; homolog of mammalian Hop +S000031906 CDS YOR027W 15 381053 382822 W 2006-01-05 1996-07-31 +S000005554 ORF Verified YOR028C CIN5 YAP4|HAL6 chromosome 15 L000000339|L000004263 15 384420 383533 C 2006-01-05 1996-07-31 Basic leucine zipper (bZIP) transcription factor of the yAP-1 family; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; mediates pleiotropic drug resistance and salt tolerance; nuclearly localized under oxidative stress and sequestered in the cytoplasm by Lot6p under reducing conditions; CIN5 has a paralog, YAP6, that arose from the whole genome duplication +S000032760 CDS YOR028C 15 384420 383533 C 2006-01-05 1996-07-31 +S000005555 ORF Uncharacterized YOR029W chromosome 15 15 384600 384935 W 2006-01-05 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOR029W is not an essential gene +S000032920 CDS YOR029W 15 384600 384935 W 2006-01-05 1996-07-31 +S000005556 ORF Verified YOR030W DFG16 ZRG12|ECM41 chromosome 15 L000003877 15 386825 388684 W 2006-01-05 1996-07-31 Probable multiple transmembrane protein; involved in diploid invasive and pseudohyphal growth upon nitrogen starvation; is glycosylated and phosphorylated; interacts with Rim21p and Rim9p in the plasma membrane to form a pH-sensing complex in the Rim101 pathway and is required to maintain Rim21p levels; required for accumulation of processed Rim101p +S000033591 CDS YOR030W 15 386825 388684 W 2006-01-05 1996-07-31 +S000005557 blocked_reading_frame YOR031W CRS5 metallothionein CRS5 chromosome 15 L000000421 15 389213 389422 W 2006-01-05 1996-07-31 Copper-binding metallothionein; required for wild-type copper resistance +S000033679 CDS YOR031W 15 389213 389422 W 2006-01-05 1996-07-31 +S000005558 ORF Verified YOR032C HMS1 chromosome 15 L000004441 15 391075 389771 C 2006-01-05 1996-07-31 bHLH protein with similarity to myc-family transcription factors; overexpression confers hyperfilamentous growth and suppresses the pseudohyphal filamentation defect of a diploid mep1 mep2 homozygous null mutant +S000033735 CDS YOR032C 15 391075 389771 C 2006-01-05 1996-07-31 +S000028710 ORF Uncharacterized YOR032W-A chromosome 15 15 392176 392376 W 2006-01-05 2003-07-29 Protein of unknown function; SWAT-GFP and seamless-GFP fusion proteins localize to the endoplasmic reticulum; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032675 CDS YOR032W-A 15 392176 392376 W 2006-01-05 2003-07-29 +S000005559 ORF Verified YOR033C EXO1 Rad2 family nuclease EXO1|DHS1 chromosome 15 L000000505|L000003929 15 394524 392416 C 2006-01-05 1996-07-31 5'-3' exonuclease and flap-endonuclease; involved in recombination, double-strand break repair, MMS2 error-free branch of the post replication (PRR) pathway and DNA mismatch repair; role in telomere maintenance; member of the Rad2p nuclease family, with conserved N and I nuclease domains; relative distribution to the nucleus increases upon DNA replication stress; EXO1 has a paralog, DIN7, that arose from the whole genome duplication +S000034621 CDS YOR033C 15 394524 392416 C 2006-01-05 1996-07-31 +S000005560 ORF Verified YOR034C AKR2 putative palmitoyltransferase AKR2 chromosome 15 L000004052 15 397086 394837 C 2006-01-05 1996-07-31 Ankyrin repeat-containing protein; member of a family of putative palmitoyltransferases containing an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain; possibly involved in constitutive endocytosis of Ste3p; AKR2 has a paralog, AKR1, that arose from the whole genome duplication +S000034777 CDS YOR034C 15 397086 394837 C 2006-01-05 1996-07-31 +S000028856 ORF Uncharacterized YOR034C-A chromosome 15 15 397668 397426 C 2006-01-05 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034569 CDS YOR034C-A 15 397668 397426 C 2006-01-05 2003-07-29 +S000005561 ORF Verified YOR035C SHE4 DIM1 chromosome 15 L000004572 15 400104 397735 C 2006-01-05 1996-07-31 Protein containing a UCS (UNC-45/CRO1/SHE4) domain; binds to myosin motor domains to regulate myosin function; involved in endocytosis, polarization of the actin cytoskeleton, and asymmetric mRNA localization +S000034897 CDS YOR035C 15 400104 397735 C 2006-01-05 1996-07-31 +S000005562 ORF Verified YOR036W PEP12 SNAP receptor PEP12|VPT13|VPS6|VPL6 chromosome 15 L000001379 15 400348 401214 W -5 2006-01-05 1996-07-31 Target membrane receptor (t-SNARE); for vesicular intermediates traveling between the Golgi apparatus and the vacuole; controls entry of biosynthetic, endocytic, and retrograde traffic into the prevacuolar compartment; syntaxin +S000035899 CDS YOR036W 15 400348 401214 W 2006-01-05 1996-07-31 +S000005563 ORF Verified YOR037W CYC2 oxidoreductase chromosome 15 L000000449 15 401555 402655 W 12 2006-01-05 2003-09-22|1996-07-31 Mitochondrial peripheral inner membrane protein; contains a FAD cofactor in a domain exposed in the intermembrane space; exhibits redox activity in vitro; likely participates in ligation of heme to acytochromes c and c1 (Cyc1p and Cyt1p) +S000036064 CDS YOR037W 15 401555 402655 W 2006-01-05 2003-09-22|1996-07-31 +S000005564 ORF Verified YOR038C HIR2 SPT1 chromosome 15 L000000777 15 405388 402761 C 2006-01-05 1996-07-31 Subunit of HIR nucleosome assembly complex; involved in regulation of histone gene transcription; recruits Swi-Snf complexes to histone gene promoters; promotes heterochromatic gene silencing with Asf1p; relocalizes to the cytosol in response to hypoxia +S000036118 CDS YOR038C 15 405388 402761 C 2006-01-05 1996-07-31 +S000005565 ORF Verified YOR039W CKB2 casein kinase 2 regulatory subunit CKB2 chromosome 15 L000000345 15 405768 406544 W 2006-01-05 1996-07-31 Beta' regulatory subunit of casein kinase 2 (CK2); a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerase +S000036946 CDS YOR039W 15 405768 406544 W 2006-01-05 1996-07-31 +S000005566 ORF Verified YOR040W GLO4 hydroxyacylglutathione hydrolase GLO4 chromosome 15 L000003489 15 407064 407921 W 2006-01-05 1996-07-31 Mitochondrial glyoxalase II; catalyzes the hydrolysis of S-D-lactoylglutathione into glutathione and D-lactate; GLO4 has a paralog, GLO2, that arose from the whole genome duplication +S000037742 CDS YOR040W 15 407064 407921 W 2006-01-05 1996-07-31 +S000007292 snoRNA_gene snR9 SNR9 chromosome 15 L000001964 15 408134 407948 C 2006-01-05 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2340 and U2345 +S000034330 noncoding_exon snR9 15 408134 407948 C 2006-01-05 2000-05-19 +S000005568 ORF Verified YOR042W CUE5 ubiquitin-binding protein CUE5 chromosome 15 15 408425 409660 W 2006-01-05 1996-07-31 Ubiquitin-binding protein; functions as ubiquitin-Atg8p adaptor in ubiquitin-dependent autophagy; serves as proteaphagy receptor for inactivated 26S proteasomes; contains CUE domain that binds ubiquitin, which may facilitate intramolecular monoubiquitination; CUE5 has a paralog, DON1, that arose from the whole genome duplication; human TOLLIP is a functional CUE-domain homolog, can complement yeast null mutant, rescuing hypersensitivity of cue5 null mutant cells to Htt-96Q +S000029840 CDS YOR042W 15 408425 409660 W 2006-01-05 1996-07-31 +S000005567 ORF Dubious YOR041C SRF5 chromosome 15 15 408789 408358 C 2006-01-05 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 85% of ORF overlaps the uncharacterized gene CUE5; deletion in cyr1 mutant results in loss of stress resistance +S000037769 CDS YOR041C 15 408789 408358 C 2006-01-05 1996-07-31 +S000006453 snoRNA_gene snR62 SNR62 chromosome 15 L000004531 15 409864 409765 C 2006-01-05 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U1888 +S000030839 noncoding_exon snR62 15 409864 409765 C 2006-01-05 2000-05-19 +S000005569 ORF Verified YOR043W WHI2 chromosome 15 L000002485 15 410870 412330 W 9 2006-01-05 1996-07-31 Protein required for full activation of the general stress response; required with binding partner Psr1p, possibly through Msn2p dephosphorylation; regulates growth during the diauxic shift; negative regulator of G1 cyclin expression; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cell periphery +S000030841 CDS YOR043W 15 410870 412330 W 2006-01-05 1996-07-31 +S000005570 ORF Verified YOR044W IRC23 chromosome 15 15 413007 413480 W 2006-01-05 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion localizes to the ER; null mutant displays increased levels of spontaneous Rad52p foci; IRC23 has a paralog, BSC2, that arose from the whole genome duplication +S000030924 CDS YOR044W 15 413007 413480 W 2006-01-05 1996-07-31 +S000005571 ORF Verified YOR045W TOM6 MOM8B|ISP6 chromosome 15 L000000877 15 413852 414037 W 2006-01-05 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; promotes assembly and stability of the TOM complex +S000030996 CDS YOR045W 15 413852 414037 W 2006-01-05 1996-07-31 +S000005572 ORF Verified YOR046C DBP5 ATP-dependent RNA helicase DBP5|RAT8 chromosome 15 L000003292 15 415907 414459 C 2011-02-03 1996-07-31 Cytoplasmic ATP-dependent RNA helicase of the DEAD-box family; involved in mRNA export from the nucleus, remodeling messenger ribonucleoprotein particles (mRNPs), with ATPase activity stimulated by Gle1p, IP6 and Nup159p; involved in translation termination along with Sup45p (eRF1); role in the cellular response to heat stress +S000031032 CDS YOR046C 15 415907 414459 C 2011-02-03 1996-07-31 +S000005573 ORF Verified YOR047C STD1 SFS3|MSN3 chromosome 15 L000002111 15 417681 416347 C 2011-02-03 1996-07-31 Protein involved in control of glucose-regulated gene expression; interacts with kinase Snf1p, glucose sensors Snf3p and Rgt2p, TATA-binding Spt15p; regulator of transcription factor Rgt1p; interactions with Pma1p appear to propagate [GAR+]; STD1 has a paralog, MTH1, that arose from the whole genome duplication +S000032001 CDS YOR047C 15 417681 416347 C 2011-02-03 1996-07-31 +S000005574 ORF Verified YOR048C RAT1 ssRNA exonuclease RAT1|XRN2|TAP1|HKE1 chromosome 15 L000001584 15 421650 418630 C 17.1 2011-02-03 1996-07-31 Nuclear 5' to 3' single-stranded RNA exonuclease; involved in RNA metabolism, including rRNA and snoRNA processing, as well as poly (A+) dependent and independent mRNA transcription termination; required for cotranscriptional pre-rRNA cleavage; displaces Cdk1p from elongating transcripts, especially as RNAPII reaches the poly(A) site, negatively regulates phosphorylation of the CTD of RNAPII, and inhibits RNAPII transcriptional elongation +S000032091 CDS YOR048C 15 421650 418630 C 2011-02-03 1996-07-31 +S000005575 ORF Verified YOR049C RSB1 phospholipid-translocating ATPase RSB1 chromosome 15 15 423732 422668 C 2011-02-03 1996-07-31 Putative sphingoid long-chain base (LCB) efflux transporter; integral membrane transporter that localizes to the plasma membrane and may transport long chain bases (LCBs) from the cytoplasmic side toward the extracytoplasmic side of the membrane; role in glycerophospholipid translocation; suppressor of the sphingoid LCB sensitivity of an LCB-lyase mutation +S000032150 CDS YOR049C 15 423732 422668 C 2011-02-03 1996-07-31 +S000005576 ORF Dubious YOR050C YOR29-01 chromosome 15 15 424617 424270 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant is viable +S000033916 CDS YOR050C 15 424617 424270 C 2011-02-03 1996-07-31 +S000005577 ORF Verified YOR051C ETT1 NRO1|YOR29-02 chromosome 15 15 426084 424846 C 2011-02-03 1996-07-31 Nuclear protein that inhibits replication of Brome mosaic virus; S. cerevisiae is a model system for studying replication of positive-strand RNA viruses in their natural hosts; deletion increases stop codon readthrough +S000034062 CDS YOR051C 15 426084 424846 C 2011-02-03 1996-07-31 +S000005578 ORF Verified YOR052C TMC1 YOR29-03 chromosome 15 15 427224 426772 C 2011-02-03 1996-07-31 AN1-type zinc finger protein, effector of proteotoxic stress response; stress-inducible transcriptional target of Rpn4p; induced by nitrogen limitation, weak acid, misfolded proteins; short-lived protein, degraded by proteasome; may protect cells from trivalent metalloid induced proteotoxicity; contains PACE promoter element; ortholog of human AIRAP, which stimulates proteasome activity in response to arsenic; protein abundance increases under DNA replication stress +S000034154 CDS YOR052C 15 427224 426772 C 2011-02-03 1996-07-31 +S000005579 ORF Dubious YOR053W YOR29-04 chromosome 15 15 427817 428158 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene VHS3/YOR054C +S000035170 CDS YOR053W 15 427817 428158 W 2011-02-03 1996-07-31 +S000005581 ORF Dubious YOR055W YOR29-06 chromosome 15 15 429478 429912 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035354 CDS YOR055W 15 429478 429912 W 2011-02-03 1996-07-31 +S000005580 ORF Verified YOR054C VHS3 phosphopantothenoylcysteine decarboxylase complex subunit VHS3|YOR29-05 chromosome 15 15 429857 427833 C 2011-02-03 1996-07-31 Negative regulatory subunit of protein phosphatase 1 Ppz1p; involved in coenzyme A biosynthesis; subunit of the phosphopantothenoylcysteine decarboxylase (PPCDC; Cab3p, Sis2p, Vhs3p) complex and the CoA-Synthesizing Protein Complex (CoA-SPC: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p) +S000035210 CDS YOR054C 15 429857 427833 C 2011-02-03 1996-07-31 +S000005582 ORF Verified YOR056C NOB1 rRNA-binding endoribonuclease|YOR29-07 chromosome 15 15 431626 430247 C 2011-02-03 1996-07-31 Protein involved in proteasomal and 40S ribosomal subunit biogenesis; required for cleavage of the 20S pre-rRNA to generate the mature 18S rRNA; cleavage is activated by Fun12p, a GTPase and translation initiation factor; relocalizes from nucleus to nucleolus upon DNA replication stress +S000035381 CDS YOR056C 15 431626 430247 C 2011-02-03 1996-07-31 +S000005583 ORF Verified YOR057W SGT1 co-chaperone SGT1|YOR29-08 chromosome 15 L000003443|L000004087 15 432186 433373 W 2011-02-03 1996-07-31 Cochaperone protein; regulates activity of adenylyl cyclase Cyr1p; involved in kinetochore complex assembly; associates with the SCF (Skp1p/Cdc53p/F box protein) ubiquitin ligase complex; acts as a linker between Skp1p and HSP90 complexes; protein abundance increases in response to DNA replication stress +S000036316 CDS YOR057W 15 432186 433373 W 2011-02-03 1996-07-31 +S000005584 ORF Verified YOR058C ASE1 YOR29-09 chromosome 15 L000000125 15 436345 433688 C 2011-02-03 1996-07-31 Mitotic spindle midzone-localized microtubule bundling protein; microtubule-associated protein (MAP) family member; required for spindle elongation and stabilization; undergoes cell cycle-regulated degradation by anaphase promoting complex; potential Cdc28p substrate; relative distribution to microtubules decreases upon DNA replication stress +S000036352 CDS YOR058C 15 436345 433688 C 2011-02-03 1996-07-31 +S000007162 long_terminal_repeat YORCdelta11 chromosome 15 15 438483 438175 C 2011-02-03 2000-05-19 Ty1 LTR +S000006634 tRNA_gene tK(UUU)O chromosome 15 L000003707 15 438643 438738 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034218 intron tK(UUU)O 15 438680 438702 W 2011-02-03 2000-05-19 +S000034216 noncoding_exon tK(UUU)O 15 438643 438679 W 2011-02-03 2000-05-19 +S000034217 noncoding_exon tK(UUU)O 15 438703 438738 W 2011-02-03 2000-05-19 +S000005585 ORF Verified YOR059C LPL1 putative hydrolase|YOR29-10 chromosome 15 15 440258 438906 C 2011-02-03 1996-07-31 Phospholipase; contains lipase specific GXSXG motif; maintains lipid droplet (LD) morphology; induced by transcription factor Rpn4p; protein abundance increases in response to DNA replication stress +S000036452 CDS YOR059C 15 440258 438906 C 2011-02-03 1996-07-31 +S000005586 ORF Verified YOR060C SLD7 YOR29-11 chromosome 15 15 441163 440390 C 2011-02-03 1996-07-31 Protein with a role in chromosomal DNA replication; interacts with Sld3p and reduces its affinity for Cdc45p; deletion mutant has aberrant mitochondria +S000037458 CDS YOR060C 15 441163 440390 C 2011-02-03 1996-07-31 +S000005587 ORF Verified YOR061W CKA2 casein kinase 2 catalytic subunit CKA2|YOR29-12 chromosome 15 L000000344 15 441534 442553 W 2011-02-03 1996-07-31 Alpha' catalytic subunit of casein kinase 2 (CK2); CK2 is a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerases; protein abundance increases in response to DNA replication stress; regulates Fkh1p-mediated donor preference during mating-type switching +S000037585 CDS YOR061W 15 441534 442553 W 2011-02-03 1996-07-31 +S000005588 ORF Uncharacterized YOR062C YOR29-13 chromosome 15 15 443531 442725 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Reg1p; expression regulated by glucose and Rgt1p; GFP-fusion protein is induced in response to the DNA-damaging agent MMS; YOR062C has a paralog, YKR075C, that arose from the whole genome duplication +S000037610 CDS YOR062C 15 443531 442725 C 2011-02-03 1996-07-31 +S000005589 ORF Verified YOR063W RPL3 uL3|ribosomal 60S subunit protein L3|rp1|YL1|L3|YOR29-14|TCM1|MAK8 chromosome 15 15 444686 445849 W 22 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L3; homologous to mammalian ribosomal protein L3 and bacterial L3; plays an important role in function of eIF5B in stimulating 3' end processing of 18S rRNA in context of 80S ribosomes that have not yet engaged in translation; involved in replication and maintenance of killer double stranded RNA virus +S000030496 CDS YOR063W 15 444686 445849 W 2011-02-03 1996-07-31 +S000005590 ORF Verified YOR064C YNG1 YOR29-15 chromosome 15 S000007517 15 446738 446079 C 2011-02-03 1996-07-31 Subunit of the NuA3 histone acetyltransferase complex; this complex acetylates histone H3; contains PHD finger domain that interacts with methylated histone H3; shares significant sequence identity with the human candidate tumor suppressor p33-ING1 in C-terminal region +S000030526 CDS YOR064C 15 446738 446079 C 2011-02-03 1996-07-31 +S000005591 ORF Verified YOR065W CYT1 ubiquinol--cytochrome-c reductase catalytic subunit CYT1|YOR29-16|CTC1 chromosome 15 L000000472 15 447439 448368 W 2011-02-03 1996-07-31 Cytochrome c1; component of the mitochondrial respiratory chain; expression is regulated by the heme-activated, glucose-repressed Hap2p/3p/4p/5p CCAAT-binding complex +S000030648 CDS YOR065W 15 447439 448368 W 2011-02-03 1996-07-31 +S000005592 ORF Verified YOR066W MSA1 YOR29-17 chromosome 15 15 449436 451325 W 2011-02-03 1996-07-31 Activator of G1-specific transcription factors MBF and SBF; involved in regulation of the timing of G1-specific gene transcription and cell cycle initiation; localization is cell-cycle dependent and regulated by Cdc28p phosphorylation; MSA1 has a paralog, MSA2, that arose from the whole genome duplication +S000030728 CDS YOR066W 15 449436 451325 W 2011-02-03 1996-07-31 +S000005593 ORF Verified YOR067C ALG8 dolichyl-P-Glc:Glc1Man(9)GlcNAc(2)-PP-dolichol alpha-1,3-glucosyltransferase|YOR29-18 chromosome 15 L000000079 15 453462 451729 C 2011-02-03 1996-07-31 Glucosyl transferase; involved in N-linked glycosylation; adds glucose to the dolichol-linked oligosaccharide precursor prior to transfer to protein during lipid-linked oligosaccharide biosynthesis; similar to Alg6p; human homolog ALG8 can complement yeast null mutant +S000030756 CDS YOR067C 15 453462 451729 C 2011-02-03 1996-07-31 +S000005595 ORF Verified YOR069W VPS5 sorting nexin 1|YOR29-20|VPT5|PEP10|GRD2 chromosome 15 L000002920 15 453768 455795 W 2011-02-03 2004-04-21|1996-07-31 Nexin-1 homolog; required for localizing membrane proteins from a prevacuolar/late endosomal compartment back to late Golgi; structural component of retromer membrane coat complex; forms a retromer subcomplex with Vps17p; required for recruiting the retromer complex to the endosome membranes; VPS5 has a paralog, YKR078W, that arose from the whole genome duplication +S000031779 CDS YOR069W 15 453768 455795 W 2011-02-03 2004-04-21|1996-07-31 +S000005594 ORF Verified YOR068C VAM10 YOR29-19 chromosome 15 15 454213 453869 C 2011-02-03 1996-07-31 Protein involved in vacuole morphogenesis; acts at an early step of homotypic vacuole fusion that is required for vacuole tethering +S000031602 CDS YOR068C 15 454213 453869 C 2011-02-03 1996-07-31 +S000005596 ORF Verified YOR070C GYP1 YOR29-21 chromosome 15 L000004377 15 457820 455907 C 2011-02-03 1996-07-31 Cis-golgi GTPase-activating protein (GAP) for yeast Rabs; the Rab family members are Ypt1p (in vivo) and for Ypt1p, Sec4p, Ypt7p, and Ypt51p (in vitro); involved in vesicle docking and fusion +S000033733 CDS YOR070C 15 457820 455907 C 2011-02-03 1996-07-31 +S000005597 ORF Verified YOR071C NRT1 nicotinamide riboside transporter|THI71|YOR29-22 chromosome 15 15 461276 459480 C 2011-02-03 1996-07-31 High-affinity nicotinamide riboside transporter; also transports thiamine with low affinity; major transporter for 5-aminoimidazole-4-carboxamide-1-beta-D-ribofuranoside (acadesine) uptake; shares sequence similarity with Thi7p and Thi72p; proposed to be involved in 5-fluorocytosine sensitivity +S000033867 CDS YOR071C 15 461276 459480 C 2011-02-03 1996-07-31 +S000005598 ORF Dubious YOR072W YOR29-23 chromosome 15 15 461502 461816 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious gene YOR072W-A; diploid deletion strains are methotrexate, paraquat and wortmannin sensitive +S000034814 CDS YOR072W 15 461502 461816 W 2011-02-03 1996-07-31 +S000028582 ORF Dubious YOR072W-A chromosome 15 15 461791 462039 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR072W; originally identified by fungal homology and RT-PCR +S000031329 CDS YOR072W-A 15 461791 462039 W 2011-02-03 2003-07-29 +S000006688 tRNA_gene tP(UGG)O2 SUF11 chromosome 15 L000002159|L000003708 15 464450 464551 W 30 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons +S000031047 intron tP(UGG)O2 15 464486 464515 W 2011-02-03 2000-05-19 +S000031045 noncoding_exon tP(UGG)O2 15 464450 464485 W 2011-02-03 2000-05-19 +S000031046 noncoding_exon tP(UGG)O2 15 464516 464551 W 2011-02-03 2000-05-19 +S000028516 ORF Uncharacterized YOR072W-B chromosome 15 15 464469 464630 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000030289 CDS YOR072W-B 15 464469 464630 W 2011-02-03 2003-07-29 +S000005599 ORF Verified YOR073W SGO1 YOR29-24 chromosome 15 15 464771 466543 W 2011-02-03 1996-07-31 Component of the spindle checkpoint; involved in sensing lack of tension on mitotic chromosomes; protects centromeric Rec8p at meiosis I; required for accurate chromosomal segregation at meiosis II and for mitotic chromosome stability; recruits condensin to the pericentric region of chromosomes during meiosis; dissociates from pericentromeres when sister kinetochores are under tension +S000034945 CDS YOR073W 15 464771 466543 W 2011-02-03 1996-07-31 +S000028583 ORF Dubious YOR073W-A chromosome 15 15 467390 467623 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially/completely overlaps the verified ORF CDC21/YOR074C; identified by RT-PCR +S000031330 CDS YOR073W-A 15 467390 467623 W 2011-02-03 2003-07-29 +S000005600 ORF Verified YOR074C CDC21 thymidylate synthase|YOR29-25|TMP1|CRT9 chromosome 15 L000000260 15 467589 466675 C 32 2011-02-03 1996-07-31|2005-12-01 Thymidylate synthase; required for de novo biosynthesis of pyrimidine deoxyribonucleotides; expression is induced at G1/S; human homolog TYMSOS can complement yeast cdc21 temperature-sensitive mutant at restrictive temperature +S000034991 CDS YOR074C 15 467589 466675 C 2011-02-03 1996-07-31|2005-12-01 +S000005601 ORF Verified YOR075W UFE1 YOR29-26 chromosome 15 L000002637 15 468212 469252 W 2011-02-03 1996-07-31 t-SNARE protein required for retrograde vesicular traffic; involved in Sey1p-independent homotypic ER fusion; required for efficient nuclear fusion during mating; forms a complex with the SNAREs Sec22p, Sec20p and Use1p to mediate fusion of Golgi-derived vesicles at the ER +S000035197 CDS YOR075W 15 468212 469252 W 2011-02-03 1996-07-31 +S000005602 ORF Verified YOR076C SKI7 YOR29-27 chromosome 15 15 471620 469377 C 2011-02-03 1996-07-31 GTP-binding protein that couples the Ski complex and exosome; putative pseudo-translational GTPase involved in 3'-to-5' mRNA decay pathway; interacts with both the cytoplasmic exosome and the Ski complex; eRF3-like domain targets nonstop mRNA for degradation; null mutants have a superkiller phenotype; SKI7 has a paralog, HBS1, that arose from the whole genome duplication +S000036014 CDS YOR076C 15 471620 469377 C 2011-02-03 1996-07-31 +S000005603 ORF Verified YOR077W RTS2 YOR29-28 chromosome 15 L000001787 15 471899 472597 W 2011-02-03 1996-07-31 Basic zinc-finger protein; similar to human and mouse Kin17 proteins which are chromatin-associated proteins involved in UV response and DNA replication +S000036174 CDS YOR077W 15 471899 472597 W 2011-02-03 1996-07-31 +S000005604 ORF Verified YOR078W BUD21 YOR29-29|UTP16 chromosome 15 15 472725 473369 W 2011-02-03 1996-07-31 Component of small ribosomal subunit (SSU) processosome; this complex contains U3 snoRNA; required at post-transcriptional step for efficient retrotransposition; absence results in decreased Ty1 Gag:GFP protein levels; originally isolated as bud-site selection mutant that displays a random budding pattern +S000036267 CDS YOR078W 15 472725 473369 W 2011-02-03 1996-07-31 +S000005605 ORF Verified YOR079C ATX2 Mn(2+) transporter ATX2|YOR29-30 chromosome 15 L000003290 15 474416 473475 C 2011-02-03 1996-07-31 Golgi membrane protein involved in manganese homeostasis; overproduction suppresses the sod1 (copper, zinc superoxide dismutase) null mutation +S000036294 CDS YOR079C 15 474416 473475 C 2011-02-03 1996-07-31 +S000005606 ORF Verified YOR080W DIA2 DNA-binding SCF ubiquitin ligase subunit DIA2|YOR29-31 chromosome 15 15 474594 476792 W 2011-02-03 1996-07-31|2010-01-05 Origin-binding F-box protein; forms SCF ubiquitin ligase complex with Skp1p and Cdc53p; functions in ubiquitination of silent chromatin structural protein Sir4p; required to target Cdc6p for destruction during G1 phase; required for deactivation of Rad53 checkpoint kinase, completion of DNA replication during recovery from DNA damage, assembly of RSC complex, RSC-mediated transcription regulation, and nucleosome positioning; involved in invasive and pseudohyphal growth +S000035995 CDS YOR080W 15 474594 476792 W 2011-02-03 1996-07-31|2010-01-05 +S000005607 ORF Verified YOR081C TGL5 STC2 chromosome 15 15 479188 476939 C 2011-02-03 1996-07-31 Bifunctional triacylglycerol lipase and LPA acyltransferase; lipid particle-localized triacylglycerol (TAG) lipase involved in triacylglycerol mobilization; catalyzes acylation of lysophosphatidic acid (LPA); potential Cdc28p substrate; TGL5 has a paralog, TGL4, that arose from the whole genome duplication +S000037799 CDS YOR081C 15 479188 476939 C 2011-02-03 1996-07-31 +S000005609 ORF Verified YOR083W WHI5 transcriptional repressor WHI5 chromosome 15 15 479533 480420 W 2011-02-03 1996-07-31 Repressor of G1 transcription; binds to SCB binding factor (SBF) at SCB target promoters in early G1; dilution of Whi5p concentration during cell growth determines cell size; phosphorylation of Whi5p by the CDK, Cln3p/Cdc28p relieves repression and promoter binding by Whi5, and contributes to both the determination of critical cell size at START and cell fate; periodically expressed in G1 +S000029953 CDS YOR083W 15 479533 480420 W 2011-02-03 1996-07-31 +S000005608 ORF Dubious YOR082C chromosome 15 15 479637 479296 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YOR083W +S000037872 CDS YOR082C 15 479637 479296 C 2011-02-03 1996-07-31 +S000005610 ORF Verified YOR084W LPX1 triglyceride lipase chromosome 15 15 480587 481750 W 2011-02-03 1996-07-31 Peroxisomal matrix-localized lipase; required for normal peroxisome morphology; contains a peroxisomal targeting signal type 1 (PTS1) and a lipase motif; peroxisomal import requires the PTS1 receptor, Pex5p and self-interaction; transcriptionally activated by Yrm1p along with genes involved in multidrug resistance; oleic acid inducible +S000030939 CDS YOR084W 15 480587 481750 W 2011-02-03 1996-07-31 +S000005611 ORF Verified YOR085W OST3 dolichyl-diphosphooligosaccharide--protein glycotransferase OST3 chromosome 15 L000002943 15 482033 483085 W 2011-02-03 1996-07-31 Gamma subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins; Ost3p is important for N-glycosylation of a subset of proteins +S000031015 CDS YOR085W 15 482033 483085 W 2011-02-03 1996-07-31 +S000005612 ORF Verified YOR086C TCB1 tricalbin chromosome 15 15 486779 483219 C 2011-02-03 1996-07-31 Lipid-binding ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to plasma membrane and regulate PI4P levels by controlling access of Sac1p phosphatase to its substrate PI4P in PM; contains 3 calcium and lipid binding domains; non-tagged protein also localizes to mitochondria; C-termini of Tcb1p, Tcb2p and Tcb3p interact; TCB1 has a paralog, TCB2, that arose from the whole genome duplication +S000031064 CDS YOR086C 15 486779 483219 C 2011-02-03 1996-07-31 +S000006676 tRNA_gene tN(GUU)O2 chromosome 15 L000003709 15 487439 487512 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000035653 noncoding_exon tN(GUU)O2 15 487439 487512 W 2011-02-03 2000-05-19 +S000005613 ORF Verified YOR087W YVC1 TRPY1|YOR088W chromosome 15 15 487707 489734 W 2011-02-03 2003-01-09|1996-07-31 Vacuolar cation channel; mediates release of Ca(2+) from the vacuole in response to hyperosmotic shock +S000031212 CDS YOR087W 15 487707 489734 W 2011-02-03 2003-01-09|1996-07-31 +S000007554 ARS ARS1501 ARS1514|ARS245 chromosome 15 15 489683 489942 2014-11-18 2000-10-17|2014-11-18 Autonomously Replicating Sequence +S000178184 ARS_consensus_sequence ARS1501 15 489891 489907 W 2014-11-18 2014-11-18 +S000005615 ORF Verified YOR089C VPS21 Rab family GTPase VPS21|YPT51|YPT21|VPT12|VPS12 chromosome 15 L000002474 15 490828 490196 C 2011-02-03 1996-07-31 Endosomal Rab family GTPase; required for endocytic transport and sorting of vacuolar hydrolases; required for endosomal localization of the CORVET complex; required with YPT52 for MVB biogenesis and sorting; involved in autophagy and ionic stress tolerance; geranylgeranylation required for membrane association; protein abundance increases in response to DNA replication stress; mammalian Rab5 homolog; VPS21 has a paralog, YPT53, that arose from the whole genome duplication +S000032213 CDS YOR089C 15 490828 490196 C 2011-02-03 1996-07-31 +S000005616 ORF Verified YOR090C PTC5 type 2C protein phosphatase PTC5|PPP1 chromosome 15 15 492841 491123 C 2011-02-03 1996-07-31 Mitochondrial type 2C protein phosphatase (PP2C); involved in regulation of pyruvate dehydrogenase activity by dephosphorylating the serine 133 of the Pda1p subunit; localizes to the intermembrane space and is imported via the presequence pathway and processed by the inner membrane protease (Imp1p-Imp2p); acts in concert with kinases Pkp1p and Pkp2p and phosphatase Ptc6p +S000031844 CDS YOR090C 15 492841 491123 C 2011-02-03 1996-07-31 +S000005617 ORF Verified YOR091W TMA46 RBF46 chromosome 15 15 493433 494470 W 2011-02-03 1996-07-31|2005-12-01 Protein of unknown function that associates with translating ribosomes; interacts with GTPase Rbg1p +S000032061 CDS YOR091W 15 493433 494470 W 2011-02-03 1996-07-31|2005-12-01 +S000005618 ORF Verified YOR092W ECM3 putative ATPase ECM3|YOR3165W chromosome 15 L000003879 15 495127 496968 W 2011-02-03 1996-07-31 Non-essential protein of unknown function; involved in signal transduction and the genotoxic response; induced rapidly in response to treatment with 8-methoxypsoralen and UVA irradiation; relocalizes from ER to cytoplasm upon DNA replication stress; ECM3 has a paralog, YNL095C, that arose from the whole genome duplication +S000032141 CDS YOR092W 15 495127 496968 W 2011-02-03 1996-07-31 +S000005619 ORF Uncharacterized YOR093C CMR2 chromosome 15 15 502452 497506 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion causes sensitivity to unfolded protein response-inducing agents +S000034073 CDS YOR093C 15 502452 497506 C 2011-02-03 1996-07-31 +S000005620 ORF Verified YOR094W ARF3 Arf family GTPase ARF3|ARL2 chromosome 15 L000000106 15 502795 503346 W 2011-02-03 1996-07-31 Glucose-repressible ADP-ribosylation factor; GTPase of Ras superfamily involved in regulating cell polarity and invasive growth; localizes to dynamic spots at plasma membrane and modulates PtdIns(4,5)P2 levels to facilitate endocytosis; required for localization of endocytic protein Lsb5p to correct cortical site in cells; also has mRNA binding activity; homolog of mammalian Arf6 +S000034255 CDS YOR094W 15 502795 503346 W 2011-02-03 1996-07-31 +S000005621 ORF Verified YOR095C RKI1 ribose-5-phosphate isomerase RKI1 chromosome 15 L000003519 15 504328 503552 C 2011-02-03 1996-07-31 Ribose-5-phosphate ketol-isomerase; catalyzes the interconversion of ribose 5-phosphate and ribulose 5-phosphate in the pentose phosphate pathway; participates in pyridoxine biosynthesis +S000034285 CDS YOR095C 15 504328 503552 C 2011-02-03 1996-07-31 +S000005622 ORF Verified YOR096W RPS7A eS7|ribosomal 40S subunit protein S7A|S7e|rp30|S7A|RPS30 chromosome 15 L000003300 15 505794 506767 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; interacts with Kti11p; deletion causes hypersensitivity to zymocin; homologous to mammalian ribosomal protein S7, no bacterial homolog; RPS7A has a paralog, RPS7B, that arose from the whole genome duplication +S000034377 CDS YOR096W 15 505794 505937 W 2011-02-03 1996-07-31 +S000034378 CDS YOR096W 15 506339 506767 W 2011-02-03 1996-07-31 +S000034379 intron YOR096W 15 505938 506338 W 2011-02-03 1996-07-31 +S000005623 ORF Uncharacterized YOR097C chromosome 15 15 507505 506978 C 2011-02-03 1996-07-31 Putative protein of unknown function; identified as interacting with Hsp82p in a high-throughput two-hybrid screen; YOR097C is not an essential gene +S000035307 CDS YOR097C 15 507505 506978 C 2011-02-03 1996-07-31 +S000005624 ORF Verified YOR098C NUP1 FG-nucleoporin NUP1 chromosome 15 L000001288 15 511178 507948 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of thenuclear pore complex (NPC) permeability barrier; possible karyopherin release factor that accelerates release of karyopherin-cargo complexes after transport across NPC; both NUP1 and NUP60 are homologous to human NUP153 +S000035367 CDS YOR098C 15 511178 507948 C 2011-02-03 1996-07-31 +S000005625 ORF Verified YOR099W KTR1 alpha-1,2-mannosyltransferase KTR1 chromosome 15 L000000924 15 511825 513006 W 54 2011-02-03 1996-07-31 Alpha-1,2-mannosyltransferase; involved in O- and N-linked protein glycosylation; type II membrane protein; member of the KRE2/MNT1 mannosyltransferase family; relocalizes from vacuole to cytoplasm upon DNA replication stress +S000035471 CDS YOR099W 15 511825 513006 W 2011-02-03 1996-07-31 +S000005626 ORF Verified YOR100C CRC1 carnitine:acyl carnitine antiporter chromosome 15 S000007462 15 514278 513295 C 2011-02-03 1996-07-31 Mitochondrial inner membrane carnitine transporter; required for carnitine-dependent transport of acetyl-CoA from peroxisomes to mitochondria during fatty acid beta-oxidation; human homolog SLC25A20 complements yeast null mutant +S000032610 CDS YOR100C 15 514278 513295 C 2011-02-03 1996-07-31 +S000005627 ORF Verified YOR101W RAS1 Ras family GTPase RAS1 chromosome 15 L000001582 15 515244 516173 W 53 2011-02-03 1996-07-31 GTPase involved in G-protein signaling in adenylate cyclase activation; plays a role in cell proliferation; localized to the plasma membrane; homolog of mammalian RAS proto-oncogenes; relative distribution to the nucleus increases upon DNA replication stress; RAS1 has a paralog, RAS2, that arose from the whole genome duplication +S000032754 CDS YOR101W 15 515244 516173 W 2011-02-03 1996-07-31 +S000005628 ORF Dubious YOR102W chromosome 15 15 516423 516773 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; extensively overlaps essential OST2 gene encoding a subunit of the ER lumen oligosaccharyltransferase complex +S000033499 CDS YOR102W 15 516423 516773 W 2011-02-03 1996-07-31 +S000005629 ORF Verified YOR103C OST2 dolichyl-diphosphooligosaccharide-protein glycotransferase chromosome 15 L000002942 15 516841 516449 C 2011-02-03 2003-09-22|1996-07-31 Epsilon subunit of the oligosaccharyltransferase complex; located in the ER lumen; catalyzes asparagine-linked glycosylation of newly synthesized proteins +S000033537 CDS YOR103C 15 516841 516449 C 2011-02-03 2003-09-22|1996-07-31 +S000005630 ORF Verified YOR104W PIN2 chromosome 15 15 517642 518490 W 2011-02-03 1996-07-31 Exomer-dependent cargo protein; induces appearance of [PIN+] prion when overproduced; prion-like domain serves as a retention signal in the trans-Golgi network; predicted to be palmitoylated +S000033687 CDS YOR104W 15 517642 518490 W 2011-02-03 1996-07-31 +S000005631 ORF Uncharacterized YOR105W chromosome 15 15 518195 518521 W 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels +S000033820 CDS YOR105W 15 518195 518521 W 2011-02-03 1996-07-31 +S000005632 ORF Verified YOR106W VAM3 SNAP receptor VAM3|PTH1 chromosome 15 L000003267|L000003302 15 519121 519972 W 2011-02-03 1996-07-31 Syntaxin-like vacuolar t-SNARE; functions with Vam7p in vacuolar protein trafficking; mediates docking/fusion of late transport intermediates with the vacuole; has an acidic di-leucine sorting signal and C-terminal transmembrane region +S000034700 CDS YOR106W 15 519121 519972 W 2011-02-03 1996-07-31 +S000005633 ORF Verified YOR107W RGS2 GTPase-activating protein RGS2 chromosome 15 15 521353 522282 W 2011-02-03 1996-07-31 Negative regulator of glucose-induced cAMP signaling; directly activates the GTPase activity of the heterotrimeric G protein alpha subunit Gpa2p +S000034847 CDS YOR107W 15 521353 522282 W 2011-02-03 1996-07-31 +S000005634 ORF Verified YOR108W LEU9 2-isopropylmalate synthase LEU9 chromosome 15 15 523027 524841 W 2011-02-03 1996-07-31 Alpha-isopropylmalate synthase II (2-isopropylmalate synthase); catalyzes the first step in the leucine biosynthesis pathway; the minor isozyme, responsible for the residual alpha-IPMS activity detected in a leu4 null mutant; LEU9 has a paralog, LEU4, that arose from the whole genome duplication +S000034978 CDS YOR108W 15 523027 524841 W 2011-02-03 1996-07-31 +S000028711 ORF Dubious YOR108C-A chromosome 15 15 524814 524605 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032677 CDS YOR108C-A 15 524814 524605 C 2011-02-03 2003-07-29 +S000005635 ORF Verified YOR109W INP53 phosphatidylinositol-3-/phosphoinositide 5-phosphatase INP53|SOP2|SJL3 chromosome 15 L000003984 15 525278 528601 W 2011-02-03 1996-07-31 Polyphosphatidylinositol phosphatase; dephosphorylates multiple phosphatidylinositol phosphates; involved in trans Golgi network-to-early endosome pathway; hyperosmotic stress causes translocation to actin patches; contains Sac1 and 5-ptase domains; INP53 has a paralog, INP52, that arose from the whole genome duplication +S000035927 CDS YOR109W 15 525278 528601 W 2011-02-03 1996-07-31 +S000005636 ORF Verified YOR110W TFC7 transcription factor TFIIIC subunit TFC7|tau 55 chromosome 15 15 528941 530248 W 2011-02-03 1996-07-31 RNA pol III transcription initiation factor complex (TFIIIC) subunit; part of the TauA globular domain of TFIIIC that binds DNA at the BoxA promoter sites of tRNA and similar genes; TFC7 has a paralog, YNL108C, that arose from the whole genome duplication +S000036863 CDS YOR110W 15 528941 530248 W 2011-02-03 1996-07-31 +S000005637 ORF Uncharacterized YOR111W chromosome 15 15 530429 531127 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000036919 CDS YOR111W 15 530429 531127 W 2011-02-03 1996-07-31 +S000005638 ORF Verified YOR112W CEX1 chromosome 15 15 531508 533793 W 2011-02-03 1996-07-31 Component of nuclear aminoacylation-dependent tRNA export pathway; cytoplasmic; interacts with nuclear pore component Nup116p; copurifies with tRNA export receptors Los1p and Msn5p, as well as eIF-1a; required for activation of RAN GTPase Gsp1p and dissociation of receptor-tRNA-Gsp1p export complex; recruits Rna1p from cytoplasm to NPC, facilitates Rna1p activation of Gsp1p GTPase activity by enabling Rna1p to gain access to Gsp1p-GTP bound to export receptor tRNA complex +S000036975 CDS YOR112W 15 531508 533793 W 2011-02-03 1996-07-31 +S000005639 ORF Verified YOR113W AZF1 chromosome 15 L000000158 15 534075 536819 W 2011-02-03 1996-07-31 Zinc-finger transcription factor; involved in diauxic shift; in the presence of glucose, activates transcription of genes involved in growth and carbon metabolism; in nonfermentable carbon sources, activates transcription of genes involved in maintenance of cell wall integrity; relocalizes to the cytosol in response to hypoxia +S000037745 CDS YOR113W 15 534075 536819 W 2011-02-03 1996-07-31 +S000005640 ORF Uncharacterized YOR114W chromosome 15 15 537570 538454 W 2011-02-03 1996-07-31 Putative protein of unknown function; null mutant is viable +S000037834 CDS YOR114W 15 537570 538454 W 2011-02-03 1996-07-31 +S000005641 ORF Verified YOR115C TRS33 chromosome 15 S000007434 15 539465 538659 C 2011-02-03 1996-07-31 Core component of TRAPP complexes I, II and IV; transport protein particle (TRAPP) complexes are related multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII, and IV); proposed subunit of a novel complex, TRAPPIV, that may function redundantly with TRAPPIII as a GEF that activates Ypt1 during autophagy +S000037875 CDS YOR115C 15 539465 538659 C 2011-02-03 1996-07-31 +S000005642 ORF Verified YOR116C RPO31 DNA-directed RNA polymerase III core subunit RPO31|C160|RPC160|RPC1 chromosome 15 L000001746|L000001694 15 544145 539763 C 59 2011-02-03 1996-07-31 RNA polymerase III largest subunit C160; part of core enzyme; similar to bacterial beta-prime subunit and to RPA190 and RPO21 +S000030813 CDS YOR116C 15 544145 539763 C 2011-02-03 1996-07-31 +S000005643 ORF Verified YOR117W RPT5 proteasome regulatory particle base subunit RPT5|YTA1 chromosome 15 L000002555 15 545029 546333 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; recruited to the GAL1-10 promoter region upon induction of transcription; similar to human TBP1 +S000030925 CDS YOR117W 15 545029 546333 W 2011-02-03 1996-07-31 +S000005644 ORF Verified YOR118W RTC5 chromosome 15 15 546857 548560 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; null mutation suppresses cdc13-1 temperature sensitivity +S000030998 CDS YOR118W 15 546857 548560 W 2011-02-03 1996-07-31 +S000005645 ORF Verified YOR119C RIO1 protein kinase RIO1|RRP10 chromosome 15 L000003989 15 550246 548792 C 2011-02-03 1996-07-31 Serine kinase involved in cell cycle regulation and rDNA integrity; associated with late pre-40S particles via its conserved C-terminal domain and participates in late 40S biogenesis; association with pre-40S particles regulated by its catalytic ATPase site and likely occurs after the release of Rio2p from these particles; involved in cell cycle progression and processing of the 20S pre-rRNA into mature 18S rRNA; phosphorylates Rpa43p in anaphase to remove Pol I from rDNA +S000031034 CDS YOR119C 15 550246 548792 C 2011-02-03 1996-07-31 +S000005646 ORF Verified YOR120W GCY1 glycerol 2-dehydrogenase (NADP(+)) GCY1|GCY chromosome 15 L000000694 15 551114 552052 W 2011-02-03 1996-07-31 Glycerol dehydrogenase; involved in an alternative pathway for glycerol catabolism used under microaerobic conditions; also has mRNA binding activity; member of the aldo-keto reductase (AKR) family; human homolog AKR1B1 can complement yeast null mutant; protein abundance increases in response to DNA replication stress; GCY1 has a paralog, YPR1, that arose from the whole genome duplication +S000033029 CDS YOR120W 15 551114 552052 W 2011-02-03 1996-07-31 +S000005647 ORF Dubious YOR121C chromosome 15 15 552103 551798 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene GCY1/YOR120W +S000033061 CDS YOR121C 15 552103 551798 C 2011-02-03 1996-07-31 +S000005648 ORF Verified YOR122C PFY1 profilin|CLS5|PRF1 chromosome 15 L000001407 15 552887 552298 C 64 2011-02-03 1996-07-31 Profilin; binds actin, phosphatidylinositol 4,5-bisphosphate, and polyproline regions; involved in cytoskeleton organization; required for normal timing of actin polymerization in response to thermal stress; protein abundance increases in response to DNA replication stress; highly conserved protein; human PFN1 (profilin 1) complements temperature sensitive pfy1 mutants, PFN1 mutations are a rare cause of ALS +S000033159 CDS YOR122C 15 552665 552298 C 2011-02-03 1996-07-31 +S000033158 CDS YOR122C 15 552887 552875 C 2011-02-03 1996-07-31 +S000033160 intron YOR122C 15 552874 552666 C 2011-02-03 1996-07-31 +S000005649 ORF Verified YOR123C LEO1 chromosome 15 L000000936 15 554570 553176 C 2011-02-03 1996-07-31 Component of the Paf1 complex; which associates with RNA polymerase II and is involved in histone methylation; plays a role in regulating Ty1 transposition; involved in transcription elongation as demonstrated by the G-less-based run-on (GLRO) assay +S000033954 CDS YOR123C 15 554570 553176 C 2011-02-03 1996-07-31 +S000005650 ORF Verified YOR124C UBP2 ubiquitin-specific protease UBP2 chromosome 15 L000002416 15 558642 554824 C 2011-02-03 1996-07-31 Ubiquitin-specific protease; removes ubiquitin from ubiquitinated proteins; controls K63 homeostasis during oxidative stress; deubiquitinates Rsp5p and is required for MVB sorting of membrane proteins; can cleave polyubiquitin and has isopeptidase activity +S000034064 CDS YOR124C 15 558642 554824 C 2011-02-03 1996-07-31 +S000005651 ORF Verified YOR125C CAT5 putative monooxygenase CAT5|COQ7 chromosome 15 L000000219 15 559731 559030 C 2011-02-03 2003-09-22|1996-07-31 Protein required for ubiquinone (Coenzyme Q) biosynthesis; localizes to the matrix face of the mitochondrial inner membrane in a large complex with ubiquinone biosynthetic enzymes; required for gluconeogenic gene activation +S000034156 CDS YOR125C 15 559731 559030 C 2011-02-03 2003-09-22|1996-07-31 +S000005652 ORF Verified YOR126C IAH1 isoamyl acetate-hydrolyzing esterase chromosome 15 L000003383 15 560677 559961 C 2011-02-03 1996-07-31 Isoamyl acetate-hydrolyzing esterase; required in balance with alcohol acetyltransferase to maintain optimal amounts of isoamyl acetate, which is particularly important in sake brewing +S000035099 CDS YOR126C 15 560677 559961 C 2011-02-03 1996-07-31 +S000005653 ORF Verified YOR127W RGA1 THE1|DBM1 chromosome 15 L000002626 15 561170 564193 W 2011-02-03 1996-07-31 GTPase-activating protein for polarity-establishment protein Cdc42p; implicated in control of septin organization, pheromone response, and haploid invasive growth; relocalizes from bud neck to cytoplasm upon DNA replication stress; RGA1 has a paralog, RGA2, that arose from the whole genome duplication +S000035296 CDS YOR127W 15 561170 564193 W 2011-02-03 1996-07-31 +S000005654 ORF Verified YOR128C ADE2 phosphoribosylaminoimidazole carboxylase ADE2 chromosome 15 L000000032 15 566191 564476 C 64 2011-02-03 1996-07-31 Phosphoribosylaminoimidazole carboxylase; catalyzes a step in the 'de novo' purine nucleotide biosynthetic pathway; red pigment accumulates in mutant cells deprived of adenine +S000035306 CDS YOR128C 15 566191 564476 C 2011-02-03 1996-07-31 +S000114843 ARS ARS1516 ARS1516 ARSXV-567|ADE2 ARS chromosome 15 15 566410 566643 2011-02-03 2006-04-12|2006-09-08 Autonomously Replicating Sequence +S000005655 ORF Verified YOR129C AFI1 chromosome 15 15 569558 566877 C 2011-02-03 1996-07-31 Arf3p polarization-specific docking factor; required for the polarized distribution of the ADP-ribosylation factor, Arf3p; participates in polarity development and maintenance of a normal haploid budding pattern; interacts with Cnm7p +S000035385 CDS YOR129C 15 569558 566877 C 2011-02-03 1996-07-31 +S000005656 ORF Verified YOR130C ORT1 ARG11 chromosome 15 L000003289 15 570807 569929 C 2011-02-03 1996-07-31|2011-02-03 Ornithine transporter of the mitochondrial inner membrane; exports ornithine from mitochondria as part of arginine biosynthesis; functionally complemented by human ortholog, SLC25A15, which is associated with hyperammonaemia-hyperornithinaemia-homocitrullinuria (HHH) syndrome, but HHH-associated variants fail to complement +S000031722 CDS YOR130C 15 570807 569929 C 2011-02-03 1996-07-31|2011-02-03 +S000006545 tRNA_gene tD(GUC)O chromosome 15 L000003710 15 571958 572029 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030425 noncoding_exon tD(GUC)O 15 571958 572029 W 2011-02-03 2000-05-19 +S000005657 ORF Verified YOR131C putative haloacid dehalogenase-like hydrolase chromosome 15 15 572838 572182 C 2011-02-03 1996-07-31 Putative haloacid dehalogenase-like hydrolase; non-essential gene; overexpression causes a cell cycle delay or arrest; protein abundance increases in response to DNA replication stress +S000031872 CDS YOR131C 15 572838 572182 C 2011-02-03 1996-07-31 +S000005658 ORF Verified YOR132W VPS17 retromer subunit VPS17|VPT3|PEP21 chromosome 15 L000002472|S000029642|L000002479 15 573175 574830 W 2011-02-03 1996-07-31 Subunit of the membrane-associated retromer complex; essential for endosome-to-Golgi retrograde protein transport; peripheral membrane protein that assembles onto the membrane with Vps5p to promote vesicle formation; required for recruiting the retromer complex to the endosome membranes +S000037422 CDS YOR132W 15 573175 574830 W 2011-02-03 1996-07-31 +S000005659 ORF Verified YOR133W EFT1 elongation factor 2 chromosome 15 L000000543 15 575098 577626 W 2011-02-03 1996-07-31 Elongation factor 2 (EF-2), also encoded by EFT2; catalyzes ribosomal translocation during protein synthesis; contains diphthamide, the unique posttranslationally modified histidine residue specifically ADP-ribosylated by diphtheria toxin; EFT1 has a paralog, EFT2, that arose from the whole genome duplication +S000037496 CDS YOR133W 15 575098 577626 W 2011-02-03 1996-07-31 +S000005660 ORF Verified YOR134W BAG7 chromosome 15 L000003395 15 578564 579793 W 2011-02-03 1996-07-31 Rho GTPase activating protein (RhoGAP); stimulates the intrinsic GTPase activity of Rho1p, which plays a bud growth by regulating actin cytoskeleton organization and cell wall biosynthesis, resulting in the downregulation of Rho1p; structurally and functionally related to Sac7p; BAG7 has a paralog, SAC7, that arose from the whole genome duplication +S000037586 CDS YOR134W 15 578564 579793 W 2011-02-03 1996-07-31 +S000005662 ORF Verified YOR136W IDH2 isocitrate dehydrogenase (NAD(+)) IDH2 chromosome 15 L000000850 15 580250 581359 W 2011-02-03 1996-07-31 Subunit of mitochondrial NAD(+)-dependent isocitrate dehydrogenase; complex catalyzes the oxidation of isocitrate to alpha-ketoglutarate in the TCA cycle; phosphorylated +S000030498 CDS YOR136W 15 580250 581359 W 2011-02-03 1996-07-31 +S000005661 ORF Dubious YOR135C IRC14 chromosome 15 15 580500 580159 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YOR136W; null mutant displays increased levels of spontaneous Rad52 foci +S000037633 CDS YOR135C 15 580500 580159 C 2011-02-03 1996-07-31 +S000005663 ORF Verified YOR137C SIA1 chromosome 15 15 583681 581813 C 2011-02-03 1996-07-31 Protein of unassigned function; involved in activation of the Pma1p plasma membrane H+-ATPase by glucose; contains peptide signal for membrane localization +S000030527 CDS YOR137C 15 583681 581813 C 2011-02-03 1996-07-31 +S000005664 ORF Verified YOR138C RUP1 chromosome 15 15 586324 584309 C 2011-02-03 1996-07-31 Protein that regulates ubiquitination of Rsp5p; has a WW domain consensus motif of PPPSY (residues 131-135) that mediates binding of Rsp5p to Ubp2p; contains an UBA domain; relative distribution to the nucleus increases upon DNA replication stress +S000030602 CDS YOR138C 15 586324 584309 C 2011-02-03 1996-07-31 +S000005666 ORF Verified YOR140W SFL1 chromosome 15 L000001869 15 586981 589281 W 2011-02-03 1996-07-31|2011-02-03 Transcriptional repressor and activator; involved in repression of flocculation-related genes, and activation of stress responsive genes; has direct role in INO1 transcriptional memory; negatively regulated by cAMP-dependent protein kinase A subunit Tpk2p; premature stop codon (C1430T, Q477-stop) in SK1 background is linked to the aggressively invasive phenotype of SK1 relative to BY4741 (S288C) +S000030239 CDS YOR140W 15 586981 589281 W 2011-02-03 1996-07-31|2011-02-03 +S000005665 ORF Dubious YOR139C chromosome 15 15 587342 586950 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SFL1/YOR140W +S000030683 CDS YOR139C 15 587342 586950 C 2011-02-03 1996-07-31 +S000005667 ORF Verified YOR141C ARP8 chromosome 15 L000003437 15 592587 589942 C 2011-02-03 1996-07-31 Nuclear actin-related protein involved in chromatin remodeling; component of chromatin-remodeling enzyme complexes; has mRNA binding activity +S000030308 CDS YOR141C 15 592587 589942 C 2011-02-03 1996-07-31 +S000005668 ORF Verified YOR142W LSC1 succinate--CoA ligase (GDP-forming) subunit alpha chromosome 15 L000004591 15 593057 594046 W 2011-02-03 1996-07-31 Alpha subunit of succinyl-CoA ligase; succinyl-CoA ligase is a mitochondrial enzyme of the TCA cycle that catalyzes the nucleotide-dependent conversion of succinyl-CoA to succinate; phosphorylated +S000033682 CDS YOR142W 15 593057 594046 W 2011-02-03 1996-07-31 +S000006573 tRNA_gene tG(CCC)O SUF5 chromosome 15 L000002153|L000003716 15 594425 594354 C 76 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000032361 noncoding_exon tG(CCC)O 15 594425 594354 C 2011-02-03 2000-05-19 +S000007169 long_terminal_repeat YORWdelta12 chromosome 15 15 594512 594819 W 2011-02-03 2000-05-19 Ty1 LTR +S000007170 long_terminal_repeat YORWdelta13 chromosome 15 15 594820 595151 W 2011-02-03 2000-05-19 Ty1 LTR +S000007182 LTR_retrotransposon YORWTy1-2 Ty1 chromosome 15 15 594820 600733 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007351 transposable_element_gene YOR142W-A gag protein chromosome 15 15 595112 596434 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000036110 CDS YOR142W-A 15 595112 596434 W 2011-02-03 1999-07-17 +S000007352 transposable_element_gene YOR142W-B gag-pol fusion protein chromosome 15 15 595112 600380 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000036113 CDS YOR142W-B 15 595112 596416 W 2011-02-03 1999-07-17 +S000036114 CDS YOR142W-B 15 596418 600380 W 2011-02-03 1999-07-17 +S000036115 plus_1_translational_frameshift YOR142W-B 15 596417 596417 W 2011-02-03 1999-07-17 +S000007171 long_terminal_repeat YORWdelta14 chromosome 15 15 600402 600733 W 2011-02-03 2000-05-19 Ty1 LTR +S000007643 ARS ARS1502 ARS1517 chromosome 15 15 600886 600960 2011-02-03 2001-03-06 Autonomously Replicating Sequence +S000005669 ORF Verified YOR143C THI80 thiamine diphosphokinase chromosome 15 L000002297 15 602342 601383 C 2011-02-03 1996-07-31 Thiamine pyrophosphokinase; phosphorylates thiamine to produce the coenzyme thiamine pyrophosphate (thiamine diphosphate) +S000033738 CDS YOR143C 15 602342 601383 C 2011-02-03 1996-07-31 +S000005670 ORF Verified YOR144C ELG1 RTT110 chromosome 15 S000007438 15 605092 602717 C 2011-02-03 1996-07-31 Subunit of an alternative replication factor C complex; important for DNA replication and genome integrity; suppresses spontaneous DNA damage; involved in homologous recombination-mediated repair and telomere homeostasis; required for PCNA (Pol30p) unloading during DNA replication +S000033871 CDS YOR144C 15 605092 602717 C 2011-02-03 1996-07-31 +S000005672 ORF Dubious YOR146W chromosome 15 15 605873 606178 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene PNO1/YOR145C +S000034948 CDS YOR146W 15 605873 606178 W 2011-02-03 1996-07-31 +S000005671 ORF Verified YOR145C PNO1 RRP20|DIM2 chromosome 15 15 606171 605347 C 2011-02-03 1996-07-31 Essential nucleolar protein required for pre-18S rRNA processing; interacts with Dim1p, an 18S rRNA dimethyltransferase, and also with Nob1p, which is involved in proteasome biogenesis; contains a KH domain +S000033985 CDS YOR145C 15 606171 605347 C 2011-02-03 1996-07-31 +S000005673 ORF Verified YOR147W MDM32 chromosome 15 15 606607 608475 W 2011-02-03 1996-07-31|2005-11-30 Mitochondrial inner membrane protein with similarity to Mdm31p; required for normal mitochondrial morphology and inheritance; interacts genetically with MMM1, MDM10, MDM12, and MDM34; variation between SK1 and S288C at residues 182 and 262 impacts invasive growth and mitochondrial network structure +S000035083 CDS YOR147W 15 606607 608475 W 2011-02-03 1996-07-31|2005-11-30 +S000005674 ORF Verified YOR148C SPP2 chromosome 15 L000002631 15 609197 608640 C 2011-02-03 1996-07-31 Essential protein that promotes the first step of splicing; required for the final stages of spliceosome maturation and activation; interacts with Prp2p, which may release Spp2p from the spliceosome following the first cleavage reaction; stimulates Prp2p ATPase activity +S000035131 CDS YOR148C 15 609197 608640 C 2011-02-03 1996-07-31 +S000005675 ORF Verified YOR149C SMP3 glycosylphosphatidylinositol-alpha 1,2 mannosyltransferase|SAP2|LAS2 chromosome 15 L000001935 15 611388 609838 C 2011-02-03 1996-07-31|2011-02-03 Alpha 1,2-mannosyltransferase; involved in glycosyl phosphatidyl inositol (GPI) biosynthesis; required for addition of the fourth, side branching mannose to the GPI core structure +S000036016 CDS YOR149C 15 611388 609838 C 2011-02-03 1996-07-31|2011-02-03 +S000005676 ORF Verified YOR150W MRPL23 mitochondrial 54S ribosomal protein YmL23|YmL23 chromosome 15 15 611999 612490 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; localizes to vacuole in response to H2O2 +S000034760 CDS YOR150W 15 611999 612490 W 2011-02-03 1996-07-31 +S000130136 ARS ARS1518 ARSXV-618 chromosome 15 15 616670 617517 2011-02-03 2009-05-05 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000005677 ORF Verified YOR151C RPB2 DNA-directed RNA polymerase II core subunit RPB2|B150|SOH2|SIT2|RPO22|RPB150 chromosome 15 L000001588|L000001676 15 616671 612997 C 80 2011-02-03 1996-07-31 RNA polymerase II second largest subunit B150; part of central core; similar to bacterial beta subunit +S000035654 CDS YOR151C 15 616671 612997 C 2011-02-03 1996-07-31 +S000005678 ORF Verified YOR152C ATG40 chromosome 15 15 618288 617518 C 2011-02-03 1996-07-31 Autophagy receptor with a role in endoplasmic reticulum degradation; involved specifically in autophagy of cortical and cytoplasmic ER in response to nitrogen starvation or rapamycin treatment; localizes to the cortical and cytoplasmic ER; similar to human FAM134B, which is also involved in ER autophagy and is associated with sensory neuropathy +S000035770 CDS YOR152C 15 618288 617518 C 2011-02-03 1996-07-31 +S000005679 ORF Verified YOR153W PDR5 ATP-binding cassette multidrug transporter PDR5|STS1|YDR1|LEM1 chromosome 15 L000001365|L000002136|L000002504 15 619840 624375 W 85 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; multidrug transporter actively regulated by Pdr1p; also involved in steroid transport, cation resistance, and cellular detoxification during exponential growth; PDR5 has a paralog, PDR15, that arose from the whole genome duplication +S000035997 CDS YOR153W 15 619840 624375 W 2011-02-03 1996-07-31 +S000005680 ORF Verified YOR154W SLP1 chromosome 15 15 624729 626492 W 2011-02-03 1996-07-31 Glycosylated integral ER membrane protein of unknown function; forms an ER-membrane associated protein complex with Emp65p; member of the SUN-like family of proteins; genetic interactions suggest a role in folding of ER membrane proteins; required for nuclear envelope localization of Mps3p +S000037835 CDS YOR154W 15 624729 626492 W 2011-02-03 1996-07-31 +S000005681 ORF Verified YOR155C ISN1 IMP 5'-nucleotidase chromosome 15 15 627980 626628 C 2011-02-03 1996-07-31 Inosine 5'-monophosphate (IMP)-specific 5'-nucleotidase; catalyzes the breakdown of IMP to inosine; responsible for production of nicotinamide riboside and nicotinic acid riboside; expression positively regulated by nicotinic acid and glucose availability; does not show similarity to known 5'-nucleotidases from other organisms +S000037874 CDS YOR155C 15 627980 626628 C 2011-02-03 1996-07-31 +S000005682 ORF Verified YOR156C NFI1 SUMO ligase NFI1|SIZ2 chromosome 15 L000002966 15 630540 628360 C 2011-02-03 1996-07-31 SUMO E3 ligase; catalyzes sumoylation of Yku70p/80p and Sir4p promoting telomere anchoring to the nuclear envelope and regulating telomerase activity; DNA-bound form catalyzes a DNA-damaged triggered sumoylation wave resulting in multisite modification of several DNA repair proteins, enhancing interactions between these proteins and accelerating repair; sumoylates Cse4p, a prerequisite for STUbL-mediated Ub-dependent degradation; role in telomere length maintenance +S000029894 CDS YOR156C 15 630540 628360 C 2011-02-03 1996-07-31 +S000005683 ORF Verified YOR157C PUP1 proteasome core particle subunit beta 2 chromosome 15 L000001530 15 631751 630966 C 84.6 2011-02-03 1996-07-31 Beta 2 subunit of the 20S proteasome; endopeptidase with trypsin-like activity that cleaves after basic residues; synthesized as a proprotein before being proteolytically processed for assembly into 20S particle; human homolog is subunit Z +S000029992 CDS YOR157C 15 631751 630966 C 2011-02-03 1996-07-31 +S000005684 ORF Verified YOR158W PET123 mitochondrial 37S ribosomal protein PET123 chromosome 15 L000001398 15 632164 633120 W 84.2 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; PET123 exhibits genetic interactions with PET122, which encodes a COX3 mRNA-specific translational activator +S000031031 CDS YOR158W 15 632164 633120 W 2011-02-03 1996-07-31 +S000005685 ORF Verified YOR159C SME1 mRNA splicing protein SME1|Sm E|SmE chromosome 15 L000004252 15 633566 633282 C 2011-02-03 1996-07-31 Core Sm protein Sm E; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Smd3p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm E +S000031069 CDS YOR159C 15 633566 633282 C 2011-02-03 1996-07-31 +S000005686 ORF Verified YOR160W MTR10 KAP111 chromosome 15 L000003296 15 633839 636757 W 2011-02-03 1996-07-31 Nuclear import receptor; mediates the nuclear localization of proteins involved in mRNA-nucleus export; promotes dissociation of mRNAs from the nucleus-cytoplasm mRNA shuttling protein Npl3p; required for retrograde import of mature tRNAs; relocalizes from cytoplasm to the nuclear periphery upon DNA replication stress +S000030698 CDS YOR160W 15 633839 636757 W 2011-02-03 1996-07-31 +S000028713 ORF Dubious YOR161W-A chromosome 15 15 637574 637654 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032680 CDS YOR161W-A 15 637574 637654 W 2011-02-03 2003-07-29 +S000028714 ORF Dubious YOR161W-B chromosome 15 15 637975 638235 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032682 CDS YOR161W-B 15 637975 638235 W 2011-02-03 2003-07-29 +S000005687 ORF Verified YOR161C PNS1 chromosome 15 15 638558 636939 C 2011-02-03 1996-07-31 Protein of unknown function; has similarity to Torpedo californica tCTL1p, which is postulated to be a choline transporter, neither null mutation nor overexpression affects choline transport +S000030748 CDS YOR161C 15 638558 636939 C 2011-02-03 1996-07-31 +S000028712 ORF Uncharacterized YOR161C-C chromosome 15 15 639267 639121 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032678 CDS YOR161C-C 15 639267 639121 C 2011-02-03 2003-07-29 +S000005688 ORF Verified YOR162C YRR1 PDR2 chromosome 15 L000004200|S000029349|L000001362 15 641992 639560 C 89 2011-02-03 1996-07-31 Zn2-Cys6 zinc-finger transcription factor; activates genes involved in multidrug resistance; paralog of Yrm1p, acting on an overlapping set of target genes; YRR1 has a paralog, PDR8, that arose from the whole genome duplication +S000030856 CDS YOR162C 15 641992 639560 C 2011-02-03 1996-07-31 +S000005689 ORF Verified YOR163W DDP1 polyphosphatase DDP1 chromosome 15 S000007498 15 642741 643307 W 2011-02-03 1996-07-31 Polyphosphate phosphatase; hydrolyzes diphosphorylated inositol polyphosphates and diadenosine polyphosphates; high specificity for diadenosine hexa- and pentaphosphates; contains endopolyphosphatase activity with a high affinity for polyphosphates, an activity also observed for its human DIPP homologs; possesses mRNA decapping activity; nudix hydrolase family member; protein abundance increases in response to DNA replication stress +S000031902 CDS YOR163W 15 642741 643307 W 2011-02-03 1996-07-31 +S000005690 ORF Verified YOR164C GET4 ENV8 chromosome 15 15 644332 643394 C 2011-02-03 1996-07-31 Protein involved in inserting tail-anchored proteins into ER membranes; forms a complex with Mdy2p; highly conserved across species and homologous to human gene C7orf20 +S000031981 CDS YOR164C 15 644332 643394 C 2011-02-03 1996-07-31 +S000005691 ORF Verified YOR165W SEY1 dynamin-like GTPase SEY1 chromosome 15 15 644566 646896 W 2011-02-03 1996-07-31 Dynamin-like GTPase that mediates homotypic ER fusion; has a role in ER morphology; interacts physically and genetically with Yop1p and Rtn1p; functional ortholog of the human atlastin ATL1, defects in which cause a form of the human disease hereditary spastic paraplegia; homolog of Arabidopsis RHD3 +S000034063 CDS YOR165W 15 644566 646896 W 2011-02-03 1996-07-31 +S000005692 ORF Verified YOR166C SWT1 mRNA-processing endoribonuclease chromosome 15 15 648502 647126 C 2011-02-03 1996-07-31 RNA endoribonuclease involved in perinuclear mRNP quality control; involved in perinuclear mRNP quality control via the turnover of aberrant, unprocessed pre-mRNAs; interacts with subunits of THO/TREX, TREX-2, and RNA polymerase II; contains a PIN (PilT N terminus) domain +S000034075 CDS YOR166C 15 648502 647126 C 2011-02-03 1996-07-31 +S000005693 ORF Verified YOR167C RPS28A eS28|ribosomal 40S subunit protein S28A|S28e|YS27|S33A|S28A|RPS33A chromosome 15 L000001767 15 649007 648804 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; has an extraribosomal function in regulation of RPS28B, in which Rps28Ap binds to a decapping complex via Edc3p, which then binds to RPS28B mRNA leading to its decapping and degradation; homologous to mammalian ribosomal protein S28, no bacterial homolog; RPS28A has a paralog, RPS28B, that arose from the whole genome duplication +S000034207 CDS YOR167C 15 649007 648804 C 2011-02-03 1996-07-31 +S000005694 ORF Verified YOR168W GLN4 glutamine--tRNA ligase chromosome 15 L000000711 15 649303 651732 W 88 2011-02-03 1996-07-31 Glutamine tRNA synthetase; monomeric class I tRNA synthetase that catalyzes the specific glutaminylation of tRNA(Gln); N-terminal domain proposed to be involved in enzyme-tRNA interactions +S000034317 CDS YOR168W 15 649303 651732 W 2011-02-03 1996-07-31 +S000005695 ORF Dubious YOR169C chromosome 15 15 651840 651376 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene GLN4/YOR168W +S000034343 CDS YOR169C 15 651840 651376 C 2011-02-03 1996-07-31 +S000005696 ORF Dubious YOR170W chromosome 15 15 651858 652163 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene LCB4 +S000033855 CDS YOR170W 15 651858 652163 W 2011-02-03 1996-07-31 +S000005697 ORF Verified YOR171C LCB4 sphinganine kinase LCB4 chromosome 15 L000004328 15 653884 652010 C 2011-02-03 1996-07-31 Sphingoid long-chain base kinase; responsible for synthesis of long-chain base phosphates, which function as signaling molecules, regulates synthesis of ceramide from exogenous long-chain bases, localizes to the Golgi and late endosomes; LCB4 has a paralog, LCB5, that arose from the whole genome duplication +S000033881 CDS YOR171C 15 653884 652010 C 2011-02-03 1996-07-31 +S000005698 ORF Verified YOR172W YRM1 chromosome 15 15 654210 656570 W 2011-02-03 1996-07-31 Zinc finger transcription factor involved in multidrug resistance; Zn(2)-Cys(6) zinc finger transcription factor; activates genes involved in multidrug resistance; paralog of Yrr1p, acting on an overlapping set of target genes +S000034873 CDS YOR172W 15 654210 656570 W 2011-02-03 1996-07-31 +S000118490 ARS ARS1519 ARSXV-657 chromosome 15 15 656701 656772 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000005699 ORF Verified YOR173W DCS2 5'-(N(7)-methyl 5'-triphosphoguanosine)-(mRNA) diphosphatase chromosome 15 15 657264 658325 W 2011-02-03 1996-07-31|2006-10-05 m(7)GpppX pyrophosphatase regulator; non-essential, stress induced regulatory protein; modulates m7G-oligoribonucleotide metabolism; inhibits Dcs1p; regulated by Msn2p, Msn4p, and the Ras-cAMP-cAPK signaling pathway; mutant has increased aneuploidy tolerance; DCS2 has a paralog, DCS1, that arose from the whole genome duplication +S000035026 CDS YOR173W 15 657264 658325 W 2011-02-03 1996-07-31|2006-10-05 +S000005700 ORF Verified YOR174W MED4 chromosome 15 L000003915 15 658747 659601 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation +S000035222 CDS YOR174W 15 658747 659601 W 2011-02-03 1996-07-31 +S000005701 ORF Verified YOR175C ALE1 lysophospholipid acyltransferase|LCA1|LPT1|SLC4 chromosome 15 15 661674 659815 C 2011-02-03 1996-07-31 Broad-specificity lysophospholipid acyltransferase; part of MBOAT family of membrane-bound O-acyltransferases; key component of Lands cycle; may have role in fatty acid exchange at sn-2 position of mature glycerophospholipids +S000035274 CDS YOR175C 15 661674 659815 C 2011-02-03 1996-07-31 +S000005702 ORF Verified YOR176W HEM15 ferrochelatase HEM15 chromosome 15 L000000766 15 662401 663582 W 2011-02-03 1996-07-31 Ferrochelatase; a mitochondrial inner membrane protein, catalyzes insertion of ferrous iron into protoporphyrin IX, the eighth and final step in the heme biosynthetic pathway; human homolog FECH can complement yeast mutant and allow growth of haploid null after sporulation of a heterozygous diploid +S000036250 CDS YOR176W 15 662401 663582 W 2011-02-03 1996-07-31 +S000006766 tRNA_gene tV(AAC)O chromosome 15 L000003715 15 663885 663812 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000032969 noncoding_exon tV(AAC)O 15 663885 663812 C 2011-02-03 2000-05-19 +S000007163 long_terminal_repeat YORCdelta15 chromosome 15 15 664324 664003 C 2011-02-03 2000-05-19 Ty1 LTR +S000007172 long_terminal_repeat YORWdelta16 chromosome 15 15 664325 664469 W 2011-02-03 2000-05-19 Ty1 LTR +S000007173 long_terminal_repeat YORWdelta17 chromosome 15 15 664813 665145 W 2011-02-03 2000-05-19 Ty2 LTR +S000005703 ORF Verified YOR177C MPC54 chromosome 15 15 667179 665785 C 2011-02-03 1996-07-31 Component of the meiotic outer plaque; a membrane-organizing center which is assembled on the cytoplasmic face of the spindle pole body during meiosis II and triggers the formation of the prospore membrane; potential Cdc28p substrate +S000036281 CDS YOR177C 15 667179 665785 C 2011-02-03 1996-07-31 +S000005704 ORF Verified YOR178C GAC1 protein phosphatase regulator GAC1 chromosome 15 L000000657 15 670241 667860 C 113 2011-02-03 1996-07-31 Regulatory subunit for Glc7p type-1 protein phosphatase (PP1); tethers Glc7p to Gsy2p glycogen synthase, binds Hsf1p heat shock transcription factor, required for induction of some HSF-regulated genes under heat shock; GAC1 has a paralog, PIG1, that arose from the whole genome duplication +S000036360 CDS YOR178C 15 670241 667860 C 2011-02-03 1996-07-31 +S000005705 ORF Verified YOR179C SYC1 cleavage polyadenylation factor subunit SYC1 chromosome 15 15 672411 671845 C 2011-02-03 1996-07-31 Subunit of the APT subcomplex of cleavage and polyadenylation factor; may have a role in 3' end formation of both polyadenylated and non-polyadenylated RNAs; SYC1 has a paralog, YSH1, that arose from the whole genome duplication +S000030078 CDS YOR179C 15 672411 671845 C 2011-02-03 1996-07-31 +S000005706 ORF Verified YOR180C DCI1 putative dodecenoyl-CoA isomerase DCI1|ECI2 chromosome 15 L000004175 15 675167 674352 C 2011-02-03 1996-07-31 Peroxisomal protein; identification as a delta(3,5)-delta(2,4)-dienoyl-CoA isomerase involved in fatty acid metabolism is disputed; DCI1 has a paralog, ECI1, that arose from the whole genome duplication +S000037854 CDS YOR180C 15 675167 674352 C 2011-02-03 1996-07-31 +S000005707 ORF Verified YOR181W LAS17 actin-binding protein LAS17|BEE1 chromosome 15 L000003068|L000003581 15 675939 677840 W 2011-02-03 1996-07-31 Actin assembly factor; C-terminal WCA domain activates Arp2/3 complex-mediated nucleation of branched actin filaments, polyproline domain nucleates actin filaments independent of Arp2/3; mutants are defective in endocytosis, bud site selection, cytokinesis; human homolog WAS (Wiskott-Aldrich Syndrome) implicated in severe immunodeficiency; human WAS complements yeast null mutant, but only in presence of WIPF1, which mediates localization of WAS to cortical patches +S000029943 CDS YOR181W 15 675939 677840 W 2011-02-03 1996-07-31 +S000005708 ORF Verified YOR182C RPS30B eS30|ribosomal 40S subunit protein S30B|S30e|S30B chromosome 15 L000003497 15 678793 678191 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S30, no bacterial homolog; RPS30B has a paralog, RPS30A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000030004 CDS YOR182C 15 678379 678191 C 2011-02-03 1996-07-31 +S000030003 CDS YOR182C 15 678793 678791 C 2011-02-03 1996-07-31 +S000030005 intron YOR182C 15 678790 678380 C 2011-02-03 1996-07-31 +S000005709 ORF Uncharacterized YOR183W FYV12 chromosome 15 15 678872 679261 W 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin +S000031055 CDS YOR183W 15 678872 679261 W 2011-02-03 1996-07-31 +S000005710 ORF Verified YOR184W SER1 O-phospho-L-serine:2-oxoglutarate transaminase|ADE9 chromosome 15 L000001865 15 679357 680544 W 98.2 2011-02-03 1996-07-31 3-phosphoserine aminotransferase; catalyzes the formation of phosphoserine from 3-phosphohydroxypyruvate, required for serine and glycine biosynthesis; regulated by the general control of amino acid biosynthesis mediated by Gcn4p; protein abundance increases in response to DNA replication stress +S000031176 CDS YOR184W 15 679357 680544 W 2011-02-03 1996-07-31 +S000007300 snoRNA_gene snR36 SNR36 chromosome 15 L000001974 15 680866 680685 C 2011-02-03 2000-05-19|2007-05-10 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at position U1187 +S000036766 noncoding_exon snR36 15 680866 680685 C 2011-02-03 2000-05-19|2007-05-10 +S000005711 ORF Verified YOR185C GSP2 Ran GTPase GSP2|CNR2 chromosome 15 L000000737 15 682106 681444 C 98.6 2011-02-03 1996-07-31 GTP binding protein (mammalian Ranp homolog); involved in the maintenance of nuclear organization, RNA processing and transport; interacts with Kap121p, Kap123p and Pdr6p (karyophilin betas); not required for viability; protein abundance increases in response to DNA replication stress; GSP2 has a paralog, GSP1, that arose from the whole genome duplication +S000031246 CDS YOR185C 15 682106 681444 C 2011-02-03 1996-07-31 +S000005712 ORF Uncharacterized YOR186W chromosome 15 15 683111 683545 W 2011-02-03 1996-07-31 Putative protein of unknown function; proper regulation of expression during heat stress is sphingolipid-dependent; mCherry fusion protein localizes to the vacuole; YOR186W has a paralog, YLR297W, that arose from the whole genome duplication +S000032297 CDS YOR186W 15 683111 683545 W 2011-02-03 1996-07-31 +S000028715 ORF Dubious YOR186C-A chromosome 15 15 683538 683329 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032684 CDS YOR186C-A 15 683538 683329 C 2011-02-03 2003-07-29 +S000005713 ORF Verified YOR187W TUF1 translation elongation factor Tu|tufM chromosome 15 L000002390 15 684030 685343 W 2011-02-03 1996-07-31 Mitochondrial translation elongation factor Tu (EF-Tu); involved in fundamental pathway of mtDNA homeostasis; comprises both GTPase and guanine nucleotide exchange factor activities, while these activities are found in separate proteins in S. pombe and humans; rare mutations in human mitochondrial elongation factor Tu (EFTu) associated with severe lactic acidosis, rapidly progressive fatal encephalopathy, severe infantile macrocystic leukodystrophy with micropolygyria +S000032398 CDS YOR187W 15 684030 685343 W 2011-02-03 1996-07-31 +S000005714 ORF Verified YOR188W MSB1 chromosome 15 L000001184 15 685767 689180 W 103 2011-02-03 1996-07-31 Protein of unknown function; may be involved in positive regulation of 1,3-beta-glucan synthesis and the Pkc1p-MAPK pathway; multicopy suppressor of temperature-sensitive mutations in CDC24 and CDC42, and of mutations in BEM4; potential Cdc28p substrate; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000032501 CDS YOR188W 15 685767 689180 W 2011-02-03 1996-07-31 +S000005715 ORF Verified YOR189W IES4 chromosome 15 15 689624 689974 W 2011-02-03 1996-07-31 Component of the INO80 chromatiin remodeling complex; target of the Mec1p/Tel1p DNA damage signaling pathway; proposed to link chromatin remodeling to replication checkpoint responses +S000034540 CDS YOR189W 15 689624 689974 W 2011-02-03 1996-07-31 +S000005716 ORF Verified YOR190W SPR1 glucan 1,3-beta-glucosidase|SSG1 chromosome 15 L000002020|L000002083 15 690695 692032 W 2011-02-03 1996-07-31 Sporulation-specific exo-1,3-beta-glucanase; contributes to ascospore thermoresistance; SPR1 has a paralog, EXG1, that arose from the whole genome duplication +S000033255 CDS YOR190W 15 690695 692032 W 2011-02-03 1996-07-31 +S000005717 ORF Verified YOR191W ULS1 translocase ULS1|RIS1|TID4|DIS1 chromosome 15 L000004381 15 692475 697334 W 2011-02-03 1996-07-31 Swi2/Snf2-related translocase, SUMO-Targeted Ubiquitin Ligase (STUbL); required for maintenance of NHEJ inhibition at telomeres; functions at telomeres to translocate and ubiquitinylate poly-sumoylated Rap1p for proteosomal degradation; plays role in antagonizing silencing during mating-type switching; only known STUbL with a translocase activity; contains RING finger domain; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000033303 CDS YOR191W 15 692475 697334 W 2011-02-03 1996-07-31 +S000005718 ORF Verified YOR192C THI72 thiamine transporter chromosome 15 15 700567 698768 C 2011-02-03 1996-07-31 Transporter of thiamine or related compound; contributes to uptake of 5-aminoimidazole-4-carboxamide-1-beta-D-ribofuranoside (acadesine); shares sequence similarity with Thi7p +S000034124 CDS YOR192C 15 700567 698768 C 2011-02-03 1996-07-31 +S000007164 long_terminal_repeat YORCdelta18 chromosome 15 15 703582 703429 C 2011-02-03 2000-05-19 Ty1 LTR +S000007174 long_terminal_repeat YORWdelta19 chromosome 15 15 703612 703762 W 2011-02-03 2000-05-19 Ty1 LTR +S000007180 long_terminal_repeat YORWtau2 chromosome 15 15 703772 704062 W 2011-02-03 2000-05-19 Ty4 LTR +S000028857 ORF Uncharacterized YOR192C-C chromosome 15 15 704224 703988 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034570 CDS YOR192C-C 15 704224 703988 C 2011-02-03 2003-07-29 +S000007165 long_terminal_repeat YORCdelta20 chromosome 15 15 704395 704063 C 2011-02-03 2000-05-19 Ty2 LTR +S000007354 transposable_element_gene YOR192C-B gag-pol fusion protein chromosome 15 S000029019 15 709732 704419 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034414 CDS YOR192C-B 15 708438 704419 C 2011-02-03 1999-07-17 +S000034413 CDS YOR192C-B 15 709732 708440 C 2011-02-03 1999-07-17 +S000034415 plus_1_translational_frameshift YOR192C-B 15 708439 708439 C 2011-02-03 1999-07-17 +S000007353 transposable_element_gene YOR192C-A gag protein chromosome 15 15 709732 708416 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034406 CDS YOR192C-A 15 709732 708416 C 2011-02-03 1999-07-17 +S000007168 LTR_retrotransposon YORCTy2-1 Ty2 chromosome 15 15 710023 704063 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007166 long_terminal_repeat YORCdelta21 chromosome 15 15 710023 709691 C 2011-02-03 2000-05-19 Ty2 LTR +S000007181 long_terminal_repeat YORWtau3 chromosome 15 15 710024 710107 W 2011-02-03 2000-05-19 Ty4 LTR +S000006665 tRNA_gene tM(CAU)O1 IMT1 chromosome 15 L000003711 15 710201 710272 W 2011-02-03 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation +S000032163 noncoding_exon tM(CAU)O1 15 710201 710272 W 2011-02-03 2000-05-19 +S000005719 ORF Verified YOR193W PEX27 chromosome 15 15 710446 711576 W 2011-02-03 1996-07-31 Peripheral peroxisomal membrane protein; involved in controlling peroxisome size and number, interacts with Pex25p; PEX27 has a paralog, PEX25, that arose from the whole genome duplication +S000034339 CDS YOR193W 15 710446 711576 W 2011-02-03 1996-07-31 +S000005720 ORF Verified YOR194C TOA1 transcription initiation factor IIA large subunit chromosome 15 L000002316 15 712543 711683 C 2011-02-03 1996-07-31 TFIIA large subunit; involved in transcriptional activation, acts as antirepressor or as coactivator; required, along with Toa2p, for ribosomal protein gene transcription in vivo; homologous to largest and second largest subunits of human and Drosophila TFIIA +S000034366 CDS YOR194C 15 712543 711683 C 2011-02-03 1996-07-31 +S000005721 ORF Verified YOR195W SLK19 chromosome 15 L000004340 15 712866 715331 W 2011-02-03 1996-07-31 Kinetochore-associated protein; required for chromosome segregation and kinetochore clustering; required for normal segregation of chromosomes in meiosis and mitosis; component of the FEAR regulatory network, which promotes Cdc14p release from the nucleolus during anaphase; potential Cdc28p substrate +S000035480 CDS YOR195W 15 712866 715331 W 2011-02-03 1996-07-31 +S000005722 ORF Verified YOR196C LIP5 putative lipoate synthase chromosome 15 L000002613 15 716837 715593 C 2011-02-03 1996-07-31 Protein involved in biosynthesis of the coenzyme lipoic acid; has similarity to E. coli lipoic acid synthase +S000035507 CDS YOR196C 15 716837 715593 C 2011-02-03 1996-07-31 +S000005723 ORF Verified YOR197W MCA1 Ca(2+)-dependent cysteine protease MCA1|YCA1 chromosome 15 15 717086 718384 W 2011-02-03 1996-07-31|2006-05-11 Ca2+-dependent cysteine protease; may cleave specific substrates during the stress response; regulates apoptosis upon H2O2 treatment; required for clearance of insoluble protein aggregates during normal growth; implicated in cell cycle dynamics and lifespan extension; undergoes autocatalytic processing; similar to mammalian metacaspases, but exists as a monomer due to an extra pair of anti-parallel beta-strands that block potential dimerization +S000035631 CDS YOR197W 15 717086 718384 W 2011-02-03 1996-07-31|2006-05-11 +S000005724 ORF Verified YOR198C BFR1 chromosome 15 L000000174 15 720065 718653 C 2011-02-03 1996-07-31 Component of mRNP complexes associated with polyribosomes; involved in localization of mRNAs to P bodies; implicated in secretion and nuclear segregation; multicopy suppressor of BFA (Brefeldin A) sensitivity +S000036502 CDS YOR198C 15 720065 718653 C 2011-02-03 1996-07-31 +S000005725 ORF Dubious YOR199W chromosome 15 15 720181 720510 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036654 CDS YOR199W 15 720181 720510 W 2011-02-03 1996-07-31 +S000005726 ORF Dubious YOR200W chromosome 15 15 720417 720815 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MRM1/YOR201c +S000036053 CDS YOR200W 15 720417 720815 W 2011-02-03 1996-07-31 +S000005727 ORF Verified YOR201C MRM1 PET56 chromosome 15 L000001392 15 721708 720470 C 112 2011-02-03 1996-07-31 Ribose methyltransferase; modifies a functionally critical, conserved nucleotide in mitochondrial 21S rRNA +S000036099 CDS YOR201C 15 721708 720470 C 2011-02-03 1996-07-31 +S000005728 ORF Verified YOR202W HIS3 imidazoleglycerol-phosphate dehydratase HIS3|HIS8|HIS10 chromosome 15 L000000780|S000029212|L000000785 15 721946 722608 W 112 2011-02-03 1996-07-31 Imidazoleglycerol-phosphate dehydratase; catalyzes the sixth step in histidine biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts; transcription is regulated by general amino acid control via Gcn4p +S000029880 CDS YOR202W 15 721946 722608 W 2011-02-03 1996-07-31 +S000005729 ORF Dubious YOR203W chromosome 15 15 722565 722918 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of essential DED1 gene required for translation initiation +S000031781 CDS YOR203W 15 722565 722918 W 2011-02-03 1996-07-31 +S000005730 ORF Verified YOR204W DED1 DEAD-box ATP-dependent RNA helicase DED1|SPP81 chromosome 15 L000000500 15 722911 724725 W 114 2011-02-03 1996-07-31 ATP-dependent DEAD (Asp-Glu-Ala-Asp)-box RNA helicase; required for translation initiation of all yeast mRNAs; binds to mRNA cap-associated factors, and binding stimulates Ded1p RNA-dependent ATPase activity; mutation in human homolog DBY is associated with male infertility; human homolog DDX3X complements ded1 null mutation; DED1 has a paralog, DBP1, that arose from the whole genome duplication +S000031924 CDS YOR204W 15 722911 724725 W 2011-02-03 1996-07-31 +S000005731 ORF Verified YOR205C GEP3 MTG3|AIM40|LRC5|FMP38 chromosome 15 15 727234 725564 C 2011-02-03 1996-07-31 Protein required for mitochondrial ribosome small subunit biogenesis; null mutant is defective in respiration and in maturation of 15S rRNA; protein is localized to the mitochondrial inner membrane; null mutant interacts synthetically with prohibitin (Phb1p) +S000031991 CDS YOR205C 15 727234 725564 C 2011-02-03 1996-07-31 +S000005732 ORF Verified YOR206W NOC2 mRNA-binding ribosome synthesis protein NOC2 chromosome 15 15 727512 729644 W 2011-02-03 1996-07-31 Protein involved in ribosome biogenesis; forms a nucleolar complex with Mak21p that binds to 90S and 66S pre-ribosomes; forms a nuclear complex with Noc3p that binds to 66S pre-ribosomes; both complexes mediate intranuclear transport of ribosomal precursors; acts as part of a Mak21p-Noc2p-Rrp5p module that associates with nascent pre-rRNA during transcription and has a role in bigenesis of the large ribosomal subunit +S000037497 CDS YOR206W 15 727512 729644 W 2011-02-03 1996-07-31 +S000118491 ARS ARS1521 ARSXV-730 chromosome 15 15 729740 729969 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178185 ARS_consensus_sequence ARS1521 15 729795 729811 W 2014-11-18 2014-11-18 +S000005733 ORF Verified YOR207C RET1 DNA-directed RNA polymerase III core subunit RET1|C128|RPC128|RPC2|PDS2 chromosome 15 L000001614 15 733457 730008 C 117 2011-02-03 1996-07-31 Second-largest subunit of RNA polymerase III; RNA polymerase III is responsible for the transcription of tRNA and 5S RNA genes, and other low molecular weight RNAs +S000037554 CDS YOR207C 15 733457 730008 C 2011-02-03 1996-07-31 +S000005734 ORF Verified YOR208W PTP2 tyrosine protein phosphatase PTP2 chromosome 15 L000001526 15 733925 736177 W 2011-02-03 1996-07-31 Nuclear phosphotyrosine-specific phosphatase involved in osmosensing; involved in the inactivation of mitogen-activated protein kinase (MAPK) during osmolarity sensing; dephosporylates Hog1p MAPK and regulates its localization; with Msg5p co-regulates the calcium signaling pathway +S000037667 CDS YOR208W 15 733925 736177 W 2011-02-03 1996-07-31 +S000005735 ORF Verified YOR209C NPT1 nicotinate phosphoribosyltransferase chromosome 15 L000001275 15 737726 736437 C 2011-02-03 1996-07-31 Nicotinate phosphoribosyltransferase; acts in the salvage pathway of NAD+ biosynthesis; required for silencing at rDNA and telomeres and has a role in silencing at mating-type loci; localized to the nucleus +S000030426 CDS YOR209C 15 737726 736437 C 2011-02-03 1996-07-31 +S000005736 ORF Verified YOR210W RPB10 DNA-directed RNA polymerase core subunit RPB10|ABC10-beta chromosome 15 L000001684 15 738320 738532 W 2011-02-03 1996-07-31 RNA polymerase subunit ABC10-beta; common to RNA polymerases I, II, and III +S000037369 CDS YOR210W 15 738320 738532 W 2011-02-03 1996-07-31 +S000005737 ORF Verified YOR211C MGM1 dynamin-related GTPase MGM1|MNA1 chromosome 15 L000001103 15 741569 738924 C 123 2011-02-03 1996-07-31|2006-10-03 Mitochondrial GTPase, present in complex with Ugo1p and Fzo1p; required for mitochondrial morphology, fusion, and genome maintenance; promotes membrane bending; exists as long and short form with different distributions; ratio of long to short forms is regulated by Psd1p; homolog of human OPA1 involved in autosomal dominant optic atrophy +S000037397 CDS YOR211C 15 741569 738924 C 2011-02-03 1996-07-31|2006-10-03 +S000005738 ORF Verified YOR212W STE4 G protein subunit beta|HMD2 chromosome 15 L000002114 15 742910 744181 W 124 2011-02-03 1996-07-31 G protein beta subunit; forms a dimer with Ste18p to activate mating signaling pathway, forms heterotrimer with Gpa1p and Ste18p to dampen signaling; pheromone-induced phosphorylation plays critical role in chemotropism; may recruit Rho1p to polarized growth site during mating; contains WD40 repeats +S000030085 CDS YOR212W 15 742910 744181 W 2011-02-03 1996-07-31 +S000005739 ORF Verified YOR213C SAS5 chromosome 15 L000004215 15 745281 744535 C 2011-02-03 1996-07-31 Subunit of the SAS complex (Sas2p, Sas4p, Sas5p); acetylates free histones and nucleosomes and regulates transcriptional silencing; stimulates Sas2p HAT activity +S000030141 CDS YOR213C 15 745281 744535 C 2011-02-03 1996-07-31 +S000005740 ORF Verified YOR214C SPR2 chromosome 15 S000029500|L000002021 15 746303 745593 C 2011-02-03 1996-07-31 Putative spore wall protein; expression increases during sporulation; not an essential gene; YOR214C has a paralog, SPO19, that arose from the whole genome duplication +S000030340 CDS YOR214C 15 746303 745593 C 2011-02-03 1996-07-31 +S000005741 ORF Verified YOR215C AIM41 chromosome 15 15 747282 746725 C 2011-02-03 1996-07-31 Protein of unknown function; the authentic protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays reduced frequency of mitochondrial genome loss +S000033625 CDS YOR215C 15 747282 746725 C 2011-02-03 1996-07-31 +S000005742 ORF Verified YOR216C RUD3 GRP1 chromosome 15 L000004185 15 748979 747525 C 2011-02-03 1996-07-31 Golgi matrix protein; involved in the structural organization of the cis-Golgi; interacts genetically with COG3 and USO1 +S000033741 CDS YOR216C 15 748979 747525 C 2011-02-03 1996-07-31 +S000005743 ORF Verified YOR217W RFC1 replication factor C subunit 1|CDC44 chromosome 15 L000000278 15 749301 751886 W 2011-02-03 1996-07-31 Subunit of heteropentameric Replication factor C (RF-C); RF-C is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon +S000033941 CDS YOR217W 15 749301 751886 W 2011-02-03 1996-07-31 +S000005744 ORF Dubious YOR218C chromosome 15 15 751895 751476 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene RFC1/YOR217W +S000033989 CDS YOR218C 15 751895 751476 C 2011-02-03 1996-07-31 +S000005745 ORF Verified YOR219C STE13 YCI1 chromosome 15 L000002120 15 755009 752214 C 129 2011-02-03 1996-07-31 Dipeptidyl aminopeptidase; Golgi integral membrane protein that cleaves on the carboxyl side of repeating -X-Ala- sequences, required for maturation of alpha factor, transcription is induced by a-factor +S000034857 CDS YOR219C 15 755009 752214 C 2011-02-03 1996-07-31 +S000005746 ORF Verified YOR220W RCN2 WSP1 chromosome 15 15 755328 756125 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; phosphorylated in response to alpha factor; protein abundance increases in response to DNA replication stress +S000033604 CDS YOR220W 15 755328 756125 W 2011-02-03 1996-07-31 +S000005747 ORF Verified YOR221C MCT1 [acyl-carrier-protein] S-malonyltransferase chromosome 15 15 757558 756476 C 2011-02-03 1996-07-31|2005-12-01 Predicted malonyl-CoA:ACP transferase; putative component of a type-II mitochondrial fatty acid synthase that produces intermediates for phospholipid remodeling +S000034462 CDS YOR221C 15 757558 756476 C 2011-02-03 1996-07-31|2005-12-01 +S000005748 ORF Verified YOR222W ODC2 mitochondrial 2-oxodicarboxylate carrier chromosome 15 15 758330 759253 W 2011-02-03 1996-07-31 Mitochondrial inner membrane transporter; 2-oxodicarboxylate transporter, exports 2-oxoadipate and 2-oxoglutarate from the mitochondrial matrix to the cytosol for use in lysine and glutamate biosynthesis and in lysine catabolism; ODC2 has a paralog, ODC1, that arose from the whole genome duplication +S000034614 CDS YOR222W 15 758330 759253 W 2011-02-03 1996-07-31 +S000007299 snoRNA_gene snR35 SNR35 chromosome 15 L000001973 15 759529 759326 C 2011-02-03 2000-05-19|2007-05-10 H/ACA box small nucleolar RNA (snoRNA); predicted to guide pseudouridylation of small subunit (SSU) rRNA at position 1191 +S000036764 noncoding_exon snR35 15 759529 759326 C 2011-02-03 2000-05-19|2007-05-10 +S000005749 ORF Verified YOR223W DSC3 chromosome 15 15 759782 760660 W 2011-02-03 1996-07-31 Subunit of the DSC ubiquitin ligase complex; protein of unknown function that localizes to the ER and vacuole lumen; overexpression affects endocytic protein trafficking; ortholog of fission yeast dsc3 +S000034765 CDS YOR223W 15 759782 760660 W 2011-02-03 1996-07-31 +S000005750 ORF Verified YOR224C RPB8 DNA-directed RNA polymerase core subunit RPB8|ABC14.5 chromosome 15 L000001682 15 761265 760825 C 2011-02-03 1996-07-31 RNA polymerase subunit ABC14.5; common to RNA polymerases I, II, and III +S000035658 CDS YOR224C 15 761265 760825 C 2011-02-03 1996-07-31 +S000005751 ORF Dubious YOR225W chromosome 15 15 761392 761721 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035836 CDS YOR225W 15 761392 761721 W 2011-02-03 1996-07-31 +S000005752 ORF Verified YOR226C ISU2 putative iron-binding protein ISU2|NUA2 chromosome 15 L000004770 15 762084 761614 C 2011-02-03 1996-07-31 Mitochondrial protein required for iron-sulfur protein synthesis; performs scaffolding function during Fe/S cluster assembly; involved in Fe-S cluster assembly for both mitochondrial and cytosolic proteins; protein abundance increases under DNA replication stress; ISU2 has a paralog, ISU1, that arose from the whole genome duplication; isu1 isu2 double mutant is inviable; human homolog ISCU implicated in mitochondrial myopathy, can complement isu1 isu2 double mutant +S000035907 CDS YOR226C 15 762084 761614 C 2011-02-03 1996-07-31 +S000005753 ORF Verified YOR227W HER1 chromosome 15 S000124018 15 762825 766565 W 2011-02-03 1996-07-31 Protein of unknown function; required for proliferation or remodeling of the ER that is caused by overexpression of Hmg2p; may interact with ribosomes, based on co-purification experiments; HER1 has a paralog, GIP3, that arose from the whole genome duplication +S000037838 CDS YOR227W 15 762825 766565 W 2011-02-03 1996-07-31 +S000118492 ARS ARS1523 ARSXV-767 chromosome 15 15 766605 766788 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000005754 ORF Verified YOR228C MCP1 chromosome 15 15 767777 766869 C 2011-02-03 1996-07-31 Mitochondrial protein of unknown function involved in lipid homeostasis; integral membrane protein that localizes to the mitochondrial outer membrane; involved in mitochondrial morphology; interacts genetically with MDM10, and other members of the ERMES complex; contains five predicted transmembrane domains +S000037878 CDS YOR228C 15 767777 766869 C 2011-02-03 1996-07-31 +S000077078 matrix_attachment_site ETC7 ETC7 chromosome 15 15 768106 768128 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; located between divergently transcribed genes MCP1 and WTM2 +S000005755 ORF Verified YOR229W WTM2 transcriptional modulator chromosome 15 L000003516 15 768409 769812 W 2011-02-03 1996-07-31 Transcriptional modulator; involved in regulation of meiosis, silencing, and expression of RNR genes; involved in response to replication stress; contains WD repeats; relocalizes to the cytosol in response to hypoxia; WTM2 has a paralog, UME1, that arose from the whole genome duplication +S000029954 CDS YOR229W 15 768409 769812 W 2011-02-03 1996-07-31 +S000005756 ORF Verified YOR230W WTM1 transcriptional modulator chromosome 15 L000003515 15 770800 772113 W 2011-02-03 1996-07-31 Transcriptional modulator; involved in regulation of meiosis, silencing, and expression of RNR genes; required for nuclear localization of the ribonucleotide reductase small subunit Rnr2p and Rnr4p; contains WD repeats +S000037695 CDS YOR230W 15 770800 772113 W 2011-02-03 1996-07-31 +S000005757 ORF Verified YOR231W MKK1 mitogen-activated protein kinase kinase MKK1|SSP32 chromosome 15 L000001117 15 772601 774127 W 2011-02-03 1996-07-31 MAPKK involved in the protein kinase C signaling pathway; involved in control of cell integrity; upon activation by Bck1p phosphorylates downstream target, Slt2p; functionally redundant with Mkk2p; MKK1 has a paralog, MKK2, that arose from the whole genome duplication +S000037755 CDS YOR231W 15 772601 774127 W 2011-02-03 1996-07-31 +S000028716 ORF Dubious YOR231C-A chromosome 15 15 773363 773163 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032687 CDS YOR231C-A 15 773363 773163 C 2011-02-03 2003-07-29 +S000005758 ORF Verified YOR232W MGE1 GRPE|YGE1 chromosome 15 L000000729|L000002638|L000001101 15 774573 775259 W 2011-02-03 1996-07-31 Mitochondrial matrix cochaperone; nucleotide release factor for Ssc1p in protein translocation and folding; also acts as cochaperone for Ssq1p in folding of Fe-S cluster proteins; acts as oxidative sensor to regulate mitochondrial Ssc1p; in presence of oxidative stress, dimeric Mge1p becomes a monomer and unable to regulate Ssc1p function; homolog of E. coli GrpE and human Mge1 (GRPEL1), which also responds to oxidative stress +S000030589 CDS YOR232W 15 774573 775259 W 2011-02-03 1996-07-31 +S000005759 ORF Verified YOR233W KIN4 putative serine/threonine protein kinase KIN4|KIN3|KIN31 chromosome 15 L000000904 15 775846 778248 W 2011-02-03 1996-07-31 Serine/threonine protein kinase; inhibits the mitotic exit network (MEN) when the spindle position checkpoint is activated; localized asymmetrically to mother cell cortex, spindle pole body and bud neck; KIN4 has a paralog, FRK1, that arose from the whole genome duplication +S000030703 CDS YOR233W 15 775846 778248 W 2011-02-03 1996-07-31 +S000005760 ORF Verified YOR234C RPL33B eL33|ribosomal 60S subunit protein L33B|L33e|rp47|Yl37|L37B|L33B|RPL37B chromosome 15 L000001729 15 779405 778555 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L33B; rpl33b null mutant exhibits normal growth while rpl33a rpl33b double null mutant is inviable; homologous to mammalian ribosomal protein L35A, no bacterial homolog; RPL33B has a paralog, RPL33A, that arose from the whole genome duplication +S000030771 CDS YOR234C 15 778859 778555 C 2011-02-03 1996-07-31 +S000030770 CDS YOR234C 15 779405 779387 C 2011-02-03 1996-07-31 +S000030772 intron YOR234C 15 779386 778860 C 2011-02-03 1996-07-31 +S000005761 ORF Dubious YOR235W IRC13 chromosome 15 15 779870 780184 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant displays increased levels of spontaneous Rad52 foci +S000031752 CDS YOR235W 15 779870 780184 W 2011-02-03 1996-07-31 +S000007294 snoRNA_gene snR17a SNR17A U3 chromosome 15 L000001966 15 780107 780596 W 136 2011-02-03 2000-05-19 Small nucleolar RNA (snoRNA) U3; part of Small ribosomal SubUnit (SSU) processosome; SNR17B also encodes snoRNA U3 +S000030175 intron snR17a 15 780121 780277 W 2011-02-03 2000-05-19 +S000030173 noncoding_exon snR17a 15 780107 780120 W 2011-02-03 2000-05-19 +S000030174 noncoding_exon snR17a 15 780278 780596 W 2011-02-03 2000-05-19 +S000005762 ORF Verified YOR236W DFR1 dihydrofolate reductase chromosome 15 L000000503 15 780906 781541 W 135 2011-02-03 1996-07-31 Dihydrofolate reductase involved in tetrahydrofolate biosynthesis; required for respiratory metabolism; mutation is functionally complemented by human DHFR +S000031908 CDS YOR236W 15 780906 781541 W 2011-02-03 1996-07-31 +S000005763 ORF Verified YOR237W HES1 oxysterol-binding protein related protein HES1|OSH5 chromosome 15 L000000767 15 781994 783298 W 2011-02-03 1996-07-31 Protein implicated in the regulation of ergosterol biosynthesis; one of a seven member gene family with a common essential function and non-essential unique functions; similar to human oxysterol binding protein (OSBP); SWAT-GFP and mCherry fusion proteins localize to the bud neck and vacuolar membrane; HES1 has a paralog, KES1, that arose from the whole genome duplication +S000032069 CDS YOR237W 15 781994 783298 W 2011-02-03 1996-07-31 +S000118493 ARS ARS1524 ARSXV-783 chromosome 15 15 783345 783563 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178186 ARS_consensus_sequence ARS1524 15 783386 783402 W 2014-11-18 2014-11-18 +S000005764 ORF Uncharacterized YOR238W chromosome 15 15 783677 784588 W 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000034067 CDS YOR238W 15 783677 784588 W 2011-02-03 2003-09-22|1996-07-31 +S000005765 ORF Verified YOR239W ABP140 TRM140|YOR240W chromosome 15 15 784857 786744 W 2011-02-03 2000-08-14|1996-07-31 AdoMet-dependent tRNA methyltransferase and actin binding protein; C-terminal domain is responsible for 3-methylcytidine modification of residue 32 of the tRNA anticodon loop of tRNA-Thr and tRNA-Ser and contains an S-adenosylmethionine (AdoMet) binding motif; N-terminal actin binding sequence interacts with actin filaments and localizes to actin patches and cables; N- and C-terminal domains are encoded in separate ORFs that are translated into one protein via a +1 frameshift +S000034147 CDS YOR239W 15 784857 785687 W 2011-02-03 2000-08-14|1996-07-31 +S000034148 CDS YOR239W 15 785689 786744 W 2011-02-03 2000-08-14 +S000034149 plus_1_translational_frameshift YOR239W 15 785688 785688 W 2011-02-03 2000-08-14 +S000005767 ORF Verified YOR241W MET7 tetrahydrofolate synthase|MET23 chromosome 15 L000001082 15 786995 788641 W 136 2011-02-03 1996-07-31 Folylpolyglutamate synthetase; catalyzes extension of the glutamate chains of the folate coenzymes, required for methionine synthesis and for maintenance of mitochondrial DNA; protein abundance increases in response to DNA replication stress +S000033075 CDS YOR241W 15 786995 788641 W 2011-02-03 1996-07-31 +S000005768 ORF Verified YOR242C SSP2 chromosome 15 L000004585 15 789857 788742 C 2011-02-03 1996-07-31 Sporulation specific protein that localizes to the spore wall; required for sporulation at a point after meiosis II and during spore wall formation; expression controlled by a tightly regulated middle-meiotic promoter that is activated by Ndt80p; translation of SSP2 mRNA is delayed, such that the mRNA is present as nuclear divisions are taking place but is not engaged by ribosomes until relatively late in meiotic development +S000033690 CDS YOR242C 15 789857 788742 C 2011-02-03 1996-07-31 +S000005769 ORF Verified YOR243C PUS7 pseudouridine synthase PUS7 chromosome 15 15 792241 790211 C 2011-02-03 1996-07-31 Pseudouridine synthase; catalyzes pseudouridylation at positions 35 and 56 in U2 snRNA, position 50 in 5S rRNA, position 13 in cytoplasmic tRNAs, and position 35 in pre-tRNA(Tyr); also pseudouridylates some mRNAs; relocates from nucleus to cytoplasm during heat shock and differentially modifies some mRNAs during heat shock; conserved in archaea, vertebrates, and some bacteria +S000033806 CDS YOR243C 15 792241 790211 C 2011-02-03 1996-07-31 +S000005770 ORF Verified YOR244W ESA1 NuA4 histone acetyltransferase complex catalytic subunit ESA1|KAT5|TAS1 chromosome 15 L000003952 15 792531 793868 W 2011-02-03 1996-07-31 Catalytic subunit of the histone acetyltransferase complex (NuA4); acetylates four conserved internal lysines of histone H4 N-terminal tail and can acetylate histone H2A; master regulator of cellular acetylation balance; required for cell cycle progression and transcriptional silencing at the rDNA locus and regulation of autophagy; human ortholog TIP60/KAT5 is implicated in cancer and other diseases, functionally complements lethality of the esa1 null mutation +S000033978 CDS YOR244W 15 792531 793868 W 2011-02-03 1996-07-31 +S000005771 ORF Verified YOR245C DGA1 diacylglycerol O-acyltransferase chromosome 15 15 795332 794076 C 2011-02-03 1996-07-31 Diacylglycerol acyltransferase; catalyzes the terminal step of triacylglycerol (TAG) formation, acylates diacylglycerol using acyl-CoA as an acyl donor; Lro1p and Dga1p can O-acylate ceramides; localized to lipid particles +S000034041 CDS YOR245C 15 795332 794076 C 2011-02-03 1996-07-31 +S000005772 ORF Verified YOR246C ENV9 chromosome 15 15 796793 795801 C 2011-02-03 1996-07-31 Protein proposed to be involved in vacuolar functions; mutant shows defect in CPY processing and defects in vacuolar morphology; has similarity to oxidoreductases, found in lipid particles; required for replication of Brome mosaic virus in S. cerevisiae, a model system for studying replication of positive-strand RNA viruses in their natural hosts +S000034930 CDS YOR246C 15 796793 795801 C 2011-02-03 1996-07-31 +S000005773 ORF Verified YOR247W SRL1 chromosome 15 L000004669 15 797676 798308 W 2011-02-03 1996-07-31 Mannoprotein that exhibits a tight association with the cell wall; required for cell wall stability in the absence of GPI-anchored mannoproteins; has a high serine-threonine content; expression is induced in cell wall mutants; SRL1 has a paralog, SVS1, that arose from the whole genome duplication +S000035223 CDS YOR247W 15 797676 798308 W 2011-02-03 1996-07-31 +S000005774 ORF Dubious YOR248W TOS11 chromosome 15 15 798013 798315 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036109 CDS YOR248W 15 798013 798315 W 2011-02-03 1996-07-31 +S000005775 ORF Verified YOR249C APC5 anaphase promoting complex subunit 5|RMC1 chromosome 15 L000004320 15 800731 798674 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the platform domain of the APC/C, based on structural analysis; relative distribution to nuclear foci decreases upon DNA replication stress +S000036169 CDS YOR249C 15 800731 798674 C 2011-02-03 1996-07-31 +S000005776 ORF Verified YOR250C CLP1 cleavage polyadenylation factor subunit CLP1 chromosome 15 L000004201 15 802307 800970 C 2011-02-03 1996-07-31 Component of the cleavage and polyadenylation factor I (CF I); CF 1, composed of the CF 1A complex (Rna14p, Rna15p, Clp1p, Pcf11p) and Hrp1, is involved in cleavage and polyadenylation of mRNA 3' ends; involved in both the endonucleolyitc cleavage and polyadenylation steps of mRNA 3'-end maturation and in gene looping which affects reinitiation of transcription +S000036960 CDS YOR250C 15 802307 800970 C 2011-02-03 1996-07-31 +S000005777 ORF Verified YOR251C TUM1 thiosulfate sulfurtransferase chromosome 15 15 803464 802550 C 2011-02-03 1996-07-31 Rhodanese domain sulfur transferase; accepts persulfite from Nfs1p and transfers it to Uba4p in the pathway for 2-thiolation of the wobble uridine base of tRNAs; also stimulates sulfur transfer by Nfs1p; may be mitochondrially localized +S000037035 CDS YOR251C 15 803464 802550 C 2011-02-03 1996-07-31 +S000005778 ORF Verified YOR252W TMA16 RBF17 chromosome 15 15 803667 804203 W 2011-02-03 1996-07-31|2006-01-05 Protein of unknown function that associates with ribosomes +S000037174 CDS YOR252W 15 803667 804203 W 2011-02-03 1996-07-31|2006-01-05 +S000005779 ORF Verified YOR253W NAT5 peptide alpha-N-acetyltransferase subunit NAT5|NAA50|ROG2|ARD2 chromosome 15 15 804377 804907 W 2011-02-03 1996-07-31 Subunit of protein N-terminal acetyltransferase NatA; NatA is comprised of Nat1p, Ard1p, and Nat5p; N-terminally acetylates many proteins, which influences multiple processes such as the cell cycle, heat-shock resistance, mating, sporulation, and telomeric silencing +S000029833 CDS YOR253W 15 804377 804907 W 2011-02-03 1996-07-31 +S000005780 ORF Verified YOR254C SEC63 protein-transporting protein SEC63|PTL1 chromosome 15 L000001854|L000001269 15 807023 805032 C 2011-02-03 1996-07-31 Essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; other members are Sec62p, Sec66p, and Sec72p +S000029878 CDS YOR254C 15 807023 805032 C 2011-02-03 1996-07-31 +S000005781 ORF Verified YOR255W OSW1 chromosome 15 15 807271 808107 W 2011-02-03 1996-07-31 Protein involved in sporulation; required for the construction of the outer spore wall layers; required for proper localization of Spo14p +S000030954 CDS YOR255W 15 807271 808107 W 2011-02-03 1996-07-31 +S000005782 ORF Verified YOR256C TRE2 putative zinc metalloprotease chromosome 15 15 810683 808254 C 2006-01-05 1996-07-31|2011-02-03 Transferrin receptor-like protein; functions with Tre1p to regulate ubiquitination and vacuolar degradation of the metal transporter Smf1p; inviability of null mutant in systematic studies is due to proximity to CDC31; TRE2 has a paralog, TRE1, that arose from the whole genome duplication +S000030990 CDS YOR256C 15 810683 808254 C 2006-01-05 1996-07-31|2011-02-03 +S000005783 ORF Verified YOR257W CDC31 centrin|DSK1 chromosome 15 L000000269 15 811008 811493 W 147 2006-01-05 1996-07-31 Calcium-binding component of the spindle pole body (SPB) half-bridge; required for SPB duplication in mitosis and meiosis II; homolog of mammalian centrin; binds multiubiquitinated proteins and is involved in proteasomal protein degradation +S000031201 CDS YOR257W 15 811008 811493 W 2006-01-05 1996-07-31 +S000005784 ORF Verified YOR258W HNT3 DNA 5'-adenosine monophosphate hydrolase chromosome 15 15 811671 812324 W 2006-01-05 1996-07-31 DNA 5' AMP hydrolase involved in DNA repair; member of the histidine triad (HIT) superfamily of nucleotide-binding proteins; homolog of Aprataxin, a Hint related protein that is mutated in individuals with ataxia with oculomotor apraxia; relative distribution to nuclear foci decreases upon DNA replication stress +S000032199 CDS YOR258W 15 811671 812324 W 2006-01-05 1996-07-31 +S000005785 ORF Verified YOR259C RPT4 proteasome regulatory particle base subunit RPT4|SUG2|PCS1|CRL13 chromosome 15 L000003423|L000003107|L000000413 15 813708 812395 C 143 2006-01-05 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in degradation of ubiquitinated substrates; contributes preferentially to ERAD; required for spindle pole body duplication; mainly nuclear localization +S000032229 CDS YOR259C 15 813708 812395 C 2006-01-05 1996-07-31 +S000005786 ORF Verified YOR260W GCD1 translation initiation factor eIF2B subunit gamma|TRA3 chromosome 15 L000000670 15 813984 815720 W 143 2006-01-05 1996-07-31 Gamma subunit of the translation initiation factor eIF2B; the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression +S000032270 CDS YOR260W 15 813984 815720 W 2006-01-05 1996-07-31 +S000005787 ORF Verified YOR261C RPN8 proteasome regulatory particle lid subunit RPN8 chromosome 15 L000004308 15 816931 815915 C 2006-01-05 1996-07-31 Essential non-ATPase regulatory subunit of the 26S proteasome; has similarity to the human p40 proteasomal subunit and to another S. cerevisiae regulatory subunit, Rpn11p +S000032281 CDS YOR261C 15 816931 815915 C 2006-01-05 1996-07-31 +S000005788 ORF Verified YOR262W GPN2 putative GTPase GPN2 chromosome 15 15 817292 818335 W 2011-02-03 1996-07-31 Putative GTPase with a role in biogenesis of RNA pol II and polIII; may be involved in assembly of RNA polymerases II and III and in their transport into the nucleus; contains a Gly-Pro-Asn motif in the G domain; similar to Npa3p and Gpn3p; highly conserved across species and homologous to human gene GPN2/ATPBD1B; required for establishment of sister chromatid cohesion +S000033195 CDS YOR262W 15 817292 818335 W 2011-02-03 1996-07-31 +S000005790 ORF Verified YOR264W DSE3 chromosome 15 15 818866 820158 W 2011-02-03 1996-07-31 Daughter cell-specific protein, may help establish daughter fate; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000033310 CDS YOR264W 15 818866 820158 W 2011-02-03 1996-07-31 +S000005789 ORF Dubious YOR263C chromosome 15 15 819164 818757 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF DES3/YOR264W +S000033220 CDS YOR263C 15 819164 818757 C 2011-02-03 1996-07-31 +S000005791 ORF Verified YOR265W RBL2 chromosome 15 L000002910 15 820454 820774 W 2011-02-03 1996-07-31 Protein involved in microtubule morphogenesis; required for protection from excess free beta-tubulin; proposed to be involved the folding of beta-tubulin; similar to mouse beta-tubulin cofactor A; protein abundance increases in response to DNA replication stress +S000034224 CDS YOR265W 15 820454 820774 W 2011-02-03 1996-07-31 +S000005792 ORF Verified YOR266W PNT1 chromosome 15 L000001460 15 821023 822294 W 2011-02-03 1996-07-31 Mitochondrial integral inner membrane protein; involved in membrane insertion of C-terminus of Cox2p, interacts genetically and physically with Cox18p; deletion mutant sensitive to the anti-Pneumocystis carinii drug pentamidine +S000034354 CDS YOR266W 15 821023 822294 W 2011-02-03 1996-07-31 +S000005793 ORF Verified YOR267C HRK1 putative serine/threonine protein kinase HRK1 chromosome 15 15 824867 822588 C 2011-02-03 1996-07-31 Protein kinase; implicated in activation of the plasma membrane H(+)-ATPase Pma1p in response to glucose metabolism; plays a role in ion homeostasis; protein abundance increases in response to DNA replication stress +S000034383 CDS YOR267C 15 824867 822588 C 2011-02-03 1996-07-31 +S000005794 ORF Uncharacterized YOR268C chromosome 15 15 825932 825534 C 2011-02-03 1996-07-31 Putative protein of unknown function; sporulation is abnormal in homozygous diploid; SWAT-GFP fusion protein localizes to the nucleus; YOR268C is not an essential gene +S000035396 CDS YOR268C 15 825932 825534 C 2011-02-03 1996-07-31 +S000005795 ORF Verified YOR269W PAC1 chromosome 15 L000001328 15 826385 827869 W 2011-02-03 1996-07-31 Involved in nuclear migration, part of the dynein/dynactin pathway; targets dynein to microtubule tips, which is necessary for sliding of microtubules along bud cortex; serves at interface between dynein's ATPase site and its microtubule binding stalk, causing individual dynein motors to remain attached to microtubules for long periods; synthetic lethal with bni1; homolog of human LIS1, mutations in which cause the severe brain disorder lissencephaly +S000035573 CDS YOR269W 15 826385 827869 W 2011-02-03 1996-07-31 +S000005796 ORF Verified YOR270C VPH1 H(+)-transporting V0 sector ATPase subunit a chromosome 15 L000002467 15 830574 828052 C 2011-02-03 1996-07-31 Subunit a of vacuolar-ATPase V0 domain; one of two isoforms (Vph1p and Stv1p); Vph1p is located in V-ATPase complexes of the vacuole while Stv1p is located in V-ATPase complexes of the Golgi and endosomes; relative distribution to the vacuolar membrane decreases upon DNA replication stress; human homolog ATP6V0A4 implicated in renal tubular acidosis, can complement yeast null mutant +S000036537 CDS YOR270C 15 830574 828052 C 2011-02-03 1996-07-31 +S000005797 ORF Uncharacterized YOR271C FSF1 chromosome 15 15 832042 831059 C 2011-02-03 1996-07-31 Putative protein; predicted to be an alpha-isopropylmalate carrier; belongs to the sideroblastic-associated protein family; non-tagged protein is detected in purified mitochondria; likely to play a role in iron homeostasis +S000036610 CDS YOR271C 15 832042 831059 C 2011-02-03 1996-07-31 +S000006497 snoRNA_gene snR8 SNR8 chromosome 15 L000001963 15 832332 832521 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U960 and U986 +S000034324 noncoding_exon snR8 15 832332 832521 W 2011-02-03 2000-05-19 +S000005798 ORF Verified YOR272W YTM1 CST14 chromosome 15 L000003547|L000002998|S000029121 15 832813 834195 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; forms a complex with Nop7p and Erb1p that is required for maturation of the large ribosomal subunit; has seven C-terminal WD repeats +S000037380 CDS YOR272W 15 832813 834195 W 2011-02-03 1996-07-31 +S000005799 ORF Verified YOR273C TPO4 chromosome 15 15 836431 834452 C 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; recognizes spermine, putrescine, and spermidine; localizes to the plasma membrane +S000037433 CDS YOR273C 15 836431 834452 C 2011-02-03 1996-07-31 +S000005800 ORF Verified YOR274W MOD5 tRNA dimethylallyltransferase|[MOD+] chromosome 15 L000001131 15 837674 838960 W 2011-02-03 1996-07-31 Delta 2-isopentenyl pyrophosphate:tRNA isopentenyl transferase; required for biosynthesis of isopentenyladenosine in mitochondrial and cytoplasmic tRNAs; also has a role in tRNA gene-mediated silencing; gene encodes two isozymic forms; converts to a prion form, prion conversion contributes to azole antifungal resistance by upregulating ergosterol biosynthesis; homolog of human TRIT1, a mutation in which is associated with severe combined respiratory chain defects +S000030255 CDS YOR274W 15 837674 838960 W 2011-02-03 1996-07-31 +S000005801 ORF Verified YOR275C RIM20 chromosome 15 15 841069 839084 C 2011-02-03 1996-07-31 Protein involved in proteolytic activation of Rim101p; part of response to alkaline pH; PalA/AIP1/Alix family member; interaction with the ESCRT-III subunit Snf7p suggests a relationship between pH response and multivesicular body formation +S000030312 CDS YOR275C 15 841069 839084 C 2011-02-03 1996-07-31 +S000005802 ORF Verified YOR276W CAF20 p20|CAP20|CAF2 chromosome 15 L000000208|L000003291 15 841333 841818 W 2011-02-03 1996-07-31 Phosphoprotein of the mRNA cap-binding complex; involved in translational control; repressor of cap-dependent translation initiation; competes with eIF4G for binding to eIF4E +S000030543 CDS YOR276W 15 841333 841818 W 2011-02-03 1996-07-31 +S000005803 ORF Dubious YOR277C chromosome 15 15 841823 841515 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene CAF20 +S000031370 CDS YOR277C 15 841823 841515 C 2011-02-03 1996-07-31 +S000007296 snoRNA_gene snR31 SNR31 chromosome 15 L000001969 15 842182 841958 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at position U999 +S000036752 noncoding_exon snR31 15 842182 841958 C 2011-02-03 2000-05-19 +S000007291 snoRNA_gene snR5 SNR5 chromosome 15 L000001960 15 842403 842606 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U1004 and U1124 +S000034319 noncoding_exon snR5 15 842403 842606 W 2011-02-03 2000-05-19 +S000005804 ORF Verified YOR278W HEM4 uroporphyrinogen-III synthase HEM4|SLU2 chromosome 15 L000002903 15 842817 843644 W 2011-02-03 1996-07-31 Uroporphyrinogen III synthase; catalyzes the conversion of hydroxymethylbilane to uroporphyrinogen III, the fourth step in heme biosynthesis; deficiency in the human homolog can result in the disease congenital erythropoietic porphyria +S000031577 CDS YOR278W 15 842817 843644 W 2011-02-03 1996-07-31 +S000005805 ORF Verified YOR279C RFM1 chromosome 15 15 844630 843698 C 2011-02-03 1996-07-31 Component of the Sum1p-Rfm1p-Hst1p complex; Rfm1p tethers the Hst1p histone deacetylase to the DNA-binding protein Sum1p; complex is involved in transcriptional repression of middle sporulation genes and in initiation of DNA replication +S000031617 CDS YOR279C 15 844630 843698 C 2011-02-03 1996-07-31 +S000005806 ORF Verified YOR280C FSH3 putative serine hydrolase chromosome 15 15 845792 844992 C 2011-02-03 1996-07-31 Putative serine hydrolase; likely target of Cyc8p-Tup1p-Rfx1p transcriptional regulation; sequence is similar to S. cerevisiae Fsh1p and Fsh2p and the human candidate tumor suppressor OVCA2 +S000031815 CDS YOR280C 15 845792 844992 C 2011-02-03 1996-07-31 +S000005808 ORF Dubious YOR282W chromosome 15 15 847000 847320 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps essential, verified gene PLP2/YOR281C +S000032900 CDS YOR282W 15 847000 847320 W 2011-02-03 1996-07-31 +S000005807 ORF Verified YOR281C PLP2 chromosome 15 15 847129 846269 C 2011-02-03 1996-07-31 Protein that interacts with the CCT complex to stimulate actin folding; has similarity to phosducins; null mutant lethality is complemented by mouse phosducin-like protein MgcPhLP; CCT is short for chaperonin containing TCP-1; essential gene +S000031925 CDS YOR281C 15 847129 846269 C 2011-02-03 1996-07-31 +S000005809 ORF Verified YOR283W phosphoglycerate mutase chromosome 15 15 847453 848145 W 2011-02-03 1996-07-31 Phosphatase with a broad substrate specificity; has some similarity to GPM1/YKL152C, a phosphoglycerate mutase; YOR283W is not an essential gene +S000032989 CDS YOR283W 15 847453 848145 W 2011-02-03 1996-07-31 +S000005810 ORF Verified YOR284W HUA2 chromosome 15 15 848478 849209 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; computational analysis of large-scale protein-protein interaction data suggests a possible role in actin patch assembly +S000033085 CDS YOR284W 15 848478 849209 W 2011-02-03 1996-07-31 +S000005811 ORF Verified YOR285W RDL1 thiosulfate sulfurtransferase RDL1 chromosome 15 15 849635 850054 W 2011-02-03 1996-07-31 Thiosulfate sulfurtransferase; contains a rhodanese-like domain; localized to the mitochondrial outer membrane; protein abundance increases in response to DNA replication stress; similar to the human TSTD gene +S000033844 CDS YOR285W 15 849635 850054 W 2011-02-03 1996-07-31 +S000005812 ORF Verified YOR286W RDL2 thiosulfate sulfurtransferase RDL2|AIM42|FMP31 chromosome 15 15 850280 850729 W 2011-02-03 1996-07-31 Protein with rhodanese activity; contains a rhodanese-like domain similar to Rdl1p, Uba4p, Tum1p, and Ych1p; overexpression causes a cell cycle delay; null mutant displays elevated frequency of mitochondrial genome loss +S000033993 CDS YOR286W 15 850280 850729 W 2011-02-03 1996-07-31 +S000005813 ORF Verified YOR287C RRP36 rRNA-processing protein RRP36 chromosome 15 15 851839 850937 C 2011-02-03 1996-07-31 Component of 90S preribosomes; involved in early cleavages of the 35S pre-rRNA and in production of the 40S ribosomal subunit +S000034025 CDS YOR287C 15 851839 850937 C 2011-02-03 1996-07-31 +S000005814 ORF Verified YOR288C MPD1 protein disulfide isomerase MPD1 chromosome 15 L000003038 15 853077 852121 C 2011-02-03 1996-07-31 Member of the protein disulfide isomerase (PDI) family; interacts with and inhibits the chaperone activity of Cne1p; MPD1 overexpression in a pdi1 null mutant suppresses defects in Pdi1p functions such as carboxypeptidase Y maturation +S000034906 CDS YOR288C 15 853077 852121 C 2011-02-03 1996-07-31 +S000005815 ORF Uncharacterized YOR289W chromosome 15 15 853357 854112 W 2011-02-03 1996-07-31 Putative protein of unknown function; transcription induced by the unfolded protein response; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000035198 CDS YOR289W 15 853357 854112 W 2011-02-03 1996-07-31 +S000006525 tRNA_gene tA(UGC)O chromosome 15 L000003714 15 854259 854187 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine +S000034894 noncoding_exon tA(UGC)O 15 854259 854187 C 2011-02-03 2000-05-19 +S000007178 long_terminal_repeat YORWsigma3 chromosome 15 15 854275 854614 W 2011-02-03 2000-05-19 Ty3 LTR +S000005816 ORF Verified YOR290C SNF2 SWI/SNF catalytic subunit SNF2|TYE3|SWI2|HAF1|GAM1 chromosome 15 L000001945 15 860258 855147 C 2011-02-03 1996-07-31 Catalytic subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; contains DNA-stimulated ATPase activity; functions interdependently in transcriptional activation with Snf5p and Snf6p +S000036380 CDS YOR290C 15 860258 855147 C 2011-02-03 1996-07-31 +S000005817 ORF Verified YOR291W YPK9 putative acid anhydride hydrolase chromosome 15 15 861175 865593 W 2011-02-03 1996-07-31 Vacuolar protein with a possible role in sequestering heavy metals; has similarity to the type V P-type ATPase Spf1p; homolog of human ATP13A2 (PARK9), mutations in which are associated with Parkinson disease and Kufor-Rakeb syndrome +S000037072 CDS YOR291W 15 861175 865593 W 2011-02-03 1996-07-31 +S000005818 ORF Uncharacterized YOR292C chromosome 15 15 866582 865653 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; YOR292C is not an essential gene +S000037114 CDS YOR292C 15 866582 865653 C 2011-02-03 1996-07-31 +S000005819 ORF Verified YOR293W RPS10A eS10|ribosomal 40S subunit protein S10A|S10e|S10A chromosome 15 L000004475 15 867098 867852 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S10, no bacterial homolog; RPS10A has a paralog, RPS10B, that arose from the whole genome duplication; mutations in the human homolog associated with Diamond-Blackfan anemia +S000037299 CDS YOR293W 15 867098 867149 W 2011-02-03 1996-07-31 +S000037300 CDS YOR293W 15 867587 867852 W 2011-02-03 1996-07-31 +S000037301 intron YOR293W 15 867150 867586 W 2011-02-03 1996-07-31 +S000028858 ORF Uncharacterized YOR293C-A chromosome 15 15 868147 867998 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034572 CDS YOR293C-A 15 868147 867998 C 2011-02-03 2003-07-29 +S000005820 ORF Verified YOR294W RRS1 chromosome 15 15 868340 868951 W 2011-02-03 1996-07-31 Essential protein that binds ribosomal protein L11; required for nuclear export of the 60S pre-ribosomal subunit during ribosome biogenesis; localizes to the nucleolus and in foci along nuclear periphery; cooperates with Ebp2p and Mps3p to mediate telomere clustering by binding Sir4p, but is not involved in telomere tethering; mouse homolog shows altered expression in Huntington's disease model mice +S000029945 CDS YOR294W 15 868340 868951 W 2011-02-03 1996-07-31 +S000005821 ORF Verified YOR295W UAF30 chromosome 15 15 869208 869894 W 2011-02-03 1996-07-31 Subunit of UAF (upstream activation factor) complex; UAF is an RNA polymerase I specific transcription stimulatory factor composed of Uaf30p, Rrn5p, Rrn9p, Rrn10p, histones H3 and H4; targeting factor for the UAF that facilitates activation of many rDNA genes; deletion decreases cellular growth rate; UAF30 has a paralog, TRI1, that arose from the whole genome duplication +S000030055 CDS YOR295W 15 869208 869894 W 2011-02-03 1996-07-31 +S000005822 ORF Uncharacterized YOR296W chromosome 15 15 870202 874071 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; expressed during copper starvation; YOR296W is not an essential gene +S000031083 CDS YOR296W 15 870202 874071 W 2011-02-03 1996-07-31 +S000118494 ARS ARS1526 ARSXV-874 chromosome 15 15 874251 874412 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000005823 ORF Verified YOR297C TIM18 chromosome 15 S000007448 15 875321 874743 C 2011-02-03 1996-07-31|2011-02-03 Component of the mitochondrial TIM22 complex; involved in insertion of polytopic proteins into the inner membrane; may mediate assembly or stability of the complex +S000031114 CDS YOR297C 15 875321 874743 C 2011-02-03 1996-07-31|2011-02-03 +S000005824 ORF Verified YOR298W MUM3 chromosome 15 15 875599 877038 W 2011-02-03 1996-07-31 Protein of unknown function involved in outer spore wall organization; has similarity to the tafazzins superfamily of acyltransferases +S000031297 CDS YOR298W 15 875599 877038 W 2011-02-03 1996-07-31 +S000007253 ORF Verified YOR298C-A MBF1 SUF13 chromosome 15 L000002160|L000004688 15 877685 877230 C 165 2011-02-03 2004-02-12|1999-07-17 Transcriptional coactivator; bridges the DNA-binding region of Gcn4p and TATA-binding protein Spt15p; suppressor of frameshift mutations; protein abundance increases in response to DNA replication stress +S000030828 CDS YOR298C-A 15 877685 877230 C 2011-02-03 2004-02-12|1999-07-17 +S000005825 ORF Verified YOR299W BUD7 exomer complex subunit chromosome 15 L000003554 15 878435 880675 W 2011-02-03 1996-07-31 Member of the ChAPs family (Chs5p-Arf1p-binding proteins); members include Bch1p, Bch2p, Bud7p, and Chs6p; ChAPs family proteins form the exomer complex with Chs5p to mediate export of specific cargo proteins, including Chs3p, from the Golgi to the plasma membrane; BUD7 has a paralog, BCH1, that arose from the whole genome duplication +S000031429 CDS YOR299W 15 878435 880675 W 2011-02-03 1996-07-31 +S000005826 ORF Dubious YOR300W HUF1 chromosome 15 15 880575 880883 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps with verified gene BUD7/YOR299W; mutation affects bipolar budding and bud site selection, though phenotype could be due to the mutation's effects on BUD7 +S000036845 CDS YOR300W 15 880575 880883 W 2011-02-03 1996-07-31 +S000005827 ORF Verified YOR301W RAX1 chromosome 15 15 880965 882272 W 2011-02-03 1996-07-31 Protein involved in bud site selection during bipolar budding; localization requires Rax2p; has similarity to members of the insulin-related peptide superfamily +S000037565 CDS YOR301W 15 880965 882272 W 2011-02-03 1996-07-31 +S000005828 ORF Verified YOR302W chromosome 15 15 882765 882842 W 2011-02-03 1996-07-31 CPA1 uORF; Arginine attenuator peptide, regulates translation of the CPA1 mRNA +S000037642 CDS YOR302W 15 882765 882842 W 2011-02-03 1996-07-31 +S000005829 ORF Verified YOR303W CPA1 carbamoyl-phosphate synthase (glutamine-hydrolyzing) CPA1 chromosome 15 L000000399 15 882899 884134 W 161 2011-02-03 1996-07-31 Small subunit of carbamoyl phosphate synthetase; carbamoyl phosphate synthetase catalyzes a step in the synthesis of citrulline, an arginine precursor; translationally regulated by an attenuator peptide encoded by YOR302W within the CPA1 mRNA 5'-leader +S000037697 CDS YOR303W 15 882899 884134 W 2011-02-03 1996-07-31 +S000005831 ORF Verified YOR304W ISW2 DNA translocase chromosome 15 L000004448 15 884514 887876 W 2011-02-03 1996-07-31 ATP-dependent DNA translocase involved in chromatin remodeling; ATPase component that, with Itc1p, forms a complex required for repression of a-specific genes, INO1, and early meiotic genes during mitotic growth; the Isw2 complex exhibits basal levels of chromatin binding throughout the genome as well as target-specific chromatin interactions; targeted by Ume6p- and Sua7p-dependent DNA looping to many loci genome-wide +S000037758 CDS YOR304W 15 884514 887876 W 2011-02-03 1996-07-31 +S000005830 ORF Verified YOR304C-A BIL1 EDO1 chromosome 15 15 888750 888520 C 2011-02-03 1997-07-01|1996-07-31 Protein that binds Bud6p and has a role in actin cable assembly; involved in the Bnr1p-dependent pathway of cable assembly; localizes to bud tip and bud neck +S000032659 CDS YOR304C-A 15 888750 888520 C 2011-02-03 1997-07-01|1996-07-31 +S000005832 ORF Verified YOR305W RRG7 chromosome 15 15 889022 889750 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO); YOR305W is not an essential gene +S000030593 CDS YOR305W 15 889022 889750 W 2011-02-03 1996-07-31 +S000005833 ORF Verified YOR306C MCH5 chromosome 15 15 891432 889867 C 2011-02-03 1996-07-31|2011-02-03 Plasma membrane riboflavin transporter; facilitates the uptake of vitamin B2; required for FAD-dependent processes; sequence similarity to mammalian monocarboxylate permeases, however mutants are not deficient in monocarboxylate transport +S000030631 CDS YOR306C 15 891432 889867 C 2011-02-03 1996-07-31|2011-02-03 +S000005834 ORF Verified YOR307C SLY41 chromosome 15 L000001925 15 894092 892731 C 2011-02-03 1996-07-31 Protein involved in ER-to-Golgi transport +S000030776 CDS YOR307C 15 894092 892731 C 2011-02-03 1996-07-31 +S000005835 ORF Verified YOR308C SNU66 U4/U6-U5 snRNP complex subunit SNU66 chromosome 15 15 896387 894624 C 2011-02-03 1996-07-31 Component of the U4/U6.U5 snRNP complex; involved in pre-mRNA splicing via spliceosome; also required for pre-5S rRNA processing and may act in concert with Rnh70p; has homology to human SART-1 +S000030861 CDS YOR308C 15 896387 894624 C 2011-02-03 1996-07-31 +S000005836 ORF Dubious YOR309C chromosome 15 15 897078 896698 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene NOP58 +S000031849 CDS YOR309C 15 897078 896698 C 2011-02-03 1996-07-31 +S000005837 ORF Verified YOR310C NOP58 RNA-processing protein NOP58|NOP5 chromosome 15 L000004000 15 898360 896825 C 2011-02-03 1996-07-31 Protein involved in producing mature rRNAs and snoRNAs; involved in pre-rRNA processing, 18S rRNA synthesis, and snoRNA synthesis; component of the small subunit processome complex, which is required for processing of pre-18S rRNA +S000031855 CDS YOR310C 15 898360 896825 C 2011-02-03 1996-07-31 +S000005838 ORF Verified YOR311C DGK1 diacylglycerol kinase|HSD1 chromosome 15 15 899928 899056 C 2011-02-03 1996-07-31 Diacylglycerol kinase; localized to the endoplasmic reticulum (ER); overproduction induces enlargement of ER-like membrane structures and suppresses a temperature-sensitive sly1 mutation; contains a CTP transferase domain +S000032742 CDS YOR311C 15 899928 899056 C 2011-02-03 1996-07-31 +S000005839 ORF Verified YOR312C RPL20B eL20|ribosomal 60S subunit protein L20B|L20e|L20B|L18B|RPL18A1 chromosome 15 L000003148 15 901194 900250 C 2011-02-03 1996-07-31|2007-07-10 Ribosomal 60S subunit protein L20B; homologous to mammalian ribosomal protein L18A, no bacterial homolog; RPL20B has a paralog, RPL20A, that arose from the whole genome duplication +S000032858 CDS YOR312C 15 900767 900250 C 2011-02-03 1996-07-31 +S000032857 CDS YOR312C 15 901194 901194 C 2011-02-03 1996-07-31|2007-07-10 +S000032859 intron YOR312C 15 901193 900768 C 2011-02-03 1996-07-31|2007-07-10 +S000005840 ORF Verified YOR313C SPS4 chromosome 15 L000002026 15 902874 901858 C 2011-02-03 1996-07-31 Protein whose expression is induced during sporulation; not required for sporulation; heterologous expression in E. coli induces the SOS response that senses DNA damage +S000032971 CDS YOR313C 15 902874 901858 C 2011-02-03 1996-07-31 +S000005841 ORF Dubious YOR314W chromosome 15 15 903043 903372 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033076 CDS YOR314W 15 903043 903372 W 2011-02-03 1996-07-31 +S000007629 ORF Dubious YOR314W-A chromosome 15 15 904458 904568 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037260 CDS YOR314W-A 15 904458 904568 W 2011-02-03 2001-02-26 +S000005842 ORF Verified YOR315W SFG1 chromosome 15 15 904760 905800 W 2011-02-03 1996-07-31 Nuclear protein putative transcription factor; required for growth of superficial pseudohyphae (which do not invade the agar substrate) but not for invasive pseudohyphal growth; may act together with Phd1p; potential Cdc28p substrate +S000033756 CDS YOR315W 15 904760 905800 W 2011-02-03 1996-07-31 +S000005843 ORF Verified YOR316C COT1 metal cation transporter COT1 chromosome 15 L000000382 15 907555 906236 C 2011-02-03 1996-07-31 Vacuolar transporter that mediates zinc transport into the vacuole; overexpression confers resistance to cobalt and rhodium; protein abundance increases in response to DNA replication stress; COT1 has a paralog, ZRC1, that arose from the whole genome duplication +S000033807 CDS YOR316C 15 907555 906236 C 2011-02-03 1996-07-31 +S000028584 ORF Uncharacterized YOR316C-A chromosome 15 15 907935 907726 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031332 CDS YOR316C-A 15 907935 907726 C 2011-02-03 2003-07-29 +S000118495 ARS ARS1528 ARSXV-908 chromosome 15 15 908296 908544 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178187 ARS_consensus_sequence ARS1528 15 908306 908322 W 2014-11-18 2014-11-18 +S000005844 ORF Verified YOR317W FAA1 long-chain fatty acid-CoA ligase FAA1 chromosome 15 L000000594 15 909343 911445 W 2011-02-03 1996-07-31 Long chain fatty acyl-CoA synthetase; activates fatty acids with a preference for C12:0-C16:0 chain lengths; role in the competitive import of long-chain fatty acids and sphingoid long-chain bases; accounts for most acyl-CoA synthetase activity; localizes to lipid particles and the plasma membrane; role in sphingolipid-to-glycerolipid metabolism; forms ER foci upon replication stress; faa1 faa4 double null complemented by any of human ACSBG1, ACSL1, 3, 4, 5, 6, SLC27A2, or 4 +S000034010 CDS YOR317W 15 909343 911445 W 2011-02-03 1996-07-31 +S000005845 ORF Dubious YOR318C chromosome 15 15 912436 911784 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcript is predicted to be spliced but there is no evidence that it is spliced in vivo +S000034044 CDS YOR318C 15 912085 911784 C 2011-02-03 1996-07-31 +S000034043 CDS YOR318C 15 912436 912433 C 2011-02-03 1996-07-31 +S000034045 intron YOR318C 15 912432 912086 C 2011-02-03 1996-07-31 +S000005846 ORF Verified YOR319W HSH49 U2 snRNP complex subunit HSH49 chromosome 15 L000003014 15 912822 913463 W 2011-02-03 1996-07-31 U2-snRNP associated splicing factor; similar to the mammalian splicing factor SAP49; proposed to function as a U2-snRNP assembly factor along with Hsh155p and binding partner Cus1p; contains two RNA recognition motifs (RRM) +S000035030 CDS YOR319W 15 912822 913463 W 2011-02-03 1996-07-31 +S000005847 ORF Verified YOR320C GNT1 glucose N-acetyltransferase chromosome 15 15 915094 913619 C 2011-02-03 1996-07-31 N-acetylglucosaminyltransferase; capable of modification of N-linked glycans in the Golgi apparatus +S000035936 CDS YOR320C 15 915094 913619 C 2011-02-03 1996-07-31 +S000005848 ORF Verified YOR321W PMT3 dolichyl-phosphate-mannose-protein mannosyltransferase PMT3 chromosome 15 L000002622 15 916030 918291 W 2011-02-03 1996-07-31 Protein O-mannosyltransferase; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; acts in a complex with Pmt5p, can instead interact with Pmt1p in some conditions; antifungal drug target; PMT3 has a paralog, PMT2, that arose from the whole genome duplication +S000036207 CDS YOR321W 15 916030 918291 W 2011-02-03 1996-07-31 +S000005849 ORF Verified YOR322C LDB19 ART1 chromosome 15 15 921062 918606 C 2011-02-03 1996-07-31 Alpha-arrestin involved in ubiquitin-dependent endocytosis; regulates endocytosis of plasma membrane proteins by recruiting the ubiquitin ligase Rsp5p to its targets; involved in the basal internalization and turnover of alpha-factor receptor Ste2p; recruits ubiquitin ligase Rsp5p to Ste2p via its 2 PPXY motifs; inhibited by Npr1p-mediated phosphorylation, which affects translocation between the cytosol and the plasma membrane +S000036901 CDS YOR322C 15 921062 918606 C 2011-02-03 1996-07-31 +S000005850 ORF Verified YOR323C PRO2 glutamate-5-semialdehyde dehydrogenase chromosome 15 L000001492 15 922905 921535 C 175 2011-02-03 1996-07-31 Gamma-glutamyl phosphate reductase; catalyzes the second step in proline biosynthesis +S000036961 CDS YOR323C 15 922905 921535 C 2011-02-03 1996-07-31 +S000005852 ORF Dubious YOR325W chromosome 15 15 924577 925050 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF FRT1 +S000037825 CDS YOR325W 15 924577 925050 W 2011-02-03 1996-07-31 +S000005851 ORF Verified YOR324C FRT1 HPH1 chromosome 15 15 925040 923232 C 2011-02-03 1996-07-31 Tail-anchored ER membrane protein of unknown function; substrate of the phosphatase calcineurin; interacts with homolog Frt2p; promotes cell growth in stress conditions, possibly via a role in posttranslational translocation; FRT1 has a paralog, FRT2, that arose from the whole genome duplication +S000037039 CDS YOR324C 15 925040 923232 C 2011-02-03 1996-07-31 +S000005853 ORF Verified YOR326W MYO2 myosin 2|CDC66 chromosome 15 L000001223 15 925721 930445 W 174 2011-02-03 1996-07-31 Type V myosin motor involved in actin-based transport of cargos; required for the polarized delivery of secretory vesicles, the vacuole, late Golgi elements, peroxisomes, and the mitotic spindle; MYO2 has a paralog, MYO4, that arose from the whole genome duplication +S000029839 CDS YOR326W 15 925721 930445 W 2011-02-03 1996-07-31 +S000005854 ORF Verified YOR327C SNC2 SNAP receptor SNC2 chromosome 15 L000001943 15 931081 930734 C 2011-02-03 1996-07-31 Vesicle membrane receptor protein (v-SNARE); involved in the fusion between Golgi-derived secretory vesicles with the plasma membrane; Snc2p levels regulated by Vps45p; member of the synaptobrevin/VAMP family of R-type v-SNARE proteins; SNC2 has a paralog, SNC1, that arose from the whole genome duplication +S000029884 CDS YOR327C 15 931081 930734 C 2011-02-03 1996-07-31 +S000005855 ORF Verified YOR328W PDR10 ATP-binding cassette multidrug transporter PDR10 chromosome 15 L000002865 15 931803 936497 W 2011-02-03 1996-07-31 ATP-binding cassette (ABC) transporter; multidrug transporter involved in the pleiotropic drug resistance network; regulated by Pdr1p and Pdr3p +S000030958 CDS YOR328W 15 931803 936497 W 2011-02-03 1996-07-31 +S000028585 ORF Dubious YOR329W-A chromosome 15 15 939348 939557 W 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR +S000031335 CDS YOR329W-A 15 939348 939557 W 2011-02-03 2003-07-29 +S000005856 ORF Verified YOR329C SCD5 SCD7|FTB1 chromosome 15 L000001805|S000029433|L000001807 15 939349 936731 C 2011-02-03 1996-07-31 Protein required for normal actin organization and endocytosis; targeting subunit for protein phosphatase type 1; undergoes Crm1p-dependent nuclear-cytoplasmic shuttling; multicopy suppressor of clathrin deficiency +S000030995 CDS YOR329C 15 939349 936731 C 2011-02-03 1996-07-31 +S000005857 ORF Verified YOR330C MIP1 DNA-directed DNA polymerase gamma MIP1 chromosome 15 L000001113 15 943385 939621 C 181 2011-02-03 1996-07-31|2005-11-30 Mitochondrial DNA polymerase gamma; single subunit of mitochondrial DNA polymerase in yeast, in contrast to metazoan complex of catalytic and accessory subunits; polymorphic in yeast, petites occur more frequently in some lab strains; human ortholog POLG complements yeast mip1 mutant; mutations in human POLG associated with Alpers-Huttenlocher syndrome (AHS), progressive external ophthalmoplegia (PEO), parkinsonism, other mitochondrial diseases +S000031997 CDS YOR330C 15 943385 939621 C 2011-02-03 1996-07-31|2005-11-30 +S000005859 ORF Verified YOR332W VMA4 H(+)-transporting V1 sector ATPase subunit E chromosome 15 L000002459 15 943656 944357 W 2011-02-03 1996-07-31 Subunit E of the V1 domain of the vacuolar H+-ATPase (V-ATPase); V-ATPase is an electrogenic proton pump found throughout the endomembrane system; V1 domain has eight subunits; required for the V1 domain to assemble onto the vacuolar membrane; protein abundance increases in response to DNA replication stress +S000032201 CDS YOR332W 15 943656 944357 W 2011-02-03 1996-07-31 +S000005858 ORF Dubious YOR331C chromosome 15 15 944122 943565 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps the verified gene VMA4/YOR332W +S000032076 CDS YOR331C 15 944122 943565 C 2011-02-03 1996-07-31 +S000005861 ORF Verified YOR334W MRS2 chromosome 15 L000001178 15 944596 946008 W 2011-02-03 1996-07-31 Mitochondrial inner membrane Mg(2+) channel; required for maintenance of intramitochondrial Mg(2+) concentrations at the correct level to support splicing of group II introns; similar to bacterial CorA +S000033146 CDS YOR334W 15 944596 946008 W 2011-02-03 1996-07-31 +S000005860 ORF Dubious YOR333C SWF5 chromosome 15 15 944957 944541 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps 5' end of MRS2 gene required for respiratory growth +S000032222 CDS YOR333C 15 944957 944541 C 2011-02-03 1996-07-31 +S000028717 ORF Dubious YOR335W-A chromosome 15 15 946568 946648 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene ALA1/YOR335C +S000032688 CDS YOR335W-A 15 946568 946648 W 2011-02-03 2003-07-29 +S000005862 ORF Verified YOR335C ALA1 alanine--tRNA ligase|CDC64 chromosome 15 L000000286|L000002757 15 949109 946233 C 188 2011-02-03 1996-07-31 Cytoplasmic and mitochondrial alanyl-tRNA synthetase; required for protein synthesis; point mutation (cdc64-1 allele) causes cell cycle arrest at G1; lethality of null mutation is functionally complemented by human homolog AARS; mutations in human homolog AARS are associated with autoimmune disease polymyositis/dermatomyositis +S000033157 CDS YOR335C 15 949109 946233 C 2011-02-03 1996-07-31 +S000005863 ORF Verified YOR336W KRE5 chromosome 15 L000000914 15 949773 953870 W 2011-02-03 1996-07-31 Protein required for beta-1,6 glucan biosynthesis; mutations result in aberrant morphology and severe growth defects +S000033259 CDS YOR336W 15 949773 953870 W 2011-02-03 1996-07-31 +S000005864 ORF Verified YOR337W TEA1 chromosome 15 L000003020 15 954344 956623 W 193 2011-02-03 1996-07-31 Ty1 enhancer activator involved in Ty enhancer-mediated transcription; required for full levels of Ty enhancer-mediated transcription; C6 zinc cluster DNA-binding protein +S000033317 CDS YOR337W 15 954344 956623 W 2011-02-03 1996-07-31 +S000005865 ORF Uncharacterized YOR338W chromosome 15 15 956898 957989 W 2011-02-03 1996-07-31 Putative protein of unknown function; YOR338W transcription is regulated by Azf1p and its transcript is a specific target of the G protein effector Scp160p; identified as being required for sporulation in a high-throughput mutant screen; YOR338W has a paralog, FUN19, that arose from the whole genome duplication +S000034225 CDS YOR338W 15 956898 957989 W 2011-02-03 1996-07-31 +S000005866 ORF Verified YOR339C UBC11 putative E2 ubiquitin-protein ligase UBC11 chromosome 15 L000004673 15 958832 958362 C 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme; most similar in sequence to Xenopus ubiquitin-conjugating enzyme E2-C, but not a true functional homolog of this E2; unlike E2-C, not required for the degradation of mitotic cyclin Clb2 +S000034261 CDS YOR339C 15 958832 958362 C 2011-02-03 1996-07-31 +S000005867 ORF Verified YOR340C RPA43 DNA-directed RNA polymerase I subunit RPA43|A43 chromosome 15 L000003029 15 960182 959202 C 2011-02-03 1996-07-31 RNA polymerase I subunit A43 +S000035445 CDS YOR340C 15 960182 959202 C 2011-02-03 1996-07-31 +S000005868 ORF Verified YOR341W RPA190 DNA-directed RNA polymerase I core subunit RPA190|A190|RRN1 chromosome 15 L000001675 15 960987 965981 W 192 2011-02-03 1996-07-31 RNA polymerase I largest subunit A190 +S000036421 CDS YOR341W 15 960987 965981 W 2011-02-03 1996-07-31 +S000005869 ORF Verified YOR342C chromosome 15 15 967625 966666 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; relocalizes from nucleus to cytoplasm upon DNA replication stress; YOR342C has a paralog, YAL037W, that arose from the whole genome duplication +S000036448 CDS YOR342C 15 967625 966666 C 2011-02-03 1996-07-31 +S000005870 ORF Dubious YOR343C chromosome 15 15 968474 968148 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036546 CDS YOR343C 15 968474 968148 C 2011-02-03 1996-07-31 +S000007179 long_terminal_repeat YORWsigma4 chromosome 15 15 968991 969301 W 2011-02-03 2000-05-19 Ty3 LTR +S000007175 long_terminal_repeat YORWdelta22 chromosome 15 15 969293 969431 W 2011-02-03 2000-05-19 Ty1 LTR +S000007176 long_terminal_repeat YORWdelta23 chromosome 15 15 970286 970617 W 2011-02-03 2000-05-19 Ty2 LTR +S000007183 LTR_retrotransposon YORWTy2-2 Ty2 chromosome 15 15 970286 976244 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007355 transposable_element_gene YOR343W-A gag protein|YOR343C-A chromosome 15 15 970578 971894 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000036395 CDS YOR343W-A 15 970578 971894 W 2011-02-03 1999-07-17 +S000007356 transposable_element_gene YOR343W-B gag-pol fusion protein|YOR343C-B chromosome 15 15 970578 975891 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000036396 CDS YOR343W-B 15 970578 971871 W 2011-02-03 1999-07-17 +S000036397 CDS YOR343W-B 15 971873 975891 W 2011-02-03 1999-07-17 +S000036398 plus_1_translational_frameshift YOR343W-B 15 971872 971872 W 2011-02-03 1999-07-17 +S000007177 long_terminal_repeat YORWdelta24 chromosome 15 15 975913 976244 W 2011-02-03 2000-05-19 Ty2 LTR +S000006666 tRNA_gene tM(CAU)O2 EMT2 chromosome 15 L000000552|L000003712 15 976421 976493 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis +S000032168 noncoding_exon tM(CAU)O2 15 976421 976493 W 2011-02-03 2000-05-19 +S000005871 ORF Verified YOR344C TYE7 SGC1 chromosome 15 L000002401 15 978069 977194 C 199 2011-02-03 1996-07-31 Serine-rich protein that contains a bHLH DNA binding motif; binds E-boxes of glycolytic genes and contributes to their activation; may function as a transcriptional activator in Ty1-mediated gene expression; bHLH stands for basic-helix-loop-helix +S000036612 CDS YOR344C 15 978069 977194 C 2011-02-03 1996-07-31 +S000007167 long_terminal_repeat YORCdelta25 chromosome 15 15 980590 980259 C 2011-02-03 2000-05-19 Ty1 LTR +S000006689 tRNA_gene tP(UGG)O3 chromosome 15 L000003713 15 980683 980787 W 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin +S000031061 intron tP(UGG)O3 15 980719 980751 W 2011-02-03 2000-05-19 +S000031059 noncoding_exon tP(UGG)O3 15 980683 980718 W 2011-02-03 2000-05-19 +S000031060 noncoding_exon tP(UGG)O3 15 980752 980787 W 2011-02-03 2000-05-19 +S000118496 ARS ARS1529 ARSXV-982 chromosome 15 15 981462 981697 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000005873 ORF Verified YOR346W REV1 deoxycytidyl transferase chromosome 15 L000001615 15 981828 984785 W 2011-02-03 1996-07-31 Deoxycytidyl transferase; involved in repair of abasic sites and adducted guanines in damaged DNA by translesion synthesis (TLS); forms a complex with the subunits of DNA polymerase zeta, Rev3p and Rev7p; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000037530 CDS YOR346W 15 981828 984785 W 2011-02-03 1996-07-31 +S000005872 ORF Dubious YOR345C chromosome 15 15 982162 981812 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene REV1; null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2 +S000037325 CDS YOR345C 15 982162 981812 C 2011-02-03 1996-07-31 +S000005874 ORF Verified YOR347C PYK2 pyruvate kinase PYK2 chromosome 15 L000004122 15 986462 984942 C 2011-02-03 1996-07-31 Pyruvate kinase; appears to be modulated by phosphorylation; transcription repressed by glucose, and Pyk2p may be active under low glycolytic flux; PYK2 has a paralog, CDC19, that arose from the whole genome duplication +S000037542 CDS YOR347C 15 986462 984942 C 2011-02-03 1996-07-31 +S000005875 ORF Verified YOR348C PUT4 proline permease PUT4 chromosome 15 L000001538 15 988782 986899 C 2011-02-03 1996-07-31 Proline permease; required for high-affinity transport of proline; also transports the toxic proline analog azetidine-2-carboxylate (AzC); PUT4 transcription is repressed in ammonia-grown cells +S000030314 CDS YOR348C 15 988782 986899 C 2011-02-03 1996-07-31 +S000005876 ORF Verified YOR349W CIN1 chromosome 15 L000000336 15 989789 992833 W 215 2011-02-03 1996-07-31 Tubulin folding factor D involved in beta-tubulin (Tub2p) folding; isolated as mutant with increased chromosome loss and sensitivity to benomyl +S000030549 CDS YOR349W 15 989789 992833 W 2011-02-03 1996-07-31 +S000005877 ORF Verified YOR350C MNE1 chromosome 15 L000003295 15 994855 992864 C 2011-02-03 1996-07-31 Protein involved in splicing Group I aI5-beta intron from COX1 mRNA; mitochondrial matrix protein +S000030755 CDS YOR350C 15 994855 992864 C 2011-02-03 1996-07-31 +S000005878 ORF Verified YOR351C MEK1 serine/threonine protein kinase MEK1|MRE4 chromosome 15 L000001062|L000001148 15 996511 995018 C 175 2011-02-03 1996-07-31 Meiosis-specific serine/threonine protein kinase; functions in meiotic checkpoint, promotes recombination between homologous chromosomes by suppressing double strand break repair between sister chromatids; stabilizes Hop1-Thr318 phosphorylation to promote interhomolog recombination and checkpoint responses during meiosis +S000031597 CDS YOR351C 15 996511 995018 C 2011-02-03 1996-07-31 +S000005879 ORF Verified YOR352W TFB6 TFIIH complex subunit TFB6 chromosome 15 15 997213 998244 W 2011-02-03 1996-07-31 Subunit of TFIIH complex; facilities dissociation of the Ssl2p helices from TFIIH; expression levels regulated by Arg5,6p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus +S000031766 CDS YOR352W 15 997213 998244 W 2011-02-03 1996-07-31 +S000005880 ORF Verified YOR353C SOG2 chromosome 15 15 1000828 998453 C 2011-02-03 1996-07-31 Key component of the RAM signaling network; required for proper cell morphogenesis and cell separation after mitosis +S000031817 CDS YOR353C 15 1000828 998453 C 2011-02-03 1996-07-31 +S000005881 ORF Verified YOR354C MSC6 chromosome 15 15 1003225 1001147 C 2011-02-03 1996-07-31 Multicopy suppressor of HER2 involved in mitochondrial translation; mutant is defective in directing meiotic recombination events to homologous chromatids +S000031931 CDS YOR354C 15 1003225 1001147 C 2011-02-03 1996-07-31 +S000005882 ORF Verified YOR355W GDS1 chromosome 15 L000002580 15 1005137 1006705 W 2011-02-03 1996-07-31 Protein of unknown function; required for growth on glycerol as a carbon source; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032902 CDS YOR355W 15 1005137 1006705 W 2011-02-03 1996-07-31 +S000005883 ORF Verified YOR356W CIR2 putative electron-transferring-flavoprotein dehydrogenase chromosome 15 15 1007221 1009116 W 2011-02-03 1996-07-31 Putative ortholog of human ETF-dH; found in a large supramolecular complex with other mitochondrial dehydrogenases; may have a role in oxidative stress response; ETF-dH is also known as electron transfer flavoprotein dehydrogenase +S000032990 CDS YOR356W 15 1007221 1009116 W 2011-02-03 1996-07-31 +S000005884 ORF Verified YOR357C SNX3 GRD19 chromosome 15 L000002931 15 1009712 1009224 C 2011-02-03 1996-07-31 Sorting nexin for late-Golgi enzymes; required to maintain late-Golgi resident enzymes in their proper location by recycling molecules from the prevacuolar compartment; contains a PX domain and sequence similarity to human Snx3p +S000033017 CDS YOR357C 15 1009712 1009224 C 2011-02-03 1996-07-31 +S000005885 ORF Verified YOR358W HAP5 chromosome 15 L000003021 15 1010161 1010889 W 2011-02-03 1996-07-31 Subunit of the Hap2p/3p/4p/5p CCAAT-binding complex; complex is heme-activated and glucose repressed; complex is a transcriptional activator and global regulator of respiratory gene expression; required for assembly and DNA binding activity of the complex +S000033859 CDS YOR358W 15 1010161 1010889 W 2011-02-03 1996-07-31 +S000005886 ORF Verified YOR359W VTS1 chromosome 15 15 1011189 1012760 W 2011-02-03 1996-07-31 Flap-structured DNA-binding and RNA-binding protein; stimulates deadenylation-dependent mRNA degradation mediated by the CCR4-NOT deadenylase complex; member of the Smaug (Smg) family of post-transcriptional regulators which bind RNA through a conserved sterile alpha motif (SAM) domain that interacts with Smg recognition element (SREs) containing transcripts; stimulates Dna2p endonuclease activity +S000033994 CDS YOR359W 15 1011189 1012760 W 2011-02-03 1996-07-31 +S000005887 ORF Verified YOR360C PDE2 3',5'-cyclic-nucleotide phosphodiesterase PDE2|SRA5 chromosome 15 L000002046 15 1014821 1013241 C 220 2011-02-03 1996-07-31 High-affinity cyclic AMP phosphodiesterase; component of the cAMP-dependent protein kinase signaling system, protects the cell from extracellular cAMP, contains readthrough motif surrounding termination codon +S000036087 CDS YOR360C 15 1014821 1013241 C 2011-02-03 1996-07-31 +S000005888 ORF Verified YOR361C PRT1 translation initiation factor eIF3 core subunit b|DNA26|CDC63 chromosome 15 L000001515 15 1017652 1015361 C 221 2011-02-03 1996-07-31 eIF3b subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; essential for translation; part of a subcomplex (Prt1p-Rpg1p-Nip1p) that stimulates binding of mRNA and tRNA(i)Met to ribosomes; eIF3 is also involved in programmed stop codon readthrough +S000036186 CDS YOR361C 15 1017652 1015361 C 2011-02-03 1996-07-31 +S000005889 ORF Verified YOR362C PRE10 proteasome core particle subunit alpha 7 chromosome 15 L000003146 15 1018746 1017880 C 2011-02-03 1996-07-31 Alpha 7 subunit of the 20S proteasome; protein abundance increases in response to DNA replication stress +S000036287 CDS YOR362C 15 1018746 1017880 C 2011-02-03 1996-07-31 +S000005890 ORF Verified YOR363C PIP2 oleate-activated transcription factor PIP2|OAF2 chromosome 15 L000003144 15 1023212 1020222 C 2011-02-03 1996-07-31 Autoregulatory, oleate-activated transcription factor; subunit of a heterodimeric complex with Oaf1p, which binds to oleate-response elements (ORE) in the promoter of genes involved in beta-oxidation of fatty acids, peroxisome organization and biogenesis, activating transcription in the presence of oleate; PIP2 has a paralog, OAF1, that arose from the whole genome duplication +S000036382 CDS YOR363C 15 1023212 1020222 C 2011-02-03 1996-07-31 +S000005891 ORF Dubious YOR364W chromosome 15 15 1023371 1023739 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR365C +S000037077 CDS YOR364W 15 1023371 1023739 W 2011-02-03 1996-07-31 +S000005893 ORF Dubious YOR366W chromosome 15 15 1025256 1025609 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR365C +S000037303 CDS YOR366W 15 1025256 1025609 W 2011-02-03 1996-07-31 +S000005892 ORF Uncharacterized YOR365C putative flavin adenine dinucleotide transporter chromosome 15 15 1025572 1023461 C 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential protein; YOR365C has a paralog, FLC2, that arose from the whole genome duplication +S000037119 CDS YOR365C 15 1025572 1023461 C 2011-02-03 1996-07-31 +S000005894 ORF Verified YOR367W SCP1 chromosome 15 L000004232 15 1026007 1026609 W 2011-02-03 1996-07-31 Component of yeast cortical actin cytoskeleton; binds and cross links actin filaments; originally identified by its homology to calponin (contains a calponin-like repeat) but the Scp1p domain structure is more similar to transgelin +S000029952 CDS YOR367W 15 1026007 1026609 W 2011-02-03 1996-07-31 +S000005895 ORF Verified YOR368W RAD17 chromosome 15 L000001566 15 1026843 1028048 W 214 2011-02-03 1996-07-31 Checkpoint protein; involved in the activation of the DNA damage and meiotic pachytene checkpoints; with Mec3p and Ddc1p, forms a clamp that is loaded onto partial duplex DNA; homolog of human and S. pombe Rad1 and U. maydis Rec1 proteins +S000030058 CDS YOR368W 15 1026843 1028048 W 2011-02-03 1996-07-31 +S000005896 ORF Verified YOR369C RPS12 eS12|ribosomal 40S subunit protein S12|S12e|S12 chromosome 15 L000002785 15 1028625 1028194 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S12, no bacterial homolog +S000030088 CDS YOR369C 15 1028625 1028194 C 2011-02-03 1996-07-31 +S000005897 ORF Verified YOR370C MRS6 GTPase-activating protein MRS6|MSI4 chromosome 15 L000001182|L000001194 15 1030994 1029183 C 2011-02-03 1996-07-31 Rab escort protein; forms a complex with the Ras-like small GTPase Ypt1p that is required for the prenylation of Ypt1p by protein geranylgeranyltransferase type II (Bet2p-Bet4p); sequence similarity to mammalian choroideraemia gene; relative distribution to the nucleus increases upon DNA replication stress +S000031162 CDS YOR370C 15 1030994 1029183 C 2011-02-03 1996-07-31 +S000005898 ORF Verified YOR371C GPB1 KRH2 chromosome 15 15 1034182 1031489 C 2011-02-03 1996-07-31 Multistep regulator of cAMP-PKA signaling; inhibits PKA downstream of Gpa2p and Cyr1p, thereby increasing cAMP dependency; promotes ubiquitin-dependent proteolysis of Ira2p; regulated by G-alpha protein Gpa2p; GPB1 has a paralog, GPB2, that arose from the whole genome duplication +S000031222 CDS YOR371C 15 1034182 1031489 C 2011-02-03 1996-07-31 +S000005899 ORF Verified YOR372C NDD1 chromosome 15 15 1036471 1034807 C 2011-02-03 1996-07-31 Transcriptional activator essential for nuclear division; localized to the nucleus; essential component of the mechanism that activates the expression of a set of late-S-phase-specific genes; turnover is tightly regulated during cell cycle and in response to DNA damage +S000032194 CDS YOR372C 15 1036471 1034807 C 2011-02-03 1996-07-31 +S000005900 ORF Verified YOR373W NUD1 chromosome 15 L000002752 15 1036834 1039389 W 2011-02-03 1996-07-31 Component of the spindle pole body outer plaque; acts through the mitotic exit network to specify asymmetric spindle pole body inheritance +S000032346 CDS YOR373W 15 1036834 1039389 W 2011-02-03 1996-07-31 +S000005901 ORF Verified YOR374W ALD4 aldehyde dehydrogenase (NADP(+)) ALD4|ALDH2|ALD7 chromosome 15 L000004220 15 1039840 1041399 W 2011-02-03 1996-07-31 Mitochondrial aldehyde dehydrogenase; required for growth on ethanol and conversion of acetaldehyde to acetate; phosphorylated; activity is K+ dependent; utilizes NADP+ or NAD+ equally as coenzymes; expression is glucose repressed; can substitute for cytosolic NADP-dependent aldehyde dehydrogenase when directed to the cytosol; human homolog ALDH2 can complement yeast ald4 mutant +S000033216 CDS YOR374W 15 1039840 1041399 W 2011-02-03 1996-07-31 +S000005902 ORF Verified YOR375C GDH1 glutamate dehydrogenase (NADP(+)) GDH1|DHE4|GDHA|GDH-A|URE1 chromosome 15 L000000696 15 1043042 1041678 C 2011-02-03 1996-07-31 NADP(+)-dependent glutamate dehydrogenase; synthesizes glutamate from ammonia and alpha-ketoglutarate; rate of alpha-ketoglutarate utilization differs from Gdh3p; expression regulated by nitrogen and carbon sources; GDH1 has a paralog, GDH3, that arose from the whole genome duplication +S000033231 CDS YOR375C 15 1043042 1041678 C 2011-02-03 1996-07-31 +S000005903 ORF Uncharacterized YOR376W chromosome 15 15 1043191 1043559 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YOR376W is not an essential gene +S000033346 CDS YOR376W 15 1043191 1043559 W 2011-02-03 1996-07-31 +S000028586 ORF Uncharacterized YOR376W-A chromosome 15 15 1045196 1045351 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031336 CDS YOR376W-A 15 1045196 1045351 W 2011-02-03 2003-07-29 +S000005904 ORF Verified YOR377W ATF1 alcohol O-acetyltransferase chromosome 15 L000000138 15 1046226 1047803 W 2011-02-03 1996-07-31 Alcohol acetyltransferase; responsible for the major part of volatile acetate ester production during fermentation; main enzyme involved in terpenyl acetate synthesis; potential roles in lipid and sterol metabolism +S000033432 CDS YOR377W 15 1046226 1047803 W 2011-02-03 1996-07-31 +S000005905 ORF Verified YOR378W AMF1 chromosome 15 15 1049511 1051058 W 2011-02-03 1996-07-31 Low affinity NH4+ transporter; member of the DHA2 family of drug:H+ anti porters; putative paralog of ATR1; but not required for boron tolerance; non-essential gene +S000034342 CDS YOR378W 15 1049511 1051058 W 2011-02-03 1996-07-31 +S000005906 ORF Dubious YOR379C chromosome 15 15 1051064 1050726 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YOR378W +S000034365 CDS YOR379C 15 1051064 1050726 C 2011-02-03 1996-07-31 +S000005907 ORF Verified YOR380W RDR1 chromosome 15 15 1051290 1052930 W 2011-02-03 1996-07-31 Transcriptional repressor involved in regulating multidrug resistance; negatively regulates expression of the PDR5 gene; member of the Gal4p family of zinc cluster proteins +S000035338 CDS YOR380W 15 1051290 1052930 W 2011-02-03 1996-07-31 +S000005908 ORF Verified YOR381W FRE3 ferric-chelate reductase chromosome 15 L000003555 15 1055545 1057680 W 2011-02-03 1996-07-31 Ferric reductase; reduces siderophore-bound iron prior to uptake by transporters; expression induced by low iron levels +S000035406 CDS YOR381W 15 1055545 1057680 W 2011-02-03 1996-07-31 +S000028587 ORF Uncharacterized YOR381W-A chromosome 15 15 1058423 1058590 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031338 CDS YOR381W-A 15 1058423 1058590 W 2011-02-03 2003-07-29 +S000005909 ORF Verified YOR382W FIT2 chromosome 15 15 1059531 1059992 W 2011-02-03 1996-07-31 Mannoprotein that is incorporated into the cell wall; incorporated via a glycosylphosphatidylinositol (GPI) anchor; involved in the retention of siderophore-iron in the cell wall +S000035468 CDS YOR382W 15 1059531 1059992 W 2011-02-03 1996-07-31 +S000005910 ORF Verified YOR383C FIT3 chromosome 15 15 1061055 1060441 C 2011-02-03 1996-07-31 Mannoprotein that is incorporated into the cell wall; incorporated via a glycosylphosphatidylinositol (GPI) anchor; involved in the retention of siderophore-iron in the cell wall +S000035495 CDS YOR383C 15 1061055 1060441 C 2011-02-03 1996-07-31 +S000005911 ORF Verified YOR384W FRE5 putative ferric-chelate reductase chromosome 15 L000003557 15 1061564 1063648 W 2011-02-03 1996-07-31 Putative ferric reductase with similarity to Fre2p; expression induced by low iron levels; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000035594 CDS YOR384W 15 1061564 1063648 W 2011-02-03 1996-07-31 +S000005912 ORF Uncharacterized YOR385W chromosome 15 15 1065043 1065915 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YOR385W is not an essential gene +S000036492 CDS YOR385W 15 1065043 1065915 W 2011-02-03 1996-07-31 +S000005913 ORF Verified YOR386W PHR1 deoxyribodipyrimidine photo-lyase PHR1 chromosome 15 L000001432 15 1066839 1068536 W 205 2011-02-03 1996-07-31 DNA photolyase involved in photoreactivation; repairs pyrimidine dimers in the presence of visible light; induced by DNA damage; regulated by transcriptional repressor Rph1p +S000036613 CDS YOR386W 15 1066839 1068536 W 2011-02-03 1996-07-31 +S000005914 ORF Uncharacterized YOR387C chromosome 15 15 1070241 1069621 C 2011-02-03 1996-07-31 Putative protein of unknown function; regulated by the metal-responsive Aft1p transcription factor; highly inducible in zinc-depleted conditions; localizes to the soluble fraction; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; YOR387C has a paralog, VEL1, that arose from a single-locus duplication +S000036646 CDS YOR387C 15 1070241 1069621 C 2011-02-03 1996-07-31 +S000005915 ORF Verified YOR388C FDH1 formate dehydrogenase (NAD+) chromosome 15 L000004078 15 1072923 1071793 C 2011-02-03 1996-07-31 NAD(+)-dependent formate dehydrogenase; may protect cells from exogenous formate +S000036744 CDS YOR388C 15 1072923 1071793 C 2011-02-03 1996-07-31 +S000005916 ORF Uncharacterized YOR389W chromosome 15 15 1074213 1076087 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression regulated by copper levels +S000037549 CDS YOR389W 15 1074213 1076087 W 2011-02-03 1996-07-31 +S000005917 ORF Verified YOR390W FEX1 fluoride transporter chromosome 15 15 1076784 1077911 W 2011-02-03 1996-07-31 Protein involved in fluoride export; nearly identical to FEX2, and deletion of both proteins results in a large increase in fluoride sensitivity compared with the single mutant; contains two FEX domains connected by a linker; part of a widespread family of conserved fluoride export proteins +S000030291 CDS YOR390W 15 1076784 1077911 W 2011-02-03 1996-07-31 +S000005918 ORF Verified YOR391C HSP33 glutathione-independent methylglyoxalase family protein chromosome 15 15 1079258 1078545 C 2011-02-03 1996-07-31 Possible chaperone and cysteine protease; required for transcriptional reprogramming during the diauxic shift and for survival in stationary phase; similar to E. coli Hsp31 and S. cerevisiae Hsp31p, Hsp32p, and Sno4p; member of the DJ-1/ThiJ/PfpI superfamily, which includes human DJ-1 involved in Parkinson's disease and cancer +S000030329 CDS YOR391C 15 1079258 1078545 C 2011-02-03 1996-07-31 +S000005919 ORF Dubious YOR392W chromosome 15 15 1079282 1079725 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; gene expression induced by heat +S000031315 CDS YOR392W 15 1079282 1079725 W 2011-02-03 1996-07-31 +S000005920 ORF Verified YOR393W ERR1 phosphopyruvate hydratase ERR1 chromosome 15 L000002735 15 1080276 1081589 W 2011-02-03 1996-07-31 Putative phosphopyruvate hydratase +S000031378 CDS YOR393W 15 1080276 1081589 W 2011-02-03 1996-07-31 +S000005921 ORF Verified YOR394W PAU21 seripauperin PAU21 chromosome 15 15 1082718 1083212 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cytosol; identical to Pau22p; encodes two proteins that are translated from 2 different start codons +S000031488 CDS YOR394W 15 1082718 1083212 W 2011-02-03 1996-07-31 +S000028997 telomere TEL15R chromosome 15 15 1083922 1091291 W 229 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome XV; composed of an X element core sequence, X element combinatorial repeats, a long Y' element, and a very short terminal stretch of telomeric repeats +S000028998 telomeric_repeat TEL15R 15 1091274 1091291 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome XV +S000028999 X_element TEL15R 15 1083922 1084367 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XV; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YOR394C-A +S000029000 X_element_combinatorial_repeat TEL15R 15 1084368 1084620 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr XV; contains repeats of the D, C, and B types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000029001 Y_prime_element TEL15R 15 1084621 1091273 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome XV; contains an ARS consensus sequence, a region of 36-bp repeats, and ORFs YOR396W and YOR396C-A +S000028718 ORF Uncharacterized YOR394C-A chromosome 15 15 1084369 1084202 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032689 CDS YOR394C-A 15 1084369 1084202 C 2011-02-03 2003-07-29 +S000007526 ORF Uncharacterized YOR396W YRF1-8 Y' element ATP-dependent helicase protein 1 copy 8 chromosome 15 15 1085473 1090863 W 2011-02-03 2000-07-14|2007-02-07 One of several telomeric Y' element-encoded DNA helicases; known as Y'-Help1 (Y'-HELicase Protein 1) +S000037061 CDS YOR396W 15 1085473 1090863 W 2011-02-03 2000-07-14|2007-02-07 +S000028719 ORF Dubious YOR396C-A chromosome 15 15 1090497 1090015 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032691 CDS YOR396C-A 15 1090497 1090015 C 2011-02-03 2003-07-29 +S000028724 ORF Dubious YPL283W-B chromosome 16 16 643 1125 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032709 CDS YPL283W-B 16 643 1125 W 2003-07-29 2003-07-29 +S000028723 ORF Dubious YPL283W-A chromosome 16 16 1426 2001 W 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032706 CDS YPL283W-A 16 1426 2001 W 2003-07-29 2003-07-29 +S000006204 ORF Verified YPL283C YRF1-7 Y' element ATP-dependent helicase protein 1 copy 7|YRF1 chromosome 16 16 6007 280 C 1996-07-31 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p +S000036889 CDS YPL283C 16 5840 280 C 1996-07-31 1996-07-31 +S000036888 CDS YPL283C 16 6007 5989 C 1996-07-31 1996-07-31 +S000036890 intron YPL283C 16 5988 5841 C 1996-07-31 1996-07-31 +S000028933 telomere TEL16L chromosome 16 16 7223 1 C -169 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome XVI; annotated components include an X element core sequence, X element combinatorial repeats, and a long Y' element; TEL16L does have telomeric repeats (TEL16L-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly +S000028934 X_element TEL16L 16 7223 6778 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome XVI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028935 X_element_combinatorial_repeat TEL16L 16 6777 6525 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr XVI; contains repeats of the D, C and B types; formerly called SubTelomeric Repeats +S000028936 Y_prime_element TEL16L 16 6524 1 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome XVI; contains an ARS consensus sequence, a region of 36-bp repeats, and ORFs YRF1-7/YPL283C, YPL283W-A, YPL283W-B +S000006203 ORF Verified YPL282C PAU22 seripauperin PAU22 chromosome 16 16 8427 7933 C 1996-07-31 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to just the vacuole; identical to Pau21p; encodes two proteins that are translated from two different start codons +S000036818 CDS YPL282C 16 8427 7933 C 1996-07-31 1996-07-31 +S000006202 ORF Verified YPL281C ERR2 phosphopyruvate hydratase ERR2 chromosome 16 L000004075 16 10870 9557 C 1996-07-31 1996-07-31 Enolase, a phosphopyruvate hydratase; catalyzes the conversion of 2-phosphoglycerate to phosphoenolpyruvate; complements the growth defect of an ENO1 ENO2 double mutant +S000035948 CDS YPL281C 16 10870 9557 C 1996-07-31 1996-07-31 +S000006201 ORF Verified YPL280W HSP32 glutathione-independent methylglyoxalase family protein chromosome 16 16 11887 12600 W 1996-07-31 1996-07-31 Possible chaperone and cysteine protease; required for transcriptional reprogramming during the diauxic shift and for survival in stationary phase; similar to E. coli Hsp31 and S. cerevisiae Hsp31p, Hsp33p, and Sno4p; member of the DJ-1/ThiJ/PfpI superfamily, which includes human DJ-1 involved in Parkinson's disease and cancer +S000035901 CDS YPL280W 16 11887 12600 W 1996-07-31 1996-07-31 +S000006200 ORF Verified YPL279C FEX2 fluoride transporter chromosome 16 16 14355 13228 C 1996-07-31 1996-07-31 Protein involved in fluoride export; nearly identical to FEX1, and deletion of both proteins results in a large increase in fluoride sensitivity compared with the single mutant; contains two FEX domains connected by a linker; part of a widespread family of conserved fluoride export proteins +S000034797 CDS YPL279C 16 14355 13228 C 1996-07-31 1996-07-31 +S000006199 ORF Uncharacterized YPL278C chromosome 16 16 15355 15053 C 1996-07-31 1996-07-31 Putative protein of unknown function; gene expression regulated by copper levels +S000034632 CDS YPL278C 16 15355 15053 C 1996-07-31 1996-07-31 +S000006198 ORF Uncharacterized YPL277C chromosome 16 16 16868 15405 C 1996-07-31 1996-07-31 Putative protein of unknown function; localized to the membranes; gene expression regulated by copper levels +S000033762 CDS YPL277C 16 16868 15405 C 1996-07-31 1996-07-31 +S000006197 pseudogene YPL276W FDH2 chromosome 16 16 17948 18385 W 1996-07-31 1996-07-31 NAD(+)-dependent formate dehydrogenase; may protect cells from exogenous formate; YPL275W and YPL276W comprise a continuous open reading frame in some S. cerevisiae strains but not in the genomic reference strain S288C +S000033699 CDS YPL276W 16 17948 18385 W 1996-07-31 1996-07-31 +S000006196 pseudogene YPL275W FDH2 chromosome 16 16 18369 19079 W 1996-07-31 1996-07-31 NAD(+)-dependent formate dehydrogenase; may protect cells from exogenous formate; YPL275W and YPL276W comprise a continuous open reading frame in some S. cerevisiae strains but not in the genomic reference strain S288C +S000033615 CDS YPL275W 16 18369 19079 W 1996-07-31 1996-07-31 +S000130195 ARS ARS1603 chromosome 16 16 18370 19069 2009-05-08 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006195 ORF Verified YPL274W SAM3 bifunctional polyamine/amino acid permease SAM3 chromosome 16 L000004875 16 22938 24701 W 1996-07-31 1996-07-31 High-affinity S-adenosylmethionine permease; required for utilization of S-adenosylmethionine as a sulfur source; has similarity to S-methylmethionine permease Mmp1p +S000033506 CDS YPL274W 16 22938 24701 W 1996-07-31 1996-07-31 +S000006194 ORF Verified YPL273W SAM4 S-adenosylmethionine-homocysteine S-methyltransferase SAM4 chromosome 16 16 25087 26064 W 1996-07-31 1996-07-31 S-adenosylmethionine-homocysteine methyltransferase; functions along with Mht1p in the conversion of S-adenosylmethionine (AdoMet) to methionine to control the methionine/AdoMet ratio; SAM4 has a paralog, YMR321C, that arose from a single-locus duplication +S000032785 CDS YPL273W 16 25087 26064 W 1996-07-31 1996-07-31 +S000006193 ORF Uncharacterized YPL272C PBI1 chromosome 16 16 28164 26611 C 1996-07-31 1996-07-31 Putative protein of unknown function; gene expression induced in response to ketoconazole; YPL272C is not an essential gene +S000032642 CDS YPL272C 16 28164 26611 C 1996-07-31 1996-07-31 +S000006192 ORF Verified YPL271W ATP15 F1F0 ATP synthase subunit epsilon|ATPEPSILON chromosome 16 L000000151|L000000152 16 30079 30267 W 1996-07-31 1996-07-31 Epsilon subunit of the F1 sector of mitochondrial F1F0 ATP synthase; which is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated +S000032564 CDS YPL271W 16 30079 30267 W 1996-07-31 1996-07-31 +S000006191 ORF Verified YPL270W MDL2 ATP-binding cassette permease MDL2 chromosome 16 L000001050 16 30482 32803 W 2003-09-22 2003-09-22|1996-07-31 Mitochondrial inner membrane half-type ABC transporter; required for respiratory growth at high temperature; localizes to vacuole membrane in response to H2O2; similar to human TAP1 and TAP2 implicated in bare lymphocyte syndrome and Wegener-like granulomatosis +S000031583 CDS YPL270W 16 30482 32803 W 2003-09-22 2003-09-22|1996-07-31 +S000006190 ORF Verified YPL269W KAR9 chromosome 16 L000002932 16 33013 34947 W 1996-07-31 1996-07-31 Spindle positioning factor; orients astral microtubules, connecting them to actin cables at the cortex with Bim1p and Myo2, resulting in proper spindle positioning; targeted for StuBL-dependent degradation at kinetochores by Slx5p-Slx8p, ensuring chromosome transmission fidelity and correct spindle positioning; role in karyogamy; localizes to the shmoo tip, the growing bud-tip, the nucleus, the kinetochore, the spindle and microtubules; homolog of adenomatous polyposis coli +S000031613 CDS YPL269W 16 33013 34947 W 1996-07-31 1996-07-31 +S000006189 ORF Verified YPL268W PLC1 phosphatidylinositol phospholipase C chromosome 16 L000001448 16 35236 37845 W -167.2 1996-07-31 1996-07-31 Phospholipase C; hydrolyzes phosphatidylinositol 4,5-biphosphate (PIP2) to generate the signaling molecules inositol 1,4,5-triphosphate (IP3) and 1,2-diacylglycerol (DAG); involved in regulating many cellular processes; Plc1p and inositol polyphosphates are required for acetyl-CoA homeostasis which regulates global histone acetylation +S000031510 CDS YPL268W 16 35236 37845 W 1996-07-31 1996-07-31 +S000006188 ORF Verified YPL267W ACM1 chromosome 16 16 38169 38798 W 1996-07-31 1996-07-31 Pseudosubstrate inhibitor of the APC/C; suppresses APC/C [Cdh1]-mediated proteolysis of mitotic cyclins; associates with Cdh1p, Bmh1p and Bmh2p; cell cycle regulated protein; the anaphase-promoting complex/cyclosome is also known as APC/C +S000030663 CDS YPL267W 16 38169 38798 W 1996-07-31 1996-07-31 +S000006187 ORF Verified YPL266W DIM1 putative dimethyladenosine transferase|CDH1 chromosome 16 L000002579 16 39121 40077 W 1996-07-31 1996-07-31 Essential 18S rRNA dimethylase (dimethyladenosine transferase); responsible for conserved m6(2)Am6(2)A dimethylation in 3'-terminal loop of 18S rRNA, part of 90S and 40S pre-particles in nucleolus, involved in pre-ribosomal RNA processing; human homolog DIMT1 complements yeast dim1 mutant +S000030548 CDS YPL266W 16 39121 40077 W 1996-07-31 1996-07-31 +S000006186 ORF Verified YPL265W DIP5 chromosome 16 L000003178 16 41043 42869 W 1996-07-31 1996-07-31 Dicarboxylic amino acid permease; mediates high-affinity and high-capacity transport of L-glutamate and L-aspartate; also a transporter for Gln, Asn, Ser, Ala, and Gly; relocalizes from plasma membrane to vacuole upon DNA replication stress +S000030403 CDS YPL265W 16 41043 42869 W 1996-07-31 1996-07-31 +S000118411 ARS ARS1604 ARSXVI-43 chromosome 16 16 42977 43212 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178190 ARS_consensus_sequence ARS1604 16 43163 43147 C 2014-11-18 2014-11-18 +S000006185 ORF Uncharacterized YPL264C chromosome 16 16 44344 43283 C 1996-07-31 1996-07-31 Putative membrane protein of unknown function; physically interacts with Hsp82p; YPL264C is not an essential gene +S000037545 CDS YPL264C 16 44344 43283 C 1996-07-31 1996-07-31 +S000006184 ORF Verified YPL263C KEL3 chromosome 16 16 46506 44551 C 1996-07-31 1996-07-31 Cytoplasmic protein of unknown function +S000037435 CDS YPL263C 16 46506 44551 C 1996-07-31 1996-07-31 +S000006183 ORF Verified YPL262W FUM1 fumarase FUM1 chromosome 16 L000000632 16 47336 48802 W 1996-07-31 1996-07-31 Fumarase; converts fumaric acid to L-malic acid in the TCA cycle; cytosolic and mitochondrial distribution determined by the N-terminal targeting sequence, protein conformation, and status of glyoxylate shunt; phosphorylated in mitochondria +S000037382 CDS YPL262W 16 47336 48802 W 1996-07-31 1996-07-31 +S000006181 ORF Verified YPL260W CUB1 chromosome 16 16 49303 50958 W 1996-07-31 1996-07-31 Conserved fungal gene linked to DNA repair and proteasome function; putative substrate of cAMP-dependent protein kinase (PKA); green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YPL260W is not an essential gene; protein abundance increases in response to DNA replication stress +S000036555 CDS YPL260W 16 49303 50958 W 1996-07-31 1996-07-31 +S000006182 ORF Uncharacterized YPL261C chromosome 16 16 49304 48996 C 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YPL261C is not an essential gene; partially overlaps verified ORF YPL260W +S000036608 CDS YPL261C 16 49304 48996 C 1996-07-31 1996-07-31 +S000006180 ORF Verified YPL259C APM1 YAP54 chromosome 16 L000002494 16 52671 51244 C 1996-07-31 1996-07-31 Mu1-like medium subunit of the AP-1 complex; binds clathrin; involved in clathrin-dependent Golgi protein sorting; the AP-1 complex is the clathrin-associated protein complex +S000036655 CDS YPL259C 16 52671 51244 C 1996-07-31 1996-07-31 +S000006179 ORF Verified YPL258C THI21 bifunctional hydroxymethylpyrimidine kinase/phosphomethylpyrimidine kinase chromosome 16 16 55153 53498 C 1996-07-31 1996-07-31 Hydroxymethylpyrimidine (HMP) and HMP-phosphate kinase; involved in thiamine biosynthesis; member of a gene family with THI20 and THI22; functionally redundant with Thi20p +S000035722 CDS YPL258C 16 55153 53498 C 1996-07-31 1996-07-31 +S000007184 long_terminal_repeat YPLCdelta1 chromosome 16 16 55858 55657 C 2000-05-19 2000-05-19 Ty1 LTR +S000006776 tRNA_gene tW(CCA)P chromosome 16 L000003737 16 56274 56169 C 2000-05-19 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis +S000034120 intron tW(CCA)P 16 56238 56205 C 2000-05-19 2000-05-19 +S000034119 noncoding_exon tW(CCA)P 16 56204 56169 C 2000-05-19 2000-05-19 +S000034118 noncoding_exon tW(CCA)P 16 56274 56239 C 2000-05-19 2000-05-19 +S000007198 long_terminal_repeat YPLWsigma1 chromosome 16 16 56290 56358 W 2000-05-19 2000-05-19 Ty3 LTR +S000007189 long_terminal_repeat YPLWdelta2 chromosome 16 16 56409 56451 W 2000-05-19 2000-05-19 Ty1 LTR +S000007190 long_terminal_repeat YPLWdelta3 chromosome 16 16 56452 56788 W 2000-05-19 2000-05-19 Ty1 LTR +S000007199 LTR_retrotransposon YPLWTy1-1 Ty1 chromosome 16 16 56452 62375 W 2000-05-19 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007357 transposable_element_gene YPL257W-A gag protein chromosome 16 16 56748 58070 W 1996-07-31 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000033164 CDS YPL257W-A 16 56748 58070 W 1996-07-31 1996-07-31 +S000007358 transposable_element_gene YPL257W-B gag-pol fusion protein chromosome 16 16 56748 62016 W 1997-07-17 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000033173 CDS YPL257W-B 16 56748 58052 W 1997-07-17 1997-07-17 +S000033174 CDS YPL257W-B 16 58054 62016 W 1997-07-17 1997-07-17 +S000033175 plus_1_translational_frameshift YPL257W-B 16 58053 58053 W 1997-07-17 1997-07-17 +S000007191 long_terminal_repeat YPLWdelta4 chromosome 16 16 62039 62375 W 2000-05-19 2000-05-19 Ty1 LTR +S000007192 long_terminal_repeat YPLWdelta5 chromosome 16 16 62389 62720 W 2000-05-19 2000-05-19 Ty2 LTR +S000007193 long_terminal_repeat YPLWdelta6 chromosome 16 16 62724 63006 W 2000-05-19 2000-05-19 Ty1 LTR +S000006178 ORF Uncharacterized YPL257W chromosome 16 16 63279 63860 W 1996-07-31 1996-07-31 Putative protein of unknown function; homozygous diploid deletion strain exhibits low budding index; physically interacts with Hsp82p; YPL257W is not an essential gene +S000035666 CDS YPL257W 16 63279 63860 W 1996-07-31 1996-07-31 +S000006177 ORF Verified YPL256C CLN2 cyclin CLN2 chromosome 16 L000000358 16 66614 64977 C 1996-07-31 1996-07-31 G1 cyclin involved in regulation of the cell cycle; activates Cdc28p kinase to promote the G1 to S phase transition; late G1 specific expression depends on transcription factor complexes, MBF (Swi6p-Mbp1p) and SBF (Swi6p-Swi4p); CLN2 has a paralog, CLN1, that arose from the whole genome duplication; cell cycle arrest phenotype of the cln1 cln2 cln3 triple null mutant is complemented by any of human cyclins CCNA2, CCNB1, CCNC, CCND1, or CCNE1 +S000035542 CDS YPL256C 16 66614 64977 C 1996-07-31 1996-07-31 +S000006176 ORF Verified YPL255W BBP1 chromosome 16 L000003060 16 67725 68882 W 1996-07-31 1996-07-31 Protein required for the spindle pole body (SPB) duplication; localizes at the cytoplasmic side of the central plaque periphery of the SPB; forms a complex with a nuclear envelope protein Mps2p and SPB components Spc29p and Kar1p; required for mitotic functions of Cdc5p +S000035492 CDS YPL255W 16 67725 68882 W 1996-07-31 1996-07-31 +S000006175 ORF Verified YPL254W HFI1 GAN1|SRM12|SUP110|ADA1 chromosome 16 L000003094 16 69485 70951 W 1996-07-31 1996-07-31 Adaptor protein required for structural integrity of the SAGA complex; a histone acetyltransferase-coactivator complex that is involved in global regulation of gene expression through acetylation and transcription functions +S000034469 CDS YPL254W 16 69485 70951 W 1996-07-31 1996-07-31 +S000006174 ORF Verified YPL253C VIK1 chromosome 16 L000004276 16 73006 71063 C 1996-07-31 1996-07-31 Protein that forms a kinesin-14 heterodimeric motor with Kar3p; localizes Kar3p at mitotic spindle poles; has a structure similar to a kinesin motor domain but lacks an ATP-binding site and is catalytically inactive; binds microtubules; required for sister chromatid cohesion; VIK1 has a paralog, CIK1, that arose from the whole genome duplication +S000034335 CDS YPL253C 16 73006 71063 C 1996-07-31 1996-07-31 +S000118412 ARS ARS1605 ARSXVI-73 chromosome 16 16 73032 73227 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000006172 ORF Dubious YPL251W chromosome 16 16 73625 73927 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps 5' end of the verified, essential gene YAH1/YPL252C +S000033368 CDS YPL251W 16 73625 73927 W 1996-07-31 1996-07-31 +S000006173 ORF Verified YPL252C YAH1 adrenodoxin chromosome 16 L000004699 16 73881 73363 C 1996-07-31 1996-07-31 Ferredoxin of the mitochondrial matrix; required for formation of cellular iron-sulfur proteins; involved in heme A biosynthesis; human homolog FDX1L can complement yeast by allowing growth during down-regulation of yeast YAH1 +S000033428 CDS YPL252C 16 73881 73363 C 1996-07-31 1996-07-31 +S000006171 ORF Verified YPL250C ATG41 ICY2 chromosome 16 S000007528 16 74719 74309 C 1996-07-31 1996-07-31 Protein of unknown function; required for selective and nonselective autophagy, and mitophagy; regulates the rate of autophagosome formation; interacts with Atg9p, and has a similar peri-mitochondrial localization; elevated Gcn4p-dependent expression under autophagy-inducing conditions; mobilized into polysomes upon a shift from a fermentable to nonfermentable carbon source; potential Cdc28p substrate; ATG41 has a paralog, ICY1, that arose from the whole genome duplication +S000033279 CDS YPL250C 16 74719 74309 C 1996-07-31 1996-07-31 +S000028589 ORF Dubious YPL250W-A chromosome 16 16 75702 75989 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified ORF RPL36B/YPL249C-A; identified by fungal homology and RT-PCR +S000031342 CDS YPL250W-A 16 75702 75989 W 2003-07-29 2003-07-29 +S000006438 ORF Verified YPL249C-A RPL36B eL36|ribosomal 60S subunit protein L36B|L36e|YL39|L39|L36B chromosome 16 L000004515 16 76239 75699 C 1999-07-17 1999-07-17 Ribosomal 60S subunit protein L36B; binds to 5.8 S rRNA; homologous to mammalian ribosomal protein L36, no bacterial homolog; RPL36B has a paralog, RPL36A, that arose from the whole genome duplication +S000032350 CDS YPL249C-A 16 75985 75699 C 1997-07-17 1997-07-17 +S000032349 CDS YPL249C-A 16 76239 76224 C 1999-07-17 1999-07-17 +S000032351 intron YPL249C-A 16 76223 75986 C 1997-07-17 1997-07-17 +S000006170 ORF Verified YPL249C GYP5 chromosome 16 16 79353 76669 C 1996-07-31 1996-07-31 GTPase-activating protein (GAP) for yeast Rab family members; involved in ER to Golgi trafficking; exhibits GAP activity toward Ypt1p that is stimulated by Gyl1p, also acts on Sec4p; interacts with Gyl1p, Rvs161p and Rvs167p; involved in recruiting Rvs167p to the bud tip during polarized growth; relocalizes from bud neck to cytoplasm upon DNA replication stress; GYP5 has a paralog, GYL1, that arose from the whole genome duplication +S000032543 CDS YPL249C 16 79353 76669 C 1996-07-31 1996-07-31 +S000006169 ORF Verified YPL248C GAL4 galactose-responsive transcription factor GAL4|GAL81 chromosome 16 L000000661 16 82356 79711 C -143 1996-07-31 1996-07-31 DNA-binding transcription factor required for activating GAL genes; responds to galactose; repressed by Gal80p and activated by Gal3p +S000032436 CDS YPL248C 16 82356 79711 C 1996-07-31 1996-07-31 +S000006168 ORF Uncharacterized YPL247C chromosome 16 16 84196 82625 C 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; similar to the petunia WD repeat protein an11; overexpression causes a cell cycle delay or arrest +S000031428 CDS YPL247C 16 84196 82625 C 1996-07-31 1996-07-31 +S000006167 ORF Verified YPL246C RBD2 putative rhomboid protease RBD2 chromosome 16 16 85297 84509 C 1996-07-31 1996-07-31 Possible rhomboid protease; has similarity to eukaryotic rhomboid proteases including Pcp1p +S000031296 CDS YPL246C 16 85297 84509 C 1996-07-31 1996-07-31 +S000006166 ORF Uncharacterized YPL245W chromosome 16 16 85586 86950 W 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the nucleus and the cytoplasm +S000031264 CDS YPL245W 16 85586 86950 W 1996-07-31 1996-07-31 +S000006165 ORF Verified YPL244C HUT1 chromosome 16 16 88033 87014 C 1996-07-31 1996-07-31 Protein with a role in UDP-galactose transport to the Golgi lumen; has similarity to human UDP-galactose transporter UGTrel1, exhibits a genetic interaction with S. cerevisiae ERO1 +S000031081 CDS YPL244C 16 88033 87014 C 1996-07-31 1996-07-31 +S000006164 ORF Verified YPL243W SRP68 signal recognition particle subunit SRP68 chromosome 16 L000002065 16 88517 90316 W 1996-07-31 1996-07-31 Core component of the signal recognition particle (SRP) complex; SRP complex functions in targeting nascent secretory proteins to the endoplasmic reticulum (ER) membrane; relocalizes from cytoplasm to the nuclear periphery upon DNA replication stress +S000030136 CDS YPL243W 16 88517 90316 W 1996-07-31 1996-07-31 +S000006163 ORF Verified YPL242C IQG1 CYK1 chromosome 16 L000004180 16 95109 90622 C 1996-07-31 1996-07-31 Essential protein required for determination of budding pattern; promotes localization of axial markers Bud4p and Cdc12p and functionally interacts with Sec3p, localizes to the contractile ring during anaphase, member of the IQGAP family; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000029942 CDS YPL242C 16 95109 90622 C 1996-07-31 1996-07-31 +S000006162 ORF Verified YPL241C CIN2 GTPase-activating protein CIN2 chromosome 16 L000000337 16 96258 95372 C -143 1996-07-31 1996-07-31 GTPase-activating protein (GAP) for Cin4p; tubulin folding factor C involved in beta-tubulin (Tub2p) folding; mutants display increased chromosome loss and benomyl sensitivity; human homolog RP2 complements yeast null mutant +S000037281 CDS YPL241C 16 96153 95372 C 1996-07-31 1996-07-31 +S000037280 CDS YPL241C 16 96258 96234 C 1996-07-31 1996-07-31 +S000037282 intron YPL241C 16 96233 96154 C 1996-07-31 1996-07-31 +S000006161 ORF Verified YPL240C HSP82 Hsp90 family chaperone HSP82|HSP90 chromosome 16 L000000822 16 98625 96496 C -137 1996-07-31 1996-07-31 Hsp90 chaperone; redundant in function with Hsc82p; required for pheromone signaling, negative regulation of Hsf1p; docks with Tom70p for mitochondrial preprotein delivery; promotes telomerase DNA binding, nucleotide addition; protein abundance increases in response to DNA replication stress; contains two acid-rich unstructured regions that promote solubility of chaperone-substrate complexes; HSP82 has a paralog, HSC82, that arose from the whole genome duplication +S000037196 CDS YPL240C 16 98625 96496 C 1996-07-31 1996-07-31 +S000006160 ORF Verified YPL239W YAR1 chromosome 16 L000002496 16 99484 100086 W 1996-07-31 1996-07-31 Ankyrin-repeat containing, nucleocytoplasmic shuttling chaperone; prevents aggregation of Rps3p in the cytoplasm, associates with nascent Rps3p during its translation in the cytoplasm and delivers it to the 90S in the nucleus; required for 40S ribosomal subunit export, biogenesis and adaptation to osmotic and oxidative stress; expression repressed by heat shock +S000036306 CDS YPL239W 16 99484 100086 W 1996-07-31 1996-07-31 +S000006158 ORF Verified YPL237W SUI3 translation initiation factor eIF2 subunit beta chromosome 16 L000002179 16 100496 101353 W 1996-07-31 1996-07-31 Beta subunit of the translation initiation factor eIF2; involved in the identification of the start codon; proposed to be involved in mRNA binding +S000035286 CDS YPL237W 16 100496 101353 W 1996-07-31 1996-07-31 +S000006159 ORF Dubious YPL238C chromosome 16 16 100863 100474 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps 5' end of the verified essential gene SUI3/YPL237W +S000036133 CDS YPL238C 16 100863 100474 C 1996-07-31 1996-07-31 +S000006157 ORF Verified YPL236C ENV7 putative serine/threonine protein kinase ENV7 chromosome 16 16 102702 101608 C 1996-07-31 1996-07-31 Vacuolar membrane protein kinase; negatively regulates membrane fusion; associates with vacuolar membrane through palmitoylation of one or more cysteines in consensus sequence; vacuolar membrane association is essential to its kinase activity; mutant shows defect in CPY processing; ortholog of human serine/threonine kinase 16 (STK16) +S000035042 CDS YPL236C 16 102702 101608 C 1996-07-31 1996-07-31 +S000006156 ORF Verified YPL235W RVB2 RuvB family ATP-dependent DNA helicase reptin|TIP48|TIH2|TIP49B chromosome 16 S000007484 16 103232 104647 W 1996-07-31 1996-07-31 ATP-dependent DNA helicase, also known as reptin; member of the AAA+ and RuvB protein families, similar to Rvb1p; conserved component of multiple complexes including the INO80 complex, the Swr1 complex, and the R2TP complex (Rvb1-Rvb2-Tah1-Pih1); involved in multiple processes such as chromatin remodeling, box C/D snoRNP assembly, and RNA polymerase II assembly +S000034953 CDS YPL235W 16 103232 104647 W 1996-07-31 1996-07-31 +S000006155 ORF Verified YPL234C VMA11 H(+)-transporting V0 sector ATPase subunit c'|TFP3|CLS9 chromosome 16 L000002290|L000002464 16 105440 104946 C 1996-07-31 1996-07-31 Vacuolar ATPase V0 domain subunit c'; involved in proton transport activity; hydrophobic integral membrane protein (proteolipid) containing four transmembrane segments; N and C termini are in the vacuolar lumen +S000033991 CDS YPL234C 16 105440 104946 C 1996-07-31 1996-07-31 +S000006154 ORF Verified YPL233W NSL1 MIND complex subunit NSL1 chromosome 16 L000004652 16 106172 106822 W 1996-07-31 1996-07-31 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; required for accurate chromosome segregation; complex consists of Mtw1p Including Nnf1p-Nsl1p-Dsn1p (MIND) +S000033898 CDS YPL233W 16 106172 106822 W 1996-07-31 1996-07-31 +S000006153 ORF Verified YPL232W SSO1 syntaxin chromosome 16 L000002089 16 107275 108147 W 1996-07-31 1996-07-31 Plasma membrane t-SNARE; involved in fusion of secretory vesicles at the plasma membrane and in vesicle fusion during sporulation; forms a complex with Sec9p that binds v-SNARE Snc2p; syntaxin homolog; functionally redundant with Sso2p; SSO1 has a paralog, SSO2, that arose from the whole genome duplication +S000033777 CDS YPL232W 16 107275 108147 W 1996-07-31 1996-07-31 +S000006152 ORF Verified YPL231W FAS2 trifunctional fatty acid synthase subunit FAS2 chromosome 16 L000000602 16 108652 114315 W -125 1996-07-31 1996-07-31 Alpha subunit of fatty acid synthetase; complex catalyzes the synthesis of long-chain saturated fatty acids; contains the acyl-carrier protein domain and beta-ketoacyl reductase, beta-ketoacyl synthase and self-pantetheinylation activities +S000033048 CDS YPL231W 16 108652 114315 W 1996-07-31 1996-07-31 +S000006151 ORF Verified YPL230W USV1 NSF1 chromosome 16 L000004623 16 115312 116487 W 1996-07-31 1996-07-31 Putative transcription factor containing a C2H2 zinc finger; mutation affects transcriptional regulation of genes involved in growth on non-fermentable carbon sources, response to salt stress and cell wall biosynthesis; USV1 has a paralog, RGM1, that arose from the whole genome duplication +S000032959 CDS YPL230W 16 115312 116487 W 1996-07-31 1996-07-31 +S000122111 five_prime_UTR_intron YPL230W 16 115219 115293 W 2007-04-04 2007-04-04 +S000118413 ARS ARS1607 ARSXVI-117 chromosome 16 16 116566 116680 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178191 ARS_consensus_sequence ARS1607 16 116593 116609 W 2014-11-18 2014-11-18 +S000006150 ORF Uncharacterized YPL229W chromosome 16 16 117067 117687 W 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; not an essential gene; YPL229W has a paralog, YMR181C, that arose from the whole genome duplication +S000032811 CDS YPL229W 16 117067 117687 W 1996-07-31 1996-07-31 +S000006149 ORF Verified YPL228W CET1 polynucleotide 5'-phosphatase|CES5 chromosome 16 L000004278 16 118382 120031 W 1996-07-31 1996-07-31 RNA 5'-triphosphatase involved in mRNA 5' capping; subunit of mRNA capping enzyme, which is a heterotetramer composed of a Cet1p homodimer and two molecules of guanylyltransferase Ceg1p; Cet1p also has a role in regulation of RNAPII pausing at promoter-proximal sites; interaction between Cet1p and Ceg1p is required for Ceg1p nuclear import; mammalian enzyme is single bifunctional polypeptide; human homolog RNGTT can complement yeast cet1 null mutant +S000032710 CDS YPL228W 16 118382 120031 W 1996-07-31 1996-07-31 +S000006148 ORF Verified YPL227C ALG5 dolichyl-phosphate beta-glucosyltransferase chromosome 16 L000000077 16 121167 120163 C 1996-07-31 1996-07-31 UDP-glucose:dolichyl-phosphate glucosyltransferase; involved in asparagine-linked glycosylation in the endoplasmic reticulum; human ortholog ALG5 can partially complement yeast alg5 mutant +S000032583 CDS YPL227C 16 121167 120163 C 1996-07-31 1996-07-31 +S000006147 ORF Verified YPL226W NEW1 chromosome 16 S000007490 16 121767 125357 W 1996-07-31 1996-07-31 ATP binding cassette protein; cosediments with polysomes and is required for biogenesis of the small ribosomal subunit; Asn/Gln-rich rich region supports [NU+] prion formation and susceptibility to [PSI+] prion induction +S000031654 CDS YPL226W 16 121767 125357 W 1996-07-31 1996-07-31 +S000006146 ORF Verified YPL225W chromosome 16 16 126006 126446 W 1996-07-31 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; protein abundance increases in response to DNA replication stress +S000031511 CDS YPL225W 16 126006 126446 W 1996-07-31 1996-07-31 +S000006145 ORF Verified YPL224C MMT2 MFT2 chromosome 16 L000004108 16 128088 126634 C 2011-02-03 1996-07-31|2011-02-03 Putative metal transporter involved in mitochondrial iron accumulation; MMT2 has a paralog, MMT1, that arose from the whole genome duplication +S000030540 CDS YPL224C 16 128088 126634 C 2011-02-03 1996-07-31|2011-02-03 +S000006144 ORF Verified YPL223C GRE1 chromosome 16 L000004176 16 129138 128632 C 2011-02-03 1996-07-31 Hydrophilin essential in desiccation-rehydration process; stress induced (osmotic, ionic, oxidative, heat shock and heavy metals); regulated by the HOG pathway; GRE1 has a paralog, SIP18, that arose from the whole genome duplication +S000030402 CDS YPL223C 16 129138 128632 C 2011-02-03 1996-07-31 +S000006143 ORF Uncharacterized YPL222W FMP40 chromosome 16 16 130162 132228 W 2011-02-03 1996-07-31 Putative protein of unknown function; proposed to be involved in responding to environmental stresses; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000030350 CDS YPL222W 16 130162 132228 W 2011-02-03 1996-07-31 +S000028722 ORF Dubious YPL222C-A chromosome 16 16 132115 131870 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032704 CDS YPL222C-A 16 132115 131870 C 2011-02-03 2003-07-29 +S000006142 ORF Verified YPL221W FLC1 flavin adenine dinucleotide transporter|BOP1|HUF1 chromosome 16 L000004721 16 133043 135424 W 2011-02-03 1996-07-31 Flavin adenine dinucleotide transporter; required for uptake of FAD into endoplasmic reticulum; involved in cell wall maintenance; FLC1 has a paralog, FLC3, that arose from the whole genome duplication +S000030150 CDS YPL221W 16 133043 135424 W 2011-02-03 1996-07-31 +S000006141 ORF Verified YPL220W RPL1A uL1|PUB2|ribosomal 60S subunit protein L1A|L1|L1A|SSM1 chromosome 16 L000002657 16 135790 136443 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L1A; N-terminally acetylated; homologous to mammalian ribosomal protein L10A and bacterial L1; RPL1A has a paralog, RPL1B, that arose from the whole genome duplication; rpl1a rpl1b double null mutation is lethal +S000037448 CDS YPL220W 16 135790 136443 W 2011-02-03 1996-07-31 +S000006140 ORF Verified YPL219W PCL8 chromosome 16 L000004040 16 136750 138228 W 2011-02-03 1996-07-31 Cyclin; interacts with Pho85p cyclin-dependent kinase (Cdk) to phosphorylate and regulate glycogen synthase, also activates Pho85p for Glc8p phosphorylation; PCL8 has a paralog, PCL10, that arose from the whole genome duplication +S000036617 CDS YPL219W 16 136750 138228 W 2011-02-03 1996-07-31 +S000006139 ORF Verified YPL218W SAR1 Arf family GTPase SAR1 chromosome 16 L000001801 16 138698 139409 W 2011-02-03 1996-07-31 ARF family GTPase; component of the COPII vesicle coat; required for transport vesicle formation during ER to Golgi protein transport; lowers membrane rigidity aiding vesicle formation; localizes to ER-mitochondrial contact sites where it enhances membrane curvature, thereby reducing contact size via its N-terminal amphipathic helix; regulates mitochondrial fission and fusion dynamics +S000036527 CDS YPL218W 16 138698 138725 W 2011-02-03 1996-07-31 +S000036528 CDS YPL218W 16 138865 139409 W 2011-02-03 1996-07-31 +S000036529 intron YPL218W 16 138726 138864 W 2011-02-03 1996-07-31 +S000006138 ORF Verified YPL217C BMS1 GTPase BMS1 chromosome 16 16 143171 139620 C 2011-02-03 1996-07-31 GTPase required for ribosomal subunit synthesis and rRNA processing; required for synthesis of 40S ribosomal subunits and for processing the 35S pre-rRNA at sites A0, A1, and A2; interacts with Rcl1p, which stimulates its GTPase and U3 snoRNA binding activities; has similarity to Tsr1p +S000035571 CDS YPL217C 16 143171 139620 C 2011-02-03 1996-07-31 +S000006137 ORF Uncharacterized YPL216W chromosome 16 16 143821 147129 W 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential gene; YPL216W has a paralog, ITC1, that arose from the whole genome duplication +S000035522 CDS YPL216W 16 143821 147129 W 2011-02-03 1996-07-31 +S000006136 ORF Verified YPL215W CBP3 chromosome 16 L000000226 16 147416 148423 W 2011-02-03 1996-07-31 Mitochondrial protein required for assembly of cytochrome bc1 complex; forms a complex with Cbp6p that binds to mt ribosomes near the polypeptide tunnel exit and promotes efficient translation of the COB mRNA; Cbp3p-Cbp6p complex also interacts with newly synthesized cytochrome b (Cobp) and Cbp4p to promote assembly of Cobp into the cytochrome bc1 complex; Cbp3p-Cbp6p complex is sequestered if assembly of Complex III is blocked, downregulating COB mRNA translation +S000035433 CDS YPL215W 16 147416 148423 W 2011-02-03 1996-07-31 +S000006135 ORF Verified YPL214C THI6 bifunctional hydroxyethylthiazole kinase/thiamine-phosphate diphosphorylase chromosome 16 L000002634 16 150191 148569 C 2011-02-03 1996-07-31 Thiamine-phosphate diphosphorylase and hydroxyethylthiazole kinase; required for thiamine biosynthesis; GFP-fusion protein localizes to the cytoplasm in a punctate pattern +S000034353 CDS YPL214C 16 150191 148569 C 2011-02-03 1996-07-31 +S000006134 ORF Verified YPL213W LEA1 U2 snRNP complex subunit LEA1 chromosome 16 16 150614 151330 W 2011-02-03 1996-07-31 Component of U2 snRNP complex; disruption causes reduced U2 snRNP levels; physically interacts with Msl1p; putative homolog of human U2A' snRNP protein +S000034273 CDS YPL213W 16 150614 151330 W 2011-02-03 1996-07-31 +S000006133 ORF Verified YPL212C PUS1 pseudouridine synthase PUS1 chromosome 16 L000003360 16 153149 151515 C 2011-02-03 1996-07-31 tRNA:pseudouridine synthase; introduces pseudouridines at positions 26-28, 34-36, 65, and 67 of tRNA; also acts on U2 snRNA; also pseudouridylates some mRNAs, and pseudouridylation level varies with growth phase; nuclear protein that appears to be involved in tRNA export; PUS1 has a paralog, PUS2, that arose from the whole genome duplication +S000033309 CDS YPL212C 16 153149 151515 C 2011-02-03 1996-07-31 +S000006132 ORF Verified YPL211W NIP7 ribosome biosynthesis protein NIP7 chromosome 16 L000004183 16 153495 154040 W 2011-02-03 1996-07-31 Nucleolar protein required for 60S ribosome subunit biogenesis; constituent of 66S pre-ribosomal particles; physically interacts with Nop8p and the exosome subunit Rrp43p +S000033280 CDS YPL211W 16 153495 154040 W 2011-02-03 1996-07-31 +S000006131 ORF Verified YPL210C SRP72 signal recognition particle subunit SRP72 chromosome 16 L000002066 16 156212 154290 C 2011-02-03 2003-09-22|1996-07-31 Core component of the signal recognition particle (SRP); the SRP is a ribonucleoprotein (RNP) complex that functions in targeting nascent secretory proteins to the endoplasmic reticulum (ER) membrane +S000033194 CDS YPL210C 16 156212 154290 C 2011-02-03 2003-09-22|1996-07-31 +S000006130 ORF Verified YPL209C IPL1 aurora kinase|PAC15 chromosome 16 L000000871 16 157593 156490 C -116 2011-02-03 1996-07-31 Aurora kinase of chromosomal passenger complex; mediates release of mono-oriented kinetochores from microtubules in meiosis I, and kinetochore release from SPB clusters at meiotic exit; helps maintain condensed chromosomes during anaphase; required for SPB cohesion and prevention of multipolar spindle formation; promotes telomerase release at G2/M; Iocalizes to nuclear foci that diffuse upon DNA replication stress; required for inhibition of karyopherin Pse1p upon SAC arrest +S000032505 CDS YPL209C 16 157593 156490 C 2011-02-03 1996-07-31 +S000006129 ORF Verified YPL208W RKM1 protein-lysine N-methyltransferase chromosome 16 16 157842 159593 W 2011-02-03 1996-07-31 SET-domain lysine-N-methyltransferase; catalyzes the formation of dimethyllysine residues on the large ribosomal subunit proteins L23 (Rpl23Ap and Rpl23Bp) and monomethyllysine residues on L18 (Rps18Ap and Rps18Bp) +S000032466 CDS YPL208W 16 157842 159593 W 2011-02-03 1996-07-31 +S000006128 ORF Verified YPL207W TYW1 putative tRNA 4-demethylwyosine synthase chromosome 16 16 159909 162341 W 2011-02-03 1996-07-31 Iron-sulfer protein required for synthesis of Wybutosine modified tRNA; Wybutosine is a modified guanosine found at the 3'-position adjacent to the anticodon of phenylalanine tRNA which supports reading frame maintenance by stabilizing codon-anticodon interactions; induction by Yap5p in response to iron provides protection from high iron toxicity; overexpression results in increased cellular iron +S000032365 CDS YPL207W 16 159909 162341 W 2011-02-03 1996-07-31 +S000130196 ARS ARS1608 chromosome 16 16 162341 162632 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006127 ORF Verified YPL206C PGC1 phosphatidylglycerol phospholipase chromosome 16 16 163597 162632 C 2011-02-03 1996-07-31 Phosphatidylglycerol phospholipase C; regulates phosphatidylglycerol (PG) accumulation via a phospholipase C-type degradation mechanism; PG levels affect mitochondrial function; contains glycerophosphodiester phosphodiesterase motifs +S000032198 CDS YPL206C 16 163597 162632 C 2011-02-03 1996-07-31 +S000006126 ORF Dubious YPL205C chromosome 16 16 164266 163922 C 2011-02-03 1996-07-31 Hypothetical protein; deletion of locus affects telomere length +S000031200 CDS YPL205C 16 164266 163922 C 2011-02-03 1996-07-31 +S000006125 ORF Verified YPL204W HRR25 serine/threonine protein kinase HRR25|KTI14 chromosome 16 L000000810 16 164276 165760 W 2011-02-03 1996-07-31 Conserved casein kinase; regulates diverse events including: vesicular traffic, DNA repair, the CVT pathway, monopolar attachment of sister kinetochores at meiosis I, and ribosomal subunit biogenesis; monopolin subunit; binds the RNAPII CTD; phosphorylates COPII coat subunits; interacts with Sit4p phosphatase; antagonizes calcineurin signaling, reducing nuclear accumulation of Crz1p; phosphorylates Dsn1p, the kinetochore receptor for monopolin; homolog of mammalian CK1delta +S000031120 CDS YPL204W 16 164276 165760 W 2011-02-03 1996-07-31 +S000006124 ORF Verified YPL203W TPK2 cAMP-dependent protein kinase catalytic subunit TPK2|PKA3|YKR1|PKA2 chromosome 16 L000001445 16 166256 167398 W -120 2011-02-03 1996-07-31 cAMP-dependent protein kinase catalytic subunit; promotes vegetative growth in response to nutrients via the Ras-cAMP signaling pathway; partially redundant with Tpk1p and Tpk3p; localizes to P-bodies during stationary phase; relocalizes to the cytosol in response to hypoxia +S000031020 CDS YPL203W 16 166256 167398 W 2011-02-03 1996-07-31 +S000006123 ORF Verified YPL202C AFT2 chromosome 16 16 169338 168088 C 2011-02-03 1996-07-31 Iron-regulated transcriptional activator; activates genes involved in intracellular iron use and required for iron homeostasis and resistance to oxidative stress; AFT2 has a paralog, AFT1, that arose from the whole genome duplication +S000029960 CDS YPL202C 16 169338 168088 C 2011-02-03 1996-07-31 +S000006122 ORF Verified YPL201C YIG1 chromosome 16 16 171155 169770 C 2011-02-03 1996-07-31 Protein that interacts with glycerol 3-phosphatase; plays a role in anaerobic glycerol production; localizes to the nucleus and cytosol +S000029831 CDS YPL201C 16 171155 169770 C 2011-02-03 1996-07-31 +S000006121 ORF Verified YPL200W CSM4 chromosome 16 16 171484 171954 W 2011-02-03 1996-07-31 Protein required for accurate chromosome segregation during meiosis; involved in meiotic telomere clustering (bouquet formation) and telomere-led rapid prophase movements; functions with meiosis-specific telomere-binding protein Ndj1p; CSM4 has a paralog, MPS2, that arose from the whole genome duplication +S000037884 CDS YPL200W 16 171484 171954 W 2011-02-03 1996-07-31 +S000006120 ORF Uncharacterized YPL199C chromosome 16 16 172755 172033 C 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to be palmitoylated +S000031860 CDS YPL199C 16 172755 172033 C 2011-02-03 1996-07-31 +S000006119 ORF Verified YPL198W RPL7B uL30|ribosomal 60S subunit protein L7B|YL8|L7B|L6B|L30|rp11 chromosome 16 L000003304 16 173152 174702 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L7B; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; contains a conserved C-terminal Nucleic acid Binding Domain (NDB2); binds to Domain II of 25S and 5.8S rRNAs; homologous to mammalian ribosomal protein L7 and bacterial L30; RPL7B has a paralog, RPL7A, that arose from the whole genome duplication +S000031808 CDS YPL198W 16 173152 173162 W 2011-02-03 1996-07-31 +S000031809 CDS YPL198W 16 173572 173665 W 2011-02-03 1996-07-31 +S000031810 CDS YPL198W 16 174073 174702 W 2011-02-03 1996-07-31 +S000031811 intron YPL198W 16 173163 173571 W 2011-02-03 1996-07-31 +S000031812 intron YPL198W 16 173666 174072 W 2011-02-03 1996-07-31 +S000006450 snoRNA_gene snR59 SNR59 chromosome 16 L000004528 16 173827 173904 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A807 +S000030766 noncoding_exon snR59 16 173827 173904 W 2011-02-03 2000-05-19 +S000006118 ORF Dubious YPL197C chromosome 16 16 174756 174343 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the ribosomal gene RPL7B +S000031658 CDS YPL197C 16 174756 174343 C 2011-02-03 1996-07-31 +S000006117 ORF Verified YPL196W OXR1 chromosome 16 16 175043 175864 W 2011-02-03 1996-07-31 Protein of unknown function required for oxidative damage resistance; required for normal levels of resistance to oxidative damage; null mutants are sensitive to hydrogen peroxide; member of a conserved family of proteins found in eukaryotes +S000031609 CDS YPL196W 16 175043 175864 W 2011-02-03 1996-07-31 +S000006116 ORF Verified YPL195W APL5 YKS4 chromosome 16 L000003037 16 176223 179021 W 2011-02-03 1996-07-31 Delta adaptin-like subunit of the clathrin associated protein complex; functions in transport of alkaline phosphatase to the vacuole via the alternate pathway; suppressor of loss of casein kinase 1 function; the clathrin associated protein complex is also known as AP-3 +S000031504 CDS YPL195W 16 176223 179021 W 2011-02-03 1996-07-31 +S000006115 ORF Verified YPL194W DDC1 chromosome 16 L000004256 16 179277 181115 W 2011-02-03 1996-07-31 DNA damage checkpoint protein; part of a PCNA-like complex required for DNA damage response, required for pachytene checkpoint to inhibit cell cycle in response to unrepaired recombination intermediates; potential Cdc28p substrate; forms nuclear foci upon DNA replication stress +S000030638 CDS YPL194W 16 179277 181115 W 2011-02-03 1996-07-31 +S000006114 ORF Verified YPL193W RSA1 chromosome 16 L000004919 16 181403 182548 W 2011-02-03 1996-07-31 Protein involved in the assembly of 60S ribosomal subunits; functionally interacts with Dbp6p; functions in a late nucleoplasmic step of the assembly +S000030542 CDS YPL193W 16 181403 182548 W 2011-02-03 1996-07-31 +S000006113 ORF Verified YPL192C PRM3 pheromone-regulated protein PRM3 chromosome 16 16 183056 182655 C 2011-02-03 1996-07-31 Protein required for nuclear envelope fusion during karyogamy; pheromone-regulated; peripheral protein of the nuclear membrane; interacts with Kar5p at the spindle pole body +S000030353 CDS YPL192C 16 183056 182655 C 2011-02-03 1996-07-31 +S000006112 ORF Verified YPL191C chromosome 16 16 184679 183597 C 2011-02-03 1996-07-31 Protein of unknown function; diploid deletion strain exhibits high budding index; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YPL191C has a paralog, YGL082W, that arose from the whole genome duplication +S000037541 CDS YPL191C 16 184679 183597 C 2011-02-03 1996-07-31 +S000006111 ORF Verified YPL190C NAB3 HMD1 chromosome 16 L000001228 16 187725 185317 C 2011-02-03 1996-07-31 RNA-binding protein, subunit of Nrd1 complex (Nrd1p-Nab3p-Sen1p); complex interacts with exosome to mediate 3'-end formation of some mRNAs, snRNAs, snoRNAs, and CUTs; required for termination of non-poly(A) transcripts and efficient splicing; Nrd1-Nab3 pathway appears to have a role in rapid suppression of some genes when cells are shifted to poor growth conditions, indicating role for Nrd1-Nab3 in regulating cellular response to nutrient availability +S000037419 CDS YPL190C 16 187725 185317 C 2011-02-03 1996-07-31 +S000028527 ORF Verified YPL189C-A COA2 chromosome 16 16 188513 188307 C 2011-02-03 2003-07-29 Cytochrome oxidase assembly factor; null mutation results in respiratory deficiency with specific loss of cytochrome oxidase activity; functions downstream of assembly factors Mss51p and Coa1p and interacts with assembly factor Shy1p +S000030331 CDS YPL189C-A 16 188513 188307 C 2011-02-03 2003-07-29 +S000006110 ORF Verified YPL189W GUP2 putative O-acyltransferase chromosome 16 16 189154 190983 W 2011-02-03 1996-07-31 Probable membrane protein; possible role in proton symport of glycerol; member of the MBOAT family of putative membrane-bound O-acyltransferases; homolog of the mammalian Hedgehog pathway modulator HHAT; GUP2 has a paralog, GUP1, that arose from the whole genome duplication +S000036867 CDS YPL189W 16 189154 190983 W 2011-02-03 1996-07-31 +S000006109 ORF Verified YPL188W POS5 NADH kinase chromosome 16 L000002651 16 191406 192650 W 2011-02-03 1996-07-31 Mitochondrial NADH kinase; phosphorylates NADH; also phosphorylates NAD(+) with lower specificity; required for the response to oxidative stress +S000036799 CDS YPL188W 16 191406 192650 W 2011-02-03 1996-07-31 +S000006108 ORF Verified YPL187W MF(ALPHA)1 chromosome 16 L000001094 16 193648 194145 W -115 2011-02-03 1996-07-31 Mating pheromone alpha-factor, made by alpha cells; interacts with mating type a cells to induce cell cycle arrest and other responses leading to mating; also encoded by MF(ALPHA)2, although MF(ALPHA)1 produces most alpha-factor; binds copper(II) ions +S000036743 CDS YPL187W 16 193648 194145 W 2011-02-03 1996-07-31 +S000006106 ORF Dubious YPL185W chromosome 16 16 195253 195648 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene UIP4/YPL186C +S000035778 CDS YPL185W 16 195253 195648 W 2011-02-03 1996-07-31 +S000006107 ORF Verified YPL186C UIP4 chromosome 16 16 195426 194512 C 2011-02-03 1996-07-31 Protein that interacts with Ulp1p; a Ubl (ubiquitin-like protein)-specific protease for Smt3p protein conjugates; detected in a phosphorylated state in the mitochondrial outer membrane; also detected in ER and nuclear envelope +S000036644 CDS YPL186C 16 195426 194512 C 2011-02-03 1996-07-31 +S000006105 ORF Verified YPL184C MRN1 PTR69 chromosome 16 16 197788 195950 C 2011-02-03 1996-07-31 RNA-binding protein that may be involved in translational regulation; binds specific categories of mRNAs, including those that contain upstream open reading frames (uORFs) and internal ribosome entry sites (IRES); interacts genetically with chromatin remodelers and splicing factors, linking chromatin state, splicing and as a result mRNA maturation +S000035615 CDS YPL184C 16 197788 195950 C 2011-02-03 1996-07-31 +S000007224 ORF Verified YPL183W-A RTC6 putative mitochondrial 54S ribosomal protein RTC6|TAE4|GON5 chromosome 16 16 199095 199376 W 2011-02-03 1999-07-17 Protein involved in translation; mutants have defects in biogenesis of nuclear ribosomes; sequence similar to prokaryotic ribosomal protein L36, may be a mitochondrial ribosomal protein; protein abundance increases in response to DNA replication stress +S000035617 CDS YPL183W-A 16 199095 199376 W 2011-02-03 1999-07-17 +S000006104 ORF Verified YPL183C RTT10 TRM734|ERE2 chromosome 16 16 202536 199495 C 2011-02-03 1996-07-31 WD40 domain-containing protein involved in endosomal recycling; forms a complex with Rrt2p that functions in the retromer-mediated pathway for recycling internalized cell-surface proteins; interacts with Trm7p for 2'-O-methylation of N34 of substrate tRNAs; has a role in regulation of Ty1 transposition; human ortholog is WDR6 +S000035538 CDS YPL183C 16 202536 199495 C 2011-02-03 1996-07-31 +S000006102 ORF Verified YPL181W CTI6 RXT1 chromosome 16 16 203421 204941 W 2011-02-03 1996-07-31 Component of the Rpd3L histone deacetylase complex; relieves transcriptional repression by binding to the Cyc8p-Tup1p corepressor and recruiting the SAGA complex to the repressed promoter; contains a PHD finger domain +S000034453 CDS YPL181W 16 203421 204941 W 2011-02-03 1996-07-31 +S000006103 ORF Dubious YPL182C chromosome 16 16 203689 203306 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CTI6/YPL181W +S000034519 CDS YPL182C 16 203689 203306 C 2011-02-03 1996-07-31 +S000006101 ORF Verified YPL180W TCO89 chromosome 16 16 205248 207647 W 2011-02-03 1996-07-31 Subunit of TORC1 (Tor1p or Tor2p-Kog1p-Lst8p-Tco89p); regulates global H3K56ac; TORC1 complex regulates growth in response to nutrient availability; cooperates with Ssd1p in the maintenance of cellular integrity; deletion strains are hypersensitive to rapamycin +S000034375 CDS YPL180W 16 205248 207647 W 2011-02-03 1996-07-31 +S000006100 ORF Verified YPL179W PPQ1 SAL6 chromosome 16 L000001797|L000001474 16 208157 209806 W 2011-02-03 1996-07-31 Protein phosphatase that regulates the mating response; negatively regulates the MAP kinase signaling cascade during mating; member of the serine/threonine phosphatase PP1 family +S000033429 CDS YPL179W 16 208157 209806 W 2011-02-03 1996-07-31 +S000006561 tRNA_gene tE(UUC)P chromosome 16 L000003736 16 210263 210192 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin +S000036031 noncoding_exon tE(UUC)P 16 210263 210192 C 2011-02-03 2000-05-19 +S000007194 long_terminal_repeat YPLWdelta7 chromosome 16 16 210451 210771 W 2011-02-03 2000-05-19 Ty1 LTR +S000007195 long_terminal_repeat YPLWdelta8 chromosome 16 16 211577 211898 W 2011-02-03 2000-05-19 Ty2 LTR +S000006099 ORF Verified YPL178W CBC2 CBP20|SAE1|MUD13 chromosome 16 L000002891|L000004111 16 212158 212784 W 2011-02-03 1996-07-31 Small subunit of the heterodimeric cap binding complex with Sto1p; interacts with Npl3p, possibly to package mRNA for export from the nucleus; may have a role in telomere maintenance; contains an RNA-binding motif +S000033362 CDS YPL178W 16 212158 212784 W 2011-02-03 1996-07-31 +S000006098 ORF Verified YPL177C CUP9 chromosome 16 L000000442 16 213962 213042 C 2011-02-03 1996-07-31 Homeodomain-containing transcriptional repressor; regulates expression of PTR2, which encodes a major peptide transporter; imported peptides activate ubiquitin-dependent proteolysis, resulting in degradation of Cup9p and de-repression of PTR2 transcription; CUP9 has a paralog, TOS8, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000032622 CDS YPL177C 16 213962 213042 C 2011-02-03 1996-07-31 +S000006097 ORF Verified YPL176C TRE1 chromosome 16 16 218363 216012 C 2011-02-03 1996-07-31 Transferrin receptor-like protein; plasma membrane protein that binds Bsd2p and regulates ubiquitination and vacuolar degradation of the metal transporter Smf1p; functionally redundant with Tre2p; TRE1 has a paralog, TRE2, that arose from the whole genome duplication +S000032515 CDS YPL176C 16 218363 216012 C 2011-02-03 1996-07-31 +S000006096 ORF Verified YPL175W SPT14 phosphatidylinositol N-acetylglucosaminyltransferase SPT14|GPI3|CWH6 chromosome 16 L000002036 16 218630 220088 W -113 2011-02-03 2000-07-14|1996-07-31 UDP-glycosyltransferase subunit of the GPI-GnT complex; UDP-GlcNAc-binding and catalytic subunit of the enzyme that mediates the first step in glycosylphosphatidylinositol (GPI) biosynthesis, mutations cause defects in transcription and in biogenesis of cell wall proteins +S000032480 CDS YPL175W 16 218630 218646 W 2011-02-03 2000-07-14|1996-07-31 +S000032481 CDS YPL175W 16 218747 220088 W 2011-02-03 2000-07-14|1996-07-31 +S000032482 intron YPL175W 16 218647 218746 W 2011-02-03 2000-07-14|1996-07-31 +S000130197 ARS ARS1611 chromosome 16 16 220088 220167 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006095 ORF Verified YPL174C NIP100 PAC13 chromosome 16 L000001254 16 222773 220167 C 2011-02-03 1996-07-31 Large subunit of the dynactin complex; dynactin is involved in partitioning the mitotic spindle between mother and daughter cells; putative ortholog of mammalian p150(glued) +S000031426 CDS YPL174C 16 222773 220167 C 2011-02-03 1996-07-31 +S000006094 ORF Verified YPL173W MRPL40 mitochondrial 54S ribosomal protein YmL40|YmL40 chromosome 16 L000002696 16 223143 224036 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000031355 CDS YPL173W 16 223143 224036 W 2011-02-03 1996-07-31 +S000006093 ORF Verified YPL172C COX10 protoheme IX farnesyltransferase chromosome 16 L000000394 16 225741 224353 C 2011-02-03 1996-07-31 Heme A:farnesyltransferase; catalyzes first step in conversion of protoheme to heme A prosthetic group required for cytochrome c oxidase activity; human ortholog COX10 can complement yeast cox10 null mutant; human ortholog COX10 is associated with mitochondrial disorders +S000031181 CDS YPL172C 16 225741 224353 C 2011-02-03 1996-07-31 +S000006092 ORF Verified YPL171C OYE3 NADPH dehydrogenase|ZRG6 chromosome 16 L000001326 16 227371 226169 C 2011-02-03 1996-07-31 Conserved NADPH oxidoreductase containing flavin mononucleotide (FMN); homologous to Oye2p with different ligand binding and catalytic properties; has potential roles in oxidative stress response and programmed cell death +S000030238 CDS YPL171C 16 227371 226169 C 2011-02-03 1996-07-31 +S000006091 ORF Verified YPL170W DAP1 chromosome 16 16 228314 228772 W 2011-02-03 1996-07-31 Heme-binding protein; involved in regulation of cytochrome P450 protein Erg11p; damage response protein, related to mammalian membrane progesterone receptors; mutations lead to defects in telomeres, mitochondria, and sterol synthesis +S000030129 CDS YPL170W 16 228314 228772 W 2011-02-03 1996-07-31 +S000006090 ORF Verified YPL169C MEX67 chromosome 16 L000004314 16 230838 229039 C 2011-02-03 1996-07-31 Poly(A)RNA binding protein involved in nuclear mRNA export; component of the nuclear pore; ortholog of human TAP +S000037096 CDS YPL169C 16 230838 229039 C 2011-02-03 1996-07-31 +S000006089 ORF Uncharacterized YPL168W MRX4 chromosome 16 16 231217 232509 W 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; expression may be cell cycle-regulated +S000036477 CDS YPL168W 16 231217 232509 W 2011-02-03 1996-07-31 +S000006088 ORF Verified YPL167C REV3 PSO1 chromosome 16 L000001616 16 237107 232593 C -102 2011-02-03 1996-07-31 Catalytic subunit of DNA polymerase zeta; involved in translesion synthesis during post-replication repair; required for mutagenesis induced by DNA damage; involved in double-strand break repair; forms a complex with Rev7p, Pol31p and Pol32p +S000036379 CDS YPL167C 16 237107 232593 C 2011-02-03 1996-07-31 +S000006087 ORF Verified YPL166W ATG29 chromosome 16 16 237338 237979 W 2011-02-03 1996-07-31 Autophagy-specific protein; required for recruiting other ATG proteins to the pre-autophagosomal structure (PAS); interacts with Atg17p and localizas to the PAS in a manner interdependent with Atg17p and Cis1p; not conserved; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000036304 CDS YPL166W 16 237338 237979 W 2011-02-03 1996-07-31 +S000006086 ORF Verified YPL165C SET6 chromosome 16 16 239077 237956 C 2011-02-03 1996-07-31 SET domain protein of unknown function; deletion heterozygote is sensitive to compounds that target ergosterol biosynthesis, may be involved in compound availability +S000036129 CDS YPL165C 16 239077 237956 C 2011-02-03 1996-07-31 +S000006085 ORF Verified YPL164C MLH3 mismatch repair protein MLH3 chromosome 16 16 241497 239350 C 2011-02-03 1996-07-31 Protein involved in DNA mismatch repair and meiotic recombination; involved in crossing-over during meiotic recombination; forms a complex with Mlh1p; mammalian homolog is implicated mammalian microsatellite instability +S000035196 CDS YPL164C 16 241497 239350 C 2011-02-03 1996-07-31 +S000006084 ORF Verified YPL163C SVS1 chromosome 16 L000002750 16 242700 241918 C 2011-02-03 1996-07-31 Cell wall and vacuolar protein; required for wild-type resistance to vanadate; SVS1 has a paralog, SRL1, that arose from the whole genome duplication +S000035038 CDS YPL163C 16 242700 241918 C 2011-02-03 1996-07-31 +S000006083 ORF Uncharacterized YPL162C chromosome 16 16 244027 243206 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the membrane of vacuole with cell cycle-correlated morphology +S000034090 CDS YPL162C 16 244027 243206 C 2011-02-03 1996-07-31 +S000006082 ORF Verified YPL161C BEM4 ROM7 chromosome 16 L000000170 16 246220 244319 C 2011-02-03 1996-07-31 Protein involved in establishment of cell polarity and bud emergence; interacts with the Rho1p small GTP-binding protein and with the Rho-type GTPase Cdc42p; involved in maintenance of proper telomere length +S000033986 CDS YPL161C 16 246220 244319 C 2011-02-03 1996-07-31 +S000006081 ORF Verified YPL160W CDC60 leucine--tRNA ligase CDC60|LeuRS chromosome 16 L000000283 16 246990 250262 W -65 2011-02-03 1996-07-31 Cytosolic leucyl tRNA synthetase; ligates leucine to the appropriate tRNA; human homolog LARS can complement yeast temperature-sensitive mutant at restrictive temperature +S000033896 CDS YPL160W 16 246990 250262 W 2011-02-03 1996-07-31 +S000006080 ORF Verified YPL159C PET20 chromosome 16 16 251668 250907 C 2011-02-03 1996-07-31 Mitochondrial protein; required for respiratory growth under some conditions and for stability of the mitochondrial genome +S000034917 CDS YPL159C 16 251668 250907 C 2011-02-03 1996-07-31 +S000006079 ORF Verified YPL158C AIM44 GPS1 chromosome 16 16 254310 252034 C 2011-02-03 1996-07-31 Protein that regulates Cdc42p and Rho1p; functions in the late steps of cytokinesis and cell separation; sustains Rho1p at the cell division site after actomyosin ring contraction; inhibits the activation of Cdc42-Cla4 at the cell division site to prevent budding inside the old bud neck; transcription is regulated by Swi5p; null mutant displays elevated frequency of mitochondrial genome loss; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000034827 CDS YPL158C 16 254310 252034 C 2011-02-03 1996-07-31 +S000006078 ORF Verified YPL157W TGS1 RNA methyltransferase chromosome 16 16 254814 255761 W 2011-02-03 1996-07-31 Trimethyl guanosine synthase, conserved nucleolar methyl transferase; converts the m(7)G cap structure of snRNAs, snoRNAs, and telomerase TLC1 RNA to m(2,2,7)G; also required for nucleolar assembly and splicing of meiotic pre-mRNAs; interacts with Swm2p, which may confer substrate specificity on Tgs1p +S000032912 CDS YPL157W 16 254814 255761 W 2011-02-03 1996-07-31 +S000006077 ORF Verified YPL156C PRM4 pheromone-regulated protein PRM4 chromosome 16 16 256767 255913 C 2011-02-03 1996-07-31 Pheromone-regulated protein proposed to be involved in mating; predicted to have 1 transmembrane segment; transcriptionally regulated by Ste12p during mating and by Cat8p during the diauxic shift +S000032757 CDS YPL156C 16 256767 255913 C 2011-02-03 1996-07-31 +S000006076 ORF Verified YPL155C KIP2 chromosome 16 L000000908 16 259336 257216 C 2011-02-03 1996-07-31 Kinesin-related motor protein involved in mitotic spindle positioning; stabilizes microtubules by targeting Bik1p to the plus end; functions as a microtubule polymerase and catastrophe inhibitor in vitro; Kip2p levels are controlled during the cell cycle +S000032676 CDS YPL155C 16 259336 257216 C 2011-02-03 1996-07-31 +S000006075 ORF Verified YPL154C PEP4 proteinase A|yscA|PRA1|PHO9 chromosome 16 L000001375 16 260931 259714 C -95 2011-02-03 1996-07-31 Vacuolar aspartyl protease (proteinase A); required for posttranslational precursor maturation of vacuolar proteinases; important for protein turnover after oxidative damage; plays a protective role in acetic acid induced apoptosis; synthesized as a zymogen, self-activates +S000031707 CDS YPL154C 16 260931 259714 C 2011-02-03 1996-07-31 +S000130198 ARS ARS1612 chromosome 16 16 260931 261727 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006074 ORF Verified YPL153C RAD53 serine/threonine/tyrosine protein kinase RAD53|SPK1|MEC2|LSD1 chromosome 16 L000001573 16 264192 261727 C -109 2011-02-03 1996-07-31 DNA damage response protein kinase; required for cell-cycle arrest, regulation of copper genes in response to DNA damage; phosphorylates nuclear pores to counteract gene gating, preventing aberrant transitions at forks approaching transcribed genes; activates downstream kinase Dun1p; differentially senses mtDNA depletion, mitochondrial ROS; relocalizes to cytosol under hypoxia; human homolog CHEK2 implicated in breast cancer can complement yeast null mutant +S000031574 CDS YPL153C 16 264192 261727 C 2011-02-03 1996-07-31 +S000028721 ORF Uncharacterized YPL152W-A chromosome 16 16 264602 264700 W 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032702 CDS YPL152W-A 16 264602 264700 W 2011-02-03 2003-07-29 +S000006073 ORF Verified YPL152W RRD2 peptidylprolyl isomerase RRD2|YPA2 chromosome 16 L000004484 16 265028 266104 W 2011-02-03 1996-07-31 Peptidyl-prolyl cis/trans-isomerase; also activates the phosphotyrosyl phosphatase activity of protein phosphatase 2A (PP2A); regulates G1 phase progression, the osmoresponse, microtubule dynamics; subunit of the Tap42p-Pph21p-Rrd2p complex; protein abundance increases in response to DNA replication stress +S000031507 CDS YPL152W 16 265028 266104 W 2011-02-03 1996-07-31 +S000006072 ORF Verified YPL151C PRP46 mRNA splicing protein PRP46|NTC50 chromosome 16 16 267535 266180 C 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs +S000030537 CDS YPL151C 16 267535 266180 C 2011-02-03 1996-07-31 +S000006071 ORF Uncharacterized YPL150W non-specific serine/threonine protein kinase chromosome 16 16 268188 270893 W 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; binds phosphatidylinositols and cardiolipin in a large-scale study +S000030474 CDS YPL150W 16 268188 270893 W 2011-02-03 1996-07-31 +S000006070 ORF Verified YPL149W ATG5 APG5 chromosome 16 L000003303 16 271310 272194 W 2011-02-03 1996-07-31 Conserved protein involved in autophagy and the Cvt pathway; undergoes conjugation with Atg12p to form a complex involved in Atg8p lipidation; Atg5p-Atg12p conjugate enhances E2 activity of Atg3 by rearranging its catalytic site, also forms a complex with Atg16p; the Atg5-Atg12/Atg16 complex binds to membranes and is essential for autophagosome formation; also involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner +S000030694 CDS YPL149W 16 271310 272194 W 2011-02-03 1996-07-31 +S000006069 ORF Verified YPL148C PPT2 holo-[acyl-carrier-protein] synthase chromosome 16 L000004400 16 272815 272294 C 2011-02-03 2003-09-22|1996-07-31 Phosphopantetheine:protein transferase (PPTase); activates mitochondrial acyl carrier protein (Acp1p) by phosphopantetheinylation +S000036734 CDS YPL148C 16 272815 272294 C 2011-02-03 2003-09-22|1996-07-31 +S000006068 ORF Verified YPL147W PXA1 ATP-binding cassette long-chain fatty acid transporter PXA1|SSH2|PAT2|PAL1|LPI1 chromosome 16 L000001541 16 273255 275867 W 2011-02-03 1996-07-31 Subunit of heterodimeric peroxisomal ABC transport complex, with Pxa2p; required for import of long-chain fatty acids into peroxisomes; similar to human adrenoleukodystrophy transporters ABCD1and ABCD2, and ALD-related proteins; mutations in ABCD1 cause X-linked adrenoleukodystrophy (X-ALD), a peroxisomal disorder; human ABCD1 and ABCD2 can each partially complement yeast pxa1 pxa2 double null mutant +S000036715 CDS YPL147W 16 273255 275867 W 2011-02-03 1996-07-31 +S000006067 ORF Verified YPL146C NOP53 RRP16 chromosome 16 16 277529 276162 C 2011-02-03 1996-07-31 Nucleolar protein; involved in biogenesis of the 60S subunit of the ribosome; interacts with rRNA processing factors Cbf5p and Nop2p and with the nucleolar proteins Nop17p and Nip7p; null mutant is viable but growth is severely impaired +S000036573 CDS YPL146C 16 277529 276162 C 2011-02-03 1996-07-31 +S000006066 ORF Verified YPL145C KES1 oxysterol-binding protein KES1|BSR3|OSH4|LPI3 chromosome 16 L000000894 16 279699 278395 C 2011-02-03 1996-07-31 One of seven members of the yeast oxysterol binding protein family; involved in negative regulation of Sec14p-dependent Golgi complex secretory functions, peripheral membrane protein that localizes to the Golgi complex; KES1 has a paralog, HES1, that arose from the whole genome duplication +S000035629 CDS YPL145C 16 279699 278395 C 2011-02-03 1996-07-31 +S000006065 ORF Verified YPL144W POC4 DMP1|PBA4 chromosome 16 16 280480 280926 W 2011-02-03 1996-07-31 Component of a heterodimeric Poc4p-Irc25p chaperone; involved in assembly of alpha subunits into the 20S proteasome; may regulate formation of proteasome isoforms with alternative subunits under different conditions; upregulates proteasome assembly in response to the unfolded protein response activated by mistargeting of proteins (UPRam) +S000035609 CDS YPL144W 16 280480 280926 W 2011-02-03 1996-07-31 +S000007441 snoRNA_gene snR17b SNR17B U3 chromosome 16 L000004247 16 281517 281056 C 2011-02-03 2000-05-19 Small nucleolar RNA (snoRNA) U3; part of small (ribosomal) subunit (SSU) processosome; SNR17A also encodes snoRNA U3 +S000030181 intron snR17b 16 281503 281374 C 2011-02-03 2000-05-19 +S000030180 noncoding_exon snR17b 16 281373 281056 C 2011-02-03 2000-05-19 +S000030179 noncoding_exon snR17b 16 281517 281504 C 2011-02-03 2000-05-19 +S000006064 ORF Verified YPL143W RPL33A eL33|ribosomal 60S subunit protein L33A|L33e|rp47|l37A|YL37|L33A|RPL37A chromosome 16 L000001728 16 282122 282970 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L33A; N-terminally acetylated; rpl33a null mutant exhibits slow growth while rpl33a rpl33b double null mutant is inviable; homologous to mammalian ribosomal protein L35A, no bacterial homolog; RPL33A has a paralog, RPL33B, that arose from the whole genome duplication +S000035517 CDS YPL143W 16 282122 282140 W 2011-02-03 1996-07-31 +S000035518 CDS YPL143W 16 282666 282970 W 2011-02-03 1996-07-31 +S000035519 intron YPL143W 16 282141 282665 W 2011-02-03 1996-07-31 +S000006063 ORF Dubious YPL142C chromosome 16 16 283003 282686 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF RPL33A/YPL143W, a component of the large (60S) ribosomal subunit +S000035342 CDS YPL142C 16 283003 282686 C 2011-02-03 1996-07-31 +S000006062 ORF Verified YPL141C FRK1 protein kinase FRK1 chromosome 16 16 286061 283464 C 2011-02-03 1996-07-31 Protein kinase of unknown cellular role; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; interacts with rRNA transcription and ribosome biogenesis factors and the long chain fatty acyl-CoA synthetase Faa3p; FRK1 has a paralog, KIN4, that arose from the whole genome duplication +S000034336 CDS YPL141C 16 286061 283464 C 2011-02-03 1996-07-31 +S000006061 ORF Verified YPL140C MKK2 putative mitogen-activated protein kinase kinase MKK2|SSP33|LPI6 chromosome 16 L000001118 16 289034 287514 C 2011-02-03 1996-07-31 MAPKK involved in the protein kinase C signaling pathway; involved in control of cell integrity; upon activation by Bck1p phosphorylates downstream target, Slt2p; functionally redundant with Mkk1p; MKK2 has a paralog, MKK1, that arose from the whole genome duplication +S000034223 CDS YPL140C 16 289034 287514 C 2011-02-03 1996-07-31 +S000118414 ARS ARS1614 ARSXVI-290 chromosome 16 16 289485 289705 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178192 ARS_consensus_sequence ARS1614 16 289530 289546 W 2014-11-18 2014-11-18 +S000006060 ORF Verified YPL139C UME1 WTM3 chromosome 16 L000003500 16 291051 289669 C 2011-02-03 1996-07-31 Component of both the Rpd3S and Rpd3L histone deacetylase complexes; negative regulator of meiosis; required for repression of a subset of meiotic genes during vegetative growth, binding of histone deacetylase Rpd3p required for activity, contains a NEE box and a WD repeat motif; homologous with Wtm1p; UME1 has a paralog, WTM2, that arose from the whole genome duplication +S000034691 CDS YPL139C 16 291051 289669 C 2011-02-03 1996-07-31 +S000006059 ORF Verified YPL138C SPP1 SAF41|CPS40 chromosome 16 16 292427 291366 C 2011-02-03 1996-07-31 Subunit of COMPASS (Set1C); a complex which methylates histone H3 on lysine 4 and is required in telomeric transcriptional silencing; promotes meiotic DSB formation by interacting with H3K4me3 and Rec107p, a protein required for Spo11p-catalyzed DSB formation located on chromosome axes; interacts with Orc2p; PHD finger domain protein similar to human CGBP, an unmethylated CpG binding protein; relocalizes to cytosol in response to hypoxia +S000034627 CDS YPL138C 16 292427 291366 C 2011-02-03 1996-07-31 +S000006057 ORF Dubious YPL136W chromosome 16 16 296286 296654 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene GIP3/YPL137C +S000034466 CDS YPL136W 16 296286 296654 W 2011-02-03 1996-07-31 +S000006058 ORF Verified YPL137C GIP3 protein phosphatase regulator GIP3 chromosome 16 16 296647 292817 C 2011-02-03 1996-07-31 Cytoplasmic protein that regulates protein phosphatase 1 Glc7p; overexpression relocalizes Glc7p from the nucleus and prevents chromosome segregation; may interact with ribosomes, based on co-purification experiments; GIP3 has a paralog, HER1, that arose from the whole genome duplication +S000034539 CDS YPL137C 16 296647 292817 C 2011-02-03 1996-07-31 +S000006056 ORF Verified YPL135W ISU1 iron-binding protein ISU1|NUA1 chromosome 16 L000004769 16 297553 298050 W 2011-02-03 1996-07-31 Conserved protein of the mitochondrial matrix; performs a scaffolding function during assembly of iron-sulfur clusters, interacts physically and functionally with yeast frataxin (Yfh1p); ISU1 has a paralog, ISU2, that arose from the whole genome duplication; isu1 isu2 double mutant is inviable; human homolog ISCU implicated in mitochondrial myopathy, can complement isu1 isu2 double mutant +S000032464 CDS YPL135W 16 297553 298050 W 2011-02-03 1996-07-31 +S000028720 ORF Dubious YPL135C-A chromosome 16 16 297851 297678 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032700 CDS YPL135C-A 16 297851 297678 C 2011-02-03 2003-07-29 +S000006055 ORF Verified YPL134C ODC1 mitochondrial 2-oxodicarboxylate carrier chromosome 16 S000007520 16 299503 298571 C 2011-02-03 1996-07-31 Mitochondrial inner membrane transporter; 2-oxodicarboxylate transporter, exports 2-oxoadipate and 2-oxoglutarate from the mitochondrial matrix to the cytosol for lysine and glutamate biosynthesis and lysine catabolism; suppresses, in multicopy, an fmc1 null mutation; ODC1 has a paralog, ODC2, that arose from the whole genome duplication +S000032295 CDS YPL134C 16 299503 298571 C 2011-02-03 1996-07-31 +S000006054 ORF Verified YPL133C RDS2 chromosome 16 16 301228 299888 C 2011-02-03 1996-07-31 Transcription factor involved in regulating gluconeogenesis; also involved in the regulation of glyoxylate cycle genes; member of the zinc cluster family of proteins; confers resistance to ketoconazole +S000032197 CDS YPL133C 16 301228 299888 C 2011-02-03 1996-07-31 +S000006053 ORF Verified YPL132W COX11 PSO7|LPI13 chromosome 16 L000000395|L000004044 16 301716 302618 W 2011-02-03 1996-07-31 Protein required for delivery of copper to Cox1p; mitochondrial inner membrane protein; association with mitochondrial ribosomes suggests that copper delivery may occur during translation of Cox1p +S000031257 CDS YPL132W 16 301716 302618 W 2011-02-03 1996-07-31 +S000006052 ORF Verified YPL131W RPL5 uL18|ribosomal 60S subunit protein L5|L18|YL3|L5|L1a|RPL1|LPI14 chromosome 16 L000001699 16 303121 304014 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L5; nascent Rpl5p is bound by specific chaperone Syo1p during translation; homologous to mammalian ribosomal protein L5 and bacterial L18; binds 5S rRNA and is required for 60S subunit assembly +S000031118 CDS YPL131W 16 303121 304014 W 2011-02-03 1996-07-31 +S000006051 ORF Verified YPL130W SPO19 chromosome 16 16 304387 305058 W 2011-02-03 1996-07-31 Meiosis-specific prospore protein; required to produce bending force necessary for proper assembly of the prospore membrane during sporulation; identified as a weak high-copy suppressor of the spo1-1 ts mutation; SPO19 has a paralog, YOR214C, that arose from the whole genome duplication +S000031018 CDS YPL130W 16 304387 305058 W 2011-02-03 1996-07-31 +S000006050 ORF Verified YPL129W TAF14 TATA-binding protein-associated factor TAF14|TafII30|ANC1|TFG3|TAF30|SWP29 chromosome 16 L000000086 16 305298 306137 W 2011-02-03 1996-07-31 Subunit of TFIID, TFIIF, INO80, SWI/SNF, and NuA3 complexes; involved in RNA polymerase II transcription initiation and in chromatin modification; contains a YEATS domain +S000031306 CDS YPL129W 16 305298 305306 W 2011-02-03 1996-07-31 +S000031307 CDS YPL129W 16 305412 306137 W 2011-02-03 1996-07-31 +S000031308 intron YPL129W 16 305307 305411 W 2011-02-03 1996-07-31 +S000006049 ORF Verified YPL128C TBF1 LPI16 chromosome 16 L000002264 16 308221 306533 C -81.5 2011-02-03 1996-07-31 Telobox-containing general regulatory factor; binds TTAGGG repeats within subtelomeric anti-silencing regions (STARs), blocking silent chromatin propagation; binds majority of snoRNA gene promoters, required for full snoRNA expression; caps DSB flanked by long T2AG3 repeats and blocks checkpoint activation +S000030320 CDS YPL128C 16 308221 306533 C 2011-02-03 1996-07-31 +S000006048 ORF Verified YPL127C HHO1 histone H1 chromosome 16 L000003354 16 309604 308828 C 2011-02-03 1996-07-31 Histone H1, linker histone with roles in meiosis and sporulation; decreasing levels early in sporulation may promote meiosis, and increasing levels during sporulation facilitate compaction of spore chromatin; binds to promoters and within genes in mature spores; may be recruited by Ume6p to promoter regions, contributing to transcriptional repression outside of meiosis; suppresses DNA repair involving homologous recombination +S000030125 CDS YPL127C 16 309604 308828 C 2011-02-03 1996-07-31 +S000006047 ORF Verified YPL126W NAN1 UTP17 chromosome 16 16 310210 312900 W 2011-02-03 1996-07-31 U3 snoRNP protein; component of the small (ribosomal) subunit (SSU) processosome containing U3 snoRNA; required for the biogenesis of18S rRNA +S000030112 CDS YPL126W 16 310210 312900 W 2011-02-03 1996-07-31 +S000006046 ORF Verified YPL125W KAP120 LPH2 chromosome 16 16 313388 316486 W 2011-02-03 1996-07-31 Karyopherin responsible for the nuclear import of Rpf1p; Rpf1p is a ribosome maturation factor +S000036402 CDS YPL125W 16 313388 316486 W 2011-02-03 1996-07-31 +S000006045 ORF Verified YPL124W SPC29 NIP29|LPH3 chromosome 16 L000001253 16 316755 317516 W 2011-02-03 1996-07-31 Inner plaque spindle pole body (SPB) component; links the central plaque component Spc42p to the inner plaque component Spc110p; required for SPB duplication +S000036286 CDS YPL124W 16 316755 317516 W 2011-02-03 1996-07-31 +S000006044 ORF Verified YPL123C RNY1 ribonuclease T2 chromosome 16 16 318945 317641 C 2011-02-03 1996-07-31 Vacuolar RNase of the T(2) family; relocalizes to the cytosol where it cleaves tRNAs upon oxidative or stationary phase stress; required for tRNA-specific translational pausing suring oxidative stress; promotes apoptosis under stress conditions and this function is independent of Rny1p catalytic activity +S000036104 CDS YPL123C 16 318945 317641 C 2011-02-03 1996-07-31 +S000006043 ORF Verified YPL122C TFB2 TFIIH/NER complex subunit TFB2 chromosome 16 L000003495 16 320767 319226 C 2011-02-03 1996-07-31 Subunit of TFIIH and nucleotide excision repair factor 3 complexes; involved in transcription initiation, required for nucleotide excision repair, similar to 52 kDa subunit of human TFIIH +S000035221 CDS YPL122C 16 320767 319226 C 2011-02-03 1996-07-31 +S000006042 ORF Verified YPL121C MEI5 LPH6 chromosome 16 L000001061 16 321630 320962 C 2011-02-03 1996-07-31 Meiosis-specific protein involved in meiotic recombination; involved in DMC1-dependent meiotic recombination; forms heterodimer with Sae3p; proposed to be an assembly factor for Dmc1p +S000035025 CDS YPL121C 16 321630 320962 C 2011-02-03 1996-07-31 +S000006041 ORF Verified YPL120W VPS30 beclin 1|ATG6|VPT30|APG6 chromosome 16 L000003545 16 322071 323744 W 2011-02-03 1996-07-31 Subunit of phosphatidylinositol (PtdIns) 3-kinase complexes I and II; Complex I is essential in autophagy, Complex II is required for vacuolar protein sorting; required for overflow degradation of misfolded proteins when ERAD is saturated; C-terminus has novel globular fold essential for autophagy through the targeting of the PI3-kinase complex I to the pre-autophagosomal structure; ortholog of higher eukaryote gene Beclin 1; human BECN1 can complement yeast null mutant +S000034961 CDS YPL120W 16 322071 323744 W 2011-02-03 1996-07-31 +S000028859 ORF Uncharacterized YPL119C-A chromosome 16 16 324287 324024 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034573 CDS YPL119C-A 16 324287 324024 C 2011-02-03 2003-07-29 +S000006040 ORF Verified YPL119C DBP1 putative DEAD-box ATP-dependent RNA helicase DBP1|LPH8 chromosome 16 L000000492 16 326264 324411 C 2011-02-03 1996-07-31 Putative ATP-dependent RNA helicase of the DEAD-box protein family; mutants show reduced stability of the 40S ribosomal subunit scanning through 5' untranslated regions of mRNAs; protein abundance increases in response to DNA replication stress; DBP1 has a paralog, DED1, that arose from the whole genome duplication +S000035431 CDS YPL119C 16 326264 324411 C 2011-02-03 1996-07-31 +S000006039 ORF Verified YPL118W MRP51 mitochondrial 37S ribosomal protein MRP51 chromosome 16 L000003325 16 326628 327662 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; MRP51 exhibits genetic interactions with mutations in the COX2 and COX3 mRNA 5'-untranslated leader sequences +S000035395 CDS YPL118W 16 326628 327662 W 2011-02-03 1996-07-31 +S000006038 ORF Verified YPL117C IDI1 isopentenyl-diphosphate delta-isomerase IDI1|LPH10|BOT2 chromosome 16 L000000851 16 328730 327864 C -69.8 2011-02-03 1996-07-31 Isopentenyl diphosphate:dimethylallyl diphosphate isomerase; catalyzes an essential activation step in the isoprenoid biosynthetic pathway; required for viability; isopentenyl diphosphate:dimethylallyl diphosphate isomerase is also known as IPP isomerase +S000034380 CDS YPL117C 16 328730 327864 C 2011-02-03 1996-07-31 +S000006037 ORF Verified YPL116W HOS3 histone deacetylase chromosome 16 L000004093 16 329606 331699 W 2011-02-03 1996-07-31 Trichostatin A-insensitive homodimeric histone deacetylase (HDAC); specificity in vitro for histones H3, H4, H2A, and H2B; similar to Hda1p, Rpd3p, Hos1p, and Hos2p; deletion results in increased histone acetylation at rDNA repeats +S000034349 CDS YPL116W 16 329606 331699 W 2011-02-03 1996-07-31 +S000130199 ARS ARS1617 chromosome 16 16 331699 332100 2011-02-03 2009-05-08 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000006036 ORF Verified YPL115C BEM3 chromosome 16 L000000169 16 335486 332100 C 2011-02-03 1996-07-31 Rho GTPase activating protein (RhoGAP); involved in control of the cytoskeleton organization; targets the essential Rho-GTPase Cdc42p, which controls establishment and maintenance of cell polarity, including bud-site assembly +S000034256 CDS YPL115C 16 335486 332100 C 2011-02-03 1996-07-31 +S000006035 ORF Dubious YPL114W chromosome 16 16 335948 336367 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; largely overlaps ORF YPL113C; diploid deletion in BY4743 strain background exhibits high budding index +S000034237 CDS YPL114W 16 335948 336367 W 2011-02-03 1996-07-31 +S000006034 ORF Verified YPL113C glyoxylate reductase chromosome 16 16 337143 335953 C 2011-02-03 1996-07-31 Glyoxylate reductase; acts on glyoxylate and hydroxypyruvate substrates; YPL113C is not an essential gene +S000032142 CDS YPL113C 16 337143 335953 C 2011-02-03 1996-07-31 +S000006033 ORF Verified YPL112C PEX25 chromosome 16 16 338620 337436 C 2011-02-03 1996-07-31 Peripheral peroxisomal membrane peroxin; required for the regulation of peroxisome size and maintenance, recruits GTPase Rho1p to peroxisomes, induced by oleate, interacts with Pex27p; PEX25 has a paralog, PEX27, that arose from the whole genome duplication +S000032062 CDS YPL112C 16 338620 337436 C 2011-02-03 1996-07-31 +S000006667 tRNA_gene tM(CAU)P IMT2 chromosome 16 L000003735 16 338919 338848 C 2011-02-03 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation +S000034575 noncoding_exon tM(CAU)P 16 338919 338848 C 2011-02-03 2000-05-19 +S000006032 ORF Verified YPL111W CAR1 arginase|cargA|LPH15 chromosome 16 L000000216 16 339944 340945 W -75 2011-02-03 1996-07-31 Arginase, catabolizes arginine to ornithine and urea; expression responds to both induction by arginine and nitrogen catabolite repression; disruption decreases production of carcinogen ethyl carbamate during wine fermentation and also enhances freeze tolerance +S000031989 CDS YPL111W 16 339944 340945 W 2011-02-03 1996-07-31 +S000006031 ORF Verified YPL110C GDE1 glycerophosphocholine phosphodiesterase chromosome 16 16 344739 341068 C 2011-02-03 1996-07-31 Glycerophosphocholine (GroPCho) phosphodiesterase; hydrolyzes GroPCho to choline and glycerolphosphate, for use as a phosphate source and as a precursor for phosphocholine synthesis; may interact with ribosomes +S000031745 CDS YPL110C 16 344739 341068 C 2011-02-03 1996-07-31 +S000006030 ORF Uncharacterized YPL109C chromosome 16 16 347389 345264 C 2011-02-03 2004-07-21|1996-07-31|2003-09-27 UbiB family protein; contains transmembrane domain and mitochondrial targeting sequence; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000032179 CDS YPL109C 16 345444 345264 C 2011-02-03 2003-09-27 +S000032178 CDS YPL109C 16 347389 345597 C 2011-02-03 2004-07-21|1996-07-31|2003-09-27 +S000032180 intron YPL109C 16 345596 345445 C 2011-02-03 2003-09-27 +S000006029 ORF Uncharacterized YPL108W chromosome 16 16 348446 348952 W 2011-02-03 1996-07-31 Cytoplasmic protein of unknown function; non-essential gene that is induced in a GDH1 deleted strain with altered redox metabolism; GFP-fusion protein is induced in response to the DNA-damaging agent MMS +S000032152 CDS YPL108W 16 348446 348952 W 2011-02-03 1996-07-31 +S000006028 ORF Uncharacterized YPL107W chromosome 16 16 349119 349865 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to mitochondria; YPL107W is not an essential gene +S000031186 CDS YPL107W 16 349119 349865 W 2011-02-03 1996-07-31 +S000006027 ORF Verified YPL106C SSE1 adenyl-nucleotide exchange factor SSE1|MSI3|LPG3 chromosome 16 L000002078 16 352275 350194 C 2011-02-03 1996-07-31 ATPase component of heat shock protein Hsp90 chaperone complex; serves as nucleotide exchange factor to load ATP onto the SSA class of cytosolic Hsp70s; plays a role in prion propagation and determining prion variants; binds unfolded proteins; member of Hsp110 subclass of HSP70 proteins; deletion results in spindle elongation in S phase; SSE1 has a paralog, SSE2, that arose from the whole genome duplication +S000031029 CDS YPL106C 16 352275 350194 C 2011-02-03 1996-07-31 +S000006026 ORF Verified YPL105C SYH1 MYR1 chromosome 16 16 355412 352863 C 2011-02-03 1996-07-31 Protein of unknown function that influences nuclear pore distribution; co-purifies with ribosomes; contains a GYF domain, which bind proline-rich sequences; deletion extends chronological lifespan; SYH1 has a paralog, SMY2, that arose from the whole genome duplication +S000030941 CDS YPL105C 16 355412 352863 C 2011-02-03 1996-07-31 +S000006025 ORF Verified YPL104W MSD1 aspartate--tRNA ligase MSD1|LPG5 chromosome 16 L000001186 16 355700 357676 W 2011-02-03 1996-07-31 Mitochondrial aspartyl-tRNA synthetase; required for acylation of aspartyl-tRNA; yeast and bacterial aspartyl-, asparaginyl-, and lysyl-tRNA synthetases contain regions with high sequence similarity, suggesting a common ancestral gene +S000030906 CDS YPL104W 16 355700 357676 W 2011-02-03 1996-07-31 +S000006024 ORF Verified YPL103C FMP30 N-acetylphosphatidylethanolamine-hydrolyzing phospholipase D chromosome 16 16 359406 358000 C 2011-02-03 1996-07-31 Protein with a role in maintaining mitochondrial morphology; also involved in maintaining normal cardiolipin levels; mitochondrial inner membrane protein; proposed to be involved in N-acylethanolamine metabolism; related to mammalian N-acylPE-specific phospholipase D +S000029844 CDS YPL103C 16 359406 358000 C 2011-02-03 1996-07-31 +S000006022 ORF Verified YPL101W ELP4 Elongator subunit ELP4|KTI9|TOT7|HAP1 chromosome 16 16 360209 361579 W 2011-02-03 1996-07-31 Subunit of hexameric RecA-like ATPase Elp456 Elongator subcomplex; which is required for modification of wobble nucleosides in tRNA; required for Elongator structural integrity; null mutation is functionally complemented by human ELP4 +S000037803 CDS YPL101W 16 360209 361579 W 2011-02-03 1996-07-31 +S000006023 ORF Dubious YPL102C chromosome 16 16 360305 360003 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion mutation enhances replication of Brome mosaic virus in S. cerevisiae, but this is likely due to effects on the overlapping gene ELP4 +S000037833 CDS YPL102C 16 360305 360003 C 2011-02-03 1996-07-31 +S000006021 ORF Verified YPL100W ATG21 HSV1|MAI1 chromosome 16 16 361872 363362 W 2011-02-03 1996-07-31 Phosphoinositide binding protein; required for vesicle formation in the cytoplasm-to-vacuole targeting (Cvt) pathway; binds both phosphatidylinositol (3,5)-bisphosphate and phosphatidylinositol 3-phosphate; WD-40 repeat protein +S000035919 CDS YPL100W 16 361872 363362 W 2011-02-03 1996-07-31 +S000006020 ORF Verified YPL099C INA17 AIM43|FMP14 chromosome 16 16 364068 363520 C 2011-02-03 1996-07-31 F1F0 ATPase synthase peripheral stalk assembly factor; subunit of the matrix-exposed inner mitochondrial membrane localized INA complex (Ina22p-Ina17p) involved in assembly of the F1F0 peripheral stalk; co-purifies with Ina22p and ATP synthase subunits; null mutant displays elevated frequency of mitochondrial genome loss and has a respiratory growth defect +S000037350 CDS YPL099C 16 364068 363520 C 2011-02-03 1996-07-31 +S000006019 ORF Verified YPL098C MGR2 chromosome 16 16 364727 364386 C 2011-02-03 1996-07-31 Subunit of the TIM23 translocase complex; acts to couple Tim21p with the core Tim23 translocase; provides quality control for insertion of membrane proteins by regulating their release into the inner membrane by the TIM23 complex; absolutely required for mitochondrial import of presequence-containing proteins at elevated temperature; required for viability of cells lacking the mitochondrial genome (petite-negative phenotype) +S000037279 CDS YPL098C 16 364727 364386 C 2011-02-03 1996-07-31 +S000006018 ORF Verified YPL097W MSY1 tyrosine--tRNA ligase MSY1 chromosome 16 L000002838 16 364952 366430 W 2011-02-03 1996-07-31 Mitochondrial tyrosyl-tRNA synthetase +S000037246 CDS YPL097W 16 364952 366430 W 2011-02-03 1996-07-31 +S000028423 ORF Verified YPL096C-A ERI1 RIN1 chromosome 16 S000028417 16 366735 366529 C 2011-02-03 2002-06-20 Endoplasmic reticulum membrane protein that binds and inhibits Ras2p; binds to and inhibits GTP-bound Ras2p at the endoplasmic reticulum (ER); component of the GPI-GnT complex which catalyzes the first step in GPI-anchor biosynthesis; probable homolog of mammalian PIG-Y protein +S000029959 CDS YPL096C-A 16 366735 366529 C 2011-02-03 2002-06-20 +S000006017 ORF Verified YPL096W PNG1 peptide-N4-(N-acetyl-beta-glucosaminyl)asparagine amidase chromosome 16 16 366927 368018 W 2011-02-03 1996-07-31 Conserved peptide N-glycanase; deglycosylating enzyme that cleaves N-glycans that are attached to misfolded ERAD substrate glycoproteins prior to proteasome-dependent degradation; localizes to the cytoplasm and nucleus; activity is enhanced by interaction with Rad23p; human ortholog NGLY1 is associated with a syndrome characterized by developmental delays, epilepsy, absence of tears and liver disease +S000037168 CDS YPL096W 16 366927 368018 W 2011-02-03 1996-07-31 +S000006016 ORF Verified YPL095C EEB1 medium-chain fatty acid ethyl ester synthase/esterase chromosome 16 16 369441 368071 C 2011-02-03 1996-07-31 Acyl-coenzymeA:ethanol O-acyltransferase; responsible for the major part of medium-chain fatty acid ethyl ester biosynthesis during fermentation; possesses short-chain esterase activity; may be involved in lipid metabolism and detoxification; EEB1 has a paralog, EHT1, that arose from the whole genome duplication +S000036441 CDS YPL095C 16 369441 368071 C 2011-02-03 1996-07-31 +S000006015 ORF Verified YPL094C SEC62 Sec63 complex subunit SEC62|LPG14 chromosome 16 L000001853 16 370663 369839 C 2011-02-03 2004-01-09|1996-07-31 Essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; cotranslationally N-acetylated by NatA; other members are Sec63p, Sec66p, and Sec72p +S000036372 CDS YPL094C 16 370663 369839 C 2011-02-03 2004-01-09|1996-07-31 +S000006014 ORF Verified YPL093W NOG1 putative GTPase NOG1 chromosome 16 16 370978 372921 W 2011-02-03 1996-07-31 Putative GTPase; associates with free 60S ribosomal subunits in the nucleolus and is required for 60S ribosomal subunit biogenesis; constituent of 66S pre-ribosomal particles; member of the ODN family of nucleolar G-proteins +S000036303 CDS YPL093W 16 370978 372921 W 2011-02-03 1996-07-31 +S000006013 ORF Verified YPL092W SSU1 LPG16 chromosome 16 L000002094 16 373793 375169 W 2011-02-03 1996-07-31 Plasma membrane sulfite pump involved in sulfite metabolism; required for efficient sulfite efflux; major facilitator superfamily protein +S000036190 CDS YPL092W 16 373793 375169 W 2011-02-03 1996-07-31 +S000006012 ORF Verified YPL091W GLR1 glutathione-disulfide reductase GLR1|LPG17 chromosome 16 L000000714 16 375502 376953 W 2011-02-03 1996-07-31 Cytosolic and mitochondrial glutathione oxidoreductase; converts oxidized glutathione to reduced glutathione; cytosolic Glr1p is the main determinant of the glutathione redox state of the mitochondrial intermembrane space; mitochondrial Glr1p has a role in resistance to hyperoxia; protein abundance increases in response to DNA replication stress +S000035283 CDS YPL091W 16 375502 376953 W 2011-02-03 1996-07-31 +S000006011 ORF Verified YPL090C RPS6A eS6|ribosomal 40S subunit protein S6A|S6e|rp9|YS4|S6A|S10A chromosome 16 L000004472 16 378395 377291 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S6, no bacterial homolog; phosphorylated on S233 by Ypk3p in a TORC1-dependent manner, and on S232 in a TORC1/2-dependent manner by Ypk1/2/3p; RPS6A has a paralog, RPS6B, that arose from the whole genome duplication +S000035035 CDS YPL090C 16 377995 377291 C 2011-02-03 1996-07-31 +S000035034 CDS YPL090C 16 378395 378390 C 2011-02-03 1996-07-31 +S000035036 intron YPL090C 16 378389 377996 C 2011-02-03 1996-07-31 +S000006010 ORF Verified YPL089C RLM1 chromosome 16 L000003028 16 381150 379120 C 2011-02-03 1996-07-31 MADS-box transcription factor; component of the protein kinase C-mediated MAP kinase pathway involved in the maintenance of cell integrity; phosphorylated and activated by the MAP-kinase Slt2p; RLM1 has a paralog, SMP1, that arose from the whole genome duplication +S000035262 CDS YPL089C 16 381150 379120 C 2011-02-03 1996-07-31 +S000006009 ORF Uncharacterized YPL088W aldo-keto reductase superfamily protein chromosome 16 16 381965 382993 W 2011-02-03 1996-07-31 Putative aryl alcohol dehydrogenase; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance +S000035218 CDS YPL088W 16 381965 382993 W 2011-02-03 1996-07-31 +S000006008 ORF Verified YPL087W YDC1 alkaline dihydroceramidase chromosome 16 16 383455 384408 W 2011-02-03 1996-07-31 Alkaline dihydroceramidase, involved in sphingolipid metabolism; preferentially hydrolyzes dihydroceramide to a free fatty acid and dihydrosphingosine; has a minor reverse activity; YDC1 has a paralog, YPC1, that arose from the whole genome duplication +S000035115 CDS YPL087W 16 383455 384408 W 2011-02-03 1996-07-31 +S000118415 ARS ARS1618 ARSXVI-385 chromosome 16 16 384542 384789 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178193 ARS_consensus_sequence ARS1618 16 384592 384608 W 2014-11-18 2014-11-18 +S000006007 ORF Verified YPL086C ELP3 Elongator subunit ELP3|KAT9|KTI8|TOT3|HPA1 chromosome 16 L000004378 16 386446 384773 C 2011-02-03 1996-07-31 Subunit of Elongator complex; Elongator is required for modification of wobble nucleosides in tRNA; exhibits histone acetyltransferase activity that is directed to histones H3 and H4; disruption confers resistance to K. lactis zymotoxin; human homolog ELP3 can partially complement yeast elp3 null mutant +S000034914 CDS YPL086C 16 386446 384773 C 2011-02-03 1996-07-31 +S000006006 ORF Verified YPL085W SEC16 LPF1 chromosome 16 L000003051 16 387067 393654 W 2011-02-03 1996-07-31 COPII vesicle coat protein required for ER transport vesicle budding; essential factor in endoplasmic reticulum exit site (ERES) formation, as well as in COPII-mediated ER-to-Golgi traffic; bound to periphery of ER membranes and may act to stabilize initial COPII complexes; interacts with Sec23p, Sec24p and Sec31p +S000034866 CDS YPL085W 16 387067 393654 W 2011-02-03 1996-07-31 +S000006005 ORF Verified YPL084W BRO1 NPI3|ASI6|VPS31|LPF2 chromosome 16 L000003061 16 394038 396572 W 2011-02-03 1996-07-31 Cytoplasmic class E vacuolar protein sorting (VPS) factor; coordinates deubiquitination in the multivesicular body (MVB) pathway by recruiting Doa4p to endosomes +S000032909 CDS YPL084W 16 394038 396572 W 2011-02-03 1996-07-31 +S000006004 ORF Verified YPL083C SEN54 tRNA splicing endonuclease subunit SEN54 chromosome 16 L000003974 16 398105 396702 C 2011-02-03 1996-07-31 Subunit of the tRNA splicing endonuclease; tRNA splicing endonuclease (Sen complex) is composed of Sen2p, Sen15p, Sen34p, and Sen54p; Sen complex also cleaves the CBP1 mRNA at the mitochondrial surface +S000032739 CDS YPL083C 16 398105 396702 C 2011-02-03 1996-07-31 +S000006003 ORF Verified YPL082C MOT1 DNA-binding ATPase|END10|BTAF1|LPF4|BUR3 chromosome 16 L000001136|L000004559|S000029158 16 404083 398480 C 2011-02-03 1996-07-31 Essential protein involved in regulation of transcription; removes Spt15p (TBP) from DNA via its C-terminal ATPase activity; may have a role in ensuring that soluble TBP is available to bind TATA-less promoters; forms a complex with TBP that binds TATA DNA with high affinity but with altered specificity; the Mot1p-Spt15p-DNA ternary complex contains unbent DNA; coregulates transcription with Spt16p through assembly of preinitiation complex and organization of nucleosomes +S000032674 CDS YPL082C 16 404083 398480 C 2011-02-03 1996-07-31 +S000006002 ORF Verified YPL081W RPS9A uS4|ribosomal 40S subunit protein S9A|rp21|YS11|S9A|S4|S13 chromosome 16 L000004474 16 404950 406044 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S9 and bacterial S4; RPS9A has a paralog, RPS9B, that arose from the whole genome duplication +S000032631 CDS YPL081W 16 404950 404956 W 2011-02-03 1996-07-31 +S000032632 CDS YPL081W 16 405458 406044 W 2011-02-03 1996-07-31 +S000032633 intron YPL081W 16 404957 405457 W 2011-02-03 1996-07-31 +S000006001 ORF Dubious YPL080C chromosome 16 16 406498 406172 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031568 CDS YPL080C 16 406498 406172 C 2011-02-03 1996-07-31 +S000006000 ORF Verified YPL079W RPL21B eL21|ribosomal 60S subunit protein L21B|L21e|L21B chromosome 16 L000004459 16 406636 407539 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L21B; homologous to mammalian ribosomal protein L21, no bacterial homolog; RPL21B has a paralog, RPL21A, that arose from the whole genome duplication +S000031935 CDS YPL079W 16 406636 406646 W 2011-02-03 1996-07-31 +S000031936 CDS YPL079W 16 407068 407539 W 2011-02-03 1996-07-31 +S000031937 intron YPL079W 16 406647 407067 W 2011-02-03 1996-07-31 +S000005999 ORF Verified YPL078C ATP4 F1F0 ATP synthase subunit 4|LPF7 chromosome 16 L000000144 16 408744 408010 C 2011-02-03 1996-07-31 Subunit b of the stator stalk of mitochondrial F1F0 ATP synthase; ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; contributes to the oligomerization of the complex, which in turn determines the shape of inner membrane cristae; phosphorylated +S000030814 CDS YPL078C 16 408744 408010 C 2011-02-03 1996-07-31 +S000005998 ORF Uncharacterized YPL077C chromosome 16 16 410090 409368 C 2011-02-03 1996-07-31 Putative protein of unknown function; regulates PIS1 expression; mutant displays spore wall assembly defect in ether sensitivity screen; YPL077C is not an essential gene; YPL077C has a paralog, YBR197C, that arose from the whole genome duplication +S000030729 CDS YPL077C 16 410090 409368 C 2011-02-03 1996-07-31 +S000005997 ORF Verified YPL076W GPI2 phosphatidylinositol N-acetylglucosaminyltransferase|GCR4 chromosome 16 L000002807 16 410443 411285 W 2011-02-03 1996-07-31 Protein involved in the synthesis of GlcNAc-PI; GlcNAc-PI is the first intermediate in the synthesis of glycosylphosphatidylinositol (GPI) anchors; homologous to the human PIG-C protein; GlcNAc-PI stands for N-acetylglucosaminyl phosphatidylinositol +S000030692 CDS YPL076W 16 410443 411285 W 2011-02-03 1996-07-31 +S000005996 ORF Verified YPL075W GCR1 transcription regulator GCR1|SIT3|LPF10 chromosome 16 L000000690|S000029447|L000001900 16 412254 415362 W 2011-02-03 1997-10-20|1996-07-31 Transcriptional activator of genes involved in glycolysis; DNA-binding protein that interacts and functions with the transcriptional activator Gcr2p +S000036778 CDS YPL075W 16 412254 412261 W 2011-02-03 1997-10-20|1996-07-31 +S000036779 CDS YPL075W 16 413013 415362 W 2011-02-03 1997-10-20 +S000036780 intron YPL075W 16 412262 413012 W 2011-02-03 1997-10-20 +S000005995 ORF Verified YPL074W YTA6 putative AAA family ATPase YTA6 chromosome 16 L000002560 16 415763 418027 W 2011-02-03 1996-07-31 Putative ATPase of the CDC48/PAS1/SEC18 (AAA) family; localized to the cortex of mother cells but not to daughter cells; relocalizes from cytoplasm to plasma membrane foci upon DNA replication stress +S000036699 CDS YPL074W 16 415763 418027 W 2011-02-03 1996-07-31 +S000118416 ARS ARS1619 ARSXVI-418 chromosome 16 16 418138 418364 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178194 ARS_consensus_sequence ARS1619 16 418178 418194 W 2014-11-18 2014-11-18 +S000005993 ORF Verified YPL072W UBP16 putative ubiquitin-specific protease UBP16 chromosome 16 L000004590 16 418512 420011 W 2011-02-03 1996-07-31 Deubiquitinating enzyme anchored to the outer mitochondrial membrane; probably not important for general mitochondrial functioning, but may perform a more specialized function at mitochondria +S000036526 CDS YPL072W 16 418512 420011 W 2011-02-03 1996-07-31 +S000005994 ORF Dubious YPL073C chromosome 16 16 418984 418499 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with verified gene UBP16/YPL072W; may interact with ribosome based on co-purification experiments +S000036568 CDS YPL073C 16 418984 418499 C 2011-02-03 1996-07-31 +S000005992 ORF Uncharacterized YPL071C chromosome 16 16 420518 420048 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000035569 CDS YPL071C 16 420518 420048 C 2011-02-03 1996-07-31 +S000005991 ORF Verified YPL070W MUK1 guanine nucleotide exchange factor MUK1 chromosome 16 16 420948 422786 W 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF); involved in vesicle-mediated vacuolar transport, including Golgi-endosome trafficking and sorting through the multivesicular body (MVB); specifically stimulates the intrinsic guanine nucleotide exchange activity of Rab family members (Vps21p/Ypt52p/Ypt53p); partially redundant with GEF VPS9; required for localization of the CORVET complex to endosomes; contains a VPS9 domain +S000035514 CDS YPL070W 16 420948 422786 W 2011-02-03 1996-07-31 +S000130200 ARS ARS1620 chromosome 16 16 422786 422885 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000005990 ORF Verified YPL069C BTS1 farnesyltranstransferase chromosome 16 L000003062 16 423892 422885 C 2011-02-03 1996-07-31 Geranylgeranyl diphosphate synthase (GGPS); increases the intracellular pool of geranylgeranyl diphosphate, suppressor of bet2 mutation that causes defective geranylgeranylation of small GTP-binding proteins that mediate vesicular traffic +S000035752 CDS YPL069C 16 423892 422885 C 2011-02-03 1996-07-31 +S000005989 ORF Uncharacterized YPL068C chromosome 16 16 425096 424215 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleus and is induced in response to the DNA-damaging agent MMS +S000035679 CDS YPL068C 16 425096 424215 C 2011-02-03 1996-07-31 +S000005988 ORF Uncharacterized YPL067C chromosome 16 16 425847 425251 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YPL067C is not an essential gene +S000034754 CDS YPL067C 16 425847 425251 C 2011-02-03 1996-07-31 +S000005987 ORF Verified YPL066W RGL1 chromosome 16 16 426233 427672 W 2011-02-03 1996-07-31 Regulator of Rho1p signaling, cofactor of Tus1p; required for the localization of Tus1p during all phases of cytokinesis; green fluorescent protein (GFP)-fusion protein localizes to the bud neck and cytoplasm; null mutant is viable and exhibits growth defect on a non-fermentable (respiratory) carbon source +S000034712 CDS YPL066W 16 426233 427672 W 2011-02-03 1996-07-31 +S000005986 ORF Verified YPL065W VPS28 ESCRT-I subunit protein VPS28|VPL13|VPT28 chromosome 16 L000003228 16 427927 428655 W 2011-02-03 1996-07-31 Component of the ESCRT-I complex; complex is involved in ubiquitin-dependent sorting of proteins into the endosome; conserved C-terminal domain interacts with ESCRT-III subunit Vps20p; other members include Stp22p, Srn2p, Vps28p, and Mvb12p +S000034662 CDS YPL065W 16 427927 428655 W 2011-02-03 1996-07-31 +S000005985 ORF Verified YPL064C CWC27 putative peptidylprolyl isomerase CWC27 chromosome 16 16 429616 428711 C 2011-02-03 1996-07-31 Component of a complex containing Cef1p; putatively involved in pre-mRNA splicing; has similarity to S. pombe Cwf27p; protein abundance increases in response to DNA replication stress +S000034538 CDS YPL064C 16 429616 428711 C 2011-02-03 1996-07-31 +S000005984 ORF Verified YPL063W TIM50 protein translocase subunit TIM50 chromosome 16 16 429939 431369 W 2011-02-03 1996-07-31 Essential component of the TIM23 complex; acts as receptor for the translocase of the inner mitochondrial membrane (TIM23) complex guiding incoming precursors from the TOM complex; may control the gating of the Tim23p-Tim17p channel +S000034464 CDS YPL063W 16 429939 431369 W 2011-02-03 1996-07-31 +S000005983 ORF Dubious YPL062W chromosome 16 16 431895 432299 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YPL062W is not an essential gene; homozygous diploid mutant shows a decrease in glycogen accumulation +S000032441 CDS YPL062W 16 431895 432299 W 2011-02-03 1996-07-31 +S000005982 ORF Verified YPL061W ALD6 aldehyde dehydrogenase (NADP(+)) ALD6|ALD1 chromosome 16 L000003206 16 432588 434090 W 2011-02-03 1996-07-31 Cytosolic aldehyde dehydrogenase; activated by Mg2+ and utilizes NADP+ as the preferred coenzyme; required for conversion of acetaldehyde to acetate; constitutively expressed; locates to the mitochondrial outer surface upon oxidative stress +S000032358 CDS YPL061W 16 432588 434090 W 2011-02-03 1996-07-31 +S000005981 ORF Verified YPL060W MFM1 LPE10 chromosome 16 16 434523 435764 W 2011-02-03 1996-07-31 Mitochondrial inner membrane magnesium transporter; involved in maintenance of mitochondrial magnesium concentrations and membrane potential; indirectly affects splicing of group II introns; functionally and structurally related to Mrs2p +S000032240 CDS YPL060W 16 434523 435764 W 2011-02-03 1996-07-31 +S000006528 tRNA_gene tC(GCA)P1 chromosome 16 L000003734 16 435964 435893 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis +S000037832 noncoding_exon tC(GCA)P1 16 435964 435893 C 2011-02-03 2000-05-19 +S000007196 long_terminal_repeat YPLWdelta9 chromosome 16 16 436068 436249 W 2011-02-03 2000-05-19 Ty1 LTR +S000007185 long_terminal_repeat YPLCdelta10 chromosome 16 16 436587 436250 C 2011-02-03 2000-05-19 Ty1 LTR +S000007197 long_terminal_repeat YPLWdelta11 chromosome 16 16 436594 436731 W 2011-02-03 2000-05-19 Ty1 LTR +S000007186 long_terminal_repeat YPLCtau1 chromosome 16 16 437260 436890 C 2011-02-03 2000-05-19 Ty4 LTR +S000007388 transposable_element_gene YPL060C-A chromosome 16 16 442742 437333 C 2015-01-13 1999-07-17|2014-11-18|2015-01-13 TyA Gag protein; the main structural constituent of virus-like particles (VLPs); Gag processing produces capsid proteins +S000178189 CDS YPL060C-A 16 439427 437333 C 2015-01-13 2014-11-18|2015-01-13 +S000036843 CDS YPL060C-A 16 442742 439429 C 2015-01-13 1999-07-17|2015-01-13 +S000178188 plus_1_translational_frameshift YPL060C-A 16 439428 439428 C 2015-01-13 2014-11-18|2015-01-13 +S000007188 LTR_retrotransposon YPLCTy4-1 Ty4 chromosome 16 16 443112 436890 C 2011-02-03 2000-05-19 Ty4 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007187 long_terminal_repeat YPLCtau2 chromosome 16 16 443112 442742 C 2011-02-03 2000-05-19 Ty4 LTR +S000005980 ORF Verified YPL059W GRX5 monothiol glutaredoxin GRX5 chromosome 16 S000007446 16 444579 445031 W 2011-02-03 1996-07-31 Glutathione-dependent oxidoreductase; mitochondrial matrix protein involved at an early step in the biogenesis of iron-sulfur centers along with Bol1p; hydroperoxide and superoxide-radical responsive; monothiol glutaredoxin subfamily member along with Grx3p and Grx4p +S000031521 CDS YPL059W 16 444579 445031 W 2011-02-03 1996-07-31 +S000005979 ORF Verified YPL058C PDR12 ATP-binding cassette multidrug transporter PDR12 chromosome 16 L000003205 16 450377 445842 C 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; weak-acid-inducible multidrug transporter required for weak organic acid resistance; induced by sorbate and benzoate and regulated by War1p; mutants exhibit sorbate hypersensitivity +S000031386 CDS YPL058C 16 450377 445842 C 2011-02-03 1996-07-31 +S000005978 ORF Verified YPL057C SUR1 mannosylinositol phosphorylceramide synthase catalytic subunit SUR1|LPE15|CSG1|BCL21 chromosome 16 L000002243 16 453057 451909 C 2011-02-03 1996-07-31 Mannosylinositol phosphorylceramide (MIPC) synthase catalytic subunit; forms a complex with regulatory subunit Csg2p; function in sphingolipid biosynthesis is overlapping with that of Csh1p; SUR1 has a paralog, CSH1, that arose from the whole genome duplication +S000031334 CDS YPL057C 16 453057 451909 C 2011-02-03 1996-07-31 +S000005977 ORF Uncharacterized YPL056C LCL1 chromosome 16 16 453735 453430 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant is fluconazole resistant and has long chronological lifespan +S000030453 CDS YPL056C 16 453735 453430 C 2011-02-03 1996-07-31 +S000005976 ORF Verified YPL055C LGE1 chromosome 16 16 454990 453992 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant forms abnormally large cells, and homozygous diploid null mutant displays delayed premeiotic DNA synthesis and reduced efficiency of meiotic nuclear division +S000030299 CDS YPL055C 16 454990 453992 C 2011-02-03 1996-07-31 +S000005975 ORF Verified YPL054W LEE1 chromosome 16 L000002859 16 455759 456664 W 2011-02-03 1996-07-31 Zinc-finger protein of unknown function +S000030275 CDS YPL054W 16 455759 456664 W 2011-02-03 1996-07-31 +S000119038 ARS ARS1633 ARSXVI-457|ARS1620.5 chromosome 16 16 456563 456810 2011-02-03 2006-10-04 Autonomously Replicating Sequence +S000005974 ORF Verified YPL053C KTR6 putative mannosyltransferase|MNN6 chromosome 16 L000003131 16 458458 457118 C 2011-02-03 1996-07-31 Probable mannosylphosphate transferase; involved in the synthesis of core oligosaccharides in protein glycosylation pathway; member of the KRE2/MNT1 mannosyltransferase family; KTR6 has a paralog, KRE2, that arose from the whole genome duplication +S000036430 CDS YPL053C 16 458458 457118 C 2011-02-03 1996-07-31 +S000005973 ORF Verified YPL052W OAZ1 YPL052W-A chromosome 16 16 458799 459678 W 2011-02-03 1996-07-31|2005-12-14 Regulator of ornithine decarboxylase Spe1p; antizyme that binds to Spe1p to stimulate ubiquitin-independent degradation by the proteasome; binding of polyamines to nascent Oaz1p during translation stimulates +1 ribosomal frameshifting, allowing translation of full-length Oaz1p +S000036401 CDS YPL052W 16 458799 459005 W 2011-02-03 1996-07-31|2005-12-14 +S000113788 CDS YPL052W 16 459007 459678 W 2011-02-03 2005-12-14 +S000113787 plus_1_translational_frameshift YPL052W 16 459006 459006 W 2011-02-03 2005-12-14 +S000005972 ORF Verified YPL051W ARL3 Arf family GTPase ARL3 chromosome 16 L000004809 16 459963 460559 W 2011-02-03 1996-07-31 ARF-like small GTPase of the RAS superfamily; required for recruitment of Arl1p, a GTPase that regulates membrane traffic, to the Golgi apparatus; NatC-catalyzed N-terminal acetylation regulates Golgi membrane association mediated by interaction with membrane receptor, Sys1p; similar to ADP-ribosylation factor and orthologous to mammalian ARFRP1 +S000036285 CDS YPL051W 16 459963 460559 W 2011-02-03 1996-07-31 +S000005971 ORF Verified YPL050C MNN9 mannosyltransferase complex subunit MNN9 chromosome 16 L000001129 16 461966 460779 C 2011-02-03 1996-07-31 Subunit of Golgi mannosyltransferase complex; this complex mediates elongation of the polysaccharide mannan backbone; forms a separate complex with Van1p that is also involved in backbone elongation; this complex also contains Anp1p, Mnn10p, Mnn11p, and Hoc1p +S000036103 CDS YPL050C 16 461966 460779 C 2011-02-03 1996-07-31 +S000005970 ORF Verified YPL049C DIG1 RST1 chromosome 16 L000003122 16 463839 462481 C 2011-02-03 1996-07-31 MAP kinase-responsive inhibitor of the Ste12p transcription factor; involved in the regulation of mating-specific genes and the invasive growth pathway; related regulators Dig1p and Dig2p bind to Ste12p; DIG1 has a paralog, DIG2, that arose from the whole genome duplication +S000036451 CDS YPL049C 16 463839 462481 C 2011-02-03 1996-07-31 +S000005969 ORF Verified YPL048W CAM1 translation elongation factor EF1B gamma|CPBP|TEF3 chromosome 16 L000000212|L000002279 16 464401 465648 W -27.3 2011-02-03 1996-07-31 One of two isoforms of the gamma subunit of eEF1B; stimulates the release of GDP from eEF1A (Tef1p/Tef2p) post association with the ribosomal complex with eEF1Balpha subunit; nuclear protein required for transcription of MXR1; binds the MXR1 promoter in the presence of other nuclear factors; binds calcium and phospholipids +S000035577 CDS YPL048W 16 464401 465648 W 2011-02-03 1996-07-31 +S000005968 ORF Verified YPL047W SGF11 SAGA histone acetyltransferase complex subunit SGF11 chromosome 16 16 465962 466261 W 2011-02-03 1996-07-31 Integral subunit of SAGA histone acetyltransferase complex; regulates transcription of a subset of SAGA-regulated genes, required for the Ubp8p association with SAGA and for H2B deubiquitylation +S000035515 CDS YPL047W 16 465962 466261 W 2011-02-03 1996-07-31 +S000005967 ORF Verified YPL046C ELC1 elongin C chromosome 16 L000004351 16 466943 466644 C 2011-02-03 1996-07-31 Elongin C, conserved among eukaryotes; forms a complex with Cul3p that polyubiquitylates monoubiquitylated RNA polymerase II to trigger its proteolysis; plays a role in global genomic repair +S000035426 CDS YPL046C 16 466943 466644 C 2011-02-03 1996-07-31 +S000005966 ORF Verified YPL045W VPS16 tethering complex subunit VPS16|CVT15|VPT16|VAM9|SVL6 chromosome 16 L000002471|L000003119|L000004766|S000029128 16 467260 469656 W 2011-02-03 1996-07-31 Subunit of the HOPS and the CORVET complexes; part of the Class C Vps complex essential for membrane docking and fusion at Golgi-to-endosome and endosome-to-vacuole protein transport stages +S000035390 CDS YPL045W 16 467260 469656 W 2011-02-03 1996-07-31 +S000005964 ORF Verified YPL043W NOP4 mRNA-binding ribosome biosynthesis protein NOP4|NOP77 chromosome 16 L000001262|L000001263 16 469939 471996 W 2011-02-03 1996-07-31 Nucleolar protein; essential for processing and maturation of 27S pre-rRNA and large ribosomal subunit biogenesis; constituent of 66S pre-ribosomal particles; contains four RNA recognition motifs (RRMs) +S000034348 CDS YPL043W 16 469939 471996 W 2011-02-03 1996-07-31 +S000005965 ORF Dubious YPL044C chromosome 16 16 470474 469926 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene NOP4/YPL043W +S000034376 CDS YPL044C 16 470474 469926 C 2011-02-03 1996-07-31 +S000005963 ORF Verified YPL042C SSN3 cyclin-dependent serine/threonine protein kinase SSN3|URR1|SSX7|CDK8|RYE5|UME5|SRB10|NUT7|GIG2 chromosome 16 L000002795|S000029631|L000002443|S000029520|L000002103 16 474707 473040 C 2011-02-03 1996-07-31 Cyclin-dependent protein kinase; component of RNA polymerase II holoenzyme; involved in phosphorylation of the RNA polymerase II C-terminal domain; involved in glucose repression +S000034254 CDS YPL042C 16 474707 473040 C 2011-02-03 1996-07-31 +S000005962 ORF Uncharacterized YPL041C MRX11 chromosome 16 16 475741 475118 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; SWAT-GFP and mCherry fusion proteins localize to the mitochondria; involved in maintenance of telomere length +S000034145 CDS YPL041C 16 475741 475118 C 2011-02-03 1996-07-31 +S000005961 ORF Verified YPL040C ISM1 isoleucine--tRNA ligase ISM1 chromosome 16 L000002648 16 479001 475993 C 2011-02-03 1996-07-31 Mitochondrial isoleucyl-tRNA synthetase; null mutant is deficient in respiratory growth; human homolog IARS2 implicated in mitochondrial diseases, can partially complement yeast null mutant +S000032140 CDS YPL040C 16 479001 475993 C 2011-02-03 1996-07-31 +S000005960 ORF Uncharacterized YPL039W chromosome 16 16 479225 480175 W 2011-02-03 1996-07-31 Putative protein of unknown function; YPL039W is not an essential gene +S000033263 CDS YPL039W 16 479225 480175 W 2011-02-03 1996-07-31 +S000028588 ORF Uncharacterized YPL038W-A chromosome 16 16 480182 480373 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031340 CDS YPL038W-A 16 480182 480373 W 2011-02-03 2003-07-29 +S000005959 ORF Verified YPL038W MET31 chromosome 16 L000003469 16 480535 481068 W 2011-02-03 1996-07-31 Zinc-finger DNA-binding transcription factor; targets strong transcriptional activator Met4p to promoters of sulfur metabolic genes; involved in transcriptional regulation of the methionine biosynthetic genes; feedforward loop controlling expression of MET32 and the lack of such a loop for MET31 may account for the differential actions of Met31p and Met32p; MET31 has a paralog, MET32, that arose from the whole genome duplication +S000032414 CDS YPL038W 16 480535 481068 W 2011-02-03 1996-07-31 +S000005958 ORF Verified YPL037C EGD1 chromosome 16 L000000545 16 481901 481428 C 2011-02-03 1996-07-31 Subunit beta1 of the nascent polypeptide-associated complex (NAC); involved in protein targeting, associated with cytoplasmic ribosomes; enhances DNA binding of the Gal4p activator; homolog of human BTF3b; EGD1 has a paralog, BTT1, that arose from the whole genome duplication +S000032253 CDS YPL037C 16 481901 481428 C 2011-02-03 1996-07-31 +S000005957 ORF Verified YPL036W PMA2 H(+)-exporting P2-type ATPase PMA2 chromosome 16 L000001450 16 482843 485686 W 2011-02-03 1996-07-31 Plasma membrane H+-ATPase; isoform of Pma1p, involved in pumping protons out of the cell; regulator of cytoplasmic pH and plasma membrane potential +S000032226 CDS YPL036W 16 482843 485686 W 2011-02-03 1996-07-31 +S000005955 ORF Uncharacterized YPL034W chromosome 16 16 486712 487209 W 2011-02-03 1996-07-31 Putative protein of unknown function; YPL034W is not essential gene +S000031184 CDS YPL034W 16 486712 487209 W 2011-02-03 1996-07-31 +S000005956 ORF Dubious YPL035C chromosome 16 16 486911 486564 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YPL034W; YPL035C is not an essential gene +S000031189 CDS YPL035C 16 486911 486564 C 2011-02-03 1996-07-31 +S000005954 ORF Verified YPL033C SRL4 chromosome 16 16 488207 487362 C 2011-02-03 1996-07-31 Protein of unknown function; involved in regulation of dNTP production; null mutant suppresses the lethality of lcd1 and rad53 mutations; expression is induced by Kar4p +S000031014 CDS YPL033C 16 488207 487362 C 2011-02-03 1996-07-31 +S000005953 ORF Verified YPL032C SVL3 chromosome 16 L000004235 16 491364 488887 C 2011-02-03 1996-07-31 Protein of unknown function; mutant phenotype suggests a potential role in vacuolar function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery, cytoplasm, bud, and bud neck; relocalizes from bud neck to cytoplasm upon DNA replication stress; SVL3 has a paralog, PAM1, that arose from the whole genome duplication +S000030938 CDS YPL032C 16 491364 488887 C 2011-02-03 1996-07-31 +S000005952 ORF Verified YPL031C PHO85 cyclin-dependent serine/threonine-protein kinase PHO85|phoU|LDB15 chromosome 16 L000001431 16 493037 492018 C -34 2011-02-03 1996-07-31 Cyclin-dependent kinase; has ten cyclin partners; involved in regulating the cellular response to nutrient levels and environmental conditions and progression through the cell cycle; human lissencephaly-associated homolog CDK5 functionally complements null mutation +S000029949 CDS YPL031C 16 492918 492018 C 2011-02-03 1996-07-31 +S000029948 CDS YPL031C 16 493037 493021 C 2011-02-03 1996-07-31 +S000029950 intron YPL031C 16 493020 492919 C 2011-02-03 1996-07-31 +S000005951 ORF Verified YPL030W TRM44 tRNA (uracil) methyltransferase chromosome 16 16 493543 495246 W 2011-02-03 1996-07-31 tRNA(Ser) Um(44) 2'-O-methyltransferase; involved in maintaining levels of the tRNA-Ser species tS(CGA) and tS(UGA); conserved among metazoans and fungi but there does not appear to be a homolog in plants; TRM44 is a non-essential gene +S000029895 CDS YPL030W 16 493543 495246 W 2011-02-03 1996-07-31 +S000005950 ORF Verified YPL029W SUV3 ATP-dependent RNA helicase SUV3|LPB2 chromosome 16 L000002247 16 495506 497719 W 2011-02-03 1996-07-31 ATP-dependent RNA helicase; component of the mitochondrial degradosome along with the RNase Dss1p; the degradosome associates with the ribosome and mediates RNA turnover; also required during splicing of the COX1 AI5_beta intron; expression of a processed form of human homolog SUPV3L1 carrying an N-terminal deletion of 46 amino acids rescues yeast suv3 null mutant +S000037169 CDS YPL029W 16 495506 497719 W 2011-02-03 1996-07-31 +S000005949 ORF Verified YPL028W ERG10 acetyl-CoA C-acetyltransferase|TSM0115|LPB3 chromosome 16 L000000576 16 498096 499292 W -22 2011-02-03 1996-07-31 Acetyl-CoA C-acetyltransferase (acetoacetyl-CoA thiolase); cytosolic enzyme that transfers an acetyl group from one acetyl-CoA molecule to another, forming acetoacetyl-CoA; involved in the first step in mevalonate biosynthesis; human ACAT1 functionally complements the growth defect caused by repression of ERG10 expression +S000037054 CDS YPL028W 16 498096 499292 W 2011-02-03 1996-07-31 +S000005948 ORF Verified YPL027W SMA1 chromosome 16 16 499665 500402 W 2011-02-03 1996-07-31 Protein of unknown function involved in prospore membrane assembly; involved in the assembly of the prospore membrane during sporulation; interacts with Spo14p +S000036999 CDS YPL027W 16 499665 500402 W 2011-02-03 1996-07-31 +S000005947 ORF Verified YPL026C SKS1 putative serine/threonine protein kinase SKS1|SHA3 chromosome 16 L000004139|L000002824 16 502183 500675 C 2011-02-03 1996-07-31 Putative serine/threonine protein kinase; involved in the adaptation to low concentrations of glucose independent of the SNF3 regulated pathway; SKS1 has a paralog, VHS1, that arose from the whole genome duplication +S000036265 CDS YPL026C 16 502183 500675 C 2011-02-03 1996-07-31 +S000005946 ORF Dubious YPL025C chromosome 16 16 503030 502473 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036171 CDS YPL025C 16 503030 502473 C 2011-02-03 1996-07-31 +S000005945 ORF Verified YPL024W RMI1 NCE4 chromosome 16 L000004399 16 503517 504242 W 2011-02-03 1996-07-31 Subunit of the RecQ (Sgs1p) - Topo III (Top3p) complex; stimulates superhelical relaxing, DNA catenation/decatenation and ssDNA binding activities of Top3p; involved in response to DNA damage; functions in S phase-mediated cohesion establishment via a pathway involving the Ctf18-RFC complex and Mrc1p; stimulates Top3p DNA catenation/decatenation activity; null mutants display increased rates of recombination and delayed S phase +S000036120 CDS YPL024W 16 503517 504242 W 2011-02-03 1996-07-31 +S000005944 ORF Verified YPL023C MET12 methylenetetrahydrofolate reductase (NAD(P)H) MET12 chromosome 16 L000003571 16 506312 504339 C 2011-02-03 1996-07-31 Protein with MTHFR activity in vitro; null mutant has no phenotype and is prototrophic for methionine; MET13 encodes major isozyme of methylenetetrahydrofolate reductase (MTHFR) +S000035195 CDS YPL023C 16 506312 504339 C 2011-02-03 1996-07-31 +S000005943 ORF Verified YPL022W RAD1 RAD12|ssDNA endodeoxyribonuclease RAD1|LPB9 chromosome 16 L000001555 16 506697 509999 W -18 2011-02-03 1996-07-31 Single-stranded DNA endonuclease (with Rad10p); cleaves single-stranded DNA during nucleotide excision repair and double-strand break repair; subunit of Nucleotide Excision Repair Factor 1 (NEF1); homolog of human XPF protein +S000035144 CDS YPL022W 16 506697 509999 W 2011-02-03 1996-07-31 +S000005942 ORF Verified YPL021W ECM23 SRD2 chromosome 16 L000003366 16 511101 511664 W 2011-02-03 1996-07-31 Non-essential protein of unconfirmed function; affects pre-rRNA processing, may act as a negative regulator of the transcription of genes involved in pseudohyphal growth; homologous to Srd1p +S000035028 CDS YPL021W 16 511101 511664 W 2011-02-03 1996-07-31 +S000118417 ARS ARS1621 ARSXVI-512 chromosome 16 16 511636 511793 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178195 ARS_consensus_sequence ARS1621 16 511704 511720 W 2014-11-18 2014-11-18 +S000005941 ORF Verified YPL020C ULP1 SUMO protease ULP1|NIB1 chromosome 16 S000029323|L000001249 16 514178 512313 C 2011-02-03 1996-07-31 Protease that specifically cleaves Smt3p protein conjugates; required for cell cycle progression; associates with nucleoporins and may interact with septin rings during telophase; sequestered to the nucleolus under stress conditions +S000034812 CDS YPL020C 16 514178 512313 C 2011-02-03 1996-07-31 +S000005940 ORF Verified YPL019C VTC3 vacuolar transporter chaperone|PHM2 chromosome 16 S000007512 16 517018 514511 C 2011-02-03 1996-07-31 Regulatory subunit of the vacuolar transporter chaperone (VTC) complex; involved in membrane trafficking, vacuolar polyphosphate accumulation, microautophagy and non-autophagic vacuolar fusion; VTC3 has a paralog, VTC2, that arose from the whole genome duplication +S000032833 CDS YPL019C 16 517018 514511 C 2011-02-03 1996-07-31 +S000005939 ORF Verified YPL018W CTF19 MCM18 chromosome 16 L000003420 16 517651 518760 W 2011-02-03 1996-07-31 Outer kinetochore protein, needed for accurate chromosome segregation; component of kinetochore sub-complex COMA (Ctf19p, Okp1p, Mcm21p, Ame1p) that functions as platform for kinetochore assembly; required for spindle assembly checkpoint; minimizes potentially deleterious centromere-proximal crossovers by preventing meiotic DNA break formation proximal to centromere; homolog of human centromere constitutive-associated network (CCAN) subunit CENP-P and fission yeast fta2 +S000031967 CDS YPL018W 16 517651 518760 W 2011-02-03 1996-07-31 +S000005938 ORF Verified YPL017C IRC15 chromosome 16 16 520233 518734 C 2011-02-03 1996-07-31 Microtubule associated protein; regulates microtubule dynamics; required for accurate meiotic chromosome segregation; null mutant displays large budded cells due to delayed mitotic progression, increased levels of spontaneous Rad52 foci; IRC15 has a paralog, LPD1, that arose from the whole genome duplication +S000031777 CDS YPL017C 16 520233 518734 C 2011-02-03 1996-07-31 +S000005937 ORF Verified YPL016W SWI1 [SWI(+)]|[SWI+]|LPA1|GAM3|ADR6 chromosome 16 L000000052|L000002250 16 521014 524958 W 2011-02-03 1996-07-31|2011-02-03 Subunit of the SWI/SNF chromatin remodeling complex; regulates transcription by remodeling chromatin; required for transcription of many genes, including ADH1, ADH2, GAL1, HO, INO1 and SUC2; self-assembles to form [SWI+] prion and to alter expression pattern; human homolog ARID1A is a candidate tumor suppressor gene in breast cancer +S000031725 CDS YPL016W 16 521014 524958 W 2011-02-03 1996-07-31|2011-02-03 +S000005936 ORF Verified YPL015C HST2 histone deacetylase HST2 chromosome 16 L000003041 16 526883 525810 C 2011-02-03 1996-07-31 Cytoplasmic NAD(+)-dependent protein deacetylase; deacetylation targets are primarily cytoplasmic proteins; member of the silencing information regulator 2 (Sir2) family of NAD(+)-dependent protein deacetylases; modulates nucleolar (rDNA) and telomeric silencing; possesses NAD(+)-dependent histone deacetylase activity in vitro; contains a nuclear export signal (NES); function regulated by its nuclear export +S000031593 CDS YPL015C 16 526883 525810 C 2011-02-03 1996-07-31 +S000005935 ORF Verified YPL014W CIP1 chromosome 16 16 527547 528692 W 2011-02-03 1996-07-31 Cyclin-dependent kinase inhibitor; interacts with and inhibits the Cdc28p/Cln2p, G1/S phase cyclin-dependent kinase complex but not S-phase, or M-phase complexes; overexpression blocks cells in G1 phase and stabilizes the Cdc28p inhibitor Sic1p, while disruption accelerates the G1/S phase transition; phosphorylated during S phase in a Cdc28p-dependent manner; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to the nucleus +S000031551 CDS YPL014W 16 527547 528692 W 2011-02-03 1996-07-31 +S000005934 ORF Verified YPL013C MRPS16 mitochondrial 37S ribosomal protein MRPS16 chromosome 16 16 529350 528985 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000030647 CDS YPL013C 16 529350 528985 C 2011-02-03 1996-07-31 +S000005933 ORF Verified YPL012W RRP12 mRNA-binding protein RRP12 chromosome 16 16 529723 533409 W 2011-02-03 1996-07-31 Protein required for export of the ribosomal subunits; associates with the RNA components of the pre-ribosomes; has a role in nuclear import in association with Pse1p; also plays a role in the cell cycle and the DNA damage response; contains HEAT-repeats +S000030606 CDS YPL012W 16 529723 533409 W 2011-02-03 1996-07-31 +S000005932 ORF Verified YPL011C TAF3 TafII47|TAF47 chromosome 16 L000004154 16 534703 533642 C 2011-02-03 1996-07-31 TFIID subunit (47 kDa); involved in promoter binding and RNA polymerase II transcription initiation +S000030495 CDS YPL011C 16 534703 533642 C 2011-02-03 1996-07-31 +S000005931 ORF Verified YPL010W RET3 coatomer subunit zeta chromosome 16 L000004128 16 535018 535587 W 2011-02-03 1996-07-31 Zeta subunit of the coatomer complex (COPI); COPI coats Golgi-derived transport vesicles; involved in retrograde transport between Golgi and ER +S000030459 CDS YPL010W 16 535018 535587 W 2011-02-03 1996-07-31 +S000005930 ORF Verified YPL009C RQC2 TAE2 chromosome 16 16 538936 535820 C 2011-02-03 1996-07-31 Component of RQC, which mediates nascent chain degradation; RQC (ribosome quality control complex) is a ribosome-bound complex required for degradation of polypeptides arising from stalled translation; recruits alanine- and threonine-charged tRNA to the A site and directs the elongation of nascent chains independently of mRNA or 40S subunits; monitors translation stress and signals this to Hsf1p +S000037295 CDS YPL009C 16 538936 535820 C 2011-02-03 1996-07-31 +S000005929 ORF Verified YPL008W CHL1 MCM12|LPA9|CTF1 chromosome 16 L000000318 16 539385 541970 W -6 2011-02-03 1996-07-31 Probable DNA helicase; involved in sister-chromatid cohesion and genome integrity and interstrand cross-link repair; interacts with ECO1 and CTF18; mutants are defective in silencing, rDNA recombination, aging and the heat shock response; FANCJ-like helicase family member; mutations in the human homolog, DDX11/ChLR1, cause Warsaw breakage syndrome +S000037256 CDS YPL008W 16 539385 541970 W 2011-02-03 1996-07-31 +S000005928 ORF Verified YPL007C TFC8 transcription factor TFIIIC subunit TFC8|tau 60 chromosome 16 16 543848 542082 C 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of RNA polymerase III transcription initiation factor complex (TFIIIC); part of TFIIIC TauB domain that binds BoxB promoter sites of tRNA and other genes; linker between TauB and TauA domains; human homolog is TFIIIC-90 +S000036517 CDS YPL007C 16 543848 542082 C 2011-02-03 1996-07-31 +S000005927 ORF Verified YPL006W NCR1 sphingolipid transporter chromosome 16 L000003596 16 544631 548143 W 2011-02-03 1996-07-31 Vacuolar membrane protein; transits through the biosynthetic vacuolar protein sorting pathway, involved in sphingolipid metabolism; cells lacking Ncr1p exhibit high levels of long chain bases (LCB), similar to the accumulation of high amounts of lipids observed in patients with Neimann-Pick C, a disease caused by loss-of-function mutations in NPC1, the functional ortholog of Ncr1p +S000036461 CDS YPL006W 16 544631 548143 W 2011-02-03 1996-07-31 +S000005926 ORF Verified YPL005W AEP3 chromosome 16 16 548486 550306 W 2011-02-03 1996-07-31 Peripheral mitochondrial inner membrane protein; may facilitate use of unformylated tRNA-Met in mitochondrial translation initiation; stabilizes the bicistronic AAP1-ATP6 mRNA +S000036393 CDS YPL005W 16 548486 550306 W 2011-02-03 1996-07-31 +S000005925 ORF Verified YPL004C LSP1 lipid-binding protein LSP1 chromosome 16 16 551657 550632 C 2011-02-03 1996-07-31 Eisosome core component; eisosomes are large immobile patch structures at the cell cortex associated with endocytosis; phosphorylated on Thr233 upon Pkc1p hyperactivation in a Slt2p MAPK-dependent fashion; null mutants show activation of Pkc1p/Ypk1p stress resistance pathways; member of the BAR domain family +S000035436 CDS YPL004C 16 551657 550632 C 2011-02-03 1996-07-31 +S000005924 ORF Verified YPL003W ULA1 ENR2 chromosome 16 L000004374 16 552020 553408 W 2011-02-03 1996-07-31 Protein that activates Rub1p (NEDD8) before neddylation; acts together with Uba3p; may play a role in protein degradation +S000035402 CDS YPL003W 16 552020 553408 W 2011-02-03 1996-07-31 +S000005923 ORF Verified YPL002C SNF8 ESCRT-II subunit protein SNF8|VPL14|VPS22 chromosome 16 L000001951 16 554328 553627 C 2011-02-03 1996-07-31 Component of the ESCRT-II complex; ESCRT-II is involved in ubiquitin-dependent sorting of proteins into the endosome; appears to be functionally related to SNF7; involved in glucose derepression +S000035294 CDS YPL002C 16 554328 553627 C 2011-02-03 1996-07-31 +S000005922 ORF Verified YPL001W HAT1 histone acetyltransferase catalytic subunit HAT1|KAT1 chromosome 16 L000003002 16 554605 555729 W 2011-02-03 1996-07-31 Catalytic subunit of the Hat1p-Hat2p histone acetyltransferase complex; uses the cofactor acetyl coenzyme A to acetylate free nuclear and cytoplasmic histone H4; involved in telomeric silencing and DNA double-strand break repair +S000035246 CDS YPL001W 16 554605 555729 W 2011-02-03 1996-07-31 +S000006477 centromere CEN16 CEN16 chromosome 16 L000000309 16 555957 556073 W 0 2011-02-03 2000-05-19|2006-05-09 Chromosome XVI centromere +S000077281 centromere_DNA_Element_I CEN16 16 555957 555966 W 2011-02-03 2004-10-05 +S000077282 centromere_DNA_Element_II CEN16 16 555967 556048 W 2011-02-03 2004-10-05 +S000077283 centromere_DNA_Element_III CEN16 16 556049 556073 W 2011-02-03 2004-10-05 +S000006205 ORF Verified YPR001W CIT3 citrate (Si)-synthase CIT3 chromosome 16 L000002855 16 556377 557837 W 2011-02-03 1996-07-31 Dual specificity mitochondrial citrate and methylcitrate synthase; catalyzes the condensation of acetyl-CoA and oxaloacetate to form citrate and that of propionyl-CoA and oxaloacetate to form 2-methylcitrate +S000030627 CDS YPR001W 16 556377 557837 W 2011-02-03 1996-07-31 +S000006206 ORF Verified YPR002W PDH1 putative 2-methylcitrate dehydratase chromosome 16 16 558385 559935 W 2011-02-03 1996-07-31 Putative 2-methylcitrate dehydratase; mitochondrial protein that participates in respiration; induced by diauxic shift; homologous to E. coli PrpD, may take part in the conversion of 2-methylcitrate to 2-methylisocitrate +S000030711 CDS YPR002W 16 558385 559935 W 2011-02-03 1996-07-31 +S000006570 tRNA_gene tF(GAA)P1 chromosome 16 L000003733 16 560289 560198 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035230 intron tF(GAA)P1 16 560252 560234 C 2011-02-03 2000-05-19 +S000035229 noncoding_exon tF(GAA)P1 16 560233 560198 C 2011-02-03 2000-05-19 +S000035228 noncoding_exon tF(GAA)P1 16 560289 560253 C 2011-02-03 2000-05-19 +S000007210 long_terminal_repeat YPRWdelta12 chromosome 16 16 560481 560812 W 2011-02-03 2000-05-19 Ty1 LTR +S000007254 ORF Dubious YPR002C-A chromosome 16 16 560766 560569 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the Ty1 long terminal repeat, YPRWdelta12 +S000031182 CDS YPR002C-A 16 560766 560569 C 2011-02-03 1999-07-17 +S000006207 ORF Uncharacterized YPR003C chromosome 16 16 563768 561504 C 2011-02-03 1996-07-31 Putative sulfate permease; physically interacts with Hsp82p; green fluorescent protein (GFP)-fusion protein localizes to the ER; YPR003C is not an essential gene +S000031534 CDS YPR003C 16 563768 561504 C 2011-02-03 1996-07-31 +S000118418 ARS ARS1622 ARSXVI-564 chromosome 16 16 563852 563967 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178196 ARS_consensus_sequence ARS1622 16 563877 563893 W 2014-11-18 2014-11-18 +S000006208 ORF Verified YPR004C AIM45 chromosome 16 16 565041 564007 C 2011-02-03 1996-07-31 Putative ortholog of mammalian ETF-alpha; interacts with frataxin, Yfh1p; null mutant displays elevated frequency of mitochondrial genome loss; may have a role in oxidative stress response; ETF-alpha is an electron transfer flavoprotein complex subunit +S000031622 CDS YPR004C 16 565041 564007 C 2011-02-03 1996-07-31 +S000119040 ARS ARS1634 ARSXVI-565|ARS1622.5 chromosome 16 16 565052 565294 2011-02-03 2006-10-04 Autonomously Replicating Sequence +S000006209 ORF Verified YPR005C HAL1 chromosome 16 L000000750 16 566671 565787 C 2011-02-03 1996-07-31 Cytoplasmic protein involved in halotolerance; decreases intracellular Na+ (via Ena1p) and increases intracellular K+ by decreasing efflux; expression repressed by Ssn6p-Tup1p and Sko1p and induced by NaCl, KCl, and sorbitol through Gcn4p +S000031706 CDS YPR005C 16 566671 565787 C 2011-02-03 1996-07-31 +S000006210 ORF Verified YPR006C ICL2 methylisocitrate lyase ICL2 chromosome 16 L000004095 16 568996 567269 C 2011-02-03 1996-07-31 2-methylisocitrate lyase of the mitochondrial matrix; functions in the methylcitrate cycle to catalyze the conversion of 2-methylisocitrate to succinate and pyruvate; ICL2 transcription is repressed by glucose and induced by ethanol +S000031857 CDS YPR006C 16 568996 567269 C 2011-02-03 1996-07-31 +S000006211 ORF Verified YPR007C REC8 SPO69 chromosome 16 L000004667 16 571378 569336 C 2011-02-03 1996-07-31 Meiosis-specific component of the sister chromatid cohesion complex; alpha-kleisin family member that maintains cohesion between sister chromatids during meiosis I; maintains cohesion between centromeres of sister chromatids until meiosis II; independent of its role in sister chromatid cohesion, Rec8p promotes allelic collisions and prevents nonspecific chromosome interactions; homolog of S. pombe Rec8p +S000032749 CDS YPR007C 16 571378 569336 C 2011-02-03 1996-07-31 +S000007200 long_terminal_repeat YPRCdelta13 chromosome 16 16 572173 571845 C 2011-02-03 2000-05-19 Ty1 LTR +S000006588 tRNA_gene tG(GCC)P1 chromosome 16 L000003721 16 572269 572339 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000031679 noncoding_exon tG(GCC)P1 16 572269 572339 W 2011-02-03 2000-05-19 +S000006212 ORF Verified YPR008W HAA1 chromosome 16 16 573018 575102 W 2011-02-03 1996-07-31 Transcriptional activator involved in adaptation to weak acid stress; activates transcription of TPO2, YRO2, and other genes encoding membrane stress proteins; HAA1 has a paralog, CUP2, that arose from the whole genome duplication; relocalizes from cytoplasm to nucleus upon DNA replication stress +S000032911 CDS YPR008W 16 573018 575102 W 2011-02-03 1996-07-31 +S000006213 ORF Verified YPR009W SUT2 chromosome 16 16 576552 577358 W 2011-02-03 1996-07-31 Zn2Cys6 family transcription factor; positively regulates sterol uptake under anaerobic conditions with SUT1; represses filamentation-inducing genes during non-starvation conditions; positively regulates mating along with SUT1 by repressing the expression of genes (PRR2, NCE102 and RHO5) which function as mating inhibitors; multicopy suppressor of mutations that cause low activity of the cAMP/PKA pathway; SUT2 has a paralog, SUT1, that arose from the whole genome duplication +S000033007 CDS YPR009W 16 576552 577358 W 2011-02-03 1996-07-31 +S000006214 ORF Verified YPR010C RPA135 DNA-directed RNA polymerase I core subunit RPA135|A135|SRP3|RRN2|RPA2 chromosome 16 L000001674 16 581196 577585 C 2011-02-03 1996-07-31 RNA polymerase I second largest subunit A135 +S000033628 CDS YPR010C 16 581196 577585 C 2011-02-03 1996-07-31 +S000006628 tRNA_gene tK(CUU)P chromosome 16 L000003722 16 582062 582134 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000036081 noncoding_exon tK(CUU)P 16 582062 582134 W 2011-02-03 2000-05-19 +S000122558 ORF Uncharacterized YPR010C-A chromosome 16 16 582734 582373 C 2011-02-03 2007-05-09 Putative protein of unknown function; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cytosol; conserved among Saccharomyces sensu stricto species +S000122561 CDS YPR010C-A 16 582558 582373 C 2011-02-03 2007-05-09 +S000122559 CDS YPR010C-A 16 582734 582702 C 2011-02-03 2007-05-09 +S000122560 intron YPR010C-A 16 582701 582559 C 2011-02-03 2007-05-09 +S000006215 ORF Verified YPR011C chromosome 16 16 584042 583062 C 2011-02-03 1996-07-31 Mitochondrial transporter; major substrates are adenosine 5'-phosphosulfate (APS) and 3'-phospho-adenosine 5'-phosphosulfate (PAPS); member of the mitochondrial carrier family; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033732 CDS YPR011C 16 584042 583062 C 2011-02-03 1996-07-31 +S000006216 ORF Dubious YPR012W chromosome 16 16 584309 584563 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YPR012W is not an essential gene +S000034684 CDS YPR012W 16 584309 584563 W 2011-02-03 1996-07-31 +S000006217 ORF Uncharacterized YPR013C CMR3 chromosome 16 16 585585 584632 C 2011-02-03 1996-07-31 Putative zinc finger protein; YPR013C is not an essential gene +S000034773 CDS YPR013C 16 585585 584632 C 2011-02-03 1996-07-31 +S000006218 ORF Dubious YPR014C chromosome 16 16 587518 587189 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YPR014C is not an essential gene +S000034892 CDS YPR014C 16 587518 587189 C 2011-02-03 1996-07-31 +S000006219 ORF Uncharacterized YPR015C chromosome 16 16 591026 590283 C 2011-02-03 1996-07-31 Putative zinc finger transcription factor; binds DNA in sequence-specific manner; overexpression causes a cell cycle delay or arrest +S000035843 CDS YPR015C 16 591026 590283 C 2011-02-03 1996-07-31 +S000006220 ORF Verified YPR016C TIF6 translation initiation factor 6|CDC95 chromosome 16 L000004376 16 593069 592332 C 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; has similarity to human translation initiation factor 6 (eIF6); may be involved in the biogenesis and or stability of 60S ribosomal subunits +S000035939 CDS YPR016C 16 593069 592332 C 2011-02-03 1996-07-31 +S000007630 ORF Dubious YPR016W-A chromosome 16 16 593096 593356 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037261 CDS YPR016W-A 16 593096 593356 W 2011-02-03 2001-02-26 +S000006221 ORF Verified YPR017C DSS4 guanine nucleotide exchange factor DSS4 chromosome 16 L000000529 16 593917 593486 C 2011-02-03 1996-07-31 Guanine nucleotide dissociation stimulator for Sec4p; functions in the post-Golgi secretory pathway; binds zinc, found both on membranes and in the cytosol +S000036108 CDS YPR017C 16 593917 593486 C 2011-02-03 1996-07-31 +S000006222 ORF Verified YPR018W RLF2 CAC1 chromosome 16 L000003990 16 594476 596296 W 2011-02-03 1996-07-31 Largest subunit (p90) of the Chromatin Assembly Complex (CAF-1); chromatin assembly by CAF-1 is important for multiple processes including silencing at telomeres, mating type loci, and rDNA; maintenance of kinetochore structure; deactivation of the DNA damage checkpoint after DNA repair; chromatin dynamics during transcription; and repression of divergent noncoding transcription +S000036938 CDS YPR018W 16 594476 596296 W 2011-02-03 1996-07-31 +S000006223 ORF Verified YPR019W MCM4 MCM DNA helicase complex subunit MCM4|CDC54|HCD21 chromosome 16 L000002761 16 596750 599551 W 2011-02-03 1996-07-31 Essential helicase component of heterohexameric MCM2-7 complexes; MCM2-7 complexes bind pre-replication complexes on DNA and melt DNA prior to replication; forms an Mcm4p-6p-7p subcomplex; shows nuclear accumulation in G1; homolog of S. pombe Cdc21p +S000036996 CDS YPR019W 16 596750 599551 W 2011-02-03 1996-07-31 +S000006224 ORF Verified YPR020W ATP20 F1F0 ATP synthase subunit g chromosome 16 L000004738 16 599870 600217 W 2011-02-03 1996-07-31 Subunit g of the mitochondrial F1F0 ATP synthase; reversibly phosphorylated on two residues; unphosphorylated form is required for dimerization of the ATP synthase complex, which in turn determines oligomerization of the complex and the shape of inner membrane cristae +S000037811 CDS YPR020W 16 599870 600217 W 2011-02-03 1996-07-31 +S000006225 ORF Verified YPR021C AGC1 amino acid transporter AGC1 chromosome 16 16 603357 600649 C 2011-02-03 1996-07-31 Mitochondrial amino acid transporter; acts both as a glutamate uniporter and as an aspartate-glutamate exchanger; involved in nitrogen metabolism and nitrogen compound biosynthesis; human homolog SLC25A13 complements yeast null mutant +S000037867 CDS YPR021C 16 603357 600649 C 2011-02-03 1996-07-31 +S000006226 ORF Verified YPR022C SDD4 chromosome 16 16 607312 603911 C 2011-02-03 1996-07-31 Putative transcription factor, as suggested by computational analysis; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus and is induced in response to the DNA-damaging agent MMS; overproduction of a truncation allele suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P +S000030796 CDS YPR022C 16 607312 603911 C 2011-02-03 1996-07-31 +S000006227 ORF Verified YPR023C EAF3 chromosome 16 16 610031 608826 C 2011-02-03 1996-07-31 Component of the Rpd3S histone deacetylase complex; Esa1p-associated factor, nonessential component of the NuA4 acetyltransferase complex, homologous to Drosophila dosage compensation protein MSL3; plays a role in regulating Ty1 transposition +S000030882 CDS YPR023C 16 610031 608826 C 2011-02-03 1996-07-31 +S000006228 ORF Verified YPR024W YME1 i-AAA protease YME1|YTA11|OSD1 chromosome 16 L000002522 16 610481 612724 W 2011-02-03 1996-07-31 Catalytic subunit of i-AAA protease complex; complex is located in mitochondrial inner membrane; responsible for degradation of unfolded or misfolded mitochondrial gene products; serves as nonconventional translocation motor to pull PNPase into intermembrane space; also has role in intermembrane space protein folding; mutation causes elevated rate of mitochondrial turnover; human homolog YME1L1 can complement yeast null mutant +S000030985 CDS YPR024W 16 610481 612724 W 2011-02-03 1996-07-31 +S000006229 ORF Verified YPR025C CCL1 TFIIH complex kinase subunit CCL1 chromosome 16 L000000237 16 614558 613377 C 2011-02-03 1996-07-31 Cyclin associated with protein kinase Kin28p; Kin28p is the TFIIH-associated carboxy-terminal domain (CTD) kinase involved in transcription initiation at RNA polymerase II promoters; human homolog CCNH allows growth of yeast ccl1 temperature-sensitive mutant at restrictive temperature +S000031028 CDS YPR025C 16 614558 613377 C 2011-02-03 1996-07-31 +S000006230 ORF Verified YPR026W ATH1 alpha,alpha-trehalase ATH1 chromosome 16 L000003059 16 615379 619014 W 2011-02-03 1996-07-31 Acid trehalase required for utilization of extracellular trehalose; involved in intracellular trehalose degradation during growth recovery after saline stress +S000032041 CDS YPR026W 16 615379 619014 W 2011-02-03 1996-07-31 +S000006231 ORF Uncharacterized YPR027C chromosome 16 16 621258 620425 C 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP and seamless-GFP fusion proteins localize to the endoplasmic reticulum, while the mCherry fusion protein localizes to the vacuole +S000032081 CDS YPR027C 16 621258 620425 C 2011-02-03 1996-07-31 +S000006571 tRNA_gene tF(GAA)P2 chromosome 16 L000003732 16 622631 622540 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035233 intron tF(GAA)P2 16 622594 622576 C 2011-02-03 2000-05-19 +S000035232 noncoding_exon tF(GAA)P2 16 622575 622540 C 2011-02-03 2000-05-19 +S000035231 noncoding_exon tF(GAA)P2 16 622631 622595 C 2011-02-03 2000-05-19 +S000006232 ORF Verified YPR028W YOP1 YIP2 chromosome 16 L000004674 16 623527 624202 W 2011-02-03 1996-07-31 Reticulon-interacting protein; ER integral membrane protein involved in the generation of tubular ER morphology; promotes membrane curvature; forms tubules in vitro; regulates the ER asymmetry-induced inheritance block during ER stress; role in ER-derived peroxisomal biogenesis; interacts with Yip1p to mediate membrane traffic and with Sey1p to maintain ER morphology; facilitates lipid exchange between the ER and mitochondria; forms ER foci upon DNA replication stress +S000032203 CDS YPR028W 16 623527 623577 W 2011-02-03 1996-07-31 +S000032204 CDS YPR028W 16 623711 624202 W 2011-02-03 1996-07-31 +S000032205 intron YPR028W 16 623578 623710 W 2011-02-03 1996-07-31 +S000006233 ORF Verified YPR029C APL4 chromosome 16 L000004054 16 626967 624469 C 2011-02-03 1996-07-31 Gamma-adaptin; large subunit of the clathrin-associated protein (AP-1) complex; binds clathrin; involved in vesicle mediated transport +S000032228 CDS YPR029C 16 626967 624469 C 2011-02-03 1996-07-31 +S000006234 ORF Verified YPR030W CSR2 ART8|MRG19 chromosome 16 S000007450 16 627880 631245 W 2011-02-03 1996-07-31 Nuclear ubiquitin protein ligase binding protein; may regulate utilization of nonfermentable carbon sources and endocytosis of plasma membrane proteins; overproduction suppresses chs5 spa2 lethality at high temp; ubiquitinated by Rsp5p, deubiquitinated by Ubp2p; CSR2 has a paralog, ECM21, that arose from the whole genome duplication +S000034095 CDS YPR030W 16 627880 631245 W 2011-02-03 1996-07-31 +S000006235 ORF Verified YPR031W NTO1 chromosome 16 16 631515 633761 W 2011-02-03 1996-07-31 Subunit of the NuA3 histone acetyltransferase complex; this complex acetylates histone H3; contains PHD finger domain that interacts with methylated histone H3 +S000034190 CDS YPR031W 16 631515 633761 W 2011-02-03 1996-07-31 +S000118419 ARS ARS1623 ARSXVI-634 chromosome 16 16 633874 634122 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178197 ARS_consensus_sequence ARS1623 16 633921 633937 W 2014-11-18 2014-11-18 +S000006236 ORF Verified YPR032W SRO7 Rab GTPase-binding protein SRO7|SOP1|SNI1 chromosome 16 L000003105|L000004193 16 634123 637224 W 2011-02-03 1996-07-31 Effector of Rab GTPase Sec4p; forms a complex with Sec4p and t-SNARE Sec9p; involved in exocytosis and docking and fusion of post-Golgi vesicles with plasma membrane; regulates cell proliferation and colony development via the Rho1-Tor1 pathway; homolog of Drosophila lgl tumor suppressor; SRO7 has a paralog, SRO77, that arose from the whole genome duplication +S000035166 CDS YPR032W 16 634123 637224 W 2011-02-03 1996-07-31 +S000006237 ORF Verified YPR033C HTS1 TS4572|histidine--tRNA ligase|TSM4572 chromosome 16 L000000832|S000029607|L000002364 16 639019 637379 C 26 2011-02-03 1996-07-31 Cytoplasmic and mitochondrial histidine tRNA synthetase; efficient mitochondrial localization requires both a presequence and an amino-terminal sequence; mutations in human ortholog HARS2 are associated with Perrault syndrome +S000035204 CDS YPR033C 16 639019 637379 C 2011-02-03 1996-07-31 +S000006238 ORF Verified YPR034W ARP7 RSC11|SWP61 chromosome 16 L000003436 16 639525 640958 W 2011-02-03 1996-07-31 Component of both the SWI/SNF and RSC chromatin remodeling complexes; actin-related protein involved in transcriptional regulation +S000035348 CDS YPR034W 16 639525 640958 W 2011-02-03 1996-07-31 +S000006239 ORF Verified YPR035W GLN1 glutamate--ammonia ligase chromosome 16 L000000709 16 642208 643320 W 29 2011-02-03 1996-07-31|2011-02-03 Glutamine synthetase (GS); synthesizes glutamine from glutamate and ammonia; with Glt1p, forms the secondary pathway for glutamate biosynthesis from ammonia; expression regulated by nitrogen source and by amino acid limitation; forms filaments of back-to-back stacks of cylindrical homo-decamers at low pH, leading to enzymatic inactivation and storage during states of advanced cellular starvation; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000035425 CDS YPR035W 16 642208 643320 W 2011-02-03 1996-07-31|2011-02-03 +S000006240 ORF Verified YPR036W VMA13 H(+)-transporting V1 sector ATPase subunit H|CLS11 chromosome 16 L000002465 16 643836 645272 W 2011-02-03 1996-07-31 Subunit H of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; serves as an activator or a structural stabilizer of the V-ATPase; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits +S000036312 CDS YPR036W 16 643836 645272 W 2011-02-03 1996-07-31 +S000028425 ORF Verified YPR036W-A SPO24 chromosome 16 16 645950 646153 W 2011-02-03 2002-07-25 Small (67 amino acids) protein involved in sporulation; localizes to the prospore membrane; phosphorylated during meiosis; a longer, 5'-extended mRNA is also transcribed beginning in mid-meiosis, regulated by two MSEs (middle sporulation elements), and includes an uORF of 15 codons in its 5'-UTR; evidence transcription is regulated by Pdr1p +S000029999 CDS YPR036W-A 16 645950 646153 W 2011-02-03 2002-07-25 +S000006242 ORF Dubious YPR038W IRC16 chromosome 16 16 646836 647195 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene YPR037C; null mutant displays increased levels of spontaneous Rad52p foci +S000036501 CDS YPR038W 16 646836 647195 W 2011-02-03 1996-07-31 +S000006243 ORF Dubious YPR039W chromosome 16 16 647012 647347 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified non essential genes ERV2/YPR037C and TIP41/YPR040W +S000036592 CDS YPR039W 16 647012 647347 W 2011-02-03 1996-07-31 +S000006241 ORF Verified YPR037C ERV2 flavin-linked sulfhydryl oxidase chromosome 16 16 647038 646448 C 2011-02-03 1996-07-31 Flavin-linked sulfhydryl oxidase localized to the ER lumen; involved in disulfide bond formation within the endoplasmic reticulum (ER) +S000036350 CDS YPR037C 16 647038 646448 C 2011-02-03 1996-07-31 +S000006244 ORF Verified YPR040W TIP41 chromosome 16 16 647305 648375 W 2011-02-03 1996-07-31 Protein that interacts with Tap42p, which regulates PP2A; component of the TOR (target of rapamycin) signaling pathway; protein abundance increases in response to DNA replication stress +S000037582 CDS YPR040W 16 647305 648375 W 2011-02-03 1996-07-31 +S000006245 ORF Verified YPR041W TIF5 translation initiation factor eIF5|SUI5 chromosome 16 L000002305 16 648704 649921 W 2011-02-03 1996-07-31 Translation initiation factor eIF5; functions both as a GTPase-activating protein to mediate hydrolysis of ribosome-bound GTP and as a GDP dissociation inhibitor to prevent recycling of eIF2 +S000037662 CDS YPR041W 16 648704 649921 W 2011-02-03 1996-07-31 +S000006246 ORF Verified YPR042C PUF2 chromosome 16 16 653662 650435 C 2011-02-03 1996-07-31 PUF family mRNA-binding protein; Pumilio homology domain confers RNA binding activity; preferentially binds mRNAs encoding membrane-associated proteins; binding site composed of two UAAU tetranucleotides, separated by a 3-nt linker; PUF2 has a paralog, JSN1, that arose from the whole genome duplication +S000037689 CDS YPR042C 16 653662 650435 C 2011-02-03 1996-07-31 +S000006247 ORF Verified YPR043W RPL43A eL43|ribosomal 60S subunit protein L43A|L43e|L43A chromosome 16 L000004469 16 654166 654847 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L43A; null mutation confers a dominant lethal phenotype; homologous to mammalian ribosomal protein L37A, no bacterial homolog; RPL43A has a paralog, RPL43B, that arose from the whole genome duplication +S000030558 CDS YPR043W 16 654166 654167 W 2011-02-03 1996-07-31 +S000030559 CDS YPR043W 16 654571 654847 W 2011-02-03 1996-07-31 +S000030560 intron YPR043W 16 654168 654570 W 2011-02-03 1996-07-31 +S000006248 ORF Dubious YPR044C OPI11 chromosome 16 16 654877 654524 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; largely overlaps verified gene RPL43A/YPR043W; deletion confers sensitivity to GSAO +S000030601 CDS YPR044C 16 654877 654524 C 2011-02-03 1996-07-31 +S000006249 ORF Verified YPR045C THP3 MNI2 chromosome 16 16 656552 655140 C 2011-02-03 1996-07-31 Protein that may have a role in transcription elongation; forms a complex with Csn12p that is recruited to transcribed genes; possibly involved in splicing based on pre-mRNA accumulation defect for many intron-containing genes +S000030682 CDS YPR045C 16 656552 655140 C 2011-02-03 1996-07-31 +S000006250 ORF Verified YPR046W MCM16 chromosome 16 L000003997 16 656799 657344 W 2011-02-03 1996-07-31 Component of the Ctf19 complex and the COMA subcomplex; involved in kinetochore-microtubule mediated chromosome segregation; binds to centromere DNA; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-H and fission yeast fta3 +S000031562 CDS YPR046W 16 656799 657344 W 2011-02-03 1996-07-31 +S000006251 ORF Verified YPR047W MSF1 phenylalanine--tRNA ligase chromosome 16 L000001187 16 657529 658938 W 2011-02-03 2003-09-22|1996-07-31 Mitochondrial phenylalanyl-tRNA synthetase; active as a monomer, unlike the cytoplasmic subunit which is active as a dimer complexed to a beta subunit dimer; similar to the alpha subunit of E. coli phenylalanyl-tRNA synthetase +S000031671 CDS YPR047W 16 657529 658938 W 2011-02-03 2003-09-22|1996-07-31 +S000006252 ORF Verified YPR048W TAH18 NAPDH-dependent diflavin reductase chromosome 16 L000004734 16 659182 661053 W 2011-02-03 1996-07-31 Conserved NAPDH-dependent diflavin reductase; component of an early step in the cytosolic Fe-S protein assembly (CIA) machinery; transfers electrons from NADPH to the Fe-S cluster of Dre2p; plays a pro-death role under oxidative stress; Tah18p-dependent nitric oxide synthesis confers high-temperature stress tolerance; possible target for development of antifungal drugs +S000031770 CDS YPR048W 16 659182 661053 W 2011-02-03 1996-07-31 +S000006253 ORF Verified YPR049C ATG11 autophagy protein ATG11|CVT3|CVT9 chromosome 16 L000004760|L000004756|S000029130 16 664673 661137 C 2011-02-03 1996-07-31 Adapter protein for pexophagy and the Cvt targeting pathway; directs receptor-bound cargo to the phagophore assembly site (PAS) for packaging into vesicles; required for recruiting other proteins to the PAS; recruits Dnm1p to facilitate fission of mitochondria that are destined for removal by mitophagy +S000031821 CDS YPR049C 16 664673 661137 C 2011-02-03 1996-07-31 +S000006255 ORF Verified YPR051W MAK3 peptide alpha-N-acetyltransferase MAK3|NAA30 chromosome 16 L000000977 16 664960 665490 W 34 2011-02-03 1996-07-31 Catalytic subunit of the NatC type N-terminal acetyltransferase (NAT); involved in subcellular targeting of select N-terminally acetylated substrates to the Golgi apparatus (Arl3p and Grh1p) and the inner nuclear membrane (Trm1p); required for replication of dsRNA virus; human NatC ortholog, Naa60, functionally complements the null, requiring either auxiliary subunit Mak10p or co-expression of human ortholog, Naa35; Naa60, the human NatF gene, also complements the null allele +S000034802 CDS YPR051W 16 664960 665490 W 2011-02-03 1996-07-31 +S000006254 ORF Dubious YPR050C chromosome 16 16 665366 664953 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF MAK3/YPR051W +S000033860 CDS YPR050C 16 665366 664953 C 2011-02-03 1996-07-31 +S000006256 ORF Verified YPR052C NHP6A high-mobility group nucleosome-binding protein chromosome 16 L000001244|L000001245 16 665974 665693 C 2011-02-03 1996-07-31 High-mobility group (HMG) protein; binds to and remodels nucleosomes; involved in recruiting FACT and other chromatin remodelling complexes to chromosomes; functionally redundant with Nhp6Bp; required for transcriptional initiation fidelity of some tRNA genes; homologous to mammalian HMGB1 and HMGB2; NHP6A has a paralog, NHP6B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000034851 CDS YPR052C 16 665974 665693 C 2011-02-03 1996-07-31 +S000006257 ORF Uncharacterized YPR053C chromosome 16 16 666243 665788 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YPR053C is not an essential gene; partially overlaps verified ORF NHP6A/YPR052C +S000034981 CDS YPR053C 16 666243 665788 C 2011-02-03 1996-07-31 +S000006258 ORF Verified YPR054W SMK1 mitogen-activated protein kinase SMK1 chromosome 16 L000001933 16 666280 667446 W 2011-02-03 1996-07-31 Middle sporulation-specific mitogen-activated protein kinase (MAPK); required for production of the outer spore wall layers; negatively regulates activity of the glucan synthase subunit Gsc2p +S000035191 CDS YPR054W 16 666280 667446 W 2011-02-03 1996-07-31 +S000006259 ORF Verified YPR055W SEC8 exocyst subunit SEC8 chromosome 16 L000001834 16 667676 670873 W 2011-02-03 1996-07-31 Essential 121 kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion; involved in ER and Golgi inheritance in small buds; relocalizes away from bud neck upon DNA replication stress +S000036048 CDS YPR055W 16 667676 670873 W 2011-02-03 1996-07-31 +S000006260 ORF Verified YPR056W TFB4 TFIIH/NER complex subunit TFB4 chromosome 16 L000004156 16 671126 672142 W 2011-02-03 1996-07-31 Subunit of TFIIH complex; involved in transcription initiation, similar to 34 kDa subunit of human TFIIH; interacts with Ssl1p +S000036167 CDS YPR056W 16 671126 672142 W 2011-02-03 1996-07-31 +S000006261 ORF Verified YPR057W BRR1 chromosome 16 L000004059 16 672471 673496 W 2011-02-03 1996-07-31 snRNP protein component of spliceosomal snRNPs; required for pre-mRNA splicing and snRNP biogenesis; in null mutant newly-synthesized snRNAs are destabilized and 3'-end processing is slowed +S000036258 CDS YPR057W 16 672471 673496 W 2011-02-03 1996-07-31 +S000006262 ORF Verified YPR058W YMC1 organic acid transporter chromosome 16 L000002520 16 673751 674674 W 39.7 2011-02-03 1996-07-31 Secondary mitochondrial inner membrane glycine transporter; required with HEM25 for the transport of glycine into mitochondria for the initiation of heme biosynthesis; proposed role in oleate metabolism and glutamate biosynthesis; member of the mitochondrial carrier (MCF) family; localizes to the vacuole in response to H2O2; YMC1 has a paralog, YMC2, that arose from the whole genome duplication +S000036364 CDS YPR058W 16 673751 674674 W 2011-02-03 1996-07-31 +S000006263 ORF Dubious YPR059C chromosome 16 16 674700 674314 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YMC1/YPR058W +S000036983 CDS YPR059C 16 674700 674314 C 2011-02-03 1996-07-31 +S000006264 ORF Verified YPR060C ARO7 chorismate mutase ARO7|TYR7|OSM2|HGS1 chromosome 16 L000000120 16 675631 674861 C 39.4 2011-02-03 1996-07-31 Chorismate mutase; catalyzes the conversion of chorismate to prephenate to initiate the tyrosine/phenylalanine-specific branch of aromatic amino acid biosynthesis +S000037791 CDS YPR060C 16 675631 674861 C 2011-02-03 1996-07-31 +S000006265 ORF Verified YPR061C JID1 chromosome 16 16 676882 675977 C 2011-02-03 1996-07-31 Probable Hsp40p co-chaperone; has a DnaJ-like domain and appears to be involved in ER-associated degradation of misfolded proteins containing a tightly folded cytoplasmic domain; inhibits replication of Brome mosaic virus in S. cerevisiae +S000037866 CDS YPR061C 16 676882 675977 C 2011-02-03 1996-07-31 +S000006266 ORF Verified YPR062W FCY1 cytosine deaminase|yCD chromosome 16 L000003485 16 677165 677641 W 2011-02-03 1996-07-31 Cytosine deaminase; zinc metalloenzyme that catalyzes the hydrolytic deamination of cytosine to uracil; of biomedical interest because it also catalyzes the deamination of 5-fluorocytosine (5FC) to form anticancer drug 5-fluorouracil (5FU) +S000029927 CDS YPR062W 16 677165 677641 W 2011-02-03 1996-07-31 +S000006267 ORF Uncharacterized YPR063C chromosome 16 16 678320 677812 C 2011-02-03 1996-07-31 ER-localized protein of unknown function +S000029984 CDS YPR063C 16 678193 677812 C 2011-02-03 1996-07-31 +S000029983 CDS YPR063C 16 678320 678280 C 2011-02-03 1996-07-31 +S000029985 intron YPR063C 16 678279 678194 C 2011-02-03 1996-07-31 +S000006268 ORF Uncharacterized YPR064W chromosome 16 16 678951 679370 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YPR064W is not an essential gene +S000031009 CDS YPR064W 16 678951 679370 W 2011-02-03 1996-07-31 +S000006269 ORF Verified YPR065W ROX1 REO1 chromosome 16 L000001661 16 679693 680799 W 2011-02-03 1996-07-31 Heme-dependent repressor of hypoxic genes; mediates aerobic transcriptional repression of hypoxia induced genes such as COX5b and CYC7; repressor function regulated through decreased promoter occupancy in response to oxidative stress; contains an HMG domain that is responsible for DNA bending activity; involved in the hyperosmotic stress resistance +S000031123 CDS YPR065W 16 679693 680799 W 2011-02-03 1996-07-31 +S000006270 ORF Verified YPR066W UBA3 NEDD8-activating protein UBA3 chromosome 16 L000004373 16 681213 682112 W 2011-02-03 1996-07-31 Protein that activates Rub1p (NEDD8) before neddylation; acts together with Ula1p; may play a role in protein degradation; GFP-fusion protein localizes to the cytoplasm in a punctate pattern +S000031188 CDS YPR066W 16 681213 682112 W 2011-02-03 1996-07-31 +S000006271 ORF Verified YPR067W ISA2 chromosome 16 L000004955 16 682220 682777 W 2011-02-03 1996-07-31 Protein required for maturation of mitochondrial [4Fe-4S] proteins; functions in a complex with Isa1p and possibly Iba57p; localizes to the mitochondrial intermembrane space, overexpression of ISA2 suppresses grx5 mutations +S000032172 CDS YPR067W 16 682220 682777 W 2011-02-03 1996-07-31 +S000006272 ORF Verified YPR068C HOS1 histone deacetylase|CST3 chromosome 16 L000004091|S000029124|L000002993 16 684353 682941 C 2011-02-03 1996-07-31 Class I histone deacetylase (HDAC) family member; deacetylates Smc3p on lysine residues at anaphase onset; has sequence similarity to Hda1p, Rpd3p, Hos2p, and Hos3p; interacts with the Tup1p-Ssn6p corepressor complex +S000032210 CDS YPR068C 16 684353 682941 C 2011-02-03 1996-07-31 +S000118420 ARS ARS1624 ARSXVI-684 chromosome 16 16 684389 684637 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178198 ARS_consensus_sequence ARS1624 16 684405 684421 W 2014-11-18 2014-11-18 +S000006273 ORF Verified YPR069C SPE3 spermidine synthase chromosome 16 L000003328 16 685437 684556 C 2011-02-03 1996-07-31 Spermidine synthase; involved in biosynthesis of spermidine and also in biosynthesis of pantothenic acid; spermidine is required for growth of wild-type cells +S000032285 CDS YPR069C 16 685437 684556 C 2011-02-03 1996-07-31 +S000006274 ORF Verified YPR070W MED1 chromosome 16 16 685898 687598 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation +S000032028 CDS YPR070W 16 685898 687598 W 2011-02-03 1996-07-31 +S000006275 ORF Uncharacterized YPR071W chromosome 16 16 688172 688807 W 2011-02-03 1996-07-31 Putative membrane protein; YPR071W is not an essential gene; YPR071W has a paralog, YIL029C, that arose from a single-locus duplication +S000032138 CDS YPR071W 16 688172 688807 W 2011-02-03 1996-07-31 +S000006736 tRNA_gene tS(UGA)P SUP16 SUQ5 chromosome 16 L000003723|S000029556|L000002242|L000002190 16 689565 689646 W 48 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000034846 noncoding_exon tS(UGA)P 16 689565 689646 W 2011-02-03 2000-05-19 +S000006276 ORF Verified YPR072W NOT5 CCR4-NOT core subunit NOT5 chromosome 16 L000004651 16 690107 691789 W 2011-02-03 1996-07-31 Component of the CCR4-NOT core complex, involved in mRNA decapping; involved intranscription initiation and elongation and in mRNA degradation; conserved lysine in human homolog of Not5p and Not3p is mutated in cancers +S000034137 CDS YPR072W 16 690107 691789 W 2011-02-03 1996-07-31 +S000006277 ORF Verified YPR073C LTP1 tyrosine protein phosphatase LTP1 chromosome 16 L000000957 16 692418 691933 C 2011-02-03 1996-07-31 Protein phosphotyrosine phosphatase of unknown cellular role; activated by adenine +S000034196 CDS YPR073C 16 692418 691933 C 2011-02-03 1996-07-31 +S000006278 ORF Verified YPR074C TKL1 transketolase TKL1 chromosome 16 L000002313 16 694838 692796 C 2011-02-03 1996-07-31 Transketolase; catalyzes conversion of xylulose-5-phosphate and ribose-5-phosphate to sedoheptulose-7-phosphate and glyceraldehyde-3-phosphate in the pentose phosphate pathway; needed for synthesis of aromatic amino acids; TKL1 has a paralog, TKL2, that arose from the whole genome duplication +S000034281 CDS YPR074C 16 694838 692796 C 2011-02-03 1996-07-31 +S000007631 ORF Dubious YPR074W-A chromosome 16 16 695018 695188 W 2011-02-03 2001-02-26 Hypothetical protein identified by homology +S000037262 CDS YPR074W-A 16 695018 695188 W 2011-02-03 2001-02-26 +S000118421 ARS ARS1625 ARSXVI-696 chromosome 16 16 695461 695574 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178199 ARS_consensus_sequence ARS1625 16 695465 695481 W 2014-11-18 2014-11-18 +S000006280 ORF Dubious YPR076W chromosome 16 16 696476 696850 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035349 CDS YPR076W 16 696476 696850 W 2011-02-03 1996-07-31 +S000006279 ORF Verified YPR075C OPY2 chromosome 16 L000004017 16 696819 695737 C 2011-02-03 1996-07-31 Integral membrane protein that acts as a membrane anchor for Ste50p; involved in the signaling branch of the high-osmolarity glycerol (HOG) pathway and as a regulator of the filamentous growth pathway; overproduction blocks cell cycle arrest in the presence of mating pheromone; relocalizes from vacuole to plasma membrane upon DNA replication stress +S000034338 CDS YPR075C 16 696819 695737 C 2011-02-03 1996-07-31 +S000006281 ORF Dubious YPR077C chromosome 16 16 697502 697131 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; expression increased by deletion of NAP1 +S000035364 CDS YPR077C 16 697502 697131 C 2011-02-03 1996-07-31 +S000006282 ORF Uncharacterized YPR078C chromosome 16 16 698265 697147 C 2011-02-03 1996-07-31 Putative protein of unknown function; possible role in DNA metabolism and/or in genome stability; expression is heat-inducible +S000035444 CDS YPR078C 16 698265 697147 C 2011-02-03 1996-07-31 +S000006283 ORF Verified YPR079W MRL1 chromosome 16 16 698869 700014 W 2011-02-03 1996-07-31 Membrane protein; has similarity to mammalian mannose-6-phosphate receptors; possibly functions as a sorting receptor in the delivery of vacuolar hydrolases; protein abundance increases in response to DNA replication stress +S000035534 CDS YPR079W 16 698869 700014 W 2011-02-03 1996-07-31 +S000006284 ORF Verified YPR080W TEF1 translation elongation factor EF-1 alpha|eEF1A|EF-1 alpha chromosome 16 L000002277 16 700594 701970 W 46 2011-02-03 1996-07-31 Translational elongation factor EF-1 alpha; in the GTP-bound active form, binds to and delivers aminoacylated tRNA to the A-site of ribosomes for elongation of nascent polypeptides; associates with vacuolar Rho1p GTPase; may also have a role in tRNA re-export from the nucleus; TEF1 has a paralog, TEF2, that arose from the whole genome duplication +S000035186 CDS YPR080W 16 700594 701970 W 2011-02-03 1996-07-31 +S000006285 ORF Verified YPR081C GRS2 putative glycine--tRNA ligase chromosome 16 16 703970 702114 C 2011-02-03 1996-07-31 Glycine-tRNA synthetase, not expressed under normal growth conditions; expression is induced under heat, oxidative, pH, or ethanol stress conditions; more stable than the major glycine-tRNA synthetase Grs1p at 37 deg C; GRS2 has a paralog, GRS1, that arose from the whole genome duplication +S000035269 CDS YPR081C 16 703970 702114 C 2011-02-03 1996-07-31 +S000006286 ORF Verified YPR082C DIB1 U4/U6-U5 snRNP complex subunit DIB1|SNU16 chromosome 16 L000004542 16 704656 704225 C 2011-02-03 1996-07-31 17-kDa component of the U4/U6aU5 tri-snRNP; plays an essential role in pre-mRNA splicing; human ortholog TXNL4A (the human U5-specific 15-kDa protein) complements yeast dib1 null mutant +S000036157 CDS YPR082C 16 704656 704225 C 2011-02-03 1996-07-31 +S000006287 ORF Verified YPR083W MDM36 chromosome 16 16 704854 706593 W 2011-02-03 1996-07-31 Mitochondrial protein; required for normal mitochondrial morphology and inheritance; component of the mitochondria-ER-cortex-ancor (MECA); interacts with Num1p to link the ER and mitochondria at the cell cortex; proposed involvement in the formation of Dnm1p and Num1p-containing cortical anchor complexes that promote mitochondrial fission +S000036324 CDS YPR083W 16 704854 706593 W 2011-02-03 1996-07-31 +S000006288 ORF Uncharacterized YPR084W chromosome 16 16 706972 708342 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000036408 CDS YPR084W 16 706972 708342 W 2011-02-03 1996-07-31 +S000006289 ORF Verified YPR085C ASA1 chromosome 16 16 709828 708497 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; telomere length regulator involved in the stability or biogenesis of PIKKs such as TORC1 +S000030072 CDS YPR085C 16 709828 708497 C 2011-02-03 2003-09-22|1996-07-31 +S000006290 ORF Verified YPR086W SUA7 transcription factor TFIIB|TFIIB|SOH4 chromosome 16 L000002141 16 710101 711138 W 2011-02-03 1996-07-31 Transcription factor TFIIB; a general transcription factor required for transcription initiation and start site selection by RNA polymerase II +S000030297 CDS YPR086W 16 710101 711138 W 2011-02-03 1996-07-31 +S000006291 ORF Dubious YPR087W VPS69 chromosome 16 16 711354 711674 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 85% of ORF overlaps the verified gene SRP54; deletion causes a vacuolar protein sorting defect +S000030448 CDS YPR087W 16 711354 711674 W 2011-02-03 1996-07-31 +S000006292 ORF Verified YPR088C SRP54 RNA-binding signal recognition particle subunit SRP54|SRH1 chromosome 16 L000002064 16 713028 711403 C 2011-02-03 1996-07-31 Signal recognition particle (SRP) subunit (homolog of mammalian SRP54); contains the signal sequence-binding activity of SRP, interacts with the SRP RNA, and mediates binding of SRP to signal receptor; contains GTPase domain +S000030479 CDS YPR088C 16 713028 711403 C 2011-02-03 1996-07-31 +S000006293 ORF Uncharacterized YPR089W YPR090W chromosome 16 16 713275 715941 W 2011-02-03 2003-09-29|1996-07-31 Protein of unknown function; exhibits genetic interaction with ERG11 and protein-protein interaction with Hsp82p +S000031385 CDS YPR089W 16 713275 715941 W 2011-02-03 2003-09-29|1996-07-31 +S000006296 ORF Dubious YPR092W chromosome 16 16 718379 718684 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032289 CDS YPR092W 16 718379 718684 W 2011-02-03 1996-07-31 +S000006295 ORF Verified YPR091C NVJ2 chromosome 16 16 718468 716156 C 2011-02-03 1996-07-31 Lipid-binding ER protein, enriched at nucleus-vacuolar junctions (NVJ); may be involved in sterol metabolism or signaling at the NVJ; contains a synaptotagmin-like-mitochondrial-lipid binding protein (SMP) domain; binds phosphatidylinositols and other lipids in a large-scale study; may interact with ribosomes, based on co-purification experiments +S000031211 CDS YPR091C 16 718468 716156 C 2011-02-03 1996-07-31 +S000006442 snoRNA_gene snR51 SNR51 chromosome 16 L000004520 16 718806 718700 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2729 and small subunit (SSU) rRNA at position A100 +S000030732 noncoding_exon snR51 16 718806 718700 C 2011-02-03 2000-05-19 +S000006461 snoRNA_gene snR70 SNR70 chromosome 16 L000004539 16 719050 718887 C 2011-02-03 2000-05-19|2007-05-09 C/D box small nucleolar RNA (snoRNA); predicted to guide 2'-O-methylation of small subunit (SSU) rRNA at position C1639 +S000031744 noncoding_exon snR70 16 719050 718887 C 2011-02-03 2000-05-19|2007-05-09 +S000007305 snoRNA_gene snR41 SNR41 chromosome 16 L000003056 16 719242 719148 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at positions A541 and G1126 +S000030612 noncoding_exon snR41 16 719242 719148 C 2011-02-03 2000-05-19 +S000006297 ORF Verified YPR093C ASR1 ubiquitin-protein ligase ASR1 chromosome 16 16 720424 719558 C 2011-02-03 2003-09-22|1996-07-31 Ubiquitin ligase that modifies and regulates RNA Pol II; involved in a putative alcohol-responsive signaling pathway; accumulates in the nucleus under alcohol stress; has a role in organization of septins and the actin cytoskeleton; contains a Ring/PHD finger domain similar to the mammalian rA9 protein +S000032333 CDS YPR093C 16 720424 719558 C 2011-02-03 2003-09-22|1996-07-31 +S000006298 ORF Verified YPR094W RDS3 U2 snRNP complex subunit RDS3 chromosome 16 16 720637 720960 W 2011-02-03 1996-07-31 Component of the SF3b subcomplex of the U2 snRNP; zinc cluster protein involved in pre-mRNA splicing and cycloheximide resistance +S000032497 CDS YPR094W 16 720637 720960 W 2011-02-03 1996-07-31 +S000006299 ORF Verified YPR095C SYT1 Arf family guanine nucleotide exchange factor SYT1 chromosome 16 L000004575 16 724717 721037 C 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for Arf proteins; promotes activation of Arl1p, which recruits Imh1p to the Golgi; involved in vesicular transport; member of the Sec7-domain family; contains a PH domain +S000034455 CDS YPR095C 16 724717 721037 C 2011-02-03 1996-07-31 +S000006300 ORF Verified YPR096C chromosome 16 16 725144 724842 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments +S000034576 CDS YPR096C 16 725144 724842 C 2011-02-03 1996-07-31 +S000006301 ORF Verified YPR097W chromosome 16 16 725394 728615 W 2011-02-03 1996-07-31|2011-02-03 Protein that contains a PX domain and binds phosphoinositides; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; PX stands for Phox homology +S000034675 CDS YPR097W 16 725394 728615 W 2011-02-03 1996-07-31|2011-02-03 +S000006302 ORF Verified YPR098C chromosome 16 16 729528 728947 C 2011-02-03 2003-09-27|1996-07-31 Protein of unknown function; localized to the mitochondrial outer membrane +S000034698 CDS YPR098C 16 729385 728947 C 2011-02-03 2003-09-27 +S000034697 CDS YPR098C 16 729528 729482 C 2011-02-03 2003-09-27|1996-07-31 +S000034699 intron YPR098C 16 729481 729386 C 2011-02-03 2003-09-27 +S000006304 ORF Verified YPR100W MRPL51 mitochondrial 54S ribosomal protein MRPL51 chromosome 16 16 729791 730213 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000033115 CDS YPR100W 16 729791 730213 W 2011-02-03 1996-07-31 +S000006303 ORF Dubious YPR099C chromosome 16 16 730113 729757 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene MRPL51/YPR100W +S000035639 CDS YPR099C 16 730113 729757 C 2011-02-03 1996-07-31 +S000006305 ORF Verified YPR101W SNT309 NTC25 chromosome 16 L000004269 16 730492 731019 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; interacts physically and genetically with Prp19p +S000033189 CDS YPR101W 16 730492 731019 W 2011-02-03 1996-07-31 +S000006306 ORF Verified YPR102C RPL11A uL5|ribosomal 60S subunit protein L11A|rp39A|YL22|L5|L16B|L11A chromosome 16 L000004453 16 731748 731224 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L11A; expressed at twice the level of Rpl11Bp; involved in ribosomal assembly; depletion causes degradation of 60S proteins and RNA; homologous to mammalian ribosomal protein L11 and bacterial L5; RPL11A has a paralog, RPL11B, that arose from the whole genome duplication +S000033914 CDS YPR102C 16 731748 731224 C 2011-02-03 1996-07-31 +S000006307 ORF Verified YPR103W PRE2 proteasome core particle subunit beta 5|SRR2|PRG1|DOA3 chromosome 16 L000001484 16 732349 733212 W 2011-02-03 1996-07-31 Beta 5 subunit of the 20S proteasome; responsible for the chymotryptic activity of the proteasome +S000034099 CDS YPR103W 16 732349 733212 W 2011-02-03 1996-07-31 +S000006308 ORF Verified YPR104C FHL1 SPP42 chromosome 16 L000000612 16 736433 733623 C 2011-02-03 1996-07-31 Regulator of ribosomal protein (RP) transcription; has forkhead associated domain that binds phosphorylated proteins; recruits coactivator Ifh1p or corepressor Crf1p to RP gene promoters; also has forkhead DNA-binding domain though in vitro DNA binding assays give inconsistent results; computational analyses suggest it binds DNA directly at highly active RP genes and indirectly through Rap1p motifs at others; suppresses RNA pol III and splicing factor prp4 mutants +S000034142 CDS YPR104C 16 736433 733623 C 2011-02-03 1996-07-31 +S000006309 ORF Verified YPR105C COG4 Golgi transport complex subunit COG4|SGF1|SEC38|COD1 chromosome 16 S000007660 16 739569 736984 C 2011-02-03 1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000035097 CDS YPR105C 16 739569 736984 C 2011-02-03 1996-07-31 +S000006310 ORF Verified YPR106W ISR1 putative protein kinase ISR1 chromosome 16 L000004210 16 740061 741392 W 2011-02-03 1996-07-31 Predicted protein kinase; overexpression causes sensitivity to staurosporine, which is a potent inhibitor of protein kinase C +S000035292 CDS YPR106W 16 740061 741392 W 2011-02-03 1996-07-31 +S000006311 ORF Verified YPR107C YTH1 cleavage polyadenylation factor RNA-binding subunit YTH1 chromosome 16 L000003546 16 742064 741438 C 2011-02-03 1996-07-31 Essential RNA-binding component of cleavage and polyadenylation factor; contains five zinc fingers; required for pre-mRNA 3'-end processing and polyadenylation; relocalizes to the cytosol in response to hypoxia +S000035304 CDS YPR107C 16 742064 741438 C 2011-02-03 1996-07-31 +S000006312 ORF Verified YPR108W RPN7 proteasome regulatory particle lid subunit RPN7 chromosome 16 L000004307 16 742454 743743 W 2011-02-03 1996-07-31 Essential non-ATPase regulatory subunit of the 26S proteasome; similar to another S. cerevisiae regulatory subunit, Rpn5p, as well as to mammalian proteasome subunits +S000035430 CDS YPR108W 16 742454 743743 W 2011-02-03 1996-07-31 +S000028590 ORF Uncharacterized YPR108W-A chromosome 16 16 744175 744387 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031362 CDS YPR108W-A 16 744175 744387 W 2011-02-03 2003-07-29 +S000006752 tRNA_gene tT(UGU)P chromosome 16 L000003724 16 744284 744355 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000036277 noncoding_exon tT(UGU)P 16 744284 744355 W 2011-02-03 2000-05-19 +S000006313 ORF Uncharacterized YPR109W chromosome 16 16 744689 745573 W 2011-02-03 1996-07-31 Predicted membrane protein; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; diploid deletion strain has high budding index +S000036314 CDS YPR109W 16 744689 745573 W 2011-02-03 1996-07-31 +S000006314 ORF Verified YPR110C RPC40 DNA-directed RNA polymerase core subunit RPC40|RPC5 chromosome 16 L000001690|L000002890 16 746835 745828 C 72 2011-02-03 1996-07-31 RNA polymerase subunit AC40; common to RNA polymerase I and III; predominant determinant targeting Ty1 integration upstream of Pol III-transcribed genes +S000031868 CDS YPR110C 16 746835 745828 C 2011-02-03 1996-07-31 +S000006315 ORF Verified YPR111W DBF20 serine/threonine-protein kinase DBF20 chromosome 16 L000000490 16 747306 749000 W 66 2011-02-03 1999-07-17|1996-07-31 Ser/Thr kinase involved in late nuclear division; one of the mitotic exit network (MEN) proteins; necessary for the execution of cytokinesis; also plays a role in regulating the stability of SWI5 and CLB2 mRNAs; DBF20 has a paralog, DBF2, that arose from the whole genome duplication +S000032040 CDS YPR111W 16 747306 749000 W 2011-02-03 1999-07-17|1996-07-31 +S000118422 ARS ARS1626 ARSXVI-749 chromosome 16 16 749099 749345 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178200 ARS_consensus_sequence ARS1626 16 749117 749133 W 2014-11-18 2014-11-18 +S000006316 ORF Verified YPR112C MRD1 RNA-binding ribosome biosynthesis protein MRD1 chromosome 16 S000007482 16 751919 749256 C 2011-02-03 1996-07-31 Essential conserved small ribosomal subunit (40s) synthesis factor; component of the 90S preribosome; required for production of 18S rRNA and small ribosomal subunit; contains five consensus RNA-binding domains and binds to the pre-rRNA at two sites within the 18S region +S000037455 CDS YPR112C 16 751919 749256 C 2011-02-03 1996-07-31 +S000006317 ORF Verified YPR113W PIS1 CDP-diacylglycerol--inositol 3-phosphatidyltransferase chromosome 16 L000001444 16 752257 752919 W 2011-02-03 1996-07-31 Phosphatidylinositol synthase; required for biosynthesis of phosphatidylinositol, which is a precursor for polyphosphoinositides, sphingolipids, and glycolipid anchors for some of the plasma membrane proteins +S000037583 CDS YPR113W 16 752257 752919 W 2011-02-03 1996-07-31 +S000006318 ORF Uncharacterized YPR114W chromosome 16 16 753301 754248 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000037664 CDS YPR114W 16 753301 754248 W 2011-02-03 1996-07-31 +S000006319 ORF Verified YPR115W RGC1 GCA1 chromosome 16 16 754877 758128 W 2011-02-03 1996-07-31 Putative regulator of the Fps1p glycerol channel; multiply phosphorylated by Hog1p under osmotic stress; contains a pleckstrin homology domain; forms homodimers and heterodimerizes with paralog Ask10p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000030470 CDS YPR115W 16 754877 758128 W 2011-02-03 1996-07-31 +S000006320 ORF Verified YPR116W RRG8 chromosome 16 16 758648 759481 W 2011-02-03 1996-07-31 Protein of unknown function; required for mitochondrial genome maintenance; null mutation results in a decrease in plasma membrane electron transport +S000030562 CDS YPR116W 16 758648 759481 W 2011-02-03 1996-07-31 +S000006321 ORF Uncharacterized YPR117W BSH1 chromosome 16 16 760025 767494 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000030644 CDS YPR117W 16 760025 767494 W 2011-02-03 1996-07-31 +S000006322 ORF Verified YPR118W MRI1 S-methyl-5-thioribose-1-phosphate isomerase MRI1 chromosome 16 16 767752 768987 W 2011-02-03 1996-07-31 5'-methylthioribose-1-phosphate isomerase; catalyzes the isomerization of 5-methylthioribose-1-phosphate to 5-methylthioribulose-1-phosphate in the methionine salvage pathway +S000030727 CDS YPR118W 16 767752 768987 W 2011-02-03 1996-07-31 +S000006635 tRNA_gene tK(UUU)P chromosome 16 L000003731 16 769302 769207 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034222 intron tK(UUU)P 16 769265 769243 C 2011-02-03 2000-05-19 +S000034221 noncoding_exon tK(UUU)P 16 769242 769207 C 2011-02-03 2000-05-19 +S000034220 noncoding_exon tK(UUU)P 16 769302 769266 C 2011-02-03 2000-05-19 +S000007216 long_terminal_repeat YPRWsigma2 chromosome 16 16 769319 769659 W 2011-02-03 2000-05-19 Ty3 LTR +S000006323 ORF Verified YPR119W CLB2 B-type cyclin CLB2 chromosome 16 L000000350 16 771653 773128 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the transition from G2 to M phase; accumulates during G2 and M, then targeted via a destruction box motif for ubiquitin-mediated degradation by the proteasome; CLB2 has a paralog, CLB1, that arose from the whole genome duplication +S000031564 CDS YPR119W 16 771653 773128 W 2011-02-03 1996-07-31 +S000006324 ORF Verified YPR120C CLB5 B-type cyclin CLB5 chromosome 16 L000000353 16 775182 773875 C 2011-02-03 1996-07-31 B-type cyclin involved in DNA replication during S phase; activates Cdc28p to promote initiation of DNA synthesis; functions in formation of mitotic spindles along with Clb3p and Clb4p; most abundant during late G1 phase; CLB5 has a paralog, CLB6, that arose from the whole genome duplication +S000030306 CDS YPR120C 16 775182 773875 C 2011-02-03 1996-07-31 +S000006529 tRNA_gene tC(GCA)P2 chromosome 16 L000003730 16 775836 775765 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis +S000037837 noncoding_exon tC(GCA)P2 16 775836 775765 C 2011-02-03 2000-05-19 +S000007211 long_terminal_repeat YPRWdelta14 chromosome 16 16 776093 776413 W 2011-02-03 2000-05-19 Ty1 LTR +S000007201 long_terminal_repeat YPRCdelta15 chromosome 16 16 776796 776667 C 2011-02-03 2000-05-19 Ty1 LTR +S000119041 ARS ARS1635 ARSXVI-777|ARS1626.5 chromosome 16 16 776926 777156 2011-02-03 2006-10-04 Autonomously Replicating Sequence +S000119042 ARS_consensus_sequence ARS1635 16 777098 777084 C 2011-02-03 2006-10-04 +S000007212 long_terminal_repeat YPRWdelta16 chromosome 16 16 777832 778154 W 2011-02-03 2000-05-19 Ty1 LTR +S000006325 ORF Verified YPR121W THI22 putative phosphomethylpyrimidine kinase chromosome 16 16 778583 780301 W 2011-02-03 1996-07-31|2011-02-03 Protein with similarity to hydroxymethylpyrimidine phosphate kinases; member of a gene family with THI20 and THI21; not required for thiamine biosynthesis; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000033668 CDS YPR121W 16 778583 780301 W 2011-02-03 1996-07-31|2011-02-03 +S000006326 ORF Verified YPR122W AXL1 STE22|FUS5 chromosome 16 L000002601 16 782045 785671 W 2011-02-03 1996-07-31 Haploid specific endoprotease of a-factor mating pheromone; performs one of two N-terminal cleavages during maturation of a-factor mating pheromone; required for axial budding pattern of haploid cells +S000033830 CDS YPR122W 16 782045 785671 W 2011-02-03 1996-07-31 +S000006328 ORF Verified YPR124W CTR1 high-affinity Cu transporter CTR1 chromosome 16 L000003063 16 786208 787428 W 2011-02-03 1996-07-31 High-affinity copper transporter of plasma membrane; mediates nearly all copper uptake under low copper conditions; transcriptionally induced at low copper levels and degraded at high copper levels; protein increases in abundance and relocalizes from nucleus to plasma membrane upon DNA replication stress; human homolog SLC31A1 can complement a yeast ctr1 ctr3 double deletion +S000034806 CDS YPR124W 16 786208 787428 W 2011-02-03 1996-07-31 +S000006327 ORF Dubious YPR123C chromosome 16 16 786575 786141 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially/completely overlaps the verified ORF CTR +S000033865 CDS YPR123C 16 786575 786141 C 2011-02-03 1996-07-31 +S000006329 ORF Verified YPR125W YLH47 MRS7 chromosome 16 16 787961 789325 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; exposed to the mitochondrial matrix; associates with mitochondrial ribosomes; NOT required for respiratory growth; homolog of human Letm1, a protein implicated in Wolf-Hirschhorn syndrome +S000034935 CDS YPR125W 16 787961 789325 W 2011-02-03 1996-07-31 +S000006330 ORF Dubious YPR126C chromosome 16 16 789385 789077 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034988 CDS YPR126C 16 789385 789077 C 2011-02-03 1996-07-31 +S000006331 ORF Verified YPR127W pyridoxine 4-dehydrogenase chromosome 16 16 790083 791120 W 2011-02-03 1996-07-31 Putative pyridoxine 4-dehydrogenase; differentially expressed during alcoholic fermentation; expression activated by transcription factor YRM1/YOR172W; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000035194 CDS YPR127W 16 790083 791120 W 2011-02-03 1996-07-31 +S000006332 ORF Verified YPR128C ANT1 chromosome 16 16 792204 791218 C 2011-02-03 1996-07-31 Peroxisomal adenine nucleotide transporter; involved in beta-oxidation of medium-chain fatty acid; required for peroxisome proliferation +S000036009 CDS YPR128C 16 792204 791218 C 2011-02-03 1996-07-31 +S000006333 ORF Verified YPR129W SCD6 LSM13 chromosome 16 L000001806 16 792687 793736 W 2011-02-03 1996-07-31 Repressor of translation initiation; binds eIF4G through its RGG domain and inhibits recruitment of the preinitiation complex; also contains an Lsm domain; may have a role in RNA processing; overproduction suppresses null mutation in clathrin heavy chain gene CHC1; forms cytoplasmic foci upon DNA replication stress +S000036168 CDS YPR129W 16 792687 793736 W 2011-02-03 1996-07-31 +S000006334 ORF Dubious YPR130C chromosome 16 16 793781 793374 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035652 CDS YPR130C 16 793781 793374 C 2011-02-03 1996-07-31 +S000006335 ORF Verified YPR131C NAT3 peptide alpha-N-acetyltransferase complex B subunit NAT3|RAD56|NAA20 chromosome 16 S000007464|S000029405|L000001576 16 794498 793911 C 84.8 2011-02-03 2003-05-23|1996-07-31 Catalytic subunit of the NatB N-terminal acetyltransferase; NatB catalyzes acetylation of the amino-terminal methionine residues of all proteins beginning with Met-Asp or Met-Glu and of some proteins beginning with Met-Asn or Met-Met +S000035762 CDS YPR131C 16 794498 793911 C 2011-02-03 2003-05-23|1996-07-31 +S000006336 ORF Verified YPR132W RPS23B uS12|ribosomal 40S subunit protein S23B|rp37|YS14|S28B|S23B|S12 chromosome 16 L000001765 16 794965 795767 W 2011-02-03 1996-07-31 Ribosomal protein 28 (rp28) of the small (40S) ribosomal subunit; required for translational accuracy; homologous to mammalian ribosomal protein S23 and bacterial S12; RPS23B has a paralog, RPS23A, that arose from the whole genome duplication; deletion of both RPS23A and RPS23B is lethal +S000035959 CDS YPR132W 16 794965 795029 W 2011-02-03 1996-07-31 +S000035960 CDS YPR132W 16 795395 795767 W 2011-02-03 1996-07-31 +S000035961 intron YPR132W 16 795030 795394 W 2011-02-03 1996-07-31 +S000006337 ORF Verified YPR133C SPN1 IWS1 chromosome 16 16 797210 795978 C 2011-02-03 1996-07-31 Protein involved in RNA polymerase II transcription; is constitutively recruited to the CYC1 promoter and is required for recruitment of chromatin remodeling factors for the expression of CYC1 gene; interacts genetically or physically with RNAP II, TBP, TFIIS, and chromatin remodelling factors; central domain highly conserved throughout eukaryotes; mutations confer an Spt- phenotype +S000037797 CDS YPR133C 16 797210 795978 C 2011-02-03 1996-07-31 +S000006433 ORF Verified YPR133W-A TOM5 MOM8A chromosome 16 L000003249 16 797557 797709 W 2011-02-03 1999-07-17 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import of all mitochondrially directed proteins; involved in transfer of precursors from the Tom70p and Tom20p receptors to the Tom40p pore +S000036542 CDS YPR133W-A 16 797557 797709 W 2011-02-03 1999-07-17 +S000006338 ORF Verified YPR134W MSS18 chromosome 16 L000001204 16 798051 798857 W 2011-02-03 1996-07-31 Nuclear encoded protein needed for splicing of mitochondrial intron; required for efficient splicing of mitochondrial COX1 aI5beta intron; mss18 mutations block cleavage of 5' exon - intron junction; phenotype of intronless strain suggests additional functions +S000029836 CDS YPR134W 16 798051 798857 W 2011-02-03 1996-07-31 +S000006339 ORF Verified YPR135W CTF4 chromatin-binding protein CTF4|POB1|CHL15 chromosome 16 L000000326 16 799234 802017 W 103 2011-02-03 1996-07-31 Chromatin-associated protein; required for sister chromatid cohesion; interacts with DNA polymerase alpha (Pol1p) and may link DNA synthesis to sister chromatid cohesion +S000029940 CDS YPR135W 16 799234 802017 W 2011-02-03 1996-07-31 +S000006341 ORF Verified YPR137W RRP9 chromosome 16 S000007466 16 802359 804080 W 2011-02-03 1996-07-31 Protein involved in pre-rRNA processing; associated with U3 snRNP; component of small ribosomal subunit (SSU) processosome; ortholog of the human U3-55k protein +S000031011 CDS YPR137W 16 802359 804080 W 2011-02-03 1996-07-31 +S000006340 ORF Dubious YPR136C chromosome 16 16 802837 802325 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF RRP9 +S000029987 CDS YPR136C 16 802837 802325 C 2011-02-03 1996-07-31 +S000007213 long_terminal_repeat YPRWdelta17 chromosome 16 16 804511 804638 W 2011-02-03 2000-05-19 Ty1 LTR +S000007202 long_terminal_repeat YPRCdelta18 chromosome 16 16 804978 804645 C 2011-02-03 2000-05-19 Ty1 LTR +S000007360 transposable_element_gene YPR137C-B gag-pol fusion protein chromosome 16 S000029020 16 810269 805001 C 2011-02-03 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034188 CDS YPR137C-B 16 808963 805001 C 2011-02-03 1997-07-17 +S000034187 CDS YPR137C-B 16 810269 808965 C 2011-02-03 1997-07-17 +S000034189 plus_1_translational_frameshift YPR137C-B 16 808964 808964 C 2011-02-03 1997-07-17 +S000007359 transposable_element_gene YPR137C-A gag protein chromosome 16 16 810269 808947 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034186 CDS YPR137C-A 16 810269 808947 C 2011-02-03 1996-07-31 +S000007208 LTR_retrotransposon YPRCTy1-2 Ty1 chromosome 16 16 810562 804645 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007203 long_terminal_repeat YPRCdelta19 chromosome 16 16 810562 810229 C 2011-02-03 2000-05-19 Ty1 LTR +S000006677 tRNA_gene tN(GUU)P chromosome 16 L000003725 16 810676 810749 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000030747 noncoding_exon tN(GUU)P 16 810676 810749 W 2011-02-03 2000-05-19 +S000006342 ORF Verified YPR138C MEP3 ammonium permease MEP3 chromosome 16 L000004105 16 812453 810984 C 2011-02-03 1996-07-31 Ammonium permease of high capacity and low affinity; belongs to a ubiquitous family of cytoplasmic membrane proteins that transport only ammonium (NH4+); expression is under the nitrogen catabolite repression regulation ammonia permease; MEP3 has a paralog, MEP1, that arose from the whole genome duplication +S000031048 CDS YPR138C 16 812453 810984 C 2011-02-03 1996-07-31 +S000006343 ORF Verified YPR139C LOA1 lysophosphatidic acid acyltransferase LOA1|VPS66 chromosome 16 16 814058 813156 C 2011-02-03 1996-07-31 Lysophosphatidic acid acyltransferase; involved in triacelglyceride homeostasis and lipid droplet formation; localized to lipid droplets and the ER; specificity for oleoyl-CoA +S000031180 CDS YPR139C 16 814058 813156 C 2011-02-03 1996-07-31 +S000006344 ORF Verified YPR140W TAZ1 lysophosphatidylcholine acyltransferase chromosome 16 16 814391 815536 W 2011-02-03 1996-07-31 Lyso-phosphatidylcholine acyltransferase; required for normal phospholipid content of mitochondrial membranes; major determinant of the final acyl chain composition of the mitochondrial-specific phospholipid cardiolipin; mutations in human ortholog tafazzin (TAZ) cause Barth syndrome, a rare X-linked disease characterized by skeletal and cardiomyopathy and bouts of cyclic neutropenia; a specific splice variant of human TAZ can complement yeast null mutant +S000030806 CDS YPR140W 16 814391 815536 W 2011-02-03 1996-07-31 +S000006345 ORF Verified YPR141C KAR3 OSR11 chromosome 16 L000000888 16 817923 815734 C 94.4 2011-02-03 1996-07-31 Minus-end-directed microtubule motor; functions in mitosis and meiosis, localizes to the spindle pole body and localization is dependent on functional Cik1p, required for nuclear fusion during mating; potential Cdc28p substrate +S000030832 CDS YPR141C 16 817923 815734 C 2011-02-03 1996-07-31 +S000006347 ORF Verified YPR143W RRP15 chromosome 16 16 818323 819075 W 2011-02-03 1996-07-31 Nucleolar protein; constituent of pre-60S ribosomal particles; required for proper processing of the 27S pre-rRNA at the A3 and B1 sites to yield mature 5.8S and 25S rRNAs +S000032060 CDS YPR143W 16 818323 819075 W 2011-02-03 1996-07-31 +S000006346 ORF Dubious YPR142C chromosome 16 16 818693 818130 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RRP15, which is required for ribosomal RNA processing +S000031843 CDS YPR142C 16 818693 818130 C 2011-02-03 1996-07-31 +S000118423 ARS ARS1627 ARSXVI-819 chromosome 16 16 819160 819399 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178201 ARS_consensus_sequence ARS1627 16 819340 819324 C 2014-11-18 2014-11-18 +S000006611 tRNA_gene tI(AAU)P1 chromosome 16 L000003726 16 819529 819602 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000035185 noncoding_exon tI(AAU)P1 16 819529 819602 W 2011-02-03 2000-05-19 +S000006348 ORF Verified YPR144C NOC4 ribosome biosynthesis protein NOC4|UTP19 chromosome 16 16 821423 819765 C 2011-02-03 1996-07-31 Nucleolar protein; forms a complex with Nop14p that mediates maturation and nuclear export of 40S ribosomal subunits; relocalizes to the cytosol in response to hypoxia +S000032106 CDS YPR144C 16 821423 819765 C 2011-02-03 1996-07-31 +S000006505 snoRNA_gene snR45 SNR45 chromosome 16 L000003412 16 821732 821903 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA) but not shown to be active; no target site is predicted within the ribosomal RNAs +S000030617 noncoding_exon snR45 16 821732 821903 W 2011-02-03 2000-05-19 +S000006349 ORF Verified YPR145W ASN1 asparagine synthase (glutamine-hydrolyzing) 1 chromosome 16 L000002732 16 822620 824338 W 2011-02-03 1996-07-31 Asparagine synthetase; catalyzes the synthesis of L-asparagine from L-aspartate in the asparagine biosynthetic pathway; ASN1 has a paralog, ASN2, that arose from the whole genome duplication +S000034141 CDS YPR145W 16 822620 824338 W 2011-02-03 1996-07-31 +S000113589 ORF Uncharacterized YPR145C-A chromosome 16 16 824926 824690 C 2011-02-03 2005-11-21 Putative protein of unknown function +S000113590 CDS YPR145C-A 16 824926 824690 C 2011-02-03 2005-11-21 +S000006350 ORF Dubious YPR146C chromosome 16 16 825676 825347 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034200 CDS YPR146C 16 825676 825347 C 2011-02-03 1996-07-31 +S000006351 ORF Verified YPR147C chromosome 16 16 826559 825645 C 2011-02-03 1996-07-31 Protein of unknown function; may have a role in lipid metabolism, based on localization to lipid droplets; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and is induced in response to the DNA-damaging agent MMS +S000034283 CDS YPR147C 16 826559 825645 C 2011-02-03 1996-07-31 +S000006352 ORF Verified YPR148C chromosome 16 16 828140 826833 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000034341 CDS YPR148C 16 828140 826833 C 2011-02-03 1996-07-31 +S000006353 ORF Verified YPR149W NCE102 NCE2 chromosome 16 L000003098 16 829918 830439 W 2011-02-03 1996-07-31 Protein of unknown function; contains transmembrane domains; involved in secretion of proteins that lack classical secretory signal sequences; component of the detergent-insoluble glycolipid-enriched complexes (DIGs); NCE102 has a paralog, FHN1, that arose from the whole genome duplication +S000035352 CDS YPR149W 16 829918 830439 W 2011-02-03 1996-07-31 +S000006354 ORF Dubious YPR150W chromosome 16 16 830999 831520 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SUE1/YPR151C +S000033972 CDS YPR150W 16 830999 831520 W 2011-02-03 1996-07-31 +S000006355 ORF Verified YPR151C SUE1 chromosome 16 16 831675 831055 C 2011-02-03 1996-07-31 Protein required for degradation of unstable forms of cytochrome c; located in the mitochondria +S000034039 CDS YPR151C 16 831675 831055 C 2011-02-03 1996-07-31 +S000006356 ORF Verified YPR152C URN1 chromosome 16 16 833458 832061 C 2011-02-03 1996-07-31 Protein of unknown function containing WW and FF domains; overexpression causes accumulation of cells in G1 phase +S000034921 CDS YPR152C 16 833458 832061 C 2011-02-03 1996-07-31 +S000006357 ORF Verified YPR153W MAY24 chromosome 16 16 833689 834245 W 2011-02-03 1996-07-31|2007-07-10 Protein of unknown function +S000035217 CDS YPR153W 16 833689 833693 W 2011-02-03 1996-07-31|2007-07-10 +S000123277 CDS YPR153W 16 833828 834245 W 2011-02-03 2007-07-10 +S000123276 intron YPR153W 16 833694 833827 W 2011-02-03 2007-07-10 +S000006358 ORF Verified YPR154W PIN3 LSB2 chromosome 16 16 834565 835212 W 2011-02-03 1996-07-31 Negative regulator of actin nucleation-promoting factor activity; interacts with Las17p, a homolog of human Wiskott-Aldrich Syndrome protein (WASP), via an N-terminal SH3 domain, and along with LSB1 cooperatively inhibits the nucleation of actin filaments; short-lived protein whose levels increase in response to thermal stress; induces the formation of the [PIN+] and [RNQ+] prions when overproduced; PIN3 has a paralog, LSB1, that arose from the whole genome duplication +S000036101 CDS YPR154W 16 834565 835212 W 2011-02-03 1996-07-31 +S000006359 ORF Verified YPR155C NCA2 chromosome 16 L000003161 16 837413 835563 C 2011-02-03 1996-07-31 Protein that regulates expression of Fo-F1 ATP synthase subunits; involved in the regulation of mitochondrial expression of subunits 6 (Atp6p) and 8 (Atp8p) of the Fo-F1 ATP synthase; functions with Nca3p +S000036159 CDS YPR155C 16 837413 835563 C 2011-02-03 1996-07-31 +S000006360 ORF Verified YPR156C TPO3 spermine transporter chromosome 16 16 839777 837909 C 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; specific for spermine; localizes to the plasma membrane; TPO3 has a paralog, TPO2, that arose from the whole genome duplication +S000036260 CDS YPR156C 16 839777 837909 C 2011-02-03 1996-07-31 +S000006361 ORF Uncharacterized YPR157W TDA6 chromosome 16 16 841266 842669 W 2011-02-03 1996-07-31 Putative protein of unknown function; induced by treatment with 8-methoxypsoralen and UVA irradiation; null mutant is sensitive to expression of the top1-T722A allele; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole; TDA6 has a paralog, VPS62, that arose from the whole genome duplication +S000036428 CDS YPR157W 16 841266 842669 W 2011-02-03 1996-07-31 +S000118424 ARS ARS1628 ARSXVI-843 chromosome 16 16 842653 842900 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178202 ARS_consensus_sequence ARS1628 16 842708 842724 W 2014-11-18 2014-11-18 +S000006362 ORF Verified YPR158W CUR1 chromosome 16 16 843262 844020 W 2011-02-03 1996-07-31 Sorting factor, central regulator of spatial protein quality control; physically and functionally interacts with chaperones to promote sorting and deposition of misfolded proteins into cytosolic compartments; involved in destabilization of [URE3] prions; CUR1 has a paralog, BTN2, that arose from the whole genome duplication +S000030121 CDS YPR158W 16 843262 844020 W 2011-02-03 1996-07-31 +S000007214 long_terminal_repeat YPRWdelta20 chromosome 16 16 844412 844749 W 2011-02-03 2000-05-19 Ty1 LTR +S000007220 LTR_retrotransposon YPRWTy1-3 Ty1 chromosome 16 16 844412 850340 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007363 transposable_element_gene YPR158W-A gag protein chromosome 16 16 844709 846031 W 2011-02-03 1999-07-17|1996-07-31 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000037619 CDS YPR158W-A 16 844709 846031 W 2011-02-03 1999-07-17 +S000007364 transposable_element_gene YPR158W-B gag-pol fusion protein chromosome 16 16 844709 849980 W 2011-02-03 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000037621 CDS YPR158W-B 16 844709 846013 W 2011-02-03 1997-07-17 +S000037622 CDS YPR158W-B 16 846015 849980 W 2011-02-03 1997-07-17 +S000037623 plus_1_translational_frameshift YPR158W-B 16 846014 846014 W 2011-02-03 1997-07-17 +S000007215 long_terminal_repeat YPRWdelta21 chromosome 16 16 850003 850340 W 2011-02-03 2000-05-19 Ty1 LTR +S000007204 long_terminal_repeat YPRCdelta22 chromosome 16 16 850512 850357 C 2011-02-03 2000-05-19 Ty1 LTR +S000130201 ARS ARS1629 chromosome 16 16 850512 850629 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000007205 long_terminal_repeat YPRCdelta23 chromosome 16 16 850966 850629 C 2011-02-03 2000-05-19 Ty1 LTR +S000007362 transposable_element_gene YPR158C-D gag-pol fusion protein chromosome 16 S000029021 16 856257 850989 C 2011-02-03 1997-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000035820 CDS YPR158C-D 16 854951 850989 C 2011-02-03 1997-07-17 +S000035819 CDS YPR158C-D 16 856257 854953 C 2011-02-03 1997-07-17 +S000035821 plus_1_translational_frameshift YPR158C-D 16 854952 854952 C 2011-02-03 1997-07-17 +S000007361 transposable_element_gene YPR158C-C gag protein chromosome 16 16 856257 854935 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035816 CDS YPR158C-C 16 856257 854935 C 2011-02-03 1999-07-17 +S000007217 long_terminal_repeat YPRWsigma3 chromosome 16 16 856545 856885 W 2011-02-03 2000-05-19 Ty3 LTR +S000007209 LTR_retrotransposon YPRCTy1-4 Ty1 chromosome 16 16 856554 850629 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007206 long_terminal_repeat YPRCdelta24 chromosome 16 16 856554 856217 C 2011-02-03 2000-05-19 Ty1 LTR +S000006520 tRNA_gene tA(AGC)P chromosome 16 L000003727 16 856902 856974 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032310 noncoding_exon tA(AGC)P 16 856902 856974 W 2011-02-03 2000-05-19 +S000006363 ORF Verified YPR159W KRE6 beta-glucan synthesis-associated protein KRE6|CWH48 chromosome 16 L000000915 16 857583 859745 W 95.9 2011-02-03 1996-07-31 Type II integral membrane protein; required for beta-1,6 glucan biosynthesis; putative beta-glucan synthase; localizes to ER, plasma membrane, sites of polarized growth and secretory vesicles; functionally redundant with Skn1p; KRE6 has a paralog, SKN1, that arose from the whole genome duplication +S000030298 CDS YPR159W 16 857583 859745 W 2011-02-03 1996-07-31 +S000006589 tRNA_gene tG(GCC)P2 chromosome 16 L000003728 16 860379 860449 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000031683 noncoding_exon tG(GCC)P2 16 860379 860449 W 2011-02-03 2000-05-19 +S000028725 ORF Uncharacterized YPR159C-A chromosome 16 16 860415 860314 C 2011-02-03 2003-07-29 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cytosol; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032712 CDS YPR159C-A 16 860415 860314 C 2011-02-03 2003-07-29 +S000006364 ORF Verified YPR160W GPH1 glycogen phosphorylase chromosome 16 L000000724 16 861306 864014 W 2011-02-03 1996-07-31 Glycogen phosphorylase required for the mobilization of glycogen; non-essential; regulated by cyclic AMP-mediated phosphorylation; phosphorylation by Cdc28p may coordinately regulate carbohydrate metabolism and the cell cycle; expression is regulated by stress-response elements and by the HOG MAP kinase pathway +S000029939 CDS YPR160W 16 861306 864014 W 2011-02-03 1996-07-31 +S000028860 ORF Dubious YPR160W-A chromosome 16 16 861934 862014 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry +S000034591 CDS YPR160W-A 16 861934 862014 W 2011-02-03 2003-07-29 +S000028726 ORF Dubious YPR160C-A chromosome 16 16 862861 862577 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032715 CDS YPR160C-A 16 862861 862577 C 2011-02-03 2003-07-29 +S000006365 ORF Verified YPR161C SGV1 cyclin-dependent serine/threonine protein kinase SGV1|BUR1 chromosome 16 L000001878 16 866422 864449 C 2011-02-03 1996-07-31 Cyclin (Bur2p)-dependent protein kinase; part of the BUR kinase complex which functions in transcriptional regulation; phosphorylates the carboxy-terminal domain (CTD) of Rpo21p and the C-terminal repeat domain of Spt5p; recruits Spt6p to the CTD at the onset of transcription; regulated by Cak1p; similar to metazoan CDK9 proteins +S000030002 CDS YPR161C 16 866422 864449 C 2011-02-03 1996-07-31 +S000006366 ORF Verified YPR162C ORC4 origin recognition complex subunit 4 chromosome 16 L000003075 16 868304 866715 C 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing; ORC4 has a paralog, RIF2, that arose from the whole genome duplication +S000030984 CDS YPR162C 16 868304 866715 C 2011-02-03 1996-07-31 +S000006367 ORF Verified YPR163C TIF3 eIF4B|STM1|RBL3 chromosome 16 L000002304 16 869955 868645 C 2011-02-03 1996-07-31 Translation initiation factor eIF-4B; contains an RNA recognition motif and binds to single-stranded RNA; has RNA annealing activity; interacts with Rps20p at the head of the 40S ribosomal subunit and alters the structure of the mRNA entry channel +S000031085 CDS YPR163C 16 869955 868645 C 2011-02-03 1996-07-31 +S000006368 ORF Verified YPR164W MMS1 SLM6|RTT108 chromosome 16 L000003933 16 870703 874926 W 2011-02-03 1996-07-31 Subunit of E3 ubiquitin ligase complex involved in replication repair; stabilizes protein components of the replication fork such as the fork-pausing complex and leading strand polymerase, preventing fork collapse and promoting efficient recovery during replication stress; regulates Ty1 transposition; involved with Rtt101p in nonfunctional rRNA decay +S000032195 CDS YPR164W 16 870703 874926 W 2011-02-03 1996-07-31 +S000006369 ORF Verified YPR165W RHO1 Rho family GTPase RHO1 chromosome 16 L000001630 16 875368 875997 W 2011-02-03 1996-07-31 GTP-binding protein of the rho subfamily of Ras-like proteins; involved in establishment of cell polarity; regulates protein kinase C (Pkc1p) and the cell wall synthesizing enzyme 1,3-beta-glucan synthase (Fks1p and Gsc2p) +S000032291 CDS YPR165W 16 875368 875997 W 2011-02-03 1996-07-31 +S000006370 ORF Verified YPR166C MRP2 mitochondrial 37S ribosomal protein MRP2 chromosome 16 L000001153 16 876629 876282 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000032335 CDS YPR166C 16 876629 876282 C 2011-02-03 1996-07-31 +S000006371 ORF Verified YPR167C MET16 phosphoadenylyl-sulfate reductase (thioredoxin) chromosome 16 L000001087 16 877632 876847 C 2011-02-03 1996-07-31 3'-phosphoadenylsulfate reductase; reduces 3'-phosphoadenylyl sulfate to adenosine-3',5'-bisphosphate and free sulfite using reduced thioredoxin as cosubstrate, involved in sulfate assimilation and methionine metabolism +S000032426 CDS YPR167C 16 877632 876847 C 2011-02-03 1996-07-31 +S000006372 ORF Verified YPR168W NUT2 mediator complex subunit NUT2|MED10 chromosome 16 L000003447|L000004593 16 878076 878549 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for transcriptional activation and has a role in basal transcription; protein abundance increases in response to DNA replication stress +S000034534 CDS YPR168W 16 878076 878549 W 2011-02-03 1996-07-31 +S000006373 ORF Verified YPR169W JIP5 chromosome 16 16 878690 880168 W 2011-02-03 1996-07-31|2005-12-01 Protein required for biogenesis of the large ribosomal subunit; required for biogenesis of the large ribosomal subunit; interacts with proteins involved in RNA processing, ribosome biogenesis, ubiquitination and demethylation; similar to WDR55, a human WD repeat protein; essential gene +S000034622 CDS YPR169W 16 878690 880168 W 2011-02-03 1996-07-31|2005-12-01 +S000006612 tRNA_gene tI(AAU)P2 chromosome 16 L000003729 16 880369 880296 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000035187 noncoding_exon tI(AAU)P2 16 880369 880296 C 2011-02-03 2000-05-19 +S000007218 long_terminal_repeat YPRWsigma4 chromosome 16 16 880386 880726 W 2011-02-03 2000-05-19 Ty3 LTR +S000118425 ARS ARS1630 ARSXVI-881 chromosome 16 16 880861 881108 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178203 ARS_consensus_sequence ARS1630 16 880905 880921 W 2014-11-18 2014-11-18 +S000007207 long_terminal_repeat YPRCtau3 chromosome 16 16 881830 881487 C 2011-02-03 2000-05-19 Ty4 LTR +S000028591 ORF Dubious YPR169W-A chromosome 16 16 883239 883457 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps two other dubious ORFs: YPR170C and YPR170W-B +S000031363 CDS YPR169W-A 16 883239 883457 W 2011-02-03 2003-07-29 +S000028515 ORF Uncharacterized YPR170W-B chromosome 16 16 883239 883595 W 2011-02-03 2003-07-29 Putative protein of unknown function; conserved in fungi; SWAT-GFP fusion protein localizes to the vacuole membrane; partially overlaps the dubious genes YPR169W-A, YPR170W-A and YRP170C +S000030284 CDS YPR170W-B 16 883239 883387 W 2011-02-03 2003-07-29 +S000030285 CDS YPR170W-B 16 883487 883595 W 2011-02-03 2003-07-29 +S000030286 intron YPR170W-B 16 883388 883486 W 2011-02-03 2003-07-29 +S000006374 ORF Dubious YPR170C chromosome 16 16 883318 882983 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORFs YPR169W-A and YPR170W-B +S000033271 CDS YPR170C 16 883318 882983 C 2011-02-03 1996-07-31 +S000028861 ORF Dubious YPR170W-A chromosome 16 16 883378 883563 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry +S000034592 CDS YPR170W-A 16 883378 883563 W 2011-02-03 2003-07-29 +S000006375 ORF Verified YPR171W BSP1 chromosome 16 16 883828 885558 W 2011-02-03 1996-07-31 Adapter that links synaptojanins to the cortical actin cytoskeleton; the synaptojanins are Inp52p and Inp53p +S000034199 CDS YPR171W 16 883828 885558 W 2011-02-03 1996-07-31 +S000006376 ORF Uncharacterized YPR172W pyridoxal 5'-phosphate synthase chromosome 16 16 885796 886398 W 2011-02-03 1996-07-31 Protein of unknown function; predicted to encode a pyridoxal 5'-phosphate synthase based on sequence similarity but purified protein does not possess this activity, nor does it bind flavin mononucleotide (FMN); transcriptionally activated by Yrm1p along with genes involved in multidrug resistance; YPR172W has a paralog, YLR456W, that arose from the whole genome duplication +S000034326 CDS YPR172W 16 885796 886398 W 2011-02-03 1996-07-31 +S000006377 ORF Verified YPR173C VPS4 AAA family ATPase VPS4|DID6|VPT10|VPL4|GRD13|END13|CSC1 chromosome 16 L000002956 16 887837 886524 C 2011-02-03 1996-07-31 AAA-ATPase involved in multivesicular body (MVB) protein sorting; ATP-bound Vps4p localizes to endosomes and catalyzes ESCRT-III disassembly and membrane release; ATPase activity is activated by Vta1p; regulates cellular sterol metabolism +S000034362 CDS YPR173C 16 887837 886524 C 2011-02-03 1996-07-31 +S000006378 ORF Verified YPR174C chromosome 16 16 888708 888043 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nuclear periphery; potential Cdc28p substrate; binds phosphatidylinositols and phosphatidylethanolamine in a large-scale study; relative distribution to foci at the nuclear periphery increases upon DNA replication stress; YPR174C has a paralog, NBP1, that arose from the whole genome duplication +S000035379 CDS YPR174C 16 888708 888043 C 2011-02-03 1996-07-31 +S000006379 ORF Verified YPR175W DPB2 DNA polymerase epsilon noncatalytic subunit chromosome 16 L000000519 16 888974 891043 W 2011-02-03 2003-09-22|1996-07-31 Second largest subunit of DNA polymerase II (DNA polymerase epsilon); required for maintenance of fidelity of chromosomal replication; essential motif in C-terminus is required for formation of the four-subunit Pol epsilon; expression peaks at the G1/S phase boundary; Cdc28p substrate +S000035567 CDS YPR175W 16 888974 891043 W 2011-02-03 2003-09-22|1996-07-31 +S000006380 ORF Verified YPR176C BET2 Rab geranylgeranyltransferase BET2 chromosome 16 L000000172 16 892078 891101 C 2011-02-03 1996-07-31 Beta subunit of Type II geranylgeranyltransferase; required for vesicular transport between the endoplasmic reticulum and the Golgi; provides a membrane attachment moiety to Rab-like proteins Ypt1p and Sec4p; human homolog RABGGTB can complement yeast BET2 mutant +S000035598 CDS YPR176C 16 892078 891101 C 2011-02-03 1996-07-31 +S000006382 ORF Verified YPR178W PRP4 U4/U6-U5 snRNP complex subunit PRP4|RNA4 chromosome 16 L000001497 16 892332 893729 W 2011-02-03 1996-07-31 Splicing factor; component of the U4/U6-U5 snRNP complex +S000036653 CDS YPR178W 16 892332 893729 W 2011-02-03 1996-07-31 +S000006381 ORF Dubious YPR177C chromosome 16 16 892684 892313 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the 5' end of the essential PRP4 gene encoding a component of the U4/U6-U5 snRNP complex +S000036500 CDS YPR177C 16 892684 892313 C 2011-02-03 1996-07-31 +S000006383 ORF Verified YPR179C HDA3 PLO1 chromosome 16 16 895764 893797 C 2011-02-03 1996-07-31 Subunit of the HDA1 histone deacetylase complex; possibly tetrameric trichostatin A-sensitive class II histone deacetylase complex contains Hda1p homodimer and an Hda2p-Hda3p heterodimer; required for the activity of the complex; relocalizes to the cytosol in response to hypoxia; similar to Hda2p +S000036672 CDS YPR179C 16 895764 893797 C 2011-02-03 1996-07-31 +S000006384 ORF Verified YPR180W AOS1 E1 ubiquitin-activating protein AOS1|RHC31 chromosome 16 L000004031 16 895961 897004 W 2011-02-03 1996-07-31 Subunit of heterodimeric nuclear SUMO activating enzyme E1 with Uba2p; activates Smt3p (SUMO) before its conjugation to proteins (sumoylation), which may play a role in protein targeting; essential for viability; relocalizes to the cytosol in response to hypoxia +S000030253 CDS YPR180W 16 895961 897004 W 2011-02-03 1996-07-31 +S000006385 ORF Verified YPR181C SEC23 GTPase-activating protein SEC23 chromosome 16 L000001846|S000028412 16 899667 897361 C 2011-02-03 1996-07-31 GTPase-activating protein, stimulates the GTPase activity of Sar1p; component of the Sec23p-Sec24p heterodimer of the COPII vesicle coat, involved in ER to Golgi transport; substrate of Ubp3/Bre5 complex; ubiquitylated by Ub-ligase Rsp5p; proteasome-mediated degradation of Sec23p is regulated by Cdc48p +S000030311 CDS YPR181C 16 899667 897361 C 2011-02-03 1996-07-31 +S000006386 ORF Verified YPR182W SMX3 mRNA splicing protein SMX3|Sm F|SmF chromosome 16 L000002786 16 900194 900454 W 2011-02-03 1996-07-31 Core Sm protein Sm F; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Smd3p, Sme1p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm F +S000030535 CDS YPR182W 16 900194 900454 W 2011-02-03 1996-07-31 +S000006387 ORF Verified YPR183W DPM1 dolichyl-phosphate beta-D-mannosyltransferase|SED3 chromosome 16 L000000524 16 900755 901558 W 2011-02-03 1996-07-31 Dolichol phosphate mannose (Dol-P-Man) synthase of ER membrane; catalyzes formation of Dol-P-Man from Dol-P and GDP-Man; required for biosynthesis of glycosyl phosphatidylinositol (GPI) membrane anchor, as well as O-mannosylation and protein N- and O-linked glycosylation; human homolog DPM1 can complement yeast mutant strains +S000031445 CDS YPR183W 16 900755 901558 W 2011-02-03 1996-07-31 +S000006388 ORF Verified YPR184W GDB1 bifunctional 4-alpha-glucanotransferase/amylo-alpha-1,6-glucosidase chromosome 16 16 902044 906654 W 2011-02-03 1996-07-31 Glycogen debranching enzyme; contains glucanotranferase and alpha-1,6-amyloglucosidase activities; required for glycogen degradation; phosphorylated in mitochondria; activity is inhibited by Igd1p; protein abundance increases in response to DNA replication stress +S000031566 CDS YPR184W 16 902044 906654 W 2011-02-03 1996-07-31 +S000006389 ORF Verified YPR185W ATG13 serine/threonine protein kinase regulatory subunit ATG13|APG13 chromosome 16 L000003956 16 907218 909434 W 2011-02-03 1996-07-31 Regulatory subunit of the Atg1p signaling complex; stimulates Atg1p kinase activity; required for vesicle formation during autophagy and the cytoplasm-to-vacuole targeting (Cvt) pathway; contains a HORMA domain required for autophagy and for recruitment of the phosphatidylinositol 3-kinase complex subunit Atg14p to the pre-autophagosomal structure +S000031704 CDS YPR185W 16 907218 909434 W 2011-02-03 1996-07-31 +S000006390 ORF Verified YPR186C PZF1 TFC2 chromosome 16 L000002286|L000001544 16 911022 909733 C 2011-02-03 1996-07-31 Transcription factor IIIA (TFIIIA); essential DNA binding protein required for transcription of 5S rRNA by RNA polymerase III; not involved in transcription of other RNAP III genes; nine conserved zinc fingers; may also bind 5S rRNA +S000032601 CDS YPR186C 16 911022 909733 C 2011-02-03 1996-07-31 +S000006391 ORF Verified YPR187W RPO26 DNA-directed RNA polymerase core subunit RPO26|ABC23|RPB6 chromosome 16 L000001745 16 911257 911800 W 2011-02-03 1996-07-31 RNA polymerase subunit ABC23; common to RNA polymerases I, II, and III; part of central core; similar to bacterial omega subunit +S000032734 CDS YPR187W 16 911257 911276 W 2011-02-03 1996-07-31 +S000032735 CDS YPR187W 16 911353 911800 W 2011-02-03 1996-07-31 +S000032736 intron YPR187W 16 911277 911352 W 2011-02-03 1996-07-31 +S000006392 ORF Verified YPR188C MLC2 chromosome 16 S000007532 16 912479 911988 C 2011-02-03 1996-07-31 Regulatory light chain for the type II myosin Myo1p; binds to an IQ motif of Myo1p, localization to the bud neck depends on Myo1p; involved in the disassembly of the Myo1p ring +S000032770 CDS YPR188C 16 912479 911988 C 2011-02-03 1996-07-31 +S000006393 ORF Verified YPR189W SKI3 SKI complex subunit tetratricopeptide repeat protein SKI3|SKI5 chromosome 16 L000001904 16 912664 916962 W 2011-02-03 1996-07-31 Ski complex component and TPR protein; mediates 3'-5' RNA degradation by the cytoplasmic exosome; null mutants have superkiller phenotype of increased viral dsRNAs and are synthetic lethal with mutations in 5'-3' mRNA decay; mutations in the human ortholog, TTC37, causes Syndromic diarrhea/Trichohepatoenteric (SD/THE) syndrome +S000034826 CDS YPR189W 16 912664 916962 W 2011-02-03 1996-07-31 +S000006394 ORF Verified YPR190C RPC82 DNA-directed RNA polymerase III subunit C82|RPC80|RPC3 chromosome 16 L000001693|S000029422|L000001692 16 919041 917077 C 2011-02-03 1996-07-31 RNA polymerase III subunit C82 +S000033015 CDS YPR190C 16 919041 917077 C 2011-02-03 1996-07-31 +S000006395 ORF Verified YPR191W QCR2 ubiquinol--cytochrome-c reductase subunit 2|UCR2|COR2 chromosome 16 L000001545 16 919381 920487 W 2011-02-03 1996-07-31 Subunit 2 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; phosphorylated; transcription is regulated by Hap1p, Hap2p/Hap3p, and heme +S000033835 CDS YPR191W 16 919381 920487 W 2011-02-03 1996-07-31 +S000006396 ORF Verified YPR192W AQY1 chromosome 16 L000004720 16 921860 922777 W 2011-02-03 1996-07-31 Spore-specific water channel; mediates the transport of water across cell membranes, developmentally controlled; may play a role in spore maturation, probably by allowing water outflow, may be involved in freeze tolerance +S000033980 CDS YPR192W 16 921860 922777 W 2011-02-03 1996-07-31 +S000006397 ORF Verified YPR193C HPA2 histone acetyltransferase|KAT10 chromosome 16 L000004379 16 923379 922909 C 2011-02-03 1996-07-31 Tetrameric histone acetyltransferase; has similarity to Gcn5p, Hat1p, Elp3p, and Hpa3p; acetylates histones H3 and H4 in vitro and exhibits autoacetylation activity; also acetylates polyamines +S000034022 CDS YPR193C 16 923379 922909 C 2011-02-03 1996-07-31 +S000006398 ORF Verified YPR194C OPT2 chromosome 16 16 926937 924304 C 2011-02-03 1996-07-31 Oligopeptide transporter; localized to peroxisomes and affects glutathione redox homeostasis; also localizes to the plasma membrane (PM) and to the late Golgi, and has a role in maintenance of lipid asymmetry between the inner and outer leaflets of the PM; member of the OPT family, with potential orthologs in S. pombe and C. albicans; also plays a role in formation of mature vacuoles and in polarized cell growth +S000034902 CDS YPR194C 16 926937 924304 C 2011-02-03 1996-07-31 +S000006399 ORF Dubious YPR195C chromosome 16 16 928294 927965 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035080 CDS YPR195C 16 928294 927965 C 2011-02-03 1996-07-31 +S000006400 ORF Uncharacterized YPR196W putative maltose-responsive transcription factor chromosome 16 16 931376 932788 W 2011-02-03 1996-07-31 Putative maltose-responsive transcription factor +S000036124 CDS YPR196W 16 931376 932788 W 2011-02-03 1996-07-31 +S000118426 ARS ARS1631 ARSXVI-933 chromosome 16 16 932983 933229 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178204 ARS_consensus_sequence ARS1631 16 933165 933149 C 2014-11-18 2014-11-18 +S000007219 long_terminal_repeat YPRWtau4 chromosome 16 16 933071 933404 W 2011-02-03 2000-05-19 Ty4 LTR +S000006402 ORF Verified YPR198W SGE1 NOR1 chromosome 16 L000001876 16 934034 935665 W 84.8 2011-02-03 1996-07-31 Plasma membrane multidrug transporter; member of the major facilitator superfamily; acts as an extrusion permease; partial multicopy suppressor of gal11 mutations +S000036370 CDS YPR198W 16 934034 935665 W 2011-02-03 1996-07-31 +S000006401 ORF Dubious YPR197C chromosome 16 16 934461 933898 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SGE1/YPR198W +S000036181 CDS YPR197C 16 934461 933898 C 2011-02-03 1996-07-31 +S000006403 ORF Verified YPR199C ARR1 ACR1|YAP8 chromosome 16 L000004292 16 939032 938148 C 2011-02-03 1996-07-31 Transcriptional activator of the basic leucine zipper (bZIP) family; required for transcription of genes involved in resistance to arsenic compounds; directly binds trivalent arsenic (As(III)) as does K. lactis ortholog, KIYAP8 +S000036409 CDS YPR199C 16 939032 938148 C 2011-02-03 1996-07-31 +S000006404 ORF Verified YPR200C ARR2 ACR2 chromosome 16 L000004293|L000004290 16 939671 939279 C 2011-02-03 1996-07-31 Arsenate reductase required for arsenate resistance; converts arsenate to arsenite which can then be exported from cells by Arr3p +S000034447 CDS YPR200C 16 939671 939279 C 2011-02-03 1996-07-31 +S000006405 ORF Verified YPR201W ARR3 ACR3 chromosome 16 L000004323 16 939922 941136 W 2011-02-03 1996-07-31 Plasma membrane metalloid/H+ antiporter; member of bile/arsenite/riboflavin transporter (BART) superfamily; transports arsenite and antimonite; required for resistance to arsenic compounds; transcription is activated by Arr1p in the presence of arsenite +S000034611 CDS YPR201W 16 939922 941136 W 2011-02-03 1996-07-31 +S000130202 ARS ARS1632 chromosome 16 16 942084 943032 2011-02-03 2009-05-08 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000029002 telomere TEL16R chromosome 16 16 942396 948010 W 106 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the right arm of Chromosome XVI; annotated components include an X element core sequence and a short Y' element; TEL16R does have telomeric repeats (TEL16R-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly +S000029003 X_element TEL16R 16 942396 942771 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome XVI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000029004 Y_prime_element TEL16R 16 942810 948010 W 2011-02-03 2003-09-09|2011-02-03 Telomeric short Y' element on the right arm of Chromosome XVI; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs YPR202W, YPR203W, YPR204W, and YPR204C-A +S000006406 ORF Uncharacterized YPR202W chromosome 16 16 943032 943896 W 2011-02-03 1996-07-31 Putative protein of unknown function; similar to telomere-encoded helicases; down-regulated at low calcium levels; YPR202W is not an essential gene; transcript is predicted to be spliced but there is no evidence that it is spliced in vivo +S000034726 CDS YPR202W 16 943032 943050 W 2011-02-03 1996-07-31 +S000034727 CDS YPR202W 16 943199 943896 W 2011-02-03 1996-07-31 +S000034728 intron YPR202W 16 943051 943198 W 2011-02-03 1996-07-31 +S000006407 ORF Uncharacterized YPR203W chromosome 16 16 943880 944188 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000035720 CDS YPR203W 16 943880 944188 W 2011-02-03 1996-07-31 +S000006408 ORF Verified YPR204W Y' -Help1|Y' element ATP-dependent helicase chromosome 16 16 944603 947701 W 2011-02-03 1996-07-31 DNA helicase encoded within the telomeric Y' element; Y' -helicase protein 1 +S000035834 CDS YPR204W 16 944603 947701 W 2011-02-03 1996-07-31 +S000028727 ORF Dubious YPR204C-A chromosome 16 16 947338 946856 C 2011-02-03 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032717 CDS YPR204C-A 16 947338 946856 C 2011-02-03 2003-07-29 +S000007328 tRNA_gene tP(UGG)Q chromosome 17 L000004903 17 731 802 W 2000-05-19 2000-05-19 Mitochondrial proline tRNA (tRNA-Pro) +S000036040 noncoding_exon tP(UGG)Q 17 731 802 W 2000-05-19 2000-05-19 +S000007257 ORF Dubious Q0010 ORF6 chromosome 17 L000004921 17 3952 4338 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF Q0017 +S000036184 CDS Q0010 17 3952 4338 W 2000-05-19 2000-05-19 +S000007258 ORF Dubious Q0017 ORF7 chromosome 17 L000004922 17 4254 4415 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF Q0010 +S000036188 CDS Q0017 17 4254 4415 W 2000-05-19 2000-05-19 +S000029667 origin_of_replication ORI1 ORI1 chromosome 17 L000001308 17 4312 4012 C 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007287 rRNA_gene Q0020 15S_RRNA 14s rRNA|15S_RRNA_2 chromosome 17 L000004882 17 6546 8194 W 2000-05-19 2000-05-19 Ribosomal RNA of the small mitochondrial ribosomal subunit; MSU1 allele suppresses ochre stop mutations in mitochondrial protein-coding genes +S000037488 noncoding_exon Q0020 17 6546 8194 W 2000-05-19 2000-05-19 +S000007337 tRNA_gene tW(UCA)Q chromosome 17 L000004912 17 9374 9447 W 2000-05-19 2000-05-19 Mitochondrial tRNA, annotated as tryptophanyl tRNA (tRNA-Trp); predicted by tRNAscan-SE analysis to have specificity for selenocysteine +S000031464 noncoding_exon tW(UCA)Q 17 9374 9447 W 2000-05-19 2000-05-19 +S000007259 ORF Dubious Q0032 ORF8 chromosome 17 L000004923 17 11667 11957 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036376 CDS Q0032 17 11667 11957 W 2000-05-19 2000-05-19 +S000029331 origin_of_replication ORI8 ORI8 chromosome 17 L000003958 17 12780 12510 C 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007261 ORF Verified Q0050 AI1 intron-encoded reverse transcriptase aI1 chromosome 17 L000000066|L000004925 17 13818 16322 W 2000-05-19 2000-05-19 Reverse transcriptase required for splicing of the COX1 pre-mRNA; encoded by a mobile group II intron within the mitochondrial COX1 gene +S000037112 CDS Q0050 17 13818 16322 W 2000-05-19 2000-05-19 +S000007262 ORF Verified Q0055 AI2 intron-encoded reverse transcriptase aI2 chromosome 17 L000004926|L000000067 17 13818 18830 W 2000-05-19 2000-05-19 Reverse transcriptase required for splicing of the COX1 pre-mRNA; encoded by a mobile group II intron within the mitochondrial COX1 gene +S000037125 CDS Q0055 17 13818 13986 W 2000-05-19 2000-05-19 +S000037126 CDS Q0055 17 16435 18830 W 2000-05-19 2000-05-19 +S000037127 intron Q0055 17 13987 16434 W 2000-05-19 2000-05-19 +S000007263 ORF Verified Q0060 AI3 intron-encoded DNA endonuclease aI3|I-SceIII chromosome 17 L000004927|L000000068 17 13818 19996 W 2000-05-19 2000-05-19|2006-01-12 Endonuclease I-SceIII; encoded by a mobile group I intron within the mitochondrial COX1 gene +S000037203 CDS Q0060 17 13818 13986 W 2000-05-19 2000-05-19 +S000114045 CDS Q0060 17 16435 16470 W 2006-01-12 2006-01-12 +S000037204 CDS Q0060 17 18954 19996 W 2000-05-19 2000-05-19 +S000037205 intron Q0060 17 13987 16434 W 2006-01-12 2000-05-19|2006-01-12 +S000114046 intron Q0060 17 16471 18953 W 2006-01-12 2006-01-12 +S000007264 ORF Verified Q0065 AI4 intron-encoded DNA endonuclease aI4|I-SceII chromosome 17 L000004928|L000004885 17 13818 21935 W 2000-05-19 2000-05-19|2006-01-12 Endonuclease I-SceII; encoded by a mobile group I intron within the mitochondrial COX1 gene; intron is normally spliced by the BI4p maturase but AI4p can mutate to acquire the same maturase activity +S000037224 CDS Q0065 17 13818 13986 W 2000-05-19 2000-05-19 +S000114047 CDS Q0065 17 16435 16470 W 2006-01-12 2006-01-12 +S000037225 CDS Q0065 17 18954 18991 W 2000-05-19 2000-05-19 +S000037226 CDS Q0065 17 20508 21935 W 2000-05-19 2000-05-19 +S000037227 intron Q0065 17 13987 16434 W 2006-01-12 2000-05-19|2006-01-12 +S000114048 intron Q0065 17 16471 18953 W 2006-01-12 2006-01-12 +S000037228 intron Q0065 17 18992 20507 W 2000-05-19 2000-05-19 +S000007265 ORF Verified Q0070 AI5_ALPHA intron-encoded DNA endonuclease aI5 alpha chromosome 17 L000004929|L000004886 17 13818 23167 W 2000-05-19 2000-05-19 Endonuclease I-SceIV; involved in intron mobility; encoded by a mobile group I intron within the mitochondrial COX1 gene +S000029861 CDS Q0070 17 13818 13986 W 2000-05-19 2000-05-19 +S000029862 CDS Q0070 17 16435 16470 W 2000-05-19 2000-05-19 +S000029863 CDS Q0070 17 18954 18991 W 2000-05-19 2000-05-19 +S000029864 CDS Q0070 17 20508 20984 W 2000-05-19 2000-05-19 +S000029865 CDS Q0070 17 21995 23167 W 2000-05-19 2000-05-19 +S000029866 intron Q0070 17 13987 16434 W 2000-05-19 2000-05-19 +S000029867 intron Q0070 17 16471 18953 W 2000-05-19 2000-05-19 +S000029868 intron Q0070 17 18992 20507 W 2000-05-19 2000-05-19 +S000029869 intron Q0070 17 20985 21994 W 2000-05-19 2000-05-19 +S000007260 ORF Verified Q0045 COX1 cytochrome c oxidase subunit 1|OXI3 chromosome 17 L000004924|L000000383|L000001321 17 13818 26701 W 2000-05-19 2000-05-19 Subunit I of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; one of three mitochondrially-encoded subunits +S000037020 CDS Q0045 17 13818 13986 W 2000-05-19 2000-05-19 +S000037021 CDS Q0045 17 16435 16470 W 2000-05-19 2000-05-19 +S000037022 CDS Q0045 17 18954 18991 W 2000-05-19 2000-05-19 +S000037023 CDS Q0045 17 20508 20984 W 2000-05-19 2000-05-19 +S000037024 CDS Q0045 17 21995 22246 W 2000-05-19 2000-05-19 +S000037025 CDS Q0045 17 23612 23746 W 2000-05-19 2000-05-19 +S000037026 CDS Q0045 17 25318 25342 W 2000-05-19 2000-05-19 +S000037027 CDS Q0045 17 26229 26701 W 2000-05-19 2000-05-19 +S000037028 intron Q0045 17 13987 16434 W 2000-05-19 2000-05-19 +S000037029 intron Q0045 17 16471 18953 W 2000-05-19 2000-05-19 +S000037030 intron Q0045 17 18992 20507 W 2000-05-19 2000-05-19 +S000037031 intron Q0045 17 20985 21994 W 2000-05-19 2000-05-19 +S000037032 intron Q0045 17 22247 23611 W 2000-05-19 2000-05-19 +S000037033 intron Q0045 17 23747 25317 W 2000-05-19 2000-05-19 +S000037034 intron Q0045 17 25343 26228 W 2000-05-19 2000-05-19 +S000007266 ORF Uncharacterized Q0075 AI5_BETA intron-encoded DNA endonuclease aI5 beta chromosome 17 L000004887|L000004930 17 24156 25255 W 2000-05-19 2000-05-19 Protein of unknown function; encoded within an intron of the mitochondrial COX1 gene; translational initiation codon is predicted to be ATA rather than ATG +S000029881 CDS Q0075 17 24156 24870 W 2000-05-19 2000-05-19 +S000029882 CDS Q0075 17 24906 25255 W 2000-05-19 2000-05-19 +S000029883 intron Q0075 17 24871 24905 W 2000-05-19 2000-05-19 +S000007267 ORF Verified Q0080 ATP8 F1F0 ATP synthase subunit 8|AAP1 chromosome 17 L000004931|L000002723|L000002797 17 27666 27812 W 2000-05-19 2000-05-19 Subunit 8 of the F0 sector of mitochondrial F1F0 ATP synthase; encoded on the mitochondrial genome; ATP8 and ATP6 mRNAs are not translated in the absence of the F1 sector of ATPase +S000029967 CDS Q0080 17 27666 27812 W 2000-05-19 2000-05-19 +S000007268 ORF Verified Q0085 ATP6 F1F0 ATP synthase subunit a|PHO1|OLI4|OLI2 chromosome 17 L000004932|L000001300|L000002722|L000001418|L000001299 17 28487 29266 W 2000-05-19 2000-05-19 Subunit a of the F0 sector of mitochondrial F1F0 ATP synthase; mitochondrially encoded; translation is specifically activated by Atp22p; ATP6 and ATP8 mRNAs are not translated in the absence of the F1 sector of ATPase; mutations in human ortholog MT-ATP6 are associated with neurodegenerative disorders such as Neurogenic Ataxia and Retinitis Pigmentosa (NARP), Leigh syndrome (LS), Charcot-Marie-Tooth (CMT), and ataxia telangiectasia +S000029982 CDS Q0085 17 28487 29266 W 2000-05-19 2000-05-19 +S000029673 origin_of_replication ORI7 ORI7 chromosome 17 L000001314 17 30220 30594 W 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007269 ORF Dubious Q0092 ORF5 chromosome 17 L000004933 17 30874 31014 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030082 CDS Q0092 17 30874 31014 W 2000-05-19 2000-05-19 +S000029668 origin_of_replication ORI2 ORI2 chromosome 17 L000001309 17 32231 32501 W 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007318 tRNA_gene tE(UUC)Q chromosome 17 L000004893 17 35373 35444 W 2000-05-19 2000-05-19 Mitochondrial glutamate tRNA (tRNA-Glu); predicted by tRNAscan-SE analysis +S000036036 noncoding_exon tE(UUC)Q 17 35373 35444 W 2000-05-19 2000-05-19 +S000007271 ORF Verified Q0110 BI2 cytochrome b mRNA maturase bI2 chromosome 17 L000004935|L000004888 17 36540 38579 W 2000-05-19 2000-05-19 Mitochondrial mRNA maturase with a role in splicing; encoded by both exon and intron sequences of partially processed COB mRNA +S000031214 CDS Q0110 17 36540 36954 W 2000-05-19 2000-05-19 +S000031215 CDS Q0110 17 37723 38579 W 2000-05-19 2000-05-19 +S000031216 intron Q0110 17 36955 37722 W 2000-05-19 2000-05-19 +S000007272 ORF Verified Q0115 BI3 cytochrome b mRNA maturase bI3 chromosome 17 L000004936|L000000176 17 36540 40265 W 2000-05-19 2000-05-19 Mitochondrial mRNA maturase; forms a complex with Mrs1p to mediate splicing of the bI3 intron of the COB gene; encoded by both exon and intron sequences of partially processed COB mRNA +S000031224 CDS Q0115 17 36540 36954 W 2000-05-19 2000-05-19 +S000031225 CDS Q0115 17 37723 37736 W 2000-05-19 2000-05-19 +S000031226 CDS Q0115 17 39141 40265 W 2000-05-19 2000-05-19 +S000031227 intron Q0115 17 36955 37722 W 2000-05-19 2000-05-19 +S000031228 intron Q0115 17 37737 39140 W 2000-05-19 2000-05-19 +S000007273 ORF Verified Q0120 BI4 intron-encoded RNA maturase bI4 chromosome 17 L000000177|L000004937 17 36540 42251 W 2000-05-19 2000-05-19 Mitochondrial mRNA maturase; forms a complex with Nam2p to mediate splicing of the bI4 intron of the COB gene; encoded by both exon and intron sequences of partially processed COB mRNA +S000032184 CDS Q0120 17 36540 36954 W 2000-05-19 2000-05-19 +S000032185 CDS Q0120 17 37723 37736 W 2000-05-19 2000-05-19 +S000032186 CDS Q0120 17 39141 39217 W 2000-05-19 2000-05-19 +S000032187 CDS Q0120 17 40841 42251 W 2000-05-19 2000-05-19 +S000032188 intron Q0120 17 36955 37722 W 2000-05-19 2000-05-19 +S000032189 intron Q0120 17 37737 39140 W 2000-05-19 2000-05-19 +S000032190 intron Q0120 17 39218 40840 W 2000-05-19 2000-05-19 +S000007270 ORF Verified Q0105 COB cytochrome b|CYTB|COB1 chromosome 17 L000004934|L000000376 17 36540 43647 W 2000-05-19 2000-05-19 Cytochrome b; mitochondrially encoded subunit of the ubiquinol-cytochrome c reductase complex which includes Cobp, Rip1p, Cyt1p, Cor1p, Qcr2p, Qcr6p, Qcr7p, Qcr8p, Qcr9p, and Qcr10p +S000031165 CDS Q0105 17 36540 36954 W 2000-05-19 2000-05-19 +S000031166 CDS Q0105 17 37723 37736 W 2000-05-19 2000-05-19 +S000031167 CDS Q0105 17 39141 39217 W 2000-05-19 2000-05-19 +S000031168 CDS Q0105 17 40841 41090 W 2000-05-19 2000-05-19 +S000031169 CDS Q0105 17 42508 42558 W 2000-05-19 2000-05-19 +S000031170 CDS Q0105 17 43297 43647 W 2000-05-19 2000-05-19 +S000031171 intron Q0105 17 36955 37722 W 2000-05-19 2000-05-19 +S000031172 intron Q0105 17 37737 39140 W 2000-05-19 2000-05-19 +S000031173 intron Q0105 17 39218 40840 W 2000-05-19 2000-05-19 +S000031174 intron Q0105 17 41091 42507 W 2000-05-19 2000-05-19 +S000031175 intron Q0105 17 42559 43296 W 2000-05-19 2000-05-19 +S000029672 origin_of_replication ORI6 ORI6 chromosome 17 L000001313 17 45227 47927 W 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007274 ORF Verified Q0130 OLI1 F0 ATP synthase subunit c|OLI3|ATP9 chromosome 17 L000004938|L000001298|L000002724 17 46723 46953 W 2000-05-19 2000-05-19 F0-ATP synthase subunit c (ATPase-associated proteolipid); encoded on the mitochondrial genome; mutation confers oligomycin resistance; expression is specifically dependent on the nuclear genes AEP1 and AEP2 +S000032266 CDS Q0130 17 46723 46953 W 2000-05-19 2000-05-19 +S000007333 tRNA_gene tS(UGA)Q2 chromosome 17 L000004908 17 48201 48290 W 2000-05-19 2000-05-19 Mitochondrial serine tRNA (tRNA-Ser); predicted by tRNAscan-SE analysis +S000031361 noncoding_exon tS(UGA)Q2 17 48201 48290 W 2000-05-19 2000-05-19 +S000007275 ORF Verified Q0140 VAR1 mitochondrial 37S ribosomal protein VAR1|VARI chromosome 17 L000004939|L000002456|L000002455 17 48901 50097 W 2000-05-19 2000-05-19 Mitochondrial ribosomal protein of the small subunit; mitochondrially-encoded; polymorphic in different strains due to variation in number of AAT (asparagine) codons; translated near the mitochondrial inner membrane; may have a role in loss of mitochondrial DNA under stress conditions +S000032355 CDS Q0140 17 48901 50097 W 2000-05-19 2000-05-19 +S000007276 ORF Dubious Q0142 ORF9 chromosome 17 L000004940 17 51052 51228 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious open reading frame Q0143 +S000032370 CDS Q0142 17 51052 51228 W 2000-05-19 2000-05-19 +S000007277 ORF Dubious Q0143 ORF10 chromosome 17 L000004941 17 51277 51429 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032373 CDS Q0143 17 51277 51429 W 2000-05-19 2000-05-19 +S000007278 ORF Dubious Q0144 chromosome 17 L000004942 17 54109 54438 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032378 CDS Q0144 17 54109 54438 W 2000-05-19 2000-05-19 +S000029669 origin_of_replication ORI3 ORI3 chromosome 17 L000001310 17 54840 54567 C 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000029670 origin_of_replication ORI4 ORI4 chromosome 17 L000001311 17 56832 56567 C 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007288 rRNA_gene Q0158 21S_RRNA 21S_rRNA_4|21S_rRNA_3 chromosome 17 L000004883 17 58009 62447 W 2000-05-19 2000-05-19 Mitochondrial 21S rRNA; intron encodes the I-SceI DNA endonuclease +S000034078 intron Q0158 17 60725 61867 W 2000-05-19 2000-05-19 +S000034076 noncoding_exon Q0158 17 58009 60724 W 2000-05-19 2000-05-19 +S000034077 noncoding_exon Q0158 17 61868 62447 W 2000-05-19 2000-05-19 +S000007279 ORF Verified Q0160 SCEI intron-encoded endonuclease I-SceI|I-SceIV|OMEGA chromosome 17 L000004889|L000001858 17 61022 61729 W 2000-05-19 2000-05-19 I-SceI DNA endonuclease; encoded by the mitochondrial group I intron of the 21S_rRNA gene; mediates gene conversion that propagates the intron into intron-less copies of the 21S_rRNA gene +S000033285 CDS Q0160 17 61022 61729 W 2000-05-19 2000-05-19 +S000007334 tRNA_gene tT(UGU)Q1 chromosome 17 L000004909 17 63862 63937 W 2000-05-19 2000-05-19 Mitochondrial threonine tRNA (tRNA-Thr); predicted by tRNAscan-SE analysis +S000033404 noncoding_exon tT(UGU)Q1 17 63862 63937 W 2000-05-19 2000-05-19 +S000007316 tRNA_gene tC(GCA)Q chromosome 17 L000004891 17 64415 64490 W 2000-05-19 2000-05-19 Mitochondrial cysteine tRNA (tRNA-Cys) +S000035255 noncoding_exon tC(GCA)Q 17 64415 64490 W 2000-05-19 2000-05-19 +S000007321 tRNA_gene tH(GUG)Q chromosome 17 L000004896 17 64596 64670 W 2000-05-19 2000-05-19 Mitochondrial histidine tRNA (tRNA-His); predicted by tRNAscan-SE analysis +S000033926 noncoding_exon tH(GUG)Q 17 64596 64670 W 2000-05-19 2000-05-19 +S000007280 ORF Dubious Q0182 ORF11 chromosome 17 L000004944 17 65770 66174 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034264 CDS Q0182 17 65770 66174 W 2000-05-19 2000-05-19 +S000007324 tRNA_gene tL(UAA)Q chromosome 17 L000004899 17 66095 66179 W 2000-05-19 2000-05-19 Mitochondrial leucine tRNA (tRNA-Leu); predicted by tRNAscan-SE analysis; required for mitochondrial translation and indirectly for maintenance of the mitochondrial genome; mutations in the orthologous human gene cause the neurological disease MELAS +S000037434 noncoding_exon tL(UAA)Q 17 66095 66179 W 2000-05-19 2000-05-19 +S000007329 tRNA_gene tQ(UUG)Q chromosome 17 L000004904 17 66210 66285 W 2000-05-19 2000-05-19 Mitochondrial glutamine tRNA (tRNA-Gln); predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000032591 noncoding_exon tQ(UUG)Q 17 66210 66285 W 2000-05-19 2000-05-19 +S000007323 tRNA_gene tK(UUU)Q chromosome 17 L000004898 17 67061 67134 W 2000-05-19 2000-05-19 Mitochondrial lysine tRNA (tRNA-Lys); predicted by tRNAscan-SE analysis; modification of wobble base U34 is decreased at elevated temperatures, decreasing ability to decode AAG codons; this function is performed at high temperature by imported cytoplasmic tRNA-Lys with CUU anticodon +S000034232 noncoding_exon tK(UUU)Q 17 67061 67134 W 2000-05-19 2000-05-19 +S000007331 tRNA_gene tR(UCU)Q1 chromosome 17 L000004906 17 67309 67381 W 2000-05-19 2000-05-19 Mitochondrial arginine tRNA (tRNA-Arg); predicted by tRNAscan-SE analysis +S000032809 noncoding_exon tR(UCU)Q1 17 67309 67381 W 2000-05-19 2000-05-19 +S000007320 tRNA_gene tG(UCC)Q chromosome 17 L000004895 17 67468 67542 W 2000-05-19 2000-05-19 Mitochondrial glycine tRNA (tRNA-Gly); predicted by tRNAscan-SE analysis +S000037571 noncoding_exon tG(UCC)Q 17 67468 67542 W 2000-05-19 2000-05-19 +S000007317 tRNA_gene tD(GUC)Q chromosome 17 L000004892 17 68322 68396 W 2000-05-19 2000-05-19 Mitochondrial aspartate tRNA (tRNA-Asp); predicted by tRNAscan-SE analysis +S000030428 noncoding_exon tD(GUC)Q 17 68322 68396 W 2000-05-19 2000-05-19 +S000007332 tRNA_gene tS(GCU)Q1 chromosome 17 L000004907 17 69203 69288 W 2000-05-19 2000-05-19 Mitochondrial serine tRNA (tRNA-Ser); predicted by tRNAscan-SE analysis +S000030614 noncoding_exon tS(GCU)Q1 17 69203 69288 W 2000-05-19 2000-05-19 +S000007330 tRNA_gene tR(ACG)Q2 chromosome 17 L000004905 17 69289 69362 W 2000-05-19 2000-05-19 Mitochondrial arginine tRNA (tRNA-Arg); predicted by tRNAscan-SE analysis +S000034929 noncoding_exon tR(ACG)Q2 17 69289 69362 W 2000-05-19 2000-05-19 +S000007315 tRNA_gene tA(UGC)Q chromosome 17 L000004890 17 69846 69921 W 2000-05-19 2000-05-19 Mitochondrial alanine tRNA (tRNA-Ala); predicted by tRNAscan-SE analysis +S000034925 noncoding_exon tA(UGC)Q 17 69846 69921 W 2000-05-19 2000-05-19 +S000007322 tRNA_gene tI(GAU)Q chromosome 17 L000004897 17 70162 70237 W 2000-05-19 2000-05-19 Mitochondrial isoleucine tRNA (tRNA-Ile); predicted by tRNAscan-SE analysis; mutations in human ortholog are linked to conditions such as progressive encephalopathy, metabolic syndrome, and hypomagnesaemia +S000036091 noncoding_exon tI(GAU)Q 17 70162 70237 W 2000-05-19 2000-05-19 +S000007338 tRNA_gene tY(GUA)Q chromosome 17 L000004913 17 70824 70907 W 2000-05-19 2000-05-19 Mitochondrial tyrosine tRNA (tRNA-Tyr) +S000034742 noncoding_exon tY(GUA)Q 17 70824 70907 W 2000-05-19 2000-05-19 +S000007327 tRNA_gene tN(GUU)Q chromosome 17 L000004902 17 71433 71503 W 2000-05-19 2000-05-19 Mitochondrial asparagine tRNA (tRNA-Asn); predicted by tRNAscan-SE analysis +S000030750 noncoding_exon tN(GUU)Q 17 71433 71503 W 2000-05-19 2000-05-19 +S000007325 tRNA_gene tM(CAU)Q1 chromosome 17 L000004900 17 72630 72705 W 2000-05-19 2000-05-19 Mitochondrial methionine tRNA (tRNA-Met); predicted by tRNAscan-SE analysis +S000032341 noncoding_exon tM(CAU)Q1 17 72630 72705 W 2000-05-19 2000-05-19 +S000007281 ORF Verified Q0250 COX2 cytochrome c oxidase subunit 2|OXII|OXI1 chromosome 17 L000004945|L000000384|L000001322|L000003004 17 73758 74513 W 2000-05-19 2000-05-19 Subunit II of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; one of three mitochondrially-encoded subunits +S000036455 CDS Q0250 17 73758 74513 W 2000-05-19 2000-05-19 +S000007282 ORF Uncharacterized Q0255 maturase-like protein|RF1|ORF1 chromosome 17 L000004946 17 74495 75984 W 2000-05-19 2000-05-19 Maturase-like protein +S000036463 CDS Q0255 17 74495 75622 W 2000-05-19 2000-05-19 +S000036464 CDS Q0255 17 75663 75872 W 2000-05-19 2000-05-19 +S000036465 CDS Q0255 17 75904 75984 W 2000-05-19 2000-05-19 +S000036466 intron Q0255 17 75623 75662 W 2000-05-19 2000-05-19 +S000036467 intron Q0255 17 75873 75903 W 2000-05-19 2000-05-19 +S000007319 tRNA_gene tF(GAA)Q chromosome 17 L000004894 17 77431 77505 W 2000-05-19 2000-05-19 Mitochondrial phenylalanine tRNA (tRNA-Phe); predicted by tRNAscan-SE analysis +S000035453 noncoding_exon tF(GAA)Q 17 77431 77505 W 2000-05-19 2000-05-19 +S000007335 tRNA_gene tT(UAG)Q2 tT(XXX)Q2 chromosome 17 L000004910 17 78162 78089 C 2000-05-19 2000-05-19 Mitochondrial threonine tRNA (tRNA-Thr); decodes CUA codons as threonine rather than leucine; has an unusual enlarged 8-nt anticodon loop; may be evolutionarily derived from mitochondrial tRNA-His; conserved in some genera of budding yeasts +S000032409 noncoding_exon tT(UAG)Q2 17 78162 78089 C 2000-05-19 2000-05-19 +S000007336 tRNA_gene tV(UAC)Q chromosome 17 L000004911 17 78533 78608 W 2000-05-19 2000-05-19 Mitochondrial valine tRNA (tRNA-Val); predicted by tRNAscan-SE analysis +S000036325 noncoding_exon tV(UAC)Q 17 78533 78608 W 2000-05-19 2000-05-19 +S000007283 ORF Verified Q0275 COX3 cytochrome c oxidase subunit 3|OXI2 chromosome 17 L000004947|L000000385|L000001320 17 79213 80022 W 2000-05-19 2000-05-19 Subunit III of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; one of three mitochondrially-encoded subunits +S000036648 CDS Q0275 17 79213 80022 W 2000-05-19 2000-05-19 +S000029671 origin_of_replication ORI5 ORI5 chromosome 17 L000001312 17 82329 82600 W 2014-11-18 2014-11-18 Mitochondrial origin of replication +S000007326 tRNA_gene tM(CAU)Q2 chromosome 17 L000004901 17 85035 85112 W 2000-05-19 2000-05-19 Mitochondrial formylated methionine tRNA (tRNA-fMet); predicted by tRNAscan-SE analysis +S000032348 noncoding_exon tM(CAU)Q2 17 85035 85112 W 2000-05-19 2000-05-19 +S000029023 ncRNA_gene Q0285 RPM1 chromosome 17 L000004810 17 85295 85777 W 2003-12-02 2003-12-02 RNA component of mitochondrial RNase P; mitochondrial RNase P also contains the protein subunit Rpm2p; RNase P removes 5' extensions from mitochondrial tRNA precursors; RPM1 is conserved in bacteria, fungi, and protozoa +S000035976 noncoding_exon Q0285 17 85295 85777 W 2003-12-02 2003-12-02 +S000007284 ORF Dubious Q0297 ORF12 chromosome 17 L000004948 17 85554 85709 W 2000-05-19 2000-05-19 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene RPM1 +S000037483 CDS Q0297 17 85554 85709 W 2000-05-19 2000-05-19 +S000029683 gene_group MAL3 MAL3 chromosome 2 L000001002 2 144 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL33 trans-acting MAL-activator, MAL31 maltose permease, and MAL32 maltase +S000178039 ARS ARS200 chromosome 2 2 40 202 2014-11-18 2014-11-18 Autonomously replicating sequence +S000028599 ORF Dubious YBL113W-A chromosome 2 2 646 1128 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031383 CDS YBL113W-A 2 646 1128 W 2003-07-29 2003-07-29 +S000002153 ORF Uncharacterized YBL113C chromosome 2 2 2658 280 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element +S000036166 CDS YBL113C 2 2658 280 C 1996-07-31 1996-07-31 +S000002152 ORF Uncharacterized YBL112C chromosome 2 2 2899 2582 C 1996-07-31 1996-07-31 Putative protein of unknown function; YBL112C is contained within TEL02L +S000035974 CDS YBL112C 2 2899 2582 C 1996-07-31 1996-07-31 +S000002151 ORF Verified YBL111C chromosome 2 2 5009 2907 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element; relocalizes from mitochondrion to cytoplasm upon DNA replication stress +S000035858 CDS YBL111C 2 4116 2907 C 1996-07-31 1996-07-31 +S000035857 CDS YBL111C 2 5009 4216 C 1996-07-31 1996-07-31 +S000035859 intron YBL111C 2 4215 4117 C 1996-07-31 1996-07-31 +S000002150 ORF Dubious YBL109W chromosome 2 2 5790 6125 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034042 CDS YBL109W 2 5790 6125 W 1996-07-31 1996-07-31 +S000178040 ARS ARS201 chromosome 2 2 6498 6620 2014-11-18 2014-11-18 Autonomously replicating sequence +S000028867 telomere TEL02L chromosome 2 2 6608 1 C -80 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome II; annotated components include an X element core sequence, X element combinatorial repeats, and a short Y' element; TEL02L does have telomeric repeats (TEL02L-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly +S000028868 X_element TEL02L 2 6608 6139 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome II; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028869 X_element_combinatorial_repeat TEL02L 2 6138 5849 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr II; contains repeats of the D, C, B and A types, Tbf1p binding sites, and ORF YBL109W; formerly called SubTelomeric Repeats +S000028870 Y_prime_element TEL02L 2 5848 1 C 2003-09-09 2003-09-09 Telomeric short Y' element on the left arm of Chromosome II; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs (YBL111C, YBL112C, YBL113C, YBL113W-A) +S000007592 ORF Verified YBL108C-A PAU9 seripauperin PAU9 chromosome 2 2 7733 7605 C 2001-02-26 2001-02-26 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000037104 CDS YBL108C-A 2 7733 7605 C 2001-02-26 2001-02-26 +S000000204 ORF Dubious YBL108W chromosome 2 2 8177 8482 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033883 CDS YBL108W 2 8177 8482 W 1996-07-31 1996-07-31 +S000006798 long_terminal_repeat YBLWdelta1 chromosome 2 2 8848 9092 W 2000-05-19 2000-05-19 Ty1 LTR +S000006799 long_terminal_repeat YBLWdelta2 chromosome 2 2 9093 9424 W 2000-05-19 2000-05-19 Ty2 LTR +S000007229 ORF Dubious YBL107W-A chromosome 2 2 9268 9372 W 1999-07-17 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the Ty2 LTR YBLWdelta2; YBL107W-A has a paralog, YER138W-A, that arose from a single-locus duplication +S000036010 CDS YBL107W-A 2 9268 9372 W 1999-07-17 1999-07-17 +S000006800 long_terminal_repeat YBLWdelta3 chromosome 2 2 9425 9518 W 2000-05-19 2000-05-19 Ty1 LTR +S000006647 tRNA_gene tL(UAA)B1 chromosome 2 L000003738 2 9583 9666 W 2000-05-19 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000035755 noncoding_exon tL(UAA)B1 2 9583 9666 W 2000-05-19 2000-05-19 +S000000203 ORF Verified YBL107C MIX23 MIC23 chromosome 2 2 10551 9961 C 1996-07-31 1996-07-31 Mitochondrial intermembrane space protein of unknown function; imported via the MIA import machinery; contains an unusual twin cysteine motif (CX13C CX14C) +S000033751 CDS YBL107C 2 10551 9961 C 1996-07-31 1996-07-31 +S000000202 ORF Verified YBL106C SRO77 putative Rab GTPase-binding protein SRO77|SNI2|SOP2 chromosome 2 L000004194 2 13879 10847 C 1996-07-31 1996-07-31|2011-02-03 Protein with roles in exocytosis and cation homeostasis; functions in docking and fusion of post-Golgi vesicles with plasma membrane; regulates cell proliferation and colony development via the Rho1-Tor1 pathway; interacts with SNARE protein Sec9p; homolog of Drosophila lethal giant larvae tumor suppressor; SRO77 has a paralog, SRO7, that arose from the whole genome duplication +S000033072 CDS YBL106C 2 13879 10847 C 1996-07-31 1996-07-31|2011-02-03 +S000000201 ORF Verified YBL105C PKC1 protein kinase C|CLY7|CLY5|STT1|HPO2|CLY15 chromosome 2 L000001446|L000000362|S000029091 2 17696 14241 C -79 1996-07-31 1996-07-31|2011-02-03 Protein serine/threonine kinase; essential for cell wall remodeling during growth; localized to sites of polarized growth and the mother-daughter bud neck; homolog of the alpha, beta, and gamma isoforms of mammalian protein kinase C (PKC) +S000032980 CDS YBL105C 2 17696 14241 C 1996-07-31 1996-07-31|2011-02-03 +S000000200 ORF Verified YBL104C SEA4 YBL103C-A chromosome 2 2 21293 18177 C 2004-01-26 2004-01-26|1996-07-31 Subunit of SEACAT, a subcomplex of the SEA complex; Sea4p, along with Rtc1p and Mtc5p, redundantly inhibit the TORC1 inhibitory role of the Iml1p/SEACIT (Iml1p-Npr2p-Npr3p) subcomplex, a GAP for GTPase Gtr1p (EGOC subunit) in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; contains an N-terminal beta-propeller fold and a C-terminal RING motif +S000032891 CDS YBL104C 2 21293 18177 C 2004-01-26 2004-01-26|1996-07-31 +S000000199 ORF Verified YBL103C RTG3 chromosome 2 L000003152 2 23536 22076 C 2011-02-03 1997-07-27|1997-01-28 bHLH/Zip transcription factor for retrograde (RTG) and TOR pathways; forms a complex with another bHLH/Zip protein, Rtg1p, to activate the pathways; target of Hog1p +S000032786 CDS YBL103C 2 23536 22076 C 2011-02-03 1997-07-27|1997-01-28 +S000000198 ORF Verified YBL102W SFT2 chromosome 2 L000002950 2 24098 24745 W 2004-01-26 1997-01-28 Tetra-spanning membrane protein found mostly in the late Golgi; non-essential; can suppress some sed5 alleles; may be part of the transport machinery, but precise function is unknown; similar to mammalian syntaxin 5 +S000032738 CDS YBL102W 2 24098 24745 W 2004-01-26 1997-01-28 +S000000197 ORF Verified YBL101C ECM21 ART2 chromosome 2 L000003896 2 28299 24946 C 2004-01-26 1998-09-13|1997-01-28 Protein involved in regulating endocytosis of plasma membrane proteins; identified as a substrate for ubiquitination by Rsp5p and deubiquitination by Ubp2p; promoter contains several Gcn4p binding elements; ECM21 has a paralog, CSR2, that arose from the whole genome duplication +S000031747 CDS YBL101C 2 28299 24946 C 2004-01-26 1998-09-13|1997-01-28 +S000028598 ORF Uncharacterized YBL100W-C YBL101W-C chromosome 2 2 28427 28546 W 2004-01-26 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031381 CDS YBL100W-C 2 28427 28546 W 2004-01-26 2003-07-29 +S000118996 ARS ARS230 ARSII-29|ARS201.5 chromosome 2 2 28942 29160 2011-02-03 2006-10-02 Autonomously Replicating Sequence +S000006801 long_terminal_repeat YBLWdelta4 chromosome 2 2 29644 29975 W 2011-02-03 2000-05-19 Ty2 LTR +S000006809 LTR_retrotransposon YBLWTy2-1 Ty2 chromosome 2 2 29644 35602 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000002148 transposable_element_gene YBL100W-A gag protein|TY2A_B|YBL101W-A chromosome 2 2 29935 31251 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000032385 CDS YBL100W-A 2 29935 31251 W 2011-02-03 1997-01-28 +S000002149 transposable_element_gene YBL100W-B gag-pol fusion protein|TY2B_B|YBL101W-B chromosome 2 2 29935 35248 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032404 CDS YBL100W-B 2 29935 31227 W 2011-02-03 1997-01-28 +S000032405 CDS YBL100W-B 2 31229 35248 W 2011-02-03 1997-01-28 +S000032406 plus_1_translational_frameshift YBL100W-B 2 31228 31228 W 2011-02-03 1997-01-28 +S000006802 long_terminal_repeat YBLWdelta5 chromosome 2 2 35271 35602 W 2011-02-03 2000-05-19 Ty2 LTR +S000006803 long_terminal_repeat YBLWdelta6 chromosome 2 2 35604 35796 W 2011-02-03 2000-05-19 Ty1 LTR +S000006807 long_terminal_repeat YBLCtau1 YBLWtau1 chromosome 2 2 36221 35851 C 2011-02-03 2000-05-19|2007-04-05 Ty4 LTR +S000006562 tRNA_gene tF(GAA)B chromosome 2 L000003739 2 36398 36488 W 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035371 intron tF(GAA)B 2 36435 36452 W 2011-02-03 2000-05-19 +S000035369 noncoding_exon tF(GAA)B 2 36398 36434 W 2011-02-03 2000-05-19 +S000035370 noncoding_exon tF(GAA)B 2 36453 36488 W 2011-02-03 2000-05-19 +S000000195 ORF Verified YBL099W ATP1 F1F0 ATP synthase subunit alpha chromosome 2 L000000141 2 37053 38690 W 2011-02-03 1997-01-28|2011-02-03 Alpha subunit of the F1 sector of mitochondrial F1F0 ATP synthase; which is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated; N-terminally propionylated in vivo +S000034558 CDS YBL099W 2 37053 38690 W 2011-02-03 1997-01-28|2011-02-03 +S000000196 ORF Dubious YBL100C chromosome 2 2 37303 36989 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the 5' end of ATP1 +S000031662 CDS YBL100C 2 37303 36989 C 2011-02-03 1997-01-28 +S000000194 ORF Verified YBL098W BNA4 kynurenine 3-monooxygenase chromosome 2 2 39145 40527 W 2011-02-03 1997-01-28 Kynurenine 3-monooxygenase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p; putative therapeutic target for Huntington disease +S000034424 CDS YBL098W 2 39145 40527 W 2011-02-03 1997-01-28 +S000000193 ORF Verified YBL097W BRN1 condensin subunit BRN1 chromosome 2 L000004324 2 40831 43095 W 2011-02-03 2004-01-29|1997-01-28|2011-02-03 Subunit of the condensin complex; required for chromosome condensation and for clustering of tRNA genes at the nucleolus; may influence multiple aspects of chromosome transmission +S000034364 CDS YBL097W 2 40831 43095 W 2011-02-03 2004-01-29|1997-01-28|2011-02-03 +S000000191 ORF Uncharacterized YBL095W MRX3 chromosome 2 2 43277 44089 W 2011-02-03 1997-01-28 Protein that associates with mitochondrial ribosome; likely functions in cristae junction formation; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033361 CDS YBL095W 2 43277 44089 W 2011-02-03 1997-01-28 +S000000192 ORF Dubious YBL096C chromosome 2 2 43482 43174 C 2011-02-03 1997-01-28 Non-essential protein of unknown function +S000033392 CDS YBL096C 2 43482 43174 C 2011-02-03 1997-01-28 +S000000190 ORF Dubious YBL094C chromosome 2 2 44097 43765 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YBL095W +S000033262 CDS YBL094C 2 44097 43765 C 2011-02-03 1997-01-28 +S000000189 ORF Verified YBL093C ROX3 SSX2|MED19|SSN7|NUT3 chromosome 2 L000001662|S000029515|L000002098 2 44918 44256 C 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme +S000032413 CDS YBL093C 2 44918 44256 C 2011-02-03 1997-01-28 +S000000188 ORF Verified YBL092W RPL32 eL32|ribosomal 60S subunit protein L32|L32e|L32 chromosome 2 L000004464 2 45978 46370 W 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L32; overexpression disrupts telomeric silencing; homologous to mammalian ribosomal protein L32, no bacterial homolog +S000032377 CDS YBL092W 2 45978 46370 W 2011-02-03 1997-01-28 +S000122091 five_prime_UTR_intron YBL092W 2 45645 45977 W 2011-02-03 2007-04-04 +S000007228 ORF Verified YBL091C-A SCS22 phospholipid metabolism-regulating protein SCS22 chromosome 2 2 47180 46565 C 2011-02-03 2004-01-07|1999-07-17 Protein involved in regulation of phospholipid metabolism; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect the ER and plasma membrane (PM); regulates PM PI4P levels by controlling access of the Sac1p phosphatase to its substrate, PI4P; human VAP homolog; similar to D. melanogaster inturned protein; SWAT-GFP and mCherry fusion proteins localize to the cytosol; SCS22 has a paralog, SCS2, that arose from the whole genome duplication +S000037851 CDS YBL091C-A 2 47058 46565 C 2011-02-03 2004-01-07|1999-07-17 +S000037850 CDS YBL091C-A 2 47180 47147 C 2011-02-03 2004-01-07 +S000037852 intron YBL091C-A 2 47146 47059 C 2011-02-03 2004-01-07 +S000000187 ORF Verified YBL091C MAP2 methionine aminopeptidase chromosome 2 L000003044 2 48628 47363 C 2011-02-03 1997-07-27|1997-01-28|2011-02-03 Methionine aminopeptidase; catalyzes the cotranslational removal of N-terminal methionine from nascent polypeptides; function is partially redundant with that of Map1p +S000032224 CDS YBL091C 2 48628 47363 C 2011-02-03 1997-07-27|1997-01-28|2011-02-03 +S000000186 ORF Verified YBL090W MRP21 mitochondrial 37S ribosomal protein MRP21|MRP50 chromosome 2 L000003275 2 48825 49358 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit; MRP21 exhibits genetic interactions with mutations in the COX2 and COX3 mRNA 5'-untranslated leader sequences +S000032193 CDS YBL090W 2 48825 49358 W 2011-02-03 1997-01-28 +S000000185 ORF Verified YBL089W AVT5 amino acid transporter chromosome 2 2 49574 50953 W 2011-02-03 2003-09-22|1997-01-28 Putative transporter; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters; AVT5 has a paralog, AVT6, that arose from the whole genome duplication +S000031223 CDS YBL089W 2 49574 50953 W 2011-02-03 2003-09-22|1997-01-28 +S000000184 ORF Verified YBL088C TEL1 DNA-binding protein kinase TEL1 chromosome 2 L000002281 2 59382 51019 C -60 2011-02-03 1997-01-28|2011-02-03 Protein kinase primarily involved in telomere length regulation; contributes to cell cycle checkpoint control in response to DNA damage; acts with Red1p and Mec1p to promote interhomolog recombination by phosphorylation of Hop1; functionally redundant with Mec1p; regulates P-body formation induced by replication stress; homolog of human ataxia-telangiectasia mutated (ATM) gene +S000030193 CDS YBL088C 2 59382 51019 C 2011-02-03 1997-01-28|2011-02-03 +S000000183 ORF Verified YBL087C RPL23A uL14|ribosomal 60S subunit protein L23A|L14|YL32|L23A|L17aA chromosome 2 L000001716 2 60739 59822 C 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L23A; homologous to mammalian ribosomal protein L23 and bacterial L14; RPL23A has a paralog, RPL23B, that arose from the whole genome duplication +S000030032 CDS YBL087C 2 60193 59822 C 2011-02-03 1997-01-28 +S000030031 CDS YBL087C 2 60739 60698 C 2011-02-03 1997-01-28 +S000030033 intron YBL087C 2 60697 60194 C 2011-02-03 1997-01-28 +S000000182 ORF Uncharacterized YBL086C chromosome 2 2 62602 61202 C 2011-02-03 1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery +S000029917 CDS YBL086C 2 62602 61202 C 2011-02-03 1997-01-28 +S000118344 ARS ARS202 ARSII-63 chromosome 2 2 63259 63381 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000000181 ORF Verified YBL085W BOI1 BOB1|GIN7 chromosome 2 L000000191|L000000703 2 63876 66818 W 2011-02-03 1997-01-28 Protein implicated in polar growth; functionally redundant with Boi2p; interacts with bud-emergence protein Bem1p; contains an SH3 (src homology 3) domain and a PH (pleckstrin homology) domain; relocalizes from bud neck to cytoplasm upon DNA replication stress; BOI1 has a paralog, BOI2, that arose from the whole genome duplication +S000029876 CDS YBL085W 2 63876 66818 W 2011-02-03 1997-01-28 +S000000180 ORF Verified YBL084C CDC27 anaphase promoting complex subunit CDC27|SNB1|APC3 chromosome 2 L000000266 2 69445 67169 C -58 2011-02-03 1997-01-28|2011-02-03 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition +S000037167 CDS YBL084C 2 69445 67169 C 2011-02-03 1997-01-28|2011-02-03 +S000000179 ORF Dubious YBL083C chromosome 2 2 70138 69713 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps verified ORF ALG3 +S000037052 CDS YBL083C 2 70138 69713 C 2011-02-03 1997-01-28 +S000000178 ORF Verified YBL082C ALG3 dolichyl-P-Man:Man(5)GlcNAc(2)-PP-dolichol alpha-1,3-mannosyltransferase|RHK1 chromosome 2 L000002668 2 71127 69751 C 2011-02-03 1997-01-28 Dolichol-P-Man dependent alpha(1-3) mannosyltransferase; involved in synthesis of dolichol-linked oligosaccharide donor for N-linked glycosylation of proteins; G353A missense mutation in human ortholog ALG3 implicated in carbohydrate deficient glycoprotein syndrome type IV, which is characterized by microcephaly, severe epilepsy, minimal psychomotor development, partial deficiency of sialic acids in serum glycoproteins; wild-type human ALG3 can complement yeast alg3 mutant +S000036997 CDS YBL082C 2 71127 69751 C 2011-02-03 1997-01-28 +S000000177 ORF Uncharacterized YBL081W chromosome 2 2 71866 72972 W 2011-02-03 1997-01-28 Non-essential protein of unknown function; null mutation results in a decrease in plasma membrane electron transport +S000036378 CDS YBL081W 2 71866 72972 W 2011-02-03 1997-01-28 +S000000176 ORF Verified YBL080C PET112 glutamyl-tRNA(Gln) amidotransferase subunit PET112 chromosome 2 L000001394 2 74695 73070 C 2011-02-03 1997-01-28|2011-02-03 Subunit of the trimeric GatFAB AmidoTransferase(AdT) complex; involved in the formation of Q-tRNAQ; mutation is functionally complemented by the bacterial GatB ortholog +S000036223 CDS YBL080C 2 74695 73070 C 2011-02-03 1997-01-28|2011-02-03 +S000000175 ORF Verified YBL079W NUP170 NLE3 chromosome 2 L000001256|L000003140 2 75259 79767 W 2011-02-03 1997-01-28 Subunit of inner ring of nuclear pore complex (NPC); contributes to NPC assembly and nucleocytoplasmic transport; interacts with genomic regions that contain ribosomal protein and subtelomeric genes, where it functions in nucleosome positioning and as a repressor of transcription; both Nup170p and NUP157p are similar to human Nup155p; NUP170 has a paralog, NUP157, that arose from the whole genome duplication +S000034905 CDS YBL079W 2 75259 79767 W 2011-02-03 1997-01-28 +S000000174 ORF Verified YBL078C ATG8 ubiquitin-like protein ATG8|AUT7|CVT5|APG8 chromosome 2 L000004607|L000004604 2 80731 80378 C 2011-02-03 1997-01-28 Component of autophagosomes and Cvt vesicles; regulator of Atg1p, targets it to autophagosomes; binds the Atg1p-Atg13p complex, triggering its vacuolar degradation; unique ubiquitin-like protein whose conjugation target is lipid phosphatidylethanolamine (PE); Atg8p-PE is anchored to membranes, is involved in phagophore expansion, and may mediate membrane fusion during autophagosome formation; deconjugation of Atg8p-PE is required for efficient autophagosome biogenesis +S000033940 CDS YBL078C 2 80731 80378 C 2011-02-03 1997-01-28 +S000000173 ORF Dubious YBL077W chromosome 2 2 80897 81328 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene ILS1/YBL076C +S000033872 CDS YBL077W 2 80897 81328 W 2011-02-03 1997-01-28 +S000000172 ORF Verified YBL076C ILS1 isoleucine--tRNA ligase ILS1 chromosome 2 L000000856 2 84261 81043 C -43 2011-02-03 1997-01-28 Cytoplasmic isoleucine-tRNA synthetase; target of the G1-specific inhibitor reveromycin A +S000033054 CDS YBL076C 2 84261 81043 C 2011-02-03 1997-01-28 +S000000171 ORF Verified YBL075C SSA3 Hsp70 family ATPase SSA3|YG106 chromosome 2 L000002071|L000000820 2 86448 84499 C 2011-02-03 1997-01-28 ATPase involved in protein folding and the response to stress; plays a role in SRP-dependent cotranslational protein-membrane targeting and translocation; member of the heat shock protein 70 (HSP70) family; localized to the cytoplasm; SSA3 has a paralog, SSA4, that arose from the whole genome duplication +S000032985 CDS YBL075C 2 86448 84499 C 2011-02-03 1997-01-28 +S000000169 ORF Dubious YBL073W chromosome 2 2 87646 87957 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the essential gene AAR2/YBL074C +S000032838 CDS YBL073W 2 87646 87957 W 2011-02-03 1997-01-28 +S000000170 ORF Verified YBL074C AAR2 U5 snRNP complex subunit AAR2 chromosome 2 L000000008 2 87789 86722 C 2011-02-03 1997-01-28 Component of the U5 snRNP complex; required for splicing of U3 precursors; originally described as a splicing factor specifically required for splicing pre-mRNA of the MATa1 cistron +S000032869 CDS YBL074C 2 87789 86722 C 2011-02-03 1997-01-28 +S000006447 snoRNA_gene snR56 SNR56 chromosome 2 L000004525 2 88190 88277 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position G1428 +S000030761 noncoding_exon snR56 2 88190 88277 W 2011-02-03 2000-05-19 +S000000168 ORF Verified YBL072C RPS8A eS8|ribosomal 40S subunit protein S8A|S8e|rp19|YS9|S8A|S14A chromosome 2 L000001752|L000001753 2 89125 88523 C 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S8, no bacterial homolog; RPS8A has a paralog, RPS8B, that arose from the whole genome duplication +S000031871 CDS YBL072C 2 89125 88523 C 2011-02-03 1997-01-28 +S000122090 five_prime_UTR_intron YBL072C 2 89440 89133 C 2011-02-03 2007-04-04|2011-02-03 +S000028597 ORF Uncharacterized YBL071C-B chromosome 2 2 89556 89458 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031379 CDS YBL071C-B 2 89556 89458 C 2011-02-03 2003-07-29 +S000007587 ORF Verified YBL071W-A KTI11 DPH3 chromosome 2 2 89978 90226 W 2011-02-03 2001-01-30 Zn-ribbon protein that co-purifies with Dph1 and Dph2; in a complex required for synthesis of diphthamide on translation factor eEF2 and with Elongator subunits Iki3p, Elp2p, and Elp3p; involved in modification of wobble nucleosides in tRNAs; forms a stable heterodimer with Ats1p +S000037098 CDS YBL071W-A 2 89978 90226 W 2011-02-03 2001-01-30 +S000000167 ORF Uncharacterized YBL071C chromosome 2 2 90531 90223 C 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YBL071C is not an essential gene +S000031723 CDS YBL071C 2 90531 90223 C 2011-02-03 1997-01-28 +S000000165 ORF Verified YBL069W AST1 chromosome 2 L000000133 2 90741 92030 W 2011-02-03 2001-05-29|1997-01-28 Lipid raft associated protein; interacts with the plasma membrane ATPase Pma1p and has a role in its targeting to the plasma membrane by influencing its incorporation into lipid rafts; sometimes classified in the medium-chain dehydrogenase/reductases (MDRs) superfamily; AST1 has a paralog, AST2, that arose from the whole genome duplication +S000031495 CDS YBL069W 2 90741 92030 W 2011-02-03 2001-05-29|1997-01-28 +S000000166 ORF Dubious YBL070C chromosome 2 2 90925 90605 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031635 CDS YBL070C 2 90925 90605 C 2011-02-03 1997-01-28 +S000028530 ORF Dubious YBL068W-A chromosome 2 2 91794 92030 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by fungal homology and RT-PCR +S000031139 CDS YBL068W-A 2 91794 92030 W 2011-02-03 2003-07-29 +S000000164 ORF Verified YBL068W PRS4 ribose phosphate diphosphokinase subunit PRS4 chromosome 2 L000001513 2 92414 93394 W 2011-02-03 2003-09-22|1997-01-28|2011-02-03 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase, synthesizes PRPP; which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes; PRS4 has a paralog, PRS2, that arose from the whole genome duplication; a missense mutation in the conserved residue R196 of its human homolog PRPS1 is pathogenic +S000031367 CDS YBL068W 2 92414 93394 W 2011-02-03 2003-09-22|1997-01-28|2011-02-03 +S000178041 ARS ARS203 chromosome 2 2 93435 93519 2014-11-18 2014-11-18 Autonomously replicating sequence +S000000163 ORF Verified YBL067C UBP13 ubiquitin-specific protease UBP13 chromosome 2 L000003172 2 95882 93639 C 2011-02-03 2004-07-16|1997-01-28|1999-04-26|2011-02-03 Ubiquitin-specific protease that cleaves Ub-protein fusions; UBP13 has a paralog, UBP9, that arose from the whole genome duplication +S000030367 CDS YBL067C 2 95882 93639 C 2011-02-03 2004-07-16|1997-01-28|1999-04-26|2011-02-03 +S000000161 ORF Dubious YBL065W chromosome 2 2 99963 100307 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF SEF1/YBL066C; YBL065W is a non-essential gene +S000037539 CDS YBL065W 2 99963 100307 W 2011-02-03 1997-01-28 +S000000162 ORF Verified YBL066C SEF1 chromosome 2 L000003318 2 100115 96669 C 2011-02-03 2004-07-16|1999-04-26|1997-01-28 Putative transcription factor; has homolog in Kluyveromyces lactis +S000030204 CDS YBL066C 2 100115 96669 C 2011-02-03 2004-07-16|1997-01-28|1999-04-26 +S000000160 ORF Verified YBL064C PRX1 thioredoxin peroxidase PRX1 chromosome 2 2 101156 100371 C 2011-02-03 1997-01-28 Mitochondrial peroxiredoxin with thioredoxin peroxidase activity; has a role in reduction of hydroperoxides; reactivation requires Trr2p and glutathione; induced during respiratory growth and oxidative stress; phosphorylated; protein abundance increases in response to DNA replication stress +S000037361 CDS YBL064C 2 101156 100371 C 2011-02-03 1997-01-28 +S000000159 ORF Verified YBL063W KIP1 CIN9 chromosome 2 L000000907 2 101886 105221 W 2011-02-03 1997-01-28 Kinesin-related motor protein; required for mitotic spindle assembly, chromosome segregation, and 2 micron plasmid partitioning; functionally redundant with Cin8p for chromosomal but not plasmid functions +S000037298 CDS YBL063W 2 101886 105221 W 2011-02-03 1997-01-28 +S000000158 ORF Dubious YBL062W chromosome 2 2 105308 105688 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036607 CDS YBL062W 2 105308 105688 W 2011-02-03 1997-01-28 +S000000157 ORF Verified YBL061C SKT5 CSD4|CHS4|CAL2 chromosome 2 L000001911|L000000332 2 107406 105316 C 2011-02-03 1997-01-28 Activator of Chs3p (chitin synthase III) during vegetative growth; recruits Chs3p to the bud neck via interaction with Bni4p; SKT5 has a paralog, SHC1, that arose from the whole genome duplication +S000036460 CDS YBL061C 2 107406 105316 C 2011-02-03 1997-01-28 +S000000156 ORF Verified YBL060W YEL1 Arf family guanine nucleotide exchange factor YEL1 chromosome 2 2 107932 109995 W 2011-02-03 1997-01-28 Guanine nucleotide exchange factor specific for Arf3p; localized to the bud neck and tip; required for localization of Arf3p to the bud neck and tip +S000036446 CDS YBL060W 2 107932 109995 W 2011-02-03 1997-01-28 +S000007488 ORF Verified YBL059C-A CMC2 chromosome 2 2 110539 110125 C 2011-02-03 2000-12-01 Protein involved in respiratory chain complex assembly or maintenance; protein of the mitochondrial intermembrane space; contains twin Cx9C motifs that can form coiled coil-helix-coiled-coil helix fold +S000032274 CDS YBL059C-A 2 110420 110125 C 2011-02-03 2000-12-01 +S000032273 CDS YBL059C-A 2 110539 110506 C 2011-02-03 2000-12-01 +S000032275 intron YBL059C-A 2 110505 110421 C 2011-02-03 2000-12-01 +S000000155 ORF Uncharacterized YBL059W chromosome 2 2 110594 111244 W 2011-02-03 1997-01-28 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YBL059W has a paralog, YER093C-A, that arose from the whole genome duplication +S000035392 CDS YBL059W 2 110594 110879 W 2011-02-03 1997-01-28 +S000035393 CDS YBL059W 2 110949 111244 W 2011-02-03 1997-01-28 +S000035394 intron YBL059W 2 110880 110948 W 2011-02-03 1997-01-28 +S000000154 ORF Verified YBL058W SHP1 protein phosphatase regulator SHP1|UBX1 chromosome 2 L000002746 2 111437 112708 W 2011-02-03 1997-01-28 UBX domain-containing substrate adaptor for Cdc48p; ubiquitin regulatory X domain-containing protein that acts as a substrate recruiting cofactor for Cdc48p; positively regulates Glc7p PPase activity to promote growth and mitotic progression in complex with Cdc48p; ubiquitinated protein interactor involved in ER-associated degradation (ERAD); regulated by nuclear Ub-dependent degradation (INMAD pathway) independent of the Asi and Doa10 complexes; homolog of human p47 (NSFL1C) +S000034369 CDS YBL058W 2 111437 112708 W 2011-02-03 1997-01-28 +S000000153 ORF Verified YBL057C PTH2 aminoacyl-tRNA hydrolase chromosome 2 2 113427 112801 C 2011-02-03 1997-01-28|2011-02-03 One of two mitochondrially-localized peptidyl-tRNA hydrolases; negatively regulates the ubiquitin-proteasome pathway via interactions with ubiquitin-like ubiquitin-associated proteins; dispensable for cell growth; see also PTH1 +S000034185 CDS YBL057C 2 113427 112801 C 2011-02-03 1997-01-28|2011-02-03 +S000000152 ORF Verified YBL056W PTC3 type 2C protein phosphatase PTC3 chromosome 2 L000003426 2 113762 115168 W 2011-02-03 1997-01-28|2011-02-03 Type 2C protein phosphatase (PP2C); dephosphorylates Hog1p (see also Ptc2p) to limit maximal kinase activity induced by osmotic stress; dephosphorylates T169 phosphorylated Cdc28p (see also Ptc2p); role in DNA damage checkpoint inactivation; PTC3 has a paralog, PTC2, that arose from the whole genome duplication +S000034127 CDS YBL056W 2 113762 115168 W 2011-02-03 1997-01-28|2011-02-03 +S000000151 ORF Verified YBL055C 3'-5'-exodeoxyribonuclease|Tat-D chromosome 2 2 116829 115573 C 2011-02-03 1997-01-28 3'-->5' exonuclease and endonuclease with a possible role in apoptosis; has similarity to mammalian and C. elegans apoptotic nucleases +S000033245 CDS YBL055C 2 116829 115573 C 2011-02-03 1997-01-28 +S000000150 ORF Verified YBL054W TOD6 PBF1 chromosome 2 2 117589 119166 W 2011-02-03 1997-01-28 PAC motif binding protein involved in rRNA and ribosome biogenesis; subunit of the RPD3L histone deacetylase complex; Myb-like HTH transcription factor; hypophosphorylated by rapamycin treatment in a Sch9p-dependent manner; activated in stochastic pulses of nuclear localization +S000033217 CDS YBL054W 2 117589 119166 W 2011-02-03 1997-01-28 +S000000149 ORF Dubious YBL053W chromosome 2 2 119335 119709 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033156 CDS YBL053W 2 119335 119709 W 2011-02-03 1997-01-28 +S000000148 ORF Verified YBL052C SAS3 KAT6 chromosome 2 L000003280 2 121874 119379 C 2011-02-03 1997-01-28 Histone acetyltransferase catalytic subunit of NuA3 complex; acetylates histone H3, involved in transcriptional silencing; homolog of the mammalian MOZ proto-oncogene; mutant has aneuploidy tolerance; sas3gcn5 double mutation is lethal +S000032250 CDS YBL052C 2 121874 119379 C 2011-02-03 1997-01-28 +S000000147 ORF Verified YBL051C PIN4 MDT1 chromosome 2 2 124759 122753 C 2011-02-03 1997-01-28 Protein involved in G2/M phase progression and response to DNA damage; interacts with Rad53p; contains an RNA recognition motif, a nuclear localization signal, and several SQ/TQ cluster domains; hyperphosphorylated in response to DNA damage +S000032171 CDS YBL051C 2 124759 122753 C 2011-02-03 1997-01-28 +S000000146 ORF Verified YBL050W SEC17 RNS3 chromosome 2 L000001841 2 125125 126119 W 2011-02-03 1997-01-28 Alpha-SNAP cochaperone; SNARE-complex adaptor for Sec18 (NSF) during the disassembly of postfusion cis-SNARE complexes; stimulates the ATPase activity of Sec18p; peripheral membrane protein required for vesicular transport between ER and Golgi, the 'priming' step in homotypic vacuole fusion, and autophagy; similar to mammalian alpha-SNAP +S000032144 CDS YBL050W 2 125125 125154 W 2011-02-03 1997-01-28 +S000032145 CDS YBL050W 2 125271 126119 W 2011-02-03 1997-01-28 +S000032146 intron YBL050W 2 125155 125270 W 2011-02-03 1997-01-28 +S000000145 ORF Verified YBL049W MOH1 chromosome 2 2 126828 127244 W 2011-02-03 1997-01-28 Protein of unknown function, essential for stationary phase survival; not required for growth on nonfermentable carbon sources; possibly linked with vacuolar transport +S000031247 CDS YBL049W 2 126828 127244 W 2011-02-03 1997-01-28 +S000000144 ORF Dubious YBL048W RRT1 chromosome 2 2 127299 127610 W 2011-02-03 1997-01-28 Protein of unknown function; identified in a screen for mutants with increased levels of rDNA transcription; dubious open reading frame unlikely to encode a protein, based on experimental and comparative sequence data +S000031090 CDS YBL048W 2 127299 127610 W 2011-02-03 1997-01-28 +S000000143 ORF Verified YBL047C EDE1 BUD15 chromosome 2 2 132040 127895 C 2011-02-03 1997-01-28 Scaffold protein involved in the formation of early endocytic sites; putative regulator of cytokinesis; homo-oligomerization is required for localization to and organization of endocytic sites; has a network of interactions with other endocytic proteins; binds membranes in a ubiquitin-dependent manner; may also bind ubiquitinated membrane-associated proteins; interacts with Cmk2 and functions upstream of CMK2 in regulating non-apoptotic cell death; homolog of mammalian Eps15 +S000030056 CDS YBL047C 2 132040 127895 C 2011-02-03 1997-01-28 +S000000142 ORF Verified YBL046W PSY4 HSM6 chromosome 2 2 132424 133749 W 2011-02-03 1997-01-28 Regulatory subunit of protein phosphatase PP4; presence of Psy4p in the PP4 complex (along with catalytic subunit Pph3p and Psy2p) is required for dephosphorylation of the histone variant H2AX, but not for dephosphorylation of Rad53p, during recovery from the DNA damage checkpoint; localization is cell-cycle dependent and regulated by Cdc28p phosphorylation; required for cisplatin resistance; homolog of mammalian R2 +S000030008 CDS YBL046W 2 132424 133749 W 2011-02-03 1997-01-28 +S000000141 ORF Verified YBL045C COR1 ubiquinol--cytochrome-c reductase subunit COR1|QCR1 chromosome 2 L000000381 2 135516 134143 C 2011-02-03 1997-01-28 Core subunit of the ubiquinol-cytochrome c reductase complex; the ubiquinol-cytochrome c reductase complex (bc1 complex) is a component of the mitochondrial inner membrane electron transport chain +S000037896 CDS YBL045C 2 135516 134143 C 2011-02-03 1997-01-28 +S000000140 ORF Uncharacterized YBL044W chromosome 2 2 135998 136366 W 2011-02-03 1997-01-28 Putative protein of unknown function; YBL044W is not an essential protein +S000037855 CDS YBL044W 2 135998 136366 W 2011-02-03 1997-01-28 +S000000139 ORF Verified YBL043W ECM13 chromosome 2 L000003888 2 136688 137461 W 2011-02-03 1997-01-28 Non-essential protein of unknown function; induced by treatment with 8-methoxypsoralen and UVA irradiation; ECM13 has a paralog, YJR115W, that arose from the whole genome duplication +S000037081 CDS YBL043W 2 136688 137461 W 2011-02-03 1997-01-28 +S000000138 ORF Verified YBL042C FUI1 uridine permease chromosome 2 L000004437 2 140260 138341 C 2011-02-03 1997-01-28 High affinity uridine permease, localizes to the plasma membrane; also mediates low but significant transport of the cytotoxic nucleoside analog 5-fluorouridine; not involved in uracil transport; relative distribution to the vacuole increases upon DNA replication stress +S000036981 CDS YBL042C 2 140260 138341 C 2011-02-03 1997-01-28 +S000000137 ORF Verified YBL041W PRE7 proteasome core particle subunit beta 6|PRS3 chromosome 2 L000002699 2 141247 141972 W 2011-02-03 1997-01-28 Beta 6 subunit of the 20S proteasome +S000036959 CDS YBL041W 2 141247 141972 W 2011-02-03 1997-01-28 +S000000136 ORF Verified YBL040C ERD2 chromosome 2 L000000567 2 142868 142112 C 2011-02-03 1997-01-28 HDEL receptor; an integral membrane protein that binds to the HDEL motif in proteins destined for retention in the endoplasmic reticulum; has a role in maintenance of normal levels of ER-resident proteins +S000036161 CDS YBL040C 2 142749 142112 C 2011-02-03 1997-01-28 +S000036160 CDS YBL040C 2 142868 142847 C 2011-02-03 1997-01-28 +S000036162 intron YBL040C 2 142846 142750 C 2011-02-03 1997-01-28 +S000028517 ORF Uncharacterized YBL039W-B YBL039W-A chromosome 2 2 143393 143572 W 2011-02-03 2003-07-29 Putative protein of unknown function; mCherry fusion protein localizes to the vacuole +S000030292 CDS YBL039W-B 2 143393 143572 W 2011-02-03 2003-07-29 +S000178042 ARS ARS206 chromosome 2 2 143658 143745 2014-11-18 2014-11-18 Autonomously replicating sequence +S000028814 ORF Dubious YBL039C-A chromosome 2 2 145031 144948 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF URA7; identified by expression profiling and mass spectrometry +S000033616 CDS YBL039C-A 2 145031 144948 C 2011-02-03 2003-07-29 +S000000135 ORF Verified YBL039C URA7 CTP synthase URA7 chromosome 2 L000002436 2 145728 143989 C 2011-02-03 1997-01-28 Major CTP synthase isozyme (see also URA8); catalyzes the ATP-dependent transfer of the amide nitrogen from glutamine to UTP, forming CTP, the final step in de novo biosynthesis of pyrimidines; involved in phospholipid biosynthesis; capable of forming cytoplasmic filaments termed cytoophidium, especially during conditions of glucose depletion; URA7 has a paralog, URA8, that arose from the whole genome duplication +S000035182 CDS YBL039C 2 145728 143989 C 2011-02-03 1997-01-28 +S000000134 ORF Verified YBL038W MRPL16 RML16|mitochondrial 54S ribosomal protein YmL47|YmL47 chromosome 2 L000001165 2 146187 146885 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; homologous to bacterial L16 ribosomal protein; synthetic lethality with hac1 mutation suggests a possible role in synthesis of precursors for protein glycosylation +S000035077 CDS YBL038W 2 146187 146885 W 2011-02-03 1997-01-28 +S000000133 ORF Verified YBL037W APL3 chromosome 2 L000003322 2 147209 150286 W 2011-02-03 1997-01-28 Alpha-adaptin; large subunit of the clathrin associated protein complex (AP-2); involved in vesicle mediated transport +S000034928 CDS YBL037W 2 147209 150286 W 2011-02-03 1997-01-28 +S000000132 ORF Verified YBL036C chromosome 2 2 151220 150447 C 2011-02-03 1997-01-28 Putative non-specific single-domain racemase; based on structural similarity; binds pyridoxal 5'-phosphate; expression of GFP-fusion protein induced in response to the DNA-damaging agent MMS +S000033968 CDS YBL036C 2 151220 150447 C 2011-02-03 1997-01-28 +S000000131 ORF Verified YBL035C POL12 DNA-directed DNA polymerase alpha subunit POL12 chromosome 2 L000002698 2 153610 151493 C 2011-02-03 1997-01-28 B subunit of DNA polymerase alpha-primase complex; required for initiation of DNA replication during mitotic and premeiotic DNA synthesis; also functions in telomere capping and length regulation +S000033851 CDS YBL035C 2 153610 151493 C 2011-02-03 1997-01-28 +S000000130 ORF Verified YBL034C STU1 chromosome 2 L000002138 2 158389 153848 C 2011-02-03 1997-01-28 Component of the mitotic spindle; binds to interpolar microtubules via its association with beta-tubulin (Tub2p); required for interpolar microtubules to provide an outward force on the spindle poles +S000033728 CDS YBL034C 2 158389 153848 C 2011-02-03 1997-01-28 +S000000129 ORF Verified YBL033C RIB1 GTP cyclohydrolase II chromosome 2 L000001634 2 159693 158656 C 2011-02-03 1999-04-22|1997-01-28 GTP cyclohydrolase II; catalyzes the first step of the riboflavin biosynthesis pathway +S000033070 CDS YBL033C 2 159693 158656 C 2011-02-03 1999-04-22|1997-01-28 +S000000128 ORF Verified YBL032W HEK2 KHD1 chromosome 2 2 160184 161329 W 2011-02-03 1997-01-28 RNA binding protein involved in asymmetric localization of ASH1 mRNA; represses translation of ASH1 mRNA, an effect reversed by Yck1p-dependent phosphoryation; regulates telomere position effect and length; similarity to hnRNP-K +S000033035 CDS YBL032W 2 160184 161329 W 2011-02-03 1997-01-28 +S000000127 ORF Verified YBL031W SHE1 chromosome 2 L000002867 2 161699 162715 W 2011-02-03 1997-01-28 Mitotic spindle protein; interacts with components of the Dam1 (DASH) complex, its effector Sli15p, and microtubule-associated protein Bim1p; also localizes to nuclear microtubules and to the bud neck in a ring-shaped structure; inhibits dynein function +S000032946 CDS YBL031W 2 161699 162715 W 2011-02-03 1997-01-28 +S000000126 ORF Verified YBL030C PET9 ADP/ATP carrier protein PET9|OP1|ANC2|AAC2 chromosome 2 L000000004|L000001386|L000004346 2 163997 163041 C -20 2011-02-03 1997-01-28 Major ADP/ATP carrier of the mitochondrial inner membrane; exchanges cytosolic ADP for mitochondrially synthesized ATP; also imports heme and ATP; required for viability in many lab strains that carry a sal1 mutation; PET9 has a paralog, AAC3, that arose from the whole genome duplication; human homolog SLC25A4 implicated in progressive external ophthalmoplegia can complement yeast null mutant +S000032782 CDS YBL030C 2 163997 163041 C 2011-02-03 1997-01-28 +S000007591 ORF Verified YBL029C-A chromosome 2 S000029022 2 164772 164488 C 2011-02-03 2001-02-26 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery; protein abundance increases in response to DNA replication stress; has potential orthologs in Saccharomyces species and in Yarrowia lipolytica +S000037103 CDS YBL029C-A 2 164772 164488 C 2011-02-03 2001-02-26 +S000000125 ORF Uncharacterized YBL029W chromosome 2 2 166134 167264 W 2011-02-03 1997-01-28 Non-essential protein of unknown function +S000032107 CDS YBL029W 2 166134 167264 W 2011-02-03 1997-01-28 +S000000124 ORF Verified YBL028C chromosome 2 2 167838 167518 C 2011-02-03 1997-01-28 Protein of unknown function that may interact with ribosomes; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; predicted to be involved in ribosome biogenesis +S000031894 CDS YBL028C 2 167838 167518 C 2011-02-03 1997-01-28 +S000000123 ORF Verified YBL027W RPL19B eL19|ribosomal 60S subunit protein L19B|L19e|rpl5L|YL14|L23B|L19B chromosome 2 L000001719|L000001718 2 168423 169376 W 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L19B; rpl19a and rpl19b single null mutations result in slow growth, while the double null mutation is lethal; homologous to mammalian ribosomal protein L19, no bacterial homolog; RPL19B has a paralog, RPL19A, that arose from the whole genome duplication +S000031846 CDS YBL027W 2 168423 168424 W 2011-02-03 1997-01-28 +S000031847 CDS YBL027W 2 168809 169376 W 2011-02-03 1997-01-28 +S000031848 intron YBL027W 2 168425 168808 W 2011-02-03 1997-01-28 +S000118345 ARS ARS207 ARSII-170 chromosome 2 2 170173 170279 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178043 ARS_consensus_sequence ARS207 2 170223 170207 C 2014-11-18 2014-11-18 +S000000122 ORF Verified YBL026W LSM2 Sm-like protein LSM2|SNP3|SMX5 chromosome 2 L000003168 2 170623 171038 W 2011-02-03 1997-01-28 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000030858 CDS YBL026W 2 170623 170676 W 2011-02-03 1997-01-28 +S000030859 CDS YBL026W 2 170805 171038 W 2011-02-03 1997-01-28 +S000030860 intron YBL026W 2 170677 170804 W 2011-02-03 1997-01-28 +S000000121 ORF Verified YBL025W RRN10 chromosome 2 L000003279 2 171481 171918 W 2011-02-03 1997-01-28 Protein involved in promoting high level transcription of rDNA; subunit of UAF (upstream activation factor) for RNA polymerase I +S000030749 CDS YBL025W 2 171481 171918 W 2011-02-03 1997-01-28 +S000000120 ORF Verified YBL024W NCL1 tRNA (cytosine-C5-)-methyltransferase|TRM4 chromosome 2 2 172534 174588 W 2011-02-03 1997-01-28 S-adenosyl-L-methionine-dependent tRNA: m5C-methyltransferase; methylates cytosine to m5C at several positions in tRNAs and intron-containing pre-tRNAs; increases proportion of tRNALeu(CAA) with m5C at wobble position in response to hydrogen peroxide, causing selective translation of mRNA from genes enriched in TTG codon; loss of NCL1 confers hypersensitivity to oxidative stress; similar to Nop2p and human proliferation associated nucleolar protein p120 +S000030630 CDS YBL024W 2 172534 174588 W 2011-02-03 1997-01-28 +S000000119 ORF Verified YBL023C MCM2 MCM DNA helicase complex subunit MCM2 chromosome 2 L000001038 2 177526 174920 C -31 2011-02-03 1997-01-28 Protein involved in DNA replication; component of the Mcm2-7 hexameric helicase complex that binds chromatin as a part of the pre-replicative complex; relative distribution to the nucleus increases upon DNA replication stress +S000037739 CDS YBL023C 2 177526 174920 C 2011-02-03 1997-01-28 +S000000118 ORF Verified YBL022C PIM1 ATP-dependent Lon protease PIM1|LON1 chromosome 2 L000000949|L000001440 2 181275 177874 C 2011-02-03 1997-01-28 ATP-dependent Lon protease; involved in degradation of misfolded proteins in mitochondria; required for biogenesis and maintenance of mitochondria +S000037690 CDS YBL022C 2 181275 177874 C 2011-02-03 1997-01-28 +S000000117 ORF Verified YBL021C HAP3 chromosome 2 L000000753 2 182094 181660 C 2011-02-03 1997-01-28 Subunit of the Hap2p/3p/4p/5p CCAAT-binding complex; complex is heme-activated and glucose-repressed; complex is a transcriptional activator and global regulator of respiratory gene expression; contains sequences contributing to both complex assembly and DNA binding +S000037614 CDS YBL021C 2 182094 181660 C 2011-02-03 1997-01-28 +S000000116 ORF Verified YBL020W RFT1 glycolipid translocation protein chromosome 2 L000001626 2 182401 184125 W 2011-02-03 1997-01-28 Membrane protein required for translocation of Man5GlcNac2-PP-Dol; required for translocation of Man5GlcNac2-PP-Dol from the cytoplasmic side to the lumenal side of the ER membrane but is not the flippase; mutation is suppressed by expression of human p53 protein; essential gene +S000037598 CDS YBL020W 2 182401 184125 W 2011-02-03 1997-01-28 +S000000115 ORF Verified YBL019W APN2 DNA-(apurinic or apyrimidinic site) lyase APN2|ETH1 chromosome 2 L000004434 2 184353 185915 W 2011-02-03 1997-01-28 Class II abasic (AP) endonuclease involved in repair of DNA damage; homolog of human HAP1 and E. coli exoIII +S000037877 CDS YBL019W 2 184353 185915 W 2011-02-03 1997-01-28 +S000000114 ORF Verified YBL018C POP8 ribonuclease P chromosome 2 L000004304 2 186474 185998 C 2011-02-03 1997-01-28 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; relocalizes to the cytosol in response to hypoxia +S000035953 CDS YBL018C 2 186352 185998 C 2011-02-03 1997-01-28 +S000035952 CDS YBL018C 2 186474 186428 C 2011-02-03 1997-01-28 +S000035954 intron YBL018C 2 186427 186353 C 2011-02-03 1997-01-28 +S000000113 ORF Verified YBL017C PEP1 type I sorting receptor|VPT1|VPS10 chromosome 2 L000001373 2 191583 186844 C -8 2011-02-03 1997-01-28 Type I transmembrane sorting receptor for multiple vacuolar hydrolases; cycles between the late-Golgi and prevacuolar endosome-like compartments +S000035832 CDS YBL017C 2 191583 186844 C 2011-02-03 1997-01-28 +S000000112 ORF Verified YBL016W FUS3 mitogen-activated serine/threonine-protein kinase FUS3|DAC2 chromosome 2 L000000655 2 192451 193512 W -5 2011-02-03 1997-01-28 Mitogen-activated serine/threonine protein kinase involved in mating; phosphoactivated by Ste7p; substrates include Ste12p, Far1p, Bni1p, Sst2p; inhibits invasive growth during mating by phosphorylating Tec1p, promoting its; inhibits recruitment of Ste5p, Cdc42p-mediated asymmetry and mating morphogenesis +S000035775 CDS YBL016W 2 192451 193512 W 2011-02-03 1997-01-28 +S000000111 ORF Verified YBL015W ACH1 acetyl-CoA hydrolase chromosome 2 L000000021 2 194122 195702 W 2011-02-03 1997-01-28 Protein with CoA transferase activity; particularly for CoASH transfer from succinyl-CoA to acetate; has minor acetyl-CoA-hydrolase activity; phosphorylated; required for acetate utilization and for diploid pseudohyphal growth +S000035656 CDS YBL015W 2 194122 195702 W 2011-02-03 1997-01-28 +S000006796 long_terminal_repeat YBLCdelta7 chromosome 2 2 197320 197016 C 2011-02-03 2000-05-19|2007-04-05 Ty1 LTR +S000006600 tRNA_gene tI(AAU)B chromosome 2 L000003740 2 197494 197567 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000030373 noncoding_exon tI(AAU)B 2 197494 197567 W 2011-02-03 2000-05-19 +S000006574 tRNA_gene tG(GCC)B chromosome 2 L000003750 2 197699 197629 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000037887 noncoding_exon tG(GCC)B 2 197699 197629 C 2011-02-03 2000-05-19 +S000006797 long_terminal_repeat YBLWsigma1 YBLCsigma1 chromosome 2 2 197714 198054 W 2011-02-03 2000-05-19 Ty3 LTR +S000118997 ARS ARS231 ARSII-198|ARS207.5 chromosome 2 2 198313 198473 2014-11-18 2014-11-18|2006-10-02 Autonomously Replicating Sequence +S000178044 ARS_consensus_sequence ARS231 2 198385 198369 C 2014-11-18 2014-11-18 +S000000110 ORF Verified YBL014C RRN6 chromosome 2 L000001772 2 201748 199064 C 2011-02-03 1997-01-28|2011-02-03 Component of the core factor (CF) rDNA transcription factor complex; CF is required for transcription of 35S rRNA genes by RNA polymerase I and is composed of Rrn6p, Rrn7p, and Rrn11p +S000034605 CDS YBL014C 2 201748 199064 C 2011-02-03 1997-01-28|2011-02-03 +S000000109 ORF Verified YBL013W FMT1 methionyl-tRNA formyltransferase chromosome 2 2 202056 203261 W 2011-02-03 2004-01-29|1997-01-28 Methionyl-tRNA formyltransferase; catalyzes the formylation of initiator Met-tRNA in mitochondria; potential Cdc28p substrate +S000034585 CDS YBL013W 2 202056 203261 W 2011-02-03 2004-01-29|1997-01-28 +S000000107 ORF Verified YBL011W SCT1 bifunctional glycerol-3-phosphate/glycerone-phosphate O-acyltransferase SCT1|GAT2 chromosome 2 L000001820 2 203538 205817 W 2011-02-03 1997-01-28 Glycerol 3-phosphate/dihydroxyacetone phosphate sn-1 acyltransferase; dual substrate-specific acyltransferase of the glycerolipid biosynthesis pathway; prefers 16-carbon fatty acids; similar to Gpt2p; gene is constitutively transcribed +S000033576 CDS YBL011W 2 203538 205817 W 2011-02-03 1997-01-28 +S000000108 ORF Dubious YBL012C chromosome 2 2 203807 203406 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033578 CDS YBL012C 2 203807 203406 C 2011-02-03 1997-01-28 +S000000106 ORF Uncharacterized YBL010C chromosome 2 2 206949 206107 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein colocalizes with clathrin-coated vesicles +S000033474 CDS YBL010C 2 206949 206107 C 2011-02-03 1997-01-28 +S000000105 ORF Verified YBL009W ALK2 protein kinase ALK2 chromosome 2 2 207194 209224 W 2011-02-03 1997-01-28 Protein kinase; along with its paralog, ALK1, required for proper spindle positioning and nuclear segregation following mitotic arrest, proper organization of cell polarity factors in mitosis, proper localization of formins and polarity factors, and survival in cells that activate spindle assembly checkpoint; phosphorylated in response to DNA damage; ALK2 has a paralog, ALK1, that arose from the whole genome duplication; similar to mammalian haspins +S000033987 CDS YBL009W 2 207194 209224 W 2011-02-03 1997-01-28 +S000028529 ORF Uncharacterized YBL008W-A chromosome 2 2 209409 209648 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000030335 CDS YBL008W-A 2 209409 209648 W 2011-02-03 2003-07-29 +S000000104 ORF Verified YBL008W HIR1 chromosome 2 L000000776 2 209653 212175 W 2011-02-03 1997-01-28|2011-02-03 Subunit of the HIR complex; HIR is a nucleosome assembly complex involved in regulation of histone gene transcription; contributes to nucleosome formation, heterochromatic gene silencing, and formation of functional kinetochores +S000033882 CDS YBL008W 2 209653 212175 W 2011-02-03 1997-01-28|2011-02-03 +S000000103 ORF Verified YBL007C SLA1 cytoskeletal protein-binding protein SLA1 chromosome 2 L000001912 2 216366 212632 C 2011-02-03 1997-01-28 Cytoskeletal protein binding protein; required for assembly of the cortical actin cytoskeleton; interacts with proteins regulating actin dynamics and proteins required for endocytosis; found in the nucleus and cell cortex; has 3 SH3 domains +S000033661 CDS YBL007C 2 216366 212632 C 2011-02-03 1997-01-28 +S000028596 ORF Dubious YBL006W-A chromosome 2 2 216711 216860 W 2011-02-03 2004-01-29|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene LDB7/YBL006C +S000031377 CDS YBL006W-A 2 216711 216860 W 2011-02-03 2004-01-29|2003-07-29 +S000000102 ORF Verified YBL006C LDB7 RSC14 chromosome 2 2 217129 216587 C 2011-02-03 2004-01-29|1997-01-28 Component of the RSC chromatin remodeling complex; interacts with Rsc3p, Rsc30p, Npl6p, and Htl1p to form a module important for a broad range of RSC functions +S000030377 CDS YBL006C 2 217129 216587 C 2011-02-03 2004-01-29|1997-01-28 +S000000101 ORF Verified YBL005W PDR3 drug-responsive transcription factor PDR3|TPE2|AMY2 chromosome 2 L000002985|L000001363 2 217470 220400 W -10 2011-02-03 1997-01-28 Transcriptional activator of the pleiotropic drug resistance network; regulates expression of ATP-binding cassette (ABC) transporters through binding to cis-acting PDRE sites (PDR responsive elements); has a role in response to drugs and organic solvents; post-translationally up-regulated in cells lacking functional mitochondrial genome; involved in diauxic shift; relative distribution to nucleus increases upon DNA replication stress; APCC(Cdh1) substrate +S000030309 CDS YBL005W 2 217470 220400 W 2011-02-03 1997-01-28 +S000006804 long_terminal_repeat YBLWdelta8 chromosome 2 2 220895 221036 W 2011-02-03 2000-05-19 Ty1 LTR +S000006805 long_terminal_repeat YBLWdelta9 chromosome 2 2 221037 221370 W 2011-02-03 2000-05-19 Ty1 LTR +S000006808 LTR_retrotransposon YBLWTy1-1 Ty1 chromosome 2 2 221037 226952 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000002146 transposable_element_gene YBL005W-A gag protein chromosome 2 2 221330 222652 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000032539 CDS YBL005W-A 2 221330 222652 W 2011-02-03 1997-01-28 +S000002147 transposable_element_gene YBL005W-B gag-pol fusion protein chromosome 2 2 221330 226598 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032555 CDS YBL005W-B 2 221330 222634 W 2011-02-03 1997-01-28 +S000032556 CDS YBL005W-B 2 222636 226598 W 2011-02-03 1997-01-28 +S000032557 plus_1_translational_frameshift YBL005W-B 2 222635 222635 W 2011-02-03 1997-01-28 +S000006806 long_terminal_repeat YBLWdelta10 chromosome 2 2 226621 226952 W 2011-02-03 2000-05-19 Ty1 LTR +S000006720 tRNA_gene tS(AGA)B chromosome 2 L000003741 2 227075 227156 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032344 noncoding_exon tS(AGA)B 2 227075 227156 W 2011-02-03 2000-05-19 +S000000100 ORF Verified YBL004W UTP20 chromosome 2 2 227636 235117 W 2011-02-03 2001-05-29|1997-01-28 Component of the small-subunit (SSU) processome; SSU processome is involved in the biogenesis of the 18S rRNA +S000030137 CDS YBL004W 2 227636 235117 W 2011-02-03 2001-05-29|1997-01-28 +S000000099 ORF Verified YBL003C HTA2 histone H2A|H2A2 chromosome 2 L000000749|L000000828 2 235792 235394 C .2 2011-02-03 1997-01-28 Histone H2A; core histone protein required for chromatin assembly and chromosome function; one of two nearly identical (see also HTA1) subtypes; DNA damage-dependent phosphorylation by Mec1p facilitates DNA repair; acetylated by Nat4p +S000029974 CDS YBL003C 2 235792 235394 C 2011-02-03 1997-01-28 +S000000098 ORF Verified YBL002W HTB2 histone H2B chromosome 2 L000000830 2 236492 236887 W .2 2011-02-03 1997-01-28 Histone H2B; core histone protein required for chromatin assembly and chromosome function; nearly identical to HTB1; Rad6p-Bre1p-Lge1p mediated ubiquitination regulates reassembly after DNA replication, transcriptional activation, meiotic DSB formation and H3 methylation +S000037396 CDS YBL002W 2 236492 236887 W 2011-02-03 1997-01-28 +S000000097 ORF Verified YBL001C ECM15 chromosome 2 L000003890 2 237467 237153 C 2011-02-03 1997-01-28 Non-essential protein of unknown function; likely exists as tetramer, may be regulated by the binding of small-molecule ligands (possibly sulfate ions), may have a role in yeast cell-wall biogenesis +S000037284 CDS YBL001C 2 237467 237153 C 2011-02-03 1997-01-28 +S000118346 ARS ARS208 ARSII-238 chromosome 2 2 237787 237900 2014-11-18 2014-11-18|2006-08-30|2011-02-03 Autonomously Replicating Sequence +S000178045 ARS_consensus_sequence ARS208 2 237835 237819 C 2014-11-18 2014-11-18 +S000006464 centromere CEN2 CEN2 chromosome 2 L000000295 2 238207 238323 W 0 2011-02-03 2000-05-19 Chromosome II centromere +S000077260 centromere_DNA_Element_I CEN2 2 238207 238216 W 2011-02-03 2004-10-04 +S000077261 centromere_DNA_Element_II CEN2 2 238217 238298 W 2011-02-03 2004-10-04 +S000077262 centromere_DNA_Element_III CEN2 2 238299 238323 W 2011-02-03 2004-10-04 +S000000205 ORF Verified YBR001C NTH2 alpha,alpha-trehalase NTH2 chromosome 2 L000001281 2 241283 238941 C 2011-02-03 1997-01-28 Putative neutral trehalase, required for thermotolerance; may mediate resistance to other cellular stresses; NTH2 has a paralog, NTH1, that arose from the whole genome duplication +S000034705 CDS YBR001C 2 241283 238941 C 2011-02-03 1997-01-28 +S000000206 ORF Verified YBR002C RER2 ditrans,polycis-polyprenyl diphosphate synthase chromosome 2 L000004874 2 242568 241708 C 2011-02-03 1997-01-28 Forms the dehydrodolichyl diphosphate syntase (DDS) complex with NUS1; major enzyme of polyprenol synthesis in both the endoplasmic reticulum (ER) and in lipid droplets; participates in ER protein sorting; human ortholog DHDDS functionally complements the heat sensitive growth defect of a ts allele, and is associated with retinitis pigmentosa +S000035641 CDS YBR002C 2 242568 241708 C 2011-02-03 1997-01-28 +S000000207 ORF Verified YBR003W COQ1 trans-hexaprenyltranstransferase chromosome 2 L000000378 2 242809 244230 W 2011-02-03 1997-01-28 Hexaprenyl pyrophosphate synthetase; catalyzes the first step in ubiquinone (coenzyme Q) biosynthesis +S000035753 CDS YBR003W 2 242809 244230 W 2011-02-03 1997-01-28 +S000000208 ORF Verified YBR004C GPI18 GPI-anchor transamidase GPI18|FMP44 chromosome 2 2 245667 244366 C 2011-02-03 1997-01-28|2011-02-03 Functional ortholog of human PIG-V; PIG-V is a mannosyltransferase that transfers the second mannose in glycosylphosphatidylinositol biosynthesis; the authentic, non-tagged protein was localized to mitochondria +S000035794 CDS YBR004C 2 245667 244366 C 2011-02-03 1997-01-28|2011-02-03 +S000000209 ORF Verified YBR005W RCR1 SSH6 chromosome 2 2 245906 246547 W 2011-02-03 1997-01-28 Protein of the ER membrane involved in cell wall chitin deposition; may function in the endosomal-vacuolar trafficking pathway, helping determine whether plasma membrane proteins are degraded or routed to the plasma membrane; RCR1 has a paralog, RCR2, that arose from the whole genome duplication +S000035989 CDS YBR005W 2 245906 246547 W 2011-02-03 1997-01-28 +S000000210 ORF Verified YBR006W UGA2 succinate-semialdehyde dehydrogenase (NAD(P)(+))|UGA5 chromosome 2 S000007516 2 247010 248503 W 2011-02-03 1999-04-26|1997-01-28 Succinate semialdehyde dehydrogenase; involved in the utilization of gamma-aminobutyrate (GABA) as a nitrogen source; part of the 4-aminobutyrate and glutamate degradation pathways; localized to the cytoplasm +S000036842 CDS YBR006W 2 247010 248503 W 2011-02-03 1999-04-26|1997-01-28 +S000000211 ORF Verified YBR007C DSF2 chromosome 2 2 251016 248806 C 2011-02-03 1997-01-28|2011-02-03 Deletion suppressor of mpt5 mutation; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000036880 CDS YBR007C 2 251016 248806 C 2011-02-03 1997-01-28|2011-02-03 +S000000212 ORF Verified YBR008C FLR1 chromosome 2 L000003532 2 254209 252563 C 2011-02-03 1997-01-28 Plasma membrane transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; involved in efflux of fluconazole, diazaborine, benomyl, methotrexate, and other drugs; expression induced in cells treated with the mycotoxin patulin; relocalizes from nucleus to plasma membrane upon DNA replication stress +S000036932 CDS YBR008C 2 254209 252563 C 2011-02-03 1997-01-28 +S000114517 ARS ARS209 ARS209 chromosome 2 2 254998 255083 2014-11-18 2014-11-18|2006-03-02|2011-02-03 Autonomously Replicating Sequence; originally referred to as H4 ARS +S000178046 ARS_consensus_sequence ARS209 2 255041 255025 C 2014-11-18 2014-11-18 +S000000213 ORF Verified YBR009C HHF1 histone H4 chromosome 2 L000000770 2 255684 255373 C 2011-02-03 1997-01-28 Histone H4; core histone protein required for chromatin assembly and chromosome function; one of two identical histone proteins (see also HHF2); contributes to telomeric silencing; N-terminal domain involved in maintaining genomic integrity +S000037700 CDS YBR009C 2 255684 255373 C 2011-02-03 1997-01-28 +S000000214 ORF Verified YBR010W HHT1 histone H3|SIN2|BUR5 chromosome 2 L000000772 2 256331 256741 W 2011-02-03 1997-01-28 Histone H3; core histone protein required for chromatin assembly, part of heterochromatin-mediated telomeric and HM silencing; one of two identical histone H3 proteins (see HHT2); regulated by acetylation, methylation, and phosphorylation; H3K14 acetylation plays an important role in the unfolding of strongly positioned nucleosomes during repair of UV damage +S000030575 CDS YBR010W 2 256331 256741 W 2011-02-03 1997-01-28 +S000000215 ORF Verified YBR011C IPP1 inorganic diphosphatase IPP1|PPA1 chromosome 2 L000000872 2 257975 257112 C 2011-02-03 1997-01-28 Cytoplasmic inorganic pyrophosphatase (PPase); homodimer that catalyzes the rapid exchange of oxygens from Pi with water, highly expressed and essential for viability, active-site residues show identity to those from E. coli PPase +S000030655 CDS YBR011C 2 257975 257112 C 2011-02-03 1997-01-28 +S000006810 long_terminal_repeat YBRCdelta11 chromosome 2 2 258976 258670 C 2011-02-03 2000-05-19|2007-04-05 Ty1 LTR +S000000216 ORF Dubious YBR012C chromosome 2 2 259566 259147 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; expression induced by iron-regulated transcriptional activator Aft2p +S000030768 CDS YBR012C 2 259566 259147 C 2011-02-03 1997-01-28 +S000006815 long_terminal_repeat YBRWdelta12 chromosome 2 2 259578 259909 W 2011-02-03 2000-05-19 Ty1 LTR +S000006821 LTR_retrotransposon YBRWTy1-2 Ty1 chromosome 2 2 259578 265494 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000002154 transposable_element_gene YBR012W-A gag protein chromosome 2 2 259869 261191 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000031588 CDS YBR012W-A 2 259869 261191 W 2011-02-03 1997-01-28 +S000002155 transposable_element_gene YBR012W-B gag-pol fusion protein chromosome 2 2 259869 265140 W 2011-02-03 1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000031594 CDS YBR012W-B 2 259869 261173 W 2011-02-03 1997-01-28 +S000031595 CDS YBR012W-B 2 261175 265140 W 2011-02-03 1997-01-28 +S000031596 plus_1_translational_frameshift YBR012W-B 2 261174 261174 W 2011-02-03 1997-01-28 +S000006816 long_terminal_repeat YBRWdelta13 chromosome 2 2 265163 265494 W 2011-02-03 2000-05-19 Ty1 LTR +S000000217 ORF Uncharacterized YBR013C chromosome 2 2 265881 265492 C 2011-02-03 1997-01-28 Putative protein of unknown function; haploid deletion mutant exhibits synthetic phenotype with alpha-synuclein; SWAT-GFP fusion protein localizes to the endoplasmic reticulum while mCherry fusion protein localizes to both the endoplasmic reticulum and vacuole +S000030875 CDS YBR013C 2 265881 265492 C 2011-02-03 1997-01-28 +S000006811 long_terminal_repeat YBRCdelta14 chromosome 2 2 266256 266178 C 2007-04-05 2000-05-19|2007-04-05 Ty1 LTR +S000006737 tRNA_gene tT(AGU)B chromosome 2 L000003742 2 266378 266450 W 2004-07-16 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000032147 noncoding_exon tT(AGU)B 2 266378 266450 W 2004-07-16 2000-05-19 +S000000218 ORF Verified YBR014C GRX7 glutathione-disulfide reductase GRX7 chromosome 2 2 267336 266725 C 2004-07-16 1997-01-28 Cis-golgi localized monothiol glutaredoxin; more similar in activity to dithiol than other monothiol glutaredoxins; involved in the oxidative stress response; does not bind metal ions; GRX7 has a paralog, GRX6, that arose from the whole genome duplication +S000031840 CDS YBR014C 2 267336 266725 C 2004-07-16 1997-01-28 +S000000219 ORF Verified YBR015C MNN2 alpha-1,2-mannosyltransferase MNN2|LDB8|CRV4|TTP1 chromosome 2 L000002385 2 269503 267710 C 2004-07-16 1997-01-28 Alpha-1,2-mannosyltransferase; responsible for addition of the first alpha-1,2-linked mannose to form the branches on the mannan backbone of oligosaccharides, localizes to an early Golgi compartment +S000032017 CDS YBR015C 2 269503 267710 C 2004-07-16 1997-01-28 +S000000220 ORF Verified YBR016W chromosome 2 2 270247 270633 W 2004-07-16 1997-01-28 Tail-anchored plasma membrane protein with a conserved CYSTM module; predicted to be palmitoylated; has similarity to hydrophilins, which are involved in the adaptive response to hyperosmotic conditions; YBR016W has a paralog, YDL012C, that arose from the whole genome duplication +S000032998 CDS YBR016W 2 270247 270633 W 2004-07-16 1997-01-28 +S000000221 ORF Verified YBR017C KAP104 chromosome 2 L000003444 2 273703 270947 C 2004-07-16 1997-01-28 Transportin or cytosolic karyopherin beta 2; functions in the rg-nuclear localization signal-mediated nuclear import/reimport of mRNA-binding proteins Nab2p and Hrp1p; regulates asymmetric protein synthesis in daughter cells during mitosis +S000033056 CDS YBR017C 2 273703 270947 C 2004-07-16 1997-01-28 +S000000222 ORF Verified YBR018C GAL7 UDP-glucose:hexose-1-phosphate uridylyltransferase chromosome 2 L000000662 2 275527 274427 C 7 2004-07-16 1997-01-28 Galactose-1-phosphate uridyl transferase; synthesizes glucose-1-phosphate and UDP-galactose from UDP-D-glucose and alpha-D-galactose-1-phosphate in the second step of galactose catabolism; human homolog UGP2 can complement yeast null mutant +S000033134 CDS YBR018C 2 275527 274427 C 2004-07-16 1997-01-28 +S000000223 ORF Verified YBR019C GAL10 bifunctional UDP-glucose 4-epimerase/aldose 1-epimerase chromosome 2 L000000663 2 278352 276253 C 7 2004-07-16 1997-01-28 UDP-glucose-4-epimerase; catalyzes interconversion of UDP-galactose and UDP-D-glucose in galactose metabolism; also catalyzes conversion of alpha-D-glucose or alpha-D-galactose to their beta-anomers; human homolog GALE implicated in galactosemia, can complement yeast null mutant +S000033206 CDS YBR019C 2 278352 276253 C 2004-07-16 1997-01-28 +S000000224 ORF Verified YBR020W GAL1 galactokinase chromosome 2 L000000658 2 279021 280607 W 7 2004-07-16 1997-01-28 Galactokinase; phosphorylates alpha-D-galactose to alpha-D-galactose-1-phosphate in the first step of galactose catabolism; expression regulated by Gal4p; human homolog GALK2 complements yeast null mutant; GAL1 has a paralog, GAL3, that arose from the whole genome duplication +S000034916 CDS YBR020W 2 279021 280607 W 2004-07-16 1997-01-28 +S000000225 ORF Verified YBR021W FUR4 uracil permease chromosome 2 L000000652 2 281443 283344 W 8 2004-07-16 1997-01-28 Plasma membrane localized uracil permease; expression is tightly regulated by uracil levels and environmental cues; conformational alterations induced by unfolding or substrate binding result in Rsp5p-mediated ubiquitination and degradation +S000035064 CDS YBR021W 2 281443 283344 W 2004-07-16 1997-01-28 +S000000226 ORF Verified YBR022W POA1 ADP-ribose 1''-phosphate phosphatase chromosome 2 2 283738 284271 W 2004-07-16 1997-01-28 Phosphatase that is highly specific for ADP-ribose 1''-phosphate; a tRNA splicing metabolite; may have a role in regulation of tRNA splicing +S000035171 CDS YBR022W 2 283738 284271 W 2004-07-16 1997-01-28 +S000000227 ORF Verified YBR023C CHS3 chitin synthase CHS3|KTI2|DIT101|CSD2|CAL1 chromosome 2 L000000331 2 287925 284428 C 9 2004-07-16 1997-01-28 Chitin synthase III; catalyzes the transfer of N-acetylglucosamine (GlcNAc) to chitin; required for synthesis of the majority of cell wall chitin, the chitin ring during bud emergence, and spore wall chitosan; contains overlapping di-leucine and di-acidic signals that mediate, respectively, intracellular trafficking by AP-1 and trafficking to plasma membrane by exomer complex; requires AP-3 complex for its intracellular retention +S000035205 CDS YBR023C 2 287925 284428 C 2004-07-16 1997-01-28 +S000000228 ORF Verified YBR024W SCO2 putative thioredoxin peroxidase SCO2 chromosome 2 L000001816 2 289445 290350 W 2004-07-16 1997-01-28 Protein anchored to mitochondrial inner membrane; may have a redundant function with Sco1p in delivery of copper to cytochrome c oxidase; interacts with Cox2p; SCO2 has a paralog, SCO1, that arose from the whole genome duplication +S000036144 CDS YBR024W 2 289445 290350 W 2004-07-16 1997-01-28 +S000000229 ORF Verified YBR025C OLA1 Obg-like ATPase chromosome 2 2 291865 290681 C 2004-07-16 1997-01-28 P-loop ATPase with similarity to human OLA1 and bacterial YchF; identified as specifically interacting with the proteasome; null mutant displays increased translation rate and increased readthrough of premature stop codons; protein abundance increases in response to hydrogen peroxide and to DNA replication stress +S000036196 CDS YBR025C 2 291865 290681 C 2004-07-16 1997-01-28 +S000000230 ORF Verified YBR026C ETR1 MRF1'|MRF1 chromosome 2 L000002810 2 294019 292877 C 2004-07-16 1997-01-28 2-enoyl thioester reductase; member of the medium chain dehydrogenase/reductase family; localized to mitochondria, where it has a probable role in fatty acid synthesis; human MECR functionally complements the respiratory growth defect of the null mutant +S000031678 CDS YBR026C 2 294019 292877 C 2004-07-16 1997-01-28 +S000000231 ORF Uncharacterized YBR027C chromosome 2 2 294356 294024 C 2004-07-16 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YBR027C is not an essential gene +S000031824 CDS YBR027C 2 294356 294024 C 2004-07-16 1997-01-28 +S000000232 ORF Verified YBR028C YPK3 putative protein kinase YPK3 chromosome 2 2 296002 294425 C 2004-07-16 1997-01-28 AGC kinase; phosphorylated by cAMP-dependent protein kinase (PKA) in a TORC1-dependent manner; directly phosphorylated by TORC1; phosphorylates ribosomal protein Rps6a/b (S6), in a TORC-dependent manner; undergoes autophosphorylation +S000031957 CDS YBR028C 2 296002 294425 C 2004-07-16 1997-01-28 +S000000233 ORF Verified YBR029C CDS1 phosphatidate cytidylyltransferase|CDG1 chromosome 2 L000002673 2 297742 296369 C 2004-07-16 1997-01-28 Phosphatidate cytidylyltransferase (CDP-diglyceride synthetase); an enzyme that catalyzes that conversion of CTP + phosphate into diphosphate + CDP-diaclglyerol, a critical step in the synthesis of all major yeast phospholipids; human homolog CDS1 can complement yeast cds1 null mutant +S000037428 CDS YBR029C 2 297742 296369 C 2004-07-16 1997-01-28 +S000000234 ORF Verified YBR030W RKM3 protein-lysine N-methyltransferase chromosome 2 2 298292 299950 W 2004-07-16 1997-01-28 Ribosomal lysine methyltransferase; specific for monomethylation of Rpl42ap and Rpl42bp (lysine 40); nuclear SET domain containing protein; relocalizes to the cytosol in response to hypoxia +S000037095 CDS YBR030W 2 298292 299950 W 2004-07-16 1997-01-28 +S000000235 ORF Verified YBR031W RPL4A uL4|ribosomal 60S subunit protein L4A|L4|rp2|YL2|L4A|L2A chromosome 2 L000001701 2 300166 301254 W 2004-07-16 1997-01-28 Ribosomal 60S subunit protein L4A; N-terminally acetylated; homologous to mammalian ribosomal protein L4 and bacterial L4; RPL4A has a paralog, RPL4B, that arose from the whole genome duplication +S000037181 CDS YBR031W 2 300166 301254 W 2004-07-16 1997-01-28 +S000000236 ORF Uncharacterized YBR032W chromosome 2 2 301519 301821 W 2004-07-16 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YBR032W is not an essential gene +S000037283 CDS YBR032W 2 301519 301821 W 2004-07-16 1997-01-28 +S000000237 ORF Uncharacterized YBR033W EDS1 chromosome 2 2 301944 304703 W 2004-07-16 1997-01-28 Putative zinc cluster protein, predicted to be a transcription factor; not an essential gene; EDS1 has a paralog, RGT1, that arose from the whole genome duplication +S000037351 CDS YBR033W 2 301944 304703 W 2004-07-16 1997-01-28 +S000000238 ORF Verified YBR034C HMT1 protein-arginine omega-N methyltransferase HMT1|RMT1|ODP1|HCP1 chromosome 2 L000002808|L000001296 2 305976 304930 C 2004-07-16 1997-01-28 Nuclear SAM-dependent mono- and asymmetric methyltransferase; modifies hnRNPs, including Npl3p and Hrp1p, affecting their activity and nuclear export; methylates U1 snRNP protein Snp1p, ribosomal protein Rps2p, and histones H3 and H4; interacts genetically with genes encoding components of Rpd3(L) and this interaction is important for Rpd3 recruitment to the subtelomeric region +S000037372 CDS YBR034C 2 305976 304930 C 2004-07-16 1997-01-28 +S000000239 ORF Verified YBR035C PDX3 pyridoxamine-phosphate oxidase PDX3 chromosome 2 L000001371 2 306955 306269 C 2004-07-16 1997-01-28 Pyridoxine (pyridoxamine) phosphate oxidase; has homologs in E. coli and Myxococcus xanthus; transcription is under the general control of nitrogen metabolism +S000030013 CDS YBR035C 2 306955 306269 C 2004-07-16 1997-01-28 +S000087162 snoRNA_gene snR161 SNR161 chromosome 2 2 307345 307185 C 2005-11-10 2005-11-10 H/ACA small nucleolar RNA (snoRNA); guides pseudouridylation of small subunit (SSU) rRNA at positions U632 and U766 +S000087163 noncoding_exon snR161 2 307345 307185 C 2005-11-10 2005-11-10 +S000006657 telomerase_RNA_gene TLC1 TLC1 TER1 chromosome 2 L000002315 2 307587 308887 W 2004-07-16 2000-05-19 RNA template component of telomerase; flexible scaffold that tethers telomerase holoenzyme protein subunits to the complex; contains template sequence that Est2p uses to add irregular repeats of TG(1-3) residues onto a DNA end; promoter regulated by the cell cycle dependent transcriptional activators Swi4p/Swi6p and Mbp1p/Swi6p +S000033066 noncoding_exon TLC1 2 307587 308887 W 2004-07-16 2000-05-19 +S000000240 ORF Verified YBR036C CSG2 mannosylinositol phosphorylceramide synthase regulatory subunit|CLS2 chromosome 2 L000002979|L000000427 2 310313 309081 C 2004-07-16 1997-01-28 Endoplasmic reticulum membrane protein; required for mannosylation of inositolphosphorylceramide and for growth at high calcium concentrations; protein abundance increases in response to DNA replication stress +S000030091 CDS YBR036C 2 310313 309081 C 2004-07-16 1997-01-28 +S000000241 ORF Verified YBR037C SCO1 Cu-binding protein SCO1|PET161 chromosome 2 L000001815 2 311452 310565 C 2011-02-03 1997-01-28 Copper-binding protein of mitochondrial inner membrane; required for cytochrome c oxidase activity and respiration; may function to deliver copper to cytochrome c oxidase; similar to thioredoxins; SCO1 has a paralog, SCO2, that arose from the whole genome duplication +S000030247 CDS YBR037C 2 311452 310565 C 2011-02-03 1997-01-28 +S000000242 ORF Verified YBR038W CHS2 chitin synthase CHS2 chromosome 2 L000000330 2 311898 314789 W 2011-02-03 1997-01-28 Chitin synthase II; catalyzes transfer of N-acetylglucosamine (GlcNAc) to chitin upon activation of zymogenic form; required for chitin synthesis in the primary septum during cytokinesis; localization regulated by Cdk1p during mitosis; phosphorylation by Dbf2p kinase regulates its dynamics and chitin synthesis during cytokinesis +S000033656 CDS YBR038W 2 311898 314789 W 2011-02-03 1997-01-28 +S000000243 ORF Verified YBR039W ATP3 F1F0 ATP synthase subunit gamma chromosome 2 L000000143 2 315575 316510 W 2004-07-16 1997-01-28 Gamma subunit of the F1 sector of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis +S000033784 CDS YBR039W 2 315575 316510 W 2004-07-16 1997-01-28 +S000000244 ORF Verified YBR040W FIG1 chromosome 2 L000003311 2 316968 317864 W 2004-07-16 1997-01-28 Integral membrane protein required for efficient mating; may participate in or regulate the low affinity Ca2+ influx system, which affects intracellular signaling and cell-cell fusion during mating +S000033389 CDS YBR040W 2 316968 317864 W 2004-07-16 1997-01-28 +S000000245 ORF Verified YBR041W FAT1 long-chain fatty acid transporter FAT1 chromosome 2 L000003201 2 318266 320275 W 2004-07-16 2004-01-21|1997-01-28 Very long chain fatty acyl-CoA synthetase and fatty acid transporter; activates imported fatty acids with a preference for very long lengths (C20-C26); has a separate function in the transport of long chain fatty acids +S000033461 CDS YBR041W 2 318266 320275 W 2004-07-16 2004-01-21|1997-01-28 +S000000246 ORF Verified YBR042C CST26 putative acyltransferase|PSI1 chromosome 2 2 321609 320416 C 2004-07-16 1997-01-28 Acyltransferase; enzyme mainly responsible for the introduction of saturated very long chain fatty acids into neo-synthesized molecules of phosphatidylinositol; required for incorporation of stearic acid into phosphatidylinositol; affects chromosome stability when overexpressed; CST26 has a paralog, YDR018C, that arose from the whole genome duplication +S000033482 CDS YBR042C 2 321609 320416 C 2004-07-16 1997-01-28 +S000000247 ORF Verified YBR043C QDR3 AQR2 chromosome 2 2 323945 321876 C 2004-07-16 1997-01-28|2011-02-03 Multidrug transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; has a role in polyamine homeostasis; involved in spore wall asembly; sequence similarity to DTR1 and QDR1, and the triple mutant dtr1 qdr1 qdr3 exhibits reduced dityrosine fluorescence relative to the single mutants; expression is upregulated under polyamine stress; required for resistance to quinidine, barban, cisplatin, and bleomycin +S000033571 CDS YBR043C 2 323945 321876 C 2004-07-16 1997-01-28|2011-02-03 +S000000248 ORF Verified YBR044C TCM62 chromosome 2 2 326059 324341 C 2011-02-03 1997-01-28|2011-02-03 Protein involved in assembly of the succinate dehydrogenase complex; mitochondrial; putative chaperone +S000033606 CDS YBR044C 2 326059 324341 C 2011-02-03 1997-01-28|2011-02-03 +S000118347 ARS ARS211 ARSII-326 chromosome 2 2 326140 326375 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178047 ARS_consensus_sequence ARS211 2 326153 326169 W 2014-11-18 2014-11-18 +S000006769 tRNA_gene tV(UAC)B chromosome 2 L000003749 2 326865 326792 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000036275 noncoding_exon tV(UAC)B 2 326865 326792 C 2011-02-03 2000-05-19 +S000006817 long_terminal_repeat YBRWdelta15 chromosome 2 2 327069 327394 W 2011-02-03 2000-05-19 Ty1 LTR +S000006818 long_terminal_repeat YBRWdelta16 chromosome 2 2 327390 327704 W 2011-02-03 2000-05-19 Ty1 LTR +S000000249 ORF Verified YBR045C GIP1 protein phosphatase regulator GIP1 chromosome 2 L000003092 2 330092 328173 C 2011-02-03 1997-01-28|2011-02-03 Meiosis-specific regulatory subunit of the Glc7p protein phosphatase; regulates spore wall formation and septin organization, required for expression of some late meiotic genes and for normal localization of Glc7p +S000034552 CDS YBR045C 2 330092 328173 C 2011-02-03 1997-01-28|2011-02-03 +S000000250 ORF Verified YBR046C ZTA1 NADPH:quinone reductase chromosome 2 L000004168 2 331511 330507 C 2011-02-03 1997-01-28 NADPH-dependent quinone reductase; GFP-tagged protein localizes to the cytoplasm and nucleus; has similarity to E. coli quinone oxidoreductase and to human zeta-crystallin +S000034640 CDS YBR046C 2 331511 330507 C 2011-02-03 1997-01-28 +S000000251 ORF Uncharacterized YBR047W FMP23 chromosome 2 2 331833 332360 W 2011-02-03 1997-01-28 Putative protein of unknown function; proposed to be involved in iron or copper homeostasis; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000035689 CDS YBR047W 2 331833 332360 W 2011-02-03 1997-01-28 +S000000252 ORF Verified YBR048W RPS11B uS17|ribosomal 40S subunit protein S11B|S17|rp41B|YS12|S18B|S11B chromosome 2 L000001758 2 332831 333812 W 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S11 and bacterial S17; RPS11B has a paralog, RPS11A, that arose from the whole genome duplication +S000035808 CDS YBR048W 2 332831 332875 W 2011-02-03 1997-01-28 +S000035809 CDS YBR048W 2 333387 333812 W 2011-02-03 1997-01-28 +S000035810 intron YBR048W 2 332876 333386 W 2011-02-03 1997-01-28 +S000000253 ORF Verified YBR049C REB1 DNA-binding protein REB1|GRF2 chromosome 2 L000001601 2 336818 334386 C 2011-02-03 1997-01-28 RNA polymerase I enhancer binding protein; DNA binding protein that binds to genes transcribed by both RNA polymerase I and RNA polymerase II; required for termination of RNA polymerase I transcription; Reb1p bound to DNA acts to block RNA polymerase II readthrough transcription +S000035873 CDS YBR049C 2 336818 334386 C 2011-02-03 1997-01-28 +S000000255 ORF Dubious YBR051W chromosome 2 2 337988 338338 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the REG2/YBR050C regulatory subunit of the Glc7p type-1 protein phosphatase +S000036875 CDS YBR051W 2 337988 338338 W 2011-02-03 1997-01-28 +S000000254 ORF Verified YBR050C REG2 protein phosphatase regulator REG2 chromosome 2 L000004126 2 338199 337183 C 2011-02-03 1997-01-28 Regulatory subunit of the Glc7p type-1 protein phosphatase; involved with Reg1p, Glc7p, and Snf1p in regulation of glucose-repressible genes, also involved in glucose-induced proteolysis of maltose permease; REG2 has a paralog, REG1, that arose from the whole genome duplication +S000036783 CDS YBR050C 2 338199 337183 C 2011-02-03 1997-01-28 +S000000256 ORF Verified YBR052C RFS1 flavodoxin-like fold family protein chromosome 2 2 339352 338720 C 2011-02-03 1997-01-28 Protein of unknown function; member of a flavodoxin-like fold protein family that includes Pst2p and Ycp4p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; RFS1 has a paralog, PST2, that arose from the whole genome duplication +S000037575 CDS YBR052C 2 339352 338720 C 2011-02-03 1997-01-28 +S000000257 ORF Uncharacterized YBR053C chromosome 2 2 340751 339675 C 2011-02-03 1997-01-28 Putative protein of unknown function; induced by cell wall perturbation +S000037643 CDS YBR053C 2 340751 339675 C 2011-02-03 1997-01-28 +S000000258 ORF Verified YBR054W YRO2 chromosome 2 L000002548 2 343101 344135 W 2011-02-03 1997-01-28 Protein with a putative role in response to acid stress; null mutant is sensitive to acetic acid; transcription is regulated by Haa1p and induced in the presence of acetic acid; protein observed in plasma membrane foci in the presence of acetic acid; the authentic, non-tagged protein is detected in a phosphorylated state in highly purified mitochondria in high-throughput studies +S000037737 CDS YBR054W 2 343101 344135 W 2011-02-03 1997-01-28 +S000000259 ORF Verified YBR055C PRP6 U4/U6-U5 snRNP complex subunit PRP6|TSM7269|RNA6 chromosome 2 L000001499 2 347301 344602 C 33 2011-02-03 1997-01-28 Splicing factor; component of the U4/U6-U5 snRNP complex +S000037759 CDS YBR055C 2 347301 344602 C 2011-02-03 1997-01-28 +S000006648 tRNA_gene tL(UAA)B2 chromosome 2 L000003743 2 347603 347686 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000035757 noncoding_exon tL(UAA)B2 2 347603 347686 W 2011-02-03 2000-05-19 +S000000260 ORF Verified YBR056W 17-beta-hydroxysteroid dehydrogenase-like protein chromosome 2 2 347879 349384 W 2011-02-03 1997-01-28 Putative glycoside hydrolase of the mitochondrial intermembrane space +S000030661 CDS YBR056W 2 347879 349384 W 2011-02-03 1997-01-28 +S000006819 long_terminal_repeat YBRWdelta17 chromosome 2 2 350459 350751 W 2011-02-03 2000-05-19 Ty1 LTR +S000006691 tRNA_gene tQ(UUG)B chromosome 2 L000003744 2 350827 350898 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000031659 noncoding_exon tQ(UUG)B 2 350827 350898 W 2011-02-03 2000-05-19 +S000028736 ORF Uncharacterized YBR056W-A chromosome 2 2 351255 351455 W 2011-02-03 2003-07-29 Protein of unknown function; mRNA identified as translated by ribosome profiling data; partially overlaps dubious ORF YBR056C-B; YBR056W-A has a paralog, YDR034W-B, that arose from the whole genome duplication +S000033380 CDS YBR056W-A 2 351255 351455 W 2011-02-03 2003-07-29 +S000087087 ORF Dubious YBR056C-B chromosome 2 2 351451 351293 C 2011-02-03 2005-11-08 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the dubious ORF YBR056W-A +S000087088 CDS YBR056C-B 2 351451 351293 C 2011-02-03 2005-11-08 +S000000261 ORF Verified YBR057C MUM2 SPOT8 chromosome 2 L000003595|L000002013 2 353293 352193 C 31 2011-02-03 1997-01-28 Protein essential for meiotic DNA replication and sporulation; cytoplasmic protein; subunit of the MIS complex which controls mRNA methylation during during the induction of sporulation; also interacts with Orc2p, which is a component of the origin recognition complex +S000030712 CDS YBR057C 2 353293 352193 C 2011-02-03 1997-01-28 +S000000262 ORF Verified YBR058C UBP14 ubiquitin-specific protease UBP14|GID6 chromosome 2 L000003173 2 356017 353672 C 2011-02-03 2003-09-22|1997-01-28 Ubiquitin-specific protease; specifically disassembles unanchored ubiquitin chains; involved in fructose-1,6-bisphosphatase (Fbp1p) degradation; similar to human isopeptidase T +S000030826 CDS YBR058C 2 356017 353672 C 2011-02-03 2003-09-22|1997-01-28 +S000007521 ORF Verified YBR058C-A TSC3 chromosome 2 2 356566 356324 C 2011-02-03 2000-06-19 Protein that stimulates the activity of serine palmitoyltransferase; involved in sphingolipid biosynthesis; Lcb1p and Lcb2p are the two components of serine palmitoyltransferase +S000036279 CDS YBR058C-A 2 356566 356324 C 2011-02-03 2000-06-19 +S000000263 ORF Verified YBR059C AKL1 serine/threonine protein kinase AKL1 chromosome 2 S000007479 2 360187 356861 C 2011-02-03 1997-01-28 Ser-Thr protein kinase; member (with Ark1p and Prk1p) of the Ark kinase family; involved in endocytosis and actin cytoskeleton organization +S000031795 CDS YBR059C 2 360187 356861 C 2011-02-03 1997-01-28 +S000000264 ORF Verified YBR060C ORC2 origin recognition complex subunit 2|SIR5|RRR1 chromosome 2 L000001776 2 362514 360652 C 2011-02-03 1997-01-28 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing; interacts with Spp1p and with trimethylated histone H3; phosphorylated by Cdc28p +S000031761 CDS YBR060C 2 362514 360652 C 2011-02-03 1997-01-28 +S000000265 ORF Verified YBR061C TRM7 tRNA methyltransferase TRM7 chromosome 2 2 365719 364787 C 2011-02-03 1997-01-28 2'-O-ribose methyltransferase; methylates the 2'-O-ribose of tRNA-Phe, tRNA-Trp, and tRNA-Leu at positions C32 and N34 of tRNA anticodon loop; crucial biological role likely modification of tRNA-Phe; interacts with Trm732p and Rtt10p in 2'-O-methylation of C32 and N34 substrate tRNAs, respectively; yeast null mutant can be functionally complemented by human FTSJ1, mutations in which have been implicated in nonsyndromic X-linked intellectual disability (NSXLID) +S000031905 CDS YBR061C 2 365719 364787 C 2011-02-03 1997-01-28 +S000000266 ORF Uncharacterized YBR062C chromosome 2 2 366600 365976 C 2011-02-03 2004-07-16|1997-01-28 Protein of unknown function that interacts with Msb2p; may play a role in activation of the filamentous growth pathway +S000032827 CDS YBR062C 2 366502 365976 C 2011-02-03 2004-07-16|1997-01-28 +S000032826 CDS YBR062C 2 366600 366585 C 2011-02-03 2004-07-16 +S000032828 intron YBR062C 2 366584 366503 C 2011-02-03 2004-07-16 +S000000268 ORF Dubious YBR064W chromosome 2 2 367763 368191 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YBR063C +S000033067 CDS YBR064W 2 367763 368191 W 2011-02-03 1997-01-28 +S000000267 ORF Uncharacterized YBR063C chromosome 2 2 368184 366970 C 2011-02-03 1997-01-28 Putative protein of unknown function; YBR063C is not an essential gene +S000032899 CDS YBR063C 2 368184 366970 C 2011-02-03 1997-01-28 +S000000269 ORF Verified YBR065C ECM2 SLT11 chromosome 2 L000003878 2 369678 368584 C 2011-02-03 1997-01-28 Pre-mRNA splicing factor; facilitates the cooperative formation of U2/U6 helix II in association with stem II in the spliceosome, function may be regulated by Slu7p +S000033674 CDS YBR065C 2 369678 368584 C 2011-02-03 1997-01-28 +S000000270 ORF Verified YBR066C NRG2 chromosome 2 L000004599 2 370699 370037 C 2011-02-03 1997-01-28 Transcriptional repressor; mediates glucose repression and negatively regulates filamentous growth; activated in stochastic pulses of nuclear localization in response to low glucose +S000033763 CDS YBR066C 2 370699 370037 C 2011-02-03 1997-01-28 +S000000271 ORF Verified YBR067C TIP1 putative lipase chromosome 2 L000002311 2 372735 372103 C 2011-02-03 1997-01-28 Major cell wall mannoprotein with possible lipase activity; transcription is induced by heat- and cold-shock; member of the Srp1p/Tip1p family of serine-alanine-rich proteins +S000033875 CDS YBR067C 2 372735 372103 C 2011-02-03 1997-01-28 +S000000272 ORF Verified YBR068C BAP2 branched-chain amino acid permease BAP2 chromosome 2 L000003157 2 375690 373861 C 2011-02-03 1997-01-28|2011-02-03 High-affinity leucine permease; functions as a branched-chain amino acid permease involved in uptake of leucine, isoleucine and valine; contains 12 predicted transmembrane domains; BAP2 has a paralog, BAP3, that arose from the whole genome duplication +S000034014 CDS YBR068C 2 375690 373861 C 2011-02-03 1997-01-28|2011-02-03 +S000000273 ORF Verified YBR069C TAT1 amino acid transporter TAT1|VAP1|TAP1 chromosome 2 L000002454|L000002262 2 378433 376574 C 2011-02-03 1997-01-28 Amino acid transporter for valine, leucine, isoleucine, and tyrosine; low-affinity tryptophan and histidine transporter; overexpression confers FK506 and FTY720 resistance; protein abundance increases in response to DNA replication stress +S000034884 CDS YBR069C 2 378433 376574 C 2011-02-03 1997-01-28 +S000130151 ARS ARS212 ARSII-379 chromosome 2 2 379221 379912 2011-02-03 2009-05-07 Autonomously Replicating Sequence +S000000274 ORF Verified YBR070C ALG14 N-acetylglucosaminyldiphosphodolichol N-acetylglucosaminyltransferase anchoring subunit ALG14 chromosome 2 2 379934 379221 C 2011-02-03 1997-01-28 Component of UDP-GlcNAc transferase; required for second step of dolichyl-linked oligosaccharide synthesis; anchors catalytic subunit Alg13p to ER membrane; similar to bacterial and human glycosyltransferases; both human homologs ALG13 and ALG14 are required to complement yeast alg14 mutant +S000035895 CDS YBR070C 2 379934 379221 C 2011-02-03 1997-01-28 +S000000275 ORF Verified YBR071W chromosome 2 2 380411 381046 W 2011-02-03 1997-01-28 Protein of unknown function found in the cytoplasm and bud neck; mRNA expression may be regulated by the cell cycle and/or cell wall stress; overexpression of YBR071W affects endocytic protein trafficking +S000036135 CDS YBR071W 2 380411 381046 W 2011-02-03 1997-01-28 +S000000276 ORF Verified YBR072W HSP26 chaperone protein HSP26 chromosome 2 L000000817 2 382030 382674 W 2011-02-03 1997-01-28 Small heat shock protein (sHSP) with chaperone activity; forms hollow, sphere-shaped oligomers that suppress unfolded proteins aggregation; long-lived protein that is preferentially retained in mother cells and forms cytoplasmic foci; oligomer activation requires heat-induced conformational change; also has mRNA binding activity +S000036920 CDS YBR072W 2 382030 382674 W 2011-02-03 1997-01-28 +S000028532 ORF Uncharacterized YBR072C-A chromosome 2 2 383021 382860 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031141 CDS YBR072C-A 2 383021 382860 C 2011-02-03 2003-07-29 +S000000277 ORF Verified YBR073W RDH54 DNA-dependent ATPase RDH54|TID1 chromosome 2 L000002988|L000003224 2 383112 385988 W 2011-02-03 2003-09-22|1997-01-28|2009-05-07|2011-02-03 DNA-dependent ATPase; DNA recombination/repair translocase, supercoils DNA and promotes DNA strand opening; stimulates strand exchange by modifying dsDNA topology; involved in recombinational repair of DNA double-strand breaks (DSBs) during mitosis and meiosis; phosphorylated in Mec1p-, Rad53p-dependent way in response to one DSB; contributes to remodelling of nucleosomes; proposed to be involved in crossover interference; interacts with Dmc1p; stimulates Dmc1p and Rad51p +S000036971 CDS YBR073W 2 383112 385988 W 2011-02-03 2003-09-22|1997-01-28|2009-05-07|2011-02-03 +S000000278 ORF Verified YBR074W PFF1 YBR075W chromosome 2 2 386286 389216 W 2011-02-03 2003-09-29|1997-01-28|2011-02-03 Multi-spanning vacuolar membrane protease; glycosylated transmembrane protein bearing homology to the M28 family of metalloproteases; has a lumenal-facing protease domain; proposed role in vacuole physiology +S000037055 CDS YBR074W 2 386286 389216 W 2011-02-03 2003-09-29|1997-01-28|2011-02-03 +S000130152 ARS ARS213 ARSII-390 chromosome 2 2 389212 390371 2011-02-03 2009-05-07|2011-02-03 Autonomously Replicating Sequence +S000000280 ORF Verified YBR076W ECM8 chromosome 2 L000003883 2 390227 391291 W 2011-02-03 1997-01-28|2011-02-03 Non-essential protein of unknown function +S000037886 CDS YBR076W 2 390227 391291 W 2011-02-03 1997-01-28|2011-02-03 +S000028533 ORF Dubious YBR076C-A chromosome 2 2 391617 391351 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene ECM8; identified by fungal homology and RT-PCR +S000031142 CDS YBR076C-A 2 391617 391351 C 2011-02-03 2003-07-29 +S000000281 ORF Verified YBR077C SLM4 GSE1|NIR1|EGO3 chromosome 2 2 392293 391805 C 2011-02-03 1997-01-28 Component of the EGO and GSE complexes; essential for integrity and function of EGO; EGO is involved in the regulation of microautophagy and GSE is required for proper sorting of amino acid permease Gap1p; gene exhibits synthetic genetic interaction with MSS4 +S000029854 CDS YBR077C 2 392293 391805 C 2011-02-03 1997-01-28 +S000000282 ORF Verified YBR078W ECM33 chromosome 2 L000003902 2 393123 394742 W 2011-02-03 1997-01-28|2011-02-03 GPI-anchored protein of unknown function; possible role in apical bud growth; GPI-anchoring on the plasma membrane crucial to function; phosphorylated in mitochondria; similar to Sps2p; ECM33 has a paralog, PST1, that arose from the whole genome duplication +S000030046 CDS YBR078W 2 393123 393180 W 2011-02-03 1997-01-28 +S000030047 CDS YBR078W 2 393511 394742 W 2011-02-03 1997-01-28|2011-02-03 +S000030048 intron YBR078W 2 393181 393510 W 2011-02-03 1997-01-28 +S000000283 ORF Verified YBR079C RPG1 translation initiation factor eIF3 core subunit a|TIF32 chromosome 2 L000004268 2 398277 395383 C 2011-02-03 1997-01-28 eIF3a subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; essential for translation; part of a Prt1p-Rpg1p-Nip1p subcomplex that stimulates binding of mRNA and tRNA(i)Met to ribosomes; involved in translation reinitiation; eIF3 is also involved in programmed stop codon readthrough +S000030963 CDS YBR079C 2 398277 395383 C 2011-02-03 1997-01-28 +S000000284 ORF Verified YBR080C SEC18 AAA family ATPase SEC18|ANU4 chromosome 2 L000001842 2 400890 398614 C 48 2011-02-03 1997-01-28 AAA ATPase and SNARE disassembly chaperone; required for vesicular transport between ER and Golgi, the 'priming' step in homotypic vacuole fusion, autophagy, and protein secretion; releases Sec17p from SNAP complexes; has similarity to mammalian N-ethylmaleimide-sensitive factor (NSF) +S000031072 CDS YBR080C 2 400890 398614 C 2011-02-03 1997-01-28 +S000000285 ORF Verified YBR081C SPT7 SAGA histone acetyltransferase complex subunit SPT7|GIT2 chromosome 2 L000002033 2 405251 401253 C 46 2011-02-03 1997-01-28 Subunit of the SAGA transcriptional regulatory complex; involved in proper assembly of the complex; also present as a C-terminally truncated form in the SLIK/SALSA transcriptional regulatory complex +S000032039 CDS YBR081C 2 405251 401253 C 2011-02-03 1997-01-28 +S000006708 tRNA_gene tR(UCU)B chromosome 2 L000003745 2 405878 405949 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA); decodes AGA codons into arginine; one of 19 nuclear tRNAs for arginine; part of dicistronic transcript with tD(GUC)B +S000037831 noncoding_exon tR(UCU)B 2 405878 405949 W 2011-02-03 2000-05-19 +S000006530 tRNA_gene tD(GUC)B chromosome 2 L000003746 2 405960 406031 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000037666 noncoding_exon tD(GUC)B 2 405960 406031 W 2011-02-03 2000-05-19 +S000000286 ORF Verified YBR082C UBC4 E2 ubiquitin-conjugating protein UBC4 chromosome 2 L000002407 2 407169 406628 C 2011-02-03 1997-01-28 Ubiquitin-conjugating enzyme (E2); key E2 partner with Ubc1p for the anaphase-promoting complex (APC); mediates degradation of abnormal or excess proteins, including calmodulin and histone H3; regulates levels of DNA Polymerase-{alpha} to promote efficient and accurate DNA replication; interacts with many SCF ubiquitin protein ligases; component of the cellular stress response; UBC4 has a paralog, UBC5, that arose from the whole genome duplication +S000032123 CDS YBR082C 2 407027 406628 C 2011-02-03 1997-01-28 +S000032122 CDS YBR082C 2 407169 407123 C 2011-02-03 1997-01-28 +S000032124 intron YBR082C 2 407122 407028 C 2011-02-03 1997-01-28 +S000118348 ARS ARS214 ARSII-408 chromosome 2 2 407953 408068 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178048 ARS_consensus_sequence ARS214 2 408004 407988 C 2014-11-18 2014-11-18 +S000000287 ORF Verified YBR083W TEC1 ROC1 chromosome 2 L000002276|L000001658 2 409169 410629 W 2011-02-03 1997-01-28 Transcription factor targeting filamentation genes and Ty1 expression; Ste12p activation of most filamentation gene promoters depends on Tec1p and Tec1p transcriptional activity is dependent on its association with Ste12p; binds to TCS elements upstream of filamentation genes, which are regulated by Tec1p/Ste12p/Dig1p complex; competes with Dig2p for binding to Ste12p/Dig1p; positive regulator of chronological life span; TEA/ATTS DNA-binding domain family member +S000032249 CDS YBR083W 2 409169 410629 W 2011-02-03 1997-01-28 +S000000288 ORF Verified YBR084W MIS1 trifunctional formate-tetrahydrofolate ligase/methenyltetrahydrofolate cyclohydrolase/methylenetetrahydrofolate dehydrogenase MIS1 chromosome 2 L000001115 2 411054 413981 W 2011-02-03 1997-01-28 Mitochondrial C1-tetrahydrofolate synthase; involved in interconversion between different oxidation states of tetrahydrofolate (THF); provides activities of formyl-THF synthetase, methenyl-THF cyclohydrolase, and methylene-THF dehydrogenase +S000033123 CDS YBR084W 2 411054 413981 W 2011-02-03 1997-01-28 +S000002156 ORF Verified YBR084C-A RPL19A eL19|ribosomal 60S subunit protein L19A|L19e|rpl5L|YL14|L23A|L19A chromosome 2 L000001720 2 415261 414186 C 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L19A; rpl19a and rpl19b single null mutations result in slow growth, while the double null mutation is lethal; homologous to mammalian ribosomal protein L19, no bacterial homolog; RPL19A has a paralog, RPL19B, that arose from the whole genome duplication +S000033730 CDS YBR084C-A 2 414753 414186 C 2011-02-03 1997-01-28 +S000033729 CDS YBR084C-A 2 415261 415260 C 2011-02-03 1997-01-28 +S000033731 intron YBR084C-A 2 415259 414754 C 2011-02-03 1997-01-28 +S000000289 ORF Verified YBR085W AAC3 ADP/ATP carrier protein AAC3|ANC3 chromosome 2 L000000005 2 415983 416906 W 2011-02-03 1997-01-28 Mitochondrial inner membrane ADP/ATP translocator; exchanges cytosolic ADP for mitochondrially synthesized ATP; expressed under anaerobic conditions; similar to Aac1p; has roles in maintenance of viability and in respiration; AAC3 has a paralog, PET9, that arose from the whole genome duplication +S000033180 CDS YBR085W 2 415983 416906 W 2011-02-03 1997-01-28 +S000118349 ARS ARS215 ARSII-418 chromosome 2 2 417784 418079 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication origin of very weak function +S000007522 ORF Verified YBR085C-A chromosome 2 2 419164 418907 C 2011-02-03 2000-07-14 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to the nucleus; protein abundance increases in response to DNA replication stress +S000037060 CDS YBR085C-A 2 419164 418907 C 2011-02-03 2000-07-14 +S000000290 ORF Verified YBR086C IST2 chromosome 2 2 423041 420201 C 2011-02-03 2003-01-03|1997-01-28 Cortical ER protein involved in ER-plasma membrane tethering; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to the plasma membrane (PM) and regulate PM phosphatidylinositol-4-phosphate (PI4P) levels by controlling access of Sac1p phosphatase to its substrate PI4P in the PM; localizes to the mother cell in small-budded cells and to the bud in medium- and large-budded cells; mRNA is transported to the bud tip by an actomyosin-driven process +S000033202 CDS YBR086C 2 423041 420201 C 2011-02-03 2003-01-03|1997-01-28 +S000000291 ORF Verified YBR087W RFC5 replication factor C subunit 5 chromosome 2 L000002843 2 423765 424829 W 2011-02-03 1997-01-28 Subunit of heteropentameric Replication factor C (RF-C); RF-C is a DNA binding protein and ATPase that acts as a clamp loader of the proliferating cell nuclear antigen (PCNA) processivity factor for DNA polymerases delta and epsilon +S000033291 CDS YBR087W 2 423765 424829 W 2011-02-03 1997-01-28 +S000000293 ORF Dubious YBR089W chromosome 2 2 425183 425782 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene POL30 +S000034297 CDS YBR089W 2 425183 425782 W 2011-02-03 1997-01-28 +S000000292 ORF Verified YBR088C POL30 proliferating cell nuclear antigen|PCNA chromosome 2 L000001463 2 425766 424990 C 2011-02-03 1997-01-28 Proliferating cell nuclear antigen (PCNA); functions as the sliding replication clamp for DNA polymerase delta; may function as a docking site for other proteins required for mitotic and meiotic chromosomal DNA replication and for DNA repair; PCNA ubiquitination at K164 plays a crucial role during Okazaki fragment processing +S000033330 CDS YBR088C 2 425766 424990 C 2011-02-03 1997-01-28 +S000002157 ORF Verified YBR089C-A NHP6B high-mobility group nucleosome-binding protein|YBR090C-A chromosome 2 L000001246 2 426489 426190 C 2011-02-03 1997-01-28|2011-02-03 High-mobility group (HMG) protein; binds to and remodels nucleosomes; involved in recruiting FACT and other chromatin remodelling complexes to the chromosomes; functionally redundant with Nhp6Ap; required for transcriptional initiation fidelity of some tRNA genes; homologous to mammalian HMGB1 and HMGB2; NHP6B has a paralog, NHP6A, that arose from the whole genome duplication +S000031885 CDS YBR089C-A 2 426489 426190 C 2011-02-03 1997-01-28|2011-02-03 +S000122092 five_prime_UTR_intron YBR089C-A 2 426873 426517 C 2011-02-03 2007-04-04 +S000000294 ORF Uncharacterized YBR090C chromosome 2 2 427058 426333 C 2011-02-03 1997-01-28|2011-02-03 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus +S000035423 CDS YBR090C 2 426516 426333 C 2011-02-03 1997-01-28|2011-02-03 +S000035422 CDS YBR090C 2 427058 426874 C 2011-02-03 1997-01-28 +S000035424 intron YBR090C 2 426873 426517 C 2011-02-03 1997-01-28 +S000000295 ORF Verified YBR091C TIM12 MRS5 chromosome 2 L000001181 2 427484 427155 C 2011-02-03 1997-01-28 Essential protein of the inner mitochondrial membrane; peripherally localized; component of the TIM22 complex, which is a twin-pore translocase that mediates insertion of numerous multispanning inner membrane proteins +S000036311 CDS YBR091C 2 427484 427155 C 2011-02-03 1997-01-28 +S000000296 ORF Verified YBR092C PHO3 acid phosphatase PHO3|phoC chromosome 2 L000001419 2 429101 427698 C 47 2011-02-03 1997-01-28 Constitutively expressed acid phosphatase similar to Pho5p; brought to the cell surface by transport vesicles; hydrolyzes thiamin phosphates in the periplasmic space, increasing cellular thiamin uptake; expression is repressed by thiamin +S000036423 CDS YBR092C 2 429101 427698 C 2011-02-03 1997-01-28 +S000000297 ORF Verified YBR093C PHO5 acid phosphatase PHO5|phoE chromosome 2 L000001421 2 430951 429548 C 47 2011-02-03 1997-01-28 Repressible acid phosphatase; 1 of 3 repressible acid phosphatases that also mediates extracellular nucleotide-derived phosphate hydrolysis; secretory pathway derived cell surface glycoprotein; induced by phosphate starvation and coordinately regulated by PHO4 and PHO2 +S000036491 CDS YBR093C 2 430951 429548 C 2011-02-03 1997-01-28 +S000000298 ORF Verified YBR094W PBY1 putative tubulin tyrosine ligase chromosome 2 2 432036 434297 W 2011-02-03 1997-01-28|2011-02-03 Putative tubulin tyrosine ligase associated with P-bodies; may have a role in mRNA metabolism; yeast knockout collection strain identified as a pby1 null mutant is actually wild-type for PBY1 and deleted for mms4 +S000037253 CDS YBR094W 2 432036 434297 W 2011-02-03 1997-01-28|2011-02-03 +S000000299 ORF Verified YBR095C RXT2 RAF60 chromosome 2 2 435698 434406 C 2011-02-03 2003-09-22|1997-01-28 Component of the histone deacetylase Rpd3L complex; possibly involved in cell fusion and invasive growth; relocalizes to the cytosol in response to hypoxia +S000037292 CDS YBR095C 2 435698 434406 C 2011-02-03 2003-09-22|1997-01-28 +S000000300 ORF Uncharacterized YBR096W chromosome 2 2 436021 436713 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the ER +S000037475 CDS YBR096W 2 436021 436713 W 2011-02-03 1997-01-28 +S000000301 ORF Verified YBR097W VPS15 ubiquitin-binding serine/threonine protein kinase VPS15|VPT15|VPS40|VPL19|VAC4|GRD8 chromosome 2 L000002470|L000002924|S000029641|L000002480 2 436951 441315 W 2011-02-03 1997-01-28|2011-02-03 Serine/threonine protein kinase involved in vacuolar protein sorting; functions as a membrane-associated complex with Vps34p; active form recruits Vps34p to the Golgi membrane; interacts with the GDP-bound form of Gpa1p; myristoylated; a fraction is localized, with Vps34p, to nuclear pores at nucleus-vacuole junctions and may facilitate transcription elongation for genes positioned at the nuclear periphery +S000030201 CDS YBR097W 2 436951 441315 W 2011-02-03 1997-01-28|2011-02-03 +S000000302 ORF Verified YBR098W MMS4 YBR100W|SLX2 chromosome 2 2 441515 443590 W 2011-02-03 2003-01-03|1997-01-28 Subunit of structure-specific Mms4p-Mus81p endonuclease; cleaves branched DNA; involved in recombination, DNA repair, and joint molecule formation/resolution during meiotic recombination; phosphorylation of the non-catalytic subunit Mms4p by Cdc28p and Cdc5p during mitotic cell cycle activates the function of Mms4p-Mus81p +S000030360 CDS YBR098W 2 441515 443590 W 2011-02-03 2003-01-03|1997-01-28 +S000000303 ORF Dubious YBR099C chromosome 2 2 443307 442924 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene MMS4 +S000030430 CDS YBR099C 2 443307 442924 C 2011-02-03 1997-01-28 +S000000305 ORF Verified YBR101C FES1 chromosome 2 2 444693 443821 C 2011-02-03 1997-01-28 Hsp70 (Ssa1p) nucleotide exchange factor; required for the release of misfolded proteins from the Hsp70 system to the Ub-proteasome machinery for destruction; cytosolic homolog of Sil1p, which is the nucleotide exchange factor for BiP (Kar2p) in the endoplasmic reticulum; protein abundance increases in response to DNA replication stress +S000036293 CDS YBR101C 2 444693 443821 C 2011-02-03 1997-01-28 +S000000306 ORF Verified YBR102C EXO84 exocyst subunit EXO84|USA3 chromosome 2 S000007470|L000003227 2 447323 445062 C 2011-02-03 1997-01-28 Exocyst subunit with dual roles in exocytosis and spliceosome assembly; subunit of the the exocyst complex which mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane (PM) prior to SNARE-mediated fusion; required for exocyst assembly and targeting the complex to specific sites on the bud tip PM; associates the U1 snRNP; role in pre-mRNA splicing and prespliceosome formation; possible Cdc28 substrate +S000036412 CDS YBR102C 2 447323 445062 C 2011-02-03 1997-01-28 +S000000307 ORF Verified YBR103W SIF2 EMB1 chromosome 2 2 447709 449316 W 2011-02-03 1997-01-28 WD40 repeat-containing subunit of Set3C histone deacetylase complex; complex represses early/middle sporulation genes; antagonizes telomeric silencing; binds specifically to the Sir4p N-terminus +S000037118 CDS YBR103W 2 447709 449316 W 2011-02-03 1997-01-28 +S000007593 ORF Dubious YBR103C-A chromosome 2 2 449463 449320 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by homology to related yeast +S000037105 CDS YBR103C-A 2 449463 449320 C 2011-02-03 2001-02-26 +S000000308 ORF Verified YBR104W YMC2 organic acid transporter chromosome 2 L000002521 2 449667 450656 W 2011-02-03 1997-01-28 Putative mitochondrial inner membrane transporter; proposed role in oleate metabolism and glutamate biosynthesis; member of the mitochondrial carrier (MCF) family; YMC2 has a paralog, YMC1, that arose from the whole genome duplication +S000037195 CDS YBR104W 2 449667 450656 W 2011-02-03 1997-01-28 +S000000309 ORF Verified YBR105C VID24 glucose-induced degradation complex subunit VID24|GID4 chromosome 2 L000004624 2 451969 450881 C 2011-02-03 1997-01-28 GID Complex regulatory subunit; binds GID Complex in response to glucose through interactions with complex member Vid28p; regulates fructose-1,6-bisphosphatase (FBPase) targeting to the vacuole; promotes proteasome-dependent catabolite degradation of FBPase; peripheral membrane protein located at Vid (vacuole import and degradation) vesicles +S000037212 CDS YBR105C 2 451969 450881 C 2011-02-03 1997-01-28 +S000000310 ORF Verified YBR106W PHO88 SND3 chromosome 2 L000003995 2 452658 453224 W 2011-02-03 1997-01-28 Protein involved in SRP-independent targeting of substrates to the ER; component of an alternative ER targeting pathway that has partial functional redundancy with the GET pathway; preference for substrates with downstream transmembrane domains; interacts with Snd1p, Env10p/Snd2p, and Sec61p-translocon subunits; can compensate for loss of SRP; role in phosphate transport, interacting with pho88, and in the maturation of secretory proteins +S000037352 CDS YBR106W 2 452658 453224 W 2011-02-03 1997-01-28 +S000000311 ORF Verified YBR107C IML3 MCM19 chromosome 2 L000004778 2 454530 453793 C 2011-02-03 1997-01-28 Outer kinetochore protein and component of the Ctf19 complex; involved in the establishment of pericentromeric cohesion during mitosis; prevents non-disjunction of sister chromatids during meiosis II; forms a stable complex with Chl4p; required for localization of Sgo1p to pericentric sites during meiosis I; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-L and fission yeast fta1 +S000037374 CDS YBR107C 2 454530 453793 C 2011-02-03 1997-01-28 +S000000312 ORF Verified YBR108W AIM3 chromosome 2 2 454822 457665 W 2011-02-03 2004-07-09|1997-01-28|2011-02-03 Protein that inhibits barbed-end actin filament elongation; interacts with Rvs167p; null mutant is viable and displays elevated frequency of mitochondrial genome loss +S000030057 CDS YBR108W 2 454822 457665 W 2011-02-03 2004-07-09|1997-01-28|2011-02-03 +S000000313 ORF Verified YBR109C CMD1 calmodulin|CaM chromosome 2 L000000365 2 458362 457919 C 53 2011-02-03 1997-01-28 Calmodulin; Ca2+ binding protein that regulates Ca2+ independent processes (mitosis, bud growth, actin organization, endocytosis, etc.) and Ca2+ dependent processes (stress-activated pathways), targets include Nuf1p, Myo2p and calcineurin; binds to the Hog1p MAPK in response to hyperosmotic stress; potentiates membrane tubulation and constriction mediated by the Rvs161p-Rvs167p complex; human CALM1 or CALM2 functionally complement repression induced inviability +S000030094 CDS YBR109C 2 458362 457919 C 2011-02-03 1997-01-28 +S000028737 ORF Dubious YBR109W-A chromosome 2 2 458608 458832 W 2011-02-03 2003-07-29 Putative protein of unknown function; questionable ORF from MIPS +S000033381 CDS YBR109W-A 2 458608 458832 W 2011-02-03 2003-07-29 +S000000314 ORF Verified YBR110W ALG1 chitobiosyldiphosphodolichol beta-1,4 mannosyltransferase chromosome 2 L000000076 2 458872 460221 W 54 2011-02-03 1997-01-28 Mannosyltransferase; involved in asparagine-linked glycosylation in the endoplasmic reticulum (ER); essential for viability; human homolog ALG1 complements yeast null mutant +S000032542 CDS YBR110W 2 458872 460221 W 2011-02-03 1997-01-28 +S000000315 ORF Verified YBR111C YSA1 ADP-ribose diphosphatase|RMA2 chromosome 2 L000002551 2 461873 461178 C 2011-02-03 1997-01-28 Nudix hydrolase family member with ADP-ribose pyrophosphatase activity; shown to metabolize O-acetyl-ADP-ribose to AMP and acetylated ribose 5'-phosphate +S000032550 CDS YBR111C 2 461873 461178 C 2011-02-03 1997-01-28 +S000028510 ORF Verified YBR111W-A SUS1 chromosome 2 2 462139 462579 W 2011-02-03 2003-12-17|2003-07-29 Component of both the SAGA histone acetylase and TREX-2 complexes; interacts with RNA polymerase II; involved in mRNA export coupled transcription activation and elongation; involved in post-transcriptional tethering of active genes to the nuclear periphery and to non-nascent mRNP +S000030260 CDS YBR111W-A 2 462139 462209 W 2011-02-03 2003-12-17|2003-07-29 +S000030261 CDS YBR111W-A 2 462290 462429 W 2011-02-03 2003-12-17|2003-07-29 +S000030263 CDS YBR111W-A 2 462500 462579 W 2011-02-03 2003-12-17 +S000030262 intron YBR111W-A 2 462210 462289 W 2011-02-03 2003-12-17|2003-07-29 +S000030264 intron YBR111W-A 2 462430 462499 W 2011-02-03 2003-12-17 +S000000317 ORF Dubious YBR113W chromosome 2 2 465566 466048 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CYC8 +S000033391 CDS YBR113W 2 465566 466048 W 2011-02-03 1997-01-28 +S000000316 ORF Verified YBR112C CYC8 transcription regulator CYC8|[OCT]|[OCT1+]|SSN6|CRT8 chromosome 2 L000000452 2 465770 462870 C 56 2011-02-03 1997-01-28 General transcriptional co-repressor; acts together with Tup1p; also acts as part of a transcriptional co-activator complex that recruits the SWI/SNF and SAGA complexes to promoters; can form the prion [OCT+] +S000032660 CDS YBR112C 2 465770 462870 C 2011-02-03 1997-01-28 +S000000318 ORF Verified YBR114W RAD16 DNA repair protein RAD16|PSO5 chromosome 2 L000004121|L000001565 2 467248 469620 W 58 2011-02-03 1997-01-28 Nucleotide excision repair (NER) protein; binds damaged DNA during NER; binds DNA in an ATP-dependent manner (with Rad7p) during NER; required for NER of non-transcribed chromatin; subunit of Nucleotide Excision Repair Factor 4 (NEF4) and the Elongin-Cullin-Socs (ECS) ligase complex +S000033462 CDS YBR114W 2 467248 469620 W 2011-02-03 1997-01-28 +S000000319 ORF Verified YBR115C LYS2 L-aminoadipate-semialdehyde dehydrogenase chromosome 2 L000000965 2 473926 469748 C 59 2011-02-03 1997-01-28 Alpha aminoadipate reductase; catalyzes the reduction of alpha-aminoadipate to alpha-aminoadipate 6-semialdehyde, which is the fifth step in biosynthesis of lysine; activation requires posttranslational phosphopantetheinylation by Lys5p +S000033483 CDS YBR115C 2 473926 469748 C 2011-02-03 1997-01-28 +S000000320 ORF Dubious YBR116C chromosome 2 2 474726 474199 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene TKL2 +S000033572 CDS YBR116C 2 474726 474199 C 2011-02-03 1997-01-28 +S000000321 ORF Verified YBR117C TKL2 transketolase TKL2 chromosome 2 L000002314 2 476437 474392 C 2011-02-03 1997-01-28 Transketolase; catalyzes conversion of xylulose-5-phosphate and ribose-5-phosphate to sedoheptulose-7-phosphate and glyceraldehyde-3-phosphate in the pentose phosphate pathway; needed for synthesis of aromatic amino acids; TKL2 has a paralog, TKL1, that arose from the whole genome duplication +S000033608 CDS YBR117C 2 476437 474392 C 2011-02-03 1997-01-28 +S000000322 ORF Verified YBR118W TEF2 translation elongation factor EF-1 alpha|eEF1A|EF-1 alpha chromosome 2 L000002278 2 477671 479047 W 61 2011-02-03 1997-01-28 Translational elongation factor EF-1 alpha; in the GTP-bound active form, binds to and delivers aminoacylated tRNA to the A-site of ribosomes for elongation of nascent polypeptides; associates with vacuolar Rho1p GTPase; TEF2-RFP levels increase during replicative aging; may also have a role in tRNA re-export from the nucleus; TEF2 has a paralog, TEF1, that arose from the whole genome duplication +S000034590 CDS YBR118W 2 477671 479047 W 2011-02-03 1997-01-28 +S000000323 ORF Verified YBR119W MUD1 U1A|U1-A chromosome 2 L000001217 2 479338 480323 W 2011-02-03 1997-01-28 U1 snRNP A protein; homolog of human U1-A; involved in nuclear mRNA splicing +S000034715 CDS YBR119W 2 479338 479345 W 2011-02-03 1997-01-28 +S000034716 CDS YBR119W 2 479435 480323 W 2011-02-03 1997-01-28 +S000034717 intron YBR119W 2 479346 479434 W 2011-02-03 1997-01-28 +S000000324 ORF Verified YBR120C CBP6 chromosome 2 L000000228 2 480923 480435 C 2011-02-03 1997-01-28 Mitochondrial protein required for translation of the COB mRNA; forms a complex with Cbp3p that binds to mt ribosomes near the polypeptide tunnel exit and promotes efficient translation of the COB mRNA; Cbp3p-Cbp6p complex also interacts with newly synthesized cytochrome b (Cobp) and Cbp4p to promote assembly of Cobp into the cytochrome bc1 complex; Cbp3p-Cbp6p complex is sequestered if assembly of Complex III is blocked, downregulating COB mRNA translation +S000035739 CDS YBR120C 2 480923 480435 C 2011-02-03 1997-01-28 +S000028815 ORF Dubious YBR121C-A chromosome 2 2 482484 482326 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely contained within the verified gene GRS1; identified by expression profiling and mass spectrometry +S000033618 CDS YBR121C-A 2 482484 482326 C 2011-02-03 2003-07-29 +S000000325 ORF Verified YBR121C GRS1 glycine--tRNA ligase chromosome 2 L000000738|L000000731 2 483367 481364 C 2011-02-03 1997-01-28|2011-02-03 Cytoplasmic and mitochondrial glycyl-tRNA synthase; ligates glycine to the cognate anticodon-bearing tRNA; transcription termination factor that may interact with the 3'-end of pre-mRNA to promote 3'-end formation; GRS1 has a paralog, GRS2, that arose from the whole genome duplication; human homolog GARS implicated in Charcot-Marie-Tooth disease, can complement yeast null mutant +S000036674 CDS YBR121C 2 483367 481364 C 2011-02-03 1997-01-28|2011-02-03 +S000000326 ORF Verified YBR122C MRPL36 mitochondrial 54S ribosomal protein YmL36|YmL36 chromosome 2 L000002531|L000001171 2 484503 483970 C 2011-02-03 2003-09-22|1997-01-28 Mitochondrial ribosomal protein of the large subunit; overproduction suppresses mutations in the COX2 leader peptide-encoding region +S000036725 CDS YBR122C 2 484503 483970 C 2011-02-03 2003-09-22|1997-01-28 +S000000328 ORF Dubious YBR124W chromosome 2 2 486507 486866 W 2011-02-03 1997-01-28 Putative protein of unknown function +S000037559 CDS YBR124W 2 486507 486866 W 2011-02-03 1997-01-28 +S000000327 ORF Verified YBR123C TFC1 transcription factor TFIIIC subunit TFC1|tau 95 chromosome 2 L000002285 2 486691 484742 C 2011-02-03 1997-01-28 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of the RNA polymerase III transcription initiation factor complex (TFIIIC); part of the TauA globular domain of TFIIIC that binds DNA at the BoxA promoter sites of tRNA and similar genes; human homolog is TFIIIC-63 +S000036794 CDS YBR123C 2 486691 484742 C 2011-02-03 1997-01-28 +S000118350 ARS ARS216 ARSII-487 chromosome 2 2 486707 486954 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178049 ARS_consensus_sequence ARS216 2 486859 486843 C 2014-11-18 2014-11-18 +S000000329 ORF Verified YBR125C PTC4 type 2C protein phosphatase PTC4|GCT1 chromosome 2 2 488380 487199 C 2011-02-03 1997-01-28 Cytoplasmic type 2C protein phosphatase (PP2C); identified as a high-copy number suppressor of cnb1 mpk1 synthetic lethality; overexpression decreases high-osmolarity induced Hog1p phosphorylation and kinase activity +S000037589 CDS YBR125C 2 488380 487199 C 2011-02-03 1997-01-28 +S000000330 ORF Verified YBR126C TPS1 alpha,alpha-trehalose-phosphate synthase (UDP-forming) TPS1|TSS1|GLC6|GGS1|FDP1|CIF1|BYP1 chromosome 2 L000002330 2 490392 488905 C 41 2011-02-03 1997-01-28 Synthase subunit of trehalose-6-P synthase/phosphatase complex; synthesizes the storage carbohydrate trehalose, which is critically important for survival of long-term desiccation; also found in a monomeric form; expression is induced by the stress response and repressed by the Ras-cAMP pathway; protein abundance increases in response to DNA replication stress and in response to prolonged exposure to boric acid +S000037645 CDS YBR126C 2 490392 488905 C 2011-02-03 1997-01-28 +S000028600 ORF Verified YBR126W-A MEO1 chromosome 2 2 490850 491056 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray analysis, and genome-wide homology searches; mRNA identified as translated by ribosome profiling data; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; partially overlaps the dubious ORF YBR126W-B +S000031400 CDS YBR126W-A 2 490850 491056 W 2011-02-03 2003-07-29 +S000028738 ORF Dubious YBR126W-B chromosome 2 2 490927 491070 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YBR126W-A; identified by SAGE +S000033382 CDS YBR126W-B 2 490927 491070 W 2011-02-03 2003-07-29 +S000000331 ORF Verified YBR127C VMA2 H(+)-transporting V1 sector ATPase subunit B|ATPSV|VAT2 chromosome 2 L000002458 2 492822 491269 C 2011-02-03 1997-01-28 Subunit B of V1 peripheral membrane domain of vacuolar H+-ATPase; electrogenic proton pump found throughout the endomembrane system; contains nucleotide binding sites; also detected in the cytoplasm; protein abundance increases in response to DNA replication stress; human homolog ATP6V1B1, implicated in autosomal-recessive distal renal tubular acidosis (RTA) with sensorineural deafness, complements yeast null mutant +S000037698 CDS YBR127C 2 492822 491269 C 2011-02-03 1997-01-28 +S000000332 ORF Verified YBR128C ATG14 APG14|CVT12 chromosome 2 L000004763|L000004641 2 494115 493081 C 2011-02-03 1997-01-28 Autophagy-specific subunit of phosphatidylinositol 3-kinase complex I; Atg14p targets complex I to the phagophore assembly site (PAS); required for localizing additional ATG proteins to the PAS; required for overflow degradation of misfolded proteins when ERAD is saturated; homolog of human Barkor; other members are Vps34, Vps15, and Vps30p +S000037772 CDS YBR128C 2 494115 493081 C 2011-02-03 1997-01-28 +S000000333 ORF Verified YBR129C OPY1 chromosome 2 L000004016 2 495339 494353 C 2011-02-03 1997-01-28 Protein of unknown function; overproduction blocks cell cycle arrest in the presence of mating pheromone; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000030622 CDS YBR129C 2 495339 494353 C 2011-02-03 1997-01-28 +S000000334 ORF Verified YBR130C SHE3 chromosome 2 L000004189|L000002868 2 496869 495592 C 2011-02-03 1997-01-28 Protein adaptor between Myo4p and the She2p-mRNA complex; part of the mRNA localization machinery that restricts accumulation of certain proteins to the bud; also required for cortical ER inheritance +S000030714 CDS YBR130C 2 496869 495592 C 2011-02-03 1997-01-28 +S000000335 ORF Verified YBR131W CCZ1 CVT16 chromosome 2 L000004556|L000004776|S000029129 2 497163 499277 W 2011-02-03 1997-01-28 Subunit of a heterodimeric guanine nucleotide exchange factor (GEF); subunit of the Mon1-Ccz1 GEF complex, which stimulates nucleotide exchange and activation of Ypt7p, a Rab family GTPase involved in membrane tethering and fusion events at the late endosome and vacuole; GEF activity is stimulated by membrane association and anionic phospholipids; involved in localizing Ypt7p to the vacuolar membrane; required for macroautophagy, the CVT pathway and mitophagy +S000031661 CDS YBR131W 2 497163 499277 W 2011-02-03 1997-01-28 +S000028601 ORF Dubious YBR131C-A chromosome 2 2 497739 497650 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YBR131W; identified by gene-trapping, microarray analysis, and genome-wide homology searches +S000031403 CDS YBR131C-A 2 497739 497650 C 2011-02-03 2003-07-29 +S000000336 ORF Verified YBR132C AGP2 chromosome 2 L000003947 2 501442 499652 C 2011-02-03 1997-01-28 Plasma membrane regulator of polyamine and carnitine transport; has similarity to transporters but lacks transport activity; may act as a sensor that transduces environmental signals; has a positive or negative regulatory effect on transcription of many transporter genes +S000031670 CDS YBR132C 2 501442 499652 C 2011-02-03 1997-01-28 +S000000338 ORF Dubious YBR134W chromosome 2 2 504243 504644 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032775 CDS YBR134W 2 504243 504644 W 2011-02-03 1997-01-28 +S000000337 ORF Verified YBR133C HSL7 protein arginine N-methyltransferase chromosome 2 L000003130 2 504287 501804 C 2011-02-03 1997-01-28 Protein arginine N-methyltransferase; exhibits septin and Hsl1p-dependent localization to the bud neck in budded cells and periodic Hsl1p-dependent phosphorylation; required with Hsl1p, and Elm1p for the mother-bud neck recruitment, phosphorylation, and degradation of Swe1p; interacts directly with Swe1p; relocalizes away from bud neck upon DNA replication stress; human homolog PRMT5 can complement yeast hsl7 mutant +S000031794 CDS YBR133C 2 504287 501804 C 2011-02-03 1997-01-28 +S000000339 ORF Verified YBR135W CKS1 cyclin-dependent protein kinase regulatory subunit CKS1 chromosome 2 L000000347 2 504854 505306 W 73 2011-02-03 1997-01-28 Cyclin-dependent protein kinase regulatory subunit and adaptor; interacts with Cdc28p (aka Cdk1p); required for G1/S and G2/M phase transitions and budding; mediates phosphorylation and degradation of Sic1p; modulates proteolysis of M-phase targets through interactions with the proteasome; role in transcriptional regulation, recruiting proteasomal subunits to target gene promoters; human homologs CKS1B and CKS2 can each complement yeast cks1 null mutant +S000032889 CDS YBR135W 2 504854 505306 W 2011-02-03 1997-01-28 +S000000340 ORF Verified YBR136W MEC1 protein kinase MEC1|RAD31|SAD3|ESR1 chromosome 2 L000000586|S000029404|S000007656 2 505668 512774 W 2011-02-03 1997-01-28 Genome integrity checkpoint protein and PI kinase superfamily member; Mec1p and Dun1p function in same pathway to regulate dNTP pools and telomere length; signal transducer required for cell cycle arrest and transcriptional responses to damaged or unreplicated DNA; facilitates replication fork progression and regulates P-body formation under replication stress; promotes interhomolog recombination by phosphorylating Hop1p; associates with shortened, dysfunctional telomeres +S000032977 CDS YBR136W 2 505668 512774 W 2011-02-03 1997-01-28 +S000000341 ORF Verified YBR137W chromosome 2 2 513044 513583 W 2011-02-03 1997-01-28|2011-02-03 Protein with a role in ER delivery of tail-anchored membrane proteins; interacts with Sgt2p; binds to the TRC complex, which inserts proteins into the ER membrane; interacts with Msn5p karyopherin; YBR137W is not an essential gene +S000033068 CDS YBR137W 2 513044 513583 W 2011-02-03 1997-01-28|2011-02-03 +S000000342 ORF Uncharacterized YBR138C HDR1 chromosome 2 L000003401 2 515336 513762 C 2011-02-03 1997-01-28|2011-02-03 Cytoplasmic protein of unknown function; APCC(Cdh1) substrate; potentially phosphorylated by Cdc28p; YBR138C is not an essential gene +S000033676 CDS YBR138C 2 515336 513762 C 2011-02-03 1997-01-28|2011-02-03 +S000000343 ORF Verified YBR139W carboxypeptidase C chromosome 2 2 515664 517190 W 2011-02-03 1997-01-28 Putative serine type carboxypeptidase; role in phytochelatin synthesis; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; expression induced by nitrogen limitation in a GLN3, GAT1-independent manner +S000033849 CDS YBR139W 2 515664 517190 W 2011-02-03 1997-01-28 +S000178050 ARS ARS217 chromosome 2 2 517185 517386 2014-11-18 2014-11-18 Autonomously replicating sequence +S000178051 ARS_consensus_sequence ARS217 2 517263 517247 C 2014-11-18 2014-11-18 +S000000344 ORF Verified YBR140C IRA1 GTPase-activating protein IRA1|PPD1|GLC1 chromosome 2 L000000704|L000000873 2 526628 517350 C 78 2011-02-03 1997-01-28 GTPase-activating protein; negatively regulates RAS by converting it from GTP- to the GDP-bound inactive form, required for reducing cAMP levels under nutrient limiting conditions, mediates membrane association of adenylate cyclase; mutations cause catalase T deficiency, defective glycogen synthesis and defective trehalose accumulation; IRA1 has a paralog, IRA2, that arose from the whole genome duplication; defects in human homolog NF1 are associated with neurofibromatosis +S000034687 CDS YBR140C 2 526628 517350 C 2011-02-03 1997-01-28 +S000028602 ORF Dubious YBR141W-A chromosome 2 2 527167 527262 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized ORF YBR141C; identified by gene-trapping, microarray analysis, and genome-wide homology searching +S000031405 CDS YBR141W-A 2 527167 527262 W 2011-02-03 2003-07-29 +S000000345 ORF Verified YBR141C BMT2 25S rRNA (adenine2142-N1)-methyltransferase chromosome 2 2 528038 527025 C 2011-02-03 1997-01-28|2011-02-03 Nucleolar S-adenosylmethionine-dependent rRNA methyltransferase; methylates adenine (m1A) of the large subunit (LSU) rRNA at position 2142; belongs to Rossmann fold superfamily; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; YBR141C is not an essential gene +S000034839 CDS YBR141C 2 528038 527025 C 2011-02-03 1997-01-28|2011-02-03 +S000000346 ORF Verified YBR142W MAK5 putative ATP-dependent RNA helicase chromosome 2 L000000979 2 528317 530638 W 80 2011-02-03 1997-01-28 Essential nucleolar protein; putative DEAD-box RNA helicase required for maintenance of M1 dsRNA virus; involved in biogenesis of large (60S) ribosomal subunits +S000035850 CDS YBR142W 2 528317 530638 W 2011-02-03 1997-01-28 +S000000347 ORF Verified YBR143C SUP45 translation termination factor eRF1|eRF1|SUP47|SUP1|SAL4 chromosome 2 L000002258|L000002206|S000029305|L000001134 2 532182 530869 C 81 2011-02-03 1997-01-28 Polypeptide release factor (eRF1) in translation termination; mutant form acts as a recessive omnipotent suppressor; methylated by Mtq2p-Trm112p in ternary complex eRF1-eRF3-GTP; mutation of methylation site confers resistance to zymocin; has a role in cytokinesis through interaction with Mlc1p +S000035896 CDS YBR143C 2 532182 530869 C 2011-02-03 1997-01-28 +S000000348 ORF Dubious YBR144C chromosome 2 2 533549 533235 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YBR144C is not an essential gene +S000036039 CDS YBR144C 2 533549 533235 C 2011-02-03 1997-01-28 +S000000349 ORF Verified YBR145W ADH5 alcohol dehydrogenase ADH5 chromosome 2 L000000045 2 533762 534817 W 2011-02-03 1997-01-28 Alcohol dehydrogenase isoenzyme V; involved in ethanol production; ADH5 has a paralog, ADH1, that arose from the whole genome duplication +S000036921 CDS YBR145W 2 533762 534817 W 2011-02-03 1997-01-28 +S000000350 ORF Verified YBR146W MRPS9 mitochondrial 37S ribosomal protein MRPS9 chromosome 2 L000001175 2 535260 536096 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit +S000036972 CDS YBR146W 2 535260 536096 W 2011-02-03 1997-01-28 +S000000351 ORF Verified YBR147W RTC2 cationic amino acid transporter|YPQ3|RRT11 chromosome 2 2 536575 537465 W 2011-02-03 1997-01-28 Putative vacuolar membrane transporter for cationic amino acids; likely contributes to amino acid homeostasis by exporting cationic amino acids from the vacuole; positive regulation by Lys14p suggests that lysine may be the primary substrate; member of the PQ-loop family, with seven transmembrane domains; similar to mammalian PQLC2 vacuolar transporter; RTC2 has a paralog, YPQ1, that arose from the whole genome duplication +S000037067 CDS YBR147W 2 536575 537465 W 2011-02-03 1997-01-28 +S000000352 ORF Verified YBR148W YSW1 chromosome 2 L000002553 2 537876 539705 W 2011-02-03 1997-01-28 Protein required for normal prospore membrane formation; interacts with Gip1p, which is the meiosis-specific regulatory subunit of the Glc7p protein phosphatase; expressed specifically in spores and localizes to the prospore membrane; YSW1 has a paralog, SPO21, that arose from the whole genome duplication +S000037151 CDS YBR148W 2 537876 539705 W 2011-02-03 1997-01-28 +S000000353 ORF Verified YBR149W ARA1 D-arabinose 1-dehydrogenase (NAD(P)(+)) ARA1 chromosome 2 L000004642 2 539987 541021 W 2011-02-03 1997-01-28 NADP+ dependent arabinose dehydrogenase; involved in carbohydrate metabolism; purified as homodimer; naturally occurs with a N-terminus degradation product +S000037890 CDS YBR149W 2 539987 541021 W 2011-02-03 1997-01-28 +S000000354 ORF Verified YBR150C TBS1 chromosome 2 2 544493 541209 C 2011-02-03 1997-01-28 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; TBS1 has a paralog, HAL9, that arose from the whole genome duplication +S000030836 CDS YBR150C 2 544493 541209 C 2011-02-03 1997-01-28 +S000000355 ORF Verified YBR151W APD1 chromosome 2 2 545028 545978 W 2011-02-03 1997-01-28 Protein of unknown function; required for normal localization of actin patches and for normal tolerance of sodium ions and hydrogen peroxide; localizes to both cytoplasm and nucleus +S000030957 CDS YBR151W 2 545028 545978 W 2011-02-03 1997-01-28 +S000000356 ORF Verified YBR152W SPP381 U4/U6-U5 snRNP complex subunit SPP381 chromosome 2 L000004711 2 546376 547251 W 2011-02-03 1997-01-28 mRNA splicing factor, component of U4/U6.U5 tri-snRNP; interacts genetically and physically with Prp38p; relocalizes to the cytosol in response to hypoxia +S000031058 CDS YBR152W 2 546376 547251 W 2011-02-03 1997-01-28 +S000000357 ORF Verified YBR153W RIB7 2,5-diamino-6-(ribosylamino)-4(3H)-pyrimidinone 5'-phosphate reductase chromosome 2 L000001637 2 547460 548194 W 2011-02-03 1997-01-28 Diaminohydroxyphoshoribosylaminopyrimidine deaminase; catalyzes the second step of the riboflavin biosynthesis pathway +S000032010 CDS YBR153W 2 547460 548194 W 2011-02-03 1997-01-28 +S000000358 ORF Verified YBR154C RPB5 DNA-directed RNA polymerase core subunit RPB5|ABC27 chromosome 2 L000001590|L000001679 2 549009 548362 C 2011-02-03 1997-01-28 RNA polymerase subunit ABC27; common to RNA polymerases I, II, and III; contacts DNA and affects transactivation +S000032044 CDS YBR154C 2 549009 548362 C 2011-02-03 1997-01-28 +S000077079 matrix_attachment_site ETC8 ETC8 chromosome 2 2 549229 549251 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; located between divergently transcribed genes RPB5 and CNS1 +S000000359 ORF Verified YBR155W CNS1 HSP70/90 family co-chaperone CNS1 chromosome 2 L000004495 2 549771 550928 W 2011-02-03 1997-01-28 TPR-containing co-chaperone; binds both Hsp82p (Hsp90) and Ssa1p (Hsp70); stimulates ATPase activity of Ssa1p; ts mutants reduce Hsp82p function, overexpression suppresses phenotypes of HSP82 ts allele and cpr7 deletion; human homolog TTC4 complements yeast cns1 mutant +S000032166 CDS YBR155W 2 549771 550928 W 2011-02-03 1997-01-28 +S000000360 ORF Verified YBR156C SLI15 chromosome 2 L000003320 2 553200 551104 C 2011-02-03 1997-01-28 Subunit of the conserved chromosomal passenger complex (CPC); complex regulates kinetochore-microtubule attachments, activation of the spindle tension checkpoint, and mitotic spindle disassembly; other complex members are Ipl1p, Bir1p, and Nbl1p +S000032209 CDS YBR156C 2 553200 551104 C 2011-02-03 1997-01-28 +S000000361 ORF Verified YBR157C ICS2 chromosome 2 2 554310 553543 C 2011-02-03 2004-01-21|1997-01-28 Protein of unknown function; null mutation does not confer any obvious defects in growth, spore germination, viability, or carbohydrate utilization +S000032276 CDS YBR157C 2 554310 553543 C 2011-02-03 2004-01-21|1997-01-28 +S000000362 ORF Verified YBR158W AMN1 CST13|ICS4 chromosome 2 L000002997 2 556549 558198 W 2011-02-03 1997-01-28 Protein required for daughter cell separation; multiple mitotic checkpoints, and chromosome stability; contains 12 degenerate leucine-rich repeat motifs; expression is induced by the Mitotic Exit Network (MEN) +S000033182 CDS YBR158W 2 556549 558198 W 2011-02-03 1997-01-28 +S000000363 ORF Verified YBR159W IFA38 ketoreductase chromosome 2 2 558685 559728 W 2011-02-03 1997-01-28 Microsomal beta-keto-reductase; contains oleate response element (ORE) sequence in the promoter region; mutants exhibit reduced VLCFA synthesis, accumulate high levels of dihydrosphingosine, phytosphingosine and medium-chain ceramides +S000033243 CDS YBR159W 2 558685 559728 W 2011-02-03 1997-01-28 +S000000364 ORF Verified YBR160W CDC28 cyclin-dependent serine/threonine-protein kinase CDC28|SRM5|HSL5|CDK1 chromosome 2 L000000267 2 560078 560974 W 90 2011-02-03 1997-01-28 Cyclin-dependent kinase (CDK) catalytic subunit; master regulator of mitotic and meiotic cell cycles; alternately associates with G1, S, G2/M phase cyclins, which provide substrate specificity; regulates metabolism, basal transcription, chromosome dynamics, growth and morphogenesis; transcript induction in osmostress involves antisense RNA; human homologs CDK1, CDK2, CDK3 can complement yeast conditional cdc28 mutants; human CDK1, CDK2 can complement yeast cdc28 null mutant +S000035243 CDS YBR160W 2 560078 560974 W 2011-02-03 1997-01-28 +S000000365 ORF Verified YBR161W CSH1 mannosylinositol phosphorylceramide synthase catalytic subunit CSH1 chromosome 2 2 561634 562764 W 2011-02-03 1997-01-28 Mannosylinositol phosphorylceramide (MIPC) synthase catalytic subunit; forms a complex with regulatory subunit Csg2p; function in sphingolipid biosynthesis is overlapping with that of Sur1p; CSH1 has a paralog, SUR1, that arose from the whole genome duplication +S000035322 CDS YBR161W 2 561634 562764 W 2011-02-03 1997-01-28 +S000000366 ORF Verified YBR162C TOS1 chromosome 2 2 564570 563203 C 2011-02-03 1997-01-28 Covalently-bound cell wall protein of unknown function; identified as a cell cycle regulated SBF target gene; deletion mutants are highly resistant to treatment with beta-1,3-glucanase; has sequence similarity to YJL171C +S000035351 CDS YBR162C 2 564570 563203 C 2011-02-03 1997-01-28 +S000002158 ORF Verified YBR162W-A YSY6 chromosome 2 L000002554 2 565231 565428 W 2011-02-03 1997-01-28 Protein of unknown function; expression suppresses a secretory pathway mutation in E. coli; has similarity to the mammalian RAMP4 protein involved in secretion +S000032375 CDS YBR162W-A 2 565231 565428 W 2011-02-03 1997-01-28 +S000000367 ORF Verified YBR163W EXO5 DEM1 chromosome 2 2 565723 567480 W 2011-02-03 1997-01-28 Mitochondrial 5'-3' exonuclease and sliding exonuclease; required for mitochondrial genome maintenance; distantly related to the RecB nuclease domain of bacterial RecBCD recombinases; may be regulated by the transcription factor Ace2 +S000035461 CDS YBR163W 2 565723 567480 W 2011-02-03 1997-01-28 +S000000368 ORF Verified YBR164C ARL1 Arf family GTPase ARL1|DLP2 chromosome 2 L000002832 2 568426 567875 C 2011-02-03 1997-01-28 Soluble GTPase with a role in regulation of membrane traffic; regulates potassium influx; role in membrane organization at trans-Golgi network; required for delivery of Atg9p to the phagophore assembly site during autophagy under high temperature stress; required with Ypt6p for starvation-induced autophagy; required for the CVT pathway under non-starvation conditions; G protein of the Ras superfamily, similar to ADP-ribosylation factor +S000036313 CDS YBR164C 2 568426 567875 C 2011-02-03 1997-01-28 +S000000369 ORF Verified YBR165W UBS1 chromosome 2 L000003544 2 568852 569685 W 2011-02-03 1997-01-28 Ubiquitin-conjugating enzyme suppressor that regulates Cdc34p; functions as a general positive regulator of Cdc34p activity; nuclear protein that may represent a link between nucleocytoplasmic transport and ubiquitin ligase activity +S000036458 CDS YBR165W 2 568852 569685 W 2011-02-03 1997-01-28 +S000000370 ORF Verified YBR166C TYR1 prephenate dehydrogenase (NADP(+)) chromosome 2 L000002359|L000002402 2 571200 569842 C 97 2011-02-03 1997-01-28 Prephenate dehydrogenase involved in tyrosine biosynthesis; expression is dependent on phenylalanine levels +S000036504 CDS YBR166C 2 571200 569842 C 2011-02-03 1997-01-28 +S000000371 ORF Verified YBR167C POP7 ribonuclease P/MRP protein subunit POP7|RPP2 chromosome 2 L000004303|L000004505 2 571890 571468 C 2011-02-03 1997-01-28 Subunit of RNase MRP, nuclear RNase P and telomerase; forms a soluble heterodimer with Pop6p that binds P3 domain of RNase MRP and RNase P RNAs; RNase MRP cleaves pre-rRNA, nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs, while telomerase replenishes telomeric DNA +S000036597 CDS YBR167C 2 571890 571468 C 2011-02-03 1997-01-28 +S000000372 ORF Verified YBR168W PEX32 chromosome 2 2 572371 573612 W 2011-02-03 1997-01-28 Peroxisomal integral membrane protein; involved in negative regulation of peroxisome size; partially functionally redundant with Pex31p; genetic interactions suggest action at a step downstream of steps mediated by Pex28p and Pex29p +S000037359 CDS YBR168W 2 572371 573612 W 2011-02-03 1997-01-28 +S000000373 ORF Verified YBR169C SSE2 adenyl-nucleotide exchange factor SSE2 chromosome 2 L000002079 2 575996 573915 C 2011-02-03 1997-01-28 Member of Hsp110 subclass of the heat shock protein 70 (HSP70) family; serves as nucleotide exchange factor to load ATP onto the SSA class of cytosolic Hsp70s; may be involved in protein folding; localized to the cytoplasm; SSE2 has a paralog, SSE1, that arose from the whole genome duplication +S000037401 CDS YBR169C 2 575996 573915 C 2011-02-03 1997-01-28 +S000000374 ORF Verified YBR170C NPL4 HRD4 chromosome 2 L000001271 2 578086 576344 C 2011-02-03 1997-01-28 Substrate-recruiting cofactor of the Cdc48p-Npl4p-Ufd1p segregase; assists Cdc48p in the dislocation of misfolded, polyubiquitinated ERAD substrates that are subsequently delivered to the proteasome for degradation; also involved in the regulated destruction of resident ER membrane proteins, such as HMG-CoA reductase (Hmg1/2p) and cytoplasmic proteins (Fbp1p); role in mobilizing membrane bound transcription factors by regulated ubiquitin/proteasome-dependent processing (RUP) +S000030469 CDS YBR170C 2 578086 576344 C 2011-02-03 1997-01-28 +S000000375 ORF Verified YBR171W SEC66 KAR7|Sec63 complex subunit SEC66|SEC71|HSS1 chromosome 2 L000001856 2 578364 578984 W 2011-02-03 1997-01-28 Non-essential subunit of Sec63 complex; with Sec61 complex, Kar2p/BiP and Lhs1p forms a channel competent for SRP-dependent and post-translational SRP-independent protein targeting and import into the ER; other members are Sec63p, Sec62p, and Sec72p +S000030603 CDS YBR171W 2 578364 578984 W 2011-02-03 1997-01-28 +S000000376 ORF Verified YBR172C SMY2 chromosome 2 L000001941 2 581372 579150 C 2011-02-03 2003-09-22|1997-01-28 GYF domain protein; involved in COPII vesicle formation; interacts with the Sec23p/Sec24p subcomplex; overexpression suppresses the temperature sensitivity of a myo2 mutant; similar to S. pombe Mpd2; SMY2 has a paralog, SYH1, that arose from the whole genome duplication +S000030643 CDS YBR172C 2 581372 579150 C 2011-02-03 2003-09-22|1997-01-28 +S000000377 ORF Verified YBR173C UMP1 RNS2 chromosome 2 L000004429 2 582172 581726 C 2011-02-03 1997-01-28 Chaperone required for correct maturation of the 20S proteasome; short-lived chaperone; may inhibit premature dimerization of proteasome half-mers; degraded by proteasome upon completion of its assembly +S000030726 CDS YBR173C 2 582172 581726 C 2011-02-03 1997-01-28 +S000000379 ORF Verified YBR175W SWD3 SAF35|CPS30 chromosome 2 2 582408 583355 W 2011-02-03 1997-01-28 Essential subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3 on lysine 4 and is required in transcriptional silencing near telomeres; WD40 beta propeller superfamily member and ortholog of mammalian WDR5 +S000031715 CDS YBR175W 2 582408 583355 W 2011-02-03 1997-01-28 +S000000378 ORF Dubious YBR174C chromosome 2 2 582652 582338 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YBR175W; null mutant is viable and sporulation defective +S000031563 CDS YBR174C 2 582652 582338 C 2011-02-03 1997-01-28 +S000000380 ORF Verified YBR176W ECM31 3-methyl-2-oxobutanoate hydroxymethyltransferase chromosome 2 L000003901 2 583720 584658 W 2011-02-03 1997-01-28 Ketopantoate hydroxymethyltransferase; required for pantothenic acid biosynthesis, converts 2-oxoisovalerate into 2-dehydropantoate +S000031869 CDS YBR176W 2 583720 584658 W 2011-02-03 1997-01-28 +S000000382 ORF Dubious YBR178W chromosome 2 2 586071 586445 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YBR177C +S000032865 CDS YBR178W 2 586071 586445 W 2011-02-03 1997-01-28 +S000000381 ORF Verified YBR177C EHT1 medium-chain fatty acid ethyl ester synthase/esterase chromosome 2 2 586162 584807 C 2011-02-03 1997-01-28 Acyl-coenzymeA:ethanol O-acyltransferase; plays a minor role in medium-chain fatty acid ethyl ester biosynthesis; possesses short-chain esterase activity; localizes to lipid particles and the mitochondrial outer membrane; EHT1 has a paralog, EEB1, that arose from the whole genome duplication +S000031916 CDS YBR177C 2 586162 584807 C 2011-02-03 1997-01-28 +S000000383 ORF Verified YBR179C FZO1 mitofusin chromosome 2 L000004083 2 589114 586547 C 2011-02-03 1997-01-28 Mitofusin; integral membrane protein involved in mitochondrial outer membrane tethering and fusion; role in mitochondrial genome maintenance; efficient tethering and degradation of Fzo1p requires an intact N-terminal GTPase domain; targeted for destruction by the ubiquitin ligase SCF-Mdm30p and the cytosolic ubiquitin-proteasome system +S000032906 CDS YBR179C 2 589114 586547 C 2011-02-03 1997-01-28 +S000000384 ORF Verified YBR180W DTR1 chromosome 2 2 589741 591459 W 2011-02-03 1997-01-28 Putative dityrosine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; required for spore wall synthesis; sequence similarity to QDR1 and QDR3, and the triple mutant dtr1 qdr1 qdr3 exhibits reduced dityrosine fluorescence relative to the single mutants; expressed during sporulation +S000035007 CDS YBR180W 2 589741 591459 W 2011-02-03 1997-01-28 +S000000385 ORF Verified YBR181C RPS6B eS6|ribosomal 40S subunit protein S6B|S6e|RPS102|RPS101|LPG18 chromosome 2 L000002721 2 592774 591712 C 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S6, no bacterial homolog; phosphorylated on S233 by Ypk3p in a TORC1-dependent manner, and on S232 in a TORC1/2-dependent manner by Ypk1/2/3p; RPS6B has a paralog, RPS6A, that arose from the whole genome duplication +S000035075 CDS YBR181C 2 592416 591712 C 2011-02-03 1997-01-28 +S000035074 CDS YBR181C 2 592774 592769 C 2011-02-03 1997-01-28 +S000035076 intron YBR181C 2 592768 592417 C 2011-02-03 1997-01-28 +S000000386 ORF Verified YBR182C SMP1 chromosome 2 L000004146 2 594864 593506 C 2011-02-03 1997-01-28 MADS-box transcription factor involved in osmotic stress response; SMP1 has a paralog, RLM1, that arose from the whole genome duplication +S000035193 CDS YBR182C 2 594864 593506 C 2011-02-03 1997-01-28 +S000028603 ORF Uncharacterized YBR182C-A chromosome 2 2 595555 595361 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031408 CDS YBR182C-A 2 595555 595361 C 2011-02-03 2003-07-29 +S000000387 ORF Verified YBR183W YPC1 phytoceramidase chromosome 2 2 596115 597065 W 2011-02-03 1997-01-28 Alkaline ceramidase; also has reverse (CoA-independent) ceramide synthase activity; catalyzes both breakdown and synthesis of phytoceramide; overexpression confers fumonisin B1 resistance; YPC1 has a paralog, YDC1, that arose from the whole genome duplication +S000036119 CDS YBR183W 2 596115 597065 W 2011-02-03 1997-01-28 +S000000388 ORF Uncharacterized YBR184W chromosome 2 2 597363 598934 W 2011-02-03 1997-01-28 Putative protein of unknown function; YBR184W is not an essential gene +S000036220 CDS YBR184W 2 597363 598934 W 2011-02-03 1997-01-28 +S000000389 ORF Verified YBR185C MBA1 chromosome 2 L000002809 2 599959 599123 C 2011-02-03 1997-01-28 Membrane-associated mitochondrial ribosome receptor; forms a complex with Mdm38p that may facilitate recruitment of mRNA-specific translational activators to ribosomes; possible role in protein export from the matrix to inner membrane +S000036261 CDS YBR185C 2 599959 599123 C 2011-02-03 1997-01-28 +S000000390 ORF Verified YBR186W PCH2 chromosome 2 L000004274 2 600553 602360 W 2011-02-03 2000-07-14|1997-01-28 Hexameric ring ATPase that remodels chromosome axis protein Hop1p; nucleolar component of the pachytene checkpoint, which prevents chromosome segregation when recombination and chromosome synapsis are defective; also represses meiotic interhomolog recombination in rDNA; required for meiotic double-stranded break formation +S000036993 CDS YBR186W 2 600553 602103 W 2011-02-03 2000-07-14|1997-01-28 +S000036994 CDS YBR186W 2 602217 602360 W 2011-02-03 2000-07-14 +S000036995 intron YBR186W 2 602104 602216 W 2011-02-03 2000-07-14 +S000000391 ORF Verified YBR187W GDT1 putative ribosome biosynthesis protein GDT1 chromosome 2 2 602634 603476 W 2011-02-03 1997-01-28 Calcium transporter localized to the cis- and medial-Golgi apparatus; required for protein glycosylation; GFP-fusion protein localizes to the vacuole; TMEM165, a human gene which causes Congenital Disorders of Glycosylation is orthologous and functionally complements the null allele; expression pattern and physical interactions suggest a possible role in ribosome biogenesis; expression reduced in a gcr1 null mutant +S000037050 CDS YBR187W 2 602634 603476 W 2011-02-03 1997-01-28 +S000000392 ORF Verified YBR188C NTC20 chromosome 2 L000004267 2 604107 603685 C 2011-02-03 1997-01-28 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs +S000037089 CDS YBR188C 2 604107 603685 C 2011-02-03 1997-01-28 +S000000393 ORF Verified YBR189W RPS9B ribosomal 40S subunit protein S9B|rp21|YS11|S9B|S4|S13|SUP46|RPS13A chromosome 2 L000002207|S000029306|L000001135 2 604508 605508 W 106 2011-02-03 1997-01-28 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S9 and bacterial S4; RPS9B has a paralog, RPS9A, that arose from the whole genome duplication +S000037264 CDS YBR189W 2 604508 604514 W 2011-02-03 1997-01-28 +S000037265 CDS YBR189W 2 604928 605508 W 2011-02-03 1997-01-28 +S000037266 intron YBR189W 2 604515 604927 W 2011-02-03 1997-01-28 +S000000394 ORF Dubious YBR190W chromosome 2 2 605966 606277 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ribosomal protein gene RPL21A/YBR191W +S000029997 CDS YBR190W 2 605966 606277 W 2011-02-03 1997-01-28 +S000000395 ORF Verified YBR191W RPL21A eL21|ribosomal 60S subunit protein L21A|L21e|L21A|URP1 chromosome 2 L000002441 2 606270 607140 W 2011-02-03 1997-01-28 Ribosomal 60S subunit protein L21A; homologous to mammalian ribosomal protein L21, no bacterial homolog; RPL21A has a paralog, RPL21B, that arose from the whole genome duplication +S000030992 CDS YBR191W 2 606270 606280 W 2011-02-03 1997-01-28 +S000030993 CDS YBR191W 2 606669 607140 W 2011-02-03 1997-01-28 +S000030994 intron YBR191W 2 606281 606668 W 2011-02-03 1997-01-28 +S000007594 ORF Dubious YBR191W-A chromosome 2 2 607149 607223 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037106 CDS YBR191W-A 2 607149 607223 W 2011-02-03 2001-02-26 +S000000396 ORF Verified YBR192W RIM2 PYT1 chromosome 2 L000001641 2 607652 608785 W 2011-02-03 1997-01-28 Mitochondrial pyrimidine nucleotide transporter; imports pyrimidine nucleoside triphosphates and exports pyrimidine nucleoside monophosphates; member of the mitochondrial carrier family +S000031077 CDS YBR192W 2 607652 608785 W 2011-02-03 1997-01-28 +S000000397 ORF Verified YBR193C MED8 chromosome 2 L000003917 2 609753 609082 C 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation +S000031128 CDS YBR193C 2 609753 609082 C 2011-02-03 1997-01-28 +S000000398 ORF Verified YBR194W AIM4 SOY1 chromosome 2 2 610038 610409 W 2011-02-03 1997-01-28 Protein proposed to be associated with the nuclear pore complex; null mutant is viable, displays elevated frequency of mitochondrial genome loss and is sensitive to freeze-thaw stress +S000032148 CDS YBR194W 2 610038 610409 W 2011-02-03 1997-01-28 +S000000399 ORF Verified YBR195C MSI1 CAC3 chromosome 2 L000001193 2 611882 610614 C 89 2011-02-03 1997-01-28 Subunit of chromatin assembly factor I (CAF-1); chromatin assembly by CAF-1 affects multiple processes including silencing at telomeres, mating type loci, and rDNA; maintenance of kinetochore structure; deactivation of DNA damage checkpoint after DNA repair; chromatin dynamics during transcription; and repression of divergent noncoding transcription; Msi1p localizes to nucleus and cytoplasm and independently regulates the RAS/cAMP pathway via sequestration of Npr1p kinase +S000032175 CDS YBR195C 2 611882 610614 C 2011-02-03 1997-01-28 +S000000400 ORF Verified YBR196C PGI1 glucose-6-phosphate isomerase|CDC30 chromosome 2 L000001410|L000001409 2 613900 612236 C 89 2011-02-03 1997-01-28 Glycolytic enzyme phosphoglucose isomerase; catalyzes the interconversion of glucose-6-phosphate and fructose-6-phosphate; required for cell cycle progression and completion of the gluconeogenic events of sporulation +S000032251 CDS YBR196C 2 613900 612236 C 2011-02-03 1997-01-28 +S000028534 ORF Uncharacterized YBR196C-A chromosome 2 2 614173 614024 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031143 CDS YBR196C-A 2 614173 614024 C 2011-02-03 2003-07-29 +S000028816 ORF Uncharacterized YBR196C-B chromosome 2 2 614630 614526 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000033621 CDS YBR196C-B 2 614630 614526 C 2011-02-03 2003-07-29 +S000000401 ORF Verified YBR197C chromosome 2 2 615856 615203 C 2011-02-03 1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YBR197C is not an essential gene; relative distribution to the nucleus increases upon DNA replication stress; YBR197C has a paralog, YPL077C, that arose from the whole genome duplication +S000032354 CDS YBR197C 2 615856 615203 C 2011-02-03 1997-01-28 +S000000402 ORF Verified YBR198C TAF5 chromatin modification protein|TafII90|TAF90 chromosome 2 L000004155 2 618523 616127 C 2011-02-03 1997-01-28 Subunit (90 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification +S000033223 CDS YBR198C 2 618523 616127 C 2011-02-03 1997-01-28 +S000000403 ORF Verified YBR199W KTR4 putative mannosyltransferase chromosome 2 L000000927 2 618909 620303 W 2011-02-03 1997-01-28 Glycosyltransferase involved in protein glycosylation; transfers GDP-mannose to methyl-alpha-mannoside in vitro; member of the KRE2/MNT1 mannosyltransferase family of type II membrane proteins with a short cytoplasmic N-terminus, a membrane-spanning region and a highly conserved catalytic lumenal domain +S000033316 CDS YBR199W 2 618909 620303 W 2011-02-03 1997-01-28 +S000000404 ORF Verified YBR200W BEM1 phosphatidylinositol-3-phosphate-binding protein BEM1|SRO1 chromosome 2 L000000167 2 620872 622527 W 102 2011-02-03 1997-01-28 Protein containing SH3-domains; involved in establishing cell polarity and morphogenesis; functions as a scaffold protein for complexes that include Cdc24p, Ste5p, Ste20p, and Rsr1p +S000030486 CDS YBR200W 2 620872 622527 W 2011-02-03 1997-01-28 +S000118351 ARS ARS220 ARSII-623 chromosome 2 2 622671 622939 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000028535 ORF Uncharacterized YBR200W-A chromosome 2 2 622983 623147 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031144 CDS YBR200W-A 2 622983 623147 W 2011-02-03 2003-07-29 +S000000405 ORF Verified YBR201W DER1 derlin chromosome 2 L000002800 2 623576 624211 W 2011-02-03 1999-04-26|1997-01-28 ER membrane protein that promotes export of misfolded polypeptides; required for ER-associated protein degradation of misfolded or unassembled proteins; initiates export of aberrant polypeptides from ER lumen by threading them into ER membrane and routing them to Hrd1p for ubiquitination; function normally requires N-terminal acetylation by NatB; N- and C- termini protrude into cytoplasm; similar to Dfm1p; homolog of mammalian derlin-1 +S000030597 CDS YBR201W 2 623576 624211 W 2011-02-03 1999-04-26|1997-01-28 +S000087085 ORF Uncharacterized YBR201C-A chromosome 2 2 624696 624493 C 2011-02-03 2005-11-08 Putative protein of unknown function +S000087086 CDS YBR201C-A 2 624696 624493 C 2011-02-03 2005-11-08 +S000000406 ORF Verified YBR202W MCM7 mini-chromosome maintenance complex protein 7|CDC47 chromosome 2 L000002760 2 625772 628309 W 2011-02-03 1997-01-28|2011-02-03 Component of the Mcm2-7 hexameric helicase complex; MCM2-7 primes origins of DNA replication in G1 and becomes an active ATP-dependent helicase that promotes DNA melting and elongation in S-phase; forms an Mcm4p-6p-7p subcomplex +S000030677 CDS YBR202W 2 625772 628309 W 2011-02-03 1997-01-28|2011-02-03 +S000000407 ORF Verified YBR203W COS111 chromosome 2 2 629168 631942 W 2011-02-03 1997-01-28|2011-02-03 Protein required for antifungal drug ciclopirox olamine resistance; not related to the subtelomerically-encoded COS family; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000031550 CDS YBR203W 2 629168 631942 W 2011-02-03 1997-01-28|2011-02-03 +S000130153 ARS ARS221 ARSII-632 chromosome 2 2 631939 632251 2011-02-03 2009-05-07|2011-02-03 Autonomously Replicating Sequence +S000178052 ARS_consensus_sequence ARS221 2 632005 632021 W 2014-11-18 2014-11-18 +S000000408 ORF Verified YBR204C LDH1 triacylglycerol lipase chromosome 2 2 633381 632254 C 2011-02-03 1997-01-28|2011-02-03 Serine hydrolase; exhibits active esterase plus weak triacylglycerol lipase activities; proposed role in lipid homeostasis, regulating phospholipid and non-polar lipid levels and required for mobilization of LD-stored lipids; localizes to the lipid droplet (LD) surface; contains a classical serine containing catalytic triad (GxSxG motif) +S000031575 CDS YBR204C 2 633381 632254 C 2011-02-03 1997-01-28|2011-02-03 +S000000409 ORF Verified YBR205W KTR3 mannosyltransferase KTR3 chromosome 2 L000000926 2 633622 634836 W 2011-02-03 1997-01-28 Putative alpha-1,2-mannosyltransferase; involved in O- and N-linked protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; Svp26p mediates uptake of Ktr3p into COPII vesicles; relocalizes from nucleus to vacuole upon DNA replication stress +S000031710 CDS YBR205W 2 633622 634836 W 2011-02-03 1997-01-28 +S000000410 ORF Dubious YBR206W chromosome 2 2 634601 634924 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene KTR3 +S000031861 CDS YBR206W 2 634601 634924 W 2011-02-03 1997-01-28 +S000000411 ORF Verified YBR207W FTH1 chromosome 2 L000003065 2 635146 636543 W 2011-02-03 1997-01-28|2011-02-03 Putative high affinity iron transporter; involved in transport of intravacuolar stores of iron; forms complex with Fet5p; expression is regulated by iron; proposed to play indirect role in endocytosis; protein abundance increases in response to DNA replication stress +S000032783 CDS YBR207W 2 635146 636543 W 2011-02-03 1997-01-28|2011-02-03 +S000000412 ORF Verified YBR208C DUR1,2 bifunctional urea carboxylase/allophanate hydrolase|DUR80 chromosome 2 L000000532|L000000533|L000000536 2 642210 636703 C 112 2011-02-03 1997-01-28 Urea amidolyase; contains both urea carboxylase and allophanate hydrolase activities, degrades urea to CO2 and NH3; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation; protein abundance increases in response to DNA replication stress +S000032849 CDS YBR208C 2 642210 636703 C 2011-02-03 1997-01-28 +S000000413 ORF Dubious YBR209W chromosome 2 2 642583 642900 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YBR209W is not an essential gene +S000032978 CDS YBR209W 2 642583 642900 W 2011-02-03 1997-01-28 +S000006526 tRNA_gene tC(GCA)B chromosome 2 L000003748 2 643078 643007 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis +S000035208 noncoding_exon tC(GCA)B 2 643078 643007 C 2011-02-03 2000-05-19 +S000006820 long_terminal_repeat YBRCtau2 YBRWtau2 chromosome 2 2 643858 643488 C 2011-02-03 2000-05-19|2007-04-05 Ty4 LTR +S000006812 long_terminal_repeat YBRWdelta18 YBRCdelta18 chromosome 2 2 643859 644002 W 2011-02-03 2000-05-19 Ty1 LTR +S000006813 long_terminal_repeat YBRCdelta19 chromosome 2 2 644603 644362 C 2011-02-03 2000-05-19|2007-04-05 Ty1 LTR +S000006548 tRNA_gene tE(UUC)B chromosome 2 L000003747 2 645167 645238 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000035972 noncoding_exon tE(UUC)B 2 645167 645238 W 2011-02-03 2000-05-19 +S000000414 ORF Verified YBR210W ERV15 chromosome 2 2 645550 645978 W 2011-02-03 1997-01-28 Protein involved in export of proteins from the endoplasmic reticulum; ERV15 has a paralog, ERV14, that arose from the whole genome duplication +S000033653 CDS YBR210W 2 645550 645978 W 2011-02-03 1997-01-28 +S000000415 ORF Verified YBR211C AME1 ARP100 chromosome 2 L000004725 2 647132 646158 C 2011-02-03 1997-01-28 Essential kinetochore protein associated with microtubules and SPBs; component of the kinetochore sub-complex COMA (Ctf19p, Okp1p, Mcm21p, Ame1p); involved in spindle checkpoint maintenance; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-U and fission yeast Mis17; relative distribution to the nucleus increases upon DNA replication stress +S000033678 CDS YBR211C 2 647132 646158 C 2011-02-03 1997-01-28 +S000000416 ORF Verified YBR212W NGR1 RBP1 chromosome 2 L000001242 2 647886 649904 W 2011-02-03 1997-01-28 RNA binding protein that negatively regulates growth rate; interacts with the 3' UTR of the mitochondrial porin (POR1) mRNA and enhances its degradation; overexpression impairs mitochondrial function; interacts with Dhh1p to mediate POR1 mRNA decay; expressed in stationary phase +S000034651 CDS YBR212W 2 647886 649904 W 2011-02-03 1997-01-28 +S000000417 ORF Verified YBR213W MET8 bifunctional precorrin-2 dehydrogenase/sirohydrochlorin ferrochelatase MET8 chromosome 2 L000001083 2 650368 651192 W 119 2011-02-03 1997-01-28 Bifunctional dehydrogenase and ferrochelatase; involved in the biosynthesis of siroheme, a prosthetic group used by sulfite reductase; required for sulfate assimilation and methionine biosynthesis +S000034801 CDS YBR213W 2 650368 651192 W 2011-02-03 1997-01-28 +S000000418 ORF Verified YBR214W SDS24 chromosome 2 L000004811 2 651415 652998 W 2011-02-03 1997-01-28 Protein involved in cell separation during budding; one of two S. cerevisiae homologs (Sds23p and Sds24p) of the S. pombe Sds23 protein, which is implicated in APC/cyclosome regulation; may play an indirect role in fluid-phase endocytosis; protein abundance increases in response to DNA replication stress; SDS24 has a paralog, SDS23, that arose from the whole genome duplication +S000034936 CDS YBR214W 2 651415 652998 W 2011-02-03 1997-01-28 +S000000419 ORF Verified YBR215W HPC2 chromosome 2 L000000804 2 653356 655317 W 2011-02-03 1997-01-28|2007-07-09 Subunit of the HIR complex; HIR is a nucleosome assembly complex involved in regulation of histone gene transcription; mutants display synthetic defects with subunits of FACT, a complex that allows passage of RNA Pol II through nucleosomes +S000035856 CDS YBR215W 2 653356 653368 W 2011-02-03 1997-01-28|2007-07-09 +S000123275 CDS YBR215W 2 653453 655317 W 2011-02-03 2007-07-09 +S000123274 intron YBR215W 2 653369 653452 W 2011-02-03 2007-07-09 +S000000420 ORF Verified YBR216C YBP1 chromosome 2 2 657600 655576 C 2011-02-03 1997-01-28 Protein involved in cellular response to oxidative stress; required for oxidation of specific cysteine residues of transcription factor Yap1p, resulting in nuclear localization of Yap1p in response to stress; YBP1 has a paralog, YBP2, that arose from the whole genome duplication +S000035897 CDS YBR216C 2 657600 655576 C 2011-02-03 1997-01-28 +S000000421 ORF Verified YBR217W ATG12 APG12 chromosome 2 L000004702 2 657832 658392 W 2011-02-03 1997-01-28 Ubiquitin-like modifier involved in autophagy and the Cvt pathway; conserved; conjugated to Atg5p to form a complex involved in Atg8p lipidation; Atg5p-Atg12p conjugate enhances E2 activity of Atg3p by rearranging its catalytic site, also forms a complex with Atg16p; the Atg5-Atg12/Atg16 complex binds to membranes and is essential for autophagosome formation +S000036158 CDS YBR217W 2 657832 658392 W 2011-02-03 1997-01-28 +S000000422 ORF Verified YBR218C PYC2 pyruvate carboxylase 2 chromosome 2 L000001543 2 662249 658707 C 2011-02-03 1997-01-28 Pyruvate carboxylase isoform; cytoplasmic enzyme that converts pyruvate to oxaloacetate; differentially regulated than isoform Pyc1p; mutations in the human homolog are associated with lactic acidosis; PYC2 has a paralog, PYC1, that arose from the whole genome duplication +S000036216 CDS YBR218C 2 662249 658707 C 2011-02-03 1997-01-28 +S000000423 ORF Uncharacterized YBR219C chromosome 2 2 663303 662499 C 2011-02-03 1997-01-28 Putative protein of unknown function; YBR219C is not an essential gene +S000036941 CDS YBR219C 2 662581 662499 C 2011-02-03 1997-01-28 +S000036940 CDS YBR219C 2 663303 663003 C 2011-02-03 1997-01-28 +S000036942 intron YBR219C 2 663002 662582 C 2011-02-03 1997-01-28 +S000000424 ORF Uncharacterized YBR220C chromosome 2 2 664677 662995 C 2011-02-03 1997-01-28 Putative protein of unknown function; YBR220C is not an essential gene +S000037728 CDS YBR220C 2 664677 662995 C 2011-02-03 1997-01-28 +S000000425 ORF Verified YBR221C PDB1 pyruvate dehydrogenase (acetyl-transferring) subunit E1 beta chromosome 2 L000001353 2 666253 665153 C 2011-02-03 1997-01-28 E1 beta subunit of the pyruvate dehydrogenase (PDH) complex; PDH is an evolutionarily conserved multi-protein complex found in mitochondria +S000037817 CDS YBR221C 2 666253 665153 C 2011-02-03 1997-01-28 +S000028817 ORF Uncharacterized YBR221W-A chromosome 2 2 666538 666642 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000033623 CDS YBR221W-A 2 666538 666642 W 2011-02-03 2003-07-29 +S000000426 ORF Verified YBR222C PCS60 FAT2 chromosome 2 L000003238 2 668351 666720 C 2011-02-03 1997-01-28 Oxalyl-CoA synthetase; capable of catalyzing conversion of oxalate to oxalyl-CoA; catalyzes first step in pathway of oxalate degradation that functions to protect yeast from inhibitory effects of oxalate; peroxisomal protein that binds mRNA; localizes to both peroxisomal peripheral membrane and matrix, expression is highly inducible by oleic acid; similar to E. coli long chain acyl-CoA synthetase +S000029826 CDS YBR222C 2 668351 666720 C 2011-02-03 1997-01-28 +S000028604 ORF Dubious YBR223W-A chromosome 2 2 668721 668840 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps YBR223C; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031411 CDS YBR223W-A 2 668721 668840 W 2011-02-03 2003-07-29 +S000000428 ORF Dubious YBR224W chromosome 2 2 670125 670640 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene TDP1 +S000030960 CDS YBR224W 2 670125 670640 W 2011-02-03 1997-01-28 +S000000427 ORF Verified YBR223C TDP1 tyrosyl-DNA phosphodiesterase 1 chromosome 2 S000007461 2 670297 668663 C 2011-02-03 1997-01-28 Tyrosyl-DNA phosphodiesterase I; hydrolyzes 3' and 5'-phosphotyrosyl bonds; involved in the repair of DNA lesions created by topo I and topo II; mutations in the human homolog, TDP1, result in the a neurodegenerative disease, spinocerebellar ataxia with axonal neuropathy (SCAN1); yeast cells and human rhabdomyosarcoma lines that overexpress TDP1 both exhibit elevated dosage chromosomal instability (dCIN) +S000030837 CDS YBR223C 2 670297 668663 C 2011-02-03 1997-01-28 +S000000429 ORF Uncharacterized YBR225W chromosome 2 2 670627 673329 W 2011-02-03 1997-01-28 Putative protein of unknown function; non-essential gene identified in a screen for mutants affected in mannosylphophorylation of cell wall components +S000031063 CDS YBR225W 2 670627 673329 W 2011-02-03 1997-01-28 +S000000430 ORF Dubious YBR226C chromosome 2 2 673565 673155 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YBR225W +S000031074 CDS YBR226C 2 673565 673155 C 2011-02-03 1997-01-28 +S000000431 ORF Verified YBR227C MCX1 chromosome 2 2 675134 673572 C 2011-02-03 1997-01-28 Non-proteolytic ATPase of the AAA family; stimulates incorporation of the pyridoxal phosphate cofactor into Hem1p (5-aminolevulinic acid synthase); localized to the mitochondrial matrix; ortholog of vertebrate CLPX, which promotes erythropoiesis +S000032046 CDS YBR227C 2 675134 673572 C 2011-02-03 1997-01-28 +S000000432 ORF Verified YBR228W SLX1 endonuclease chromosome 2 2 675313 676227 W 2011-02-03 1997-01-28 Endonuclease involved in DNA recombination and repair; subunit of a complex, with Slx4p, that hydrolyzes 5' branches from duplex DNA in response to stalled or converging replication forks; function overlaps with that of Sgs1p-Top3p +S000032169 CDS YBR228W 2 675313 676227 W 2011-02-03 1997-01-28 +S000000433 ORF Verified YBR229C ROT2 glucan 1,3-alpha-glucosidase ROT2|GLS2 chromosome 2 L000003405 2 679221 676357 C 2011-02-03 1997-01-28 Glucosidase II catalytic subunit; required to trim the final glucose in N-linked glycans; required for normal cell wall synthesis; mutations in rot2 suppress tor2 mutations, and are synthetically lethal with rot1 mutations +S000032215 CDS YBR229C 2 679221 676357 C 2011-02-03 1997-01-28 +S000000434 ORF Verified YBR230C OM14 chromosome 2 2 680050 679549 C 2011-02-03 1997-01-28 Mitochondrial outer membrane receptor for cytosolic ribosomes; integral protein of the outer membrane that interacts with the nascent chain-associated complex (NAC) bound to ribosomes, contributing to co-translational mitochondrial import; interacts with porin (Por1p) and Om45p; abundance is decreased in cells grown in glucose relative to other carbon sources +S000034001 CDS YBR230C 2 679942 679549 C 2011-02-03 1997-01-28 +S000034000 CDS YBR230C 2 680050 680040 C 2011-02-03 1997-01-28 +S000034002 intron YBR230C 2 680039 679943 C 2011-02-03 1997-01-28 +S000029722 ORF Uncharacterized YBR230W-A chromosome 2 2 680362 680562 W 2011-02-03 2004-04-01 Putative protein of unknown function; YBR230W-A has a paralog, COQ8, that arose from the whole genome duplication +S000036857 CDS YBR230W-A 2 680362 680562 W 2011-02-03 2004-04-01 +S000006478 snRNA_gene LSR1 LSR1 U2|snR20 chromosome 2 L000000954 2 681862 680688 C 2011-02-03 2000-05-19|2006-10-04 U2 spliceosomal RNA (U2 snRNA), component of the spliceosome; pairs with the branchpoint sequence; functionally equivalent to mammalian U2 snRNA; stress-induced pseudouridylations at positions 56 and 93 may contribute to regulation of splicing +S000030971 noncoding_exon LSR1 2 681862 680688 C 2011-02-03 2000-05-19|2006-10-04 +S000000435 ORF Verified YBR231C SWC5 AOR1 chromosome 2 L000004001 2 683090 682179 C 2011-02-03 1997-01-28 Component of the SWR1 complex; complex exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia +S000034102 CDS YBR231C 2 683090 682179 C 2011-02-03 1997-01-28 +S000000437 ORF Verified YBR233W PBP2 HEK1 chromosome 2 L000004512 2 683428 684669 W 2011-02-03 1997-01-28 RNA binding protein; has similarity to mammalian heterogeneous nuclear RNP K protein, involved in the regulation of telomere position effect and telomere length; relative distribution to the nucleus increases upon DNA replication stress +S000035244 CDS YBR233W 2 683428 684669 W 2011-02-03 1997-01-28 +S000000436 ORF Dubious YBR232C chromosome 2 2 683732 683373 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034194 CDS YBR232C 2 683732 683373 C 2011-02-03 1997-01-28 +S000007595 ORF Verified YBR233W-A DAD3 chromosome 2 2 684977 685261 W 2011-02-03 2001-02-26 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis +S000037141 CDS YBR233W-A 2 684977 685261 W 2011-02-03 2001-02-26 +S000000438 ORF Verified YBR234C ARC40 chromosome 2 L000004788 2 686592 685438 C 2011-02-03 1997-01-28 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches +S000035293 CDS YBR234C 2 686592 685438 C 2011-02-03 1997-01-28 +S000000439 ORF Verified YBR235W VHC1 chromosome 2 2 686901 690263 W 2011-02-03 1997-01-28 Vacuolar membrane cation-chloride cotransporter (CCC); likely mediates K+ and Cl- cotransport into the vacuole; has a role in potassium homeostasis and salt tolerance; localizes to sites of contact between the vacuole and mitochondria (vCLAMPs); similar to mammalian electroneutral Na(+)-(K+)-C1- cotransporter family +S000035401 CDS YBR235W 2 686901 690263 W 2011-02-03 1997-01-28 +S000000440 ORF Verified YBR236C ABD1 mRNA (guanine-N7)-methyltransferase chromosome 2 L000000011 2 691693 690383 C 2011-02-03 1997-01-28 Methyltransferase; catalyzes the transfer of a methyl group from S-adenosylmethionine to the GpppN terminus of capped mRNA; nuclear protein that relocalizes to the cytosol in response to hypoxia +S000035435 CDS YBR236C 2 691693 690383 C 2011-02-03 1997-01-28 +S000000441 ORF Verified YBR237W PRP5 DEAD-box RNA helicase PRP5|RNA5 chromosome 2 L000001498 2 691969 694518 W 138 2011-02-03 1997-01-28 RNA helicase in the DEAD-box family; necessary for prespliceosome formation, bridges U1 and U2 snRNPs and enables stable U2 snRNP association with intron RNA +S000036392 CDS YBR237W 2 691969 694518 W 2011-02-03 1997-01-28 +S000000442 ORF Verified YBR238C chromosome 2 2 697302 695107 C 2011-02-03 1997-01-28 Mitochondrial membrane protein; not required for respiratory growth but causes a synthetic respiratory defect in combination with rmd9 mutations; transcriptionally up-regulated by TOR; deletion increases life span; YBR238C has a paralog, RMD9, that arose from the whole genome duplication +S000036425 CDS YBR238C 2 697302 695107 C 2011-02-03 1997-01-28 +S000000443 ORF Verified YBR239C ERT1 chromosome 2 2 699943 698354 C 2011-02-03 1997-01-28 Transcriptional regulator; involved in regulation of gluconeogenesis and fermentable carbon utilization; GFP-fusion protein localizes to cytoplasm, nucleus; null mutation affects periodicity of transcriptional and metabolic oscillation; plays role in restricting Ty1 transposition; member of the zinc cluster family of proteins, similar to Rds2p +S000036512 CDS YBR239C 2 699943 698354 C 2011-02-03 1997-01-28 +S000000444 ORF Verified YBR240C THI2 phoF|PHO6 chromosome 2 L000003526 2 701842 700490 C 2011-02-03 1997-01-28 Transcriptional activator of thiamine biosynthetic genes; interacts with regulatory factor Thi3p to control expression of thiamine biosynthetic genes with respect to thiamine availability; acts together with Pdc2p to respond to thiaminediphosphate demand, possibly as related to carbon source availability; zinc finger protein of the Zn(II)2Cys6 type +S000037494 CDS YBR240C 2 701842 700490 C 2011-02-03 1997-01-28 +S000000445 ORF Uncharacterized YBR241C chromosome 2 2 704055 702589 C 2011-02-03 1997-01-28 Putative transporter, member of the sugar porter family; green fluorescent protein (GFP)-fusion protein localizes to the vacuolar membrane; YBR241C is not an essential gene; YBR241C has a paralog, VPS73, that arose from the whole genome duplication +S000037584 CDS YBR241C 2 704055 702589 C 2011-02-03 1997-01-28 +S000118352 ARS ARS222 ARSII-704 chromosome 2 2 704296 704566 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000000446 ORF Uncharacterized YBR242W chromosome 2 L000004757 2 704670 705386 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YBR242W is not an essential gene; YBR242W has a paralog, YGL101W, that arose from the whole genome duplication +S000030457 CDS YBR242W 2 704670 705386 W 2011-02-03 1997-01-28 +S000000447 ORF Verified YBR243C ALG7 UDP-N-acetylglucosamine--dolichyl-phosphate N-acetylglucosaminephosphotransferase|TUR1 chromosome 2 L000000078 2 706793 705447 C 2011-02-03 1997-01-28 UDP-N-acetyl-glucosamine-1-P transferase; transfers Glc-Nac-P from UDP-GlcNac to Dol-P in the ER in the first step of the dolichol pathway of protein asparagine-linked glycosylation; inhibited by tunicamycin; human homolog DPAGT1 can complement yeast ALG7 mutant +S000030493 CDS YBR243C 2 706793 705447 C 2011-02-03 1997-01-28 +S000000448 ORF Verified YBR244W GPX2 glutathione peroxidase GPX2|AMI1 chromosome 2 2 707528 708016 W 2011-02-03 1997-01-28 Phospholipid hydroperoxide glutathione peroxidase; protects cells from phospholipid hydroperoxides and nonphospholipid peroxides during oxidative stress; induced by glucose starvation; protein abundance increases in response to DNA replication stress +S000030605 CDS YBR244W 2 707528 708016 W 2011-02-03 1997-01-28 +S000000449 ORF Verified YBR245C ISW1 chromatin-remodeling ATPase ISW1|SGN2 chromosome 2 L000004447 2 711539 708150 C 2011-02-03 1997-01-28 ATPase subunit of imitation-switch (ISWI) class chromatin remodelers; with Ioc3p forms Isw1a complex involved in repression of transcription initiation; with Ioc2p and Ioc4p forms Isw1b complex involved in regulation of transcription elongation; Isw1b recruited to ORFs by H3K36 methylation and acts with Chd1p to prevent trans-histone exchange over coding regions; Isw1p import into nucleus depends on C-terminal bipartite nuclear targeting signal KRIR X19 KKAK +S000030646 CDS YBR245C 2 711539 708150 C 2011-02-03 1997-01-28 +S000000450 ORF Verified YBR246W RRT2 DPH7|diphthamide synthase|ERE1 chromosome 2 2 711591 712754 W 2011-02-03 1997-01-28 Methylesterase performing penultimate step of diphthamide biosynthesis; hydrolyzes methylated diphthine to produce diphthine and allows Dph6-catalyzed amidation reaction to occur; deletion leads to resistance to sordarin and accumulation of methylatediphthine; WD40 domain-containing protein; involved in endosomal recycling; forms complex with Rtt10p that functions in retromer-mediated pathway for recycling internalized cell-surface proteins +S000030760 CDS YBR246W 2 711591 712754 W 2011-02-03 1997-01-28 +S000000451 ORF Verified YBR247C ENP1 snoRNA-binding rRNA-processing protein ENP1|MEG1 chromosome 2 L000003200|L000001059 2 714455 713004 C 2011-02-03 1997-01-28 Protein associated with U3 and U14 snoRNAs; required for pre-rRNA processing and 40S ribosomal subunit synthesis; localized in the nucleus and concentrated in the nucleolus; human BYSL functionally complements the heat sensitivity of an enp1 ts mutant +S000031591 CDS YBR247C 2 714455 713004 C 2011-02-03 1997-01-28 +S000000452 ORF Verified YBR248C HIS7 imidazoleglycerol-phosphate synthase chromosome 2 L000000784 2 716465 714807 C 146 2011-02-03 1997-01-28 Imidazole glycerol phosphate synthase; glutamine amidotransferase:cyclase that catalyzes the fifth step of histidine biosynthesis and also produces 5-aminoimidazole-4-carboxamide ribotide (AICAR), a purine precursor +S000031672 CDS YBR248C 2 716465 714807 C 2011-02-03 1997-01-28 +S000000453 ORF Verified YBR249C ARO4 3-deoxy-7-phosphoheptulonate synthase ARO4 chromosome 2 L000000119 2 717994 716882 C 2011-02-03 1997-01-28 3-deoxy-D-arabino-heptulosonate-7-phosphate (DAHP) synthase; catalyzes the first step in aromatic amino acid biosynthesis and is feedback-inhibited by tyrosine or high concentrations of phenylalanine or tryptophan; relative distribution to the nucleus increases upon DNA replication stress +S000031774 CDS YBR249C 2 717994 716882 C 2011-02-03 1997-01-28 +S000000454 ORF Verified YBR250W SPO23 chromosome 2 2 719033 720604 W 2011-02-03 1997-01-28 Protein of unknown function; associates with meiosis-specific protein Spo1p +S000033891 CDS YBR250W 2 719033 720604 W 2011-02-03 1997-01-28 +S000000455 ORF Verified YBR251W MRPS5 mitochondrial 37S ribosomal protein MRPS5 chromosome 2 L000001174 2 721390 722313 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the small subunit +S000034780 CDS YBR251W 2 721390 722313 W 2011-02-03 1997-01-28 +S000000456 ORF Verified YBR252W DUT1 bifunctional dITP/dUTP diphosphatase chromosome 2 L000000537 2 722611 723054 W 2011-02-03 1997-01-28 Deoxyuridine triphosphate diphosphatase (dUTPase); catalyzes hydrolysis of dUTP to dUMP and PPi, thereby preventing incorporation of uracil into DNA during replication; critical for the maintenance of genetic stability; also has diphosphatase activity on deoxyinosine triphosphate; human homolog DUT allows growth of yeast haploid dut1 null mutant after sporulation of heterozygous diploid +S000034888 CDS YBR252W 2 722611 723054 W 2011-02-03 1997-01-28 +S000000457 ORF Verified YBR253W SRB6 MED22 chromosome 2 L000002053 2 723270 723635 W 2011-02-03 1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation +S000035009 CDS YBR253W 2 723270 723635 W 2011-02-03 1997-01-28 +S000000458 ORF Verified YBR254C TRS20 TRAPP subunit TRS20 chromosome 2 S000007431 2 724263 723736 C 2011-02-03 1997-01-28 Core component of transport protein particle (TRAPP) complexes I-III; TRAPPs are multimeric guanine nucleotide-exchange factors for GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); mutation leads to defects in endocytic recycling, block in sporulation/meiosis; mutations in human homolog TRAPPC2 cause spondyloepiphyseal dysplasia tarda, TRAPPC2 can complement yeast null mutant +S000035081 CDS YBR254C 2 724263 723736 C 2011-02-03 1997-01-28 +S000000459 ORF Verified YBR255W MTC4 chromosome 2 2 724456 726540 W 2011-02-03 1997-01-28 Protein of unknown function; required for normal growth rate at 15 degrees C; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; mtc4 is synthetically sick with cdc13-1 +S000036028 CDS YBR255W 2 724456 726540 W 2011-02-03 1997-01-28 +S000007649 ORF Uncharacterized YBR255C-A RCF3 chromosome 2 2 727074 726618 C 2011-02-03 2003-12-17|2001-06-26 Putative protein of unknown function; may interact with respiratory chain complexes III (ubiquinol-cytochrome c reductase) or IV (cytochrome c oxidase); identified by sequence comparison with hemiascomycetous yeast species +S000037335 CDS YBR255C-A 2 726917 726618 C 2011-02-03 2003-12-17|2001-06-26 +S000037334 CDS YBR255C-A 2 727074 727012 C 2011-02-03 2003-12-17|2001-06-26 +S000037336 intron YBR255C-A 2 727011 726918 C 2011-02-03 2003-12-17|2001-06-26 +S000000460 ORF Verified YBR256C RIB5 riboflavin synthase chromosome 2 L000001636 2 728102 727386 C 150 2011-02-03 1997-01-28 Riboflavin synthase; catalyzes the last step of the riboflavin biosynthesis pathway +S000036049 CDS YBR256C 2 728102 727386 C 2011-02-03 1997-01-28 +S000000461 ORF Verified YBR257W POP4 RNase P/RNase MRP complex subunit chromosome 2 L000003537 2 728885 729724 W 2011-02-03 1997-01-28 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; binds to the RPR1 RNA subunit in RNase P +S000036225 CDS YBR257W 2 728885 729724 W 2011-02-03 1997-01-28 +S000000462 ORF Verified YBR258C SHG1 CPS15 chromosome 2 2 730162 729734 C 2011-02-03 1997-01-28 Subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3 on lysine 4 and is required in transcriptional silencing near telomeres +S000036263 CDS YBR258C 2 730162 729734 C 2011-02-03 1997-01-28 +S000000463 ORF Verified YBR259W chromosome 2 2 730387 732453 W 2011-02-03 1997-01-28 Protein of unknown function; YBR259W is not an essential gene; forms cytoplasmic foci upon DNA replication stress +S000036998 CDS YBR259W 2 730387 732453 W 2011-02-03 1997-01-28 +S000000464 ORF Verified YBR260C RGD1 chromosome 2 2 734639 732639 C 2011-02-03 1997-01-28 GTPase-activating protein (RhoGAP) for Rho3p and Rho4p; possibly involved in control of actin cytoskeleton organization +S000035993 CDS YBR260C 2 734639 732639 C 2011-02-03 1997-01-28 +S000000465 ORF Verified YBR261C TAE1 N-terminal protein methyltransferase|NTM1 chromosome 2 2 735530 734832 C 2011-02-03 1997-01-28 AdoMet-dependent proline methyltransferase; catalyzes the dimethylation of ribosomal proteins Rpl12 and Rps25 at N-terminal proline residues; has a role in protein synthesis; fusion protein localizes to the cytoplasm +S000037822 CDS YBR261C 2 735530 734832 C 2011-02-03 1997-01-28 +S000000466 ORF Verified YBR262C MIC12 AIM5|MCS12|FMP51 chromosome 2 2 736040 735720 C 2011-02-03 1997-01-28 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; forms a subcomplex with Mic10p and Mic27p whose assembly and stability requires cardiolipin +S000029843 CDS YBR262C 2 736040 735720 C 2011-02-03 1997-01-28 +S000000467 ORF Verified YBR263W SHM1 glycine hydroxymethyltransferase SHM1|TMP3|SHMT1 chromosome 2 L000001883 2 736264 737736 W 2011-02-03 2003-09-22|1997-01-28 Mitochondrial serine hydroxymethyltransferase; converts serine to glycine plus 5,10 methylenetetrahydrofolate; involved in generating precursors for purine, pyrimidine, amino acid, and lipid biosynthesis; reverse reaction generates serine +S000030905 CDS YBR263W 2 736264 737736 W 2011-02-03 2003-09-22|1997-01-28 +S000000468 ORF Verified YBR264C YPT10 Rab family GTPase YPT10 chromosome 2 2 738369 737770 C 2011-02-03 2003-09-22|1997-01-28 Rab family GTP-binding protein; contains the PEST signal sequence specific for proteolytic enzymes; may be involved in vesicular transport; overexpression leads to accumulation of Golgi-like cisternae with budding vesicles +S000030937 CDS YBR264C 2 738369 737770 C 2011-02-03 2003-09-22|1997-01-28 +S000000469 ORF Verified YBR265W TSC10 3-dehydrosphinganine reductase chromosome 2 2 738582 739544 W 2011-02-03 1997-01-28|2011-02-03 3-ketosphinganine reductase; catalyzes the second step in phytosphingosine synthesis; essential for growth in the absence of exogenous dihydrosphingosine or phytosphingosine; localized to lipid droplets; member of short chain dehydrogenase/reductase protein family +S000031091 CDS YBR265W 2 738582 739544 W 2011-02-03 1997-01-28|2011-02-03 +S000000471 ORF Verified YBR267W REI1 chromosome 2 2 739841 741022 W 2011-02-03 1999-04-26|1997-01-28|2011-02-03 Cytoplasmic pre-60S factor; required for the correct recycling of shuttling factors Alb1, Arx1 and Tif6 at the end of the ribosomal large subunit biogenesis; involved in bud growth in the mitotic signaling network +S000032151 CDS YBR267W 2 739841 741022 W 2011-02-03 1999-04-26|1997-01-28|2011-02-03 +S000000470 ORF Dubious YBR266C SLM6 chromosome 2 2 740388 739936 C 2011-02-03 1999-04-26|1997-01-28|2011-02-03 Protein with a potential role in actin cytoskeleton organization; gene exhibits synthetic genetic interaction with MSS4 encoding phosphatidylinositol 4-phosphate kinase +S000031132 CDS YBR266C 2 740388 739936 C 2011-02-03 1999-04-26|1997-01-28|2011-02-03 +S000000472 ORF Verified YBR268W MRPL37 mitochondrial 54S ribosomal protein YmL37|YmL37 chromosome 2 L000001172 2 741299 741616 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit +S000032225 CDS YBR268W 2 741299 741616 W 2011-02-03 1997-01-28 +S000118353 ARS ARS224 ARSII-742 chromosome 2 2 741681 741797 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178053 ARS_consensus_sequence ARS224 2 741742 741726 C 2014-11-18 2014-11-18 +S000000473 ORF Verified YBR269C SDH8 FMP21 chromosome 2 2 742576 742160 C 2011-02-03 2004-01-09|1997-01-28 Protein required for assembly of succinate dehydrogenase; interacts with flavinylated Sdh1p and may function as a chaperone for free Sdh1p, protecting its FAD cofactor from redox reactions before assembly of the complex; soluble protein of the mitochondrial matrix; respiratory defect of null mutant is functionally complemented by Drosophila and human orthologs +S000032252 CDS YBR269C 2 742576 742160 C 2011-02-03 2004-01-09|1997-01-28 +S000000474 ORF Verified YBR270C BIT2 chromosome 2 2 744398 742761 C 2011-02-03 1997-01-28|2011-02-03 Subunit of TORC2 membrane-associated complex; involved in regulation of actin cytoskeletal dynamics during polarized growth and cell wall integrity; interacts with Slm1p and Slm2p, homologous PH domain-containing TORC2 substrates; BIT2 has a paralog, BIT61, that arose from the whole genome duplication +S000031901 CDS YBR270C 2 744398 742761 C 2011-02-03 1997-01-28|2011-02-03 +S000000475 ORF Verified YBR271W EFM2 S-adenosylmethionine-dependent methyltransferase chromosome 2 2 744852 746111 W 2011-02-03 1997-01-28 S-adenosylmethionine-dependent methyltransferase; seven-beta-strand lysine methyltransferase which dimethylates translation elongation factor EF2 (Eft1p and Eft2p) at lysine 613 and methylates EF3 (Yef3p) at lysine 187; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; involved in regulation of translational termination; predicted involvement in ribosome biogenesis +S000032109 CDS YBR271W 2 744852 746111 W 2011-02-03 1997-01-28 +S000000476 ORF Verified YBR272C HSM3 chromosome 2 L000004729 2 747803 746361 C 2011-02-03 1997-01-28 Evolutionarily conserved 19S regulatory particle assembly-chaperone; involved in the assembly of the base subcomplex of the 19S proteasomal regulatory particle (RP); involved in DNA mismatch repair during slow growth; weak similarity to Msh1p; structural study suggests Hsm3p is a scaffold protein for Rpt1p-Rpt2p complex formation; ortholog of human 19S subunit S5b +S000032139 CDS YBR272C 2 747803 746361 C 2011-02-03 1997-01-28 +S000000477 ORF Verified YBR273C UBX7 CUI3 chromosome 2 2 749371 748061 C 2011-02-03 1997-01-28 UBX (ubiquitin regulatory X) domain-containing protein; interacts with Cdc48p; UBX7 has a paralog, UBX6, that arose from the whole genome duplication +S000034143 CDS YBR273C 2 749371 748061 C 2011-02-03 1997-01-28 +S000000478 ORF Verified YBR274W CHK1 serine/threonine protein kinase CHK1 chromosome 2 L000004861 2 749594 751177 W 2011-02-03 1997-01-28 Serine/threonine kinase and DNA damage checkpoint effector; mediates cell cycle arrest via phosphorylation of Pds1p; phosphorylated by checkpoint signal transducer Mec1p; homolog of S. pombe and mammalian Chk1 checkpoint kinase +S000034288 CDS YBR274W 2 749594 751177 W 2011-02-03 1997-01-28 +S000000479 ORF Verified YBR275C RIF1 DNA-binding protein RIF1 chromosome 2 L000001639 2 757106 751356 C 2011-02-03 1997-01-28|2011-02-03 Protein that binds to the Rap1p C-terminus; acts synergistically with Rif2p to help control telomere length and establish telomeric silencing; involved in control of DNA replication; contributes to resection of DNA double strand breaks (DSBs); deletion results in telomere elongation +S000034316 CDS YBR275C 2 757106 751356 C 2011-02-03 1997-01-28|2011-02-03 +S000118354 ARS ARS225 ARSII-757 chromosome 2 2 757437 757667 2011-02-03 2006-08-30 Autonomously Replicating Sequence; replication origin of very weak function +S000000480 ORF Verified YBR276C PPS1 tyrosine/serine/threonine protein phosphatase PPS1 chromosome 2 L000003522 2 760043 757620 C 2011-02-03 1997-01-28 Protein phosphatase; has specificity for serine, threonine, and tyrosine residues; has a role in the DNA synthesis phase of the cell cycle +S000034373 CDS YBR276C 2 760043 757620 C 2011-02-03 1997-01-28 +S000000482 ORF Verified YBR278W DPB3 DNA polymerase epsilon noncatalytic subunit chromosome 2 L000000520 2 760294 760899 W 2011-02-03 1997-01-28 Third-largest subunit of DNA polymerase II (DNA polymerase epsilon); required to maintain fidelity of chromosomal replication and also for inheritance of telomeric silencing; stabilizes the interaction of Pol epsilon with primer-template DNA, positively affecting the processivity of the polymerase and exonuclease activities of Pol epsilon; mRNA abundance peaks at the G1/S boundary of the cell cycle; DPB3 has a paralog, DLS1, that arose from the whole genome duplication +S000035459 CDS YBR278W 2 760294 760899 W 2011-02-03 1997-01-28 +S000000481 ORF Dubious YBR277C chromosome 2 2 760616 760215 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YBR278W +S000035356 CDS YBR277C 2 760616 760215 C 2011-02-03 1997-01-28 +S000000483 ORF Verified YBR279W PAF1 chromosome 2 L000002621 2 761257 762594 W 2011-02-03 1997-01-28 Component of the Paf1p complex involved in transcription elongation; binds to and modulates the activity of RNA polymerases I and II; required for expression of a subset of genes, including cell cycle-regulated genes; involved in SER3 repression by helping to maintain SRG1 transcription-dependent nucleosome occupancy; homolog of human PD2/hPAF1 +S000035503 CDS YBR279W 2 761257 762594 W 2011-02-03 1997-01-28 +S000000484 ORF Verified YBR280C SAF1 SCF ubiquitin ligase complex subunit SAF1 chromosome 2 2 764697 762784 C 2011-02-03 2003-09-22|1997-01-28 F-Box protein involved in proteasome-dependent degradation of Aah1p; involved in proteasome-dependent degradation of Aah1p during entry of cells into quiescence; interacts with Skp1 +S000035024 CDS YBR280C 2 764697 762784 C 2011-02-03 2003-09-22|1997-01-28 +S000000485 ORF Verified YBR281C DUG2 glutamine amidotransferase subunit DUG2 chromosome 2 2 767606 764970 C 2011-02-03 1997-01-28 Component of glutamine amidotransferase (GATase II); forms a complex with Dug3p to degrade glutathione (GSH) and other peptides containing a gamma-glu-X bond in an alternative pathway to GSH degradation by gamma-glutamyl transpeptidase (Ecm38p) +S000035219 CDS YBR281C 2 767606 764970 C 2011-02-03 1997-01-28 +S000000486 ORF Verified YBR282W MRPL27 mitochondrial 54S ribosomal protein YmL27|YmL27 chromosome 2 L000002528|L000001167 2 768240 768680 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; homolog of human Bcl-2 interacting protein BMRP +S000036203 CDS YBR282W 2 768240 768680 W 2011-02-03 1997-01-28 +S000000487 ORF Verified YBR283C SSH1 chromosome 2 L000003994 2 770415 768943 C 2011-02-03 1997-01-28 Subunit of the Ssh1 translocon complex; Sec61p homolog involved in co-translational pathway of protein translocation; not essential +S000036248 CDS YBR283C 2 770415 768943 C 2011-02-03 1997-01-28 +S000000488 ORF Uncharacterized YBR284W metallo-dependent hydrolase superfamily protein chromosome 2 2 771239 773632 W 2011-02-03 1997-01-28 Putative metallo-dependent hydrolase superfamily protein; similar to AMP deaminases but lacks key catalytic residues and does not rescue purine nucleotide metabolic defect of quadruple aah1 ade8 amd1 his1 mutant; null mutant exhibits longer telomeres, altered Ty mobility, decreased resistance to rapamycin and wortmannin; induced in response to hydrostatic pressure; not an essential gene; YBR284W has a paralog, YJL070C, that arose from the whole genome duplication +S000036400 CDS YBR284W 2 771239 773632 W 2011-02-03 1997-01-28 +S000000489 ORF Uncharacterized YBR285W chromosome 2 2 773922 774356 W 2011-02-03 1997-01-28|2011-02-03 Putative protein of unknown function; YBR285W is not an essential gene +S000030111 CDS YBR285W 2 773922 774356 W 2011-02-03 1997-01-28|2011-02-03 +S000000490 ORF Verified YBR286W APE3 APY1 chromosome 2 L000000093 2 774700 776313 W 2011-02-03 1997-01-28|2005-11-07 Vacuolar aminopeptidase Y; processed to mature form by Prb1p +S000030229 CDS YBR286W 2 774700 776313 W 2011-02-03 1997-01-28|2005-11-07 +S000000491 ORF Uncharacterized YBR287W ZSP1 chromosome 2 2 776571 777854 W 2011-02-03 1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the ER; YBR287W is not an essential gene +S000030366 CDS YBR287W 2 776571 777854 W 2011-02-03 1997-01-28 +S000000492 ORF Verified YBR288C APM3 YKS6 chromosome 2 L000002758 2 779463 778012 C 2011-02-03 1997-01-28|2011-02-03 Mu3-like subunit of the clathrin associated protein complex (AP-3); functions in transport of alkaline phosphatase to the vacuole via the alternate pathway +S000030452 CDS YBR288C 2 779463 778012 C 2011-02-03 1997-01-28|2011-02-03 +S000000493 ORF Verified YBR289W SNF5 TYE4|SWI10|HAF4 chromosome 2 L000001948 2 779667 782384 W 2011-02-03 1997-01-28|2011-02-03 Subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; functions interdependently in transcriptional activation with Snf2p and Snf6p; relocates to the cytosol under hypoxic conditions +S000031369 CDS YBR289W 2 779667 782384 W 2011-02-03 1997-01-28|2011-02-03 +S000000494 ORF Verified YBR290W BSD2 chromosome 2 L000000194 2 782591 783556 W 2011-02-03 1997-01-28 Heavy metal ion homeostasis protein; facilitates trafficking of Smf1p and Smf2p metal transporters to vacuole where they are degraded; acts as an adaptor protein with Rsp5p in the regulated endocytosis of Smf1p and is itself ubiquitylated by Rsp5p; controls metal ion transport, prevents metal hyperaccumulation, functions in copper detoxification +S000031117 CDS YBR290W 2 782591 783556 W 2011-02-03 1997-01-28 +S000000495 ORF Verified YBR291C CTP1 chromosome 2 L000003310 2 784572 783673 C 2011-02-03 1997-01-28 Mitochondrial inner membrane citrate transporter; member of the mitochondrial carrier family +S000031161 CDS YBR291C 2 784572 783673 C 2011-02-03 1997-01-28 +S000000496 ORF Dubious YBR292C chromosome 2 2 785073 784702 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YBR292C is not an essential gene +S000032196 CDS YBR292C 2 785073 784702 C 2011-02-03 1997-01-28 +S000000497 ORF Verified YBR293W VBA2 chromosome 2 2 787006 788430 W 2011-02-03 1997-01-28 Permease of basic amino acids in the vacuolar membrane +S000032357 CDS YBR293W 2 787006 788430 W 2011-02-03 1997-01-28 +S000000498 ORF Verified YBR294W SUL1 sulfate permease|SFP2 chromosome 2 L000002180 2 789235 791814 W 2011-02-03 1999-04-26|1997-01-28 High affinity sulfate permease of the SulP anion transporter family; sulfate uptake is mediated by specific sulfate transporters Sul1p and Sul2p, which control the concentration of endogenous activated sulfate intermediates +S000032440 CDS YBR294W 2 789235 791814 W 2011-02-03 1999-04-26|1997-01-28 +S000118355 ARS ARS228 ARSII-792 chromosome 2 2 792218 792310 2014-11-18 2014-11-18|2006-08-30|2011-02-03 Autonomously Replicating Sequence +S000000499 ORF Verified YBR295W PCA1 cation-transporting P-type ATPase PCA1|PAY2|CAD2 chromosome 2 L000001347|L000000207 2 792849 796499 W 161 2011-02-03 1997-01-28|2011-02-03 Cadmium transporting P-type ATPase; may also have a role in copper and iron homeostasis; stabilized by Cd binding, which prevents ubiquitination; S288C and other lab strains contain a G970R mutation which eliminates Cd transport function +S000034460 CDS YBR295W 2 792849 796499 W 2011-02-03 1997-01-28|2011-02-03 +S000000500 ORF Verified YBR296C PHO89 ITN1 chromosome 2 2 798522 796798 C 2011-02-03 1997-01-28 Plasma membrane Na+/Pi cotransporter; active in early growth phase; similar to phosphate transporters of Neurospora crassa; transcription regulated by inorganic phosphate concentrations and Pho4p; mutations in related human transporter genes hPit1 and hPit2 are associated with hyperphosphatemia-induced calcification of vascular tissue and familial idiopathic basal ganglia calcification +S000034537 CDS YBR296C 2 798522 796798 C 2011-02-03 1997-01-28 +S000028605 ORF Uncharacterized YBR296C-A chromosome 2 2 800242 800123 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031414 CDS YBR296C-A 2 800242 800123 C 2011-02-03 2003-07-29 +S000000501 ORF Verified YBR297W MAL33 transcription factor MAL33|MALR|MAL3R chromosome 2 L000001016 2 800523 801929 W 2011-02-03 1997-01-28 MAL-activator protein; part of complex locus MAL3; nonfunctional in genomic reference strain S288C +S000034658 CDS YBR297W 2 800523 801929 W 2011-02-03 1997-01-28 +S000000502 ORF Verified YBR298C MAL31 maltose permease|MALT|MAL3T chromosome 2 L000001014 2 804475 802631 C 2011-02-03 1997-01-28 Maltose permease; high-affinity maltose transporter (alpha-glucoside transporter); encoded in the MAL3 complex locus; member of the 12 transmembrane domain superfamily of sugar transporters; functional in genomic reference strain S288C +S000034677 CDS YBR298C 2 804475 802631 C 2011-02-03 1997-01-28 +S000028606 ORF Uncharacterized YBR298C-A chromosome 2 2 805256 805035 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031416 CDS YBR298C-A 2 805256 805035 C 2011-02-03 2003-07-29 +S000000503 ORF Verified YBR299W MAL32 alpha-glucosidase MAL32|MALS|MAL3S chromosome 2 L000001015 2 805351 807105 W 2011-02-03 1997-01-28 Maltase (alpha-D-glucosidase); inducible protein involved in maltose catabolism; encoded in the MAL3 complex locus; functional in genomic reference strain S288C; hydrolyzes the disaccharides maltose, turanose, maltotriose, and sucrose +S000035668 CDS YBR299W 2 805351 807105 W 2011-02-03 1997-01-28 +S000000505 ORF Verified YBR301W PAU24 seripauperin PAU24|DAN3 chromosome 2 2 809057 809419 W 2011-02-03 1997-01-28 Cell wall mannoprotein; has similarity to Tir1p, Tir2p, Tir3p, and Tir4p; member of the seripauperin multigene family encoded mainly in subtelomeric regions; expressed under anaerobic conditions, completely repressed during aerobic growth +S000033172 CDS YBR301W 2 809057 809419 W 2011-02-03 1997-01-28 +S000000504 ORF Dubious YBR300C chromosome 2 2 809097 808600 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YBR301W; YBR300C is not an essential gene +S000033026 CDS YBR300C 2 809097 808600 C 2011-02-03 1997-01-28 +S000000506 ORF Verified YBR302C COS2 chromosome 2 L000004716 2 811479 810340 C 2011-02-03 1997-01-28 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000033196 CDS YBR302C 2 811479 810340 C 2011-02-03 1997-01-28 +S000028940 telomere TEL02R chromosome 2 2 812379 813184 W 166 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome II; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028941 telomeric_repeat TEL02R 2 813138 813184 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome II +S000028942 X_element TEL02R 2 812379 812848 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome II; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028943 X_element_combinatorial_repeat TEL02R 2 812849 813137 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr II; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000029654 ORF Verified R0010W FLP1 2-micron L000000619 2-micron 252 1523 W 2006-10-06 2004-02-11 Site-specific recombinase encoded on the 2-micron plasmid; required for 2-micron plasmid propagation as part of a plasmid amplification system that compensates for any copy number decreases caused by missegregation events +S000119086 CDS R0010W 2-micron 252 1523 W 2006-10-06 2004-02-11 +S000029675 ORF Verified R0020C REP1 2-micron L000001611 2-micron 3008 1887 C 2006-10-06 2004-02-11 Master regulator that regulates transcript levels of the FLP1 gene; acts in concert with Rep2p to regulate transcript levels of the FLP1 gene that promotes plasmid copy amplification and 2-micron plasmid-inheritance; also autoregulates levels of its own transcript; both Rep1p and Rep2p are sumoylated which is important for function +S000119087 CDS R0020C 2-micron 3008 1887 C 2006-10-06 2004-02-11 +S000029674 ORF Verified R0030W RAF1 2-micron S000007507 2-micron 3271 3816 W 2006-10-06 2004-02-11 Anti-repressor that increases 2 micron plasmid copy number; increases 2 micron plasmid copy number by relieving repression of the FLP1 site-specific recombinase caused by the Rep1-Rep2p trascription regulator; also itself repressed by the Rep1p-Rep2p complex +S000119088 CDS R0030W 2-micron 3271 3816 W 2006-10-06 2004-02-11 +S000029676 ORF Verified R0040C REP2 2-micron L000001612 2-micron 6198 5308 C 2006-10-06 2004-02-11 Master regulator that regulates transcript levels of the FLP1 gene; acts in concert with Rep1p to regulate transcript levels of the FLP1 gene that promotes plasmid copy amplification and 2-micron plasmid-inheritance; also autoregulates levels of its own transcript; required for Rep1p stability; both Rep1p and Rep2p are sumoylated which is important for function +S000119089 CDS R0040C 2-micron 6198 5308 C 2006-10-06 2004-02-11 +S000028476 ARS ARS300 ARS300 chromosome 3 3 989 1068 2014-11-18 2003-03-31|2014-11-18 Autonomously Replicating Sequence +S000030118 ARS_consensus_sequence ARS300 3 1060 1050 C 2003-03-31 2003-03-31 +S000028871 telomere TEL03L chromosome 3 3 1098 1 C -50 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome III; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats +S000028872 telomeric_repeat TEL03L 3 360 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome III +S000028873 X_element TEL03L 3 1098 640 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome III; contains an ARS consensus sequence and an Abf1p binding site +S000028874 X_element_combinatorial_repeat TEL03L 3 639 361 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr III; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000006828 long_terminal_repeat YCLWomega1 chromosome 3 3 1179 1429 W 2000-09-13 2000-05-19 Ty5 LTR +S000006831 LTR_retrotransposon YCLWTy5-1 Ty5 chromosome 3 3 1179 4322 W 2000-09-13 2000-05-19 Ty5 element, LTR retrotransposon of the Copia (Pseudoviridae) group; this is the only near-full length Ty5 retrotransposon in S288C and it is non-functional +S000000581 ORF Dubious YCL076W chromosome 3 3 1392 2135 W 2000-09-13 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034360 CDS YCL076W 3 1392 2135 W 2000-09-13 2000-09-13|1997-01-28 +S000000580 pseudogene YCL075W chromosome 3 3 2126 2566 W 2000-09-13 1997-01-28 Pseudogene: encodes fragment of Ty Pol protein +S000033443 CDS YCL075W 3 2126 2566 W 2000-09-13 1997-01-28 +S000000579 pseudogene YCL074W chromosome 3 3 2824 3750 W 2000-09-13 2000-09-13|1997-01-28 Pseudogene: encodes fragment of Ty Pol protein +S000033352 CDS YCL074W 3 2824 3750 W 2000-09-13 2000-09-13|1997-01-28 +S000006829 long_terminal_repeat YCLWomega2 chromosome 3 3 4073 4322 W 2000-09-13 2000-05-19 Ty5 LTR +S000000575 ORF Verified YCL073C GEX1 glutathione exchanger chromosome 3 3 8326 6479 C 2000-09-13 2000-09-13|1997-01-28 Proton:glutathione antiporter; localized to the vacuolar and plasma membranes; imports glutathione from the vacuole and exports it through the plasma membrane; has a role in resistance to oxidative stress and modulation of the PKA pathway; GEX1 has a paralog, GEX2, that arose from a segmental duplication +S000033250 CDS YCL073C 3 8326 6479 C 2000-09-13 2000-09-13|1997-01-28 +S000000574 ORF Verified YCL069W VBA3 basic amino acid transporter chromosome 3 3 9706 11082 W 2000-09-13 1997-01-28 Permease of basic amino acids in the vacuolar membrane; VBA3 has a paralog, VBA5, that arose from a segmental duplication +S000031320 CDS YCL069W 3 9706 11082 W 2000-09-13 1997-01-28 +S000028477 ARS ARS301 ARS301 HML-E ARS chromosome 3 3 11146 11401 2003-03-31 2003-03-31 Inactive replication origin linked to the silent mating type locus HML; functions as a transcriptional silencer +S000030120 ARS_consensus_sequence ARS301 3 11257 11267 W 2003-03-31 2003-03-31 +S000029214 silent_mating_type_cassette_array silenced_gene HML HML chromosome 3 L000000791 3 11146 14849 W -49 2007-12-10 2007-12-10 Mating type cassette - left; unexpressed complete copy of the mating-type genes, silenced by the Sir2 histone deacetylase and its associated SIR1, SIR3 and SIR4 proteins; mating-type switching involves replacement of the Ya or Yalpha sequences present at the MAT locus with either the a or alpha genes located at one of the HM loci in a process stimulated by the HO endonuclease; sequence replacement occurs by gene conversion, leaving the donor unaltered +S000124942 W_region HML 3 11509 12238 W 2007-12-10 2007-12-10 +S000124943 X_region HML 3 12239 12943 W 2007-12-10 2007-12-10 +S000124944 Y_region HML 3 12944 13690 W 2007-12-10 2007-12-10 +S000124945 Z1_region HML 3 13691 13929 W 2007-12-10 2007-12-10 +S000124946 Z2_region HML 3 13930 14017 W 2007-12-10 2007-12-10 +S000000573 ORF Uncharacterized YCL068C chromosome 3 3 12285 11503 C 2000-09-13 2000-09-13|1997-01-28 Putative protein of unknown function +S000031134 CDS YCL068C 3 12285 11503 C 2000-09-13 2000-09-13|1997-01-28 +S000000572 ORF Verified|silenced_gene YCL067C HMLALPHA2 homeodomain mating type protein alpha2|ALPHA2 chromosome 3 3 13018 12386 C 2000-09-13 1997-01-28 Silenced copy of ALPHA2 at HML; homeobox-domain protein that associates with Mcm1p in haploid cells to repress a-specific gene expression and interacts with a1p in diploid cells to repress haploid-specific gene expression +S000030191 CDS YCL067C 3 13018 12386 C 2000-09-13 1997-01-28 +S000000571 ORF Verified|silenced_gene YCL066W HMLALPHA1 transcriptional co-activator mating type protein alpha|ALPHA1 chromosome 3 3 13282 13809 W 2000-09-13 1997-01-28 Silenced copy of ALPHA1 at HML; ALPHA1 encodes a transcriptional coactivator involved in the regulation of mating-type alpha-specific gene expression +S000030081 CDS YCL066W 3 13282 13809 W 2000-09-13 1997-01-28 +S000000570 ORF Dubious YCL065W chromosome 3 3 13751 14119 W 2000-09-13 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps HMLALPHA1 +S000029969 CDS YCL065W 3 13751 14119 W 2000-09-13 2000-09-13|1997-01-28 +S000028478 ARS ARS302 ARS302 HML-I ARS chromosome 3 3 14575 14849 2003-03-31 2003-03-31 Inactive replication origin linked to the silent mating type locus HML; functions as a transcriptional silencer +S000030152 ARS_consensus_sequence ARS302 3 14701 14711 W 2003-03-31 2003-03-31 +S000028479 ARS ARS303 ARS303 chromosome 3 3 14871 15213 2003-03-31 2003-03-31 Autonomously Replicating Sequence on Chromosome III; inactive as replication origin at native locus near HML +S000030154 ARS_consensus_sequence ARS303 3 15196 15186 C 2003-03-31 2003-03-31 +S000028480 ARS ARS320 ARS320 chromosome 3 3 15214 16274 2003-03-31 2003-03-31 Autonomously Replicating Sequence on Chromosome III; inactive as replication origin at native locus near HML +S000030156 ARS_consensus_sequence ARS320 3 15298 15308 W 2003-03-31 2003-03-31 +S000000569 ORF Verified YCL064C CHA1 L-serine/L-threonine ammonia-lyase CHA1 chromosome 3 L000000316 3 16880 15798 C -46 2000-09-13 2000-09-13|1997-01-28 Catabolic L-serine (L-threonine) deaminase; catalyzes the degradation of both L-serine and L-threonine; required to use serine or threonine as the sole nitrogen source, transcriptionally induced by serine and threonine +S000037243 CDS YCL064C 3 16880 15798 C 2000-09-13 2000-09-13|1997-01-28 +S000000568 ORF Verified YCL063W VAC17 YCL062W chromosome 3 3 17290 18561 W 2000-09-13 2000-09-13|1997-01-28 Phosphoprotein involved in vacuole inheritance; degraded in late M phase of the cell cycle; acts as a vacuole-specific receptor for myosin Myo2p; involved in regulation of asymmetric inheritance of aggregated/misfolded proteins and age reset +S000037206 CDS YCL063W 3 17290 18561 W 2000-09-13 2000-09-13|1997-01-28 +S000000566 ORF Verified YCL061C MRC1 chromatin-modulating protein MRC1|YCL060C chromosome 3 3 22106 18816 C 2000-09-13 2000-09-13|1997-01-28 S-phase checkpoint protein required for DNA replication; couples DNA helicase and polymerase; interacts with and stabilizes Pol2p at stalled replication forks during stress, where it forms a pausing complex with Tof1p and is phosphorylated by Mec1p; defines a novel S-phase checkpoint with Hog1p that coordinates DNA replication and transcription upon osmostress; protects uncapped telomeres; Dia2p-dependent degradation mediates checkpoint recovery; mammalian claspin homolog +S000036990 CDS YCL061C 3 22106 18816 C 2000-09-13 2000-09-13|1997-01-28 +S000000564 ORF Verified YCL059C KRR1 ribosome biosynthesis protein KRR1 chromosome 3 L000004098 3 23379 22429 C 2000-09-13 1997-01-28 Nucleolar protein required for rRNA synthesis and ribosomal assembly; required for the synthesis of 18S rRNA and for the assembly of 40S ribosomal subunit; essential gene +S000034984 CDS YCL059C 3 23379 22429 C 2000-09-13 1997-01-28 +S000028518 ORF Verified YCL058W-A ADF1 chromosome 3 3 23584 23925 W 2006-01-11 2003-07-29|2006-01-11 Transcriptional repressor encoded by the FYV5 antisense strand; negatively regulates transcription of FYV5 by binding to the promoter on the sense strand +S000030294 CDS YCL058W-A 3 23584 23925 W 2006-01-11 2003-07-29|2006-01-11 +S000000563 ORF Verified YCL058C FYV5 MDF1 chromosome 3 3 23981 23523 C 2000-09-13 1997-01-28 Protein involved in regulation of the mating pathway; binds with Matalpha2p to promoters of haploid-specific genes; required for survival upon exposure to K1 killer toxin; involved in ion homeostasis +S000034080 CDS YCL058C 3 23981 23523 C 2000-09-13 1997-01-28 +S000007547 ORF Verified YCL057C-A MIC10 MOS1|MCS10|MIO10 chromosome 3 3 24325 24032 C 2000-09-14 2000-09-14 Conserved component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; forms a subcomplex with Mic12p and Mic27p whose assembly and stability requires cardiolipin; homo-oligomers cause membrane bending; ortholog of human MINOS1 +S000037065 CDS YCL057C-A 3 24325 24032 C 2000-09-14 2000-09-14 +S000000562 ORF Verified YCL057W PRD1 metalloendopeptidase chromosome 3 L000003155 3 24768 26906 W 2000-09-13 1997-01-28 Zinc metalloendopeptidase; found in the cytoplasm and intermembrane space of mitochondria; with Cym1p, involved in degradation of mitochondrial proteins and of presequence peptides cleaved from imported proteins; protein abundance increases in response to DNA replication stress +S000034023 CDS YCL057W 3 24768 26906 W 2000-09-13 1997-01-28 +S000000561 ORF Verified YCL056C PEX34 chromosome 3 3 27359 26925 C 2000-09-13 1997-01-28 Protein that regulates peroxisome populations; peroxisomal integral membrane protein; interacts with Pex11p, Pex25p, and Pex27p to control both constitutive peroxisome division and peroxisome morphology and abundance during peroxisome proliferation +S000033789 CDS YCL056C 3 27359 26925 C 2000-09-13 1997-01-28 +S000000560 ORF Verified YCL055W KAR4 chromosome 3 L000003481 3 27929 28936 W 2000-09-13 1997-01-28 Transcription factor required for response to pheromones; also required during meiosis; exists in two forms, a slower-migrating form more abundant during vegetative growth and a faster-migrating form induced by pheromone +S000033110 CDS YCL055W 3 27929 28936 W 2000-09-13 1997-01-28 +S000028481 ARS ARS304 ARS304 chromosome 3 3 30200 30657 2003-03-31 2003-03-31 Autonomously Replicating Sequence on Chromosome III +S000030159 ARS_consensus_sequence ARS304 3 30439 30429 C 2003-03-31 2003-03-31 +S000178054 ORF Uncharacterized YCL054W-A RDT1 chromosome 3 3 30910 30996 W 2014-11-18 2014-11-18 Short open reading frame, shows evidence of translation; may be new protein-coding gene that originated de novo from noncoding sequence; same allele found in at least 33 other S. cerevisiae strains; at least 3 strains have a second allele with three nucleotide substitutions leading to two amino acid differences +S000178055 CDS YCL054W-A 3 30910 30996 W 2014-11-18 2014-11-18 +S000000559 ORF Verified YCL054W SPB1 27S pre-rRNA (guanosine2922-2'-O)-methyltransferase chromosome 3 L000001990 3 31449 33974 W 2000-09-13 1999-07-17|1997-01-28 AdoMet-dependent methyltransferase; involved in rRNA processing and 60S ribosomal subunit maturation; methylates G2922 in the tRNA docking site of the large subunit rRNA and in the absence of snR52, U2921; suppressor of PAB1 mutants +S000033016 CDS YCL054W 3 31449 33974 W 2000-09-13 1999-07-17|1997-01-28 +S000000557 ORF Verified YCL052C PBN1 chromosome 3 L000003219 3 35393 34143 C 2000-09-13 1997-01-28 Component of glycosylphosphatidylinositol-mannosyltransferase I; essential component; required for the autocatalytic post-translational processing of the protease B precursor Prb1p; localizes to ER in lumenal orientation; homolog of mammalian PIG-X +S000031965 CDS YCL052C 3 35393 34143 C 2000-09-13 1997-01-28 +S000000556 ORF Verified YCL051W LRE1 chromosome 3 L000003355 3 35865 37616 W 2000-09-13 2000-09-13|1997-01-28 Protein involved in control of cell wall structure and stress response; direct inhibitor of the nuclear Dbf2 related (NDR) kinase Cbk1p-Mob2p; overproduction confers resistance to cell-wall degrading enzymes; exhibits genetic interactions with genes involved in the cell wall integrity pathway; LRE1 has a paralog, HLR1, that arose from the whole genome duplication +S000031923 CDS YCL051W 3 35865 37616 W 2000-09-13 2000-09-13|1997-01-28 +S000000555 ORF Verified YCL050C APA1 bifunctional AP-4-A phosphorylase/ADP sulfurylase|DTP1 chromosome 3 L000000090 3 38801 37836 C -33 2000-09-13 2000-09-13|1997-01-28 AP4A phosphorylase; bifunctional diadenosine 5',5'''-P1,P4-tetraphosphate phosphorylase and ADP sulfurylase involved in catabolism of bis(5'-nucleosidyl) tetraphosphates; catalyzes phosphorolysis of dinucleoside oligophosphates, cleaving substrates' alpha/beta-anhydride bond and introducing Pi into the beta-position of the corresponding NDP formed; protein abundance increases under DNA replication stress; APA1 has a paralog, APA2, that arose from the whole genome duplication +S000031713 CDS YCL050C 3 38801 37836 C 2000-09-13 2000-09-13|1997-01-28 +S000028482 ARS ARS305 ARS305 chromosome 3 3 39508 39595 2014-11-18 2003-03-31|2014-11-18 Efficient early-firing replication origin on Chromosome III +S000030162 ARS_consensus_sequence ARS305 3 39589 39579 C 2003-03-31 2003-03-31 +S000000554 ORF Uncharacterized YCL049C chromosome 3 3 40724 39786 C 2000-09-13 2000-09-13|1997-01-28 Protein of unknown function; localizes to membrane fraction; YCL049C is not an essential gene +S000031529 CDS YCL049C 3 40724 39786 C 2000-09-13 2000-09-13|1997-01-28 +S000087203 ORF Uncharacterized YCL048W-A chromosome 3 3 41488 41727 W 2005-11-14 2005-11-14 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole; YCL048W-A has a paralog, YDR524C-B, that arose from the whole genome duplication +S000087204 CDS YCL048W-A 3 41488 41727 W 2005-11-14 2005-11-14 +S000000553 ORF Verified YCL048W SPS22 chromosome 3 3 42165 43556 W 2000-09-13 1997-01-28 Protein of unknown function; SPS22 has a paralog, SPS2, that arose from the whole genome duplication; redundant with Sps2p for the organization of the beta-glucan layer of the spore wall +S000031494 CDS YCL048W 3 42165 43556 W 2000-09-13 1997-01-28 +S000000552 ORF Verified YCL047C POF1 nicotinamide-nucleotide adenylyltransferase chromosome 3 3 44437 43661 C 2000-09-13 1997-01-28 Nicotinamide mononucleotide-specific adenylyltransferase (NMNAT); catalyzes the conversion of nicotinamide mononucleotide (NMN) to nicotinamide adenine dinucleotide (NAD+); role in the nicotinamide riboside (NR) salvage pathway of NAD+ biosynthesis; involved in NR and NAD+ homeostasis; ATPase involved in protein quality control and filamentation pathways; interacts physically with Kss1p and suppresses the filamentation defect of a kss1 deletion +S000030504 CDS YCL047C 3 44437 43661 C 2000-09-13 1997-01-28 +S000000551 ORF Dubious YCL046W chromosome 3 3 46640 46963 W 2000-09-13 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YCL045C +S000030444 CDS YCL046W 3 46640 46963 W 2000-09-13 1997-01-28 +S000000550 ORF Verified YCL045C EMC1 chromosome 3 3 46905 44623 C 2000-09-13 1997-01-28 Member of conserved endoplasmic reticulum membrane complex; involved in efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; interacts with Gal80p; homologous to worm H17B01.4/EMC-1, fly CG2943, and human KIAA0090 +S000030200 CDS YCL045C 3 46905 44623 C 2000-09-13 1997-01-28 +S000000549 ORF Verified YCL044C MGR1 chromosome 3 3 48364 47111 C 2000-09-13 1997-01-28 Subunit of the mitochondrial (mt) i-AAA protease supercomplex; i-AAA degrades misfolded mitochondrial proteins; forms a subcomplex with Mgr3p that binds to substrates to facilitate proteolysis; required for growth of cells lacking mtDNA +S000037468 CDS YCL044C 3 48364 47111 C 2000-09-13 1997-01-28 +S000000548 ORF Verified YCL043C PDI1 protein disulfide isomerase PDI1|TRG1|MFP1 chromosome 3 L000001360 3 50221 48653 C 2000-09-13 1997-01-28 Protein disulfide isomerase; multifunctional oxidoreductase of the ER lumen, essential for disulfide bond formation in secretory and cell-surface proteins, processing of non-native disulfide bonds; Ero1p activator; complexes with exomannosidase, Mnl1p to facilitate the recognition of misfolded glycoproteins and the trimming of glycan Man8GlcNAc2 to Man7GlcNAc2 on substrates, thereby accelerating ERAD; PDI1 has a paralog, EUG1, that arose from the whole genome duplication +S000037357 CDS YCL043C 3 50221 48653 C 2000-09-13 1997-01-28 +S000000547 ORF Uncharacterized YCL042W chromosome 3 3 50584 50943 W 2000-09-13 2000-09-13|1997-01-28 Putative protein of unknown function; epitope-tagged protein localizes to the cytoplasm +S000037297 CDS YCL042W 3 50584 50943 W 2000-09-13 2000-09-13|1997-01-28 +S000000546 ORF Dubious YCL041C chromosome 3 3 50627 50133 C 2000-09-13 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps both the verified gene PDI1/YCL043C and the uncharacterized gene YCL042W +S000036569 CDS YCL041C 3 50627 50133 C 2000-09-13 1997-01-28 +S000000545 ORF Verified YCL040W GLK1 glucokinase|HOR3 chromosome 3 L000000708 3 50838 52340 W -47 2000-09-13 1997-01-28 Glucokinase; catalyzes the phosphorylation of glucose at C6 in the first irreversible step of glucose metabolism; one of three glucose phosphorylating enzymes; expression regulated by non-fermentable carbon sources; GLK1 has a paralog, EMI2, that arose from the whole genome duplication +S000036534 CDS YCL040W 3 50838 52340 W 2000-09-13 1997-01-28 +S000000544 ORF Verified YCL039W GID7 glucose-induced degradation complex subunit GID7|MOH2 chromosome 3 3 52645 54882 W 2000-09-13 1999-07-17|1997-01-28 Subunit of GID Complex that binds directly to central component Vid30p; GID complex is involved in proteasome-dependent catabolite inactivation of fructose-1,6-bisphosphatase; Gid7p contains six WD40 repeats; computational analysis suggests that Gid7p and Moh1p have similar functions +S000035505 CDS YCL039W 3 52645 54882 W 2000-09-13 1999-07-17|1997-01-28 +S000000543 ORF Verified YCL038C ATG22 AUT4 chromosome 3 L000004750 3 56527 54941 C 2000-09-13 1997-01-28 Vacuolar integral membrane protein required for efflux of amino acids; required for efflux of amino acids during autophagic body breakdown in the vacuole; null mutation causes a gradual loss of viability during starvation +S000034405 CDS YCL038C 3 56527 54941 C 2000-09-13 1997-01-28 +S000000542 ORF Verified YCL037C SRO9 chromosome 3 L000003106 3 58678 57374 C 2003-09-22 2003-09-22|1997-01-28 Cytoplasmic RNA-binding protein; shuttles between nucleus and cytoplasm and is exported from the nucleus in an mRNA export-dependent manner; associates with translating ribosomes; involved in heme regulation of Hap1p as a component of the HMC complex, also involved in the organization of actin filaments; contains a La motif; SRO9 has a paralog, SLF1, that arose from the whole genome duplication +S000034295 CDS YCL037C 3 58678 57374 C 2003-09-22 2003-09-22|1997-01-28 +S000000541 ORF Verified YCL036W GFD2 YCD6 chromosome 3 L000004631 3 59026 60726 W 2000-09-13 1997-01-28 Protein of unknown function; identified as a high-copy suppressor of a dbp5 mutation; GFD2 has a paralog, YDR514C, that arose from the whole genome duplication +S000034257 CDS YCL036W 3 59026 60726 W 2000-09-13 1997-01-28 +S000000540 ORF Verified YCL035C GRX1 dithiol glutaredoxin GRX1 chromosome 3 3 61173 60841 C 2000-09-13 1997-01-28 Glutathione-dependent disulfide oxidoreductase; hydroperoxide and superoxide-radical responsive, heat-stable, with active site cysteine pair; protects cells from oxidative damage; GRX1 has a paralog, GRX2, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000033290 CDS YCL035C 3 61173 60841 C 2000-09-13 1997-01-28 +S000000539 ORF Verified YCL034W LSB5 chromosome 3 3 61658 62722 W 2000-09-13 2000-09-13|1997-01-28 Protein involved in membrane-trafficking events at plasma membrane; interacts with actin regulators Sla1p and Las17p, ubiquitin, Arf3p to couple actin dynamics to membrane trafficking processes; similar structure to GGA family of proteins with N-terminal VHS domain and GAT domain; binds Las17p, which is homolog of human Wiskott-Aldrich Syndrome protein involved in actin patch assembly, actin polymerization; may mediate disassembly of Pan1 complex from endocytic coat +S000033272 CDS YCL034W 3 61658 62722 W 2000-09-13 2000-09-13|1997-01-28 +S000000538 ORF Verified YCL033C MXR2 MSRB chromosome 3 3 63282 62776 C 2000-09-13 1997-01-28 Methionine-R-sulfoxide reductase; involved in the response to oxidative stress; protects iron-sulfur clusters from oxidative inactivation along with MXR1; involved in the regulation of lifespan +S000033176 CDS YCL033C 3 63282 62776 C 2000-09-13 1997-01-28 +S000000537 ORF Verified YCL032W STE50 chromosome 3 L000002125 3 63441 64481 W -22 2000-09-13 1997-01-28 Adaptor protein for various signaling pathways; involved in mating response, invasive/filamentous growth, osmotolerance; acts as an adaptor that links G protein-associated Cdc42p-Ste20p complex to the effector Ste11p to modulate signal transduction +S000033154 CDS YCL032W 3 63441 64481 W 2000-09-13 1997-01-28 +S000000536 ORF Verified YCL031C RRP7 chromosome 3 L000004251 3 65568 64675 C 2000-09-13 1997-01-28 Essential protein involved in rRNA processing and ribosome biogenesis; protein abundance increases in response to DNA replication stress +S000032244 CDS YCL031C 3 65568 64675 C 2000-09-13 1997-01-28 +S000000535 ORF Verified YCL030C HIS4 trifunctional histidinol dehydrogenase/phosphoribosyl-AMP cyclohydrolase/phosphoribosyl-ATP diphosphatase chromosome 3 L000000781 3 68333 65934 C -22 2000-09-13 2000-09-13|1997-01-28 Multifunctional enzyme containing phosphoribosyl-ATP pyrophosphatase; phosphoribosyl-AMP cyclohydrolase, and histidinol dehydrogenase activities; catalyzes the second, third, ninth and tenth steps in histidine biosynthesis +S000032161 CDS YCL030C 3 68333 65934 C 2000-09-13 2000-09-13|1997-01-28 +S000000534 ORF Verified YCL029C BIK1 PAC14|ARM5 chromosome 3 L000000178 3 69921 68599 C -21 2000-09-13 2000-09-13|1997-01-28 Microtubule-associated protein; component of the interface between microtubules and kinetochore, involved in sister chromatid separation; essential in polyploid cells but not in haploid or diploid cells; ortholog of mammalian CLIP-170 +S000031278 CDS YCL029C 3 69921 68599 C 2000-09-13 2000-09-13|1997-01-28 +S000000533 ORF Verified YCL028W RNQ1 prion domain-containing protein RNQ1|[PIN(+)] chromosome 3 S000007471 3 70150 71367 W 2000-09-13 2000-09-13|1997-01-28 [PIN(+)] prion; an infectious protein conformation that is generally an ordered protein aggregate +S000031217 CDS YCL028W 3 70150 71367 W 2000-09-13 2000-09-13|1997-01-28 +S000000532 ORF Verified YCL027W FUS1 chromosome 3 L000000653 3 71803 73341 W -21 2000-09-13 2000-09-13|1997-01-28 Membrane protein localized to the shmoo tip; required for cell fusion; expression regulated by mating pheromone; proposed to coordinate signaling, fusion, and polarization events required for fusion; potential Cdc28p substrate +S000031087 CDS YCL027W 3 71803 73341 W 2000-09-13 2000-09-13|1997-01-28 +S000007548 ORF Verified YCL026C-B HBN1 putative nitroreductase|YCL027C-A chromosome 3 3 73986 73405 C 2000-09-14 2000-09-14 Protein of unknown function; similar to bacterial nitroreductases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; protein becomes insoluble upon intracellular iron depletion; protein abundance increases in response to DNA replication stress +S000037064 CDS YCL026C-B 3 73986 73405 C 2000-09-14 2000-09-14 +S000028483 ARS ARS306 ARS306 chromosome 3 3 74458 74677 2003-03-31 2003-03-31 Early-firing autonomously replicating sequence on Chromosome III +S000030165 ARS_consensus_sequence ARS306 3 74521 74531 W 2003-03-31 2003-03-31 +S000000589 ORF Verified YCL026C-A FRM2 type II nitroreductase|YCLX08C chromosome 3 L000004082 3 75285 74704 C 2000-09-13 2000-09-13|1997-01-28 Type II nitroreductase, using NADH as reductant; mutants are defective in fatty acid mediated repression of genes involved in fatty acid biosynthesis indicative of a role in lipid signaling; involved in the oxidative stress response; transcription induction by cadmium and selenite indicates a possible role in the metal stress response; expression induced in cells treated with the mycotoxin patulin +S000032741 CDS YCL026C-A 3 75285 74704 C 2000-09-13 2000-09-13|1997-01-28 +S000000530 ORF Verified YCL025C AGP1 amino acid transporter AGP1|YCC5 chromosome 3 L000003271 3 77919 76018 C 2006-01-12 2000-09-13|1997-01-28|2006-01-12 Low-affinity amino acid permease with broad substrate range; involved in uptake of asparagine, glutamine, and other amino acids; expression regulated by SPS plasma membrane amino acid sensor system (Ssy1p-Ptr3p-Ssy5p); AGP1 has a paralog, GNP1, that arose from the whole genome duplication +S000029928 CDS YCL025C 3 77919 76018 C 2006-01-12 2000-09-13|1997-01-28|2006-01-12 +S000000529 ORF Verified YCL024W KCC4 serine/threonine protein kinase chromosome 3 3 79162 82275 W 2006-01-12 2000-09-13|1997-01-28 Protein kinase of the bud neck involved in the septin checkpoint; associates with septin proteins, negatively regulates Swe1p by phosphorylation, shows structural homology to bud neck kinases Gin4p and Hsl1p; KCC4 has a paralog, GIN4, that arose from the whole genome duplication +S000029873 CDS YCL024W 3 79162 82275 W 2006-01-12 2000-09-13|1997-01-28 +S000000528 ORF Dubious YCL023C chromosome 3 3 79296 78949 C 2006-01-12 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF KCC4 +S000037128 CDS YCL023C 3 79296 78949 C 2006-01-12 1997-01-28 +S000000527 ORF Dubious YCL022C chromosome 3 3 82085 81570 C 2006-01-12 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene KCC4/YCL024W +S000037053 CDS YCL022C 3 82085 81570 C 2006-01-12 2000-09-13|1997-01-28 +S000006549 tRNA_gene tE(UUC)C chromosome 3 L000003760 3 82533 82462 C 2006-01-12 2000-05-19 Glutamine tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000035973 noncoding_exon tE(UUC)C 3 82533 82462 C 2006-01-12 2000-05-19 +S000126593 long_terminal_repeat YCLWdelta15 chromosome 3 3 82700 83036 W 2008-06-04 2008-06-04 Ty1 LTR +S000006822 long_terminal_repeat YCLCdelta1 chromosome 3 3 83194 83055 C 2007-04-02 2000-05-19|2007-04-02 Ty1 LTR +S000007549 ORF Uncharacterized YCL021W-A chromosome 3 3 83620 83997 W 2006-01-12 2000-09-14 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the vacuole +S000037066 CDS YCL021W-A 3 83620 83997 W 2006-01-12 2000-09-14 +S000006823 long_terminal_repeat YCLWdelta2a chromosome 3 3 84069 84294 W 2006-01-12 2000-05-19 Ty1 LTR +S000006825 long_terminal_repeat YCLWdelta3 chromosome 3 3 84295 84626 W 2006-01-12 2000-05-19 Ty1 LTR +S000006824 long_terminal_repeat YCLWdelta2b chromosome 3 3 84630 84718 W 2006-01-12 2000-05-19 Ty1 LTR +S000006826 long_terminal_repeat YCLWdelta4 chromosome 3 3 84811 85142 W 2006-01-12 2000-05-19 Ty2 LTR +S000006830 LTR_retrotransposon YCLWTy2-1 Ty2 chromosome 3 3 84811 90769 W 2006-01-12 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000000525 transposable_element_gene YCL020W gag protein chromosome 3 3 85102 86418 W 2006-01-12 2000-09-13|1997-01-28 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000036953 CDS YCL020W 3 85102 86418 W 2006-01-12 2000-09-13|1997-01-28 +S000000524 transposable_element_gene YCL019W gag-pol fusion protein chromosome 3 3 85102 90415 W 2006-01-12 2000-12-01|1997-01-28 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000036163 CDS YCL019W 3 85102 86391 W 2006-01-12 2000-12-01 +S000036164 CDS YCL019W 3 86393 90415 W 2006-01-12 2000-12-01|1997-01-28 +S000036165 plus_1_translational_frameshift YCL019W 3 86392 86392 W 2006-01-12 2000-12-01 +S000006827 long_terminal_repeat YCLWdelta5 chromosome 3 3 90438 90769 W 2006-01-12 2000-05-19 Ty2 LTR +S000006637 tRNA_gene tL(CAA)C SUP53 chromosome 3 L000002210|L000003751 3 90859 90972 W -10 2006-01-12 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations +S000033768 intron tL(CAA)C 3 90897 90928 W 2006-01-12 2000-05-19 +S000033766 noncoding_exon tL(CAA)C 3 90859 90896 W 2006-01-12 2000-05-19 +S000033767 noncoding_exon tL(CAA)C 3 90929 90972 W 2006-01-12 2000-05-19 +S000000523 ORF Verified YCL018W LEU2 3-isopropylmalate dehydrogenase chromosome 3 L000000943 3 91324 92418 W -5 2006-01-12 2000-09-13|1997-01-28 Beta-isopropylmalate dehydrogenase (IMDH); catalyzes the third step in the leucine biosynthesis pathway; can additionally catalyze the conversion of beta-ethylmalate into alpha-ketovalerate +S000035270 CDS YCL018W 3 91324 92418 W 2006-01-12 2000-09-13|1997-01-28 +S000000522 ORF Verified YCL017C NFS1 SPL1 chromosome 3 L000001240 3 94270 92777 C 2006-01-12 2000-09-13|1997-01-28 Cysteine desulfurase; involved in iron-sulfur cluster (Fe/S) biogenesis and in thio-modification of mitochondrial and cytoplasmic tRNAs; essential protein located predominantly in mitochondria +S000034976 CDS YCL017C 3 94270 92777 C 2006-01-12 2000-09-13|1997-01-28 +S000000521 ORF Verified YCL016C DCC1 chromosome 3 3 95763 94621 C 2006-01-12 2000-09-13|1997-01-28 Subunit of a complex with Ctf8p and Ctf18p; shares some components with Replication Factor C; required for sister chromatid cohesion and telomere length maintenance +S000034840 CDS YCL016C 3 95763 94621 C 2006-01-12 2000-09-13|1997-01-28 +S000000520 ORF Verified YCL014W BUD3 YCL012W chromosome 3 L000000200 3 96281 101191 W -9 2006-01-12 2000-09-13|1997-01-28 Guanine nucleotide exchange factor (GEF) for Cdc42p; activates Cdc42p in early G1, accounting for the first stage of biphasic activation, with Cdc24p accounting for the second stage in late G1; involved in the Cdc42p-mediated assembly of the axial landmark that dictates the site for the next round of budding, resulting in the axial budding pattern observed in haploids; localizes with septins to the bud neck contractile ring in mitosis +S000033879 CDS YCL014W 3 96281 101191 W 2006-01-12 2000-09-13|1997-01-28 +S000029705 ORF Verified YCL012C YCL011C-A chromosome 3 3 101788 101317 C 2006-01-12 2004-02-20|2011-02-03 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively; orthologs are present in S. bayanus, S. paradoxus and Ashbya gossypii; YCL012C is not an essential gene +S000036814 CDS YCL012C 3 101633 101317 C 2006-01-12 2004-02-20 +S000036813 CDS YCL012C 3 101788 101701 C 2006-01-12 2004-02-20 +S000036815 intron YCL012C 3 101700 101634 C 2006-01-12 2004-02-20|2011-02-03 +S000000517 ORF Verified YCL011C GBP2 single-stranded telomeric DNA-binding/mRNA-binding protein|RLF6 chromosome 3 L000002609|L000003049 3 103358 102075 C 2006-01-12 1997-01-28 Poly(A+) RNA-binding protein; key surveillance factor for the selective export of spliced mRNAs from the nucleus to the cytoplasm; preference for intron-containing genes; similar to Npl3p; also binds single-stranded telomeric repeat sequence in vitro; relocalizes to the cytosol in response to hypoxia; GBP2 has a paralog, HRB1, that arose from the whole genome duplication +S000032976 CDS YCL011C 3 103358 102075 C 2006-01-12 1997-01-28 +S000000516 ORF Verified YCL010C SGF29 chromosome 3 3 104350 103571 C 2006-01-12 1999-07-17|1997-01-28 Component of the HAT/Core module of the SAGA, SLIK, and ADA complexes; HAT/Core module also contains Gcn5p, Ngg1p, and Ada2p; binds methylated histone H3K4; involved in transcriptional regulation through SAGA and TBP recruitment to target promoters and H3 acetylation +S000032887 CDS YCL010C 3 104350 103571 C 2006-01-12 1999-07-17|1997-01-28 +S000000515 ORF Verified YCL009C ILV6 acetolactate synthase regulatory subunit chromosome 3 L000004096 3 105548 104619 C 2006-01-12 1999-07-17|1997-01-28 Regulatory subunit of acetolactate synthase; acetolactate synthase catalyzes the first step of branched-chain amino acid biosynthesis; enhances activity of the Ilv2p catalytic subunit, localizes to mitochondria +S000032134 CDS YCL009C 3 105548 104619 C 2006-01-12 1999-07-17|1997-01-28 +S000000514 ORF Verified YCL008C STP22 ubiquitin-binding ESCRT-I subunit protein STP22|AGS1|VPL15|VPS23 chromosome 3 L000003975|S000029031|L000000064 3 106853 105696 C 2006-01-12 2004-02-18|2000-09-13|1997-01-28 Component of the ESCRT-I complex; ESCRT-I is involved in ubiquitin-dependent sorting of proteins into the endosome; prevents polyubiquitination of the arrestin-related protein Rim8p, thereby directing its monoubiquitination by Rsp5p; homologous to the mouse and human Tsg101 tumor susceptibility gene; mutants exhibit a Class E Vps phenotype; +S000032022 CDS YCL008C 3 106853 105696 C 2006-01-12 2004-02-18|1997-01-28|2000-09-13 +S000028508 ORF Verified YCL005W-A VMA9 H(+)-transporting V0 sector ATPase subunit e|LDB10|CWH36 chromosome 3 3 107023 107417 W 2006-01-12 2003-07-29 Vacuolar H+ ATPase subunit e of the V-ATPase V0 subcomplex; essential for vacuolar acidification; interacts with the V-ATPase assembly factor Vma21p in the ER; involved in V0 biogenesis +S000030218 CDS YCL005W-A 3 107023 107033 W 2006-01-12 2003-07-29 +S000030219 CDS YCL005W-A 3 107111 107191 W 2006-01-12 2003-07-29 +S000030220 CDS YCL005W-A 3 107288 107417 W 2006-01-12 2003-07-29 +S000030221 intron YCL005W-A 3 107034 107110 W 2006-01-12 2003-07-29 +S000030222 intron YCL005W-A 3 107192 107287 W 2006-01-12 2003-07-29 +S000000513 ORF Dubious YCL007C CWH36 chromosome 3 L000002918 3 107366 106974 C 2006-01-12 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps verified ORF YCL005W-A; mutations in YCL007C were thought to confer sensitivity to calcofluor white, but this phenotype was later shown to be due to the defect in YCL005W-A +S000031856 CDS YCL007C 3 107366 106974 C 2006-01-12 1997-01-28 +S000006503 snoRNA_gene snR43 SNR43 chromosome 3 L000003410 3 107712 107504 C 2006-01-12 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U966 and of 5.8S rRNA at position 73 +S000030615 noncoding_exon snR43 3 107712 107504 C 2006-01-12 2000-05-19 +S000000511 ORF Verified YCL005W LDB16 chromosome 3 3 108021 108791 W 2006-01-12 2000-09-13|1997-01-28 Protein involved in lipid droplet (LD) assembly; forms a complex with Sei1p at ER-LD contact sites, stabilizing contact sites; ensures that LDs bud from the ER towards the cytosolic side of the membrane; null mutants have decreased net negative cell surface charge and localized accumulation of phosphatidic acid (PA) marker proteins; GFP-fusion protein expression is induced in response to MMS; null mutant can be complemented by the human seipin, BSCL2 +S000030833 CDS YCL005W 3 108021 108791 W 2006-01-12 2000-09-13|1997-01-28 +S000028484 ARS ARS307 ARS307 chromosome 3 3 108727 109060 2014-11-18 2003-03-31|2014-11-18 Autonomously Replicating Sequence on Chromosome III +S000030169 ARS_consensus_sequence ARS307 3 108970 108960 C 2006-01-12 2003-03-31 +S000000510 ORF Verified YCL004W PGS1 CDP-diacylglycerol--glycerol-3-phosphate 3-phosphatidyltransferase|YCL003W|PEL1 chromosome 3 L000001372 3 109105 110670 W 2006-01-12 2000-02-10|1997-01-28 Phosphatidylglycerolphosphate synthase; catalyzes the synthesis of phosphatidylglycerolphosphate from CDP-diacylglycerol and sn-glycerol 3-phosphate in the first committed and rate-limiting step of cardiolipin biosynthesis +S000030745 CDS YCL004W 3 109105 110670 W 2006-01-12 2000-02-10|1997-01-28 +S000000508 ORF Uncharacterized YCL002C chromosome 3 3 111675 110808 C 2011-02-03 2003-09-27|1997-01-28|2000-09-13|2011-02-03 Putative protein of unknown function; YCL002C is not an essential gene +S000037735 CDS YCL002C 3 111557 110808 C 2011-02-03 2003-09-27|1997-01-28|2000-09-13|2011-02-03 +S000037734 CDS YCL002C 3 111675 111634 C 2011-02-03 2003-09-27 +S000037736 intron YCL002C 3 111633 111558 C 2011-02-03 2003-09-27 +S000000507 ORF Verified YCL001W RER1 protein retrieval receptor chromosome 3 L000001613 3 111916 112482 W 2011-02-03 1999-07-17|1997-01-28 Protein involved in retention of membrane proteins; including Sec12p, in the ER; localized to Golgi; functions as a retrieval receptor in returning membrane proteins to the ER +S000037714 CDS YCL001W 3 111916 112482 W 2011-02-03 1999-07-17|1997-01-28 +S000007221 ORF Uncharacterized YCL001W-A chromosome 3 3 113080 113541 W 2011-02-03 1999-07-17 Putative protein of unknown function; YCL001W-A gene has similarity to DOM34 and is present in a region duplicated between chromosomes XIV and III +S000034577 CDS YCL001W-A 3 113080 113541 W 2011-02-03 1999-07-17 +S000007596 ORF Uncharacterized YCL001W-B chromosome 3 3 113770 114024 W 2011-02-03 2001-02-26 Putative protein of unknown function; present in a region duplicated between chromosomes XIV and III; YCL001W-B has a paralog, DOM34, that arose from the whole genome duplication +S000037142 CDS YCL001W-B 3 113770 114024 W 2011-02-03 2001-02-26 +S000028485 ARS ARS308 ARS308 chromosome 3 3 114321 114939 2011-02-03 2003-03-31 Autonomously Replicating Sequence on Chromosome III +S000006465 centromere CEN3 CEN3 chromosome 3 L000000296 3 114385 114501 W 0 2011-02-03 2000-05-19 Chromosome III centromere +S000077263 centromere_DNA_Element_I CEN3 3 114385 114394 W 2011-02-03 2004-10-04 +S000077264 centromere_DNA_Element_II CEN3 3 114395 114476 W 2011-02-03 2004-10-04 +S000077265 centromere_DNA_Element_III CEN3 3 114477 114501 W 2011-02-03 2004-10-04 +S000000594 ORF Uncharacterized YCR001W chromosome 3 3 115685 115999 W 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR001W is not an essential gene +S000035168 CDS YCR001W 3 115685 115999 W 2011-02-03 1997-01-28 +S000000595 ORF Verified YCR002C CDC10 septin CDC10 chromosome 3 L000000250 3 118348 117380 C -.75 2011-02-03 1997-01-28 Component of the septin ring, required for cytokinesis; septins are GTP-binding proteins that assemble into rod-like hetero-oligomers that can associate to form filaments; septin rings at the mother-bud neck act as scaffolds for recruiting cell division factors and as barriers to prevent diffusion of specific proteins between mother and daughter cells; N-terminus interacts with phosphatidylinositol-4,5-bisphosphate; protein abundance increases under DNA damage stress +S000035178 CDS YCR002C 3 118348 117380 C 2011-02-03 1997-01-28 +S000000596 ORF Verified YCR003W MRPL32 mitochondrial 54S ribosomal protein YmL32|YmL32 chromosome 3 L000001169 3 118620 119171 W 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; protein abundance increases in response to DNA replication stress +S000036143 CDS YCR003W 3 118620 119171 W 2011-02-03 1997-01-28 +S000000597 ORF Verified YCR004C YCP4 flavodoxin-like fold family protein chromosome 3 L000004160 3 120318 119575 C 2011-02-03 1997-01-28 Protein of unknown function; has sequence and structural similarity to flavodoxins; predicted to be palmitoylated; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000036195 CDS YCR004C 3 120318 119575 C 2011-02-03 1997-01-28 +S000000598 ORF Verified YCR005C CIT2 citrate (Si)-synthase CIT2 chromosome 3 L000000342 3 122328 120946 C 2011-02-03 2000-09-13|1997-01-28 Citrate synthase, peroxisomal isozyme involved in glyoxylate cycle; catalyzes condensation of acetyl coenzyme A and oxaloacetate to form citrate; expression is controlled by Rtg1p and Rtg2p transcription factors; SCF-Ucc1 regulates level of Cit2p to maintain citrate homeostasis; oxaloacetate-dependent positive feedback loop inhibits Cit2p ubiquitination; CIT2 has a paralog, CIT1, that arose from the whole genome duplication +S000031674 CDS YCR005C 3 122328 120946 C 2011-02-03 2000-09-13|1997-01-28 +S000000599 ORF Uncharacterized YCR006C chromosome 3 3 123003 122530 C 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR006C is not an essential gene +S000031816 CDS YCR006C 3 123003 122530 C 2011-02-03 1997-01-28 +S000006678 tRNA_gene tP(AGG)C SUF2 chromosome 3 L000002150|L000003759 3 123648 123577 C 2 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in proline codons +S000033260 noncoding_exon tP(AGG)C 3 123648 123577 C 2011-02-03 2000-05-19 +S000006832 long_terminal_repeat YCRCdelta6 chromosome 3 3 124465 124134 C 2011-02-03 2000-05-19|2007-04-02 Ty1 LTR +S000000600 ORF Uncharacterized YCR007C DUP240 family protein chromosome 3 3 126730 126011 C 2011-02-03 1997-01-28 Putative integral membrane protein; member of DUP240 gene family; SWAT-GFP and mCherry fusion proteins localize to the cell periphery and vacuole; YCR007C is not an essential gene +S000031932 CDS YCR007C 3 126730 126011 C 2011-02-03 1997-01-28 +S000006668 tRNA_gene tN(GUU)C chromosome 3 L000003752 3 127716 127789 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000030674 noncoding_exon tN(GUU)C 3 127716 127789 W 2011-02-03 2000-05-19 +S000000601 ORF Verified YCR008W SAT4 serine/threonine protein kinase SAT4|HAL4 chromosome 3 L000004136 3 128470 130281 W 2011-02-03 1997-01-28 Ser/Thr protein kinase involved in salt tolerance; funtions in regulation of Trk1p-Trk2p potassium transporter; overexpression affects the Fe-S and lipoamide containing proteins in the mitochondrion; required for lipoylation of Lat1p, Kgd2p and Gcv3p; partially redundant with Hal5p; has similarity to Npr1p; localizes to the cytoplasm and mitochondrion +S000037489 CDS YCR008W 3 128470 130281 W 2011-02-03 1997-01-28 +S000000602 ORF Verified YCR009C RVS161 amphiphysin-like protein RVS161|SPE161|FUS7|END6 chromosome 3 L000001788 3 131542 130745 C 1 2011-02-03 1997-01-28 Amphiphysin-like lipid raft protein; N-BAR domain protein that interacts with Rvs167p and regulates polarization of the actin cytoskeleton, endocytosis, cell polarity, cell fusion and viability following starvation or osmotic stress +S000037521 CDS YCR009C 3 131542 130745 C 2011-02-03 1997-01-28 +S000028486 ARS ARS309 ARS309 chromosome 3 3 132043 132120 2014-11-18 2003-03-31|2014-11-18 Autonomously Replicating Sequence on Chromosome III +S000030172 ARS_consensus_sequence ARS309 3 132046 132056 W 2011-02-03 2003-03-31 +S000000603 ORF Verified YCR010C ADY2 ATO1 chromosome 3 3 133124 132273 C 2011-02-03 1997-01-28 Acetate transporter required for normal sporulation; phosphorylated in mitochondria; ADY2 has a paralog, ATO2, that arose from the whole genome duplication +S000037136 CDS YCR010C 3 133124 132273 C 2011-02-03 1997-01-28 +S000000604 ORF Verified YCR011C ADP1 putative ATP-dependent permease ADP1 chromosome 3 L000000049 3 136873 133724 C 1 2011-02-03 2000-09-13|1997-01-28 Putative ATP-dependent permease of the ABC transporter family +S000037210 CDS YCR011C 3 136873 133724 C 2011-02-03 2000-09-13|1997-01-28 +S000000605 ORF Verified YCR012W PGK1 phosphoglycerate kinase chromosome 3 L000001411 3 137746 138996 W 2 2011-02-03 2000-09-13|1997-01-28 3-phosphoglycerate kinase; catalyzes transfer of high-energy phosphoryl groups from the acyl phosphate of 1,3-bisphosphoglycerate to ADP to produce ATP; key enzyme in glycolysis and gluconeogenesis +S000037349 CDS YCR012W 3 137746 138996 W 2011-02-03 2000-09-13|1997-01-28 +S000000606 ORF Dubious YCR013C chromosome 3 3 139049 138402 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; transcription of both YCR013C and the overlapping essential gene PGK1 is reduced in a gcr1 null mutant +S000037371 CDS YCR013C 3 139049 138402 C 2011-02-03 1997-01-28 +S000000607 ORF Verified YCR014C POL4 DNA-directed DNA polymerase IV|POLX chromosome 3 L000001462 3 140933 139185 C 2011-02-03 2000-09-13|1997-01-28 DNA polymerase IV; undergoes pair-wise interactions with Dnl4p-Lif1p and Rad27p to mediate repair of DNA double-strand breaks by non-homologous end joining (NHEJ); homologous to mammalian DNA polymerase beta +S000029998 CDS YCR014C 3 140933 139185 C 2011-02-03 2000-09-13|1997-01-28 +S000000608 ORF Verified YCR015C CTO1 chromosome 3 3 142170 141217 C 2011-02-03 2000-09-13|1997-01-28 Protein required for cold tolerance; involved in phosphate uptake; YCR015C is not an essential gene +S000030089 CDS YCR015C 3 142170 141217 C 2011-02-03 2000-09-13|1997-01-28 +S000007298 snoRNA_gene snR33 SNR33 chromosome 3 L000001971 3 142546 142364 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U1042 +S000036761 noncoding_exon snR33 3 142546 142364 C 2011-02-03 2000-05-19 +S000006575 tRNA_gene tG(GCC)C SUF16 chromosome 3 L000002163|L000003758 3 142771 142701 C 3 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis;can mutate to suppress +1 frameshift mutations in glycine codons +S000037891 noncoding_exon tG(GCC)C 3 142771 142701 C 2011-02-03 2000-05-19 +S000006833 long_terminal_repeat YCRCdelta7 chromosome 3 3 143080 142758 C 2011-02-03 2000-05-19|2007-04-02 Ty1 LTR +S000000609 ORF Uncharacterized YCR016W chromosome 3 3 143634 144506 W 2011-02-03 2000-09-13|1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus and nucleus; predicted to be involved in ribosome biogenesis +S000030347 CDS YCR016W 3 143634 144506 W 2011-02-03 2000-09-13|1997-01-28 +S000000610 ORF Verified YCR017C CWH43 chromosome 3 3 147634 144773 C 2011-02-03 2000-09-13|1997-01-28 GPI lipid remodelase; responsible for introducing ceramides into GPI anchors having a C26:0 fatty acid in sn-2 of the glycerol moiety; can also use lyso-GPI protein anchors and various base resistant lipids as substrates; contains 14-16 transmembrane segments and several putative glycosylation and phosphorylation sites; null mutation is synthetically lethal with pkc1 deletion +S000030381 CDS YCR017C 3 147634 144773 C 2011-02-03 2000-09-13|1997-01-28 +S000000611 ORF Verified YCR018C SRD1 chromosome 3 L000002054 3 148903 148238 C 9 2011-02-03 2000-09-13|1997-01-28 Protein involved in the processing of pre-rRNA to mature rRNA; contains a C2/C2 zinc finger motif; srd1 mutation suppresses defects caused by the rrp1-1 mutation +S000033700 CDS YCR018C 3 148903 148238 C 2011-02-03 2000-09-13|1997-01-28 +S000006835 long_terminal_repeat YCRWdelta8 chromosome 3 3 149482 149809 W 2011-02-03 2000-05-19 Ty1 LTR +S000006658 tRNA_gene tM(CAU)C chromosome 3 L000003753 3 149920 149991 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), predicted by tRNAscan-SE analysis +S000034498 noncoding_exon tM(CAU)C 3 149920 149991 W 2011-02-03 2000-05-19 +S000006836 long_terminal_repeat YCRWdelta9 chromosome 3 3 150220 150551 W 2011-02-03 2000-05-19 Ty1 LTR +S000007429 long_terminal_repeat YCRCtau1 chromosome 3 3 151055 150695 C 2011-02-03 2000-05-19|2008-03-05 Ty4 LTR +S000006615 tRNA_gene tK(CUU)C chromosome 3 L000003757 3 151356 151284 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000035985 noncoding_exon tK(CUU)C 3 151356 151284 C 2011-02-03 2000-05-19 +S000006837 long_terminal_repeat YCRWdelta10 chromosome 3 3 151521 151851 W 2011-02-03 2000-05-19 Ty1 LTR +S000007230 ORF Dubious YCR018C-A chromosome 3 3 151862 151608 C 2011-02-03 1999-07-17 Putative protein of unknown function; encoded opposite a Ty1 LTR +S000036351 CDS YCR018C-A 3 151862 151608 C 2011-02-03 1999-07-17 +S000000612 ORF Verified YCR019W MAK32 chromosome 3 L000000999 3 152837 153928 W 2011-02-03 1997-01-28 Protein necessary for stability of L-A dsRNA-containing particles +S000033899 CDS YCR019W 3 152837 153928 W 2011-02-03 1997-01-28 +S000000613 ORF Verified YCR020C PET18 HIT2 chromosome 3 L000001390 3 154659 154012 C 17 2011-02-03 1997-01-28 Protein of unknown function; has weak similarity to proteins involved in thiamin metabolism; expression is induced in the absence of thiamin +S000033420 CDS YCR020C 3 154659 154012 C 2011-02-03 1997-01-28 +S000000614 ORF Verified YCR020C-A MAK31 NAA38|SMX1|LSM9 chromosome 3 L000000998 3 155096 154830 C 2011-02-03 1997-01-28 Non-catalytic subunit of N-terminal acetyltransferase of the NatC type; required for replication of dsRNA virus; member of the Sm protein family +S000031333 CDS YCR020C-A 3 155096 154830 C 2011-02-03 1997-01-28 +S000006439 ORF Verified YCR020W-B HTL1 chromosome 3 L000004545 3 155320 155556 W 2011-02-03 1999-07-17 Component of the RSC chromatin remodeling complex; RSC functions in transcriptional regulation and elongation, chromosome stability, and establishing sister chromatid cohesion; involved in telomere maintenance +S000033349 CDS YCR020W-B 3 155320 155556 W 2011-02-03 1999-07-17 +S000000615 ORF Verified YCR021C HSP30 YRO1 chromosome 3 L000000818 3 157107 156109 C 2011-02-03 1997-01-28 Negative regulator of the H(+)-ATPase Pma1p; stress-responsive protein; hydrophobic plasma membrane localized; induced by heat shock, ethanol treatment, weak organic acid, glucose limitation, and entry into stationary phase +S000033481 CDS YCR021C 3 157107 156109 C 2011-02-03 1997-01-28 +S000000616 ORF Uncharacterized YCR022C chromosome 3 3 157765 157421 C 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR022C is not an essential gene +S000033548 CDS YCR022C 3 157765 157421 C 2011-02-03 1997-01-28 +S000000617 ORF Verified YCR023C chromosome 3 3 160373 158538 C 2011-02-03 2000-09-13|1997-01-28 Vacuolar membrane protein of unknown function; member of the multidrug resistance family; YCR023C is not an essential gene +S000033605 CDS YCR023C 3 160373 158538 C 2011-02-03 2000-09-13|1997-01-28 +S000000618 ORF Verified YCR024C SLM5 asparagine--tRNA ligase SLM5 chromosome 3 3 162222 160744 C 2011-02-03 2000-09-13|1997-01-28 Mitochondrial asparaginyl-tRNA synthetase +S000034549 CDS YCR024C 3 162222 160744 C 2011-02-03 2000-09-13|1997-01-28 +S000028818 ORF Uncharacterized YCR024C-B chromosome 3 3 162865 162599 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000033627 CDS YCR024C-B 3 162865 162599 C 2011-02-03 2003-07-29 +S000000619 ORF Verified YCR024C-A PMP1 proteolipid ATPase chromosome 3 L000001453 3 163067 162945 C 2011-02-03 1997-01-28 Regulatory subunit for the plasma membrane H(+)-ATPase Pma1p; small single-membrane span proteolipid; forms unique helix and positively charged cytoplasmic domain that is able to specifically segregate phosphatidylserines; PMP1 has a paralog, PMP2, that arose from the whole genome duplication +S000030035 CDS YCR024C-A 3 163067 162945 C 2011-02-03 1997-01-28 +S000000620 ORF Dubious YCR025C chromosome 3 3 163856 163446 C 2011-02-03 2000-09-13|1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YCR025C is not an essential gene +S000034636 CDS YCR025C 3 163856 163446 C 2011-02-03 2000-09-13|1997-01-28 +S000000621 ORF Verified YCR026C NPP1 nucleotide diphosphatase/phosphodiesterase NPP1 chromosome 3 3 166339 164111 C 2011-02-03 2000-09-13|1997-01-28 Nucleotide pyrophosphatase/phosphodiesterase; mediates extracellular nucleotide phosphate hydrolysis along with Npp2p and Pho5p; activity and expression enhanced during conditions of phosphate starvation; involved in spore wall assembly; NPP1 has a paralog, NPP2, that arose from the whole genome duplication, and an npp1 npp2 double mutant exhibits reduced dityrosine fluorescence relative to the single mutants +S000034766 CDS YCR026C 3 166339 164111 C 2011-02-03 2000-09-13|1997-01-28 +S000028487 ARS ARS310 ARS310 chromosome 3 3 166503 167348 2011-02-03 2003-03-31 Compound autonomously replicating sequence on Chromosome III +S000030176 ARS_consensus_sequence ARS310 3 166663 166673 W 2011-02-03 2003-03-31 +S000030177 ARS_consensus_sequence ARS310 3 166710 166700 C 2011-02-03 2003-03-31 +S000030178 ARS_consensus_sequence ARS310 3 166766 166756 C 2011-02-03 2003-03-31 +S000000622 ORF Verified YCR027C RHB1 putative GTPase RHB1|RSG1 chromosome 3 S000007419 3 167999 167370 C 2011-02-03 2000-09-13|1997-01-28 Putative Rheb-related GTPase; involved in regulating canavanine resistance and arginine uptake; member of the Ras superfamily of G-proteins +S000035733 CDS YCR027C 3 167999 167370 C 2011-02-03 2000-09-13|1997-01-28 +S000006692 tRNA_gene tQ(UUG)C chromosome 3 L000003756 3 168372 168301 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000031663 noncoding_exon tQ(UUG)C 3 168372 168301 C 2011-02-03 2000-05-19 +S000006838 long_terminal_repeat YCRWdelta11 chromosome 3 3 169573 169888 W 2011-02-03 2000-05-19 Ty1 LTR +S000000623 ORF Verified YCR028C FEN2 chromosome 3 L000004079 3 172424 170886 C 2011-02-03 2000-09-13|1997-01-28 Plasma membrane H+-pantothenate symporter; confers sensitivity to the antifungal agent fenpropimorph; relocalizes from vacuole to cytoplasm upon DNA replication stress +S000035840 CDS YCR028C 3 172424 170886 C 2011-02-03 2000-09-13|1997-01-28 +S000007222 ORF Verified YCR028C-A RIM1 chromosome 3 L000001640 3 173440 172950 C 2011-02-03 2000-09-13|1999-07-17 ssDNA-binding protein essential for mitochondrial genome maintenance; involved in mitochondrial DNA replication; stimulates utilization by Mip1p DNA polymerase of RNA primers synthesized by Rpo41p +S000030988 CDS YCR028C-A 3 173115 172950 C 2011-02-03 2000-09-13|1999-07-17 +S000030987 CDS YCR028C-A 3 173440 173199 C 2011-02-03 2000-09-13|1999-07-17 +S000030989 intron YCR028C-A 3 173198 173116 C 2011-02-03 2000-09-13|1999-07-17 +S000000626 ORF Verified YCR030C SYP1 YCR029C-A chromosome 3 3 176438 173826 C 2011-02-03 2000-09-13|1997-01-28|1999-07-17 Negative regulator of WASP-Arp23 complex; involved in endocytic site formation; directly inhibits Las17p stimulation of Arp23 complex-mediated actin assembly in vitro; may regulate assembly and disassembly of the septin ring; colocalizes and interacts with septin subunits; potential role in actin cytoskeletal organization +S000036846 CDS YCR030C 3 176438 173826 C 2011-02-03 2000-09-13|1999-07-17|1997-01-28 +S000006456 snoRNA_gene snR65 SNR65 chromosome 3 L000004534 3 177183 177282 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2347 +S000030850 noncoding_exon snR65 3 177183 177282 W 2011-02-03 2000-05-19 +S000000627 ORF Verified YCR031C RPS14A uS11|ribosomal 40S subunit protein S14A|S11|rp59A|S14A|RPL59|CRY1 chromosome 3 L000000423 3 178220 177500 C 26 2011-02-03 2000-09-13|1997-01-28 Protein component of the small (40S) ribosomal subunit; required for ribosome assembly and 20S pre-rRNA processing; mutations confer cryptopleurine resistance; homologous to mammalian ribosomal protein S14 and bacterial S11; RPS14A has a paralog, RPS14B, that arose from the whole genome duplication +S000037573 CDS YCR031C 3 177906 177500 C 2011-02-03 2000-09-13|1997-01-28 +S000037572 CDS YCR031C 3 178220 178214 C 2011-02-03 2000-09-13|1997-01-28 +S000037574 intron YCR031C 3 178213 177907 C 2011-02-03 2000-09-13|1997-01-28 +S000007314 snoRNA_gene snR189 SNR189 chromosome 3 L000001976 3 178798 178610 C 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2735 and small subunit (SSU) rRNA at position U466 +S000030325 noncoding_exon snR189 3 178798 178610 C 2011-02-03 2000-05-19 +S000000628 ORF Verified YCR032W BPH1 chromosome 3 L000003507 3 179520 186023 W 2011-02-03 2000-09-13|1997-01-28 Protein homologous to Chediak-Higashi syndrome and Beige proteins; both of which are implicated in disease syndromes in human and mouse, respectively, due to defective lysosomal trafficking; mutant phenotype and genetic interactions suggest a role in protein sorting +S000037675 CDS YCR032W 3 179520 186023 W 2011-02-03 2000-09-13|1997-01-28 +S000000629 ORF Verified YCR033W SNT1 chromosome 3 3 186489 190169 W 2011-02-03 2000-09-13|1997-01-28 Subunit of the Set3C deacetylase complex; interacts directly with the Set3C subunit, Sif2p; putative DNA-binding protein; mutant has increased aneuploidy tolerance; relocalizes to the cytosol in response to hypoxia +S000037732 CDS YCR033W 3 186489 190169 W 2011-02-03 2000-09-13|1997-01-28 +S000000630 ORF Verified YCR034W ELO2 fatty acid elongase ELO2|FEN1|VBM2|GNS1 chromosome 3 L000003126|L000000608 3 190592 191635 W 24 2011-02-03 1997-01-28 Fatty acid elongase, involved in sphingolipid biosynthesis; acts on fatty acids of up to 24 carbons in length; mutations have regulatory effects on 1,3-beta-glucan synthase, vacuolar ATPase, and the secretory pathway; ELO2 has a paralog, ELO1, that arose from the whole genome duplication; lethality of the elo2 elo3 double null mutation is functionally complemented by human ELOVL1 and weakly complemented by human ELOVL3 or ELOV7 +S000037781 CDS YCR034W 3 190592 191635 W 2011-02-03 1997-01-28 +S000000631 ORF Verified YCR035C RRP43 exosome non-catalytic core subunit RRP43 chromosome 3 L000003552 3 193018 191834 C 2011-02-03 2000-09-13|1997-01-28 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp43p (OIP2, EXOSC8); protein abundance increases in response to DNA replication stress +S000030620 CDS YCR035C 3 193018 191834 C 2011-02-03 2000-09-13|1997-01-28 +S000000632 ORF Verified YCR036W RBK1 putative ribokinase chromosome 3 L000001587 3 193297 194298 W 29 2011-02-03 2000-09-13|1997-01-28 Putative ribokinase +S000030780 CDS YCR036W 3 193297 194298 W 2011-02-03 2000-09-13|1997-01-28 +S000028488 ARS ARS313 ARS313 ARSIII-194 chromosome 3 3 194308 194367 2014-11-18 2003-03-31|2014-11-18|2006-09-06 Autonomously Replicating Sequence on Chromosome III +S000000633 ORF Verified YCR037C PHO87 SPX domain-containing inorganic phosphate transporter chromosome 3 L000002740 3 197185 194414 C 2011-02-03 2000-09-13|1997-01-28 Low-affinity inorganic phosphate (Pi) transporter; acts upstream of Pho81p in regulation of the PHO pathway; expression is independent of Pi concentration and Pho4p activity; contains 12 membrane-spanning segments; PHO87 has a paralog, PHO90, that arose from the whole genome duplication +S000030810 CDS YCR037C 3 197185 194414 C 2011-02-03 2000-09-13|1997-01-28 +S000028489 ARS ARS314 ARS314 ARSIII-198 chromosome 3 3 197460 197598 2014-11-18 2003-03-31|2014-11-18|2006-09-06 Autonomously Replicating Sequence on Chromosome III; active in <10% of cell cycles +S000178056 ARS_consensus_sequence ARS314 3 197552 197536 C 2014-11-18 2014-11-18 +S000029699 mating_type_region MATALPHA MATALPHA MAT chromosome 3 L000001031 3 198671 201177 W 30 2011-02-03 2007-12-10 Mating type locus; note that the systematic sequence in SGD contains MATalpha sequences +S000124947 W_region MATALPHA 3 198671 199400 W 2011-02-03 2007-12-10 +S000124948 X_region MATALPHA 3 199401 200103 W 2011-02-03 2007-12-10 +S000124949 Y_region MATALPHA 3 200104 200850 W 2011-02-03 2007-12-10 +S000124950 Z1_region MATALPHA 3 200851 201089 W 2011-02-03 2007-12-10 +S000124951 Z2_region MATALPHA 3 201090 201177 W 2011-02-03 2007-12-10 +S000007597 ORF Dubious YCR038W-A chromosome 3 3 199293 199418 W 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene BUD5/YCR038C; identified by homology with hemiascomycetous yeast species +S000037143 CDS YCR038W-A 3 199293 199418 W 2011-02-03 2001-02-26 +S000000634 ORF Verified YCR038C BUD5 Ras family guanine nucleotide exchange factor BUD5 chromosome 3 L000000202 3 199549 197621 C 30 2011-02-03 2000-09-13|1997-01-28 GTP/GDP exchange factor for Rsr1p (Bud1p); required for both axial and bipolar budding patterns; mutants exhibit random budding in all cell types +S000031792 CDS YCR038C 3 199549 197621 C 2011-02-03 2000-09-13|1997-01-28 +S000000635 ORF Verified YCR039C MATALPHA2 homeodomain mating type protein alpha2|ALPHA2 chromosome 3 L000002973 3 200178 199546 C 2011-02-03 1997-01-28 Homeobox-domain protein; with Mcm1p, represses a-specific genes in haploids; acts with A1p to repress transcription of haploid-specific genes in diploids; one of two genes encoded by the MATalpha mating type cassette +S000031946 CDS YCR039C 3 200178 199546 C 2011-02-03 1997-01-28 +S000000636 ORF Verified YCR040W MATALPHA1 transcriptional co-activator mating type protein alpha|ALPHA1 chromosome 3 L000002972 3 200442 200969 W 2011-02-03 1997-01-28 Transcriptional co-activator that regulates mating-type-specific genes; targets the transcription factor Mcm1p to the promoters of alpha-specific genes; one of two genes encoded by the MATalpha mating type cassette +S000032771 CDS YCR040W 3 200442 200969 W 2011-02-03 1997-01-28 +S000000637 ORF Verified YCR041W chromosome 3 3 200911 201243 W 2011-02-03 1997-01-28 Protein of unknown function; overexpression suppresses the high-frequency loss of mini-chromosomes, probably by increasing the rate of proper chromosome segregation; translated gene product of YCR041W, but not its transcript, is responsible for suppression; suppression ability of YCR041W is completely dependent on silencing protein Sir4p +S000032864 CDS YCR041W 3 200911 201243 W 2011-02-03 1997-01-28 +S000000638 ORF Verified YCR042C TAF2 TafII150|TSM1|TAF150 chromosome 3 L000002367 3 205397 201174 C 31 2011-02-03 1997-01-28 TFIID subunit (150 kDa); involved in RNA polymerase II transcription initiation +S000032896 CDS YCR042C 3 205397 201174 C 2011-02-03 1997-01-28 +S000000639 ORF Uncharacterized YCR043C chromosome 3 3 206644 206261 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the Golgi apparatus; YCR043C is not an essential gene +S000033005 CDS YCR043C 3 206644 206261 C 2011-02-03 1997-01-28 +S000000640 ORF Verified YCR044C PER1 COS16 chromosome 3 3 207950 206877 C 2011-02-03 1997-01-28 Protein of the endoplasmic reticulum; required for GPI-phospholipase A2 activity that remodels the GPI anchor as a prerequisite for association of GPI-anchored proteins with lipid rafts; functionally complemented by human ortholog PERLD1 +S000033673 CDS YCR044C 3 207950 206877 C 2011-02-03 1997-01-28 +S000028607 ORF Dubious YCR045W-A chromosome 3 3 208751 209101 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with YCR045C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031418 CDS YCR045W-A 3 208751 209101 W 2011-02-03 2003-07-29 +S000000641 ORF Verified YCR045C RRT12 OSW3 chromosome 3 3 209610 208135 C 2011-02-03 1997-01-28 Probable subtilisin-family protease; role in formation of the dityrosine layer of spore walls; localizes to the spore wall and also the nuclear envelope and ER region in mature spores +S000033761 CDS YCR045C 3 209610 208135 C 2011-02-03 1997-01-28 +S000000642 ORF Verified YCR046C IMG1 mitochondrial 54S ribosomal protein IMG1 chromosome 3 L000004445 3 210423 209914 C 2011-02-03 1997-01-28 Mitochondrial ribosomal protein of the large subunit; required for respiration and for maintenance of the mitochondrial genome +S000033858 CDS YCR046C 3 210423 209914 C 2011-02-03 1997-01-28 +S000028608 ORF Dubious YCR047W-A chromosome 3 3 211301 211507 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with YCR047C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031420 CDS YCR047W-A 3 211301 211507 W 2011-02-03 2003-07-29 +S000000643 ORF Verified YCR047C BUD23 18S rRNA (guanine1575-N7)-methyltransferase chromosome 3 3 211545 210718 C 2011-02-03 1997-01-28 Methyltransferase that methylates residue G1575 of 18S rRNA; required for rRNA processing and nuclear export of 40S ribosomal subunits independently of methylation activity; diploid mutant displays random budding pattern; functional homolog of human WBSCR22 +S000034011 CDS YCR047C 3 211545 210718 C 2011-02-03 1997-01-28 +S000000644 ORF Verified YCR048W ARE1 sterol acyltransferase|SAT2 chromosome 3 L000003221|L000002768 3 211929 213761 W 2011-02-03 1997-01-28 Acyl-CoA:sterol acyltransferase; endoplasmic reticulum enzyme that contributes the major sterol esterification activity in the absence of oxygen; ARE1 has a paralog, ARE2, that arose from the whole genome duplication +S000034969 CDS YCR048W 3 211929 213761 W 2011-02-03 1997-01-28 +S000000645 ORF Dubious YCR049C chromosome 3 3 212317 211871 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035033 CDS YCR049C 3 212317 211871 C 2011-02-03 1997-01-28 +S000000646 ORF Uncharacterized YCR050C chromosome 3 3 213772 213464 C 2011-02-03 1997-01-28 Non-essential protein of unknown function; deletion mutant is synthetically sick or lethal with alpha-synuclein +S000036029 CDS YCR050C 3 213772 213464 C 2011-02-03 1997-01-28 +S000000647 ORF Uncharacterized YCR051W chromosome 3 3 214071 214739 W 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; contains ankyrin (Ank) repeats; YCR051W is not an essential gene +S000036913 CDS YCR051W 3 214071 214739 W 2011-02-03 1997-01-28 +S000000648 ORF Verified YCR052W RSC6 chromosome 3 L000003151 3 214994 216445 W 2011-02-03 1997-01-28 Component of the RSC chromatin remodeling complex; essential for mitotic growth; RSC6 has a paralog, SNF12, that arose from the whole genome duplication +S000036966 CDS YCR052W 3 214994 216445 W 2011-02-03 1997-01-28 +S000000649 ORF Verified YCR053W THR4 threonine synthase THR4 chromosome 3 L000002300 3 216697 218241 W 51 2011-02-03 1997-01-28 Threonine synthase; conserved protein that catalyzes formation of threonine from O-phosphohomoserine; expression is regulated by the GCN4-mediated general amino acid control pathway +S000037048 CDS YCR053W 3 216697 218241 W 2011-02-03 1997-01-28 +S000000650 ORF Verified YCR054C CTR86 chromosome 3 L000004071 3 220067 218376 C 2011-02-03 1997-01-28 Essential protein of unknown function; with orthologs in Ashbya gossypii and Candida albicans; similar to human ATXN10, mutations in which cause spinocerebellar ataxia type 10; codon usage corresponds to that observed for yeast genes expressed at low levels; relative distribution to the nucleus increases upon DNA replication stress +S000037070 CDS YCR054C 3 220067 218376 C 2011-02-03 1997-01-28 +S000000653 ORF Verified YCR057C PWP2 snoRNA-binding rRNA-processing protein PWP2|UTP1|YCR058C|YCR055C chromosome 3 L000001540 3 223228 220457 C 2011-02-03 2000-09-13|1997-01-28 Conserved 90S pre-ribosomal component; essential for proper endonucleolytic cleavage of the 35 S rRNA precursor at A0, A1, and A2 sites; contains eight WD-repeats; PWP2 deletion leads to defects in cell cycle and bud morphogenesis +S000029966 CDS YCR057C 3 223228 220457 C 2011-02-03 2000-09-13|1997-01-28 +S000000655 ORF Verified YCR059C YIH1 chromosome 3 3 224230 223454 C 2011-02-03 1997-01-28 Negative regulator of eIF2 kinase Gcn2p; competes with Gcn2p for binding to Gcn1p; may contribute to regulation of translation in response to starvation via regulation of Gcn2p; binds to monomeric actin and to ribosomes and polyribosomes; ortholog of mammalian IMPACT +S000031068 CDS YCR059C 3 224230 223454 C 2011-02-03 1997-01-28 +S000000656 ORF Verified YCR060W TAH1 chromosome 3 3 224399 224734 W 2011-02-03 1997-01-28 Component of conserved R2TP complex (Rvb1-Rvb2-Tah1-Pih1); R2TP complex interacts with Hsp90 (Hsp82p and Hsc82p) to mediate assembly of large protein complexes such as box C/D snoRNPs and RNA polymerase II; contains a single TPR domain with at least two TPR motifs; plays a role in determining prion variants +S000032111 CDS YCR060W 3 224399 224734 W 2011-02-03 1997-01-28 +S000028490 ARS ARS315 ARS315 ARSIII-225 chromosome 3 3 224816 225061 2011-02-03 2003-03-31|2006-09-06 Highly-active autonomously replicating sequence; initiates replication in ~90% of cell cycles +S000178057 ARS_consensus_sequence ARS315 3 224853 224869 W 2014-11-18 2014-11-18 +S000000657 ORF Uncharacterized YCR061W YCR062W chromosome 3 3 225563 227458 W 2011-02-03 2000-09-14|1997-01-28 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000032157 CDS YCR061W 3 225563 227458 W 2011-02-03 2000-09-14|1997-01-28 +S000006730 tRNA_gene tS(CGA)C SUP61 chromosome 3 L000002215|L000003754 3 227942 228042 W 68 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; i6A37 modification is catalyzed by Mod5p; can mutate to suppress amber or ochre nonsense mutations; suppressor mutant alleles are recessive lethal and can only be maintained when an additional wild-type copy of the gene is present, because SUP61 encodes the only tRNA species that can decode UCG codons +S000029830 intron tS(CGA)C 3 227979 227997 W 2011-02-03 2000-05-19 +S000029828 noncoding_exon tS(CGA)C 3 227942 227978 W 2011-02-03 2000-05-19 +S000029829 noncoding_exon tS(CGA)C 3 227998 228042 W 2011-02-03 2000-05-19 +S000000659 ORF Verified YCR063W BUD31 U2 snRNP complex subunit BUD31|CWC14 chromosome 3 3 228318 228791 W 2011-02-03 1997-01-28 Component of the SF3b subcomplex of the U2 snRNP; increases efficiency of first and second step pre-mRNA splicing; diploid mutants display a random budding pattern instead of the wild-type bipolar pattern; facilitates passage through G1/S Start, but is not required for G2/M transition or exit from mitosis +S000033121 CDS YCR063W 3 228318 228791 W 2011-02-03 1997-01-28 +S000000660 ORF Dubious YCR064C chromosome 3 3 228505 228095 C 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene BUD31 +S000033148 CDS YCR064C 3 228505 228095 C 2011-02-03 1997-01-28 +S000000661 ORF Verified YCR065W HCM1 chromosome 3 L000000757 3 229310 231004 W 2011-02-03 2000-09-13|1997-01-28 Forkhead transcription factor; drives S-phase activation of genes involved in chromosome segregation, spindle dynamics, budding; also activates genes involved in respiration, use of alternative energy sources (like proline), NAD synthesis, oxidative stress resistance; key factor in early adaptation to nutrient deficiency and diauxic shift; suppressor of calmodulin mutants with specific SPB assembly defects; ortholog of C. elegans lifespan regulator PHA-4 +S000033238 CDS YCR065W 3 229310 231004 W 2011-02-03 2000-09-13|1997-01-28 +S000000662 ORF Verified YCR066W RAD18 E3 ubiquitin-protein ligase RAD18 chromosome 3 L000001567 3 231500 232963 W 67 2011-02-03 1997-01-28 E3 ubiquitin ligase; forms heterodimer with Rad6p to monoubiquitinate PCNA-K164; heterodimer binds single-stranded DNA and has single-stranded DNA dependent ATPase activity; required for postreplication repair; SUMO-targeted ubiquitin ligase (STUbl) that contains a SUMO-interacting motif (SIM) which stimulates its ubiquitin ligase activity towards the sumoylated form of PCNA +S000033283 CDS YCR066W 3 231500 232963 W 2011-02-03 1997-01-28 +S000000663 ORF Verified YCR067C SED4 chromosome 3 L000001860 3 236322 233125 C 2011-02-03 1997-01-28 Integral ER membrane protein that stimulates Sar1p GTPase activity; involved in COPII vesicle budding through disassociation of coat proteins from membranes onto liposomes; binds Sec16p; SED4 has a paralog, SEC12, that arose from the whole genome duplication +S000033324 CDS YCR067C 3 236322 233125 C 2011-02-03 1997-01-28 +S000000664 ORF Verified YCR068W ATG15 triglyceride lipase ATG15|CVT17|AUT5 chromosome 3 L000004767|L000004751 3 237214 238776 W 2011-02-03 2000-09-13|1997-01-28 Phospholipase; preferentially hydrolyses phosphatidylserine, with minor activity against cardiolipin and phosphatidylethanolamine; required for lysis of autophagic and CVT bodies; targeted to intravacuolar vesicles during autophagy via the multivesicular body (MVB) pathway; required for the maintenance of lipid droplet quantity after the diauxic shift; regulates lipolysis; expression regulated by Yap1p during autophagy +S000034292 CDS YCR068W 3 237214 238776 W 2011-02-03 2000-09-13|1997-01-28 +S000000665 ORF Verified YCR069W CPR4 peptidylprolyl isomerase family protein CPR4|SCC3|YCR070W|CYP4 chromosome 3 L000001804 3 239055 240011 W 2011-02-03 1997-01-28 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; has a potential role in the secretory pathway; CPR4 has a paralog, CPR8, that arose from the whole genome duplication +S000034404 CDS YCR069W 3 239055 240011 W 2011-02-03 1997-01-28 +S000000667 ORF Verified YCR071C IMG2 mitochondrial 54S ribosomal protein IMG2 chromosome 3 L000004446 3 240543 240103 C 2011-02-03 2000-09-13|1997-01-28 Mitochondrial ribosomal protein of the large subunit; conserved in metazoa, with similarity to human mitochondrial ribosomal protein MRPL49 +S000036422 CDS YCR071C 3 240543 240103 C 2011-02-03 2000-09-13|1997-01-28 +S000000668 ORF Verified YCR072C RSA4 chromosome 3 3 242352 240805 C 2011-02-03 2000-09-13|1997-01-28 WD-repeat protein involved in ribosome biogenesis; may interact with ribosomes; required for maturation and efficient intra-nuclear transport or pre-60S ribosomal subunits, localizes to the nucleolus +S000036487 CDS YCR072C 3 242352 240805 C 2011-02-03 2000-09-13|1997-01-28 +S000000669 ORF Verified YCR073C SSK22 mitogen-activated protein kinase kinase kinase SSK22 chromosome 3 L000002827 3 246583 242588 C 2011-02-03 2000-09-13|1997-01-28 MAP kinase kinase kinase of HOG1 mitogen-activated signaling pathway; functionally redundant with Ssk2p; interacts with and is activated by Ssk1p; phosphorylates Pbs2p; SSK22 has a paralog, SSK2, that arose from the whole genome duplication +S000036585 CDS YCR073C 3 246583 242588 C 2011-02-03 2000-09-13|1997-01-28 +S000000718 ORF Verified YCR073W-A SOL2 YCRX13W chromosome 3 L000003116 3 246963 247910 W 2011-02-03 2000-09-13|1997-01-28 Protein with a possible role in tRNA export; shows similarity to 6-phosphogluconolactonase non-catalytic domains but does not exhibit this enzymatic activity; homologous to Sol3p and Sol4p; SOL2 has a paralog, SOL1, that arose from the whole genome duplication +S000032484 CDS YCR073W-A 3 246963 247910 W 2011-02-03 2000-09-13|1997-01-28 +S000000671 ORF Verified YCR075C ERS1 cystinosin-like protein ERS1 chromosome 3 L000000582 3 248815 248033 C 2011-02-03 1997-01-28 Protein involved in cystine transport; localizes to the vacuole, plasma membrane and endosome; similarity to human cystinosin, a H(+)-driven transporter involved in L-cystine export from lysosomes and implicated in the disease cystinosis; contains seven transmembrane domains; mutation is functionally complemented by human CTNS +S000037388 CDS YCR075C 3 248815 248033 C 2011-02-03 1997-01-28 +S000028519 ORF Verified YCR075W-A EGO2 chromosome 3 3 248975 249202 W 2011-02-03 2003-07-29 Component of the EGO and GSE complexes; identified by homology to Ashbya gossypii; YCR075W-A has a paralog, YNR034W-A, that arose from the whole genome duplication +S000030296 CDS YCR075W-A 3 248975 249202 W 2011-02-03 2003-07-29 +S000000672 ORF Verified YCR076C FUB1 chromosome 3 3 250045 249293 C 2011-02-03 1997-01-28 Proteasome-binding protein; interacts physically with multiple subunits of the 20S proteasome and genetically with genes encoding 20S core particle and 19S regulatory particle subunits; exhibits boundary activity which blocks the propagation of heterochromatic silencing; contains a PI31 proteasome regulator domain and sequence similarity with human PSMF1, a proteasome inhibitor; not an essential gene +S000037531 CDS YCR076C 3 250045 249293 C 2011-02-03 1997-01-28 +S000000673 ORF Verified YCR077C PAT1 MRT1 chromosome 3 L000001183|L000003214 3 252628 250238 C 2011-02-03 2000-09-13|1997-01-28|2011-02-03 Deadenylation-dependent mRNA-decapping factor; also required for faithful chromosome transmission, maintenance of rDNA locus stability, and protection of mRNA 3'-UTRs from trimming; associated with topoisomerase II; binds to mRNAs under glucose starvation, most often in the 3' UTR; functionally linked to Pab1p; forms cytoplasmic foci upon DNA replication stress; phosphorylation by PKA inhibits P body foci formation +S000030274 CDS YCR077C 3 252628 250238 C 2011-02-03 2000-09-13|1997-01-28|2011-02-03 +S000002133 ORF Verified YCR079W PTC6 type 2C protein phosphatase PTC6|PPP2|AUP1 chromosome 3 3 252845 254173 W 2011-02-03 2000-09-13|1997-01-28 Mitochondrial type 2C protein phosphatase (PP2C); has similarity to mammalian PP1Ks; involved in mitophagy; null mutant is sensitive to rapamycin and has decreased phosphorylation of the Pda1 subunit of pyruvate dehydrogenase +S000031401 CDS YCR079W 3 252845 254173 W 2011-02-03 2000-09-13|1997-01-28 +S000000677 ORF Verified YCR081W SRB8 MED12|YCR080W|SSN5|NUT6|GIG1 chromosome 3 L000003007 3 254371 258654 W 2011-02-03 2000-09-13|1997-01-28 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; involved in glucose repression +S000031712 CDS YCR081W 3 254371 258654 W 2011-02-03 2000-09-13|1997-01-28 +S000028609 ORF Dubious YCR081C-A chromosome 3 3 258651 258415 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with SRB8/YCR081W; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031422 CDS YCR081C-A 3 258651 258415 C 2011-02-03 2003-07-29 +S000000678 ORF Verified YCR082W AHC2 chromosome 3 3 258883 259269 W 2011-02-03 1997-01-28 Component of the ADA histone acetyltransferase complex; Ahc2p and Ahc1p are unique to the ADA complex and not shared with the related SAGA and SLIK complexes; may tether Ahc1p to the complex +S000031866 CDS YCR082W 3 258883 259269 W 2011-02-03 1997-01-28 +S000000679 ORF Verified YCR083W TRX3 chromosome 3 3 259578 259961 W 2011-02-03 1997-01-28 Mitochondrial thioredoxin; highly conserved oxidoreductase required to maintain the redox homeostasis of the cell, forms the mitochondrial thioredoxin system with Trr2p, redox state is maintained by both Trr2p and Glr1p +S000031961 CDS YCR083W 3 259578 259961 W 2011-02-03 1997-01-28 +S000000680 ORF Verified YCR084C TUP1 chromatin-silencing transcriptional regulator TUP1|UMR7|SFL2|ROX4|FLK1|CYC9|CRT4|AMM1|AER2|AAR1 chromosome 3 L000002391 3 262452 260311 C 77 2011-02-03 1997-01-28 General repressor of transcription; forms complex with Cyc8p, involved in the establishment of repressive chromatin structure through interactions with histones H3 and H4, appears to enhance expression of some genes +S000032798 CDS YCR084C 3 262452 260311 C 2011-02-03 1997-01-28 +S000000681 ORF Uncharacterized YCR085W chromosome 3 3 262916 263269 W 2011-02-03 1997-01-28 Putative protein of unknown function; conserved among S. cerevisiae strains; YCR085W is not an essential gene +S000032982 CDS YCR085W 3 262916 263269 W 2011-02-03 1997-01-28 +S000000682 ORF Verified YCR086W CSM1 chromosome 3 S000007653 3 263392 263964 W 2011-02-03 1997-01-28 Nucleolar protein that mediates homolog segregation during meiosis I; forms a complex with Lrs4p and then Mam1p at kinetochores; required for condensin recruitment to the replication fork barrier site and rDNA repeat segregation +S000033051 CDS YCR086W 3 263392 263964 W 2011-02-03 1997-01-28 +S000000683 ORF Dubious YCR087W chromosome 3 3 263976 264491 W 2011-02-03 1997-01-28 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized gene YCR087C-A; YCR087W is not an essential gene +S000033786 CDS YCR087W 3 263976 264491 W 2011-02-03 1997-01-28 +S000007223 ORF Uncharacterized YCR087C-A LUG1 chromosome 3 3 264467 264006 C 2011-02-03 1999-07-17 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; YCR087C-A is not an essential gene +S000034092 CDS YCR087C-A 3 264467 264006 C 2011-02-03 1999-07-17 +S000000684 ORF Verified YCR088W ABP1 chromosome 3 L000000013 3 265068 266846 W 80 2011-02-03 1997-01-28 Actin-binding protein of the cortical actin cytoskeleton; important for activation of the Arp2/3 complex that plays a key role actin in cytoskeleton organization; inhibits barbed-end actin filament elongation; phosphorylation within its Proline-Rich Regio, mediated by Cdc28p and Pho85p, protects Abp1p from proteolysis mediated by its own PEST sequences; mammalian homolog of HIP-55 (hematopoietic progenitor kinase 1 [HPK1]-interacting protein of 55 kDa) +S000033904 CDS YCR088W 3 265068 266846 W 2011-02-03 1997-01-28 +S000000685 ORF Verified YCR089W FIG2 chromosome 3 L000003312 3 267434 272263 W 2011-02-03 2000-09-13|1997-01-28 Cell wall adhesin, expressed specifically during mating; may be involved in maintenance of cell wall integrity during mating; FIG2 has a paralog, AGA1, that arose from the whole genome duplication +S000034060 CDS YCR089W 3 267434 272263 W 2011-02-03 2000-09-13|1997-01-28 +S000028491 ARS ARS316 ARS316 ARSIII-273 chromosome 3 3 272852 273095 2011-02-03 2003-03-31|2006-09-06 Inefficient autonomously replicating sequence; active in ~25% of cell cycles +S000178058 ARS_consensus_sequence ARS316 3 273024 273008 C 2014-11-18 2014-11-18 +S000000686 ORF Uncharacterized YCR090C chromosome 3 3 272863 272315 C 2011-02-03 1997-01-28 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YCR090C is not an essential gene +S000036138 CDS YCR090C 3 272863 272315 C 2011-02-03 1997-01-28 +S000000687 ORF Verified YCR091W KIN82 putative serine/threonine protein kinase KIN82|FPK2 chromosome 3 L000000906 3 274404 276566 W 2011-02-03 2000-09-13|1997-01-28|2011-02-03 Putative serine/threonine protein kinase; implicated in the regulation of phospholipid asymmetry through the activation of phospholipid translocases (flippases); involved in the phosphorylation of upstream inhibitory kinase Ypk1p along with Fpk1p; has a redundant role in the cellular response to mating pheromone; KIN82 has a paralog, FPK1, that arose from the whole genome duplication +S000036298 CDS YCR091W 3 274404 276566 W 2011-02-03 2000-09-13|1997-01-28|2011-02-03 +S000000688 ORF Verified YCR092C MSH3 mismatch repair protein MSH3 chromosome 3 L000001191 3 279820 276764 C 2011-02-03 2007-09-06|1997-01-28 Mismatch repair protein; forms dimers with Msh2p that mediate repair of insertion or deletion mutations and removal of nonhomologous DNA ends, contains a PCNA (Pol30p) binding motif required for genome stability +S000036361 CDS YCR092C 3 279820 276764 C 2011-02-03 1997-01-28|2007-09-06 +S000000689 ORF Verified YCR093W CDC39 CCR4-NOT core subunit CDC39|SMD6|ROS1|NOT1 chromosome 3 L000000274 3 280117 286443 W 91 2011-02-03 2000-09-13|1997-01-28 Subunit of the CCR4-NOT1 core complex; this complex has multiple roles in the regulation of mRNA levels including regulation of transcription and destabilization of mRNA by deadenylation; basal transcription factor that increases initiation and elongation; activates the ATPase activity of Dhh1p, resulting in processing body disassembly +S000037049 CDS YCR093W 3 280117 286443 W 2011-02-03 2000-09-13|1997-01-28 +S000000690 ORF Verified YCR094W CDC50 aminophospholipid translocase regulatory protein CDC50 chromosome 3 L000004326 3 286762 287937 W 2011-02-03 1997-01-28 Endosomal protein that interacts with phospholipid flippase Drs2p; interaction with Cdc50p is essential for Drs2p catalytic activity; mutations affect cell polarity and polarized growth; similar to Lem3p; CDC50 has a paralog, YNR048W, that arose from the whole genome duplication +S000037156 CDS YCR094W 3 286762 287937 W 2011-02-03 1997-01-28 +S000000691 ORF Uncharacterized YCR095C OCA4 chromosome 3 3 289258 288170 C 2011-02-03 1997-01-28 Cytoplasmic protein required for replication of Brome mosaic virus; S. cerevisiae is a model system for studying replication of positive-strand RNA viruses in their natural hosts +S000037199 CDS YCR095C 3 289258 288170 C 2011-02-03 1997-01-28 +S000029724 ORF Uncharacterized YCR095W-A chromosome 3 3 289639 289797 W 2011-02-03 2004-08-27 Putative protein of unknown function +S000036860 CDS YCR095W-A 3 289639 289797 W 2011-02-03 2004-08-27 +S000006839 long_terminal_repeat YCRWdelta12 chromosome 3 3 291373 291712 W 2011-02-03 2000-05-19 Ty1 LTR +S000006841 long_terminal_repeat YCRWomega3 chromosome 3 3 291922 292167 W 2011-02-03 2000-05-19 Ty5 LTR +S000029655 silent_mating_type_cassette_array silenced_gene HMR HMR chromosome 3 L000000792 3 292388 295034 W 94 2011-02-03 2007-12-10 Mating-type cassette - right; unexpressed complete copy of the mating-type genes, silenced by the Sir2 histone deacetylase and its associated SIR1, SIR3 and SIR4 proteins; mating-type switching involves replacement of the Ya or Yalpha sequences present at the MAT locus with either the a or alpha genes located at one of the HM loci in a process stimulated by the HO endonuclease; sequence replacement occurs by gene conversion, leaving the donor unaltered +S000124952 X_region HMR 3 293032 293736 W 2011-02-03 2007-12-10 +S000124953 Y_region HMR 3 293737 294378 W 2011-02-03 2007-12-10 +S000124954 Z1_region HMR 3 294379 294617 W 2011-02-03 2007-12-10 +S000028492 ARS ARS317 ARS317 HMR-E ARS chromosome 3 3 292638 292694 2014-11-18 2003-03-31|2014-11-18 ARS that fires extremely inefficiently and late during S phase; fires late and inefficiently compared to other origins in the genome; active in only a small fraction of cell cycles +S000121225 ARS_consensus_sequence ARS317 3 292684 292674 C 2011-02-03 2007-03-06 +S000000692 ORF Verified|silenced_gene YCR096C HMRA2 homeodomain mating type protein a2|A2 chromosome 3 3 293538 293179 C 2011-02-03 1997-01-28 Silenced copy of a2 at HMR; similarity to Alpha2p; required along with a1p for inhibiting expression of the HO endonuclease in a/alpha HO/HO diploid cells with an active mating-type interconversion system +S000037309 CDS YCR096C 3 293538 293179 C 2011-02-03 1997-01-28 +S000000694 ORF Verified|silenced_gene YCR097W HMRA1 YCR097WB chromosome 3 S000007657 3 293835 294321 W 2011-02-03 1997-01-28 Silenced copy of a1 at HMR; homeobox corepressor that interacts with Alpha2p to repress haploid-specific gene transcription in diploid cells +S000030021 CDS YCR097W 3 293835 293939 W 2011-02-03 1997-01-28 +S000030022 CDS YCR097W 3 293994 294239 W 2011-02-03 1997-01-28 +S000030023 CDS YCR097W 3 294292 294321 W 2011-02-03 1997-01-28 +S000030024 intron YCR097W 3 293940 293993 W 2011-02-03 1997-01-28 +S000030025 intron YCR097W 3 294240 294291 W 2011-02-03 1997-01-28 +S000007632 ORF Dubious YCR097W-A chromosome 3 3 294439 294705 W 2011-02-03 2000-07-12 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by homology to a hemiascomycetous yeast protein +S000036353 CDS YCR097W-A 3 294439 294705 W 2011-02-03 2000-07-12 +S000028493 ARS ARS318 ARS318 HMR-I ARS chromosome 3 3 294820 294901 2014-11-18 2003-03-31|2014-11-18 ARS that becomes active if the nearby ARS317/HMR-E silencer is deleted; active in only a small fraction of cell cycles +S000030213 ARS_consensus_sequence ARS318 3 294824 294834 W 2011-02-03 2003-03-31|2009-02-19 +S000006840 long_terminal_repeat YCRWdelta13 chromosome 3 3 295003 295330 W 2011-02-03 2000-05-19 Ty1 LTR +S000006738 tRNA_gene tT(AGU)C chromosome 3 L000003755 3 295484 295556 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000032149 noncoding_exon tT(AGU)C 3 295484 295556 W 2011-02-03 2000-05-19 +S000006834 long_terminal_repeat YCRCdelta14 chromosome 3 3 296190 295958 C 2011-02-03 2000-05-19|2007-04-02 Ty1 LTR +S000000695 ORF Verified YCR098C GIT1 chromosome 3 L000003211 3 298605 297049 C 2011-02-03 1997-01-28 Plasma membrane permease; mediates uptake of glycerophosphoinositol and glycerophosphocholine as sources of the nutrients inositol and phosphate; expression and transport rate are regulated by phosphate and inositol availability +S000030063 CDS YCR098C 3 298605 297049 C 2011-02-03 1997-01-28 +S000000696 ORF Uncharacterized YCR099C chromosome 3 3 301299 300832 C 2011-02-03 1997-01-28 Putative protein of unknown function +S000031088 CDS YCR099C 3 301299 300832 C 2011-02-03 1997-01-28 +S000000697 ORF Uncharacterized YCR100C chromosome 3 3 302221 301271 C 2011-02-03 1997-01-28 Putative protein of unknown function +S000036663 CDS YCR100C 3 302221 301271 C 2011-02-03 1997-01-28 +S000000698 ORF Uncharacterized YCR101C chromosome 3 3 303030 302482 C 2011-02-03 1997-01-28 Putative protein of unknown function; localizes to the membrane fraction; YCR101C is not an essential gene +S000036721 CDS YCR101C 3 303030 302482 C 2011-02-03 1997-01-28 +S000000699 ORF Uncharacterized YCR102C chromosome 3 3 305467 304361 C 2011-02-03 1997-01-28 Putative protein of unknown function; involved in copper metabolism; similar to C. carbonum toxD gene; member of the quinone oxidoreductase family +S000036781 CDS YCR102C 3 305467 304361 C 2011-02-03 1997-01-28 +S000007231 ORF Dubious YCR102W-A chromosome 3 3 306735 306932 W 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037829 CDS YCR102W-A 3 306735 306932 W 2011-02-03 1999-07-17 +S000000701 ORF Verified YCR104W PAU3 seripauperin PAU3 chromosome 3 L000002739 3 307801 308175 W 2011-02-03 1997-01-28 Member of the seripauperin multigene family; encoded mainly in subtelomeric region; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme +S000037613 CDS YCR104W 3 307801 308175 W 2011-02-03 1997-01-28 +S000000702 ORF Verified YCR105W ADH7 NADP-dependent alcohol dehydrogenase|ADHVII chromosome 3 3 309070 310155 W 2011-02-03 1997-01-28 NADPH-dependent medium chain alcohol dehydrogenase; has broad substrate specificity; member of the cinnamyl family of alcohol dehydrogenases; may be involved in fusel alcohol synthesis or in aldehyde tolerance +S000037676 CDS YCR105W 3 309070 310155 W 2011-02-03 1997-01-28 +S000000703 ORF Verified YCR106W RDS1 chromosome 3 3 310958 313456 W 2011-02-03 1997-01-28 Putative zinc cluster transcription factor; involved in conferring resistance to cycloheximide +S000037733 CDS YCR106W 3 310958 313456 W 2011-02-03 1997-01-28 +S000000704 ORF Verified YCR107W AAD3 putative aryl-alcohol dehydrogenase chromosome 3 L000004636 3 313890 314981 W 2011-02-03 2000-09-13|1997-01-28 Putative aryl-alcohol dehydrogenase; similar to P. chrysosporium aryl-alcohol dehydrogenase; mutational analysis has not yet revealed a physiological role; AAD3 has a paralog, AAD15, that arose from a segmental duplication; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family +S000037782 CDS YCR107W 3 313890 314981 W 2011-02-03 2000-09-13|1997-01-28 +S000028944 telomere TEL03R chromosome 3 3 315783 316620 W 102 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome III; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028945 telomeric_repeat TEL03R 3 316522 316620 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome III +S000028946 X_element TEL03R 3 315783 316239 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome III; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YCR108C +S000028947 X_element_combinatorial_repeat TEL03R 3 316240 316521 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr III; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000028494 ARS ARS319 ARS319 chromosome 3 3 315807 315879 2014-11-18 2003-03-31|2014-11-18 Highly-active subtelomeric autonomously replicating sequence; initiates replication in ~90% of cell cycles +S000030215 ARS_consensus_sequence ARS319 3 315821 315831 W 2011-02-03 2003-03-31 +S000028536 ORF Uncharacterized YCR108C chromosome 3 3 316188 315997 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031145 CDS YCR108C 3 316188 315997 C 2011-02-03 2003-07-29 +S000121226 ARS ARS400 ARSIV-1 chromosome 4 4 137 1392 2007-03-06 2007-03-06 Autonomously Replicating Sequence +S000178059 ARS_consensus_sequence ARS400 4 869 853 C 2014-11-18 2014-11-18 +S000028875 telomere TEL04L chromosome 4 4 904 1 C -153 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome IV; composed of an X element core sequence, X element combinatorial repeats, and a terminal stretch of telomeric repeats +S000028876 telomeric_repeat TEL04L 4 154 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome IV +S000028877 X_element TEL04L 4 904 435 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome IV; spans 469 bp and contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028878 X_element_combinatorial_repeat TEL04L 4 434 155 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr IV; spans 279 bp and contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000002407 ORF Verified YDL248W COS7 chromosome 4 L000004065 4 1802 2953 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000036145 CDS YDL248W 4 1802 2953 W 1996-07-31 1996-07-31 +S000007602 ORF Dubious YDL247W-A chromosome 4 4 3762 3836 W 2001-02-26 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by sequence comparison with hemiascomycetous yeast species +S000037148 CDS YDL247W-A 4 3762 3836 W 2001-02-26 2001-02-26 +S000002406 ORF Verified YDL247W MPH2 alpha-glucoside permease chromosome 4 4 5985 7814 W 1996-07-31 1996-07-31 Alpha-glucoside permease; transports maltose, maltotriose, alpha-methylglucoside, and turanose; almost identical to Mph3p; encoded in a subtelomeric position in a region likely to have undergone duplication +S000035265 CDS YDL247W 4 5985 7814 W 1996-07-31 1996-07-31 +S000002405 ORF Verified YDL246C SOR2 L-iditol 2-dehydrogenase SOR2 chromosome 4 4 9756 8683 C 1996-07-31 1996-07-31 Sorbitol dehydrogenase; protein sequence is 99% identical to the Sor1p sorbitol dehydrogenase +S000035109 CDS YDL246C 4 9756 8683 C 1996-07-31 1996-07-31 +S000002404 ORF Verified YDL245C HXT15 HLT2|hexose transporter HXT15 chromosome 4 L000002986 4 13360 11657 C 1996-07-31 1996-07-31 Putative transmembrane polyol transporter; supports growth on and uptake of mannitol, sorbitol and xylitol with moderate affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; similarity to hexose transporters; expression is induced by low levels of glucose and repressed by high levels of glucose +S000035017 CDS YDL245C 4 13360 11657 C 1996-07-31 1996-07-31 +S000118427 ARS ARS403 ARSIV-16 chromosome 4 4 15493 15739 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178060 ARS_consensus_sequence ARS403 4 15682 15666 C 2014-11-18 2014-11-18 +S000002403 ORF Verified YDL244W THI13 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 4 S000007414 4 16204 17226 W 1996-07-31 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP +S000034919 CDS YDL244W 4 16204 17226 W 1996-07-31 1996-07-31 +S000002402 ORF Verified YDL243C AAD4 putative aryl-alcohol dehydrogenase chromosome 4 L000004637 4 18566 17577 C 1996-07-31 1996-07-31 Putative aryl-alcohol dehydrogenase; involved in oxidative stress response; similar to P. chrysosporium aryl-alcohol dehydrogenase; expression induced in cells treated with the mycotoxin patulin; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family +S000032895 CDS YDL243C 4 18566 17577 C 1996-07-31 1996-07-31 +S000002401 ORF Dubious YDL242W chromosome 4 4 18959 19312 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032853 CDS YDL242W 4 18959 19312 W 1996-07-31 1996-07-31 +S000002400 ORF Uncharacterized YDL241W chromosome 4 4 20635 21006 W 1996-07-31 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YDL241W is not an essential gene +S000032761 CDS YDL241W 4 20635 21006 W 1996-07-31 1996-07-31 +S000007601 ORF Dubious YDL240C-A chromosome 4 4 22608 22471 C 2001-02-26 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by sequence comparison with hemiascomycetous yeast species +S000037147 CDS YDL240C-A 4 22608 22471 C 2001-02-26 2001-02-26 +S000002399 ORF Verified YDL240W LRG1 chromosome 4 L000000953 4 22823 25876 W 1996-07-31 1996-07-31|2011-02-03 GTPase-activating protein (GAP); contains Rho1p-specific GAP activity, interacting with activated forms of Rho1p; functions along with Sac7p as a negative regulator of the Pkc1p-mediated cell wall integrity signaling pathway; negative regulator of cell wall 1,3-beta-glucan biosynthesis; required for efficient cell fusion; contains a RhoGAP domain and three Lin-11-Isl1-Mec-3 (LIM) domains +S000032681 CDS YDL240W 4 22823 25876 W 1996-07-31 1996-07-31|2011-02-03 +S000002398 ORF Verified YDL239C ADY3 chromosome 4 4 28775 26403 C 1996-07-31 1996-07-31|2011-02-03 Protein required for spore wall formation; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane during meiosis II; mediates assembly of the LEP complex, formation of the ring-like structure via interaction with spindle pole body components and prospore membrane maturation; potentially phosphorylated by Cdc28p; ADY3 has a paralog, CNM67, that arose from the whole +S000032048 CDS YDL239C 4 28775 26403 C 1996-07-31 1996-07-31|2011-02-03 +S000002397 ORF Verified YDL238C GUD1 guanine deaminase chromosome 4 4 30454 28985 C 1996-07-31 1996-07-31 Guanine deaminase; a catabolic enzyme of the guanine salvage pathway producing xanthine and ammonia from guanine; activity is low in exponentially-growing cultures but expression is increased in post-diauxic and stationary-phase cultures +S000031892 CDS YDL238C 4 30454 28985 C 1996-07-31 1996-07-31 +S000002396 ORF Verified YDL237W AIM6 LRC1 chromosome 4 4 30657 31829 W 1996-07-31 1996-07-31|2011-02-03 Protein of unknown function; required for respiratory growth; YDL237W is not an essential gene +S000031783 CDS YDL237W 4 30657 31829 W 1996-07-31 1996-07-31|2011-02-03 +S000002395 ORF Verified YDL236W PHO13 4-nitrophenylphosphatase chromosome 4 L000001425 4 32296 33234 W 1996-07-31 1996-07-31 Conserved phosphatase acting as a metabolite repair enzyme; shows specific dephosphorylating activity on two side-products of central carbohydrate metabolism, 2-phosphoglycolate and 4-phosphoerythronate; alkaline phosphatase specific for p-nitrophenyl phosphate; also has protein phosphatase activity; human ortholog PGP shows similar substrate specificity, deletion causes similar metabolite accumulation phenotypes, suggesting conserved role in eliminating glycolytic byproducts +S000030827 CDS YDL236W 4 32296 33234 W 1996-07-31 1996-07-31 +S000002394 ORF Verified YDL235C YPD1 chromosome 4 L000003285 4 33918 33415 C 1996-07-31 1996-07-31 Osmotic stress-responsive phosphorelay intermediate sensor protein; phosphorylated by the plasma membrane sensor Sln1p in response to osmotic stress and then in turn phosphorylates the response regulators Ssk1p in the cytosol and Skn7p in the nucleus +S000030691 CDS YDL235C 4 33918 33415 C 1996-07-31 1996-07-31 +S000002393 ORF Verified YDL234C GYP7 chromosome 4 L000003067 4 36477 34237 C 2011-02-03 1996-07-31 GTPase-activating protein for yeast Rab family members; members include Ypt7p (most effective), Ypt1p, Ypt31p, and Ypt32p (in vitro); involved in vesicle mediated protein trafficking; contains a PH-like domain +S000036775 CDS YDL234C 4 36477 34237 C 2011-02-03 1996-07-31 +S000002392 ORF Uncharacterized YDL233W MFG1 chromosome 4 4 36797 38173 W 2011-02-03 1996-07-31 Regulator of filamentous growth; interacts with FLO11 promoter and regulates FLO11 expression; binds to transcription factors Flo8p and Mss11p; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; YDL233W is not an essential gene +S000036757 CDS YDL233W 4 36797 38173 W 2011-02-03 1996-07-31 +S000002391 ORF Verified YDL232W OST4 olichyl-diphosphooligosaccharide--protein glycotransferase OST4 chromosome 4 L000003180 4 38487 38597 W 2011-02-03 1996-07-31 Subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes protein asparagine-linked glycosylation; type I membrane protein required for incorporation of Ost3p or Ost6p into the OST complex +S000036662 CDS YDL232W 4 38487 38597 W 2011-02-03 1996-07-31 +S000002390 ORF Verified YDL231C BRE4 chromosome 4 4 42244 38867 C 2011-02-03 1996-07-31 Zinc finger protein containing five transmembrane domains; null mutant exhibits strongly fragmented vacuoles and sensitivity to brefeldin A, a drug which is known to affect intracellular transport +S000036514 CDS YDL231C 4 42244 38867 C 2011-02-03 1996-07-31 +S000002389 ORF Verified YDL230W PTP1 tyrosine protein phosphatase PTP1 chromosome 4 L000001525 4 42700 43707 W 2011-02-03 1996-07-31 Phosphotyrosine-specific protein phosphatase; dephosphorylates a broad range of substrates in vivo, including Fpr3p; localized to the cytoplasm and the mitochondria; proposed to be a negative regulator of filamentation +S000036498 CDS YDL230W 4 42700 43707 W 2011-02-03 1996-07-31 +S000002388 ORF Verified YDL229W SSB1 Hsp70 family ATPase SSB1|YG101 chromosome 4 L000002073|L000002508 4 44065 45906 W -129 2011-02-03 1996-07-31 Cytoplasmic ATPase that is a ribosome-associated molecular chaperone; functions with J-protein partner Zuo1p; may be involved in folding of newly-made polypeptide chains; member of the HSP70 family; interacts with phosphatase subunit Reg1p; SSB1 has a paralog, SSB2, that arose from the whole genome duplication +S000035996 CDS YDL229W 4 44065 45906 W 2011-02-03 1996-07-31 +S000002387 ORF Dubious YDL228C chromosome 4 4 45918 45277 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps the verified gene SSB1 +S000035797 CDS YDL228C 4 45918 45277 C 2011-02-03 1996-07-31 +S000114787 ARS ARS404 ARS404 HO ARS chromosome 4 4 46185 46237 2014-11-18 2014-11-18|2006-04-10 Autonomously Replicating Sequence +S000121227 ARS_consensus_sequence ARS404 4 46230 46214 C 2014-11-18 2014-11-18|2007-03-06 +S000002386 ORF Verified YDL227C HO chromosome 4 L000000796 4 48031 46271 C -130 2011-02-03 1996-07-31 Site-specific endonuclease; required for gene conversion at the MAT locus (homothallic switching) through the generation of a ds DNA break; expression restricted to mother cells in late G1 as controlled by Swi4p-Swi6p, Swi5p, and Ash1p +S000035713 CDS YDL227C 4 48031 46271 C 2011-02-03 1996-07-31 +S000002385 ORF Verified YDL226C GCS1 chromosome 4 L000000693 4 52173 51115 C 2011-02-03 1996-07-31 ADP-ribosylation factor GTPase activating protein (ARF GAP); involved in ER-Golgi transport; required for prospore membrane formation; regulates phospholipase Spo14p; shares functional similarity with Glo3p; GCS1 has a paralog, SPS18, that arose from the whole genome duplication +S000035648 CDS YDL226C 4 52173 51115 C 2011-02-03 1996-07-31 +S000002384 ORF Verified YDL225W SHS1 septin SHS1|SEP7 chromosome 4 4 52445 54100 W 2011-02-03 1996-07-31 Component of the septin ring that is required for cytokinesis; present at the ends of rod-like septin hetero-oligomers; C-terminal extension is important for recruitment of Bni5p to the mother-bud neck, which in turn is required for Myo1p recruitment and cytokinesis; undergoes sumoylation and phosphorylation during mitosis; protein abundance increases in response to DNA replication stress +S000035638 CDS YDL225W 4 52445 54100 W 2011-02-03 1996-07-31 +S000002383 ORF Verified YDL224C WHI4 chromosome 4 L000004493 4 56346 54397 C 2011-02-03 1996-07-31 Putative RNA binding protein; regulates the cell size requirement for passage through Start and commitment to cell division; WHI4 has a paralog, WHI3, that arose from the whole genome duplication +S000034657 CDS YDL224C 4 56346 54397 C 2011-02-03 1996-07-31 +S000002382 ORF Verified YDL223C HBT1 chromosome 4 S000007655 4 60405 57265 C 2011-02-03 1996-07-31 Shmoo tip protein, substrate of Hub1p ubiquitin-like protein; mutants are defective for mating projection formation, thereby implicating Hbt1p in polarized cell morphogenesis; HBT1 has a paralog, YNL195C, that arose from the whole genome duplication +S000034598 CDS YDL223C 4 60405 57265 C 2011-02-03 1996-07-31 +S000002381 ORF Verified YDL222C FMP45 chromosome 4 4 61801 60872 C 2011-02-03 1996-07-31 Integral membrane protein localized to mitochondria; required for sporulation and maintaining sphingolipid content; similar to SUR7; FMP45 has a paralog, YNL194C, that arose from the whole genome duplication +S000034458 CDS YDL222C 4 61801 60872 C 2011-02-03 1996-07-31 +S000002380 ORF Dubious YDL221W chromosome 4 4 62011 62562 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the 3' end of essential gene CDC13 +S000034428 CDS YDL221W 4 62011 62562 W 2011-02-03 1996-07-31 +S000002379 ORF Verified YDL220C CDC13 telomere-binding protein CDC13|EST4 chromosome 4 L000000253 4 65018 62244 C -122 2011-02-03 1996-07-31 Single stranded DNA-binding protein found at TG1-3 telomere G-tails; key roles in regulation of telomerase, telomere end protection, conventional telomere replication; regulates telomere replication through recruitment of specific sub-complexes, essential function is telomere capping; forms homodimer via N-terminus; disruption of dimerization leads to short telomeres; autophagy and proteasome are involved in Cdc13p degradation; differentially phosphorylated through cell cycle +S000032343 CDS YDL220C 4 65018 62244 C 2011-02-03 1996-07-31 +S000002378 ORF Verified YDL219W DTD1 D-tyrosyl-tRNA(Tyr) deacylase chromosome 4 4 65242 65765 W 2011-02-03 1996-07-31 D-Tyr-tRNA(Tyr) deacylase; functions in protein translation, may affect nonsense suppression via alteration of the protein synthesis machinery; ubiquitous among eukaryotes +S000032532 CDS YDL219W 4 65242 65306 W 2011-02-03 1996-07-31 +S000032533 CDS YDL219W 4 65378 65765 W 2011-02-03 1996-07-31 +S000032534 intron YDL219W 4 65307 65377 W 2011-02-03 1996-07-31 +S000002377 ORF Uncharacterized YDL218W chromosome 4 4 66493 67446 W 2011-02-03 1996-07-31 Putative protein of unknown function; YDL218W transcription is regulated by Azf1p and induced by starvation and aerobic conditions; expression also induced in cells treated with the mycotoxin patulin +S000031549 CDS YDL218W 4 66493 67446 W 2011-02-03 1996-07-31 +S000002376 ORF Verified YDL217C TIM22 translocation channel protein TIM22 chromosome 4 L000004157 4 68606 67983 C 2011-02-03 1996-07-31 Essential core component of the mitochondrial TIM22 complex; involved in insertion of polytopic proteins into the inner membrane; forms the channel through which proteins are imported +S000031465 CDS YDL217C 4 68606 67983 C 2011-02-03 1996-07-31 +S000002375 ORF Verified YDL216C RRI1 COP9 signalosome catalytic subunit RRI1|JAB1|CSN5 chromosome 4 S000007574 4 70319 68997 C 2011-02-03 1996-07-31|2006-04-13 Catalytic subunit of the COP9 signalosome (CSN) complex; acts as an isopeptidase in cleaving the ubiquitin-like protein Nedd8 from SCF ubiquitin ligases; metalloendopeptidase involved in the adaptation to pheromone signaling; involved in modulation of genes controlling amino acid and lipid metabolism, and ergosterol biosynthesis +S000031346 CDS YDL216C 4 70319 68997 C 2011-02-03 1996-07-31|2006-04-13 +S000002374 ORF Verified YDL215C GDH2 glutamate dehydrogenase (NAD(+))|GDHB|GDH-B chromosome 4 L000000697 4 73918 70640 C 2011-02-03 1996-07-31 NAD(+)-dependent glutamate dehydrogenase; degrades glutamate to ammonia and alpha-ketoglutarate; expression sensitive to nitrogen catabolite repression and intracellular ammonia levels; genetically interacts with GDH3 by suppressing stress-induced apoptosis +S000031302 CDS YDL215C 4 73918 70640 C 2011-02-03 1996-07-31 +S000002373 ORF Verified YDL214C PRR2 serine/threonine protein kinase PRR2 chromosome 4 4 76545 74446 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; inhibits pheromone induced signalling downstream of MAPK, possibly at the level of the Ste12p transcription factor; mutant has increased aneuploidy tolerance; PRR2 has a paralog, NPR1, that arose from the whole genome duplication +S000030339 CDS YDL214C 4 76545 74446 C 2011-02-03 1996-07-31 +S000002372 ORF Verified YDL213C NOP6 chromosome 4 4 77966 77289 C 2011-02-03 1996-07-31 rRNA-binding protein required for 40S ribosomal subunit biogenesis; contains an RNA recognition motif (RRM); hydrophilin essential to overcome the stress of the desiccation-rehydration process; NOP6 may be a fungal-specific gene as no homologs have been yet identified in higher eukaryotes +S000030227 CDS YDL213C 4 77966 77289 C 2011-02-03 1996-07-31 +S000002371 ORF Verified YDL212W SHR3 APF1 chromosome 4 L000001885 4 78426 79058 W 2011-02-03 1996-07-31 Endoplasmic reticulum packaging chaperone; required for incorporation of amino acid permeases into COPII coated vesicles for transport to the cell surface +S000030170 CDS YDL212W 4 78426 79058 W 2011-02-03 1996-07-31 +S000002370 ORF Uncharacterized YDL211C chromosome 4 4 80412 79294 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; YDL211C has a paralog, TDA7, that arose from the whole genome duplication +S000036399 CDS YDL211C 4 80412 79294 C 2011-02-03 1996-07-31 +S000006576 tRNA_gene tG(GCC)D1 chromosome 4 L000003761 4 83548 83618 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000031690 noncoding_exon tG(GCC)D1 4 83548 83618 W 2011-02-03 2000-05-19 +S000002369 ORF Verified YDL210W UGA4 chromosome 4 L000002424 4 84270 85985 W 2011-02-03 1996-07-31 GABA (gamma-aminobutyrate) permease; serves as a GABA transport protein involved in the utilization of GABA as a nitrogen source; catalyzes the transport of putrescine and delta-aminolevulinic acid (ALA); localized to the vacuolar membrane +S000036357 CDS YDL210W 4 84270 85985 W 2011-02-03 1996-07-31 +S000118428 ARS ARS405 ARSIV-86 chromosome 4 4 85945 86176 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178061 ARS_consensus_sequence ARS405 4 86125 86109 C 2014-11-18 2014-11-18 +S000002368 ORF Verified YDL209C CWC2 NTC40 chromosome 4 4 87226 86207 C 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); this complex contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; binds directly to U6 snRNA; similar to S. pombe Cwf2 +S000036574 CDS YDL209C 4 87226 86207 C 2011-02-03 1996-07-31 +S000002367 ORF Verified YDL208W NHP2 snoRNA-binding protein NHP2 chromosome 4 L000001243 4 87512 87982 W 2011-02-03 1996-07-31|2005-11-22 Protein related to mammalian high mobility group (HMG) proteins; nuclear protein; essential for function of H/ACA-type snoRNPs, which are involved in 18S rRNA processing +S000036516 CDS YDL208W 4 87512 87982 W 2011-02-03 1996-07-31|2005-11-22 +S000002366 ORF Verified YDL207W GLE1 nucleoporin GLE1|NLE2|BRR3|RSS1 chromosome 4 L000003399|L000001255|S000029324 4 88248 89864 W 2011-02-03 1996-07-31 Cytoplasmic nucleoporin required for polyadenylated mRNA export; contains a nuclear export signal; when bound to inositol hexakisphosphate (IP6), functions as an activator for the Dbp5p ATPase activity at the nuclear pore complex during mRNA export; mediates translation initiation; required for efficient translation termination +S000036457 CDS YDL207W 4 88248 89864 W 2011-02-03 1996-07-31 +S000002365 ORF Uncharacterized YDL206W chromosome 4 4 90176 92464 W 2011-02-03 1996-07-31 Putative protein of unknown function; YDL206W is not an essential protein +S000035556 CDS YDL206W 4 90176 92464 W 2011-02-03 1996-07-31 +S000002364 ORF Verified YDL205C HEM3 hydroxymethylbilane synthase|OLE2 chromosome 4 L000000762 4 93745 92762 C 2011-02-03 1996-07-31 Porphobilinogen deaminase; catalyzes the conversion of 4-porphobilinogen to hydroxymethylbilane, the third step in heme biosynthesis; localizes to the cytoplasm and nucleus; expression is regulated by Hap2p-Hap3p, but not by levels of heme; human homolog HMBS can complement yeast mutant and allow growth of haploid null after sporulation of a heterozygous diploid +S000035448 CDS YDL205C 4 93745 92762 C 2011-02-03 1996-07-31 +S000002363 ORF Verified YDL204W RTN2 chromosome 4 4 94605 95786 W 2011-02-03 1996-07-31 Reticulon protein; involved in nuclear pore assembly and maintenance of tubular ER morphology; promotes membrane curvature; regulates the ER asymmetry-induced inheritance block during ER stress; role in ER-derived peroxisomal biogenesis; interacts with Sec6p, Yip3p, and Sbh1p; less abundant than RTN1; member of RTNLA (reticulon-like A) subfamily; protein increases in abundance and relocalizes to plasma membrane upon DNA replication stress +S000035441 CDS YDL204W 4 94605 95786 W 2011-02-03 1996-07-31 +S000002362 ORF Verified YDL203C ACK1 chromosome 4 4 97953 96082 C 2011-02-03 1996-07-31 Protein that functions in the cell wall integrity pathway; functions upstream of Pkc1p; GFP-fusion protein expression is induced in response to the DNA-damaging agent MMS; non-tagged Ack1p is detected in purified mitochondria +S000035331 CDS YDL203C 4 97953 96082 C 2011-02-03 1996-07-31 +S000002361 ORF Verified YDL202W MRPL11 mitochondrial 54S ribosomal protein YmL11|YmL11 chromosome 4 L000002686 4 98475 99224 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; localizes to vacuole in response to H2O2 +S000035301 CDS YDL202W 4 98475 99224 W 2011-02-03 1996-07-31 +S000002360 ORF Verified YDL201W TRM8 tRNA (guanine46-N7)-methyltransferase chromosome 4 4 99561 100421 W 2011-02-03 1996-07-31 Noncatalytic subunit of a tRNA methyltransferase complex; Trm8p and Trm82p comprise an enzyme that catalyzes a methyl-transfer from S-adenosyl-l-methionine to the N(7) atom of guanine at position 46 in tRNA; Trm8 lacks catalytic activity if not bound to Trm82p +S000034332 CDS YDL201W 4 99561 100421 W 2011-02-03 1996-07-31 +S000002359 ORF Verified YDL200C MGT1 methylated-DNA--protein-cysteine methyltransferase|MGMT chromosome 4 L000001106 4 101067 100501 C 2011-02-03 1996-07-31|2006-04-13 DNA repair methyltransferase (6-O-methylguanine-DNA methylase); involved in protection against DNA alkylation damage +S000034219 CDS YDL200C 4 101067 100501 C 2011-02-03 1996-07-31|2006-04-13 +S000002358 ORF Uncharacterized YDL199C chromosome 4 4 103353 101290 C 2011-02-03 1996-07-31 Putative transporter; member of the sugar porter family +S000035760 CDS YDL199C 4 103353 101290 C 2011-02-03 1996-07-31 +S000002357 ORF Verified YDL198C GGC1 SHM1|YHM1 chromosome 4 L000001881 4 104551 103649 C 2011-02-03 1996-07-31 Mitochondrial GTP/GDP transporter; essential for mitochondrial genome maintenance; has a role in mitochondrial iron transport; member of the mitochondrial carrier family +S000035649 CDS YDL198C 4 104551 103649 C 2011-02-03 1996-07-31 +S000002356 ORF Verified YDL197C ASF2 chromosome 4 L000000127 4 106494 104917 C -109.03 2011-02-03 1996-07-31 Anti-silencing protein; causes derepression of silent loci when overexpressed +S000034644 CDS YDL197C 4 106494 104917 C 2011-02-03 1996-07-31 +S000002355 ORF Dubious YDL196W chromosome 4 4 106741 107070 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame is located in promoter region of essential gene SEC31 +S000034607 CDS YDL196W 4 106741 107070 W 2011-02-03 1996-07-31 +S000002354 ORF Verified YDL195W SEC31 WEB1 chromosome 4 L000002484 4 107208 111029 W 2011-02-03 1996-07-31|2011-02-03 Component of the Sec13p-Sec31p complex of the COPII vesicle coat; COPII coat is required for vesicle formation in ER to Golgi transport; mutant has increased aneuploidy tolerance +S000034506 CDS YDL195W 4 107208 111029 W 2011-02-03 1996-07-31|2011-02-03 +S000002353 ORF Verified YDL194W SNF3 glucose sensor chromosome 4 L000001946 4 111580 114234 W -104 2011-02-03 1996-07-31 Plasma membrane low glucose sensor, regulates glucose transport; high affinity sensor that contains 12 predicted transmembrane segments and a long C-terminal tail required for induction of hexose transporters; also senses fructose and mannose; SNF3 has a paralog, RGT2, that arose from the whole genome duplication +S000033579 CDS YDL194W 4 111580 114234 W 2011-02-03 1996-07-31 +S000002352 ORF Verified YDL193W NUS1 ditrans,polycis-polyprenyl diphosphate synthase chromosome 4 4 114672 115799 W 2011-02-03 1996-07-31 Forms dehydrodolichyl diphosphate syntase complex with RER2 or SRT1; tet-repressible mutant shows accumulation of hypoglycosylated forms of CPY, suggesting that Nus1p may be involved in protein trafficking; mutations in human homolog NUS1 have been implicated in congenital scoliosis, neurological impairment, refractory epilepsy, hearing deficit, and visual impairment; human cis-prenyltransferase complex complements yeast null mutant +S000033540 CDS YDL193W 4 114672 115799 W 2011-02-03 1996-07-31 +S000002351 ORF Verified YDL192W ARF1 Arf family GTPase ARF1 chromosome 4 L000000104 4 116321 116866 W -91 2011-02-03 1996-07-31 ADP-ribosylation factor; GTPase of the Ras superfamily involved in regulation of coated vesicle formation in intracellular trafficking within the Golgi; ARF1 has a paralog, ARF2, that arose from the whole genome duplication; arf1 arf2 double null mutation is complemented by human ARF1, ARF4, ARF5, or ARF6 +S000033475 CDS YDL192W 4 116321 116866 W 2011-02-03 1996-07-31 +S000002350 ORF Verified YDL191W RPL35A uL29|ribosomal 60S subunit protein L35A|L35A|L29|SOS1 chromosome 4 L000001985 4 117664 118517 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L35A; homologous to mammalian ribosomal protein L35 and bacterial L29; RPL35A has a paralog, RPL35B, that arose from the whole genome duplication +S000033395 CDS YDL191W 4 117664 117666 W 2011-02-03 1996-07-31 +S000033396 CDS YDL191W 4 118158 118517 W 2011-02-03 1996-07-31 +S000033397 intron YDL191W 4 117667 118157 W 2011-02-03 1996-07-31 +S000002349 ORF Verified YDL190C UFD2 ubiquitin-ubiquitin ligase UFD2 chromosome 4 L000002788 4 121592 118707 C 2011-02-03 1996-07-31|2011-02-03 Ubiquitin chain assembly factor (E4); cooperates with a ubiquitin-activating enzyme (E1), a ubiquitin-conjugating enzyme (E2), and a ubiquitin protein ligase (E3) to conjugate ubiquitin to substrates; also functions as an E3 +S000032665 CDS YDL190C 4 121592 118707 C 2011-02-03 1996-07-31|2011-02-03 +S000002348 ORF Verified YDL189W RBS1 chromosome 4 4 122216 123589 W 2011-02-03 2000-07-22|1996-07-31 Protein involved in assembly of the RNA polymerase III (Pol III) complex; high copy suppressor of Pol III assembly mutation and psk1 psk2 mutations that confer temperature-sensitivity for galactose utilization; physically interacts with Pol III; proposed to bind single-stranded nucleic acids via its R3H domain +S000033663 CDS YDL189W 4 122216 123589 W 2011-02-03 2000-07-22|1996-07-31 +S000122396 five_prime_UTR_intron YDL189W 4 122078 122176 W 2011-02-03 2007-04-27 +S000118429 ARS ARS406 ARSIV-124 chromosome 4 4 123617 123901 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178062 ARS_consensus_sequence ARS406 4 123795 123779 C 2014-11-18 2014-11-18 +S000002347 ORF Verified YDL188C PPH22 phosphoprotein phosphatase 2A catalytic subunit PPH22|PPH2 chromosome 4 L000001473 4 124998 123865 C -102 2011-02-03 1996-07-31 Catalytic subunit of protein phosphatase 2A (PP2A); functionally redundant with Pph21p; methylated at C terminus; forms alternate complexes with several regulatory subunits; involved in signal transduction and regulation of mitosis; protein abundance increases in response to DNA replication stress; dephosphorylates Tel1p/Mec1p-phosphorylated Cdc13p to promote telomerase release from telomeres at G2/M; PPH22 has a paralog, PPH21, that arose from the whole genome duplication +S000030301 CDS YDL188C 4 124998 123865 C 2011-02-03 1996-07-31 +S000002345 ORF Uncharacterized YDL186W chromosome 4 4 125616 126449 W 2011-02-03 1996-07-31 Putative protein of unknown function; YDL186W is not an essential gene +S000030062 CDS YDL186W 4 125616 126449 W 2011-02-03 1996-07-31 +S000002346 ORF Dubious YDL187C chromosome 4 4 125838 125509 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030099 CDS YDL187C 4 125838 125509 C 2011-02-03 1996-07-31 +S000002344 ORF Verified YDL185W VMA1 H(+)-transporting V1 sector ATPase subunit A|TFP1|CLS8 chromosome 4 L000002289 4 126787 130002 W -101.43 2011-02-03 1996-07-31 Subunit A of the V1 peripheral membrane domain of V-ATPase; protein precursor undergoes self-catalyzed splicing to yield the extein Tfp1p and the intein Vde (PI-SceI), which is a site-specific endonuclease; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits; involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner +S000029978 CDS YDL185W 4 126787 130002 W 2011-02-03 1996-07-31 +S000029636 intein_encoding_region YDL185W S000007537 4 127636 129000 W 2014-11-18 2014-11-18 Vma1p derived endonuclease; a 50 kDa intein derived from the self-splicing of amino acid residues 284-738 of the VMA1 primary translation product; has endonuclease activity and cleaves at the VMA1 gene to stimulate gene conversion during meiosis +S000007600 ORF Dubious YDL185C-A chromosome 4 4 126835 126608 C 2011-02-03 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YDL185W; identified by homology with hemiascomycetous yeast species +S000037146 CDS YDL185C-A 4 126835 126608 C 2011-02-03 2001-02-26 +S000002343 ORF Verified YDL184C RPL41A eL41|ribosomal 60S subunit protein L41A|L41e|YL41|L47A|L41A|RPL47A chromosome 4 L000001738 4 130484 130407 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L41A; comprises only 25 amino acids; rpl41a rpl41b double null mutant is viable; homologous to mammalian ribosomal protein L41, no bacterial homolog; RPL41A has a paralog, RPL41B, that arose from the whole genome duplication +S000037317 CDS YDL184C 4 130484 130407 C 2011-02-03 1996-07-31 +S000002342 ORF Verified YDL183C MKR1 chromosome 4 4 131833 130871 C 2011-02-03 1996-07-31 Protein that may form an active mitochondrial KHE system; mitochondrial inner-membrane protein; non-essential gene; KHE system stands for K+/H+ exchanger system +S000037236 CDS YDL183C 4 131833 130871 C 2011-02-03 1996-07-31 +S000002341 ORF Verified YDL182W LYS20 homocitrate synthase LYS20 chromosome 4 L000004103 4 133437 134723 W 2011-02-03 1996-07-31 Homocitrate synthase isozyme and functions in DNA repair; catalyzes the condensation of acetyl-CoA and alpha-ketoglutarate to form homocitrate, which is the first step in the lysine biosynthesis pathway; LYS20 has a paralog, LYS21, that arose from the whole genome duplication +S000037198 CDS YDL182W 4 133437 134723 W 2011-02-03 1996-07-31 +S000002340 ORF Verified YDL181W INH1 ATPase inhibitor chromosome 4 L000000866 4 135179 135436 W 2011-02-03 1996-07-31 Protein that inhibits ATP hydrolysis by the F1F0-ATP synthase; inhibitory function is enhanced by stabilizing proteins Stf1p and Stf2p; has a calmodulin-binding motif and binds calmodulin in vitro; INH1 has a paralog, STF1, that arose from the whole genome duplication +S000037121 CDS YDL181W 4 135179 135436 W 2011-02-03 1996-07-31 +S000002339 ORF Uncharacterized YDL180W chromosome 4 4 135896 137539 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole +S000036445 CDS YDL180W 4 135896 137539 W 2011-02-03 1996-07-31 +S000002338 ORF Verified YDL179W PCL9 chromosome 4 L000004041 4 138291 139205 W 2011-02-03 1996-07-31 Cyclin; forms a functional kinase complex with Pho85p cyclin-dependent kinase (Cdk), expressed in late M/early G1 phase, activated by Swi5p; PCL9 has a paralog, PCL2, that arose from the whole genome duplication +S000032032 CDS YDL179W 4 138291 139205 W 2011-02-03 1996-07-31 +S000002337 ORF Verified YDL178W DLD2 D-lactate dehydrogenase|AIP2 chromosome 4 L000000070 4 139522 141114 W 2011-02-03 1996-07-31 D-2-hydroxyglutarate dehydrogenase, and minor D-lactate dehydrogenase; mitochondrial matrix protein that oxidizes D-2-hydroxyglutarate (D-2HG), an oncometabolite, to alpha-ketoglutarate with a minor role in lactate catabolism; located in the mitochondrial matrix +S000031886 CDS YDL178W 4 139522 141114 W 2011-02-03 1996-07-31 +S000002336 ORF Uncharacterized YDL177C chromosome 4 4 141721 141209 C 2011-02-03 1996-07-31 Putative protein of unknown function; similar to the mouse IMPACT gene; YDL177C is not an essential gene +S000031688 CDS YDL177C 4 141721 141209 C 2011-02-03 1996-07-31 +S000002335 ORF Verified YDL176W chromosome 4 4 142097 144223 W 2011-02-03 1996-07-31 Protein of unknown function; predicted by computational methods to be involved in fructose-1,6-bisphosphatase (Fbp1p) degradation; interacts with components of the GID complex; YDL176W is not an essential gene +S000036245 CDS YDL176W 4 142097 144223 W 2011-02-03 1996-07-31 +S000002334 ORF Verified YDL175C AIR2 TRAMP complex RNA-binding subunit chromosome 4 4 145518 144484 C 2011-02-03 1996-07-31 RNA-binding subunit of the TRAMP nuclear RNA surveillance complex; involved in nuclear RNA processing and degradation; involved in TRAMP complex assembly as a bridge between Mtr4p and Trf4p; stimulates the poly(A) polymerase activity of Pap2p in vitro; has 5 zinc knuckle motifs; AIR2 has a paralog, AIR1, that arose from the whole genome duplication; Air2p and Air1p have nonredundant roles in regulation of substrate specificity of the exosome +S000036095 CDS YDL175C 4 145518 144484 C 2011-02-03 1996-07-31 +S000002333 ORF Verified YDL174C DLD1 D-lactate dehydrogenase chromosome 4 L000000508 4 147589 145826 C 2011-02-03 1996-07-31 Major mitochondrial D-lactate dehydrogenase; oxidizes D-lactate to pyruvate, transcription is heme-dependent, repressed by glucose, and derepressed in ethanol or lactate; located in the mitochondrial inner membrane +S000035215 CDS YDL174C 4 147589 145826 C 2011-02-03 1996-07-31 +S000002332 ORF Verified YDL173W PAR32 chromosome 4 4 148191 149078 W 2011-02-03 1996-07-31 Protein of unknown function; hyperphosphorylated upon rapamycin treatment in a Tap42p-dependent manner; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; PAR32 is not an essential gene +S000035172 CDS YDL173W 4 148191 149078 W 2011-02-03 1996-07-31 +S000002331 ORF Dubious YDL172C chromosome 4 4 149086 148607 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035016 CDS YDL172C 4 149086 148607 C 2011-02-03 1996-07-31 +S000002330 ORF Verified YDL171C GLT1 glutamate synthase (NADH) chromosome 4 L000003333 4 155640 149203 C 2011-02-03 1996-07-31 NAD(+)-dependent glutamate synthase (GOGAT); synthesizes glutamate from glutamine and alpha-ketoglutarate; with Gln1p, forms the secondary pathway for glutamate biosynthesis from ammonia; expression regulated by nitrogen source; assembles into filaments as cells approach stationary phase and under cytosolic acidification and starvation conditions +S000034863 CDS YDL171C 4 155640 149203 C 2011-02-03 1996-07-31 +S000002329 ORF Verified YDL170W UGA3 chromosome 4 L000002423 4 156318 157904 W 2011-02-03 1996-07-31 Transcriptional activator for GABA-dependent induction of GABA genes; binds to DNA elements found in the promoters of target genes and increases their expression in the presence of GABA (gamma-aminobutyrate); zinc finger transcription factor of the Zn(2)-Cys(6) binuclear cluster domain type; localized to the nucleus; examples of GABA genes include UGA1, UGA2, and UGA4 +S000034829 CDS YDL170W 4 156318 157904 W 2011-02-03 1996-07-31 +S000002328 ORF Verified YDL169C UGX2 chromosome 4 L000002851 4 158735 158064 C 2011-02-03 1996-07-31 Protein of unknown function; transcript accumulates in response to any combination of stress conditions +S000033142 CDS YDL169C 4 158735 158064 C 2011-02-03 1996-07-31 +S000002327 ORF Verified YDL168W SFA1 bifunctional alcohol dehydrogenase/S-(hydroxymethyl)glutathione dehydrogenase|ADH5 chromosome 4 L000001868 4 159604 160764 W 2011-02-03 1996-07-31 Bifunctional alcohol dehydrogenase and formaldehyde dehydrogenase; formaldehyde dehydrogenase activity is glutathione-dependent; functions in formaldehyde detoxification and formation of long chain and complex alcohols, regulated by Hog1p-Sko1p; protein abundance increases in response to DNA replication stress +S000033096 CDS YDL168W 4 159604 160764 W 2011-02-03 1996-07-31 +S000002326 ORF Verified YDL167C NRP1 chromosome 4 L000000121 4 163154 160995 C 2011-02-03 1996-07-31 Putative RNA binding protein of unknown function; localizes to stress granules induced by glucose deprivation; predicted to be involved in ribosome biogenesis +S000032963 CDS YDL167C 4 163154 160995 C 2011-02-03 1996-07-31 +S000002325 ORF Verified YDL166C FAP7 nucleoside-triphosphatase chromosome 4 4 164042 163449 C 2011-02-03 1996-07-31 Essential NTPase required for small ribosome subunit synthesis; mediates processing of the 20S pre-rRNA at site D in the cytoplasm but associates only transiently with 43S preribosomes via Rps14p; complex with Rps14 is conserved between humans, yeast, and arches; may be the endonuclease for site D; depletion leads to accumulation of pre-40S ribosomes in 80S-like ribosomes; human TAF9 functionally complements the lethality of the null mutation +S000032043 CDS YDL166C 4 164042 163449 C 2011-02-03 1996-07-31 +S000002324 ORF Verified YDL165W CDC36 CCR4-NOT core subunit CDC36|NOT2|DNA19 chromosome 4 L000000272 4 164290 164865 W -80 2011-02-03 1996-07-31 Component of the CCR4-NOT core complex, involved in mRNA decapping; this complex has multiple roles in regulating mRNA levels including regulation of transcription and destabilizing mRNAs through deadenylation; basal transcription factor +S000031977 CDS YDL165W 4 164290 164865 W 2011-02-03 1996-07-31 +S000002322 ORF Dubious YDL163W chromosome 4 4 166956 167258 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene CDC9/YDL164C encoding DNA ligase +S000030824 CDS YDL163W 4 166956 167258 W 2011-02-03 1996-07-31 +S000002323 ORF Verified YDL164C CDC9 DNA ligase (ATP) CDC9|MMS8 chromosome 4 L000000249 4 167254 164987 C -78 2011-02-03 1996-07-31 DNA ligase I found in nucleus and mitochondria; essential enzyme that joins Okazaki fragments during DNA replication; also acts in ribonucleotide excision repair, base excision repair, and recombination; DNA ligase I mutants trigger ubiquitination of PCNA at K107, facilitating Rad59p-mediated bypass of unligated Okazaki fragments; human homolog LIG1 can complement yeast cdc9 temperature-sensitive mutant at restrictive temperature +S000030891 CDS YDL164C 4 167254 164987 C 2011-02-03 1996-07-31 +S000002320 ORF Verified YDL161W ENT1 epsin chromosome 4 4 167714 169078 W 2011-02-03 1996-07-31 Epsin-like protein involved in endocytosis and actin patch assembly; functionally redundant with Ent2p; binds clathrin via a clathrin-binding domain motif at C-terminus; relocalizes from bud neck to cytoplasm upon DNA replication stress; ENT1 has a paralog, ENT2, that arose from the whole genome duplication +S000030611 CDS YDL161W 4 167714 169078 W 2011-02-03 1996-07-31 +S000002321 ORF Dubious YDL162C chromosome 4 4 167715 167359 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ENT1/YDL161W, a verified gene involved in endocytosis and actin cortical patch assembly +S000030690 CDS YDL162C 4 167715 167359 C 2011-02-03 1996-07-31 +S000028520 ORF Verified YDL160C-A MHF2 chromosome 4 4 169608 169366 C 2011-02-03 2003-07-29 Component of the heterotetrameric MHF histone-fold complex; in humans the MHF complex interacts with both DNA and Mph1p ortholog FANCM to stabilize and remodel blocked replication forks and repair damaged DNA; mhf2 srs2 double mutants are MMS hypersensitive; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-X, also known as MHF2 +S000030315 CDS YDL160C-A 4 169608 169366 C 2011-02-03 2003-07-29 +S000002319 ORF Verified YDL160C DHH1 DExD/H-box ATP-dependent RNA helicase DHH1 chromosome 4 L000000504 4 171930 170410 C 2011-02-03 1996-07-31 Cytoplasmic DEAD-box helicase, stimulates mRNA decapping; coordinates distinct steps in mRNA function and decay, interacting with both decapping and deadenylase complexes; role in translational repression, mRNA decay, and possibly mRNA export; interacts and cooperates with Ngr1p to promote specific mRNA decay; ATP- and RNA-bound form promotes processing body (PB) assembly, while ATPase stimulation by Not1p promotes PB disassembly; forms cytoplasmic foci on replication stress +S000036698 CDS YDL160C 4 171930 170410 C 2011-02-03 1996-07-31 +S000007599 ORF Uncharacterized YDL159W-A YDL159W-B chromosome 4 4 172182 172313 W 2011-02-03 2001-02-26 Putative protein of unknown function; identified by sequence comparison with hemiascomycetous yeast species +S000037145 CDS YDL159W-A 4 172182 172313 W 2011-02-03 2001-02-26 +S000002318 ORF Verified YDL159W STE7 mitogen-activated protein kinase kinase STE7 chromosome 4 L000002117 4 172481 174028 W -76 2011-02-03 1996-07-31 Signal transducing MAP kinase kinase; involved in pheromone response where it phosphorylates Fus3p; involved in the pseudohyphal/invasive growth pathway where it phosphorylates of Kss1p; phosphorylated by Ste11p; degraded by ubiquitin pathway +S000036970 CDS YDL159W 4 172481 174028 W 2011-02-03 1996-07-31 +S000028612 ORF Dubious YDL159C-B YDL159C-A chromosome 4 4 173232 173056 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031444 CDS YDL159C-B 4 173232 173056 C 2011-02-03 2003-07-29 +S000002317 ORF Dubious YDL158C chromosome 4 4 174174 173866 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036885 CDS YDL158C 4 174174 173866 C 2011-02-03 1996-07-31 +S000002316 ORF Uncharacterized YDL157C chromosome 4 4 174588 174232 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000036806 CDS YDL157C 4 174588 174232 C 2011-02-03 1996-07-31 +S000002315 ORF Verified YDL156W CMR1 chromosome 4 4 174918 176486 W 2011-02-03 1996-07-31 Nuclear protein with a role in protein quality control; localizes to the intranuclear quality control compartment (INQ) in response to proteasome inhibition or DNA replication stress; INQ likely sequesters proteins involved in DNA metabolism for degradation or re-folding; DNA-binding protein with preference for UV-damaged DNA; contains three WD domains (WD-40 repeat); human ortholog WDR76 also exhibits perinuclear localization under similar stress conditions +S000035992 CDS YDL156W 4 174918 176486 W 2011-02-03 1996-07-31 +S000002314 ORF Verified YDL155W CLB3 B-type cyclin CLB3 chromosome 4 L000000351 4 176773 178056 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the G2/M transition; may be involved in DNA replication and spindle assembly; accumulates during S phase and G2, then targeted for ubiquitin-mediated degradation; relative distribution to the nucleus increases upon DNA replication stress; CLB3 has a paralog, CLB4, that arose from the whole genome duplication +S000035864 CDS YDL155W 4 176773 178056 W 2011-02-03 1996-07-31 +S000002313 ORF Verified YDL154W MSH5 MutS family protein MSH5 chromosome 4 L000002573 4 178334 181039 W 2011-02-03 1996-07-31 Protein of the MutS family; forms a dimer with Msh4p that facilitates crossovers between homologs during meiosis; msh5-Y823H mutation confers tolerance to DNA alkylating agents; homologs present in C. elegans and humans +S000035754 CDS YDL154W 4 178334 181039 W 2011-02-03 1996-07-31 +S000002311 ORF Dubious YDL152W chromosome 4 4 182822 183187 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SAS10/YDL153C, a component of the small ribosomal subunit processosome +S000034761 CDS YDL152W 4 182822 183187 W 2011-02-03 1996-07-31 +S000002312 ORF Verified YDL153C SAS10 rRNA-processing protein SAS10|UTP3 chromosome 4 L000003317 4 183018 181186 C 2011-02-03 1996-07-31 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit; disrupts silencing when overproduced; mutant has increased aneuploidy tolerance; essential gene +S000035646 CDS YDL153C 4 183018 181186 C 2011-02-03 1996-07-31 +S000002309 ORF Verified YDL150W RPC53 DNA-directed RNA polymerase III subunit C53|C53|RPC4 chromosome 4 L000001691 4 183343 184611 W -70 2011-02-03 1996-07-31 RNA polymerase III subunit C53 +S000034634 CDS YDL150W 4 183343 184611 W 2011-02-03 1996-07-31 +S000002310 ORF Dubious YDL151C BUD30 chromosome 4 S000007648 4 183899 183318 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 96% of ORF overlaps the verified gene RPC53; diploid mutant displays a weak budding pattern phenotype in a systematic assay +S000034639 CDS YDL151C 4 183899 183318 C 2011-02-03 1996-07-31 +S000002308 ORF Verified YDL149W ATG9 autophagy protein ATG9|CVT6|APG9|CVT7|AUT9 chromosome 4 L000004759|L000004753|L000004758|S000029131 4 184925 187918 W 2011-02-03 1996-07-31 Transmembrane protein involved in forming Cvt and autophagic vesicles; cycles between the phagophore assembly site (PAS) and other cytosolic punctate structures, not found in autophagosomes; may be involved in membrane delivery to the PAS +S000032870 CDS YDL149W 4 184925 187918 W 2011-02-03 1996-07-31 +S000002307 ORF Verified YDL148C NOP14 snoRNA-binding rRNA-processing protein NOP14|UTP2 chromosome 4 4 190586 188154 C 2011-02-03 1996-07-31 Nucleolar protein; forms a complex with Noc4p that mediates maturation and nuclear export of 40S ribosomal subunits; also present in the small subunit processome complex, which is required for processing of pre-18S rRNA +S000032714 CDS YDL148C 4 190586 188154 C 2011-02-03 1996-07-31 +S000002306 ORF Verified YDL147W RPN5 proteasome regulatory particle lid subunit RPN5|NAS5 chromosome 4 L000004451|L000004305 4 190924 192261 W 2011-02-03 1996-07-31 Subunit of the CSN and 26S proteasome lid complexes; similar to mammalian p55 subunit and to another S. cerevisiae regulatory subunit, Rpn7p; Rpn5p is an essential protein; the COP9 signalosome is also known as the CSN +S000032657 CDS YDL147W 4 190924 192261 W 2011-02-03 1996-07-31 +S000002305 ORF Verified YDL146W LDB17 chromosome 4 4 192750 194225 W 2011-02-03 1996-07-31 Protein involved in the regulation of endocytosis; transiently recruited to actin cortical patches in a SLA1-dependent manner after late coat component assembly; GFP-fusion protein localizes to the periphery, cytoplasm, bud, and bud neck +S000032526 CDS YDL146W 4 192750 194225 W 2011-02-03 1996-07-31 +S000002304 ORF Verified YDL145C COP1 coatomer subunit alpha|SOO1|RET1|SEC33 chromosome 4 L000002603 4 198176 194571 C 2011-02-03 1996-07-31 Alpha subunit of COPI vesicle coatomer complex; complex surrounds transport vesicles in the early secretory pathway +S000031516 CDS YDL145C 4 198176 194571 C 2011-02-03 1996-07-31 +S000002303 ORF Verified YDL144C chromosome 4 4 199732 198662 C 2011-02-03 2003-09-22|1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; YDL144C is not an essential gene; protein abundance increases in response to DNA replication stress +S000031463 CDS YDL144C 4 199732 198662 C 2011-02-03 2003-09-22|1996-07-31 +S000002302 ORF Verified YDL143W CCT4 chaperonin-containing T-complex subunit CCT4|ANC2|TCP4 chromosome 4 L000000087 4 199996 201582 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo +S000031415 CDS YDL143W 4 199996 201582 W 2011-02-03 1996-07-31 +S000002301 ORF Verified YDL142C CRD1 cardiolipin synthase|CLS1 chromosome 4 L000003358 4 202570 201719 C 2011-02-03 1996-07-31 Cardiolipin synthase; produces cardiolipin, which is a phospholipid of the mitochondrial inner membrane that is required for normal mitochondrial membrane potential and function and for correct integration of membrane-multispanning proteins into the mitochondrial outer membrane; required to maintain tubular mitochondrial morphology and functions in mitochondrial fusion; also required for normal vacuolar ion homeostasis +S000030494 CDS YDL142C 4 202570 201719 C 2011-02-03 1996-07-31 +S000002300 ORF Verified YDL141W BPL1 biotin--[acetyl-CoA-carboxylase] ligase BPL1|ACC2 chromosome 4 L000002771 4 203039 205111 W 2011-02-03 1996-07-31 Biotin:apoprotein ligase; covalently modifies proteins with the addition of biotin, required for acetyl-CoA carboxylase (Acc1p) holoenzyme formation; comparative analysis suggests that a mitochondrially targeted form may result from translation starting at a non-canonical codon upstream of the annotated start codon; human homolog HLCS can complement yeast BPL1 mutant +S000030458 CDS YDL141W 4 203039 205111 W 2011-02-03 1996-07-31 +S000002299 ORF Verified YDL140C RPO21 DNA-directed RNA polymerase II core subunit RPO21|B220|SUA8|RPB220|RPB1 chromosome 4 L000001744 4 210561 205360 C -68 2011-02-03 1996-07-31 RNA polymerase II largest subunit B220; part of central core; phosphorylation of C-terminal heptapeptide repeat domain regulates association with transcription and splicing factors; similar to bacterial beta-prime +S000030216 CDS YDL140C 4 210561 205360 C 2011-02-03 1996-07-31 +S000002298 ORF Verified YDL139C SCM3 chromosome 4 L000003281 4 212046 211375 C 2011-02-03 2003-09-22|1996-07-31 Nonhistone component of centromeric chromatin; binds to histone H3 variant, Cse4p, and recruits it to centromeres; involved in the assembly and maintenance of Cse4-H4 at centromeres; required for kinetochore assembly and G2/M progression; may protect Cse4p from ubiquitination; homolog of mammalian HJURP +S000037514 CDS YDL139C 4 212046 211375 C 2011-02-03 2003-09-22|1996-07-31 +S000118430 ARS ARS409 ARSIV-213 chromosome 4 4 212519 212618 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178063 ARS_consensus_sequence ARS409 4 212594 212578 C 2014-11-18 2014-11-18 +S000002297 ORF Verified YDL138W RGT2 glucose sensor chromosome 4 L000003268 4 213351 215642 W 2011-02-03 1996-07-31 Plasma membrane high glucose sensor that regulates glucose transport; low affinity sesnor that contains 12 predicted transmembrane segments and a long C-terminal tail required for hexose transporter induction; phosphorylation of the tail by Yck1p/Yck2p facilitates binding to the HXT co-repressors, Mth1p and Std1p; RGT2 has a paralog, SNF3, that arose from the whole genome duplication +S000037451 CDS YDL138W 4 213351 215642 W 2011-02-03 1996-07-31 +S000002296 ORF Verified YDL137W ARF2 Arf family GTPase ARF2 chromosome 4 L000000105|L000000060 4 216529 217074 W -64 1996-07-31 1996-07-31 ADP-ribosylation factor; GTPase of the Ras superfamily involved in regulation of coated formation vesicles in intracellular trafficking within the Golgi; ARF2 has a paralog, ARF1, that arose from the whole genome duplication; arf1 arf2 double null mutation is complemented by human ARF1, ARF4, ARF5, or ARF6 +S000036736 CDS YDL137W 4 216529 217074 W 1996-07-31 1996-07-31 +S000122094 five_prime_UTR_intron YDL137W 4 216158 216489 W 2007-04-04 2007-04-04 +S000002295 ORF Verified YDL136W RPL35B uL29|ribosomal 60S subunit protein L35B|L35B|L29|SOS2 chromosome 4 L000001986 4 217600 218367 W 1996-07-31 1996-07-31 Ribosomal 60S subunit protein L35B; homologous to mammalian ribosomal protein L35 and bacterial L29; RPL35B has a paralog, RPL35A, that arose from the whole genome duplication +S000036637 CDS YDL136W 4 217600 217602 W 1996-07-31 1996-07-31 +S000036638 CDS YDL136W 4 218008 218367 W 1996-07-31 1996-07-31 +S000036639 intron YDL136W 4 217603 218007 W 1996-07-31 1996-07-31 +S000002294 ORF Verified YDL135C RDI1 chromosome 4 L000002743 4 219288 218680 C 1996-07-31 1996-07-31 Rho GDP dissociation inhibitor; involved in the localization and regulation of Cdc42p and Rho1p; protein abundance increases in response to DNA replication stress +S000036486 CDS YDL135C 4 219288 218680 C 1996-07-31 1996-07-31 +S000002292 ORF Verified YDL134C PPH21 phosphoprotein phosphatase 2A catalytic subunit PPH21 chromosome 4 L000001472 4 220771 219662 C -66 1996-07-31 1996-07-31 Catalytic subunit of protein phosphatase 2A (PP2A); functionally redundant with Pph22p; methylated at C terminus; forms alternate complexes with several regulatory subunits; involved in signal transduction and regulation of mitosis; forms nuclear foci upon DNA replication stress; PPH21 has a paralog, PPH22, that arose from the whole genome duplication +S000035565 CDS YDL134C 4 220771 219662 C 1996-07-31 1996-07-31 +S000002293 ORF Verified YDL133C-A RPL41B eL41|ribosomal 60S subunit protein L41B|L41e|YL41|L47B|L41B|YDL134C-A|RPL47B chromosome 4 L000001739 4 221801 221724 C 1999-07-17 1999-07-17 Ribosomal 60S subunit protein L41B; comprises only 25 amino acids; rpl41a rpl41b double null mutant is viable; homologous to mammalian ribosomal protein L41, no bacterial homolog; RPL41B has a paralog, RPL41A, that arose from the whole genome duplication +S000030753 CDS YDL133C-A 4 221801 221724 C 1999-07-17 1999-07-17 +S000002291 ORF Verified YDL133W SRF1 chromosome 4 4 222427 223740 W 1996-07-31 1996-07-31 Regulator of phospholipase D (Spo14p); interacts with Spo14p and regulates its catalytic activity; capable of buffering the toxicity of C16:0 platelet activating factor, a lipid that accumulates intraneuronally in Alzheimer's patients +S000035552 CDS YDL133W 4 222427 223740 W 1996-07-31 1996-07-31 +S000002290 ORF Verified YDL132W CDC53 cullin CDC53 chromosome 4 L000000281 4 224304 226751 W -81 1996-07-31 1996-07-31 Cullin; structural protein of SCF complexes (which also contain Skp1p, Cdc34p, Hrt1p and an F-box protein) involved in ubiquitination; SCF promotes the G1-S transition by targeting G1 cyclins and the Cln-CDK inhibitor Sic1p for degradation; human homolog CUL1 can complement yeast cdc53 null mutant +S000035487 CDS YDL132W 4 224304 226751 W 1996-07-31 1996-07-31 +S000002289 ORF Verified YDL131W LYS21 homocitrate synthase LYS21 chromosome 4 L000004259 4 227393 228715 W 1996-07-31 1996-07-31 Homocitrate synthase isozyme; catalyzes the condensation of acetyl-CoA and alpha-ketoglutarate to form homocitrate, which is the first step in the lysine biosynthesis pathway; LYS21 has a paralog, LYS20, that arose from the whole genome duplication +S000035437 CDS YDL131W 4 227393 228715 W 1996-07-31 1996-07-31 +S000007232 ORF Verified YDL130W-A STF1 ATPase-binding protein|AIS2 chromosome 4 L000002126 4 229171 229431 W 1999-07-17 1999-07-17 Protein involved in regulation of the mitochondrial F1F0-ATP synthase; Stf1p and Stf2p act as stabilizing factors that enhance inhibitory action of the Inh1p protein; protein abundance increases in response to DNA replication stress; STF1 has a paralog, INH1, that arose from the whole genome duplication +S000033965 CDS YDL130W-A 4 229171 229431 W 1999-07-17 1999-07-17 +S000002288 ORF Verified YDL130W RPP1B ribosomal protein P1B|YP1beta|P1B|L44'|Ax|RPLA3|RPL44' chromosome 4 L000003298|L000001734 4 229906 230527 W 1996-07-31 1996-07-31 Ribosomal protein P1 beta; component of the ribosomal stalk, which is involved in interaction of translational elongation factors with ribosome; free (non-ribosomal) P1 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; accumulation is regulated by phosphorylation and interaction with the P2 stalk component +S000035361 CDS YDL130W 4 229906 230019 W 1996-07-31 1996-07-31 +S000035362 CDS YDL130W 4 230321 230527 W 1996-07-31 1996-07-31 +S000035363 intron YDL130W 4 230020 230320 W 1996-07-31 1996-07-31 +S000002287 ORF Verified YDL129W chromosome 4 4 231024 231899 W 1996-07-31 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; YDL129W is not an essential gene; relative distribution to the nucleus increases upon DNA replication stress +S000034421 CDS YDL129W 4 231024 231899 W 1996-07-31 1996-07-31 +S000002286 ORF Verified YDL128W VCX1 MNR1|HUM1 chromosome 4 L000002990 4 232652 233887 W 1996-07-31 1996-07-31 Vacuolar membrane antiporter with Ca2+/H+ and K+/H+ exchange activity; involved in control of cytosolic Ca2+ and K+ concentrations; has similarity to sodium/calcium exchangers, including the bovine Na+/Ca2+,K+ antiporter +S000034358 CDS YDL128W 4 232652 233887 W 1996-07-31 1996-07-31 +S000002285 ORF Verified YDL127W PCL2 cyclin PCL2|CLN4 chromosome 4 L000002784 4 234927 235853 W 2004-02-11 2004-02-11|1996-07-31 Cyclin, interacts with cyclin-dependent kinase Pho85p; member of the Pcl1,2-like subfamily, involved in the regulation of polarized growth and morphogenesis and progression through the cell cycle; localizes to sites of polarized cell growth; PCL2 has a paralog, PCL9, that arose from the whole genome duplication +S000033442 CDS YDL127W 4 234927 235853 W 2004-02-11 2004-02-11|1996-07-31 +S000178064 ARS ARS409.5 chromosome 4 4 235937 236185 2014-11-18 2014-11-18 Strong autonomously replicating sequence +S000002284 ORF Verified YDL126C CDC48 AAA family ATPase CDC48 chromosome 4 L000000280 4 238664 236157 C 2004-02-11 1996-07-31 AAA ATPase; subunit of polyUb-selective segregase complex involved in ERAD, INM-associated degradation (INMAD), mitotic spindle disassembly, macroautophagy, PMN, ribosome-associated degradation, ribophagy, homotypic ER membrane fusion, SCF complex disassembly, cell wall integrity during heat stress, and telomerase regulation; mobilizes membrane-anchored transcription factors by regulated Ub/proteasome-dependent processing (RUP); human ortholog VCP complements a cdc48 mutant +S000033307 CDS YDL126C 4 238664 236157 C 2004-02-11 1996-07-31 +S000002283 ORF Verified YDL125C HNT1 adenosine 5'-monophosphoramidase chromosome 4 L000003334 4 239606 239019 C 2004-02-11 1996-07-31 Adenosine 5'-monophosphoramidase; interacts physically and genetically with Kin28p, a CDK and TFIIK subunit, and genetically with CAK1; member of histidine triad (HIT) superfamily of nucleotide-binding proteins; protein abundance increases in response to DNA replication stress; human homolog HINT1 can complement yeast hnt1 mutant +S000033248 CDS YDL125C 4 239398 239019 C 2004-02-11 1996-07-31 +S000033247 CDS YDL125C 4 239606 239510 C 2004-02-11 1996-07-31 +S000033249 intron YDL125C 4 239509 239399 C 2004-02-11 1996-07-31 +S000002282 ORF Verified YDL124W aldo-keto reductase superfamily protein chromosome 4 4 240259 241197 W 2004-02-11 1996-07-31 NADPH-dependent alpha-keto amide reductase; reduces aromatic alpha-keto amides, aliphatic alpha-keto esters, and aromatic alpha-keto esters; member of the aldo-keto reductase (AKR) family; protein abundance increases in response to DNA replication stress +S000033228 CDS YDL124W 4 240259 241197 W 2004-02-11 1996-07-31 +S000002281 ORF Verified YDL123W SNA4 chromosome 4 4 241418 241840 W 2004-02-11 1996-07-31 Protein of unknown function; localized to the vacuolar outer membrane; predicted to be palmitoylated +S000032369 CDS YDL123W 4 241418 241840 W 2004-02-11 1996-07-31 +S000002280 ORF Verified YDL122W UBP1 ubiquitin-specific protease UBP1 chromosome 4 L000002415 4 242552 244981 W 2004-02-11 1996-07-31 Ubiquitin-specific protease; removes ubiquitin from ubiquitinated proteins; cleaves at the C terminus of ubiquitin fusions irrespective of their size; capable of cleaving polyubiquitin chains +S000032268 CDS YDL122W 4 242552 244981 W 2004-02-11 1996-07-31 +S000002279 ORF Uncharacterized YDL121C chromosome 4 4 245582 245133 C 2004-02-11 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YDL121C is not an essential protein +S000031235 CDS YDL121C 4 245582 245133 C 2004-02-11 1996-07-31 +S000002278 ORF Verified YDL120W YFH1 ferroxidase chromosome 4 L000003525 4 245923 246447 W 2004-02-11 1996-07-31 Mitochondrial matrix iron chaperone; oxidizes and stores iron; interacts with Isu1p to promote Fe-S cluster assembly; mutation results in multiple Fe/S-dependent enzyme deficiencies; human frataxin homolog FXN is mutated in Friedrich's ataxia; human FTL gene can complement yeast yfh1 null mutant +S000031221 CDS YDL120W 4 245923 246447 W 2004-02-11 1996-07-31 +S000002276 ORF Dubious YDL118W chromosome 4 4 247302 247682 W 2004-02-11 1996-07-31 Dubious open reading frame, unlikely to encode a protein; overlaps almost completely with YDL119C; mutations that would affect both YDL118W and YDL119C confer defective telomere maintenance and are synthetically sick or lethal with alpha-synuclein +S000030066 CDS YDL118W 4 247302 247682 W 2004-02-11 1996-07-31 +S000002277 ORF Verified YDL119C HEM25 chromosome 4 4 247612 246689 C 2004-02-11 1996-07-31 Mitochondrial glycine transporter; required for the transport of glycine into mitochondria for initiation of heme biosynthesis, with YMC1 acting as a secondary transporter; homolog of human SLC25A38, a mitochondrial glycine transporter associated with nonsyndromic autosomal recessive congenital sideroblastic anemia; human SLC25A38 can complement the heme deficiency associated with the null mutant; GFP-fusion protein is induced in response to the DNA-damaging agent MMS +S000030189 CDS YDL119C 4 247612 246689 C 2004-02-11 1996-07-31 +S000002275 ORF Verified YDL117W CYK3 chromosome 4 4 248581 251238 W 2004-02-11 1996-07-31 SH3-domain protein located in the bud neck and cytokinetic actin ring; relocalizes from bud neck to nucleus upon DNA replication stress; activates the chitin synthase activity of Chs2p during cytokinesis; suppressor of growth and cytokinesis defects of chs2 phospho-mutants +S000029965 CDS YDL117W 4 248581 251238 W 2004-02-11 1996-07-31 +S000002274 ORF Verified YDL116W NUP84 chromosome 4 L000003137 4 251566 253746 W 2004-02-11 1996-07-31 Subunit of the Nup84p subcomplex of the nuclear pore complex (NPC); contributes to nucleocytoplasmic transport and NPC biogenesis; also plays roles in several processes that may require localization of genes or chromosomes at the nuclear periphery, including double-strand break repair, transcription and chromatin silencing; homologous to human NUP107 +S000029859 CDS YDL116W 4 251566 253746 W 2004-02-11 1996-07-31 +S000118431 ARS ARS410 ARSIV-254 chromosome 4 4 253791 254039 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178065 ARS_consensus_sequence ARS410 4 253948 253932 C 2014-11-18 2014-11-18 +S000007598 ORF Dubious YDL114W-A chromosome 4 4 254935 255048 W 2004-02-11 2001-02-26 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified based on homology to hemiascomycetous yeasts +S000037144 CDS YDL114W-A 4 254935 255048 W 2004-02-11 2001-02-26 +S000002273 ORF Verified YDL115C IWR1 chromosome 4 4 255126 253995 C 2007-07-10 2004-02-23|2007-07-10|1996-07-31|2004-01-23 RNA polymerase II transport factor, conserved from yeast to humans; also has a role in transporting RNA polymerase III into the nucleus; interacts with most of the RNAP II subunits; nucleo-cytoplasmic shuttling protein; deletion causes hypersensitivity to K1 killer toxin; protein increases in abundance and relocalizes from nucleus to cytoplasm upon DNA replication stress +S000123279 CDS YDL115C 4 254974 253995 C 2007-07-10 2007-07-10 +S000037159 CDS YDL115C 4 255126 255045 C 2007-07-10 2004-02-23|2007-07-10|1996-07-31|2004-01-23 +S000123278 intron YDL115C 4 255044 254975 C 2007-07-10 2007-07-10 +S000002272 ORF Uncharacterized YDL114W short-chain dehydrogenase/reductase chromosome 4 4 255604 256530 W 2004-02-11 1996-07-31 Putative short-chain dehydrogenase/reductase; YDL114W is not an essential gene +S000037093 CDS YDL114W 4 255604 256530 W 2004-02-11 1996-07-31 +S000130171 ARS ARS411 chromosome 4 4 256530 256633 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000002271 ORF Verified YDL113C ATG20 CVT20|SNX42 chromosome 4 4 258555 256633 C 2004-02-11 1996-07-31 Sorting nexin family member; required for the cytoplasm-to-vacuole targeting (Cvt) pathway and for endosomal sorting; has a Phox homology domain that binds phosphatidylinositol-3-phosphate; interacts with Snx4p; potential Cdc28p substrate +S000036989 CDS YDL113C 4 258555 256633 C 2004-02-11 1996-07-31 +S000002270 ORF Verified YDL112W TRM3 tRNA (guanosine(18)-2'-O)-methyltransferase chromosome 4 L000004920 4 258915 263225 W 2004-02-11 1996-07-31 2'-O-ribose methyltransferase; catalyzes the ribose methylation of the guanosine nucleotide at position 18 of tRNAs +S000036371 CDS YDL112W 4 258915 263225 W 2004-02-11 1996-07-31 +S000002269 ORF Verified YDL111C RRP42 exosome non-catalytic core subunit RRP42 chromosome 4 L000003551 4 264110 263313 C 2004-02-11 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp42p (EXOSC7) +S000036214 CDS YDL111C 4 264110 263313 C 2004-02-11 1996-07-31 +S000002268 ORF Verified YDL110C TMA17 ADC17 chromosome 4 S000154294 4 264964 264512 C 2004-02-11 1996-07-31 ATPase dedicated chaperone that adapts proteasome assembly to stress; Tma17p is induced upon stress; interacts with Rpt6p to assist its pairing to Rpt3p and early steps in proteasome biogenesis; associates with ribosomes; heterozygous deletion demonstrated increases in chromosome instability in a rad9 deletion background; protein abundance is decreased upon intracellular iron depletion +S000036093 CDS YDL110C 4 264964 264512 C 2004-02-11 1996-07-31 +S000002267 ORF Uncharacterized YDL109C putative lipase chromosome 4 4 267201 265258 C 2004-02-11 1996-07-31 Putative lipase; involved in lipid metabolism; not an essential gene; YDL109C has a paralog, ROG1, that arose from the whole genome duplication +S000033934 CDS YDL109C 4 267201 265258 C 2004-02-11 1996-07-31 +S000002266 ORF Verified YDL108W KIN28 TFIIH complex serine/threonine-protein kinase subunit KIN28 chromosome 4 L000000905 4 267698 268699 W 2004-02-11 1996-07-31 Serine/threonine protein kinase, subunit of transcription factor TFIIH; involved in transcription initiation at RNA polymerase II promoters; phosphorylates Ser5 residue of the PolII C-terminal domain (CTD) at gene promoters; relocalizes to the cytosol in response to hypoxia +S000033868 CDS YDL108W 4 267698 267725 W 2004-02-11 1996-07-31 +S000033869 CDS YDL108W 4 267807 268699 W 2004-02-11 1996-07-31 +S000033870 intron YDL108W 4 267726 267806 W 2004-02-11 1996-07-31 +S000002265 ORF Verified YDL107W MSS2 chromosome 4 L000001202 4 268921 269976 W 2004-02-11 1996-07-31 Peripherally bound inner membrane protein of the mitochondrial matrix; involved in membrane insertion of C-terminus of Cox2p, interacts genetically and physically with Cox18p +S000033109 CDS YDL107W 4 268921 269976 W 2004-02-11 1996-07-31 +S000002264 ORF Verified YDL106C PHO2 phoB|GRF10|BAS2 chromosome 4 L000000728 4 271901 270222 C -58.01 2004-02-11 1996-07-31 Homeobox transcription factor; regulatory targets include genes involved in phosphate metabolism; binds cooperatively with Pho4p to the PHO5 promoter; phosphorylation of Pho2p facilitates interaction with Pho4p; relocalizes to the cytosol in response to hypoxia +S000032983 CDS YDL106C 4 271901 270222 C 2004-02-11 1996-07-31 +S000002263 ORF Verified YDL105W NSE4 Smc5-Smc6 complex subunit NSE4|QRI2 chromosome 4 L000002653 4 272389 273597 W 2004-02-11 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair +S000032948 CDS YDL105W 4 272389 273597 W 2004-02-11 1996-07-31 +S000002262 ORF Verified YDL104C QRI7 putative N(6)-L-threonylcarbamoyladenine synthase chromosome 4 L000002654 4 274876 273653 C 2004-02-11 1996-07-31 Protein involved in threonylcarbamoyl adenosine biosynthesis; Sua5p and Qri7p are necessary and sufficient for RNA t6A modification in vitro; highly conserved mitochondrial protein; essential for t6A modification of mitochondrial tRNAs that decode ANN codons; similar to Kae1p and E. coli YgjD, both of which are also required for tRNA t6A modification; when directed to the cytoplasm, complements the essential function of Kae1p in the KEOPS complex +S000031963 CDS YDL104C 4 274876 273653 C 2004-02-11 1996-07-31 +S000002261 ORF Verified YDL103C QRI1 UDP-N-acetylglucosamine diphosphorylase|UAP1 chromosome 4 L000002652 4 276581 275148 C 2004-02-11 1996-07-31 UDP-N-acetylglucosamine pyrophosphorylase; catalyzes the formation of UDP-N-acetylglucosamine (UDP-GlcNAc), which is important in cell wall biosynthesis, protein N-glycosylation, and GPI anchor biosynthesis; protein abundance increases in response to DNA replication stress +S000031867 CDS YDL103C 4 276581 275148 C 2004-02-11 1996-07-31 +S000002260 ORF Verified YDL102W POL3 DNA-directed DNA polymerase delta POL3|CDC2|TEX1|HPR6 chromosome 4 L000000242 4 276872 280165 W -55 2004-02-11 1996-07-31|2011-02-03 Catalytic subunit of DNA polymerase delta; required for chromosomal DNA replication during mitosis and meiosis, intragenic recombination, repair of double strand DNA breaks, and DNA replication during nucleotide excision repair (NER) +S000031813 CDS YDL102W 4 276872 280165 W 2004-02-11 1996-07-31|2011-02-03 +S000002259 ORF Verified YDL101C DUN1 serine/threonine protein kinase DUN1 chromosome 4 L000000531 4 281848 280307 C 2004-02-11 1996-07-31 Cell-cycle checkpoint S/T protein kinase; required for transient G2/M arrest after DNA damage, damage-induced transcription, and nuclear-to-cytoplasmic redistribution of Rnr2p-Rnr4p after genotoxic stress and iron deprivation; phosphorylates repair protein Rad55p, transcriptional repressor Sml1p, superoxide dismutase, and ribonucleotide reductase inhibitors Crt1p and Dif1p; functions in the Mec1p pathway to regulate dNTP pools and telomere length; postreplicative repair role +S000031605 CDS YDL101C 4 281848 280307 C 2004-02-11 1996-07-31 +S000002258 ORF Verified YDL100C GET3 guanine nucleotide exchange factor GET3|ARR4 chromosome 4 4 283176 282112 C 2004-02-11 1996-07-31 Guanine nucleotide exchange factor for Gpa1p; amplifies G protein signaling; functions as a chaperone under ATP-depleted oxidative stress conditions; subunit of GET complex, involved in ATP dependent Golgi to ER trafficking and insertion of tail-anchored (TA) proteins into ER membrane under non-stress conditions; binds as dimer to transmembrane domain (TMD) cargo, shielding TMDs from aqueous solvent; protein abundance increases under DNA replication stress +S000030758 CDS YDL100C 4 283176 282112 C 2004-02-11 1996-07-31 +S000002257 ORF Verified YDL099W BUG1 chromosome 4 4 283419 284444 W 2004-02-11 1996-07-31 Cis-golgi localized protein involved in ER to Golgi transport; forms a complex with the mammalian GRASP65 homolog, Grh1p; mutants are compromised for the fusion of ER-derived vesicles with Golgi membranes +S000034178 CDS YDL099W 4 283419 284444 W 2004-02-11 1996-07-31 +S000002256 ORF Verified YDL098C SNU23 U4/U6-U5 snRNP complex subunit SNU23 chromosome 4 4 285165 284581 C 2004-02-11 1996-07-31 Component of the U4/U6.U5 snRNP complex; involved in mRNA splicing via spliceosome +S000034033 CDS YDL098C 4 285165 284581 C 2004-02-11 1996-07-31 +S000002255 ORF Verified YDL097C RPN6 proteasome regulatory particle lid subunit RPN6|NAS4 chromosome 4 L000004306 4 286695 285391 C 2004-02-11 1996-07-31 Essential, non-ATPase regulatory subunit of the 26S proteasome lid; required for the assembly and activity of the 26S proteasome; the human homolog (S9 protein) partially rescues Rpn6p depletion; protein abundance increases in response to DNA replication stress +S000033908 CDS YDL097C 4 286695 285391 C 2004-02-11 1996-07-31 +S000002253 ORF Verified YDL095W PMT1 dolichyl-phosphate-mannose-protein mannosyltransferase PMT1 chromosome 4 L000001458 4 287059 289512 W 2004-02-11 1996-07-31 Protein O-mannosyltransferase of the ER membrane; transfers mannose from dolichyl phosphate-D-mannose to protein serine and threonine residues; 1 of 7 related proteins involved in O-glycosylation which is essential for cell wall rigidity; involved in ER quality control; amino terminus faces cytoplasm, carboxyl terminus faces ER lumen +S000033095 CDS YDL095W 4 287059 289512 W 2004-02-11 1996-07-31 +S000002254 ORF Dubious YDL096C OPI6 chromosome 4 4 287324 286998 C 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene PMT1/YDL095W; YDL096C is not essential +S000033140 CDS YDL096C 4 287324 286998 C 2004-02-11 1996-07-31 +S000002251 ORF Verified YDL093W PMT5 putative dolichyl-phosphate-mannose-protein mannosyltransferase PMT5 chromosome 4 L000003164 4 289909 292140 W 2004-02-11 1996-07-31 Protein O-mannosyltransferase; transfers mannose residues from dolichyl phosphate-D-mannose to protein serine/threonine residues; acts in a complex with Pmt3p, can instead interact with Pmt2p in some conditions; target for new antifungals +S000032094 CDS YDL093W 4 289909 292140 W 2004-02-11 1996-07-31 +S000002252 ORF Dubious YDL094C chromosome 4 4 290081 289572 C 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verfied gene PMT5/YDL093W; YDL094C is not essential +S000032962 CDS YDL094C 4 290081 289572 C 2004-02-11 1996-07-31 +S000002250 ORF Verified YDL092W SRP14 RNA-binding signal recognition particle subunit SRP14 chromosome 4 L000002061 4 292781 293221 W 2004-02-11 1996-07-31 Signal recognition particle (SRP) subunit; interacts with the RNA component of SRP to form the Alu domain, which is the region of SRP responsible for arrest of nascent chain elongation during membrane targeting; homolog of mammalian SRP14 +S000031975 CDS YDL092W 4 292781 293221 W 2004-02-11 1996-07-31 +S000002249 ORF Verified YDL091C UBX3 chromosome 4 4 294759 293392 C 2004-02-11 1996-07-31 Clathrin-coated vesicle component, regulator of endocytosis; copurifies with the DSC ubiquitin ligase complex; UBX (ubiquitin regulatory X) domain-containing protein that interacts with Cdc48p; required for efficient clathrin-mediated endocytosis; ortholog of fission yeast Ucp10 +S000030889 CDS YDL091C 4 294759 293392 C 2004-02-11 1996-07-31 +S000002248 ORF Verified YDL090C RAM1 protein farnesyltransferase|STE16|SGP2|SCG2|FUS8|DPR1 chromosome 4 L000001579 4 296329 295034 C -33 2004-02-11 1996-07-31 Beta subunit of the CAAX farnesyltransferase (FTase); this complex prenylates the a-factor mating pheromone and Ras proteins; required for the membrane localization of Ras proteins and a-factor; homolog of the mammalian FTase beta subunit +S000030792 CDS YDL090C 4 296329 295034 C 2004-02-11 1996-07-31 +S000002247 ORF Verified YDL089W NUR1 chromosome 4 4 296820 298274 W 2004-02-11 1996-07-31 Protein involved in regulation of mitotic exit; dephosphorylation target of Cdc14p in anaphase, which promotes timely rDNA segregation and allows mitotic progression; interacts with Csm1p, Lrs4p; required for rDNA repeat stability; null mutant causes increase in unequal sister-chromatid exchange; GFP-fusion protein localizes to the nuclear periphery, possible Cdc28p substrate +S000037902 CDS YDL089W 4 296820 298274 W 2004-02-11 1996-07-31 +S000002246 ORF Verified YDL088C ASM4 FG-nucleoporin ASM4|NUP59 chromosome 4 L000002642 4 300003 298417 C 2004-02-11 1996-07-31 FG-nucleoporin component of central core of nuclear pore complex (NPC); contributes directly to nucleocytoplasmic transport; induces membrane tubulation, which may contribute to nuclear pore assembly; ASM4 has a paralog, NUP53, that arose from the whole genome duplication +S000037765 CDS YDL088C 4 300003 298417 C 2004-02-11 1996-07-31 +S000002245 ORF Verified YDL087C LUC7 EPE1|EXM2 chromosome 4 L000003348 4 300999 300214 C 2004-02-11 1996-07-31 Essential protein associated with the U1 snRNP complex; splicing factor involved in recognition of 5' splice site; contains two zinc finger motifs; N-terminal zinc finger binds pre-mRNA; relocalizes to the cytosol in response to hypoxia +S000037703 CDS YDL087C 4 300999 300214 C 2004-02-11 1996-07-31 +S000002244 ORF Uncharacterized YDL086W carboxymethylenebutenolidase chromosome 4 4 301413 302234 W 2004-02-11 1996-07-31 Putative carboxymethylenebutenolidase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YDL086W is not an essential gene +S000036968 CDS YDL086W 4 301413 302234 W 2004-02-11 1996-07-31 +S000028611 ORF Dubious YDL086C-A chromosome 4 4 302089 301655 C 2004-02-11 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps uncharacterized ORF YDL086W; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031442 CDS YDL086C-A 4 302089 301655 C 2004-02-11 2003-07-29 +S000007588 ORF Uncharacterized YDL085C-A chromosome 4 4 302670 302464 C 2004-02-11 2001-01-30 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus +S000037099 CDS YDL085C-A 4 302670 302464 C 2004-02-11 2001-01-30 +S000002243 ORF Verified YDL085W NDE2 NADH-ubiquinone reductase (H(+)-translocating) NDE2|NDH2 chromosome 4 4 303211 304848 W 2004-02-11 1996-07-31 Mitochondrial external NADH dehydrogenase; catalyzes the oxidation of cytosolic NADH; Nde1p and Nde2p are involved in providing the cytosolic NADH to the mitochondrial respiratory chain; NDE2 has a paralog, NDE1, that arose from the whole genome duplication +S000036900 CDS YDL085W 4 303211 304848 W 2004-02-11 1996-07-31 +S000002242 ORF Verified YDL084W SUB2 ATP-dependent RNA helicase SUB2 chromosome 4 L000004574 4 305237 306577 W 2004-02-11 1996-07-31 Component of the TREX complex required for nuclear mRNA export; member of the DEAD-box RNA helicase superfamily and is involved in early and late steps of spliceosome assembly; homolog of the human splicing factor hUAP56; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000036856 CDS YDL084W 4 305237 306577 W 2004-02-11 1996-07-31 +S000002241 ORF Verified YDL083C RPS16B uS9|ribosomal 40S subunit protein S16B|S9|rp61R|S16B chromosome 4 L000004478 4 307789 306926 C 2004-02-11 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S16 and bacterial S9; RPS16B has a paralog, RPS16A, that arose from the whole genome duplication +S000035913 CDS YDL083C 4 307333 306926 C 2004-02-11 1996-07-31 +S000035912 CDS YDL083C 4 307789 307766 C 2004-02-11 1996-07-31 +S000035914 intron YDL083C 4 307765 307334 C 2004-02-11 1996-07-31 +S000002240 ORF Verified YDL082W RPL13A eL13|ribosomal 60S subunit protein L13A|L13e|L13A chromosome 4 L000004454 4 308424 309388 W 2004-02-11 1996-07-31 Ribosomal 60S subunit protein L13A; not essential for viability; homologous to mammalian ribosomal protein L13, no bacterial homolog; RPL13A has a paralog, RPL13B, that arose from the whole genome duplication +S000035860 CDS YDL082W 4 308424 308427 W 2004-02-11 1996-07-31 +S000035861 CDS YDL082W 4 308793 309388 W 2004-02-11 1996-07-31 +S000035862 intron YDL082W 4 308428 308792 W 2004-02-11 1996-07-31 +S000002239 ORF Verified YDL081C RPP1A P1A|ribosomal protein P1A|RPLA1 chromosome 4 L000002627 4 310122 309802 C 2004-02-11 1996-07-31 Ribosomal stalk protein P1 alpha; involved in the interaction between translational elongation factors and the ribosome; free (non-ribosomal) P1 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; accumulation of P1 in the cytoplasm is regulated by phosphorylation and interaction with the P2 stalk component +S000035711 CDS YDL081C 4 310122 309802 C 2004-02-11 1996-07-31 +S000002238 ORF Verified YDL080C THI3 branched-chain-2-oxoacid decarboxylase THI3|KID1 chromosome 4 L000003499 4 312471 310642 C 2004-02-11 1996-07-31 Regulatory protein that binds Pdc2p and Thi2p transcription factors; activates thiamine biosynthesis transcription factors Pdc2p and Thi2p by binding to them, but releases and de-activates them upon binding to thiamine pyrophosphate (TPP), the end product of the pathway; has similarity to decarboxylases but enzymatic activity is not detected +S000035644 CDS YDL080C 4 312471 310642 C 2004-02-11 1996-07-31 +S000002237 ORF Verified YDL079C MRK1 putative serine/threonine protein kinase MRK1 chromosome 4 L000001151 4 314748 312951 C 2004-02-11 1996-07-31 Glycogen synthase kinase 3 (GSK-3) homolog; one of four GSK-3 homologs in S. cerevisiae that function to activate Msn2p-dependent transcription of stress responsive genes and that function in protein degradation; MRK1 has a paralog, RIM11, that arose from the whole genome duplication +S000033718 CDS YDL079C 4 314044 312951 C 2004-02-11 1996-07-31 +S000033717 CDS YDL079C 4 314748 314337 C 2004-02-11 1996-07-31 +S000033719 intron YDL079C 4 314336 314045 C 2004-02-11 1996-07-31 +S000002236 ORF Verified YDL078C MDH3 malate dehydrogenase MDH3 chromosome 4 L000001047 4 316388 315357 C 2004-02-11 1996-07-31 Peroxisomal malate dehydrogenase; catalyzes interconversion of malate and oxaloacetate; involved in the glyoxylate cycle +S000033624 CDS YDL078C 4 316388 315357 C 2004-02-11 1996-07-31 +S000130172 ARS ARS412 chromosome 4 4 316771 317230 2014-11-18 2014-11-18|2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000178066 ARS_consensus_sequence ARS412 4 316862 316878 W 2014-11-18 2014-11-18 +S000002235 ORF Verified YDL077C VAM6 VPS39|VPL22|VPL18|CVT4 chromosome 4 L000003935 4 320120 316971 C 2004-02-11 1996-07-31 Guanine nucleotide exchange factor for the GTPase Gtr1p; subunit of the HOPS endocytic tethering complex; vacuole membrane protein; functions as a Rab GTPase effector, interacting with both GTP- and GDP-bound conformations of Ypt7p; facilitates tethering and promotes membrane fusion events at the late endosome and vacuole; required for both membrane and protein trafficking; component of vacuole-mitochondrion contacts (vCLAMPs) important for lipid transfer between organelles +S000033526 CDS YDL077C 4 320120 316971 C 2004-02-11 1996-07-31 +S000002234 ORF Verified YDL076C RXT3 chromosome 4 4 321552 320668 C 2004-02-11 1996-07-31 Component of the Rpd3L histone deacetylase complex; involved in histone deacetylation; protein abundance increases in response to DNA replication stress +S000032814 CDS YDL076C 4 321552 320668 C 2004-02-11 1996-07-31 +S000002233 ORF Verified YDL075W RPL31A eL31|ribosomal 60S subunit protein L31A|L31e|YL28|L34A|L31A|RPL34 chromosome 4 L000003297|L000001727 4 322226 322988 W 2004-02-11 1996-07-31 Ribosomal 60S subunit protein L31A; associates with karyopherin Sxm1p; loss of both Rpl31p and Rpl39p confers lethality; homologous to mammalian ribosomal protein L31, no bacterial homolog; RPL31A has a paralog, RPL31B, that arose from the whole genome duplication +S000032744 CDS YDL075W 4 322226 322282 W 2004-02-11 1996-07-31 +S000032745 CDS YDL075W 4 322704 322988 W 2004-02-11 1996-07-31 +S000032746 intron YDL075W 4 322283 322703 W 2004-02-11 1996-07-31 +S000006454 snoRNA_gene snR63 SNR63 chromosome 4 L000004532 4 323471 323217 C 2004-02-11 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2256 +S000030842 noncoding_exon snR63 4 323471 323217 C 2004-02-11 2000-05-19 +S000002232 ORF Verified YDL074C BRE1 E3 ubiquitin-protein ligase BRE1 chromosome 4 4 326149 324047 C 2004-02-11 1996-07-31 E3 ubiquitin ligase; forms heterodimer with Rad6p to regulate K63 polyubiquitination in response to oxidative stress and to monoubiquinate histone H2B-K123, which is required for the subsequent methylation of histone H3-K4 and H3-K79; required for DSBR, transcription, silencing, and checkpoint control; interacts with RNA-binding protein Npl3p, linking histone ubiquitination to mRNA processing; Bre1p-dependent histone ubiquitination promotes pre-mRNA splicing +S000032572 CDS YDL074C 4 326149 324047 C 2004-02-11 1996-07-31 +S000002231 ORF Verified YDL073W AHK1 chromosome 4 4 326613 329567 W 2004-02-11 1996-07-31 Scaffold protein in the HKR1 sub-branch of the Hog1p-signaling pathway; physically interacts with the cytoplasmic domain of Hkr1p, and with Sho1p, Pbs2p, and Ste11p; prevents cross-talk signaling from Hkr1p of the osmotic stress MAPK cascade to the Kss1p MAPK cascade; non-essential gene +S000032520 CDS YDL073W 4 326613 329567 W 2004-02-11 1996-07-31 +S000118432 ARS ARS413 ARSIV-330 chromosome 4 4 329566 329814 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000178067 ARS_consensus_sequence ARS413 4 329671 329687 W 2014-11-18 2014-11-18 +S000002230 ORF Verified YDL072C YET3 chromosome 4 4 330447 329836 C 2004-02-11 1996-07-31 Protein of unknown function; YET3 null mutant decreases the level of secreted invertase; homolog of human BAP31 protein; protein abundance increases in response to DNA replication stress +S000031514 CDS YDL072C 4 330447 329836 C 2004-02-11 1996-07-31 +S000002228 ORF Verified YDL070W BDF2 chromosome 4 L000004431 4 331024 332940 W 2011-02-03 1996-07-31 Protein involved in transcription initiation; acts at TATA-containing promoters; associates with the basal transcription factor TFIID; contains two bromodomains; corresponds to the C-terminal region of mammalian TAF1; redundant with Bdf1p; protein abundance increases in response to DNA replication stress; BDF2 has a paralog, BDF1, that arose from the whole genome duplication +S000031410 CDS YDL070W 4 331024 332940 W 2011-02-03 1996-07-31 +S000002229 ORF Dubious YDL071C IRC1 chromosome 4 4 331040 330666 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF BDF2/YDL070W +S000031459 CDS YDL071C 4 331040 330666 C 2011-02-03 1996-07-31 +S000002226 ORF Dubious YDL068W chromosome 4 4 333500 333829 W 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030510 CDS YDL068W 4 333500 333829 W 2004-02-11 1996-07-31 +S000002227 ORF Verified YDL069C CBS1 chromosome 4 L000000230 4 333810 333121 C 2004-02-11 2003-09-22|1996-07-31 Mitochondrial translational activator of the COB mRNA; membrane protein that interacts with translating ribosomes, acts on the COB mRNA 5'-untranslated leader +S000030553 CDS YDL069C 4 333810 333121 C 2004-02-11 2003-09-22|1996-07-31 +S000002225 ORF Verified YDL067C COX9 cytochrome c oxidase subunit VIIa chromosome 4 L000000393 4 334396 334217 C 2004-02-11 1996-07-31 Subunit VIIa of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain +S000037632 CDS YDL067C 4 334396 334217 C 2004-02-11 1996-07-31 +S000002224 ORF Verified YDL066W IDP1 isocitrate dehydrogenase (NADP(+)) IDP1 chromosome 4 L000000852 4 334835 336121 W 2004-02-11 1996-07-31 Mitochondrial NADP-specific isocitrate dehydrogenase; catalyzes the oxidation of isocitrate to alpha-ketoglutarate; not required for mitochondrial respiration and may function to divert alpha-ketoglutarate to biosynthetic processes +S000037594 CDS YDL066W 4 334835 336121 W 2004-02-11 1996-07-31 +S000002223 ORF Verified YDL065C PEX19 PAS12 chromosome 4 L000003965 4 337277 336249 C 2006-04-12 1996-07-31|2006-04-12 Chaperone and import receptor for newly-synthesized class I PMPs; binds peroxisomal membrane proteins (PMPs) in the cytoplasm and delivers them to the peroxisome for subsequent insertion into the peroxisomal membrane; interacts with Myo2p and contributes to peroxisome partitioning +S000037387 CDS YDL065C 4 337277 336249 C 2006-04-12 1996-07-31|2006-04-12 +S000002222 ORF Verified YDL064W UBC9 E2 SUMO-conjugating protein UBC9 chromosome 4 L000002636 4 337487 338070 W 2004-02-11 1996-07-31 SUMO-conjugating enzyme involved in the Smt3p conjugation pathway; nuclear protein required for S- and M-phase cyclin degradation and mitotic control; involved in proteolysis mediated by the anaphase-promoting complex cyclosome (APCC) +S000036730 CDS YDL064W 4 337487 337524 W 2004-02-11 1996-07-31 +S000036731 CDS YDL064W 4 337635 338070 W 2004-02-11 1996-07-31 +S000036732 intron YDL064W 4 337525 337634 W 2004-02-11 1996-07-31 +S000002220 ORF Dubious YDL062W chromosome 4 4 339857 340282 W 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YDL063C; YDL062W is not essential +S000036515 CDS YDL062W 4 339857 340282 W 2004-02-11 1996-07-31 +S000002221 ORF Verified YDL063C SYO1 chromosome 4 4 340134 338272 C 2004-02-11 1996-07-31 Transport adaptor or symportin; facilitates synchronized nuclear coimport of the two 5S-rRNA binding proteins Rpl5p and Rpl11p; binds to nascent Rpl5p during translation; required for biogenesis of the large ribosomal subunit; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus +S000036559 CDS YDL063C 4 340134 338272 C 2004-02-11 1996-07-31 +S000002219 ORF Verified YDL061C RPS29B uS14|ribosomal 40S subunit protein S29B|S14|YS29|S36B|S29B|YS29B chromosome 4 L000002550 4 340798 340628 C 2004-02-11 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S29 and bacterial S14; RPS29B has a paralog, RPS29A, that arose from the whole genome duplication +S000035564 CDS YDL061C 4 340798 340628 C 2004-02-11 1996-07-31 +S000122093 five_prime_UTR_intron YDL061C 4 341219 340811 C 2007-04-04 2007-04-04 +S000002218 ORF Verified YDL060W TSR1 chromosome 4 4 341619 343985 W 2004-02-11 1996-07-31 Protein required for processing of 20S pre-rRNA in the cytoplasm; associates with pre-40S ribosomal particles; inhibits the premature association of 60S subunits with assembling 40S subunits in the cytoplasm; similar to Bms1p; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000035549 CDS YDL060W 4 341619 343985 W 2004-02-11 1996-07-31 +S000002217 ORF Verified YDL059C RAD59 chromosome 4 L000003987 4 344953 344237 C 2004-02-11 1996-07-31 Protein involved DNA double-strand break repair; repairs breaks in DNA during vegetative growth via recombination and single-strand annealing; anneals complementary single-stranded DNA; forms nuclear foci upon DNA replication stress; required for loading of Rad52p to DSBs; regulates replication fork progression in DNA ligase I-deficient cells; paralog of Rad52p +S000035590 CDS YDL059C 4 344953 344237 C 2004-02-11 1996-07-31 +S000002216 ORF Verified YDL058W USO1 INT1 chromosome 4 L000002446 4 345665 351037 W 2004-02-11 1996-07-31 Essential protein involved in vesicle-mediated ER to Golgi transport; binds membranes and functions during vesicle docking to the Golgi; required for assembly of the ER-to-Golgi SNARE complex +S000035550 CDS YDL058W 4 345665 351037 W 2004-02-11 1996-07-31 +S000002215 ORF Uncharacterized YDL057W chromosome 4 4 351434 352420 W 2004-02-11 1996-07-31 Putative protein of unknown function; YDL057W is not an essential gene +S000034554 CDS YDL057W 4 351434 352420 W 2004-02-11 1996-07-31 +S000002214 ORF Verified YDL056W MBP1 transcription factor MBP1 chromosome 4 L000001032 4 352877 355378 W 2004-02-11 1996-07-31 Transcription factor; involved in regulation of cell cycle progression from G1 to S phase, forms a complex with Swi6p that binds to MluI cell cycle box regulatory element in promoters of DNA synthesis genes +S000034419 CDS YDL056W 4 352877 355378 W 2004-02-11 1996-07-31 +S000002213 ORF Verified YDL055C PSA1 mannose-1-phosphate guanylyltransferase|SRB1|VIG9|MPG1 chromosome 4 L000002625|L000002860|L000002049 4 356759 355674 C 2004-02-11 1996-07-31 GDP-mannose pyrophosphorylase (mannose-1-phosphate guanyltransferase); synthesizes GDP-mannose from GTP and mannose-1-phosphate in cell wall biosynthesis; required for normal cell wall structure +S000034293 CDS YDL055C 4 356759 355674 C 2004-02-11 1996-07-31 +S000006629 tRNA_gene tK(UUU)D chromosome 4 L000003762|S000007415 4 359577 359672 W 2004-02-11 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034182 intron tK(UUU)D 4 359614 359636 W 2004-02-11 2000-05-19 +S000034180 noncoding_exon tK(UUU)D 4 359577 359613 W 2004-02-11 2000-05-19 +S000034181 noncoding_exon tK(UUU)D 4 359637 359672 W 2004-02-11 2000-05-19 +S000002212 ORF Verified YDL054C MCH1 chromosome 4 4 361285 359825 C 2004-02-11 1996-07-31 Protein with similarity to mammalian monocarboxylate permeases; monocarboxylate permeases are involved in transport of monocarboxylic acids across the plasma membrane but mutant is not deficient in monocarboxylate transport +S000033372 CDS YDL054C 4 361285 359825 C 2004-02-11 1996-07-31 +S000002211 ORF Verified YDL053C PBP4 chromosome 4 4 362256 361699 C 2004-02-11 1996-07-31 Pbp1p binding protein; interacts strongly with Pab1p-binding protein 1 (Pbp1p) in the yeast two-hybrid system; also interacts with Lsm12p in a copurification assay; relative distribution to the nucleus increases upon DNA replication stress +S000033305 CDS YDL053C 4 362256 361699 C 2004-02-11 1996-07-31 +S000002210 ORF Verified YDL052C SLC1 1-acylglycerol-3-phosphate O-acyltransferase SLC1 chromosome 4 L000001914 4 363583 362672 C 2004-02-11 1996-07-31 1-acyl-sn-glycerol-3-phosphate acyltransferase; catalyzes the acylation of lysophosphatidic acid to form phosphatidic acid, a key intermediate in lipid metabolism; enzymatic activity detected in lipid particles and microsomes +S000033244 CDS YDL052C 4 363583 362672 C 2004-02-11 1996-07-31 +S000002209 ORF Verified YDL051W LHP1 YLA1|LAH1 chromosome 4 L000002518 4 363952 364779 W 2004-02-11 1996-07-31 RNA binding protein required for maturation of tRNA and U6 snRNA; acts as a molecular chaperone for RNAs transcribed by polymerase III; homologous to human La (SS-B) autoantigen +S000033227 CDS YDL051W 4 363952 364779 W 2004-02-11 1996-07-31 +S000002208 ORF Dubious YDL050C chromosome 4 4 364817 364446 C 2004-02-11 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032313 CDS YDL050C 4 364817 364446 C 2004-02-11 1996-07-31 +S000002207 ORF Verified YDL049C KNH1 chromosome 4 L000002837 4 365874 365068 C 2004-02-11 1996-07-31 Protein with similarity to Kre9p; Kre9p is involved in cell wall beta 1,6-glucan synthesis; overproduction suppresses growth defects of a kre9 null mutant; required for propionic acid resistance +S000031388 CDS YDL049C 4 365874 365068 C 2004-02-11 1996-07-31 +S000002206 ORF Verified YDL048C STP4 chromosome 4 L000003372 4 368211 366739 C 2004-02-11 1999-02-09|1996-07-31 Protein containing a Kruppel-type zinc-finger domain; similar to Stp1p, Stp2p; predicted transcription factor; relative distribution to the nucleus increases upon DNA replication stress; STP4 has a paralog, STP3, that arose from the whole genome duplication +S000031282 CDS YDL048C 4 368211 366739 C 2004-02-11 1999-02-09|1996-07-31 +S000002205 ORF Verified YDL047W SIT4 type 2A-related serine/threonine-protein phosphatase SIT4|PPH1 chromosome 4 L000001901 4 369771 370706 W 2011-02-03 1996-07-31 Ceramide-activated, type 2A-related serine-threonine phosphatase; functions in G1/S transition of mitotic cycle; controls lifespan, mitochondrial function, cell cycle progression by regulating HXK2 phosphorylation; regulator of COPII coat dephosphorylation; required for ER to Golgi traffic; interacts with Hrr25p kinase; cytoplasmic and nuclear protein that modulates functions mediated by Pkc1p including cell wall and actin cytoskeleton organization; similar to human PP6 +S000031218 CDS YDL047W 4 369771 370706 W 2011-02-03 1996-07-31 +S000002204 ORF Verified YDL046W NPC2 sterol transporter chromosome 4 S000028462 4 371240 371761 W 2011-02-03 1996-07-31 Sterol transport protein and functional homolog of human NPC2/He1; human NPC2 is a cholesterol-binding protein whose deficiency causes Niemann-Pick type C2 disease involving retention of cholesterol in lysosomes; yeast NPC2 can complement mutations in human NPC2 +S000031100 CDS YDL046W 4 371240 371761 W 2011-02-03 1996-07-31 +S000006430 ORF Verified YDL045W-A MRP10 mitochondrial 37S ribosomal protein YmS-T|YmS-T chromosome 4 L000003390 4 372248 372535 W 2011-02-03 1999-07-17 Mitochondrial ribosomal protein of the small subunit; contains twin cysteine-x9-cysteine motifs; oxidized by Mia40p during import into mitochondria +S000032810 CDS YDL045W-A 4 372248 372535 W 2011-02-03 1999-07-17 +S000002203 ORF Verified YDL045C FAD1 FMN adenylyltransferase chromosome 4 L000000598 4 373608 372688 C 2011-02-03 1996-07-31 Flavin adenine dinucleotide (FAD) synthetase; performs the second step in synthesis of FAD from riboflavin; mutation is functionally complemented by human FLAD1 +S000030018 CDS YDL045C 4 373608 372688 C 2011-02-03 1996-07-31 +S000002202 ORF Verified YDL044C MTF2 NAM1 chromosome 4 L000001212 4 375289 373967 C -17.93 2011-02-03 1996-07-31 Mitochondrial protein that interacts with mitochondrial RNA polymerase; interacts with an N-terminal region of mitochondrial RNA polymerase (Rpo41p) and couples RNA processing and translation to transcription +S000029908 CDS YDL044C 4 375289 373967 C 2011-02-03 1996-07-31 +S000002201 ORF Verified YDL043C PRP11 RNA11 chromosome 4 L000001502 4 376480 375680 C -17.13 2011-02-03 1996-07-31 Subunit of the SF3a splicing factor complex; required for spliceosome assembly +S000037237 CDS YDL043C 4 376480 375680 C 2011-02-03 1996-07-31 +S000002199 ORF Dubious YDL041W chromosome 4 4 378102 378455 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SIR2/YDL042C +S000037091 CDS YDL041W 4 378102 378455 W 2011-02-03 1996-07-31 +S000002200 ORF Verified YDL042C SIR2 NAD-dependent histone deacetylase SIR2|MAR1 chromosome 4 L000001895 4 378445 376757 C -16.03 2011-02-03 1996-07-31 Conserved NAD+ dependent histone deacetylase of the Sirtuin family; deacetylation targets are primarily nuclear proteins; required for telomere hypercluster formation in quiescent yeast cells; involved in regulation of lifespan; plays roles in silencing at HML, HMR, telomeres, and rDNA; negatively regulates initiation of DNA replication; functions as regulator of autophagy like mammalian homolog SIRT1, and also of mitophagy +S000037155 CDS YDL042C 4 378445 376757 C 2011-02-03 1996-07-31 +S000002198 ORF Verified YDL040C NAT1 peptide alpha-N-acetyltransferase complex A subunit NAT1|NAA15|AAA1 chromosome 4 L000000002 4 381438 378874 C -14.93 2011-02-03 1996-07-31 Subunit of protein N-terminal acetyltransferase NatA; NatA comprised of Nat1p, Ard1p, and Nat5p; N-terminally acetylates many proteins to influence multiple processes such as cell cycle progression, heat-shock resistance, mating, sporulation, telomeric silencing and early stages of mitophagy; orthologous to human NAA15; expression of both human NAA10 and NAA15 functionally complements ard1 nat1 double mutant although single mutations are not complemented by their orthologs +S000036986 CDS YDL040C 4 381438 378874 C 2011-02-03 1996-07-31 +S000002197 ORF Verified YDL039C PRM7 pheromone-regulated protein PRM7|YDL038C chromosome 4 4 384081 381985 C 2011-02-03 1996-07-31|2008-06-05 Pheromone-regulated protein; predicted to have one transmembrane segment; promoter contains Gcn4p binding elements; in W303 strain one continuous open reading frame comprising of YDL037C, the intergenic region and YDL039C encodes the IMI1 +S000035141 CDS YDL039C 4 384081 381985 C 2011-02-03 1996-07-31|2008-06-05 +S000002195 ORF Verified YDL037C BSC1 chromosome 4 4 385587 384601 C 2011-02-03 1996-07-31 Protein of unconfirmed function; similar to cell surface flocculin Flo11p; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; in W303 strain one continuous open reading frame comprising of YDL037C, the intergenic region and YDL039C encodes the gene IMI1 +S000034059 CDS YDL037C 4 385587 384601 C 2011-02-03 1996-07-31 +S000002194 ORF Verified YDL036C PUS9 pseudouridine synthase PUS9 chromosome 4 4 388901 387513 C 2011-02-03 1996-07-31 Mitochondrial tRNA:pseudouridine synthase; catalyzes the formation of pseudouridine at position 32 in mitochondrial tRNAs; contains an N-terminal mitochondrial targeting sequence; PUS9 has a paralog, RIB2, that arose from the whole genome duplication +S000033903 CDS YDL036C 4 388901 387513 C 2011-02-03 1996-07-31 +S000002192 ORF Dubious YDL034W chromosome 4 4 391783 392127 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps with verified gene GPR1/YDL035C; YDL034W is not an essential gene +S000033108 CDS YDL034W 4 391783 392127 W 2011-02-03 1996-07-31 +S000002193 ORF Verified YDL035C GPR1 chromosome 4 L000004298 4 392057 389172 C 2011-02-03 1996-07-31 Plasma membrane G protein coupled receptor (GPCR); interacts with the heterotrimeric G protein alpha subunit, Gpa2p, and with Plc1p; sensor that integrates nutritional signals with the modulation of cell fate via PKA and cAMP synthesis +S000033783 CDS YDL035C 4 392057 389172 C 2011-02-03 1996-07-31 +S000002190 ORF Dubious YDL032W chromosome 4 4 393690 394001 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene SLM3/YDL033C; YDL032W is not an essential gene +S000032947 CDS YDL032W 4 393690 394001 W 2011-02-03 1996-07-31 +S000002191 ORF Verified YDL033C SLM3 tRNA-5-taurinomethyluridine 2-sulfurtransferase|MTU1|MTO2 chromosome 4 4 393912 392659 C 2011-02-03 1996-07-31 tRNA-specific 2-thiouridylase; responsible for 2-thiolation of the wobble base of mitochondrial tRNAs; human homolog TRMU is implicated in myoclonus epilepsy associated with ragged red fibers (MERRF), and can complement yeast null mutant +S000032981 CDS YDL033C 4 393912 392659 C 2011-02-03 1996-07-31 +S000002189 ORF Verified YDL031W DBP10 putative ATP-dependent RNA helicase DBP10 chromosome 4 L000004557 4 394217 397204 W 2011-02-03 1996-07-31|2011-02-03 Putative ATP-dependent RNA helicase of the DEAD-box protein family; constituent of 66S pre-ribosomal particles; essential protein involved in ribosome biogenesis +S000032837 CDS YDL031W 4 394217 397204 W 2011-02-03 1996-07-31|2011-02-03 +S000002188 ORF Verified YDL030W PRP9 SF3a splicing factor complex subunit PRP9 chromosome 4 L000001501 4 397537 399129 W 2011-02-03 1996-07-31 Subunit of the SF3a splicing factor complex; required for spliceosome assembly; acts after the formation of the U1 snRNP-pre-mRNA complex +S000031920 CDS YDL030W 4 397537 399129 W 2011-02-03 1996-07-31 +S000002187 ORF Verified YDL029W ARP2 actin-related protein 2|ACT2 chromosome 4 L000000026 4 399340 400638 W 2011-02-03 1996-07-31 Essential component of the Arp2/3 complex; Arp2/3 is a highly conserved actin nucleation center required for the motility and integrity of actin patches; involved in endocytosis and membrane growth and polarity; required for efficient Golgi-to-ER trafficking in COPI mutants +S000032598 CDS YDL029W 4 399340 399361 W 2011-02-03 1996-07-31 +S000032599 CDS YDL029W 4 399485 400638 W 2011-02-03 1996-07-31 +S000032600 intron YDL029W 4 399362 399484 W 2011-02-03 1996-07-31 +S000002186 ORF Verified YDL028C MPS1 serine/threonine/tyrosine protein kinase MPS1|PAC8|RPK1 chromosome 4 L000001698 4 403291 400997 C 2011-02-03 1996-07-31|2011-02-03 Dual-specificity kinase; autophosphorylation required for function; required for spindle pole body (SPB) duplication and spindle checkpoint function; contributes to bi-orientation by promoting formation of force-generating kinetochore-microtubule attachments in meiosis I; substrates include SPB proteins Spc42p, Spc110p, and Spc98p, mitotic exit network protein Mob1p, kinetochore protein Cnn1p, and checkpoint protein Mad1p; substrate of APCC(Cdh1); similar to human Mps1p +S000031526 CDS YDL028C 4 403291 400997 C 2011-02-03 1996-07-31|2011-02-03 +S000002184 ORF Dubious YDL026W chromosome 4 4 404749 405060 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031360 CDS YDL026W 4 404749 405060 W 2011-02-03 1996-07-31 +S000002185 ORF Uncharacterized YDL027C MRX9 chromosome 4 4 404957 403695 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YDL027C is not an essential gene +S000031399 CDS YDL027C 4 404957 403695 C 2011-02-03 1996-07-31 +S000028610 ORF Dubious YDL025W-A chromosome 4 4 405410 405514 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the ORF YDL025C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031440 CDS YDL025W-A 4 405410 405514 W 2011-02-03 2003-07-29 +S000002183 ORF Verified YDL025C RTK1 putative serine/threonine protein kinase RTK1 chromosome 4 4 407206 405344 C 2011-02-03 1996-07-31 Putative protein kinase, potentially phosphorylated by Cdc28p; interacts with ribosome biogenesis factors, Cka2, Gus1 and Arc1; protein abundance increases in response to DNA replication stress +S000030352 CDS YDL025C 4 407206 405344 C 2011-02-03 1996-07-31 +S000118433 ARS ARS414 ARSIV-408 chromosome 4 4 408075 408316 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000002182 ORF Verified YDL024C DIA3 putative acid phosphatase DIA3 chromosome 4 4 409857 408451 C 2011-02-03 1996-07-31 Protein of unknown function; involved in invasive and pseudohyphal growth +S000030155 CDS YDL024C 4 409857 408451 C 2011-02-03 1996-07-31 +S000028537 ORF Uncharacterized YDL022C-A chromosome 4 4 410056 409808 C 2011-02-03 2003-07-29 Protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cytosol; partially overlaps the verified gene DIA3; identified by fungal homology and RT-PCR; mRNA identified as translated by ribosome profiling data +S000031146 CDS YDL022C-A 4 410056 409808 C 2011-02-03 2003-07-29 +S000006510 tRNA_gene tA(AGC)D chromosome 4 L000003763 4 410379 410451 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032254 noncoding_exon tA(AGC)D 4 410379 410451 W 2011-02-03 2000-05-19 +S000002180 ORF Verified YDL022W GPD1 glycerol-3-phosphate dehydrogenase (NAD(+)) GPD1|OSR5|OSG1|HOR1|DAR1 chromosome 4 L000000722 4 411825 413000 W 2011-02-03 1996-07-31 NAD-dependent glycerol-3-phosphate dehydrogenase; key enzyme of glycerol synthesis, essential for growth under osmotic stress; expression regulated by high-osmolarity glycerol response pathway; protein abundance increases in response to DNA replication stress; constitutively inactivated via phosphorylation by the protein kinases Ypk1p and Ypk2p, dephosphorylation increases catalytic activity; forms a heterodimer with Pnc1p to facilitate its peroxisomal import +S000037411 CDS YDL022W 4 411825 413000 W 2011-02-03 1996-07-31 +S000002181 ORF Dubious YDL023C SRF4 chromosome 4 4 412081 411761 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in other Saccharomyces species; overlaps the verified gene GPD1; deletion confers sensitivity to GSAO; deletion in cyr1 mutant results in loss of stress resistance +S000037466 CDS YDL023C 4 412081 411761 C 2011-02-03 1996-07-31 +S000002179 ORF Verified YDL021W GPM2 phosphoglycerate mutase family protein GPM2 chromosome 4 L000003294 4 413953 414888 W 2011-02-03 1996-07-31 Homolog of Gpm1p phosphoglycerate mutase; converts 3-phosphoglycerate to 2-phosphoglycerate in glycolysis; may be non-functional; GPM2 has a paralog, GPM3, that arose from the whole genome duplication +S000037296 CDS YDL021W 4 413953 414888 W 2011-02-03 1996-07-31 +S000002178 ORF Verified YDL020C RPN4 stress-regulated transcription factor RPN4|UFD5|SON1 chromosome 4 L000001984 4 416708 415113 C 2011-02-03 1996-07-31 Transcription factor that stimulates expression of proteasome genes; Rpn4p levels are in turn regulated by the 26S proteasome in a negative feedback control mechanism; RPN4 is transcriptionally regulated by various stress responses; relative distribution to the nucleus increases upon DNA replication stress +S000036564 CDS YDL020C 4 416708 415113 C 2011-02-03 1996-07-31 +S000002177 ORF Verified YDL019C OSH2 oxysterol-binding protein related protein OSH2 chromosome 4 4 421514 417663 C 2011-02-03 1996-07-31 Member of an oxysterol-binding protein family with seven members; in S. cerevisiae, family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; contains FFAT motif; interacts with ER anchor Scs2p at patches at the plasma membrane and at the nuclear envelope; regulated by sterol binding; OSH2 has a paralog, SWH1, that arose from the whole genome duplication +S000035539 CDS YDL019C 4 421514 417663 C 2011-02-03 1996-07-31 +S000002176 ORF Verified YDL018C ERP3 chromosome 4 L000004680 4 423510 422833 C 2011-02-03 1996-07-31 Protein with similarity to Emp24p and Erv25p; member of the p24 family involved in ER to Golgi transport +S000035452 CDS YDL018C 4 423510 422833 C 2011-02-03 1996-07-31 +S000002175 ORF Verified YDL017W CDC7 serine/threonine protein kinase CDC7|SAS1|LSD6 chromosome 4 L000000247 4 424209 425732 W -1 2011-02-03 1996-07-31 DDK (Dbf4-dependent kinase) catalytic subunit; required for origin firing and replication fork progression in mitotic S phase through phosphorylation of Mcm2-7p complexes and Cdc45p; kinase activity correlates with cyclical DBF4 expression; required for pre-meiotic DNA replication, meiotic DSB formation, recruitment of monopolin complex to kinetochores during meiosis I, regulation of meiosis-specific Ndt80p; mutation complemented by human CDC7 and DBF4 co-expression +S000035373 CDS YDL017W 4 424209 425732 W 2011-02-03 1996-07-31 +S000002174 ORF Dubious YDL016C chromosome 4 4 425872 425570 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CDC7/YDL153C, the catalytic subunit of a complex that regulates DNA replication +S000034291 CDS YDL016C 4 425872 425570 C 2011-02-03 1996-07-31 +S000002173 ORF Verified YDL015C TSC13 trans-2-enoyl-CoA reductase (NADPH) TSC13 chromosome 4 4 426934 426002 C 2011-02-03 1996-07-31 Enoyl reductase; catalyzes last step in each cycle of very long chain fatty acid elongation; localizes to ER, highly enriched in a structure marking nuclear-vacuolar junctions; coimmunoprecipitates with elongases Elo2p and Elo3p; protein increases in abundance and relative distribution to ER foci increases upon DNA replication stress; human homolog TECR implicated in nonsyndromic mental retardation, can complement yeast mutant +S000034157 CDS YDL015C 4 426934 426002 C 2011-02-03 1996-07-31 +S000002172 ORF Verified YDL014W NOP1 rRNA methyltransferase NOP1|LOT3 chromosome 4 L000001260 4 427364 428347 W -1.93 2011-02-03 1996-07-31 Histone glutamine methyltransferase, modifies H2A at Q105 in nucleolus; component of the small subunit processome complex, which is required for processing of pre-18S rRNA; ortholog of mammalian fibrillarin; inviability of the null mutant is functionally complemented by human FBL +S000034123 CDS YDL014W 4 427364 428347 W 2011-02-03 1996-07-31 +S000002171 ORF Verified YDL013W SLX5 SUMO-targeted ubiquitin ligase complex subunit SLX5|ULS2|HEX3 chromosome 4 L000000768 4 429067 430926 W -1.69 2011-02-03 1996-07-31 Subunit of the Slx5-Slx8 SUMO-targeted Ub ligase (STUbL) complex; role in Ub-mediated degradation of histone variant Cse4p preventing mislocalization to euchromatin; role in proteolysis of spindle positioning protein Kar9p, and DNA repair proteins Rad52p and Rad57p; forms SUMO-dependent nuclear foci, including DNA repair centers; contains a RING domain and two SIM motifs; associates with the centromere; required for maintenance of genome integrity like human ortholog RNF4 +S000033268 CDS YDL013W 4 429067 430926 W 2011-02-03 1996-07-31 +S000002170 ORF Verified YDL012C chromosome 4 4 431517 431108 C 2011-02-03 1996-07-31 Tail-anchored plasma membrane protein with a conserved CYSTM module; possibly involved in response to stress; may contribute to non-homologous end-joining (NHEJ) based on ydl012c htz1 double null phenotype; YDL012C has a paralog, YBR016W, that arose from the whole genome duplication +S000033170 CDS YDL012C 4 431386 431108 C 2011-02-03 1996-07-31 +S000033169 CDS YDL012C 4 431517 431473 C 2011-02-03 1996-07-31 +S000033171 intron YDL012C 4 431472 431387 C 2011-02-03 1996-07-31 +S000002168 ORF Verified YDL010W GRX6 glutathione-disulfide reductase GRX6 chromosome 4 4 432330 433025 W 2011-02-03 1996-07-31 Cis-golgi localized monothiol glutaredoxin, binds Fe-S cluster; more similar in activity to dithiol than other monothiol glutaredoxins; involved in the oxidative stress response; GRX6 has a paralog, GRX7, that arose from the whole genome duplication +S000032278 CDS YDL010W 4 432330 433025 W 2011-02-03 1996-07-31 +S000002169 ORF Dubious YDL011C chromosome 4 4 432631 432308 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized ORF YDL010W +S000032316 CDS YDL011C 4 432631 432308 C 2011-02-03 1996-07-31 +S000002167 ORF Uncharacterized YDL009C chromosome 4 4 433248 432925 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data; SWAT-GFP and mCherry fusion proteins localize to the cytosol; partially overlaps the verified ORF YDL010W; YDL009C is not an essential gene +S000032265 CDS YDL009C 4 433248 432925 C 2011-02-03 1996-07-31 +S000002166 ORF Verified YDL008W APC11 anaphase promoting complex subunit 11 chromosome 4 L000004322 4 433497 433994 W 2011-02-03 1996-07-31 Catalytic core subunit, Anaphase-Promoting Complex/Cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; contains a RING-H2 domain that is required for activity +S000032227 CDS YDL008W 4 433497 433994 W 2011-02-03 1996-07-31 +S000006739 tRNA_gene tT(AGU)D chromosome 4 L000003788 4 434336 434264 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000032153 noncoding_exon tT(AGU)D 4 434336 434264 C 2011-02-03 2000-05-19 +S000006842 long_terminal_repeat YDLCdelta1 chromosome 4 4 434739 434423 C 2011-02-03 2000-05-19 Ty1 LTR +S000130173 ARS ARS415 chromosome 4 4 434971 435320 2014-11-18 2014-11-18|2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000113557 ORF Uncharacterized YDL007C-A chromosome 4 4 436824 436567 C 2011-02-03 2005-11-17 Putative protein of unknown function +S000113558 CDS YDL007C-A 4 436824 436567 C 2011-02-03 2005-11-17 +S000006843 long_terminal_repeat YDLWtau1 chromosome 4 4 437149 437518 W 2011-02-03 2000-05-19 Ty4 LTR +S000006721 tRNA_gene tS(AGA)D1 chromosome 4 L000003764 4 437772 437853 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000031630 noncoding_exon tS(AGA)D1 4 437772 437853 W 2011-02-03 2000-05-19 +S000002165 ORF Verified YDL007W RPT2 proteasome regulatory particle base subunit RPT2|YTA5|YHS4 chromosome 4 L000002559 4 438047 439360 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; required for normal peptide hydrolysis by the core 20S particle; N-myristoylation of Rpt2p at Gly2 is involved in regulating the proper intracellular distribution of proteasome activity by controlling the nuclear localization of the 26S proteasome +S000031210 CDS YDL007W 4 438047 439360 W 2011-02-03 1996-07-31 +S000002164 ORF Verified YDL006W PTC1 type 2C protein phosphatase PTC1|TPD1|KCS2|CWH47 chromosome 4 L000000890|L000001523 4 439909 440754 W 2011-02-03 1996-07-31 Type 2C protein phosphatase (PP2C); dephosphorylates Hog1p, inactivating osmosensing MAPK cascade; involved in Fus3p activation during pheromone response; deletion affects precursor tRNA splicing, mitochondrial inheritance, and sporulation +S000031084 CDS YDL006W 4 439909 440754 W 2011-02-03 1996-07-31 +S000002163 ORF Verified YDL005C MED2 chromosome 4 L000003914 4 442309 441014 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; relocalizes to the cytosol in response to hypoxia +S000030042 CDS YDL005C 4 442309 441014 C 2011-02-03 1996-07-31 +S000002162 ORF Verified YDL004W ATP16 F1F0 ATP synthase subunit delta chromosome 4 L000000150 4 443029 443511 W 2011-02-03 1996-07-31 Delta subunit of the central stalk of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; F1 translationally regulates ATP6 and ATP8 expression to achieve a balanced output of ATP synthase genes encoded in nucleus and mitochondria; phosphorylated +S000030001 CDS YDL004W 4 443029 443511 W 2011-02-03 1996-07-31 +S000002161 ORF Verified YDL003W MCD1 kleisin alpha|SCC1|RHC21|PDS3 chromosome 4 L000002676 4 444683 446383 W 2011-02-03 1996-07-31 Essential alpha-kleisin subunit of the cohesin complex; required for sister chromatid cohesion in mitosis and meiosis; apoptosis induces cleavage and translocation of a C-terminal fragment to mitochondria; expression peaks in S phase +S000029870 CDS YDL003W 4 444683 446383 W 2011-02-03 1996-07-31 +S000002160 ORF Verified YDL002C NHP10 HMO2 chromosome 4 L000002765 4 447578 446967 C 2011-02-03 1996-07-31 Non-essential INO80 chromatin remodeling complex subunit; preferentially binds DNA ends, protecting them from exonucleatic cleavage; deletion affects telomere maintenance via recombination; related to mammalian high mobility group proteins +S000037122 CDS YDL002C 4 447578 446967 C 2011-02-03 1996-07-31 +S000002159 ORF Verified YDL001W RMD1 chromosome 4 4 447984 449276 W 2011-02-03 1996-07-31 Cytoplasmic protein required for sporulation +S000037078 CDS YDL001W 4 447984 449276 W 2011-02-03 1996-07-31 +S000006466 centromere CEN4 CEN4 chromosome 4 L000000297 4 449711 449821 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome IV centromere +S000077266 centromere_DNA_Element_I CEN4 4 449711 449720 W 2011-02-03 2004-10-04 +S000077267 centromere_DNA_Element_II CEN4 4 449721 449796 W 2011-02-03 2004-10-04 +S000077268 centromere_DNA_Element_III CEN4 4 449797 449821 W 2011-02-03 2004-10-04 +S000002408 ORF Verified YDR001C NTH1 alpha,alpha-trehalase NTH1 chromosome 4 L000001280 4 452475 450220 C 2011-02-03 1996-07-31 Neutral trehalase, degrades trehalose; required for thermotolerance and may mediate resistance to other cellular stresses; phosphorylated and activated by Cdc28p at the G1/S phase transition to coordinately regulate carbohydrate metabolism and the cell cycle; inhibited by Dcs1p; NTH1 has a paralog, NTH2, that arose from the whole genome duplication +S000033545 CDS YDR001C 4 452475 450220 C 2011-02-03 1996-07-31 +S000002409 ORF Verified YDR002W YRB1 Ran GTPase-binding protein YRB1|STP52|SFO1|HTN1|CST20 chromosome 4 L000001871|S000029527|L000002134 4 453045 453650 W 2011-02-03 1996-07-31 Ran GTPase binding protein; involved in nuclear protein import and RNA export, ubiquitin-mediated protein degradation during the cell cycle; shuttles between the nucleus and cytoplasm; is essential; homolog of human RanBP1 +S000034475 CDS YDR002W 4 453045 453650 W 2011-02-03 1996-07-31 +S000002410 ORF Verified YDR003W RCR2 SSH5 chromosome 4 S000029511|L000002952 4 454122 454754 W 2011-02-03 1996-07-31 Vacuolar protein; presumably functions within the endosomal-vacuolar trafficking pathway, affecting events that determine whether plasma membrane proteins are degraded or routed to the plasma membrane; RCR2 has a paralog, RCR1, that arose from the whole genome duplication +S000034587 CDS YDR003W 4 454122 454754 W 2011-02-03 1996-07-31 +S000028819 ORF Uncharacterized YDR003W-A chromosome 4 4 454782 454904 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000033630 CDS YDR003W-A 4 454782 454904 W 2011-02-03 2003-07-29 +S000002411 ORF Verified YDR004W RAD57 putative DNA-dependent ATPase RAD57 chromosome 4 L000001577 4 455201 456583 W 2 2011-02-03 1996-07-31 Protein that stimulates strand exchange; stimulates strand exchange by stabilizing the binding of Rad51p to single-stranded DNA; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; forms heterodimer with Rad55p +S000034681 CDS YDR004W 4 455201 456583 W 2011-02-03 1996-07-31 +S000002412 ORF Verified YDR005C MAF1 RNA polymerase III-inhibiting protein MAF1 chromosome 4 L000002614 4 458103 456836 C 2011-02-03 1996-07-31 Highly conserved negative regulator of RNA polymerase III; involved in tRNA processing and stability; inhibits tRNA degradation via rapid tRNA decay (RTD) pathway; binds N-terminal domain of Rpc160p subunit of Pol III to prevent closed-complex formation; regulated by phosphorylation mediated by TORC1, protein kinase A, Sch9p, casein kinase 2; localizes to cytoplasm during vegetative growth and translocates to nucleus and nucleolus under stress conditions +S000034763 CDS YDR005C 4 458017 456836 C 2011-02-03 1996-07-31 +S000034762 CDS YDR005C 4 458103 458098 C 2011-02-03 1996-07-31 +S000034764 intron YDR005C 4 458097 458018 C 2011-02-03 1996-07-31 +S000002413 ORF Verified YDR006C SOK1 chromosome 4 L000001983 4 461247 458542 C 2011-02-03 1996-07-31 Protein of unknown function; overexpression suppresses the growth defect of mutants lacking protein kinase A activity; involved in cAMP-mediated signaling; localized to the nucleus; similar to the mouse testis-specific protein PBS13 +S000035723 CDS YDR006C 4 461247 458542 C 2011-02-03 1996-07-31 +S000002414 ORF Verified YDR007W TRP1 phosphoribosylanthranilate isomerase TRP1 chromosome 4 L000002352 4 461842 462516 W 1 2011-02-03 2004-02-11|1996-07-31 Phosphoribosylanthranilate isomerase; catalyzes the third step in tryptophan biosynthesis; in 2004, the sequence of TRP1 from strain S228C was updated by changing the previously annotated internal STOP (TAA) to serine (TCA); enhances vegetative growth at low and high temperatures when used as an auxotrophic marker in strains such as W303 +S000035920 CDS YDR007W 4 461842 462516 W 2011-02-03 2004-02-11|1996-07-31 +S000029652 ARS ARS416 ARS1 chromosome 4 S000007454 4 462567 462622 2014-11-18 2014-11-18|2006-04-10 Early-firing autonomously replicating sequence; highly efficient chromosomal replicator active in nearly every cell cycle +S000121228 ARS_consensus_sequence ARS416 4 462606 462596 C 2011-02-03 2007-03-06 +S000002415 ORF Dubious YDR008C chromosome 4 4 462602 462252 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps TRP1/YDR007W on opposite strand +S000035999 CDS YDR008C 4 462602 462252 C 2011-02-03 1996-07-31 +S000002416 ORF Verified YDR009W GAL3 transcriptional regulator GAL3 chromosome 4 L000000660 4 463434 464996 W 1 2011-02-03 1996-07-31 Transcriptional regulator; involved in activation of the GAL genes in response to galactose; forms a complex with Gal80p to relieve Gal80p inhibition of Gal4p; binds galactose and ATP but does not have galactokinase activity; GAL3 has a paralog, GAL1, that arose from the whole genome duplication +S000037895 CDS YDR009W 4 463434 464996 W 2011-02-03 1996-07-31 +S000002417 ORF Dubious YDR010C chromosome 4 4 465383 465051 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037562 CDS YDR010C 4 465383 465051 C 2011-02-03 1996-07-31 +S000002418 ORF Verified YDR011W SNQ2 ATP-binding cassette transporter SNQ2 chromosome 4 L000001957 4 465919 470424 W 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; multidrug transporter involved in multidrug resistance and resistance to singlet oxygen species +S000037672 CDS YDR011W 4 465919 470424 W 2011-02-03 1996-07-31 +S000002419 ORF Verified YDR012W RPL4B uL4|ribosomal 60S subunit protein L4B|L4|rp2|YL2|L4B|L2B chromosome 4 L000001702 4 471853 472941 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L4B; homologous to mammalian ribosomal protein L4 and bacterial L4; RPL4B has a paralog, RPL4A, that arose from the whole genome duplication +S000037729 CDS YDR012W 4 471853 472941 W 2011-02-03 1996-07-31 +S000002420 ORF Verified YDR013W PSF1 DNA replication protein PSF1|CDC101 chromosome 4 4 473157 473783 W 2011-02-03 1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery +S000037779 CDS YDR013W 4 473157 473783 W 2011-02-03 1996-07-31 +S000002421 ORF Verified YDR014W RAD61 WPL1 chromosome 4 4 474046 475989 W 2011-02-03 1996-07-31 Subunit of a complex that inhibits sister chromatid cohesion; also negatively regulates chromosome condensation; inhibited by Eco1p-acetylated cohesin subunits Smc3p and Mcd1p; binds Smc3p ATPase head of cohesin; related to the human Wapl protein that controls the association of cohesin with chromatin +S000030660 CDS YDR014W 4 474046 475989 W 2011-02-03 1996-07-31 +S000113613 ORF Verified YDR014W-A HED1 chromosome 4 4 477797 478285 W 2011-02-03 2006-04-14 Meiosis-specific protein; down-regulates Rad51p-mediated mitotic recombination when the meiotic recombination machinery is impaired; promotes synapsis and required for the normal morphogenesis of synaptonemal complex; prevents the recruitment of Rad54p to site-specific DNA double-strand breaks in vivo; early meiotic gene, transcribed specifically during meiotic prophase +S000114898 CDS YDR014W-A 4 477797 478285 W 2011-02-03 2006-04-14 +S000002422 ORF Dubious YDR015C chromosome 4 4 478199 477960 C 2011-02-03 1996-07-31|2006-04-13 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene HED1/YDR014W-A +S000030702 CDS YDR015C 4 478199 477960 C 2011-02-03 1996-07-31|2006-04-13 +S000002423 ORF Verified YDR016C DAD1 chromosome 4 4 478758 478474 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis +S000030807 CDS YDR016C 4 478758 478474 C 2011-02-03 1996-07-31 +S000002424 ORF Verified YDR017C KCS1 inositol polyphosphate kinase KCS1 chromosome 4 L000000889 4 482267 479115 C 2011-02-03 1996-07-31 Inositol hexakisphosphate and inositol heptakisphosphate kinase; generation of high energy inositol pyrophosphates by Kcs1p is required for many processes such as vacuolar biogenesis, stress response, RNA polymerase I-mediated rRNA transcription and telomere maintenance; inositol hexakisphosphate is also known as IP6; inositol heptakisphosphate is also known as IP7 +S000031751 CDS YDR017C 4 482267 479115 C 2011-02-03 1996-07-31 +S000002425 ORF Uncharacterized YDR018C putative acyltransferase chromosome 4 4 483860 482670 C 2011-02-03 1996-07-31 Probable membrane protein with three predicted transmembrane domains; similar to C. elegans F55A11.5 and maize 1-acyl-glycerol-3-phosphate acyltransferase; YDR018C has a paralog, CST26, that arose from the whole genome duplication +S000031907 CDS YDR018C 4 483860 482670 C 2011-02-03 1996-07-31 +S000118434 ARS ARS417 ARSIV-484 chromosome 4 4 484006 484059 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178068 ARS_consensus_sequence ARS417 4 484035 484019 C 2014-11-18 2014-11-18 +S000002426 ORF Verified YDR019C GCV1 glycine decarboxylase subunit T|GSD1 chromosome 4 L000002736 4 485365 484163 C 2011-02-03 1996-07-31 T subunit of the mitochondrial glycine decarboxylase complex; glycine decarboxylase is required for the catabolism of glycine to 5,10-methylene-THF; expression is regulated by levels of levels of 5,10-methylene-THF in the cytoplasm +S000032068 CDS YDR019C 4 485365 484163 C 2011-02-03 1996-07-31 +S000002427 ORF Uncharacterized YDR020C DAS2 putative uridine kinase DAS2|RRT3 chromosome 4 4 486444 485746 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; weak similarity with uridine kinases and with phosphoribokinases +S000032817 CDS YDR020C 4 486444 485746 C 2011-02-03 1996-07-31 +S000002428 ORF Verified YDR021W FAL1 ATP-dependent RNA helicase FAL1 chromosome 4 L000003480 4 486804 488003 W 2011-02-03 1996-07-31 Nucleolar protein required for maturation of 18S rRNA; member of the eIF4A subfamily of DEAD-box ATP-dependent RNA helicases; 18S rRNA biogenesis defect of the null mutant is functionally complemented by human EIF4A3 +S000032973 CDS YDR021W 4 486804 488003 W 2011-02-03 1996-07-31 +S000002429 ORF Verified YDR022C ATG31 CIS1 chromosome 4 L000003475 4 488662 488072 C 2011-02-03 1996-07-31 Autophagy-specific protein required for autophagosome formation; forms a complex with Atg17p and Atg29p that localizes other proteins to the pre-autophagosomal structure; constitutively phosphorylated, and phosphorylation of residue S174 is required for function; high-copy suppressor of CIK1 deletion +S000033002 CDS YDR022C 4 488662 488072 C 2011-02-03 1996-07-31 +S000006770 tRNA_gene tV(UAC)D chromosome 4 L000003787 4 488870 488797 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000036290 noncoding_exon tV(UAC)D 4 488870 488797 C 2011-02-03 2000-05-19 +S000002430 ORF Verified YDR023W SES1 serine--tRNA ligase SES1|SerRS chromosome 4 L000001867 4 489508 490896 W 2011-02-03 1996-07-31 Cytosolic seryl-tRNA synthetase; class II aminoacyl-tRNA synthetase that aminoacylates tRNA(Ser), displays tRNA-dependent amino acid recognition which enhances discrimination of the serine substrate, interacts with peroxin Pex21p +S000033710 CDS YDR023W 4 489508 490896 W 2011-02-03 1996-07-31 +S000002431 ORF Dubious YDR024W FYV1 chromosome 4 4 491017 491502 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; mutation decreases survival upon exposure to K1 killer toxin +S000033822 CDS YDR024W 4 491017 491502 W 2011-02-03 1996-07-31 +S000002432 ORF Verified YDR025W RPS11A uS17|ribosomal 40S subunit protein S11A|S17|rp41A|YS12|S18A|S11A chromosome 4 L000001757 4 491515 492324 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S11 and bacterial S17; N-terminally propionylated in vivo; RPS11A has a paralog, RPS11B, that arose from the whole genome duplication +S000033919 CDS YDR025W 4 491515 491559 W 2011-02-03 1996-07-31 +S000033920 CDS YDR025W 4 491899 492324 W 2011-02-03 1996-07-31 +S000033921 intron YDR025W 4 491560 491898 W 2011-02-03 1996-07-31 +S000002433 ORF Verified YDR026C NSI1 YTT1 chromosome 4 4 494268 492556 C 2011-02-03 1996-07-31 RNA polymerase I termination factor; binds to rDNA terminator element, required for efficient Pol I termination; required for rDNA silencing at NTS1; facilities association of Sir2p with NTS1, contributes to rDNA stability and cell longevity; interacts physically with Fob1p and RENT subunits, Sir2p and Net1p; may interact with ribosomes, based on co-purification experiments; Myb-like DNA-binding protein; NSI1 has a paralog, REB1, that arose from the whole genome duplication +S000033977 CDS YDR026C 4 494268 492556 C 2011-02-03 1996-07-31 +S000002434 ORF Verified YDR027C VPS54 TCS3|CGP1|LUV1 chromosome 4 L000004648 4 497318 494649 C 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; potentially phosphorylated by Cdc28p; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p +S000034876 CDS YDR027C 4 497318 494649 C 2011-02-03 1996-07-31 +S000002435 ORF Verified YDR028C REG1 protein phosphatase regulator REG1|SRN1|SPP43|PZF240|HEX2 chromosome 4 L000001609 4 500879 497835 C 2.79 2011-02-03 1996-07-31 Regulatory subunit of type 1 protein phosphatase Glc7p; involved in negative regulation of glucose-repressible genes; involved in regulation of the nucleocytoplasmic shuttling of Hxk2p; REG1 has a paralog, REG2, that arose from the whole genome duplication +S000035027 CDS YDR028C 4 500879 497835 C 2011-02-03 1996-07-31 +S000002436 ORF Uncharacterized YDR029W chromosome 4 4 501100 501414 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR029W is not an essential gene +S000035276 CDS YDR029W 4 501100 501414 W 2011-02-03 1996-07-31 +S000002437 ORF Verified YDR030C RAD28 chromosome 4 L000004123 4 503273 501753 C 2011-02-03 1996-07-31 Protein involved in DNA repair; related to the human CSA protein that is involved in transcription-coupled repair nucleotide excision repair +S000036180 CDS YDR030C 4 503273 501753 C 2011-02-03 1996-07-31 +S000002438 ORF Verified YDR031W MIX14 MIC14 chromosome 4 4 503498 503863 W 2011-02-03 2004-07-22|1996-07-31 Mitochondrial intermembrane space protein of unknown function; required for normal oxygen consumption; contains twin cysteine-x9-cysteine motifs; protein abundance increases in response to DNA replication stress +S000036965 CDS YDR031W 4 503498 503863 W 2011-02-03 2004-07-22|1996-07-31 +S000002439 ORF Verified YDR032C PST2 flavodoxin-like fold family protein chromosome 4 4 504695 504099 C 2011-02-03 1996-07-31 Protein with similarity to a family of flavodoxin-like proteins; induced by oxidative stress in a Yap1p dependent manner; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress; PST2 has a paralog, RFS1, that arose from the whole genome duplication +S000036988 CDS YDR032C 4 504695 504099 C 2011-02-03 1996-07-31 +S000119069 ARS ARS450 ARSIV-506|ARS417.5 chromosome 4 4 505343 505584 2011-02-03 2006-10-05 Autonomously Replicating Sequence +S000002440 ORF Verified YDR033W MRH1 chromosome 4 4 508147 509109 W 2011-02-03 1996-07-31 Protein that localizes primarily to the plasma membrane; also found at the nuclear envelope; long-lived protein that is asymmetrically retained in the plasma membrane of mother cells; the authentic, non-tagged protein is detected in mitochondria in a phosphorylated state; null mutation confers sensitivity to acetic acid +S000037115 CDS YDR033W 4 508147 509109 W 2011-02-03 1996-07-31 +S000002441 ORF Verified YDR034C LYS14 chromosome 4 L000000971 4 512109 509737 C 8 2011-02-03 1996-07-31 Transcriptional activator involved in regulating lysine biosynthesis; involved in the regulation of genes of the lysine biosynthesis pathway; requires 2-aminoadipate semialdehyde as co-inducer +S000037166 CDS YDR034C 4 512109 509737 C 2011-02-03 1996-07-31 +S000006844 long_terminal_repeat YDRCdelta2 chromosome 4 4 513258 512986 C 2011-02-03 2000-05-19 Ty1 LTR +S000006845 long_terminal_repeat YDRCdelta3 chromosome 4 4 513590 513259 C 2011-02-03 2000-05-19 Ty1 LTR +S000006846 long_terminal_repeat YDRCdelta4 chromosome 4 4 514020 513692 C 2011-02-03 2000-05-19 Ty2 LTR +S000007345 transposable_element_gene YDR034C-D gag-pol fusion protein chromosome 4 4 519356 514043 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000035118 CDS YDR034C-D 4 518062 514043 C 2011-02-03 1999-07-17 +S000035117 CDS YDR034C-D 4 519356 518064 C 2011-02-03 1999-07-17 +S000035119 plus_1_translational_frameshift YDR034C-D 4 518063 518063 C 2011-02-03 1999-07-17 +S000007344 transposable_element_gene YDR034C-C gag protein chromosome 4 4 519356 518040 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035078 CDS YDR034C-C 4 519356 518040 C 2011-02-03 1999-07-17 +S000006862 LTR_retrotransposon YDRCTy2-1 Ty2 chromosome 4 4 519647 513692 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006847 long_terminal_repeat YDRCdelta5 chromosome 4 4 519647 519316 C 2011-02-03 2000-05-19 Ty2 LTR +S000006649 tRNA_gene tL(UAA)D chromosome 4 L000003765 4 519743 519826 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000037383 noncoding_exon tL(UAA)D 4 519743 519826 W 2011-02-03 2000-05-19 +S000006848 long_terminal_repeat YDRCdelta6a chromosome 4 4 520475 520173 C 2011-02-03 2000-05-19 Ty1 LTR +S000006863 long_terminal_repeat YDRWdelta7 chromosome 4 4 520477 520805 W 2011-02-03 2000-05-19 Ty1 LTR +S000007233 ORF Uncharacterized YDR034C-A chromosome 4 4 520692 520516 C 2011-02-03 1999-07-17 Putative protein of unknown function; contained within the solo Ty1 LTR element YDRWdelta7 +S000035073 CDS YDR034C-A 4 520692 520516 C 2011-02-03 1999-07-17 +S000006849 long_terminal_repeat YDRCdelta6b chromosome 4 4 520833 520806 C 2011-02-03 2000-05-19 Ty1 LTR +S000006693 tRNA_gene tQ(UUG)D1 chromosome 4 L000003766 4 520972 521043 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034805 noncoding_exon tQ(UUG)D1 4 520972 521043 W 2011-02-03 2000-05-19 +S000007234 ORF Uncharacterized YDR034W-B chromosome 4 4 521314 521469 W 2011-02-03 1999-07-17 Predicted tail-anchored plasma membrane protein; contains conserved CYSTM module; related proteins in other organisms may be involved in response to stress; N- and C-terminal fusion proteins localize to the cell periphery; YDR034W-B has a paralog, YBR056W-A, that arose from the whole genome duplication +S000030044 CDS YDR034W-B 4 521314 521469 W 2011-02-03 1999-07-17 +S000002442 ORF Verified YDR035W ARO3 3-deoxy-7-phosphoheptulonate synthase ARO3 chromosome 4 L000000118 4 521816 522928 W 2011-02-03 1996-07-31 3-deoxy-D-arabino-heptulosonate-7-phosphate (DAHP) synthase; catalyzes the first step in aromatic amino acid biosynthesis and is feedback-inhibited by phenylalanine or high concentration of tyrosine or tryptophan +S000029906 CDS YDR035W 4 521816 522928 W 2011-02-03 1996-07-31 +S000002443 ORF Verified YDR036C EHD3 MRP5 chromosome 4 4 524713 523211 C 2011-02-03 1996-07-31 3-hydroxyisobutyryl-CoA hydrolase; member of a family of enoyl-CoA hydratase/isomerases; non-tagged protein is detected in highly purified mitochondria in high-throughput studies; phosphorylated; mutation affects fluid-phase endocytosis +S000029947 CDS YDR036C 4 524713 523211 C 2011-02-03 1996-07-31 +S000002444 ORF Verified YDR037W KRS1 lysine--tRNA ligase KRS1|GCD5 chromosome 4 L000000673|L000000919 4 525440 527215 W 2011-02-03 1996-07-31 Lysyl-tRNA synthetase +S000031019 CDS YDR037W 4 525440 527215 W 2011-02-03 1996-07-31 +S000002445 ORF Verified YDR038C ENA5 putative Na(+)-exporting P-type ATPase ENA5 chromosome 4 L000003293 4 530697 527422 C 2011-02-03 1996-07-31 Protein with similarity to P-type ATPase sodium pumps; member of the Na+ efflux ATPase family +S000031057 CDS YDR038C 4 530697 527422 C 2011-02-03 1996-07-31 +S000002446 ORF Verified YDR039C ENA2 Na(+)-exporting P-type ATPase ENA2 chromosome 4 L000000556 4 534582 531307 C 2011-02-03 1996-07-31 P-type ATPase sodium pump; involved in Na+ efflux to allow salt tolerance; likely not involved in Li+ efflux +S000031179 CDS YDR039C 4 534582 531307 C 2011-02-03 1996-07-31 +S000002447 ORF Verified YDR040C ENA1 Na(+)/Li(+)-exporting P-type ATPase ENA1|PMR2|HOR6 chromosome 4 L000001456 4 538467 535192 C 15 2011-02-03 1996-07-31 P-type ATPase sodium pump; involved in Na+ and Li+ efflux to allow salt tolerance +S000032116 CDS YDR040C 4 538467 535192 C 2011-02-03 1996-07-31 +S000002448 ORF Verified YDR041W RSM10 mitochondrial 37S ribosomal protein RSM10 chromosome 4 4 539803 540414 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S10 ribosomal protein; essential for viability, unlike most other mitoribosomal proteins +S000032233 CDS YDR041W 4 539803 540414 W 2011-02-03 1996-07-31 +S000002449 ORF Uncharacterized YDR042C chromosome 4 4 541203 540601 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression is increased in ssu72-ts69 mutant +S000032269 CDS YDR042C 4 541203 540601 C 2011-02-03 1996-07-31 +S000006507 snoRNA_gene snR47 SNR47 chromosome 4 L000003414 4 541700 541602 C 2011-02-03 2000-05-19|2007-04-04 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2220 and small subunit (SSU) rRNA at position A619 +S000030649 noncoding_exon snR47 4 541700 541602 C 2011-02-03 2000-05-19|2007-04-04 +S000002450 ORF Verified YDR043C NRG1 transcriptional regulator NRG1 chromosome 4 L000004598 4 543369 542674 C 2011-02-03 1996-07-31 Transcriptional repressor; recruits the Cyc8p-Tup1p complex to promoters; mediates glucose repression and negatively regulates a variety of processes including filamentous growth and alkaline pH response; activated in stochastic pulses of nuclear localization in response to low glucose +S000033143 CDS YDR043C 4 543369 542674 C 2011-02-03 1996-07-31 +S000002451 ORF Verified YDR044W HEM13 coproporphyrinogen oxidase chromosome 4 L000000765 4 546642 547628 W 2011-02-03 1996-07-31 Coproporphyrinogen III oxidase; oxygen-requiring enzyme that catalyzes sixth step in heme biosynthetic pathway; transcription is repressed by oxygen and heme (via Rox1p and Hap1p); human homolog CPOX can complement yeast mutant and allow growth of haploid null after sporulation of a heterozygous diploid +S000033232 CDS YDR044W 4 546642 547628 W 2011-02-03 1996-07-31 +S000002452 ORF Verified YDR045C RPC11 DNA-directed RNA polymerase III core subunit RPC11|C11 chromosome 4 L000004954 4 548310 547978 C 2011-02-03 1996-07-31 RNA polymerase III subunit C11; mediates pol III RNA cleavage activity and is important for termination of transcription; homologous to TFIIS +S000033256 CDS YDR045C 4 548310 547978 C 2011-02-03 1996-07-31 +S000002453 ORF Verified YDR046C BAP3 amino acid transporter BAP3|PAP1 chromosome 4 L000004277 4 550576 548762 C 2011-02-03 1996-07-31 Amino acid permease; involved in uptake of cysteine, leucine, isoleucine and valine; BAP3 has a paralog, BAP2, that arose from the whole genome duplication +S000033308 CDS YDR046C 4 550576 548762 C 2011-02-03 1996-07-31 +S000002454 ORF Verified YDR047W HEM12 uroporphyrinogen decarboxylase HEM12|HEM6 chromosome 4 L000000764 4 551860 552948 W 2011-02-03 1996-07-31 Uroporphyrinogen decarboxylase; catalyzes the fifth step in the heme biosynthetic pathway; localizes to both the cytoplasm and nucleus; a hem12 mutant has phenotypes similar to patients with porphyria cutanea tarda +S000034271 CDS YDR047W 4 551860 552948 W 2011-02-03 1996-07-31 +S000002456 ORF Verified YDR049W VMS1 chromosome 4 4 553254 555152 W 2011-02-03 1996-07-31 Component of a Cdc48p-complex involved in protein quality control; exhibits cytosolic and ER-membrane localization, with Cdc48p, during normal growth, and contributes to ER-associated degradation (ERAD) of specific substrates at a step after their ubiquitination; forms a mitochondrially-associated complex with Cdc48p and Npl4p under oxidative stress that is required for ubiquitin-mediated mitochondria-associated protein degradation (MAD); conserved in C. elegans and humans +S000035432 CDS YDR049W 4 553254 555152 W 2011-02-03 1996-07-31 +S000002455 ORF Dubious YDR048C chromosome 4 4 553398 553084 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF VMS1/YDR049W +S000034352 CDS YDR048C 4 553398 553084 C 2011-02-03 1996-07-31 +S000118435 ARS ARS418 ARSIV-555 chromosome 4 4 555240 555404 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000002457 ORF Verified YDR050C TPI1 triose-phosphate isomerase TPI1 chromosome 4 L000002326 4 556472 555726 C 2011-02-03 1996-07-31 Triose phosphate isomerase, abundant glycolytic enzyme; mRNA half-life is regulated by iron availability; transcription is controlled by activators Reb1p, Gcr1p, and Rap1p through binding sites in the 5' non-coding region; inhibition of Tpi1p activity by PEP (phosphoenolpyruvate) stimulates redox metabolism in respiring cells; E104D mutation in human homolog TPI1 causes a rare autosomal disease; human TPI1 can complement yeast null mutant +S000036419 CDS YDR050C 4 556472 555726 C 2011-02-03 1996-07-31 +S000002458 ORF Verified YDR051C DET1 acid phosphatase DET1 chromosome 4 4 558060 557056 C 2011-02-03 1996-07-31 Acid phosphatase; involved in the non-vesicular transport of sterols in both directions between the endoplasmic reticulum and plasma membrane; deletion confers sensitivity to nickel +S000036483 CDS YDR051C 4 558060 557056 C 2011-02-03 1996-07-31 +S000002460 ORF Dubious YDR053W chromosome 4 4 560249 560644 W 2011-02-03 1996-07-31 Putative protein of unknown function; open reading frame overlaps 5' end of essential DBF4 gene encoding the regulatory subunit of the Cdc7p-Dbf4p kinase complex +S000037331 CDS YDR053W 4 560249 560644 W 2011-02-03 1996-07-31 +S000002459 ORF Verified YDR052C DBF4 protein serine/threonine kinase activating protein DBF4|DNA52|LSD7 chromosome 4 L000000488|S000029149|L000000513 4 560625 558511 C 2011-02-03 1996-07-31 Regulatory subunit of Cdc7p-Dbf4p kinase complex; required for Cdc7p kinase activity and initiation of DNA replication; phosphorylates the Mcm2-7 family of proteins; cell cycle regulated; relative distribution to the nucleus increases upon DNA replication stress; co-expression of human CDC7 and DBF4 complements single cdc7 or dbf4 null mutations or the cdc7 dbf4 double null mutation +S000036579 CDS YDR052C 4 560625 558511 C 2011-02-03 1996-07-31 +S000002461 ORF Verified YDR054C CDC34 SCF E2 ubiquitin-protein ligase catalytic subunit CDC34|UBC3|DNA6 chromosome 4 L000000271 4 562327 561440 C 37 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme (E2); catalytic subunit of SCF ubiquitin-protein ligase complex (together with Skp1p, Rbx1p, Cdc53p, and an F-box protein) that regulates cell cycle progression by targeting key substrates for degradation; protein abundance increases in response to DNA replication stress; human CDC34 functionally complements the thermosensitivity of the cdc34-2 mutant +S000037377 CDS YDR054C 4 562327 561440 C 2011-02-03 1996-07-31 +S000002462 ORF Verified YDR055W PST1 HPF2 chromosome 4 L000004850 4 563527 564861 W 2011-02-03 1996-07-31 Cell wall protein that contains a putative GPI-attachment site; secreted by regenerating protoplasts; up-regulated by activation of the cell integrity pathway, as mediated by Rlm1p; upregulated by cell wall damage via disruption of FKS1; PST1 has a paralog, ECM33, that arose from the whole genome duplication +S000030148 CDS YDR055W 4 563527 564861 W 2011-02-03 1996-07-31 +S000002463 ORF Uncharacterized YDR056C EMC10 chromosome 4 4 565640 565023 C 2011-02-03 1996-07-31 Putative protein of unknown function; subunit of evolutionarily conserved EMC (Endoplasmic Reticulum Membrane Complex) implicated in ERAD (ER-associated degradation) and proper assembly of multi-pass transmembrane (TM) proteins; EMC acts in yeast as an ER-mitochondria tether that interacts with outer membrane protein Tom5p of TOM (Translocase of the Mitochondrial Outer Membrane) complex; YDR056C is not an essential protein +S000030254 CDS YDR056C 4 565640 565023 C 2011-02-03 1996-07-31 +S000002464 ORF Verified YDR057W YOS9 chromosome 4 4 565927 567555 W 2011-02-03 1996-07-31 ER quality-control lectin; integral subunit of the HRD ligase; participates in efficient ER retention of misfolded proteins by recognizing them and delivering them to Hrd1p; binds to glycans with terminal alpha-1,6 linked mannose on misfolded N-glycosylated proteins and participates in targeting proteins to ERAD; member of the OS-9 protein family +S000030476 CDS YDR057W 4 565927 567555 W 2011-02-03 1996-07-31 +S000118436 ARS ARS419 ARSIV-568 chromosome 4 4 567610 567685 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178069 ARS_consensus_sequence ARS419 4 567677 567661 C 2014-11-18 2014-11-18 +S000002465 ORF Verified YDR058C TGL2 triglyceride lipase chromosome 4 L000003248 4 568703 567723 C 2011-02-03 1996-07-31 Triacylglycerol lipase that is localized to the mitochondria; has lipolytic activity towards triacylglycerols and diacylglycerols when expressed in E. coli +S000030539 CDS YDR058C 4 568703 567723 C 2011-02-03 1996-07-31 +S000006709 tRNA_gene tR(UCU)D chromosome 4 L000003767 4 568882 568953 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000037839 noncoding_exon tR(UCU)D 4 568882 568953 W 2011-02-03 2000-05-19 +S000006531 tRNA_gene tD(GUC)D chromosome 4 L000003768 4 568964 569035 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000037680 noncoding_exon tD(GUC)D 4 568964 569035 W 2011-02-03 2000-05-19 +S000002466 ORF Verified YDR059C UBC5 E2 ubiquitin-conjugating protein UBC5 chromosome 4 L000002408 4 569770 569234 C 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme; mediates selective degradation of short-lived, abnormal, or excess proteins, including histone H3; central component of the cellular stress response; expression is heat inducible; protein abundance increases in response to DNA replication stress; UBC5 has a paralog, UBC4, that arose from the whole genome duplication +S000031454 CDS YDR059C 4 569633 569234 C 2011-02-03 1996-07-31 +S000031453 CDS YDR059C 4 569770 569724 C 2011-02-03 1996-07-31 +S000031455 intron YDR059C 4 569723 569634 C 2011-02-03 1996-07-31 +S000002467 ORF Verified YDR060W MAK21 RNA-binding ribosome biosynthesis protein MAK21|NOC1 chromosome 4 L000000993 4 570649 573726 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; required for large (60S) ribosomal subunit biogenesis; acts as part of a Mak21p-Noc2p-Rrp5p module that associates with nascent pre-rRNA during transcription and has a role in bigenesis of the large ribosomal subunit; involved in nuclear export of pre-ribosomes; required for maintenance of dsRNA virus; homolog of human CAATT-binding protein +S000031685 CDS YDR060W 4 570649 573726 W 2011-02-03 1996-07-31 +S000002468 ORF Uncharacterized YDR061W chromosome 4 4 574164 575783 W 2011-02-03 1996-07-31 Protein with similarity to ABC transporter family members; lacks predicted membrane-spanning regions; transcriptionally activated by Yrm1p along with genes involved in multidrug resistance +S000031826 CDS YDR061W 4 574164 575783 W 2011-02-03 1996-07-31 +S000002469 ORF Verified YDR062W LCB2 serine C-palmitoyltransferase LCB2|TSC1|SCS1 chromosome 4 L000001819 4 576474 578159 W 2011-02-03 1996-07-31 Component of serine palmitoyltransferase; responsible along with Lcb1p for the first committed step in sphingolipid synthesis, which is the condensation of serine with palmitoyl-CoA to form 3-ketosphinganine +S000031954 CDS YDR062W 4 576474 578159 W 2011-02-03 1996-07-31 +S000002470 ORF Verified YDR063W AIM7 GMF1|GMF chromosome 4 4 578663 579112 W 2011-02-03 1996-07-31 Protein that interacts with Arp2/3 complex; interacts with Arp2/3 complex to stimulate actin filament debranching and inhibit actin nucleation; has similarity to Cof1p and also to human glia maturation factor (GMF); null mutant displays elevated mitochondrial genome loss +S000032842 CDS YDR063W 4 578663 579112 W 2011-02-03 1996-07-31 +S000002471 ORF Verified YDR064W RPS13 uS15|ribosomal 40S subunit protein S13|YS15|S27a|S15|S13|RPS13C|RPS13B chromosome 4 L000002900|L000002655 4 579458 580452 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S13 and bacterial S15 +S000032956 CDS YDR064W 4 579458 579478 W 2011-02-03 1996-07-31 +S000032957 CDS YDR064W 4 580018 580452 W 2011-02-03 1996-07-31 +S000032958 intron YDR064W 4 579479 580017 W 2011-02-03 1996-07-31 +S000002472 ORF Verified YDR065W RRG1 chromosome 4 4 580687 581784 W 2011-02-03 1996-07-31 Protein of unknown function; required for vacuolar acidification and mitochondrial genome maintenance; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033047 CDS YDR065W 4 580687 581784 W 2011-02-03 1996-07-31 +S000002473 ORF Verified YDR066C RTR2 putative protein-serine/threonine phosphatase chromosome 4 4 582498 581908 C 2011-02-03 1996-07-31 Protein of unknown function; exhibits genetic interactions with Rtr1p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YDR066C is not an essential gene; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress; RTR2 has a paralog, RTR1, that arose from the whole genome duplication +S000033084 CDS YDR066C 4 582498 581908 C 2011-02-03 1996-07-31 +S000002474 ORF Uncharacterized YDR067C OCA6 protein-tyrosine-phosphatase chromosome 4 4 583465 582791 C 2011-02-03 1996-07-31 Cytoplasmic protein required for replication of Brome mosaic virus; S. cerevisiae is a model system for studying positive-strand RNA virus replication; null mutation confers sensitivity to tunicamycin and DTT +S000033843 CDS YDR067C 4 583465 582791 C 2011-02-03 1996-07-31 +S000002475 ORF Verified YDR068W DOS2 chromosome 4 L000000518 4 583713 584645 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000034055 CDS YDR068W 4 583713 584645 W 2011-02-03 1996-07-31 +S000002476 ORF Verified YDR069C DOA4 ubiquitin-specific protease DOA4|UBP4|SSV7|NPI2|MUT4|DOS1 chromosome 4 L000000514 4 587719 584939 C 2011-02-03 1996-07-31 Ubiquitin hydrolase; deubiquitinates intralumenal vesicle (ILVs) cargo proteins; required for recycling ubiquitin from proteasome-bound ubiquitinated intermediates, acts at the late endosome/prevacuolar compartment to recover ubiquitin from ubiquitinated membrane proteins destined for the vacuole; DOA4 has a paralog, UBP5, that arose from the whole genome duplication +S000034891 CDS YDR069C 4 587719 584939 C 2011-02-03 1996-07-31 +S000002477 ORF Verified YDR070C FMP16 chromosome 4 4 588379 588098 C 2011-02-03 1996-07-31 Protein of unknown function; may be involved in responding to conditions of stress; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; protein abundance increases in response to DNA replication stress +S000036234 CDS YDR070C 4 588379 588098 C 2011-02-03 1996-07-31 +S000002478 ORF Verified YDR071C PAA1 polyamine acetyltransferase chromosome 4 4 589402 588827 C 2011-02-03 1996-07-31 Polyamine acetyltransferase; acetylates polyamines (e.g. putrescine, spermidine, spermine) and also aralkylamines (e.g. tryptamine, phenylethylamine); may be involved in transcription and/or DNA replication +S000036334 CDS YDR071C 4 589402 588827 C 2011-02-03 1996-07-31 +S000002479 ORF Verified YDR072C IPT1 MIC2|inositolphosphotransferase|KTI6|SYR4 chromosome 4 L000004226|L000003534|S000029294 4 591344 589761 C 2011-02-03 1996-07-31 Inositolphosphotransferase; involved in synthesis of mannose-(inositol-P)2-ceramide (M(IP)2C), the most abundant sphingolipid; can mutate to resistance to the antifungals syringomycin E and DmAMP1 and to K. lactis zymocin +S000037011 CDS YDR072C 4 591344 589761 C 2011-02-03 1996-07-31 +S000002480 ORF Verified YDR073W SNF11 chromosome 4 L000003167 4 592439 592948 W 2011-02-03 1996-07-31 Subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; interacts with a highly conserved 40-residue sequence of Snf2p; relocates to the cytosol under hypoxic conditions +S000037137 CDS YDR073W 4 592439 592948 W 2011-02-03 1996-07-31 +S000002481 ORF Verified YDR074W TPS2 trehalose-phosphatase TPS2|PFK3|HOG2 chromosome 4 L000002331 4 593893 596583 W 2011-02-03 1996-07-31 Phosphatase subunit of the trehalose-6-P synthase/phosphatase complex; involved in synthesis of the storage carbohydrate trehalose; expression is induced by stress conditions and repressed by the Ras-cAMP pathway; protein abundance increases in response to DNA replication stress +S000037233 CDS YDR074W 4 593893 596583 W 2011-02-03 1996-07-31 +S000002482 ORF Verified YDR075W PPH3 phosphoprotein phosphatase PP4 catalytic subunit PPH3 chromosome 4 L000001471 4 597156 598082 W 53 2011-02-03 1996-07-31 Catalytic subunit of protein phosphatase PP4 complex; Pph3p and Psy2p form active complex, Psy4p may provide substrate specificity; regulates recovery from the DNA damage checkpoint, the gene conversion- and single-strand annealing-mediated pathways of meiotic double-strand break repair and efficient Non-Homologous End-Joining (NHEJ) pathway; involved in activation of Gln3p to alleviate nitrogen catabolite repression; Pph3p and Psy2p localize to foci on meiotic chromosomes +S000029904 CDS YDR075W 4 597156 598082 W 2011-02-03 1996-07-31 +S000002483 ORF Verified YDR076W RAD55 putative DNA-dependent ATPase RAD55 chromosome 4 L000001575 4 598468 599688 W 53 2011-02-03 1996-07-31 Protein that stimulates strand exchange; stimulates strand exchange by stabilizing the binding of Rad51p to single-stranded DNA; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; forms heterodimer with Rad57p +S000030010 CDS YDR076W 4 598468 599688 W 2011-02-03 1996-07-31 +S000002484 ORF Verified YDR077W SED1 chromosome 4 L000001859 4 600793 601809 W 2011-02-03 1996-07-31 Major stress-induced structural GPI-cell wall glycoprotein; associates with translating ribosomes, possible role in mitochondrial genome maintenance; ORF contains two distinct variable minisatellites; SED1 has a paralog, SPI1, that arose from the whole genome duplication +S000030135 CDS YDR077W 4 600793 601809 W 2011-02-03 1996-07-31 +S000002485 ORF Verified YDR078C SHU2 chromosome 4 4 602869 602198 C 2011-02-03 1996-07-31 Component of Shu complex (aka PCSS complex); Shu complex also includes Psy3, Csm2, Shu1, and promotes error-free DNA repair, Shu complex mediates inhibition of Srs2p function; promotes formation of Rad51p filaments; important for both mitotic and meiotic homologous recombination, and contains a conserved SWIM domain that is necessary for both +S000030241 CDS YDR078C 4 602869 602198 C 2011-02-03 1996-07-31 +S000002486 ORF Verified YDR079W PET100 chromosome 4 L000003521 4 603064 603399 W 2011-02-03 1996-07-31 Chaperone that facilitates the assembly of cytochrome c oxidase; integral to the mitochondrial inner membrane; interacts with a subcomplex of subunits VII, VIIa, and VIII (Cox7p, Cox9p, and Cox8p) but not with the holoenzyme +S000031263 CDS YDR079W 4 603064 603399 W 2011-02-03 1996-07-31 +S000007603 ORF Verified YDR079C-A TFB5 TFIIH complex subunit TFB5 chromosome 4 4 603811 603593 C 2011-02-03 2001-02-26 Component of RNA polymerase II general transcription factor TFIIH; involved in transcription initiation and in nucleotide-excision repair; relocalizes to the cytosol in response to hypoxia; homolog of Chlamydomonas reinhardtii REX1-S protein involved in DNA repair +S000037149 CDS YDR079C-A 4 603811 603593 C 2011-02-03 2001-02-26 +S000002487 ORF Verified YDR080W VPS41 VPL20|VAM2|SVL2|FET2|CVT8 chromosome 4 L000003512|L000004234 4 604008 606986 W 2011-02-03 1996-07-31 Subunit of the HOPS endocytic tethering complex; vacuole membrane protein that functions as a Rab GTPase effector, interacting specifically with the GTP-bound conformation of Ypt7p, facilitating tethering, docking and promoting membrane fusion events at the late endosome and vacuole; required for both membrane and protein trafficking; Yck3p-mediated phosphorylation regulates the organization of vacuolar fusion sites +S000032217 CDS YDR080W 4 604008 606986 W 2011-02-03 1996-07-31 +S000002488 ORF Verified YDR081C PDC2 chromosome 4 L000001355 4 610081 607304 C 50 2011-02-03 1996-07-31 Transcription factor for thiamine-regulated genes; required for expression of the two isoforms of pyruvate decarboxylase (PDC1 and PDC5) along with thiamine biosynthetic genes; binds a DNA sequence in the PDC5 promoter; mutant fails to grow on 2% glucose and thus is scored as inviable under standard conditions +S000032243 CDS YDR081C 4 610081 607304 C 2011-02-03 1996-07-31 +S000002489 ORF Verified YDR082W STN1 chromosome 4 L000003921 4 610441 611925 W 2011-02-03 1996-07-31 Telomere end-binding and capping protein; plays a key role with Pol12p in linking telomerase action with completion of lagging strand synthesis, and in a regulatory step required for telomere capping; similar to human Stn1 +S000032408 CDS YDR082W 4 610441 611925 W 2011-02-03 1996-07-31 +S000002490 ORF Verified YDR083W RRP8 25S rRNA (adenine645-N1)-methyltransferase chromosome 4 4 612073 613251 W 2011-02-03 2003-09-22|2006-01-19|1996-07-31 Nucleolar S-adenosylmethionine-dependent rRNA methyltransferase; methylates adenine (m1A) of the large subunit (LSU) rRNA at position 645; involved in pre-rRNA cleavage at site A2; mutation is synthetically lethal with a gar1 mutation; deletion disrupts telomere maintenance by influencing the expression of neighboring gene STN1 +S000033239 CDS YDR083W 4 612073 613251 W 2011-02-03 2003-09-22|2006-01-19|1996-07-31 +S000002491 ORF Verified YDR084C TVP23 chromosome 4 4 614004 613405 C 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000033277 CDS YDR084C 4 614004 613405 C 2011-02-03 1996-07-31 +S000002492 ORF Verified YDR085C AFR1 chromosome 4 L000000059 4 616150 614288 C 47.97 2011-02-03 1996-07-31 Protein required for pheromone-induced projection (shmoo) formation; regulates septin architecture during mating; has an RVXF motif that mediates targeting of Glc7p to mating projections; interacts with Cdc12p; AFR1 has a paralog, YER158C, that arose from the whole genome duplication +S000033345 CDS YDR085C 4 616150 614288 C 2011-02-03 1996-07-31 +S000002493 ORF Verified YDR086C SSS1 translocon subunit SSS1 chromosome 4 L000002092 4 617170 616928 C 2011-02-03 1996-07-31 Subunit of the Sec61p translocation complex (Sec61p-Sss1p-Sbh1p); this complex forms a channel for passage of secretory proteins through the endoplasmic reticulum membrane, and of the Ssh1p complex (Ssh1p-Sbh2p-Sss1p); interacts with Ost4p and Wbp1p +S000033427 CDS YDR086C 4 617170 616928 C 2011-02-03 1996-07-31 +S000002494 ORF Verified YDR087C RRP1 chromosome 4 L000001774 4 618306 617470 C 2011-02-03 1996-07-31 Essential evolutionarily conserved nucleolar protein; necessary for biogenesis of 60S ribosomal subunits and for processing of pre-rRNAs to mature rRNA; associated with several distinct 66S pre-ribosomal particles +S000034333 CDS YDR087C 4 618306 617470 C 2011-02-03 1996-07-31 +S000002495 ORF Verified YDR088C SLU7 mRNA splicing protein SLU7|SLT17 chromosome 4 L000001922 4 619645 618497 C 2011-02-03 1996-07-31 RNA splicing factor; required for ATP-independent portion of 2nd catalytic step of spliceosomal RNA splicing; interacts with Prp18p; contains zinc knuckle domain +S000034412 CDS YDR088C 4 619645 618497 C 2011-02-03 1996-07-31 +S000006700 tRNA_gene tR(ACG)D chromosome 4 L000003786 4 620041 619969 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030369 noncoding_exon tR(ACG)D 4 620041 619969 C 2011-02-03 2000-05-19 +S000002496 ORF Verified YDR089W VTC5 chromosome 4 4 622112 624721 W 2011-02-03 1996-07-31 Novel subunit of the vacuolar transporter chaperone complex; vacuolar transmembrane protein that regulates biosynthesis of polyphosphate; deletion reduces and overexpression increases polyP accumulation; SPX domain (Syg1, Pho81, Xpr1)-containing protein involved in phosphate homeostasis; relocalizes from vacuole to cytoplasm upon DNA replication stress +S000035491 CDS YDR089W 4 622112 624721 W 2011-02-03 1996-07-31 +S000002497 ORF Uncharacterized YDR090C chromosome 4 4 625998 625066 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000035405 CDS YDR090C 4 625998 625066 C 2011-02-03 1996-07-31 +S000002498 ORF Verified YDR091C RLI1 Fe-S cluster-binding ribosome biosynthesis protein chromosome 4 4 628534 626708 C 2011-02-03 1996-07-31 Essential Fe-S protein; required for ribosome biogenesis, translation initiation/termination; facilitates binding of multifactor complex (MFC) of initiation factors to small ribosomal subunit; Dom34-Hbs1 complex and Rli1p work in dissociating inactive ribosomes, thereby facilitating translation restart; forms complex with Lto1p and Yae1p; dependency on ROS-labile FeS clusters, activity in nuclear ribosomal-subunit export impaired by mild oxidative stress +S000035466 CDS YDR091C 4 628534 626708 C 2011-02-03 1996-07-31 +S000130174 ARS ARS420 chromosome 4 4 628938 629582 2014-11-18 2014-11-18|2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000002499 ORF Verified YDR092W UBC13 E2 ubiquitin-conjugating protein UBC13 chromosome 4 L000003387 4 629876 630605 W 2011-02-03 1996-07-31 E2 ubiquitin-conjugating enzyme; involved in the error-free DNA postreplication repair pathway; interacts with Mms2p to assemble ubiquitin chains at the Ub Lys-63 residue; DNA damage triggers redistribution from the cytoplasm to the nucleus +S000035560 CDS YDR092W 4 629876 629905 W 2011-02-03 1996-07-31 +S000035561 CDS YDR092W 4 630174 630605 W 2011-02-03 1996-07-31 +S000035562 intron YDR092W 4 629906 630173 W 2011-02-03 1996-07-31 +S000002500 ORF Verified YDR093W DNF2 aminophospholipid-translocating P4-type ATPase DNF2 chromosome 4 4 631282 636120 W 2011-02-03 1996-07-31 Aminophospholipid translocase (flippase); type 4 P-type ATPase; involved in phospholipid translocation, contributing to endocytosis, protein transport, and cellular polarization; localizes primarily to the plasma membrane; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone; DNF2 has a paralog, DNF1, that arose from the whole genome duplication +S000036482 CDS YDR093W 4 631282 636120 W 2011-02-03 1996-07-31 +S000002501 ORF Dubious YDR094W chromosome 4 4 635840 636175 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF DNF2/YDR093W +S000036554 CDS YDR094W 4 635840 636175 W 2011-02-03 1996-07-31 +S000002502 ORF Dubious YDR095C chromosome 4 4 636527 636117 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036605 CDS YDR095C 4 636527 636117 C 2011-02-03 1996-07-31 +S000002503 ORF Verified YDR096W GIS1 histone demethylase GIS1 chromosome 4 L000003351 4 637139 639823 W 2011-02-03 1996-07-31 Histone demethylase and transcription factor; regulates genes during nutrient limitation; activity modulated by proteasome-mediated proteolysis; has JmjC and JmjN domain in N-terminus that interact, promoting stability and proper transcriptional activity; contains two transactivating domains downstream of Jmj domains and a C-terminal DNA binding domain; relocalizes to the cytosol in response to hypoxia; GIS1 has a paralog, RPH1, that arose from the whole genome duplication +S000037381 CDS YDR096W 4 637139 639823 W 2011-02-03 1996-07-31 +S000118437 ARS ARS421 ARSIV-640 chromosome 4 4 640006 640072 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178070 ARS_consensus_sequence ARS421 4 640062 640046 C 2014-11-18 2014-11-18 +S000002504 ORF Verified YDR097C MSH6 PMS6|mismatch repair ATPase MSH6|PMS3 chromosome 4 L000003135|L000004503|S000029377 4 643837 640109 C 2011-02-03 1996-07-31 Protein required for mismatch repair in mitosis and meiosis; forms a complex with Msh2p to repair both single-base & insertion-deletion mispairs; also involved in interstrand cross-link repair; potentially phosphorylated by Cdc28p +S000037420 CDS YDR097C 4 643837 640109 C 2011-02-03 1996-07-31 +S000002505 ORF Verified YDR098C GRX3 monothiol glutaredoxin GRX3 chromosome 4 S000007444 4 644930 644178 C 2014-11-18 1996-07-31|2014-11-18 Glutathione-dependent oxidoreductase; hydroperoxide and superoxide-radical responsive; monothiol glutaredoxin subfamily member along with Grx4p and Grx5p; protects cells from oxidative damage; with Grx4p, binds to Aft1p in iron-replete conditions, promoting its dissociation from promoters; evidence exists indicating that the translation start site is not Met1 as currently annotated, but rather Met36; GRX3 has a paralog, GRX4, that arose from the whole genome duplication +S000037543 CDS YDR098C 4 644930 644178 C 2014-11-18 1996-07-31|2014-11-18 +S000006694 tRNA_gene tQ(UUG)D2 chromosome 4 L000003785 4 645224 645153 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034810 noncoding_exon tQ(UUG)D2 4 645224 645153 C 2011-02-03 2000-05-19 +S000006850 long_terminal_repeat YDRCdelta7 chromosome 4 4 645835 645502 C 2011-02-03 2000-05-19 Ty1 LTR +S000007391 transposable_element_gene YDR098C-B gag-pol fusion protein chromosome 4 4 651126 645858 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032257 CDS YDR098C-B 4 649820 645858 C 2011-02-03 1999-07-17 +S000032256 CDS YDR098C-B 4 651126 649822 C 2011-02-03 1999-07-17 +S000032258 plus_1_translational_frameshift YDR098C-B 4 649821 649821 C 2011-02-03 1999-07-17 +S000007390 transposable_element_gene YDR098C-A gag protein chromosome 4 4 651126 649804 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000032236 CDS YDR098C-A 4 651126 649804 C 2011-02-03 1999-07-17 +S000006859 LTR_retrotransposon YDRCTy1-1 Ty1 chromosome 4 4 651419 645502 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006851 long_terminal_repeat YDRCdelta8 chromosome 4 4 651419 651086 C 2011-02-03 2000-05-19 Ty1 LTR +S000006855 long_terminal_repeat YDRCsigma1 chromosome 4 4 651503 651420 C 2011-02-03 2000-05-19 Ty3 LTR +S000006852 long_terminal_repeat YDRCdelta9 chromosome 4 4 651980 651682 C 2011-02-03 2000-05-19 Ty1 LTR +S000002506 ORF Verified YDR099W BMH2 14-3-3 family protein BMH2|SCD3 chromosome 4 L000000186 4 653607 654428 W 63 2011-02-03 1996-07-31 14-3-3 protein, minor isoform; controls proteome at post-transcriptional level, binds proteins and DNA, involved in regulation of many processes including exocytosis, vesicle transport, Ras/MAPK signaling, and rapamycin-sensitive signaling; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; abundance relative to Bmh1p increases during sporulation +S000030398 CDS YDR099W 4 653607 654428 W 2011-02-03 1996-07-31 +S000122095 five_prime_UTR_intron YDR099W 4 652781 653523 W 2011-02-03 2007-04-04 +S000002507 ORF Verified YDR100W TVP15 chromosome 4 4 655013 655444 W 2011-02-03 1996-07-31 Integral membrane protein; localized to late Golgi vesicles along with the v-SNARE Tlg2p +S000035845 CDS YDR100W 4 655013 655444 W 2011-02-03 1996-07-31 +S000002508 ORF Verified YDR101C ARX1 putative hydrolase chromosome 4 4 657467 655686 C 2011-02-03 1996-07-31 Nuclear export factor for the ribosomal pre-60S subunit; shuttling factor which directly binds FG rich nucleoporins and facilities translocation through the nuclear pore complex; interacts directly with Alb1p; responsible for Tif6p recycling defects in the absence of Rei1; associated with the ribosomal export complex +S000035887 CDS YDR101C 4 657467 655686 C 2011-02-03 1996-07-31 +S000002509 ORF Uncharacterized YDR102C chromosome 4 4 657980 657648 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR102C is not an essential gene; homozygous diploid deletion strain exhibits high budding index +S000036020 CDS YDR102C 4 657980 657648 C 2011-02-03 1996-07-31 +S000002510 ORF Verified YDR103W STE5 NUL3|HMD3 chromosome 4 L000002115 4 658350 661103 W 63 2011-02-03 1996-07-31 Pheromone-responsive MAPK scaffold protein; couples activation of the G-protein-coupled pheromone receptor to MAPK activation; intramolecular interaction of PH and VWA domains blocks activation of assembled signaling cascade components (Ste11p, Ste7p and Fus3p) under basal conditions; Gbeta-gamma (Ste4p-Ste18p)-dependent docking at the plasma membrane and binding of PI(4,5)P2 by the PH domain relieves autoinhibition, resulting in pheromone-dependent pathway activation +S000036909 CDS YDR103W 4 658350 661103 W 2011-02-03 1996-07-31 +S000002511 ORF Verified YDR104C SPO71 chromosome 4 4 664910 661173 C 2011-02-03 1996-07-31 Meiosis-specific protein required for prospore membrane morphogenesis; localizes to the prospore membrane (PSM) during sporulation; required for PSM elongation and closure; genetically antagonistic to SPO1; recruits Vps13p to the PSM during sporulation; interacts and functions cooperatively with Spo73p; mutants have defects in the PSM, aberrant spore wall formation and reduced PtdIns-phosphate pools in the PSM; contains three PH-like domains +S000036931 CDS YDR104C 4 664910 661173 C 2011-02-03 1996-07-31 +S000002512 ORF Verified YDR105C TMS1 chromosome 4 4 666770 665349 C 2011-02-03 1996-07-31 Vacuolar membrane protein of unknown function; is conserved in mammals; predicted to contain eleven transmembrane helices; interacts with Pdr5p, a protein involved in multidrug resistance +S000036992 CDS YDR105C 4 666770 665349 C 2011-02-03 1996-07-31 +S000002513 ORF Verified YDR106W ARP10 chromosome 4 L000003439 4 667004 667858 W 2011-02-03 1996-07-31 Component of the dynactin complex; localized to the pointed end of the Arp1p filament; may regulate membrane association of the complex +S000037120 CDS YDR106W 4 667004 667858 W 2011-02-03 1996-07-31 +S000006601 tRNA_gene tI(AAU)D chromosome 4 L000003784 4 668080 668007 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000030399 noncoding_exon tI(AAU)D 4 668080 668007 C 2011-02-03 2000-05-19 +S000006856 long_terminal_repeat YDRWsigma2 YDRCsigma2 chromosome 4 4 668096 668436 W 2011-02-03 2000-05-19|2007-04-02 Ty3 LTR +S000006864 long_terminal_repeat YDRWdelta10 chromosome 4 4 668543 668784 W 2011-02-03 2000-05-19 Ty1 LTR +S000002514 ORF Verified YDR107C TMN2 chromosome 4 4 671034 669016 C 2011-02-03 1996-07-31 Protein with a role in cellular adhesion and filamentous growth; similar to Tmn3p; member of the evolutionarily conserved Transmembrane Nine family of proteins with nine membrane-spanning segments; TMN2 has a paralog, EMP70, that arose from the whole genome duplication +S000037823 CDS YDR107C 4 671034 669016 C 2011-02-03 1996-07-31 +S000002515 ORF Verified YDR108W TRS85 GSG1|MUM1 chromosome 4 L000002779|S000029315|L000002585 4 671269 673365 W 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex III; TRAPPIII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating endosome-Golgi traffic and required for membrane expansion during autophagy and the CVT pathway; directs Ypt1p to the PAS; late post-replication meiotic role +S000029911 CDS YDR108W 4 671269 673365 W 2011-02-03 1996-07-31 +S000002516 ORF Uncharacterized YDR109C putative phosphotransferase chromosome 4 4 675667 673520 C 2011-02-03 1996-07-31 Putative kinase +S000029962 CDS YDR109C 4 675667 673520 C 2011-02-03 1996-07-31 +S000002517 ORF Verified YDR110W FOB1 replication fork barrier binding protein FOB1|HRM1 chromosome 4 L000003959 4 676102 677802 W 2011-02-03 1996-07-31 Nucleolar protein that binds the rDNA replication fork barrier site; required for replication fork blocking, recombinational hotspot activity, condensin recruitment to replication fork barrier (RFB), and rDNA repeat segregation; related to retroviral integrases +S000031039 CDS YDR110W 4 676102 677802 W 2011-02-03 1996-07-31 +S000002519 ORF Dubious YDR112W IRC2 chromosome 4 4 679544 679852 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ALT2/YDR111C; null mutant displays increased levels of spontaneous Rad52p foci +S000032093 CDS YDR112W 4 679544 679852 W 2011-02-03 1996-07-31 +S000002518 ORF Uncharacterized YDR111C ALT2 alanine transaminase ALT2 chromosome 4 4 679764 678241 C 2011-02-03 1996-07-31 Catalytically inactive alanine transaminase; expression is repressed in the presence of alanine and repression is mediated by Nrg1p; ALT2 has a paralog, ALT1, that arose from the whole genome duplication +S000031067 CDS YDR111C 4 679764 678241 C 2011-02-03 1996-07-31 +S000002520 ORF Verified YDR113C PDS1 securin chromosome 4 L000001368 4 681617 680496 C 2011-02-03 1996-07-31 Securin; inhibits anaphase by binding separin Esp1p; blocks cyclin destruction and mitotic exit, essential for meiotic progression and mitotic cell cycle arrest; localization is cell-cycle dependent and regulated by Cdc28p phosphorylation +S000032118 CDS YDR113C 4 681617 680496 C 2011-02-03 1996-07-31 +S000002522 ORF Verified YDR115W MRX14 putative mitochondrial 54S ribosomal protein chromosome 4 4 682175 682492 W 2011-02-03 1996-07-31 Putative mitochondrial ribosomal protein of the large subunit; similar to E. coli L34 ribosomal protein; required for respiratory growth, as are most mitochondrial ribosomal proteins; protein increases in abundance and relocalizes to the plasma membrane upon DNA replication stress +S000032311 CDS YDR115W 4 682175 682492 W 2011-02-03 1996-07-31 +S000002521 ORF Uncharacterized YDR114C chromosome 4 4 682226 681924 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant exhibits poor growth at elevated pH and calcium +S000032200 CDS YDR114C 4 682226 681924 C 2011-02-03 1996-07-31 +S000002523 ORF Verified YDR116C MRPL1 mitochondrial 54S ribosomal protein MRPL1 chromosome 4 4 683581 682724 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000033144 CDS YDR116C 4 683581 682724 C 2011-02-03 1996-07-31 +S000002524 ORF Verified YDR117C TMA64 RBF64 chromosome 4 4 685643 683946 C 2011-02-03 1996-07-31 Protein of unknown function that associates with ribosomes; has a putative RNA binding domain; in mammals the corresponding protein, eIF2D, has been shown to possess translation initiation factor activity +S000033197 CDS YDR117C 4 685643 683946 C 2011-02-03 1996-07-31 +S000002525 ORF Verified YDR118W APC4 anaphase promoting complex subunit 4 chromosome 4 L000004319 4 685882 687840 W 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; component of the platform domain of the APC/C, based on structural analysis; relative distribution to the nucleus increases upon DNA replication stress +S000033282 CDS YDR118W 4 685882 687840 W 2011-02-03 1996-07-31 +S000028820 ORF Dubious YDR118W-A chromosome 4 4 687768 687884 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified using a combination of expression profiling and mass spectrometry +S000033639 CDS YDR118W-A 4 687768 687884 W 2011-02-03 2003-07-29 +S000002526 ORF Uncharacterized YDR119W VBA4 chromosome 4 4 688227 690533 W 2011-02-03 1996-07-31 Protein of unknown function; proposed role as a basic amino acid permease based on phylogeny; GFP-fusion protein localizes to vacuolar membrane; physical interaction with Atg27p suggests a possible role in autophagy; non-essential gene +S000034153 CDS YDR119W 4 688227 690533 W 2011-02-03 1996-07-31 +S000113555 ORF Verified YDR119W-A COX26 chromosome 4 4 691014 691214 W 2011-02-03 2005-11-16 Stabilizes or regulates formation of respiratory chain supercomplexes composed of Complex III (ubiquinol-cytochrome c reductase) and Complex IV (cytochrome c oxidase) +S000113556 CDS YDR119W-A 4 691014 691214 W 2011-02-03 2005-11-16 +S000002527 ORF Verified YDR120C TRM1 tRNA (guanine26-N2)-dimethyltransferase chromosome 4 L000002337 4 693261 691549 C 2011-02-03 1996-07-31 tRNA methyltransferase; two forms of protein are made by alternative translation starts; localizes to both nucleus and mitochondrion to produce modified base N2,N2-dimethylguanosine in tRNAs in both compartments; nuclear Trm1p is evenly distributed around inner nuclear membrane in WT, but mislocalizes as puncta near ER-nucleus junctions in spindle pole body (SPB) mutants; both Trm1p inner nuclear membrane targeting and maintenance depend upon SPB +S000035345 CDS YDR120C 4 693261 691549 C 2011-02-03 1996-07-31 +S000002528 ORF Verified YDR121W DPB4 DNA polymerase epsilon noncatalytic subunit chromosome 4 S000007463 4 693585 694175 W 2011-02-03 1996-07-31 Subunit of DNA pol epsilon and of ISW2 chromatin accessibility complex; involved in both chromosomal DNA replication and inheritance of telomeric silencing; stabilizes the interaction of Pol epsilon with primer-template DNA, positively affecting the processivity of the polymerase and exonuclease activities of Pol epsilon; interacts with extranucleosomal DNA and acts as anchor point for ISW2 complex that retains its position on DNA during nucleosome mobilization +S000035456 CDS YDR121W 4 693585 694175 W 2011-02-03 1996-07-31 +S000002529 ORF Verified YDR122W KIN1 serine/threonine protein kinase KIN1 chromosome 4 L000000901 4 694700 697894 W 2011-02-03 1996-07-31 Serine/threonine protein kinase involved in regulation of exocytosis; localizes to the cytoplasmic face of the plasma membrane; KIN1 has a paralog, KIN2, that arose from the whole genome duplication +S000036387 CDS YDR122W 4 694700 697894 W 2011-02-03 1996-07-31 +S000002530 ORF Verified YDR123C INO2 SCS1|DIE1 chromosome 4 L000000868|L000002801 4 699468 698554 C 2011-02-03 1996-07-31 Transcription factor; component of the heteromeric Ino2p/Ino4p basic helix-loop-helix transcription activator that binds inositol/choline-responsive elements (ICREs), required for derepression of phospholipid biosynthetic genes in response to inositol depletion; involved in diauxic shift +S000036420 CDS YDR123C 4 699468 698554 C 2011-02-03 1996-07-31 +S000002531 ORF Uncharacterized YDR124W chromosome 4 4 700315 701289 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; expression is strongly induced by alpha factor +S000036553 CDS YDR124W 4 700315 701289 W 2011-02-03 1996-07-31 +S000002532 ORF Verified YDR125C ECM18 alpha/beta hydrolase family protein chromosome 4 L000003893 4 702758 701397 C 2011-02-03 1996-07-31 Protein of unknown function; ECM18 has a paralog, ICT1, that arose from the whole genome duplication +S000036581 CDS YDR125C 4 702758 701397 C 2011-02-03 1996-07-31 +S000114834 ARS ARS422 ARS422 ARSIV-703|ARO1 ARS chromosome 4 4 702887 703132 2011-02-03 2006-09-08|2006-04-12 Autonomously Replicating Sequence +S000178071 ARS_consensus_sequence ARS422 4 702924 702940 W 2014-11-18 2014-11-18 +S000002533 ORF Verified YDR126W SWF1 palmitoyltransferase SWF1|PSL10 chromosome 4 4 703234 704244 W 2011-02-03 1996-07-31 Palmitoyltransferase that acts on transmembrane proteins; including the SNAREs Snc1p, Syn8p, Tlg1p and likely all SNAREs; contains an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain; may have a role in vacuole fusion +S000037340 CDS YDR126W 4 703234 704244 W 2011-02-03 1996-07-31 +S000002534 ORF Verified YDR127W ARO1 pentafunctional protein ARO1p chromosome 4 L000000116 4 704484 709250 W 81 2011-02-03 1996-07-31 Pentafunctional arom protein; catalyzes steps 2 through 6 in the biosynthesis of chorismate, which is a precursor to aromatic amino acids +S000037463 CDS YDR127W 4 704484 709250 W 2011-02-03 1996-07-31 +S000002535 ORF Verified YDR128W MTC5 SEA3 chromosome 4 4 709549 712995 W 2011-02-03 1996-07-31 Subunit of SEACAT, a subcomplex of the SEA complex; Mtc1p, along with Rtc1p and Sea4p, redundantly inhibit the TORC1 inhibitory role of the Iml1p/SEACIT (Iml1p-Npr2p-Npr3p) subcomplex, a GAP for GTPase Gtr1p (EGOC subunit) in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; relative distribution to the vacuolar membrane decreases upon DNA replication stress +S000030151 CDS YDR128W 4 709549 712995 W 2011-02-03 1996-07-31 +S000002536 ORF Verified YDR129C SAC6 fimbrin|ABP67 chromosome 4 L000001793 4 715379 713340 C 84 2011-02-03 1996-07-31 Fimbrin, actin-bundling protein; cooperates with Scp1p in organization and maintenance of the actin cytoskeleton; phosphorylated by Cdc28p/Clb2p in metaphase on T103, to regulate conformation, and modulate actin filament binding affinity and actin cable dynamics; relocalizes from the plasma membrane to the cytoplasm upon DNA replication stress; human homologs PLS3 and LCP1 implicated in spinocerebellar ataxia type 2 (SCA2) can each complement yeast null mutant +S000030258 CDS YDR129C 4 715247 713340 C 2011-02-03 1996-07-31 +S000030257 CDS YDR129C 4 715379 715359 C 2011-02-03 1996-07-31 +S000030259 intron YDR129C 4 715358 715248 C 2011-02-03 1996-07-31 +S000002537 ORF Verified YDR130C FIN1 chromosome 4 4 716622 715747 C 2011-02-03 1996-07-31 Spindle pole body-related intermediate filament protein; forms cell cycle-specific filaments between spindle pole bodies in dividing cells; localizes to poles and microtubules of spindle during anaphase and contributes to spindle stability; involved in Glc7p localization and regulation; relative distribution to the nucleus increases upon DNA replication stress +S000030642 CDS YDR130C 4 716622 715747 C 2011-02-03 1996-07-31 +S000002538 ORF Verified YDR131C chromosome 4 4 718460 716790 C 2011-02-03 1996-07-31 F-box protein subunit of SCF ubiquitin ligase complex; substrate-specific adaptor subunit that recruits substrates to a core ubiquitination complex +S000030724 CDS YDR131C 4 718460 716790 C 2011-02-03 1996-07-31 +S000002539 ORF Verified YDR132C chromosome 4 4 720303 718816 C 2011-02-03 1996-07-31 Protein of unknown function; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; YDR132C has a paralog, YLR108C, that arose from the whole genome duplication +S000031561 CDS YDR132C 4 720303 718816 C 2011-02-03 1996-07-31 +S000002540 ORF Dubious YDR133C chromosome 4 4 721297 720962 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps YDR134C +S000031648 CDS YDR133C 4 721297 720962 C 2011-02-03 1996-07-31 +S000002541 blocked_reading_frame YDR134C chromosome 4 4 721481 721071 C 2011-02-03 1996-07-31 Cell wall protein; YDR134C has a paralog, CCW12, that arose from the whole genome duplication; S. cerevisiae genome reference strain S288C contains an internal in-frame stop at codon 67, which in other strains encodes glutamine +S000031764 CDS YDR134C 4 721481 721071 C 2011-02-03 1996-07-31 +S000002542 ORF Verified YDR135C YCF1 ATP-binding cassette glutathione S-conjugate transporter YCF1 chromosome 4 L000002499 4 727551 723004 C 2011-02-03 1996-07-31 Vacuolar glutathione S-conjugate transporter; ABC-C transporter of the ATP-binding cassette family; required for vacuole fusion; forms stable complexes with vacuole fusion machinery; regulates Vam7p recruitment to vacuoles; role in detoxifying metals (Cd, Hg, As); transports GSSG that is not immediately reduced in cytosol to vacuole; transports unconjugated bilirubin, selenodigluthatione, oxidized glutathione; similar to human cystic fibrosis protein CFTR +S000031914 CDS YDR135C 4 727551 723004 C 2011-02-03 1996-07-31 +S000002544 ORF Verified YDR137W RGP1 chromosome 4 L000001628 4 728259 730250 W 82 2011-02-03 1996-07-31 Subunit of a Golgi membrane exchange factor (Ric1p-Rgp1p); this complex catalyzes nucleotide exchange on Ypt6p +S000032960 CDS YDR137W 4 728259 730250 W 2011-02-03 1996-07-31 +S000002543 ORF Dubious YDR136C VPS61 chromosome 4 4 728283 727711 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 4% of ORF overlaps the verified gene RGP1; deletion causes a vacuolar protein sorting defect +S000032795 CDS YDR136C 4 728283 727711 C 2011-02-03 1996-07-31 +S000002545 ORF Verified YDR138W HPR1 TRF1 chromosome 4 L000000808 4 730578 732836 W 82 2011-02-03 1996-07-31 Subunit of THO/TREX complexes; this complex couple transcription elongation with mitotic recombination and with mRNA metabolism and export, subunit of an RNA Pol II complex; regulates lifespan; involved in telomere maintenance; similar to Top1p +S000033050 CDS YDR138W 4 730578 732836 W 2011-02-03 1996-07-31 +S000002546 ORF Verified YDR139C RUB1 NEDD8 family protein RUB1 chromosome 4 L000003330|L000004485 4 733924 733618 C 2011-02-03 2000-12-01|1996-07-31 Ubiquitin-like protein with similarity to mammalian NEDD8; conjugation (neddylation) substrates include the cullins Cdc53p, Rtt101p, and Cul3p; activated by Ula1p and Uba3p (E1 enzyme pair); conjugation mediated by Ubc12p (E2 enzyme) +S000033098 CDS YDR139C 4 733702 733618 C 2011-02-03 2000-12-01|1996-07-31 +S000033097 CDS YDR139C 4 733924 733776 C 2011-02-03 2000-12-01|1996-07-31 +S000033099 intron YDR139C 4 733775 733703 C 2011-02-03 2000-12-01|1996-07-31 +S000002547 ORF Verified YDR140W MTQ2 S-adenosylmethionine-dependent methyltransferase chromosome 4 4 734138 734803 W 2011-02-03 1996-07-31 S-adenosylmethionine-dependent methyltransferase; subunit of complex with Trm112p that methylates translation release factor Sup45p (eRF1) in the ternary complex eRF1-eRF3-GTP; similar to E.coli PrmC; member of the seven beta-strand family +S000036021 CDS YDR140W 4 734138 734803 W 2011-02-03 1996-07-31 +S000002548 ORF Verified YDR141C DOP1 chromosome 4 4 739997 734901 C 2011-02-03 1996-07-31 Golgi-localized, leucine-zipper domain containing protein; involved in endosome to Golgi transport, organization of the ER, establishing cell polarity, and morphogenesis; detected in highly purified mitochondria in high-throughput studies +S000036047 CDS YDR141C 4 739997 734901 C 2011-02-03 1996-07-31 +S000002549 ORF Verified YDR142C PEX7 PEB1|PAS7 chromosome 4 L000001340 4 741600 740473 C 2011-02-03 1996-07-31 Peroxisomal signal receptor for peroxisomal matrix proteins; recognizes the N-terminal nonapeptide signal (PTS2); WD repeat protein; defects in human homolog cause lethal rhizomelic chondrodysplasia punctata (RCDP) +S000036136 CDS YDR142C 4 741600 740473 C 2011-02-03 1996-07-31 +S000002550 ORF Verified YDR143C SAN1 ubiquitin-protein ligase SAN1 chromosome 4 L000001800 4 743874 742042 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase; involved in proteasome-dependent degradation of aberrant nuclear proteins; targets substrates with regions of exposed hydrophobicity containing 5 or more contiguous hydrophobic residues; contains intrinsically disordered regions that contribute to substrate recognition; prefers a window of exposed hydrophobicity that causes a particular level of protein insolubility, suggesting that San1p evolved to target highly aggregation-prone proteins +S000036257 CDS YDR143C 4 743874 742042 C 2011-02-03 1996-07-31 +S000002551 ORF Verified YDR144C MKC7 aspartyl protease|YPS2 chromosome 4 L000003069 4 746101 744311 C 2011-02-03 1996-07-31 GPI-anchored aspartyl protease; member of the yapsin family of proteases involved in cell wall growth and maintenance; shares functions with Yap3p and Kex2p; MKC7 has a paralog, YPS1, that arose from the whole genome duplication +S000036336 CDS YDR144C 4 746101 744311 C 2011-02-03 1996-07-31 +S000002552 ORF Verified YDR145W TAF12 TafII61|TafII68|TAF68|TAF61 chromosome 4 L000003462 4 746738 748357 W 2011-02-03 1996-07-31 Subunit (61/68 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification, similar to histone H2A; overexpression of the human ortholog, TAF12, an oncogene involved in the formation of choroid plexus carcinomas, results in dosage chromosomal instability (dCIN) in a human cell line similar to the dCIN observed in yeast overexpressors +S000037046 CDS YDR145W 4 746738 748357 W 2011-02-03 1996-07-31 +S000119070 ARS ARS451 ARSIV-748|ARS422.5 chromosome 4 4 748392 748637 2011-02-03 2006-10-05 Autonomously Replicating Sequence +S000178072 ARS_consensus_sequence ARS451 4 748456 748472 W 2014-11-18 2014-11-18 +S000002553 ORF Verified YDR146C SWI5 DNA-binding transcription factor SWI5 chromosome 4 L000002253 4 750742 748613 C 2011-02-03 1996-07-31 Transcription factor that recruits Mediator and Swi/Snf complexes; activates transcription of genes expressed at the M/G1 phase boundary and in G1 phase; required for expression of the HO gene controlling mating type switching; localization to nucleus occurs during G1 and appears to be regulated by phosphorylation by Cdc28p kinase; SWI5 has a paralog, ACE2, that arose from the whole genome duplication +S000037075 CDS YDR146C 4 750742 748613 C 2011-02-03 1996-07-31 +S000002554 ORF Verified YDR147W EKI1 bifunctional choline kinase/ethanolamine kinase EKI1 chromosome 4 L000004610 4 751631 753235 W 2011-02-03 1996-07-31 Ethanolamine kinase; primarily responsible for phosphatidylethanolamine synthesis via the CDP-ethanolamine pathway; exhibits some choline kinase activity, thus contributing to phosphatidylcholine synthesis via the CDP-choline pathway; EKI1 has a paralog, CKI1, that arose from the whole genome duplication +S000037235 CDS YDR147W 4 751631 753235 W 2011-02-03 1996-07-31 +S000118438 ARS ARS423 ARSIV-753 chromosome 4 4 753242 753386 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178073 ARS_consensus_sequence ARS423 4 753333 753317 C 2014-11-18 2014-11-18 +S000002555 ORF Verified YDR148C KGD2 alpha-ketoglutarate dehydrogenase KGD2 chromosome 4 L000000898 4 755066 753675 C 2011-02-03 1996-07-31 Dihydrolipoyl transsuccinylase; component of the mitochondrial alpha-ketoglutarate dehydrogenase complex, which catalyzes the oxidative decarboxylation of alpha-ketoglutarate to succinyl-CoA in the TCA cycle; phosphorylated +S000037302 CDS YDR148C 4 755066 753675 C 2011-02-03 1996-07-31 +S000002557 ORF Verified YDR150W NUM1 PAC12 chromosome 4 L000001287 4 755628 763874 W 2011-02-03 1996-07-31 Protein required for nuclear migration; component of the mitochondria-ER-cortex-ancor (MECA); required for the association of mitochondria with the cell cortex and for accurate distribution of mitochondrial network; interacts with Mdm36p to link the ER and mitochondria at the cortex; localizes to the mother cell cortex and the bud tip; may mediate interactions of dynein and cytoplasmic microtubules with the cell cortex +S000031071 CDS YDR150W 4 755628 763874 W 2011-02-03 1996-07-31 +S000002556 ORF Dubious YDR149C chromosome 4 4 756262 755555 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene NUM1/YDR150W; null mutation blocks anaerobic growth +S000029951 CDS YDR149C 4 756262 755555 C 2011-02-03 1996-07-31 +S000002558 ORF Verified YDR151C CTH1 putative mRNA-binding protein CTH1 chromosome 4 L000002772 4 765155 764178 C 2011-02-03 1996-07-31 Member of the CCCH zinc finger family; similar to mammalian Tis11 protein, which activates transcription and also has a role in mRNA degradation; may function with Tis11p in iron homeostasis; CTH1 has a paralog, TIS11, that arose from the whole genome duplication +S000031106 CDS YDR151C 4 765155 764178 C 2011-02-03 1996-07-31 +S000002559 ORF Verified YDR152W GIR2 chromosome 4 4 765706 766503 W 2011-02-03 1996-07-31 Highly-acidic RWD domain-containing cytoplasmic protein; forms a highly conserved complex with Rbg2p that is responsible for efficient cell growth under amino acid starvation and binds translational activator Gcn1p in dose-dependent manner according to stress level; associates with translating ribosomes; intrinsically unstructured protein whose stability is enhanced upon binding Rbg2p +S000031232 CDS YDR152W 4 765706 766503 W 2011-02-03 1996-07-31 +S000002560 ORF Verified YDR153C ENT5 chromosome 4 4 767971 766736 C 2011-02-03 1996-07-31 Protein containing an N-terminal epsin-like domain; involved in clathrin recruitment and traffic between the Golgi and endosomes; associates with the clathrin adaptor Gga2p, clathrin adaptor complex AP-1, and clathrin +S000032164 CDS YDR153C 4 767971 766736 C 2011-02-03 1996-07-31 +S000002561 ORF Dubious YDR154C chromosome 4 4 768753 768403 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant exhibits synthetic phenotype with alpha-synuclein +S000032245 CDS YDR154C 4 768753 768403 C 2011-02-03 1996-07-31 +S000002562 ORF Verified YDR155C CPR1 peptidylprolyl isomerase CPR1|CPH1|CYP1 chromosome 4 L000002663 4 769000 768512 C 2011-02-03 1996-07-31 Cytoplasmic peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; binds the drug cyclosporin A; N-terminally propionylated in vivo; protein abundance increases in response to DNA replication stress +S000032345 CDS YDR155C 4 769000 768512 C 2011-02-03 1996-07-31 +S000002563 ORF Verified YDR156W RPA14 DNA-directed RNA polymerase I subunit RPA14|A14 chromosome 4 L000002883 4 769525 769938 W 2011-02-03 1996-07-31 RNA polymerase I subunit A14 +S000033241 CDS YDR156W 4 769525 769938 W 2011-02-03 1996-07-31 +S000002564 ORF Dubious YDR157W chromosome 4 4 769931 770332 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033302 CDS YDR157W 4 769931 770332 W 2011-02-03 1996-07-31 +S000002565 ORF Verified YDR158W HOM2 aspartate-semialdehyde dehydrogenase|THR2 chromosome 4 L000000799 4 770357 771454 W 92 2011-02-03 1996-07-31 Aspartic beta semi-aldehyde dehydrogenase; catalyzes the second step in the common pathway for methionine and threonine biosynthesis; expression regulated by Gcn4p and the general control of amino acid synthesis +S000033370 CDS YDR158W 4 770357 771454 W 2011-02-03 1996-07-31 +S000002566 ORF Verified YDR159W SAC3 LEP1 chromosome 4 L000001792 4 771877 775782 W 92 2011-02-03 1996-07-31 mRNA export factor; required for biogenesis of the small ribosomal subunit; component of TREX-2 complex (Sac3p-Thp1p-Sus1p-Cdc31p) involved in transcription elongation and mRNA export from the nucleus; involved in post-transcriptional tethering of active genes to the nuclear periphery and to non-nascent mRNP; similar to the human germinal center-associated nuclear protein (GANP) +S000034282 CDS YDR159W 4 771877 775782 W 2011-02-03 1996-07-31 +S000002567 ORF Verified YDR160W SSY1 RAA1|SHR10 chromosome 4 L000004190|L000003184|S000029399|L000001553 4 776163 778721 W 92 2011-02-03 1996-07-31 Component of the SPS plasma membrane amino acid sensor system; senses external amino acid concentration and transmits intracellular signals that result in regulation of expression of amino acid permease genes; other members are Ssy1p, Ptr3p, and Ssy5p +S000034346 CDS YDR160W 4 776163 778721 W 2011-02-03 1996-07-31 +S000002568 ORF Verified YDR161W ACL4 chromosome 4 L000004169 4 779043 780206 W 2011-02-03 1996-07-31 Specific assembly chaperone for ribosomal protein Rpl4p; binds to an evolutionarily conserved surface extension of nascent Rpl4p and chaperones Rpl4p until its assembly into the pre-ribosome; transcriptionally co-regulated with rRNA and ribosome biosynthesis genes +S000035308 CDS YDR161W 4 779043 780206 W 2011-02-03 1996-07-31 +S000002569 ORF Verified YDR162C NBP2 chromosome 4 L000002861 4 781100 780390 C 2011-02-03 1996-07-31 Protein involved in the HOG (high osmolarity glycerol) pathway; negatively regulates Hog1p by recruitment of phosphatase Ptc1p the Pbs2p-Hog1p complex; interacts with Bck1p and down regulates the cell wall integrity pathway; found in the nucleus and cytoplasm, contains an SH3 domain and a Ptc1p binding domain (PBM) +S000035337 CDS YDR162C 4 781100 780390 C 2011-02-03 1996-07-31 +S000002570 ORF Verified YDR163W CWC15 U2-type spliceosomal complex subunit CWC15 chromosome 4 4 781423 781950 W 2011-02-03 1996-07-31 Non-essential protein involved in pre-mRNA splicing; component of a complex containing Cef1p; has similarity to S. pombe Cwf15p +S000035446 CDS YDR163W 4 781423 781950 W 2011-02-03 1996-07-31 +S000002571 ORF Verified YDR164C SEC1 chromosome 4 L000001827 4 784215 782041 C 94.77 2011-02-03 1996-07-31 Sm-like protein involved in docking and fusion of exocytic vesicles; binds to assembled SNARE complexes at the membrane and stimulates membrane fusion; localization to sites of secretion (bud neck and bud tip) is dependent on SNARE function; interacts directly with essential exocyst subunit Sec6p +S000035467 CDS YDR164C 4 784215 782041 C 2011-02-03 1996-07-31 +S000002572 ORF Verified YDR165W TRM82 chromosome 4 4 784871 786205 W 2011-02-03 1996-07-31 Catalytic subunit of a tRNA methyltransferase complex; Trm8p and Trm82p comprise an enzyme that catalyzes a methyl-transfer from S-adenosyl-l-methionine to the N(7) atom of guanine at position 46 in tRNA; Trm8 lacks catalytic activity if not bound to Trm82p; relocalizes to the cytosol in response to hypoxia; mutation in human ortholog WDR4 causes microcephalic primordial dwarfism +S000035563 CDS YDR165W 4 784871 786205 W 2011-02-03 1996-07-31 +S000002573 ORF Verified YDR166C SEC5 exocyst subunit SEC5 chromosome 4 L000001831 4 789221 786306 C 95 2011-02-03 1996-07-31 Essential 107kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion; involved in assembly of the exocyst complex; required with Sec3p for ER inheritance where it promotes anchoring of the cortical ER at the bud tip +S000035593 CDS YDR166C 4 789221 786306 C 2011-02-03 1996-07-31 +S000002574 ORF Verified YDR167W TAF10 TafII25|TAF25|TAF23 chromosome 4 L000003460 4 789449 790069 W 2011-02-03 1996-07-31 Subunit (145 kDa) of TFIID and SAGA complexes; involved in RNA polymerase II transcription initiation and in chromatin modification +S000036558 CDS YDR167W 4 789449 790069 W 2011-02-03 1996-07-31 +S000002575 ORF Verified YDR168W CDC37 SMO1 chromosome 4 L000000273 4 790328 791848 W 95 2011-02-03 1996-07-31 Essential Hsp90p co-chaperone; necessary for passage through the START phase of the cell cycle; stabilizes protein kinase nascent chains and participates along with Hsp90p in their folding +S000036673 CDS YDR168W 4 790328 791848 W 2011-02-03 1996-07-31 +S000002576 ORF Verified YDR169C STB3 chromosome 4 L000002109 4 793889 792348 C 2011-02-03 1996-07-31 Ribosomal RNA processing element (RRPE)-binding protein; involved in the glucose-induced transition from quiescence to growth; restricted to nucleus in quiescent cells, released into cytoplasm after glucose repletion; binds Sin3p; relative distribution to the nucleus increases upon DNA replication stress +S000036712 CDS YDR169C 4 793889 792348 C 2011-02-03 1996-07-31 +S000028538 ORF Uncharacterized YDR169C-A chromosome 4 4 794723 794574 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031147 CDS YDR169C-A 4 794723 794574 C 2011-02-03 2003-07-29 +S000002577 ORF Verified YDR170C SEC7 Arf family guanine nucleotide exchange factor SEC7 chromosome 4 L000001833 4 802222 796193 C 96 2011-02-03 1996-07-31 Guanine nucleotide exchange factor (GEF) for ADP ribosylation factors; involved in proliferation of the Golgi, intra-Golgi transport and ER-to-Golgi transport; found in the cytoplasm and on Golgi-associated coated vesicles +S000036405 CDS YDR170C 4 802222 796193 C 2011-02-03 1996-07-31 +S000006695 tRNA_gene tQ(UUG)D3 chromosome 4 L000003783 4 802802 802731 C 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034813 noncoding_exon tQ(UUG)D3 4 802802 802731 C 2011-02-03 2000-05-19 +S000006865 long_terminal_repeat YDRWdelta11 chromosome 4 4 802905 803235 W 2011-02-03 2000-05-19 Ty1 LTR +S000007227 transposable_element_gene YDR170W-A gag protein chromosome 4 4 803195 804517 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag; YDR170W-A is part of a mutant retrotransposon; distribution in the cytoplasm becomes irregular rather than punctate upon DNA replication stress +S000036096 CDS YDR170W-A 4 803195 804517 W 2011-02-03 1999-07-17 +S000118439 ARS ARS425 ARSIV-806 chromosome 4 4 806052 806277 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178074 ARS_consensus_sequence ARS425 4 806099 806115 W 2014-11-18 2014-11-18 +S000002578 ORF Verified YDR171W HSP42 heat shock protein HSP42 chromosome 4 L000003095 4 806621 807748 W 2011-02-03 1996-07-31 Small heat shock protein (sHSP) with chaperone activity; forms barrel-shaped oligomers that suppress unfolded protein aggregation; involved in cytoskeleton reorganization after heat shock; protein abundance increases and forms cytoplasmic foci in response to DNA replication stress +S000030208 CDS YDR171W 4 806621 807748 W 2011-02-03 1996-07-31 +S000002579 ORF Verified YDR172W SUP35 translation termination factor GTPase eRF3|eRF3|[PSI(+)]|[PSI]|SUP36|SUP2|SUF12|SAL3|PNM2|GST1 chromosome 4 L000002200 4 808324 810381 W 142.87 2011-02-03 1996-07-31 Translation termination factor eRF3; has a role in mRNA deadenylation and decay; altered protein conformation creates the [PSI(+)] prion that modifies cellular fitness, alters translational fidelity by affecting reading frame selection, and results in a nonsense suppressor phenotype; many stress-response genes are repressed in the presence of [PSI(+)] +S000030332 CDS YDR172W 4 808324 810381 W 2011-02-03 1996-07-31 +S000002580 ORF Verified YDR173C ARG82 inositol polyphosphate multikinase|ARGRIII|IPK2|ARGR3 chromosome 4 L000002727 4 811632 810565 C 95 2011-02-03 1996-07-31 Inositol polyphosphate multikinase (IPMK); sequentially phosphorylates Ins(1,4,5)P3 to form Ins(1,3,4,5,6)P5; also has diphosphoinositol polyphosphate synthase activity; regulates arginine-, phosphate-, and nitrogen-responsive genes +S000030416 CDS YDR173C 4 811632 810565 C 2011-02-03 1996-07-31 +S000002581 ORF Verified YDR174W HMO1 HSM2 chromosome 4 L000003234 4 812110 812850 W 2011-02-03 1996-07-31 Chromatin associated high mobility group (HMG) family member; involved in compacting, bending, bridging and looping DNA; rDNA-binding component that regulates transcription from RNA polymerase I promoters; regulates start site selection of ribosomal protein genes via RNA polymerase II promoters; role in genome maintenance; associates with a 5'-3' DNA helicase and Fpr1p, a prolyl isomerase; relocalizes to the cytosol in response to hypoxia +S000031344 CDS YDR174W 4 812110 812850 W 2011-02-03 1996-07-31 +S000002582 ORF Verified YDR175C RSM24 mitochondrial 37S ribosomal protein RSM24 chromosome 4 4 814152 813193 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000031376 CDS YDR175C 4 814152 813193 C 2011-02-03 1996-07-31 +S000002583 ORF Verified YDR176W NGG1 histone acetyltransferase NGG1|SWI7|ADA3 chromosome 4 L000001241 4 814452 816560 W 2011-02-03 1996-07-31 Subunit of chromatin modifying histone acetyltransferase complexes; member of the ADA complex, the SAGA complex, and the SLIK complex; transcriptional regulator involved in glucose repression of Gal4p-regulated genes +S000031512 CDS YDR176W 4 814452 816560 W 2011-02-03 1996-07-31 +S000002584 ORF Verified YDR177W UBC1 E2 ubiquitin-conjugating protein UBC1 chromosome 4 L000002406 4 816878 817525 W 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme; key E2 partner with Ubc4p for the anaphase-promoting complex (APC); mediates selective degradation of short-lived and abnormal proteins; plays a role in vesicle biogenesis and ER-associated protein degradation (ERAD); component of the cellular stress response; protein abundance increases in response to DNA replication stress key E2 partner with Ubc4p for the anaphase-promoting complex (APC) +S000031590 CDS YDR177W 4 816878 817525 W 2011-02-03 1996-07-31 +S000002585 ORF Verified YDR178W SDH4 succinate dehydrogenase membrane anchor subunit SDH4|ACN18 chromosome 4 L000001826 4 817950 818495 W 2011-02-03 1996-07-31 Membrane anchor subunit of succinate dehydrogenase (SDH); involved in coupling the oxidation of succinate to the transfer of electrons to ubiquinone as part of the TCA cycle and the mitochondrial respiratory chain; has similarity to human SDH subunit D (SDHD), which is implicated in paraganglioma +S000032569 CDS YDR178W 4 817950 818495 W 2011-02-03 1996-07-31 +S000002586 ORF Verified YDR179C CSN9 chromosome 4 S000007578 4 819196 818708 C 2011-02-03 1996-07-31 Subunit of the Cop9 signalosome; Cop9 signalosome is required for deneddylation, or removal of the ubiquitin-like protein Rub1p from Cdc53p (cullin); involved in adaptation to pheromone signaling +S000032647 CDS YDR179C 4 819196 818708 C 2011-02-03 1996-07-31 +S000002587 ORF Verified YDR179W-A NVJ3 chromosome 4 4 819433 820824 W 2011-02-03 2004-07-21|1996-07-31 Protein with a potential role in tethering ER and vacuoles; localizes to nucleus-vacuole junctions in an Mdm1p-dependent manner; contains a lipid-binding PXA domain +S000037444 CDS YDR179W-A 4 819433 820824 W 2011-02-03 2004-07-21|1996-07-31 +S000002588 ORF Verified YDR180W SCC2 cohesin-loading factor complex subunit SCC2 chromosome 4 L000004262 4 821295 825776 W 2011-02-03 1996-07-31 Subunit of cohesin loading factor (Scc2p-Scc4p); a complex required for loading of cohesin complexes onto chromosomes; involved in establishing sister chromatid cohesion during DSB repair via histone H2AX; promotes gene expression program that supports translational fidelity; evolutionarily-conserved adherin; relocalizes to cytosol in response to hypoxia; human disorder Cornelia de Lange syndrome is caused by mutations in NIPBL, the human ortholog of SCC2 +S000034456 CDS YDR180W 4 821295 825776 W 2011-02-03 1996-07-31 +S000002589 ORF Verified YDR181C SAS4 chromosome 4 L000004214 4 827355 825910 C 2011-02-03 1996-07-31 Subunit of the SAS complex (Sas2p, Sas4p, Sas5p); acetylates free histones and nucleosomes and regulates transcriptional silencing; required for the HAT activity of Sas2p +S000034496 CDS YDR181C 4 827355 825910 C 2011-02-03 1996-07-31 +S000002590 ORF Verified YDR182W CDC1 putative lipid phosphatase CDC1|ESP2|DSR1|DSC1 chromosome 4 L000000241 4 827582 829057 W 2011-02-03 1996-07-31 Putative mannose-ethanolamine phosphate phosphodiesterase; involved in GPI-anchor remodeling prior to the attachment of cell wall proteins to beta 1,3-glucan, removing ethanolamine phosphate from the first mannose of GPI anchors; mutants display elevated Ca2+-dependent signaling resulting in secondary actin polarization and Golgi inheritance defects; enzyme is Mn2+-dependent; mutants have cell division cycle defect and fragile cell walls +S000034637 CDS YDR182W 4 827582 829057 W 2011-02-03 1996-07-31 +S000028539 ORF Uncharacterized YDR182W-A chromosome 4 4 829151 829354 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031148 CDS YDR182W-A 4 829151 829354 W 2011-02-03 2003-07-29 +S000002591 ORF Verified YDR183W PLP1 chromosome 4 L000003424 4 829585 830277 W 2011-02-03 1996-07-31 Protein that interacts with CCT (chaperonin containing TCP-1) complex; has a role in actin and tubulin folding; has weak similarity to phosducins, which are G-protein regulators +S000034709 CDS YDR183W 4 829585 830277 W 2011-02-03 1996-07-31 +S000028540 ORF Dubious YDR183C-A chromosome 4 4 830654 830397 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR +S000031190 CDS YDR183C-A 4 830654 830397 C 2011-02-03 2003-07-29 +S000002592 ORF Verified YDR184C ATC1 LIC4 chromosome 4 L000004405 4 831513 830629 C 2011-02-03 1996-07-31 Nuclear protein; possibly involved in regulation of cation stress responses and/or in the establishment of bipolar budding pattern; relative distribution to the nucleus decreases upon DNA replication stress +S000034749 CDS YDR184C 4 831513 830629 C 2011-02-03 1996-07-31 +S000002593 ORF Verified YDR185C UPS3 GEP2 chromosome 4 4 832473 831934 C 2011-02-03 1996-07-31 Mitochondrial protein of unknown function; similar to Ups1p and Ups2p which are involved in regulation of mitochondrial cardiolipin and phosphatidylethanolamine levels; null is viable but interacts synthetically with ups1 and ups2 mutations; UPS3 has a paralog, UPS2, that arose from the whole genome duplication +S000035675 CDS YDR185C 4 832473 831934 C 2011-02-03 1996-07-31 +S000002594 ORF Verified YDR186C SND1 chromosome 4 4 835492 832859 C 2011-02-03 1996-07-31 Protein involved in SRP-independent targeting of substrates to the ER; component of an alternative ER targeting pathway that has partial functional redundancy with the GET pathway; preference for substrates with downstream transmembrane domains; interacts with Env10p/Snd2p and Pho88p/Snd3p; can compensate for loss of SRP; may interact with ribosomes, based on co-purification experiments; GFP-fusion protein localizes to the cytoplasm +S000035744 CDS YDR186C 4 835492 832859 C 2011-02-03 1996-07-31 +S000002596 ORF Verified YDR188W CCT6 chaperonin-containing T-complex subunit CCT6|TCP20|TCP6|HTR3 chromosome 4 L000002271 4 836421 838061 W 2011-02-03 1996-07-31 Subunit of the cytosolic chaperonin Cct ring complex; related to Tcp1p, essential protein that is required for the assembly of actin and tubulins in vivo; contains an ATP-binding motif +S000036804 CDS YDR188W 4 836421 838061 W 2011-02-03 1996-07-31 +S000002595 ORF Dubious YDR187C chromosome 4 4 836746 836228 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified, essential ORF CCT6/YDR188W +S000035828 CDS YDR187C 4 836746 836228 C 2011-02-03 1996-07-31 +S000002597 ORF Verified YDR189W SLY1 syntaxin-binding protein chromosome 4 L000001923 4 838392 840392 W 2011-02-03 1996-07-31 Hydrophilic protein involved in ER/Golgi vesicle trafficking; SM (Sec1/Munc-18) family protein that binds the tSNARE Sed5p and stimulates its assembly into a trans-SNARE membrane-protein complex +S000036882 CDS YDR189W 4 838392 840392 W 2011-02-03 1996-07-31 +S000002598 ORF Verified YDR190C RVB1 RuvB family ATP-dependent DNA helicase pontin|TIP49|TIH1|TIP49A chromosome 4 S000007843 4 841995 840604 C 2011-02-03 1996-07-31 ATP-dependent DNA helicase, also known as pontin; member of the AAA+ and RuvB-like protein families; similar to Rvb2p; conserved component of multiple complexes including the INO80 complex, the Swr1 complex, and the R2TP complex (Rvb1-Rvb2-Tah1-Pih1); involved in multiple processes such as chromatin remodeling, box C/D snoRNP assembly, and RNA polymerase II assembly +S000036562 CDS YDR190C 4 841995 840604 C 2011-02-03 1996-07-31 +S000002599 ORF Verified YDR191W HST4 NAD-dependent histone deacetylase HST4 chromosome 4 L000003043 4 842337 843449 W 2011-02-03 1996-07-31 NAD(+)-dependent protein deacetylase; deacetylation targets are primarily mitochondrial proteins; involved along with Hst3p in silencing at telomeres, cell cycle progression, radiation resistance, genomic stability and short-chain fatty acid metabolism; accumulates in mitochondria in response to biotin starvation and may link biotin metabolism with energy homeostasis; member of the Sir2 family and may be the functional equivalent of human SIRT3 +S000036688 CDS YDR191W 4 842337 843449 W 2011-02-03 1996-07-31 +S000002601 ORF Dubious YDR193W chromosome 4 4 844554 844952 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030657 CDS YDR193W 4 844554 844952 W 2011-02-03 1996-07-31 +S000002600 ORF Verified YDR192C NUP42 FG-nucleoporin NUP42|UIP1|RIP1 chromosome 4 L000002940 4 844861 843569 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; also part of the nuclear pore complex (NPC) cytoplasmic filaments; contributes directly to nucleocytoplasmic transport and maintenance of the NPC permeability barrier and is involved in gene tethering at the nuclear periphery; interacts with Gle1p +S000036723 CDS YDR192C 4 844861 843569 C 2011-02-03 1996-07-31 +S000002602 ORF Verified YDR194C MSS116 ATP-dependent RNA helicase chromosome 4 L000001206 4 847946 845952 C 2011-02-03 1996-07-31 Mitochondrial transcription elongation factor; DEAD-box protein; required for efficient splicing of mitochondrial Group I and II introns; non-polar RNA helicase that also facilities strand annealing; promotes RNA folding by stabilizing an early assembly intermediate +S000030696 CDS YDR194C 4 847946 845952 C 2011-02-03 1996-07-31 +S000028541 ORF Uncharacterized YDR194W-A chromosome 4 4 848071 848223 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031191 CDS YDR194W-A 4 848071 848223 W 2011-02-03 2003-07-29 +S000002603 ORF Verified YDR195W REF2 RNA-processing protein REF2 chromosome 4 L000002661 4 848599 850200 W 2011-02-03 1996-07-31 RNA-binding protein; involved in the cleavage step of mRNA 3'-end formation prior to polyadenylation, and in snoRNA maturation; part of holo-CPF subcomplex APT, which associates with 3'-ends of snoRNA- and mRNA-encoding genes; putative regulatory subunit of type 1 protein phosphatase Glc7p, required for actomyosin ring formation, and for timely dephosphorylation and release of Bnr1p from the division site; relocalizes to the cytosol in response to hypoxia +S000030881 CDS YDR195W 4 848599 850200 W 2011-02-03 1996-07-31 +S000002604 ORF Verified YDR196C CAB5 putative dephospho-CoA kinase chromosome 4 4 850999 850274 C 2011-02-03 1996-07-31 Subunit of the CoA-Synthesizing Protein Complex (CoA-SPC); subunits of this complex are: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p; probable dephospho-CoA kinase (DPCK) that catalyzes the last step in coenzyme A biosynthesis; null mutant lethality is complemented by human homolog DCAKD and by E. coli coaE (encoding DPCK); detected in purified mitochondria in high-throughput studies; also localized to lipid droplets +S000031739 CDS YDR196C 4 850999 850274 C 2011-02-03 1996-07-31 +S000002605 ORF Verified YDR197W CBS2 CBP7 chromosome 4 L000000231 4 851228 852397 W 2011-02-03 1996-07-31 Mitochondrial translational activator of the COB mRNA; interacts with translating ribosomes, acts on the COB mRNA 5'-untranslated leader +S000032020 CDS YDR197W 4 851228 852397 W 2011-02-03 1996-07-31 +S000002606 ORF Verified YDR198C RKM2 protein-lysine N-methyltransferase chromosome 4 4 853972 852533 C 2011-02-03 1996-07-31 Ribosomal protein lysine methyltransferase; responsible for trimethylation of the lysine residue at position 3 of Rpl12Ap and Rpl12Bp +S000032059 CDS YDR198C 4 853972 852533 C 2011-02-03 1996-07-31 +S000002607 ORF Dubious YDR199W chromosome 4 4 854175 854540 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene VPS64/YDR200C; computationally predicted to have thiol-disulfide oxidoreductase activity +S000033057 CDS YDR199W 4 854175 854540 W 2011-02-03 1996-07-31 +S000002608 ORF Verified YDR200C VPS64 FAR9 chromosome 4 4 856093 854279 C 2011-02-03 1996-07-31 Protein required for cytoplasm to vacuole targeting of proteins; forms a complex with Far3p and Far7p to Far11p involved in recovery from pheromone-induced cell cycle arrest; mutant has increased aneuploidy tolerance; VPS64 has a paralog, FAR10, that arose from the whole genome duplication +S000037661 CDS YDR200C 4 856093 854279 C 2011-02-03 1996-07-31 +S000002609 ORF Verified YDR201W SPC19 chromosome 4 L000004693 4 856317 856814 W 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; also localized to nuclear side of spindle pole body +S000030528 CDS YDR201W 4 856317 856814 W 2011-02-03 1996-07-31 +S000002611 ORF Dubious YDR203W chromosome 4 4 857682 857999 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF RAV2/YDR202C +S000030685 CDS YDR203W 4 857682 857999 W 2011-02-03 1996-07-31 +S000002610 ORF Verified YDR202C RAV2 chromosome 4 4 857953 856898 C 2011-02-03 1996-07-31 Subunit of RAVE complex (Rav1p, Rav2p, Skp1p); the RAVE complex associates with the V1 domain of the vacuolar membrane (H+)-ATPase (V-ATPase) and promotes assembly and reassembly of the holoenzyme +S000030555 CDS YDR202C 4 857953 856898 C 2011-02-03 1996-07-31 +S000002612 ORF Verified YDR204W COQ4 ubiquinone biosynthesis protein COQ4 chromosome 4 L000003957 4 858137 859144 W 2011-02-03 1996-07-31 Protein with a role in ubiquinone (Coenzyme Q) biosynthesis; possibly functioning in stabilization of Coq7p; located on matrix face of mitochondrial inner membrane; component of a mitochondrial ubiquinone-synthesizing complex; human homolog COQ4 can complement yeast coq4 null mutant +S000030757 CDS YDR204W 4 858137 859144 W 2011-02-03 1996-07-31 +S000002613 ORF Verified YDR205W MSC2 metal cation transporter MSC2 chromosome 4 4 859346 861520 W 2011-02-03 2003-09-22|1996-07-31 Endoplasmic reticulum zinc transporter; part of a heterodimeric transporter with Zrg17p that transfers zinc from the cytosol to the ER lumen; member of the cation diffusion facilitator family of efflux pumps; localizes to ER and nucleus; mutations affect the cellular distribution of zinc and also confer defects in meiotic recombination between homologous chromatids +S000031604 CDS YDR205W 4 859346 861520 W 2011-02-03 2003-09-22|1996-07-31 +S000002614 ORF Verified YDR206W EBS1 chromosome 4 L000004629 4 862054 864708 W 2011-02-03 1996-07-31 Protein involved in translation inhibition and nonsense-mediated decay; interacts with cap binding protein Cdc33p and with Nam7p; localizes to P-bodies upon glucose starvation; mRNA abundance regulated by mRNA decay factors; EBS1 has a paralog, EST1, that arose from the whole genome duplication +S000031711 CDS YDR206W 4 862054 864708 W 2011-02-03 1996-07-31 +S000002615 ORF Verified YDR207C UME6 DNA-binding transcriptional regulator UME6|RIM16|NIM2|CAR80 chromosome 4 L000002426 4 867522 865012 C 2011-02-03 1996-07-31 Rpd3L histone deacetylase complex subunit; key transcriptional regulator of early meiotic genes; involved in chromatin remodeling and transcriptional repression via DNA looping; binds URS1 upstream regulatory sequence, represses transcription by recruiting conserved histone deacetylase Rpd3p (through co-repressor Sin3p) and chromatin-remodeling factor Isw2p; couples metabolic responses to nutritional cues with initiation and progression of meiosis, forms compl +S000031768 CDS YDR207C 4 867522 865012 C 2011-02-03 1996-07-31 +S000002616 ORF Verified YDR208W MSS4 1-phosphatidylinositol-4-phosphate 5-kinase chromosome 4 L000001203 4 868224 870563 W 2011-02-03 1996-07-31 Phosphatidylinositol-4-phosphate 5-kinase; involved in actin cytoskeleton organization and cell morphogenesis; multicopy suppressor of stt4 mutation +S000031959 CDS YDR208W 4 868224 870563 W 2011-02-03 1996-07-31 +S000002618 ORF Uncharacterized YDR210W chromosome 4 4 871074 871301 W 2011-02-03 1996-07-31 Predicted tail-anchored plasma membrane protein; contains a conserved CYSTM module; related proteins in other organisms may be involved in response to stress; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery +S000034858 CDS YDR210W 4 871074 871301 W 2011-02-03 1996-07-31 +S000002617 ORF Uncharacterized YDR209C chromosome 4 4 871449 871036 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR209C is not an essential gene; partially overlaps uncharacterized gene YDR210W +S000032797 CDS YDR209C 4 871449 871036 C 2011-02-03 1996-07-31 +S000006867 long_terminal_repeat YDRWdelta13 chromosome 4 4 871821 872152 W 2011-02-03 2000-05-19 Ty1 LTR +S000006884 LTR_retrotransposon YDRWTy2-2 Ty2 chromosome 4 4 871821 877779 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007392 transposable_element_gene YDR210W-A gag protein chromosome 4 4 872112 873428 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000029817 CDS YDR210W-A 4 872112 873428 W 2011-02-03 1999-07-17 +S000007393 transposable_element_gene YDR210W-B gag-pol fusion protein chromosome 4 4 872112 877425 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000029819 CDS YDR210W-B 4 872112 873404 W 2011-02-03 1999-07-17 +S000029820 CDS YDR210W-B 4 873406 877425 W 2011-02-03 1999-07-17 +S000029821 plus_1_translational_frameshift YDR210W-B 4 873405 873405 W 2011-02-03 1999-07-17 +S000006868 long_terminal_repeat YDRWdelta14 chromosome 4 4 877448 877779 W 2011-02-03 2000-05-19 Ty1 LTR +S000007410 transposable_element_gene YDR210C-D gag-pol fusion protein|YDR210W-D chromosome 4 4 883927 878659 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000029824 CDS YDR210C-D 4 882621 878659 C 2011-02-03 1999-07-17 +S000029823 CDS YDR210C-D 4 883927 882623 C 2011-02-03 1999-07-17 +S000029825 plus_1_translational_frameshift YDR210C-D 4 882622 882622 C 2011-02-03 1999-07-17 +S000007409 transposable_element_gene YDR210C-C gag protein|YDR210W-C chromosome 4 4 883927 882605 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000029822 CDS YDR210C-C 4 883927 882605 C 2011-02-03 1999-07-17 +S000006860 LTR_retrotransposon YDRCTy1-2 Ty1 chromosome 4 4 884220 878303 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006613 tRNA_gene tI(UAU)D chromosome 4 L000003769 4 884361 884493 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000035113 intron tI(UAU)D 4 884398 884457 W 2011-02-03 2000-05-19 +S000035111 noncoding_exon tI(UAU)D 4 884361 884397 W 2011-02-03 2000-05-19 +S000035112 noncoding_exon tI(UAU)D 4 884458 884493 W 2011-02-03 2000-05-19 +S000002619 ORF Verified YDR211W GCD6 translation initiation factor eIF2B catalytic subunit epsilon chromosome 4 L000000674 4 884727 886865 W 2011-02-03 1996-07-31 Catalytic epsilon subunit of the translation initiation factor eIF2B; eIF2B is the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression; forms cytoplasmic foci upon DNA replication stress +S000034999 CDS YDR211W 4 884727 886865 W 2011-02-03 1996-07-31 +S000002620 ORF Verified YDR212W TCP1 chaperonin-containing T-complex alpha subunit TCP1|CCT1 chromosome 4 L000002267 4 887232 888911 W 127 2011-02-03 1996-07-31 Alpha subunit of chaperonin-containing T-complex; complex mediates protein folding in the cytosol; involved in actin cytoskeleton maintenance; overexpression in neurons suppresses formation of pathogenic conformations of huntingtin protein +S000035134 CDS YDR212W 4 887232 888911 W 2011-02-03 1996-07-31 +S000002621 ORF Verified YDR213W UPC2 MOX4 chromosome 4 4 889751 892492 W 2011-02-03 1996-07-31 Sterol regulatory element binding protein; induces sterol biosynthetic genes, upon sterol depletion; acts as a sterol sensor, binding ergosterol in sterol rich conditions; relocates from intracellular membranes to perinuclear foci upon sterol depletion; redundant activator of filamentation with ECM22, up-regulating the expression of filamentous growth genes; contains a Zn[2]-Cys[6] binuclear cluster; UPC2 has a paralog, ECM22, that arose from the whole genome duplication +S000036022 CDS YDR213W 4 889751 892492 W 2011-02-03 1996-07-31 +S000002622 ORF Verified YDR214W AHA1 chromosome 4 4 892875 893927 W 2011-02-03 1996-07-31 Co-chaperone that binds Hsp82p and activates its ATPase activity; plays a role in determining prion variants; similar to Hch1p; expression is regulated by stresses such as heat shock; protein abundance increases in response to DNA replication stress +S000036092 CDS YDR214W 4 892875 893927 W 2011-02-03 1996-07-31 +S000002623 ORF Dubious YDR215C chromosome 4 4 894502 894089 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant displays elevated sensitivity to expression of a mutant huntingtin fragment or of alpha-synuclein +S000036137 CDS YDR215C 4 894502 894089 C 2011-02-03 1996-07-31|2011-02-03 +S000002624 ORF Verified YDR216W ADR1 DNA-binding transcription factor ADR1 chromosome 4 L000000050 4 895035 899006 W 125 2011-02-03 1996-07-31 Carbon source-responsive zinc-finger transcription factor; required for transcription of the glucose-repressed gene ADH2, of peroxisomal protein genes, and of genes required for ethanol, glycerol, and fatty acid utilization +S000036296 CDS YDR216W 4 895035 899006 W 2011-02-03 1996-07-31 +S000130175 ARS ARS427 chromosome 4 4 899051 899596 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000002625 ORF Verified YDR217C RAD9 chromatin-binding protein RAD9 chromosome 4 L000001562 4 903480 899551 C 126 2011-02-03 1996-07-31 DNA damage-dependent checkpoint protein; required for cell-cycle arrest in G1/S, intra-S, and G2/M, plays a role in postreplication repair (PRR) pathway; transmits checkpoint signal by activating Rad53p and Chk1p; hyperphosphorylated by Mec1p and Tel1p; multiple cyclin dependent kinase consensus sites and the C-terminal BRCT domain contribute to DNA damage checkpoint activation; Rad9p Chk1 Activating Domain (CAD) is phosphorylated at multiple sites by Cdc28p/Clb2p +S000036338 CDS YDR217C 4 903480 899551 C 2011-02-03 1996-07-31 +S000002626 ORF Verified YDR218C SPR28 septin SPR28 chromosome 4 L000004150 4 905052 903781 C 2011-02-03 1996-07-31 Sporulation-specific homolog of the CDC3/10/11/12 family of genes; meiotic septin expressed at high levels during meiotic divisions and ascospore formation; the yeast CDC3/10/11/12 family is a family of bud neck microfilament genes +S000037012 CDS YDR218C 4 905052 903781 C 2011-02-03 1996-07-31 +S000002627 ORF Verified YDR219C MFB1 chromosome 4 4 906852 905455 C 2011-02-03 1996-07-31 Mitochondria-associated F-box protein; involved in maintenance of normal mitochondrial morphology; interacts with Skp1p through the F-box motif; preferentially localizes to the mother cell during budding +S000037083 CDS YDR219C 4 906852 905455 C 2011-02-03 1996-07-31 +S000002628 ORF Dubious YDR220C chromosome 4 4 907293 907000 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; null mutant exhibits synthetic phenotype with alpha-synuclein +S000037911 CDS YDR220C 4 907293 907000 C 2011-02-03 1996-07-31 +S000002629 ORF Verified YDR221W GTB1 chromosome 4 4 907330 909438 W 2011-02-03 1996-07-31 Glucosidase II beta subunit, forms a complex with alpha subunit Rot2p; involved in removal of two glucose residues from N-linked glycans during glycoprotein biogenesis in the ER; relocalizes from ER to cytoplasm upon DNA replication stress +S000029995 CDS YDR221W 4 907330 909438 W 2011-02-03 1996-07-31 +S000002630 ORF Uncharacterized YDR222W chromosome 4 4 910054 911301 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; YDR222W has a paralog, YLR225C, that arose from the whole genome duplication +S000030976 CDS YDR222W 4 910054 911301 W 2011-02-03 1996-07-31 +S000002631 ORF Verified YDR223W CRF1 chromosome 4 4 912099 913502 W 2011-02-03 1996-07-31 Transcriptional corepressor; involved in repression of ribosomal protein (RP) gene transcription via the TOR signaling pathway which promotes accumulation of Crf1p in the nucleus; role in repression of RP genes varies by strain; CRF1 has a paralog, IFH1, that arose from the whole genome duplication +S000031073 CDS YDR223W 4 912099 913502 W 2011-02-03 1996-07-31 +S000118440 ARS ARS428 ARSIV-914 chromosome 4 4 913790 914038 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178075 ARS_consensus_sequence ARS428 4 913856 913872 W 2014-11-18 2014-11-18 +S000002632 ORF Verified YDR224C HTB1 histone H2B|SPT12 chromosome 4 L000000829 4 914712 914317 C 132 2011-02-03 1996-07-31 Histone H2B; core histone protein required for chromatin assembly and chromosome function; nearly identical to HTB2; Rad6p-Bre1p-Lge1p mediated ubiquitination regulates reassembly after DNA replication, transcriptional activation, meiotic DSB formation and H3 methylation +S000031108 CDS YDR224C 4 914712 914317 C 2011-02-03 1996-07-31 +S000002633 ORF Verified YDR225W HTA1 histone H2A|SPT11|H2A1 chromosome 4 L000000827 4 915530 915928 W 132 2011-02-03 1996-07-31 Histone H2A; core histone protein required for chromatin assembly and chromosome function; one of two nearly identical subtypes (see also HTA2); DNA damage-dependent phosphorylation by Mec1p facilitates DNA repair; acetylated by Nat4p; N-terminally propionylated in vivo +S000031234 CDS YDR225W 4 915530 915928 W 2011-02-03 1996-07-31 +S000002634 ORF Verified YDR226W ADK1 adenylate kinase ADK1|AKY2|AKY1 chromosome 4 L000000046 4 916486 917154 W 133 2011-02-03 1996-07-31 Adenylate kinase, required for purine metabolism; localized to the cytoplasm and the mitochondria; lacks cleavable signal sequence; protein abundance increases in response to DNA replication stress; mutations affecting Adk1p catalytic activity deregulate expression of phosphate utilization genes PHO5 and PHO84; human homolog AK1 can complement yeast adk1 mutant +S000032219 CDS YDR226W 4 916486 917154 W 2011-02-03 1996-07-31 +S000002635 ORF Verified YDR227W SIR4 chromatin-silencing protein SIR4|UTH2|STE9|ASD1 chromosome 4 L000001897 4 917571 921647 W 128 2011-02-03 1996-07-31 SIR protein involved in assembly of silent chromatin domains; silent information regulator (SIR) along with SIR2 and SIR3; involved in assembly of silent chromatin domains at telomeres and the silent mating-type loci; some alleles of SIR4 prolong lifespan; required for telomere hypercluster formation in quiescent yeast cells +S000032314 CDS YDR227W 4 917571 921647 W 2011-02-03 1996-07-31 +S000118441 ARS ARS429 ARSIV-922 chromosome 4 4 921692 921939 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178076 ARS_consensus_sequence ARS429 4 921736 921752 W 2014-11-18 2014-11-18 +S000002636 ORF Verified YDR228C PCF11 chromosome 4 L000004116 4 923806 921926 C 2011-02-03 1996-07-31 mRNA 3' end processing factor; essential component of cleavage and polyadenylation factor IA (CF IA), involved in pre-mRNA 3' end processing and in transcription termination; binds C-terminal domain of largest subunit of RNA pol II (Rpo21p); required for gene looping; relocalizes to the cytosol in response to hypoxia +S000032352 CDS YDR228C 4 923806 921926 C 2011-02-03 1996-07-31 +S000002637 ORF Verified YDR229W IVY1 chromosome 4 4 924785 926146 W 2011-02-03 1996-07-31 Phospholipid-binding protein that interacts with both Ypt7p and Vps33p; may partially counteract the action of Vps33p and vice versa, localizes to the rim of the vacuole as cells approach stationary phase +S000033246 CDS YDR229W 4 924785 926146 W 2011-02-03 1996-07-31 +S000002638 ORF Dubious YDR230W chromosome 4 4 926223 926570 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene COX20/YDR231C +S000034096 CDS YDR230W 4 926223 926570 W 2011-02-03 1996-07-31 +S000002639 ORF Verified YDR231C COX20 chromosome 4 S000007474 4 926910 926293 C 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; required for proteolytic processing of Cox2p and its assembly into cytochrome c oxidase +S000034128 CDS YDR231C 4 926910 926293 C 2011-02-03 1996-07-31 +S000002640 ORF Verified YDR232W HEM1 5-aminolevulinate synthase|OLE3|CYD1 chromosome 4 L000000760 4 927452 929098 W 2011-02-03 1996-07-31 5-aminolevulinate synthase; catalyzes the first step in the heme biosynthetic pathway; an N-terminal signal sequence is required for localization to the mitochondrial matrix; expression is regulated by Hap2p-Hap3p; has a pyridoxal phosphate cofactor whose insertion is mediated by Mcx1p +S000034287 CDS YDR232W 4 927452 929098 W 2011-02-03 1996-07-31 +S000002641 ORF Verified YDR233C RTN1 chromosome 4 4 930357 929470 C 2011-02-03 1996-07-31 Reticulon protein; involved in nuclear pore assembly and maintenance of tubular ER morphology; promotes membrane curvature; regulates the ER asymmetry-induced inheritance block during ER stress; role in ER-derived peroxisomal biogenesis; increases tubular ER when overexpressed; mutants have reduced phosphatidylserine transfer between the ER and mitochondria; interacts with exocyst subunit Sec6p, Yip3p, and Sbh1p; member of the RTNLA subfamily +S000034311 CDS YDR233C 4 930357 929470 C 2011-02-03 1996-07-31 +S000002642 ORF Verified YDR234W LYS4 homoaconitate hydratase LYS4|LYS3 chromosome 4 L000000966 4 931129 933210 W 145.87 2011-02-03 1996-07-31 Homoaconitase; catalyzes the conversion of homocitrate to homoisocitrate, which is a step in the lysine biosynthesis pathway +S000035310 CDS YDR234W 4 931129 933210 W 2011-02-03 1996-07-31 +S000002643 ORF Verified YDR235W PRP42 mRNA splicing protein PRP42|SNU65|MUD16 chromosome 4 L000003969 4 933504 935138 W 2011-02-03 1996-07-31 U1 snRNP protein involved in splicing; required for U1 snRNP biogenesis; contains multiple tetriatricopeptide repeats +S000035386 CDS YDR235W 4 933504 935138 W 2011-02-03 1996-07-31 +S000002644 ORF Verified YDR236C FMN1 riboflavin kinase chromosome 4 4 935892 935236 C 2011-02-03 1996-07-31 Riboflavin kinase, produces riboflavin monophosphate (FMN); FMN is a necessary cofactor for many enzymes; predominantly localizes to the microsomal fraction and also found in the mitochondrial inner membrane; human RFK functionally complements the lethality of the null mutation +S000035407 CDS YDR236C 4 935892 935236 C 2011-02-03 1996-07-31 +S000002645 ORF Verified YDR237W MRPL7 mitochondrial 54S ribosomal protein YmL7/YmL5|YmL7|YmL5 chromosome 4 L000002684 4 936615 937493 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; MRPL7 produces both YmL5 and YmL7, which are two different modified forms of the same protein +S000035502 CDS YDR237W 4 936615 937493 W 2011-02-03 1996-07-31 +S000002646 ORF Verified YDR238C SEC26 coatomer subunit beta chromosome 4 L000001847 4 940816 937895 C 2011-02-03 1996-07-31 Essential beta-coat protein of the COPI coatomer; involved in ER-to-Golgi protein trafficking and maintenance of normal ER morphology; shares 43% sequence identity with mammalian beta-coat protein (beta-COP) +S000035532 CDS YDR238C 4 940816 937895 C 2011-02-03 1996-07-31 +S000002647 ORF Verified YDR239C chromosome 4 4 943420 941057 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments +S000035595 CDS YDR239C 4 943420 941057 C 2011-02-03 1996-07-31 +S000002649 ORF Dubious YDR241W BUD26 chromosome 4 4 945151 945438 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 1% of ORF overlaps the verified gene SNU56; diploid mutant displays a weak budding pattern phenotype in a systematic assay +S000036282 CDS YDR241W 4 945151 945438 W 2011-02-03 1996-07-31 +S000002648 ORF Verified YDR240C SNU56 MUD10 chromosome 4 L000004362 4 945152 943674 C 2011-02-03 1996-07-31 Component of U1 snRNP required for mRNA splicing via spliceosome; yeast specific, no metazoan counterpart; interacts with mRNA in commitment complex +S000036072 CDS YDR240C 4 945152 943674 C 2011-02-03 1996-07-31 +S000006866 long_terminal_repeat YDRWdelta12 chromosome 4 4 945351 945673 W 2011-02-03 2000-05-19 Ty1 LTR +S000006857 long_terminal_repeat YDRCsigma3 chromosome 4 4 946295 945955 C 2011-02-03 2000-05-19 Ty3 LTR +S000006778 tRNA_gene tY(GUA)D SUP2 chromosome 4 L000003770 4 946312 946400 W 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000034661 intron tY(GUA)D 4 946351 946364 W 2011-02-03 2000-05-19 +S000034659 noncoding_exon tY(GUA)D 4 946312 946350 W 2011-02-03 2000-05-19 +S000034660 noncoding_exon tY(GUA)D 4 946365 946400 W 2011-02-03 2000-05-19 +S000002650 ORF Verified YDR242W AMD2 putative amidase chromosome 4 L000000083 4 946807 948456 W 2011-02-03 1996-07-31 Putative amidase +S000036363 CDS YDR242W 4 946807 948456 W 2011-02-03 1996-07-31 +S000002651 ORF Verified YDR243C PRP28 mRNA splicing protein PRP28 chromosome 4 L000001509 4 950284 948518 C 144.27 2011-02-03 1996-07-31 RNA binding protein; involved in RNA isomerization at the 5' splice site and for exchange of U6 for U1 snRNA at the 5' splice site; similar to the RNA helicases of the DEAD-box family +S000036406 CDS YDR243C 4 950284 948518 C 2011-02-03 1996-07-31 +S000002652 ORF Verified YDR244W PEX5 PAS10 chromosome 4 L000001342 4 950563 952401 W 2011-02-03 1996-07-31 Peroxisomal membrane signal receptor for peroxisomal matrix proteins; receptor for the C-terminal tripeptide signal sequence (PTS1) of peroxisomal matrix proteins; required for peroxisomal matrix protein import; also proposed to have PTS1-receptor independent functions +S000030212 CDS YDR244W 4 950563 952401 W 2011-02-03 1996-07-31 +S000002653 ORF Verified YDR245W MNN10 alpha-1,6-mannosyltransferase|REC41|SLC2|BED1 chromosome 4 L000002793|L000002853 4 952800 953981 W 2011-02-03 1996-07-31 Subunit of a Golgi mannosyltransferase complex; complex mediates elongation of the polysaccharide mannan backbone; membrane protein of the mannosyltransferase family; other members of the complex are Anp1p, Mnn9p, Mnn11p, and Hoc1p +S000030334 CDS YDR245W 4 952800 953981 W 2011-02-03 1996-07-31 +S000002654 ORF Verified YDR246W TRS23 TRAPP subunit TRS23 chromosome 4 S000007432 4 954288 954947 W 2011-02-03 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII); human homolog is TRAPPC4 +S000030489 CDS YDR246W 4 954288 954947 W 2011-02-03 1996-07-31 +S000028542 ORF Uncharacterized YDR246W-A chromosome 4 4 955133 955333 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031192 CDS YDR246W-A 4 955133 955333 W 2011-02-03 2003-07-29 +S000002655 ORF Verified YDR247W VHS1 putative serine/threonine protein kinase VHS1 chromosome 4 4 956013 957398 W 2011-02-03 1996-07-31 Cytoplasmic serine/threonine protein kinase; identified as a high-copy suppressor of the synthetic lethality of a sis2 sit4 double mutant, suggesting a role in G1/S phase progression; VHS1 has a paralog, SKS1, that arose from the whole genome duplication +S000031345 CDS YDR247W 4 956013 957398 W 2011-02-03 1996-07-31 +S000002656 ORF Uncharacterized YDR248C gluconokinase chromosome 4 4 958339 957758 C 2011-02-03 1996-07-31 Putative gluconokinase; sequence similarity to bacterial and human gluconokinase; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; upregulated by deletion of the RNAP-II associated factor, PAF1 +S000031382 CDS YDR248C 4 958339 957758 C 2011-02-03 1996-07-31 +S000002657 ORF Uncharacterized YDR249C chromosome 4 4 959802 958681 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000031491 CDS YDR249C 4 959802 958681 C 2011-02-03 1996-07-31 +S000002658 ORF Dubious YDR250C chromosome 4 4 960361 960086 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031286 CDS YDR250C 4 960361 960086 C 2011-02-03 1996-07-31 +S000002659 ORF Verified YDR251W PAM1 chromosome 4 L000001334 4 960614 963106 W 2011-02-03 1996-07-31 Essential protein of unknown function; exhibits variable expression during colony morphogenesis; overexpression permits survival without protein phosphatase 2A, inhibits growth, and induces a filamentous phenotype; PAM1 has a paralog, SVL3, that arose from the whole genome duplication +S000032340 CDS YDR251W 4 960614 963106 W 2011-02-03 1996-07-31 +S000002660 ORF Verified YDR252W BTT1 CCR4-NOT core subunit BTT1 chromosome 4 L000000195 4 963412 963861 W 2011-02-03 1996-07-31 Heterotrimeric nascent polypeptide-associated complex beta3 subunit; complex binds ribosomes via its beta-subunits in close proximity to nascent polypeptides; interacts with Caf130p of the CCR4-NOT complex; similar to human BTF3; BTT1 has a paralog, EGD1, that arose from the whole genome duplication +S000032433 CDS YDR252W 4 963412 963861 W 2011-02-03 1996-07-31 +S000002661 ORF Verified YDR253C MET32 chromosome 4 L000003470 4 964565 963990 C 2011-02-03 1996-07-31 Zinc-finger DNA-binding transcription factor; involved in transcriptional regulation of the methionine biosynthetic genes; targets strong transcriptional activator Met4p to promoters of sulfur metabolic genes; feedforward loop exists in the regulation of genes controlled by Met4p and Met32p; lack of such a loop for MET31 may account for the differential actions of Met32p and Met31p; MET32 has a paralog, MET31, that arose from the whole genome duplication +S000032479 CDS YDR253C 4 964565 963990 C 2011-02-03 1996-07-31 +S000002662 ORF Verified YDR254W CHL4 MCM17|CTF17 chromosome 4 L000000321 4 965113 966489 W 2011-02-03 1996-07-31 Outer kinetochore protein required for chromosome stability; involved in new kinetochore assembly and sister chromatid cohesion; forms a stable complex with Iml3p; peripheral component of the Ctf19 kinetochore complex that interacts with Ctf19p, Ctf3p, and Mif2p; required for the spindle assembly checkpoint; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-N and fission yeast mis15 +S000034580 CDS YDR254W 4 965113 966489 W 2011-02-03 1996-07-31 +S000002663 ORF Verified YDR255C RMD5 ubiquitin-protein ligase RMD5|GID2 chromosome 4 4 967822 966557 C 2011-02-03 1996-07-31 Component of GID Complex that confers ubiquitin ligase (U3) activity; necessary for polyubiquitination and degradation of the gluconeogenic enzyme fructose-1,6-bisphosphatase; forms dimer with Fyv10p that is then recruited to GID Complex by Gid8p; also required for sporulation; conserved protein that has a degenerate RING finger domain +S000034601 CDS YDR255C 4 967822 966557 C 2011-02-03 1996-07-31 +S000002664 ORF Verified YDR256C CTA1 catalase A chromosome 4 L000000428 4 969680 968133 C 2011-02-03 1996-07-31 Catalase A; breaks down hydrogen peroxide in the peroxisomal matrix formed by acyl-CoA oxidase (Pox1p) during fatty acid beta-oxidation +S000034671 CDS YDR256C 4 969680 968133 C 2011-02-03 1996-07-31 +S000002665 ORF Verified YDR257C RKM4 ribosomal lysine N-methyltransferase|SET7|RMS1 chromosome 4 L000003277 4 971474 969990 C 2011-02-03 1996-07-31 Ribosomal lysine methyltransferase; specific for monomethylation of Rpl42ap and Rpl42bp (lysine 55); nuclear SET-domain containing protein +S000034751 CDS YDR257C 4 971474 969990 C 2011-02-03 1996-07-31 +S000002666 ORF Verified YDR258C HSP78 chaperone ATPase HSP78 chromosome 4 L000000821 4 974243 971808 C 2011-02-03 1996-07-31 Oligomeric mitochondrial matrix chaperone; cooperates with Ssc1p in mitochondrial thermotolerance after heat shock; able to prevent the aggregation of misfolded proteins as well as resolubilize protein aggregates +S000035676 CDS YDR258C 4 974243 971808 C 2011-02-03 1996-07-31 +S000002667 ORF Verified YDR259C YAP6 HAL7 chromosome 4 L000004344 4 975782 974631 C 2011-02-03 1996-07-31 Basic leucine zipper (bZIP) transcription factor; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; overexpression increases sodium and lithium tolerance; computational analysis suggests a role in regulation of expression of genes involved in carbohydrate metabolism; YAP6 has a paralog, CIN5, that arose from the whole genome duplication +S000035746 CDS YDR259C 4 975782 974631 C 2011-02-03 1996-07-31 +S000002668 ORF Verified YDR260C SWM1 APC13 chromosome 4 L000004027 4 977229 976717 C 2011-02-03 1996-07-31 Subunit of the anaphase-promoting complex (APC); APC is an E3 ubiquitin ligase that regulates the metaphase-anaphase transition and exit from mitosis; required for activation of the daughter-specific gene expression and spore wall maturation +S000035460 CDS YDR260C 4 977229 976717 C 2011-02-03 1996-07-31 +S000002669 ORF Verified YDR261C EXG2 glucan exo-1,3-beta-glucosidase chromosome 4 L000000593 4 979209 977521 C 162 2011-02-03 1996-07-31 Exo-1,3-beta-glucanase; involved in cell wall beta-glucan assembly; may be anchored to the plasma membrane via a glycosylphosphatidylinositol (GPI) anchor +S000035548 CDS YDR261C 4 979209 977521 C 2011-02-03 1996-07-31 +S000006722 tRNA_gene tS(AGA)D2 chromosome 4 L000003774 4 981055 980974 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000031633 noncoding_exon tS(AGA)D2 4 981055 980974 C 2011-02-03 2000-05-19 +S000006869 long_terminal_repeat YDRWdelta19 chromosome 4 4 981171 981502 W 2011-02-03 2000-05-19 Ty1 LTR +S000006885 LTR_retrotransposon YDRWTy2-3 Ty2 chromosome 4 4 981171 987125 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007396 transposable_element_gene YDR261W-A gag protein chromosome 4 4 981462 982778 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034032 CDS YDR261W-A 4 981462 982778 W 2011-02-03 1999-07-17 +S000007397 transposable_element_gene YDR261W-B gag-pol fusion protein chromosome 4 4 981462 986775 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034034 CDS YDR261W-B 4 981462 982754 W 2011-02-03 1999-07-17 +S000034035 CDS YDR261W-B 4 982756 986775 W 2011-02-03 1999-07-17 +S000034036 plus_1_translational_frameshift YDR261W-B 4 982755 982755 W 2011-02-03 1999-07-17 +S000006870 long_terminal_repeat YDRWdelta20 chromosome 4 4 986794 987125 W 2011-02-03 2000-05-19 Ty1 LTR +S000006853 long_terminal_repeat YDRCdelta21 chromosome 4 4 987483 987150 C 2011-02-03 2000-05-19 Ty1 LTR +S000007395 transposable_element_gene YDR261C-D gag-pol fusion protein chromosome 4 4 992349 987534 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; Gag processing produces capsid proteins, Pol is cleaved to produce protease, reverse transcriptase and integrase activities; in YDRCTy1-3 TYB is mutant and probably non-functional +S000032325 CDS YDR261C-D 4 991043 987534 C 2011-02-03 1999-07-17 +S000032324 CDS YDR261C-D 4 992349 991045 C 2011-02-03 1999-07-17 +S000032326 plus_1_translational_frameshift YDR261C-D 4 991044 991044 C 2011-02-03 1999-07-17 +S000007394 transposable_element_gene YDR261C-C gag protein chromosome 4 4 992349 991027 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; Gag processing produces capsid proteins; in YDRCTy1-3 TYB is mutant and probably non-functional +S000031433 CDS YDR261C-C 4 992349 991027 C 2011-02-03 1999-07-17 +S000006861 LTR_retrotransposon YDRCTy1-3 Ty1 chromosome 4 4 992642 987150 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C +S000006854 long_terminal_repeat YDRCdelta22 chromosome 4 4 992642 992309 C 2011-02-03 2000-05-19 Ty1 LTR +S000006880 long_terminal_repeat YDRCsigma4 YDRWsigma4 chromosome 4 4 992815 992740 C 2011-02-03 2000-05-19|2007-04-02 Ty3 LTR +S000006577 tRNA_gene tG(GCC)D2 chromosome 4 L000003771 4 992832 992902 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000031716 noncoding_exon tG(GCC)D2 4 992832 992902 W 2011-02-03 2000-05-19 +S000002670 ORF Uncharacterized YDR262W chromosome 4 4 993134 993952 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole and is induced in response to the DNA-damaging agent MMS; gene expression increases in response to Zymoliase treatment +S000036503 CDS YDR262W 4 993134 993952 W 2011-02-03 1996-07-31 +S000002671 ORF Verified YDR263C DIN7 exodeoxyribonuclease DIN7|DIN3 chromosome 4 L000003086 4 995534 994242 C 2011-02-03 1996-07-31 Mitochondrial nuclease functioning in DNA repair and replication; modulates the stability of the mitochondrial genome, induced by exposure to mutagens, also induced during meiosis at a time nearly coincident with commitment to recombination; DIN7 has a paralog, EXO1, that arose from the whole genome duplication +S000036563 CDS YDR263C 4 995534 994242 C 2011-02-03 1996-07-31 +S000002672 ORF Verified YDR264C AKR1 palmitoyltransferase AKR1 chromosome 4 L000000072 4 998323 996029 C 2011-02-03 1996-07-31 Palmitoyl transferase involved in protein palmitoylation; acts as a negative regulator of pheromone response pathway; required for endocytosis of pheromone receptors; involved in cell shape control; contains ankyrin repeats; AKR1 has a paralog, AKR2, that arose from the whole genome duplication; any of several human homologs encoding DHHC-type zinc fingers (ZDHHC) can complement temperature sensitivity of yeast akr1 null mutant +S000036629 CDS YDR264C 4 998323 996029 C 2011-02-03 1996-07-31 +S000002673 ORF Verified YDR265W PEX10 ubiquitin-protein ligase peroxin 10|PAS4 chromosome 4 L000003961 4 998864 999877 W 2011-02-03 1996-07-31 Peroxisomal membrane E3 ubiquitin ligase; required for for Ubc4p-dependent Pex5p ubiquitination and peroxisomal matrix protein import; contains zinc-binding RING domain; mutations in human homolog cause various peroxisomal disorders +S000036772 CDS YDR265W 4 998864 999877 W 2011-02-03 1996-07-31 +S000002674 ORF Verified YDR266C HEL2 E3 ubiquitin-protein ligase HEL2 chromosome 4 4 1002023 1000104 C 2011-02-03 1996-07-31 RING finger ubiquitin ligase (E3); involved in ubiquitination and degradation of excess histones; interacts with Ubc4p and Rad53p; null mutant sensitive to hydroxyurea (HU); green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; computational analysis suggests a role as a transcription factor +S000030572 CDS YDR266C 4 1002023 1000104 C 2011-02-03 1996-07-31 +S000002675 ORF Verified YDR267C CIA1 iron-sulfur cluster assembly protein CIA1 chromosome 4 4 1003502 1002510 C 2011-02-03 1996-07-31 Component of cytosolic iron-sulfur protein assembly (CIA) machinery; acts at late step of Fe-S cluster assembly; forms CIA targeting complex with Cia2p and Met18p that directs Fe-S cluster incorporation into subset of proteins involved in methionine biosynthesis, DNA replication and repair, transcription, telomere maintenance; contains WD40 repeats; human homolog CIAO1 can complement yeast cia1 null mutant +S000030699 CDS YDR267C 4 1003502 1002510 C 2011-02-03 1996-07-31 +S000002676 ORF Verified YDR268W MSW1 tryptophan--tRNA ligase MSW1 chromosome 4 L000001209 4 1004004 1005143 W 2011-02-03 1996-07-31 Mitochondrial tryptophanyl-tRNA synthetase +S000030885 CDS YDR268W 4 1004004 1005143 W 2011-02-03 1996-07-31 +S000002678 ORF Verified YDR270W CCC2 Cu(2+)-transporting P-type ATPase CCC2 chromosome 4 L000000235 4 1005675 1008689 W 2011-02-03 1996-07-31 Cu(+2)-transporting P-type ATPase; required for export of copper from the cytosol into an extracytosolic compartment; similar to human proteins involved in Menkes and Wilsons diseases; protein abundance increases in response to DNA replication stress; affects TBSV model (+)RNA virus replication by regulating copper metabolism; human homologs ATP7A and ATP7B both complement yeast null mutant +S000031624 CDS YDR270W 4 1005675 1008689 W 2011-02-03 1996-07-31 +S000002677 ORF Dubious YDR269C chromosome 4 4 1005988 1005665 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031741 CDS YDR269C 4 1005988 1005665 C 2011-02-03 1996-07-31 +S000002679 ORF Dubious YDR271C chromosome 4 4 1008766 1008395 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CCC2/YDR270W +S000031691 CDS YDR271C 4 1008766 1008395 C 2011-02-03 1996-07-31 +S000002680 ORF Verified YDR272W GLO2 hydroxyacylglutathione hydrolase GLO2 chromosome 4 L000003488 4 1009010 1009834 W 2011-02-03 1996-07-31 Cytoplasmic glyoxalase II; catalyzes the hydrolysis of S-D-lactoylglutathione into glutathione and D-lactate; GLO2 has a paralog, GLO4, that arose from the whole genome duplication +S000032699 CDS YDR272W 4 1009010 1009834 W 2011-02-03 1996-07-31 +S000002681 ORF Verified YDR273W DON1 chromosome 4 4 1010176 1011273 W 2011-02-03 1996-07-31 Meiosis-specific component of the spindle pole body; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane (PSM) during meiosis II; required for PSM growth and closure; DON1 has a paralog, CUE5, that arose from the whole genome +S000032778 CDS YDR273W 4 1010176 1011273 W 2011-02-03 1996-07-31 +S000002682 ORF Uncharacterized YDR274C chromosome 4 4 1011960 1011589 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR274C is not an essential gene +S000032843 CDS YDR274C 4 1011960 1011589 C 2011-02-03 1996-07-31 +S000002683 ORF Verified YDR275W BSC2 chromosome 4 4 1012252 1012959 W 2011-02-03 1996-07-31 Protein of unknown function; ORF exhibits genomic organization compatible with a translational readthrough-dependent mode of expression; null mutant displays increased translation rate and increased readthrough of premature stop codons; BSC2 has a paralog, IRC23, that arose from the whole genome duplication +S000034861 CDS YDR275W 4 1012252 1012959 W 2011-02-03 1996-07-31 +S000002684 ORF Verified YDR276C PMP3 SNA1 chromosome 4 4 1013643 1013476 C 2011-02-03 1996-07-31 Small plasma membrane protein; confers resistance to amphotericin B and is a potential target of this common antifungal drug; related to a family of plant polypeptides that are overexpressed under high salt concentration or low temperature; not essential for viability; deletion causes hyperpolarization of the plasma membrane potential +S000034908 CDS YDR276C 4 1013643 1013476 C 2011-02-03 1996-07-31 +S000002685 ORF Verified YDR277C MTH1 HTR1|DGT1|BPC1 chromosome 4 L000001213|L000000831 4 1015702 1014401 C 2011-02-03 1996-07-31 Negative regulator of the glucose-sensing signal transduction pathway; required for repression of transcription by Rgt1p; interacts with Rgt1p and the Snf3p and Rgt2p glucose sensors; phosphorylated by Yck1p, triggering Mth1p degradation; MTH1 has a paralog, STD1, that arose from the whole genome duplication +S000035061 CDS YDR277C 4 1015702 1014401 C 2011-02-03 1996-07-31 +S000118442 ARS ARS430 ARSIV-1017 chromosome 4 4 1016670 1016911 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178077 ARS_consensus_sequence ARS430 4 1016846 1016830 C 2014-11-18 2014-11-18 +S000006546 tRNA_gene tE(CUC)D chromosome 4 L000003781 4 1017278 1017207 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis +S000031893 noncoding_exon tE(CUC)D 4 1017278 1017207 C 2011-02-03 2000-05-19 +S000002686 ORF Uncharacterized YDR278C chromosome 4 4 1017318 1017001 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YDR278C is not an essential gene +S000035163 CDS YDR278C 4 1017318 1017001 C 2011-02-03 1996-07-31 +S000002687 ORF Verified YDR279W RNH202 Rnh2B chromosome 4 4 1019368 1020420 W 2011-02-03 1996-07-31 Ribonuclease H2 subunit; required for RNase H2 activity; role in ribonucleotide excision repair; related to human AGS2 that causes Aicardi-Goutieres syndrome +S000036060 CDS YDR279W 4 1019368 1020420 W 2011-02-03 1996-07-31 +S000002688 ORF Verified YDR280W RRP45 exosome non-catalytic core subunit RRP45 chromosome 4 L000004578 4 1020747 1021664 W 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp45p (PM/SCL-75, EXOSC9); protein abundance increases in response to DNA replication stress +S000035087 CDS YDR280W 4 1020747 1021664 W 2011-02-03 1996-07-31 +S000002689 ORF Verified YDR281C PHM6 chromosome 4 S000007515 4 1022321 1022007 C 2011-02-03 1996-07-31 Protein of unknown function; expression is regulated by phosphate levels +S000035153 CDS YDR281C 4 1022321 1022007 C 2011-02-03 1996-07-31 +S000006881 long_terminal_repeat YDRWsigma5 chromosome 4 4 1023137 1023477 W 2011-02-03 2000-05-19 Ty3 LTR +S000002690 ORF Verified YDR282C MRX10 chromosome 4 4 1024755 1023511 C 2011-02-03 1996-07-31 Mitochondrial inner membrane protein of unknown function; associates with mitochondrial ribosome; localizes to the inner membrane with the C terminus facing the intermembrane space; ortholog of human RMND1, mutation in which is implicated in infantile encephaloneuromyopathy and defective mitochondrial translation +S000035316 CDS YDR282C 4 1024755 1023511 C 2011-02-03 1996-07-31 +S000002691 ORF Verified YDR283C GCN2 serine/threonine-protein kinase GCN2|AAS102|NDR2|AAS1 chromosome 4 L000000681 4 1030049 1025070 C 173 2011-02-03 1996-07-31 Protein kinase; phosphorylates the alpha-subunit of translation initiation factor eIF2 (Sui2p) in response to starvation; activated by uncharged tRNAs and the Gcn1p-Gcn20p complex; contributes to DNA damage checkpoint control +S000036262 CDS YDR283C 4 1030049 1025070 C 2011-02-03 1996-07-31 +S000002692 ORF Verified YDR284C DPP1 bifunctional diacylglycerol diphosphate phosphatase/phosphatidate phosphatase|ZRG1 chromosome 4 L000003582 4 1031419 1030550 C 2011-02-03 1996-07-31 Diacylglycerol pyrophosphate (DGPP) phosphatase; zinc-regulated vacuolar membrane-associated lipid phosphatase, dephosphorylates DGPP to phosphatidate (PA) and Pi, then PA to diacylglycerol; involved in lipid signaling and cell metabolism +S000036340 CDS YDR284C 4 1031419 1030550 C 2011-02-03 1996-07-31 +S000002693 ORF Verified YDR285W ZIP1 chromosome 4 L000002568 4 1032436 1035063 W 2011-02-03 1996-07-31 Transverse filament protein of the synaptonemal complex; required for normal levels of meiotic recombination and pairing between homologous chromosome during meiosis; required for meiotic recombination between non-allelc sites; potential Cdc28p substrate +S000036473 CDS YDR285W 4 1032436 1035063 W 2011-02-03 1996-07-31 +S000002694 ORF Uncharacterized YDR286C chromosome 4 4 1035575 1035231 C 2011-02-03 1996-07-31 Putative protein of unknown function; predicted to have thiol-disulfide oxidoreductase active site +S000037085 CDS YDR286C 4 1035575 1035231 C 2011-02-03 1996-07-31 +S000002695 ORF Verified YDR287W INM2 inositol monophosphate 1-phosphatase INM2 chromosome 4 4 1035995 1036873 W 2011-02-03 1996-07-31 Inositol monophosphatase; involved in biosynthesis of inositol; enzymatic activity requires magnesium ions and is inhibited by lithium and sodium ions; inm1 inm2 double mutant lacks inositol auxotrophy +S000037232 CDS YDR287W 4 1035995 1036873 W 2011-02-03 1996-07-31 +S000002696 ORF Verified YDR288W NSE3 Smc5-Smc6 complex subunit NSE3 chromosome 4 4 1037195 1038106 W 2011-02-03 1996-07-31 Component of the SMC5-SMC6 complex; this complex plays a key role in the removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; protein abundance increases in response to DNA replication stress +S000037315 CDS YDR288W 4 1037195 1038106 W 2011-02-03 1996-07-31 +S000002698 ORF Dubious YDR290W SWS1 chromosome 4 4 1039370 1039699 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RTT103 +S000031324 CDS YDR290W 4 1039370 1039699 W 2011-02-03 1996-07-31 +S000002697 ORF Verified YDR289C RTT103 chromosome 4 4 1039509 1038280 C 2011-02-03 1996-07-31 Protein involved in transcription termination by RNA polymerase II; interacts with exonuclease Rat1p and Rai1p; has an RPR domain (carboxy-terminal domain interacting domain); also involved in regulation of Ty1 transposition +S000037346 CDS YDR289C 4 1039509 1038280 C 2011-02-03 1996-07-31 +S000002699 ORF Verified YDR291W HRQ1 ATP-dependent 3'-5' DNA helicase chromosome 4 4 1039728 1042961 W 2011-02-03 1996-07-31 3'-5' DNA helicase that has DNA strand annealing activity; helicase activity is stimulated by fork structure and 3'-tail length of substrates; acts with Rad4p in nucleotide-excision repair; belongs to the widely conserved RecQ family of proteins which are involved in maintaining genomic integrity; similar to the human RecQ4p implicated in Rothmund-Thomson syndrome (RTS) +S000032334 CDS YDR291W 4 1039728 1042961 W 2011-02-03 1996-07-31 +S000002700 ORF Verified YDR292C SRP101 Signal recognition particle receptor subunit alpha chromosome 4 L000002067 4 1045011 1043146 C 2011-02-03 1996-07-31 Signal recognition particle (SRP) receptor alpha subunit; contain GTPase domains; involved in SRP-dependent protein targeting; interacts with the beta subunit, Srp102p +S000032412 CDS YDR292C 4 1045011 1043146 C 2011-02-03 1996-07-31 +S000002701 ORF Verified YDR293C SSD1 mRNA-binding translational repressor SSD1|SRK1|RLT1|MCS1|CLA1 chromosome 4 L000002077 4 1049392 1045640 C 176 2011-02-03 1996-07-31 Translational repressor with a role in polar growth and wall integrity; regulated by Cbk1p phosphorylation to effect bud-specific translational control and localization of specific mRNAs; interacts with TOR pathway components; contains a functional N-terminal nuclear localization sequence and nucleocytoplasmic shuttling appears to be critical to Ssd1p function +S000032503 CDS YDR293C 4 1049392 1045640 C 2011-02-03 1996-07-31 +S000002702 ORF Verified YDR294C DPL1 sphinganine-1-phosphate aldolase DPL1|BST1 chromosome 4 L000004296 4 1052228 1050459 C 2011-02-03 1996-07-31 Dihydrosphingosine phosphate lyase; regulates intracellular levels of sphingolipid long-chain base phosphates (LCBPs), degrades phosphorylated long chain bases, prefers C16 dihydrosphingosine-l-phosphate as a substrate +S000032617 CDS YDR294C 4 1052228 1050459 C 2011-02-03 1996-07-31 +S000002703 ORF Verified YDR295C HDA2 PLO2 chromosome 4 4 1054647 1052623 C 2011-02-03 1996-07-31 Subunit of the HDA1 histone deacetylase complex; possibly tetrameric trichostatin A-sensitive class II histone deacetylase complex contains Hda1p homodimer and an Hda2p-Hda3p heterodimer; involved in telomere maintenance; relocalizes to the cytosol in response to hypoxia +S000033335 CDS YDR295C 4 1054647 1052623 C 2011-02-03 1996-07-31 +S000002704 ORF Verified YDR296W MHR1 XTC1 chromosome 4 L000004333 4 1055212 1055892 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; also involved in homologous recombination in mitochondria; required for recombination-dependent mtDNA partitioning; involved in stimulation of mitochondrial DNA replication in response to oxidative stress +S000033421 CDS YDR296W 4 1055212 1055892 W 2011-02-03 1996-07-31 +S000002705 ORF Verified YDR297W SUR2 sphingosine hydroxylase|SYR2 chromosome 4 L000002244|L000002259 4 1056551 1057600 W 2011-02-03 1996-07-31 Sphinganine C4-hydroxylase; catalyses the conversion of sphinganine to phytosphingosine in sphingolipid biosyntheis +S000033508 CDS YDR297W 4 1056551 1057600 W 2011-02-03 1996-07-31 +S000118443 ARS ARS431 ARSIV-1058 chromosome 4 4 1057841 1057951 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178078 ARS_consensus_sequence ARS431 4 1057887 1057903 W 2014-11-18 2014-11-18 +S000002706 ORF Verified YDR298C ATP5 F1F0 ATP synthase subunit 5|OSC1 chromosome 4 L000000145 4 1058814 1058176 C 2011-02-03 1996-07-31 Subunit 5 of the stator stalk of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; homologous to bovine subunit OSCP (oligomycin sensitivity-conferring protein); phosphorylated +S000033515 CDS YDR298C 4 1058814 1058176 C 2011-02-03 1996-07-31 +S000002707 ORF Verified YDR299W BFR2 rRNA-processing protein BFR2 chromosome 4 L000004432 4 1059627 1061231 W 2011-02-03 1996-07-31 Component of the SSU and 90S preribosomes; involved in pre-18S rRNA processing; binds to U3 snoRNA and Mpp10p; multicopy suppressor of sensitivity to Brefeldin A; expression is induced during lag phase and also by cold shock +S000033609 CDS YDR299W 4 1059627 1061231 W 2011-02-03 1996-07-31 +S000002708 ORF Verified YDR300C PRO1 glutamate 5-kinase chromosome 4 L000001491 4 1062791 1061505 C 187 2011-02-03 1996-07-31 Gamma-glutamyl kinase; catalyzes the first step in proline biosynthesis; required for nitrogen starvation-induced ribophagy but not for nonselective autophagy; PRO1 has a paralog, YHR033W, that arose from the whole genome duplication +S000030896 CDS YDR300C 4 1062791 1061505 C 2011-02-03 1996-07-31 +S000002709 ORF Verified YDR301W CFT1 YHH1 chromosome 4 L000003600 4 1063352 1067425 W 2011-02-03 1996-07-31 RNA-binding subunit of the mRNA cleavage and polyadenylation factor; involved in poly(A) site recognition and required for both pre-mRNA cleavage and polyadenylation, 51% sequence similarity with mammalian AAUAA-binding subunit of CPSF +S000031983 CDS YDR301W 4 1063352 1067425 W 2011-02-03 1996-07-31 +S000002710 ORF Verified YDR302W GPI11 mannose-ethanolamine phosphotransferase GPI11 chromosome 4 4 1067731 1068390 W 2011-02-03 1996-07-31 ER membrane protein involved in a late step of GPI anchor assembly; involved in the addition of phosphoethanolamine to the multiply mannosylated glycosylphosphatidylinositol (GPI) intermediate; human PIG-Fp is a functional homolog +S000032108 CDS YDR302W 4 1067731 1068390 W 2011-02-03 1996-07-31 +S000002711 ORF Verified YDR303C RSC3 chromosome 4 4 1071386 1068729 C 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; essential gene required for maintenance of proper ploidy and regulation of ribosomal protein genes and the cell wall/stress response; RSC3 has a paralog, RSC30, that arose from the whole genome duplication +S000032135 CDS YDR303C 4 1071386 1068729 C 2011-02-03 1996-07-31 +S000002712 ORF Verified YDR304C CPR5 peptidylprolyl isomerase family protein CPR5|CYP5 chromosome 4 L000000466 4 1072557 1071880 C 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin) of the ER; catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; transcriptionally induced in response to unfolded proteins in the ER; CPR5 has a paralog, CPR2, that arose from the whole genome duplication +S000034130 CDS YDR304C 4 1072557 1071880 C 2011-02-03 1996-07-31 +S000002713 ORF Verified YDR305C HNT2 bis(5'-adenosyl)-triphosphatase|APH1 chromosome 4 L000003335 4 1073488 1072746 C 2011-02-03 1996-07-31 Dinucleoside triphosphate hydrolase; has similarity to the tumor suppressor FHIT and belongs to the histidine triad (HIT) superfamily of nucleotide-binding proteins +S000034247 CDS YDR305C 4 1073312 1072746 C 2011-02-03 1996-07-31 +S000034246 CDS YDR305C 4 1073488 1073402 C 2011-02-03 1996-07-31 +S000034248 intron YDR305C 4 1073401 1073313 C 2011-02-03 1996-07-31 +S000002714 ORF Verified YDR306C chromosome 4 4 1075171 1073735 C 2011-02-03 1996-07-31 F-box protein of unknown function; interacts with Sgt1p via a Leucine-Rich Repeat (LRR) domain +S000034313 CDS YDR306C 4 1075171 1073735 C 2011-02-03 1996-07-31 +S000006767 tRNA_gene tV(CAC)D chromosome 4 L000003780 4 1075544 1075472 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000030586 noncoding_exon tV(CAC)D 4 1075544 1075472 C 2011-02-03 2000-05-19 +S000002715 ORF Uncharacterized YDR307W PMT7 putative dolichyl-phosphate-mannose--protein mannosyltransferase chromosome 4 S000029378|L000004021|L000004010 4 1075865 1077853 W 2011-02-03 1996-07-31 Putative protein mannosyltransferase similar to Pmt1p; has a potential role in protein O-glycosylation +S000035324 CDS YDR307W 4 1075865 1077853 W 2011-02-03 1996-07-31 +S000002716 ORF Verified YDR308C SRB7 SSX1|MED21 chromosome 4 L000002754|S000029514|L000002097 4 1078449 1078027 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; target of the global repressor Tup1p +S000035339 CDS YDR308C 4 1078449 1078027 C 2011-02-03 1996-07-31 +S000002717 ORF Verified YDR309C GIC2 chromosome 4 L000003314 4 1080199 1079048 C 2011-02-03 1996-07-31 Redundant rho-like GTPase Cdc42p effector; involved in initiation of budding and cellular polarization; interacts with Cdc42p via the Cdc42/Rac-interactive binding (CRIB) domain and with PI(4,5)P2 via a polybasic region; GIC2 has a paralog, GIC1, that arose from the whole genome duplication +S000035408 CDS YDR309C 4 1080199 1079048 C 2011-02-03 1996-07-31 +S000002718 ORF Verified YDR310C SUM1 chromosome 4 L000003008 4 1084316 1081128 C 2011-02-03 1996-07-31 Transcriptional repressor that regulates middle-sporulation genes; required for mitotic repression of middle sporulation-specific genes; also acts as general replication initiation factor; involved in telomere maintenance, chromatin silencing; regulated by pachytene checkpoint +S000034868 CDS YDR310C 4 1084316 1081128 C 2011-02-03 1996-07-31 +S000002719 ORF Verified YDR311W TFB1 TFIIH/NER complex subunit TFB1 chromosome 4 L000002284 4 1085065 1086993 W 2011-02-03 1996-07-31 Subunit of TFIIH and nucleotide excision repair factor 3 complexes; required for nucleotide excision repair, target for transcriptional activators; relocalizes to the cytosol in response to hypoxia +S000035123 CDS YDR311W 4 1085065 1086993 W 2011-02-03 1996-07-31 +S000002720 ORF Verified YDR312W SSF2 rRNA-binding ribosome biosynthesis protein chromosome 4 L000002081 4 1087581 1088942 W 2011-02-03 1996-07-31 Protein required for ribosomal large subunit maturation; functionally redundant with Ssf1p; member of the Brix family; SSF2 has a paralog, SSF1, that arose from the whole genome duplication +S000035275 CDS YDR312W 4 1087581 1088942 W 2011-02-03 1996-07-31 +S000002721 ORF Verified YDR313C PIB1 phosphatidylinositol-3-phosphate-binding ubiquitin-protein ligase chromosome 4 L000004635 4 1090079 1089219 C 2011-02-03 1996-07-31 RING-type ubiquitin ligase of the endosomal and vacuolar membranes; binds phosphatidylinositol(3)-phosphate; contains a FYVE finger domain +S000036080 CDS YDR313C 4 1090079 1089219 C 2011-02-03 1996-07-31 +S000002722 ORF Verified YDR314C RAD34 chromosome 4 4 1092511 1090433 C 2011-02-03 1996-07-31 Protein involved in nucleotide excision repair (NER); homologous to RAD4 +S000036213 CDS YDR314C 4 1092511 1090433 C 2011-02-03 1996-07-31 +S000002723 ORF Verified YDR315C IPK1 inositol pentakisphosphate 2-kinase|GSL1 chromosome 4 L000003564 4 1093586 1092741 C 2011-02-03 1996-07-31 Inositol 1,3,4,5,6-pentakisphosphate 2-kinase; nuclear protein required for synthesis of 1,2,3,4,5,6-hexakisphosphate (phytate), which is integral to cell function; has 2 motifs conserved in other fungi; ipk1 gle1 double mutant is inviable; human IPPK can complement ipk1 null mutant +S000036321 CDS YDR315C 4 1093586 1092741 C 2011-02-03 1996-07-31 +S000002724 ORF Verified YDR316W OMS1 putative RNA methyltransferase chromosome 4 4 1093763 1095178 W 2011-02-03 1996-07-31 Protein integral to the mitochondrial membrane; has a conserved methyltransferase motif and is predicted to be an RNA methyltransferase; multicopy suppressor of respiratory defects caused by OXA1 mutations +S000030079 CDS YDR316W 4 1093763 1095178 W 2011-02-03 1996-07-31 +S000006563 tRNA_gene tF(GAA)D chromosome 4 L000003779 4 1095461 1095370 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035376 intron tF(GAA)D 4 1095424 1095406 C 2011-02-03 2000-05-19 +S000035375 noncoding_exon tF(GAA)D 4 1095405 1095370 C 2011-02-03 2000-05-19 +S000035374 noncoding_exon tF(GAA)D 4 1095461 1095425 C 2011-02-03 2000-05-19 +S000006871 long_terminal_repeat YDRWdelta23 chromosome 4 4 1095767 1096104 W 2011-02-03 2000-05-19 Ty1 LTR +S000006882 LTR_retrotransposon YDRWTy1-4 Ty1 chromosome 4 4 1095767 1101692 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007398 transposable_element_gene YDR316W-A gag protein chromosome 4 4 1096064 1097386 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034439 CDS YDR316W-A 4 1096064 1097386 W 2011-02-03 1999-07-17 +S000007399 transposable_element_gene YDR316W-B gag-pol fusion protein chromosome 4 4 1096064 1101332 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034443 CDS YDR316W-B 4 1096064 1097368 W 2011-02-03 1999-07-17 +S000034444 CDS YDR316W-B 4 1097370 1101332 W 2011-02-03 1999-07-17 +S000034445 plus_1_translational_frameshift YDR316W-B 4 1097369 1097369 W 2011-02-03 1999-07-17 +S000006872 long_terminal_repeat YDRWdelta24 chromosome 4 4 1101355 1101692 W 2011-02-03 2000-05-19 Ty1 LTR +S000002725 ORF Verified YDR317W HIM1 chromosome 4 S000029210|L000000774 4 1102184 1103428 W 275 2011-02-03 1996-07-31 Protein of unknown function involved in DNA repair +S000030217 CDS YDR317W 4 1102184 1103428 W 2011-02-03 1996-07-31 +S000002726 ORF Verified YDR318W MCM21 CTF5 chromosome 4 L000003998 4 1103758 1104947 W 2011-02-03 2003-09-27|1996-07-31 Component of the kinetochore sub-complex COMA; COMA (Ctf19p, Okp1p, Mcm21p, Ame1p) bridges kinetochore subunits in contact with centromeric DNA with subunits bound to microtubules during kinetochore assembly; involved in minichromosome maintenance; modified by sumoylation; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-O and fission yeast mal2 +S000030336 CDS YDR318W 4 1103758 1103809 W 2011-02-03 2003-09-27|1996-07-31 +S000030337 CDS YDR318W 4 1103893 1104947 W 2011-02-03 2003-09-27 +S000030338 intron YDR318W 4 1103810 1103892 W 2011-02-03 2003-09-27 +S000002727 ORF Uncharacterized YDR319C YFT2 FIT2A chromosome 4 4 1105827 1105003 C 2011-02-03 1996-07-31 Protein required for normal ER membrane biosynthesis; member of the highly conserved FIT family of proteins involved in triglyceride droplet biosynthesis and homologous to human FIT2; interacts with Sst2p and Hsp82p in high-throughput two-hybrid screens +S000030447 CDS YDR319C 4 1105827 1105003 C 2011-02-03 1996-07-31 +S000002728 ORF Verified YDR320C SWA2 BUD24|AUX1 chromosome 4 4 1108101 1106095 C 2011-02-03 1996-07-31 Auxilin-like protein involved in vesicular transport; clathrin-binding protein required for uncoating of clathrin-coated vesicles +S000030945 CDS YDR320C 4 1108101 1106095 C 2011-02-03 1996-07-31 +S000028821 ORF Dubious YDR320W-B chromosome 4 4 1108484 1108621 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene DAD4/YDR320C-A +S000033640 CDS YDR320W-B 4 1108484 1108621 W 2011-02-03 2003-07-29 +S000007604 ORF Verified YDR320C-A DAD4 HSK2 chromosome 4 4 1108498 1108280 C 2011-02-03 2001-02-26 Essential subunit of the Dam1 complex (aka DASH complex); complex couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis +S000037150 CDS YDR320C-A 4 1108498 1108280 C 2011-02-03 2001-02-26 +S000002729 ORF Verified YDR321W ASP1 asparaginase ASP1 chromosome 4 L000000129 4 1108702 1109847 W 190 2011-02-03 1996-07-31 Cytosolic L-asparaginase, involved in asparagine catabolism; catalyzes hydrolysis of L-asparagine to aspartic acid and ammonia; important enzyme for the treatment of acute lymphoblastic leukemia; has low glutaminase activity and dependence; synthesized constitutively +S000031109 CDS YDR321W 4 1108702 1109847 W 2011-02-03 1996-07-31 +S000119071 ARS ARS452 ARSIV-1110|ARS431.5 chromosome 4 4 1109964 1110204 2011-02-03 2006-10-05 Autonomously Replicating Sequence +S000002730 ORF Verified YDR322W MRPL35 mitochondrial 54S ribosomal protein YmL35|YmL35 chromosome 4 L000002694 4 1110589 1111692 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000031250 CDS YDR322W 4 1110589 1111692 W 2011-02-03 1996-07-31 +S000007255 ORF Verified YDR322C-A TIM11 F1F0 ATP synthase subunit e|ATP21 chromosome 4 L000004719 4 1112293 1112003 C 2011-02-03 1999-07-17 Subunit e of mitochondrial F1F0-ATPase; ATPase is a large, evolutionarily conserved enzyme complex required for ATP synthesis; essential for the dimeric and oligomeric state of ATP synthase, which in turn determines the shape of inner membrane cristae +S000035372 CDS YDR322C-A 4 1112293 1112003 C 2011-02-03 1999-07-17 +S000002731 ORF Verified YDR323C PEP7 VPT19|VPS19|VPL21|VAC1 chromosome 4 L000001377 4 1114027 1112480 C 192 2011-02-03 1996-07-31 Adaptor protein involved in vesicle-mediated vacuolar protein sorting; multivalent adaptor protein; facilitates vesicle-mediated vacuolar protein sorting by ensuring high-fidelity vesicle docking and fusion, which are essential for targeting of vesicles to the endosome; required for vacuole inheritance +S000031288 CDS YDR323C 4 1114027 1112480 C 2011-02-03 1996-07-31 +S000002732 ORF Verified YDR324C UTP4 chromosome 4 4 1116763 1114433 C 2011-02-03 1996-07-31 Subunit of U3-containing 90S preribosome and SSU processome complexes; involved in production of 18S rRNA and assembly of small ribosomal subunit; member of t-Utp subcomplex involved with transcription of 35S rRNA transcript; Small Subunit processome is also known as SSU processome +S000032287 CDS YDR324C 4 1116763 1114433 C 2011-02-03 1996-07-31 +S000002733 ORF Verified YDR325W YCG1 condensin subunit YCG1|YCS5|TIE1 chromosome 4 S000007469 4 1117126 1120233 W 2011-02-03 2002-12-17|1996-07-31 Subunit of the condensin complex; required for establishment and maintenance of chromosome condensation, chromosome segregation and chromatin binding by the complex; required for tRNA genes clustering at the nucleolus; required for replication slow zone breakage following Mec1p inactivation; transcription is cell cycle regulated, peaking in mitosis and declining in G1; protein is constitutively degraded by the proteasome; rate limiting for condensin recruitment to chromatin +S000032437 CDS YDR325W 4 1117126 1120233 W 2011-02-03 2002-12-17|1996-07-31 +S000002734 ORF Verified YDR326C YSP2 LAM2|LTC4 chromosome 4 4 1124925 1120609 C 2011-02-03 1996-07-31 Sterol-binding protein; has a probable role in retrograde transport of sterols from the plasma membrane to the ER; contains two StART-like domains that bind sterols and a GRAM domain; co-localizes to puncta in the cortical ER with Sip3p; one of six StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes +S000032495 CDS YDR326C 4 1124925 1120609 C 2011-02-03 1996-07-31 +S000002735 ORF Dubious YDR327W chromosome 4 4 1125302 1125628 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene SKP1 +S000034595 CDS YDR327W 4 1125302 1125628 W 2011-02-03 1996-07-31 +S000002736 ORF Verified YDR328C SKP1 SCF ubiquitin ligase subunit SKP1|CBF3D|MGO1 chromosome 4 L000001910 4 1126018 1125434 C 2011-02-03 1996-07-31 Evolutionarily conserved kinetochore protein; part of multiple protein complexes, including the SCF ubiquitin ligase complex, the CBF3 complex that binds centromeric DNA, and the RAVE complex that regulates assembly of the V-ATPase; protein abundance increases in response to DNA replication stress +S000034604 CDS YDR328C 4 1126018 1125434 C 2011-02-03 1996-07-31 +S000002737 ORF Verified YDR329C PEX3 PAS3 chromosome 4 L000001339 4 1127595 1126270 C 2011-02-03 1996-07-31 Peroxisomal membrane protein (PMP); required for proper localization and stability of PMPs; anchors peroxisome retention factor Inp1p at the peroxisomal membrane; interacts with Pex19p +S000034672 CDS YDR329C 4 1127595 1126270 C 2011-02-03 1996-07-31 +S000002738 ORF Verified YDR330W UBX5 chromosome 4 4 1127872 1129374 W 2011-02-03 1996-07-31 UBX domain-containing protein that interacts with Cdc48p; ubiquitin regulatory X is also known as UBX +S000034262 CDS YDR330W 4 1127872 1129374 W 2011-02-03 1996-07-31 +S000002739 ORF Verified YDR331W GPI8 GPI-anchor transamidase chromosome 4 L000004086 4 1129588 1130823 W 2011-02-03 1996-07-31 ER membrane glycoprotein subunit of the GPI transamidase complex; adds glycosylphosphatidylinositol (GPI) anchors to newly synthesized proteins; human PIG-K protein is a functional homolog +S000034385 CDS YDR331W 4 1129588 1130823 W 2011-02-03 1996-07-31 +S000002740 ORF Verified YDR332W IRC3 double-stranded DNA-dependent ATPase chromosome 4 4 1131001 1133070 W 2011-02-03 1996-07-31 Double-stranded DNA-dependent helicase of the DExH/D-box family; required for maintenance of the mitochondrial (mt) genome; null mutant accumulates double-stranded breaks in mt DNA; localizes to the mt matrix +S000035410 CDS YDR332W 4 1131001 1133070 W 2011-02-03 1996-07-31 +S000002741 ORF Verified YDR333C RQC1 chromosome 4 4 1135431 1133260 C 2011-02-03 1996-07-31 Component of the ribosome quality control complex (RQC); RQC (Rqc1p-Rkr1p-Tae2p-Cdc48p-Npl4p-Ufd1p) is a ribosome-bound complex required for the degradation of polypeptides arising from stalled translation; required along with Rkr1p for recruitment of the Cdc48p-Npl4p-Ufd1p AAA ATPase complex to the RQC +S000035465 CDS YDR333C 4 1135431 1133260 C 2011-02-03 1996-07-31 +S000002742 ORF Verified YDR334W SWR1 chromatin-remodeling protein SWR1 chromosome 4 S000007447 4 1135932 1140476 W 2011-02-03 1996-07-31 Swi2/Snf2-related ATPase; structural component of the SWR1 complex, which exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; relocalizes to the cytosol in response to hypoxia; chronological aging factor that mediates lifespan extension by dietary restriction +S000035602 CDS YDR334W 4 1135932 1140476 W 2011-02-03 1996-07-31 +S000002743 ORF Verified YDR335W MSN5 karyopherin MSN5|STE21|KAP142 chromosome 4 L000002124|L000003212 4 1141168 1144842 W 196 2011-02-03 1996-07-31 Karyopherin; involved in nuclear import and export of proteins, including import of replication protein A and export of Far1p and transcription factors Swi5p, Swi6p, Msn2p, and Pho4p; required for re-export of mature tRNAs after their retrograde import from the cytoplasm; exportin-5 homolog +S000036506 CDS YDR335W 4 1141168 1144842 W 2011-02-03 1996-07-31 +S000002744 ORF Uncharacterized YDR336W MRX8 chromosome 4 4 1145092 1146036 W 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; sumoylated under stress conditions in a genome wide study; YDR336W is not an essential gene +S000036602 CDS YDR336W 4 1145092 1146036 W 2011-02-03 1996-07-31 +S000002745 ORF Verified YDR337W MRPS28 mitochondrial 37S ribosomal protein MRPS28 chromosome 4 L000001176 4 1146319 1147179 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000036695 CDS YDR337W 4 1146319 1147179 W 2011-02-03 1996-07-31 +S000002746 ORF Uncharacterized YDR338C chromosome 4 4 1149466 1147379 C 2011-02-03 1996-07-31 Putative protein of unknown function; member of the multi-drug and toxin extrusion (MATE) family of the multidrug/oligosaccharidyl-lipid/polysaccharide (MOP) exporter superfamily +S000036729 CDS YDR338C 4 1149466 1147379 C 2011-02-03 1996-07-31 +S000002747 ORF Verified YDR339C FCF1 rRNA-processing protein FCF1|UTP24 chromosome 4 4 1150520 1149951 C 2011-02-03 1996-07-31 Putative PINc domain nuclease; required for early cleavages of 35S pre-rRNA and maturation of 18S rRNA; component of the SSU (small subunit) processome involved in 40S ribosomal subunit biogenesis; copurifies with Faf1p +S000030573 CDS YDR339C 4 1150520 1149951 C 2011-02-03 1996-07-31 +S000002748 ORF Dubious YDR340W chromosome 4 4 1150881 1151183 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000030471 CDS YDR340W 4 1150881 1151183 W 2011-02-03 1996-07-31 +S000006777 tRNA_gene tX(XXX)D chromosome 4 L000003778 4 1150941 1150842 C 2011-02-03 2000-05-19 tRNA of undetermined specificity, predicted by tRNAscan-SE analysis; very similar to serine tRNAs +S000032726 noncoding_exon tX(XXX)D 4 1150941 1150842 C 2011-02-03 2000-05-19 +S000006873 long_terminal_repeat YDRWdelta25 chromosome 4 4 1151039 1151368 W 2011-02-03 2000-05-19 Ty1 LTR +S000002749 ORF Verified YDR341C arginine--tRNA ligase|ArgRS|RRS1 chromosome 4 4 1153626 1151803 C 2011-02-03 1996-07-31 Arginyl-tRNA synthetase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; YDR341C has a paralog, MSR1, that arose from the whole genome duplication +S000030508 CDS YDR341C 4 1153626 1151803 C 2011-02-03 1996-07-31 +S000002750 ORF Verified YDR342C HXT7 hexose transporter HXT7 chromosome 4 L000000841 4 1155928 1154216 C 2011-02-03 1996-07-31 High-affinity glucose transporter; member of the major facilitator superfamily, nearly identical to Hxt6p, expressed at high basal levels relative to other HXTs, expression repressed by high glucose levels; HXT7 has a paralog, HXT4, that arose from the whole genome duplication +S000031436 CDS YDR342C 4 1155928 1154216 C 2011-02-03 1996-07-31 +S000118444 ARS ARS432 ARSIV-1159 chromosome 4 4 1159262 1159510 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119074 ARS_consensus_sequence ARS432 4 1159461 1159447 C 2011-02-03 2006-10-05 +S000002751 ORF Verified YDR343C HXT6 hexose transporter HXT6 chromosome 4 L000000840 4 1161320 1159608 C 2011-02-03 1996-07-31 High-affinity glucose transporter; member of the major facilitator superfamily, nearly identical to Hxt7p, expressed at high basal levels relative to other HXTs, repression of expression by high glucose requires SNF3; HXT6 has a paralog, HXT1, that arose from the whole genome duplication +S000031535 CDS YDR343C 4 1161320 1159608 C 2011-02-03 1996-07-31 +S000002752 ORF Dubious YDR344C chromosome 4 4 1162449 1162006 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031692 CDS YDR344C 4 1162449 1162006 C 2011-02-03 1996-07-31 +S000002753 ORF Verified YDR345C HXT3 hexose transporter HXT3 chromosome 4 L000000837 4 1164660 1162957 C 209.07 2011-02-03 1996-07-31 Low affinity glucose transporter of the major facilitator superfamily; expression is induced in low or high glucose conditions; HXT3 has a paralog, HXT5, that arose from the whole genome duplication +S000032671 CDS YDR345C 4 1164660 1162957 C 2011-02-03 1996-07-31 +S000119072 ARS ARS453 ARSIV-1166|ARS432.5 chromosome 4 4 1166067 1166212 2014-11-18 2014-11-18|2006-10-05 Autonomously Replicating Sequence +S000119073 ARS_consensus_sequence ARS453 4 1166181 1166167 C 2011-02-03 2006-10-05 +S000002754 ORF Verified YDR346C SVF1 SGI1 chromosome 4 4 1168659 1167214 C 2011-02-03 1996-07-31 Protein with a potential role in cell survival pathways; required for the diauxic growth shift; expression in mammalian cells increases survival under conditions inducing apoptosis; mutant has increased aneuploidy tolerance +S000032732 CDS YDR346C 4 1168659 1167214 C 2011-02-03 1996-07-31 +S000002755 ORF Verified YDR347W MRP1 mitochondrial 37S ribosomal protein MRP1 chromosome 4 L000001152 4 1169178 1170143 W 204.07 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; MRP1 exhibits genetic interactions with PET122, encoding a COX3-specific translational activator, and with PET123, encoding a small subunit mitochondrial ribosomal protein +S000032890 CDS YDR347W 4 1169178 1170143 W 2011-02-03 1996-07-31 +S000002756 ORF Verified YDR348C PAL1 chromosome 4 4 1171825 1170326 C 2011-02-03 1996-07-31 Protein of unknown function thought to be involved in endocytosis; physically interacts with Ede1p and is found at endocytic sites at cell periphery during early stages of endocytosis; green fluorescent protein (GFP)-fusion protein localizes to bud neck; potential Cdc28p substrate; similar to S. pombe Pal1 protein; relocalizes from bud neck to cytoplasm upon DNA replication stress; PAL1 has a paralog, YHR097C, that arose from the whole genome duplication +S000034824 CDS YDR348C 4 1171825 1170326 C 2011-02-03 1996-07-31 +S000002757 ORF Verified YDR349C YPS7 putative aspartic endopeptidase chromosome 4 L000004384 4 1174176 1172386 C 2011-02-03 1996-07-31 Putative GPI-anchored aspartic protease; member of the yapsin family of proteases involved in cell wall growth and maintenance; located in the cytoplasm and endoplasmic reticulum +S000034909 CDS YDR349C 4 1174176 1172386 C 2011-02-03 1996-07-31 +S000006874 long_terminal_repeat YDRWdelta26 chromosome 4 4 1175316 1175647 W 2011-02-03 2000-05-19 Ty1 LTR +S000006858 long_terminal_repeat YDRCsigma6 chromosome 4 4 1175812 1175134 C 2011-02-03 2000-05-19 Ty3 LTR +S000006659 tRNA_gene tM(CAU)D EMT1 chromosome 4 L000000551|L000003772 4 1175829 1175901 W 2011-02-03 2000-05-19 Methionine tRNA (tRNA-Met), functions in translational elongation; not involved in translational initiation; predicted by tRNAscan-SE analysis +S000034501 noncoding_exon tM(CAU)D 4 1175829 1175901 W 2011-02-03 2000-05-19 +S000002758 ORF Verified YDR350C ATP22 TCM10 chromosome 4 L000002912 4 1178174 1176120 C 2011-02-03 1996-07-31|2011-02-03 Specific translational activator for the mitochondrial ATP6 mRNA; Atp6p encodes a subunit of F1F0 ATP synthase; localized to the mitochondrial inner membrane +S000033802 CDS YDR350C 4 1178174 1176120 C 2011-02-03 1996-07-31|2011-02-03 +S000002759 ORF Verified YDR351W SBE2 chromosome 4 L000002745 4 1178666 1181260 W 2011-02-03 1996-07-31 Protein required for bud growth; involved in transport of cell wall components from the Golgi to the cell surface; SBE2 has a paralog, SBE22, that arose from the whole genome duplication +S000034051 CDS YDR351W 4 1178666 1181260 W 2011-02-03 1996-07-31 +S000002760 ORF Verified YDR352W YPQ2 chromosome 4 4 1181801 1182754 W 2011-02-03 1996-07-31 Putative vacuolar membrane transporter for cationic amino acids; likely contributes to amino acid homeostasis by exporting cationic amino acids from the vacuole; member of the PQ-loop family, with seven transmembrane domains; mutant phenotype is functionally complemented by rat PQLC2 vacuolar transporter +S000034941 CDS YDR352W 4 1181801 1182754 W 2011-02-03 1996-07-31 +S000002761 ORF Verified YDR353W TRR1 thioredoxin-disulfide reductase TRR1 chromosome 4 L000003953 4 1183299 1184258 W 2011-02-03 1996-07-31 Cytoplasmic thioredoxin reductase; key regulatory enzyme that determines the redox state of the thioredoxin system, which acts as a disulfide reductase system and protects cells against both oxidative and reductive stress; protein abundance increases in response to DNA replication stress; TRR1 has a paralog, TRR2, that arose from the whole genome duplication +S000035089 CDS YDR353W 4 1183299 1184258 W 2011-02-03 1996-07-31 +S000002762 ORF Verified YDR354W TRP4 anthranilate phosphoribosyltransferase chromosome 4 L000002355 4 1184747 1185889 W 209 2011-02-03 1996-07-31 Anthranilate phosphoribosyl transferase; transferase of the tryptophan biosynthetic pathway; catalyzes the phosphoribosylation of anthranilate; subject to the general control system of amino acid biosynthesis +S000035242 CDS YDR354W 4 1184747 1185889 W 2011-02-03 1996-07-31 +S000028613 ORF Dubious YDR354C-A chromosome 4 4 1185282 1185139 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps TRP4; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031447 CDS YDR354C-A 4 1185282 1185139 C 2011-02-03 2003-07-29 +S000002764 ORF Verified YDR356W SPC110 NUF1|XCM1 chromosome 4 L000001285 4 1186107 1188941 W 2011-02-03 1996-07-31 Inner plaque spindle pole body (SPB) component; ortholog of human kendrin; gamma-tubulin small complex (gamma-TuSC) receptor that interacts with Spc98p to recruit the complex to the nuclear side of the SPB, connecting nuclear microtubules to the SPB; promotes gamma-TuSC assembly and oligomerization to initiate microtubule nucleation; interacts with Tub4p-complex and calmodulin; phosphorylated by Mps1p in cell cycle-dependent manner +S000036297 CDS YDR356W 4 1186107 1188941 W 2011-02-03 1996-07-31 +S000002763 ORF Dubious YDR355C chromosome 4 4 1186369 1186067 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified essential ORF SPC110/YDR356W +S000035318 CDS YDR355C 4 1186369 1186067 C 2011-02-03 1996-07-31 +S000002765 ORF Verified YDR357C CNL1 BLC1 chromosome 4 4 1189567 1189199 C 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Msb3p; null mutant is sensitive to drug inducing secretion of vacuolar cargo; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000036341 CDS YDR357C 4 1189567 1189199 C 2011-02-03 1996-07-31 +S000002766 ORF Verified YDR358W GGA1 ubiquitin-binding protein chromosome 4 S000007493 4 1190059 1191732 W 2011-02-03 1996-07-31 Golgi-localized protein with homology to gamma-adaptin; interacts with and regulates Arf1p and Arf2p in a GTP-dependent manner in order to facilitate traffic through the late Golgi; GGA1 has a paralog, GGA2, that arose from the whole genome duplication +S000036474 CDS YDR358W 4 1190059 1191732 W 2011-02-03 1996-07-31 +S000002768 ORF Dubious YDR360W OPI7 chromosome 4 4 1194598 1195032 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene VID21/YDR359C +S000030092 CDS YDR360W 4 1194598 1195032 W 2011-02-03 1996-07-31|2011-02-03 +S000002767 ORF Verified YDR359C EAF1 VID21 chromosome 4 4 1194884 1191936 C 2011-02-03 2004-02-06|1996-07-31 Component of the NuA4 histone acetyltransferase complex; acts as a platform for assembly of NuA4 subunits into the native complex; required for initiation of pre-meiotic DNA replication, likely due to its requirement for expression of IME1 +S000037088 CDS YDR359C 4 1194884 1191936 C 2011-02-03 2004-02-06|1996-07-31 +S000002769 ORF Verified YDR361C BCP1 protein-transporting protein BCP1 chromosome 4 4 1196263 1195412 C 2011-02-03 1996-07-31 Essential protein involved in nuclear export of Mss4p; Mss4p is a lipid kinase that generates phosphatidylinositol 4,5-biphosphate and plays a role in actin cytoskeleton organization and vesicular transport +S000030230 CDS YDR361C 4 1196263 1195412 C 2011-02-03 1996-07-31 +S000002770 ORF Verified YDR362C TFC6 transcription factor TFIIIC subunit TFC6|tau 91 chromosome 4 L000004492 4 1198697 1196679 C 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of RNA polymerase III transcription initiation factor complex (TFIIIC); part of TFIIIC TauB domain that binds BoxB promoter sites of tRNA and other genes; cooperates with Tfc3p in DNA binding; human homolog is TFIIIC-110 +S000031159 CDS YDR362C 4 1198697 1196679 C 2011-02-03 1996-07-31 +S000077077 matrix_attachment_site ETC6 ETC6 chromosome 4 4 1198885 1198907 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; remains predominantly localized to the nuclear periphery throughout cell cycle; located between divergently transcribed genes TFC6 and ESC2 +S000002771 ORF Verified YDR363W ESC2 chromosome 4 L000004423 4 1199183 1200553 W 2011-02-03 1996-07-31 Sumo-like domain protein; prevents accumulation of toxic intermediates during replication-associated recombinational repair; roles in silencing, lifespan, chromatid cohesion and the intra-S-phase DNA damage checkpoint; RENi family member +S000031326 CDS YDR363W 4 1199183 1200553 W 2011-02-03 1996-07-31 +S000006616 tRNA_gene tK(CUU)D1 chromosome 4 L000003773 4 1201750 1201822 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000035877 noncoding_exon tK(CUU)D1 4 1201750 1201822 W 2011-02-03 2000-05-19 +S000007235 ORF Verified YDR363W-A SEM1 proteasome regulatory particle lid subunit SEM1|HOD1|DSS1 chromosome 4 L000003539|L000004647 4 1202128 1202397 W 2011-02-03 1999-07-17 19S proteasome regulatory particle lid subcomplex component; role in Ub-dependent proteolysis and proteasome stability; involved in TREX-2 mediated mRNA export, and in the prevention of transcription-associated genome instability; ubiquitinated by Nedd4-like E3-ligase, Rsp5p; human ortholog DSS1, a BRCA1 binding protein implicated in cancer, complements the yeast null; drives trinucleotide repeat expansion; protein abundance increases in response to DNA replication stress +S000037294 CDS YDR363W-A 4 1202128 1202397 W 2011-02-03 1999-07-17 +S000002772 ORF Verified YDR364C CDC40 SLU4|SLT15|PRP17 chromosome 4 L000000275|L000001921 4 1204210 1202843 C 211 2011-02-03 1996-07-31 Pre-mRNA splicing factor; important for catalytic step II of pre-mRNA splicing and plays a role in cell cycle progression, particularly at the G1/S phase transition; required for DNA synthesis during mitosis and meiosis; has WD repeats; thermosensitivity of the cdc40 null mutant is functionally complemented by a chimeric construct containing the N-terminal 156 amino acids of yeast Cdc40p fused to the C-terminal two thirds (297 amino acids) of human CDC40 +S000031393 CDS YDR364C 4 1204210 1202843 C 2011-02-03 1996-07-31 +S000002773 ORF Verified YDR365C ESF1 chromosome 4 4 1206383 1204497 C 2011-02-03 1996-07-31 Nucleolar protein involved in pre-rRNA processing; depletion causes severely decreased 18S rRNA levels +S000032429 CDS YDR365C 4 1206383 1204497 C 2011-02-03 1996-07-31 +S000006875 long_terminal_repeat YDRWdelta27 chromosome 4 4 1206704 1207037 W 2011-02-03 2000-05-19 Ty1 LTR +S000006883 LTR_retrotransposon YDRWTy1-5 Ty1 chromosome 4 4 1206704 1212621 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007400 transposable_element_gene YDR365W-A gag protein chromosome 4 4 1206997 1208319 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000032504 CDS YDR365W-A 4 1206997 1208319 W 2011-02-03 1999-07-17 +S000007401 transposable_element_gene YDR365W-B gag-pol fusion protein chromosome 4 S000029012 4 1206997 1212265 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032510 CDS YDR365W-B 4 1206997 1208301 W 2011-02-03 1999-07-17 +S000032511 CDS YDR365W-B 4 1208303 1212265 W 2011-02-03 1999-07-17 +S000032512 plus_1_translational_frameshift YDR365W-B 4 1208302 1208302 W 2011-02-03 1999-07-17 +S000006876 long_terminal_repeat YDRWdelta28 chromosome 4 4 1212288 1212621 W 2011-02-03 2000-05-19 Ty1 LTR +S000002774 ORF Uncharacterized YDR366C chromosome 4 4 1212836 1212438 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000032506 CDS YDR366C 4 1212836 1212438 C 2011-02-03 1996-07-31 +S000002775 ORF Verified YDR367W KEI1 chromosome 4 4 1212848 1213614 W 2011-02-03 1996-07-31 Component of inositol phosphorylceramide (IPC) synthase; forms a complex with Aur1p and regulates its activity; required for IPC synthase complex localization to the Golgi; post-translationally processed by Kex2p; KEI1 is an essential gene +S000032662 CDS YDR367W 4 1212848 1212877 W 2011-02-03 1996-07-31 +S000032663 CDS YDR367W 4 1212979 1213614 W 2011-02-03 1996-07-31 +S000032664 intron YDR367W 4 1212878 1212978 W 2011-02-03 1996-07-31 +S000002776 ORF Verified YDR368W YPR1 trifunctional aldehyde reductase/carbonyl reductase (NADPH)/glucose 1-dehydrogenase (NADP(+)) YPR1 chromosome 4 L000003084 4 1213904 1214842 W 2011-02-03 1996-07-31 NADPH-dependent aldo-keto reductase; reduces multiple substrates including 2-methylbutyraldehyde and D,L-glyceraldehyde, expression is induced by osmotic and oxidative stress; functionally redundant with other aldo-keto reductases; protein abundance increases in response to DNA replication stress; YPR1 has a paralog, GCY1, that arose from the whole genome duplication; human homolog AKR1B1 can complement yeast null mutant +S000033354 CDS YDR368W 4 1213904 1214842 W 2011-02-03 1996-07-31 +S000002777 ORF Verified YDR369C XRS2 chromosome 4 L000002489 4 1217580 1215016 C 211 2011-02-03 1996-07-31 Protein required for DNA repair; component of the Mre11 complex, which is involved in double strand breaks, meiotic recombination, telomere maintenance, and checkpoint signaling +S000033386 CDS YDR369C 4 1217580 1215016 C 2011-02-03 1996-07-31 +S000002778 ORF Verified YDR370C DXO1 chromosome 4 4 1219110 1217782 C 2011-02-03 1996-07-31 mRNA 5'-end-capping quality-control protein; has distributive, 5'-3' exoRNase activity; similar to Rai1p; +S000034314 CDS YDR370C 4 1219110 1217782 C 2011-02-03 1996-07-31 +S000002779 ORF Uncharacterized YDR371W CTS2 putative chitinase chromosome 4 4 1219413 1220948 W 2011-02-03 1996-07-31 Putative chitinase; functionally complements A. gossypii cts2 mutant sporulation defect +S000034441 CDS YDR371W 4 1219413 1220948 W 2011-02-03 1996-07-31 +S000028822 ORF Dubious YDR371C-A chromosome 4 4 1219613 1219509 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene CTS2/YDR371W; identified by expression profiling and mass spectrometry +S000033641 CDS YDR371C-A 4 1219613 1219509 C 2011-02-03 2003-07-29 +S000002780 ORF Verified YDR372C VPS74 MNN3|API1 chromosome 4 4 1222149 1221112 C 2011-02-03 1996-07-31 Golgi phosphatidylinositol-4-kinase effector and PtdIns4P sensor; interacts with the cytosolic domains of cis and medial glycosyltransferases, and in the PtdIns4P-bound state mediates the targeting of these enzymes to the Golgi; interacts with the catalytic domain of Sac1p, the major cellular PtdIns4P phosphatase, to direct dephosphosphorylation of the Golgi pool of PtdIns4P; tetramerization required for function; ortholog of human GOLPH3/GPP34/GMx33 +S000034509 CDS YDR372C 4 1222149 1221112 C 2011-02-03 1996-07-31 +S000002781 ORF Verified YDR373W FRQ1 frequenin chromosome 4 4 1222759 1223331 W 2011-02-03 1996-07-31 N-myristoylated calcium-binding protein; may have a role in intracellular signaling through its regulation of the phosphatidylinositol 4-kinase Pik1p; member of the recoverin/frequenin branch of the EF-hand superfamily; human NCS1 functionally complements the heat sensitivity of a frq1 ts mutant +S000035570 CDS YDR373W 4 1222759 1223331 W 2011-02-03 1996-07-31 +S000002782 ORF Verified YDR374C PHO92 mRNA-binding phosphate metabolism regulator chromosome 4 4 1224394 1223474 C 2011-02-03 1996-07-31 Posttranscriptional regulator of phosphate metabolism; facilitates PHO4 mRNA degradation by interacting with Pop2p; regulates PHO4 mRNA stability by binding to PHO4's 3'UTR in a phosphate-dependent manner; contains highly conserved YTH (YT521-B Homology) domain that exhibits RNA-binding activity; human homolog YTHDF2 can complement yeast null mutant +S000035608 CDS YDR374C 4 1224394 1223474 C 2011-02-03 1996-07-31 +S000113553 ORF Verified YDR374W-A WIP1 chromosome 4 4 1224757 1225026 W 2011-02-03 2005-11-16 Kinetochore localized protein of unknown function; interacts with Cnn1p (CENP-T); orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-W and fission yeast new1 +S000113554 CDS YDR374W-A 4 1224757 1225026 W 2011-02-03 2005-11-16 +S000002783 ORF Verified YDR375C BCS1 bifunctional AAA family ATPase chaperone/translocase BCS1 chromosome 4 L000000164 4 1226536 1225166 C 2011-02-03 1996-07-31 Protein translocase and chaperone required for Complex III assembly; member of the AAA ATPase family; forms a homo-oligomeric complex in the mitochondrial inner membrane that translocates the C-terminal domain of Rip1p from the matrix across the inner membrane and delivers it to an assembly intermediate of respiratory Complex III; also required for assembly of the Qcr10p subunit; mutation is functionally complemented by human homolog BCS1L, linked to neonatal diseases +S000035698 CDS YDR375C 4 1226536 1225166 C 2011-02-03 1996-07-31 +S000002784 ORF Verified YDR376W ARH1 NADPH-adrenodoxin reductase chromosome 4 L000002799 4 1226822 1228303 W 2011-02-03 1996-07-31 Oxidoreductase of the mitochondrial inner membrane; involved in cytoplasmic and mitochondrial iron homeostasis and required for activity of Fe-S cluster-containing enzymes; one of the few mitochondrial proteins essential for viability +S000036678 CDS YDR376W 4 1226822 1228303 W 2011-02-03 1996-07-31 +S000002785 ORF Verified YDR377W ATP17 F1F0 ATP synthase subunit f chromosome 4 L000003415 4 1228611 1228916 W 2011-02-03 1996-07-31 Subunit f of the F0 sector of mitochondrial F1F0 ATP synthase; F1F0 ATP synthase is a large, evolutionarily conserved enzyme complex required for ATP synthesis +S000036737 CDS YDR377W 4 1228611 1228916 W 2011-02-03 1996-07-31 +S000002786 ORF Verified YDR378C LSM6 U4/U6-U5 snRNP complex subunit LSM6 chromosome 4 L000004685 4 1229609 1229349 C 2011-02-03 1996-07-31|2005-11-22 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA +S000036760 CDS YDR378C 4 1229609 1229349 C 2011-02-03 1996-07-31|2005-11-22 +S000002787 ORF Verified YDR379W RGA2 chromosome 4 L000004022 4 1230167 1233196 W 2011-02-03 1996-07-31 GTPase-activating protein for polarity-establishment protein Cdc42p; implicated in control of septin organization, pheromone response, and haploid invasive growth; regulated by Pho85p and Cdc28p; RGA2 has a paralog, RGA1, that arose from the whole genome duplication +S000036849 CDS YDR379W 4 1230167 1233196 W 2011-02-03 1996-07-31 +S000007605 ORF Verified YDR379C-A SDH6 chromosome 4 4 1233517 1233278 C 2011-02-03 2001-02-26 Mitochondrial protein involved in assembly of succinate dehydrogenase; has a role in maturation of the Sdh2p subunit; member of the LYR protein family; mutations in human ortholog SDHAF1 are associated with infantile leukoencephalopathy +S000037182 CDS YDR379C-A 4 1233517 1233278 C 2011-02-03 2001-02-26 +S000002788 ORF Verified YDR380W ARO10 phenylpyruvate decarboxylase ARO10 chromosome 4 4 1234218 1236125 W 2011-02-03 1996-07-31 Phenylpyruvate decarboxylase; catalyzes decarboxylation of phenylpyruvate to phenylacetaldehyde, which is the first specific step in the Ehrlich pathway; involved in protein N-terminal Met and Ala catabolism +S000037478 CDS YDR380W 4 1234218 1236125 W 2011-02-03 1996-07-31 +S000002789 ORF Verified YDR381W YRA1 RNA-binding protein YRA1|SHE11 chromosome 4 L000002959|L000002873 4 1236558 1238004 W 2011-02-03 1999-07-17|1996-07-31 Nuclear polyadenylated RNA-binding protein; required for export of poly(A)+ mRNA from the nucleus; proposed to couple mRNA export with 3' end processing via its interactions with Mex67p and Pcf11p; interacts with DBP2; inhibits the helicase activity of Dbp2; functionally redundant with Yra2p, another REF family member +S000037615 CDS YDR381W 4 1236558 1236842 W 2011-02-03 1999-07-17|1996-07-31 +S000037616 CDS YDR381W 4 1237609 1238004 W 2011-02-03 1999-07-17 +S000037617 intron YDR381W 4 1236843 1237608 W 2011-02-03 1999-07-17 +S000007650 ORF Verified YDR381C-A chromosome 4 4 1238850 1238312 C 2011-02-03 2004-01-26|2001-03-30 Protein of unknown function; localized to the mitochondrial outer membrane +S000037338 CDS YDR381C-A 4 1238630 1238312 C 2011-02-03 2004-01-26|2001-03-30 +S000037337 CDS YDR381C-A 4 1238850 1238825 C 2011-02-03 2004-01-26|2001-03-30 +S000037339 intron YDR381C-A 4 1238824 1238631 C 2011-02-03 2004-01-26|2001-03-30 +S000002790 ORF Verified YDR382W RPP2B ribosomal protein P2B|YP2beta|P2B|L45|YPA1|RPL45 chromosome 4 L000001736 4 1239492 1239824 W 2011-02-03 1996-07-31 Ribosomal protein P2 beta; a component of the ribosomal stalk, which is involved in the interaction between translational elongation factors and the ribosome; free (non-ribosomal) P2 stimulates the phosphorylation of the eIF2 alpha subunit (Sui2p) by Gcn2p; regulates the accumulation of P1 (Rpp1Ap and Rpp1Bp) in the cytoplasm +S000030372 CDS YDR382W 4 1239492 1239824 W 2011-02-03 1996-07-31 +S000002791 ORF Verified YDR383C NKP1 chromosome 4 4 1240676 1239960 C 2011-02-03 2003-09-22|1996-07-31 Central kinetochore protein and subunit of the Ctf19 complex; mutants have elevated rates of chromosome loss; orthologous to fission yeast kinetochore protein fta4 +S000030450 CDS YDR383C 4 1240676 1239960 C 2011-02-03 2003-09-22|1996-07-31 +S000118445 ARS ARS433 ARSIV-1241 chromosome 4 4 1240882 1241110 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178079 ARS_consensus_sequence ARS433 4 1240919 1240935 W 2014-11-18 2014-11-18 +S000002792 ORF Verified YDR384C ATO3 putative ammonium permease ATO3 chromosome 4 4 1242031 1241204 C 2011-02-03 1996-07-31 Plasma membrane protein, putative ammonium transporter; regulation pattern suggests a possible role in export of ammonia from the cell; phosphorylated in mitochondria; member of the TC 9.B.33 YaaH family of putative transporters +S000030592 CDS YDR384C 4 1242031 1241204 C 2011-02-03 1996-07-31 +S000002793 ORF Verified YDR385W EFT2 elongation factor 2 chromosome 4 L000000544 4 1243230 1245758 W 2011-02-03 1996-07-31 Elongation factor 2 (EF-2), also encoded by EFT1; catalyzes ribosomal translocation during protein synthesis; contains diphthamide, the unique posttranslationally modified histidine residue specifically ADP-ribosylated by diphtheria toxin; EFT2 has a paralog, EFT1, that arose from the whole genome duplication +S000030719 CDS YDR385W 4 1243230 1245758 W 2011-02-03 1996-07-31 +S000002794 ORF Verified YDR386W MUS81 SLX3 chromosome 4 L000004650 4 1246084 1247982 W 2011-02-03 1996-07-31 Subunit of structure-specific Mms4p-Mus81p endonuclease; cleaves branched DNA; involved in DNA repair, replication fork stability, and joint molecule formation/resolution during meiotic recombination; promotes template switching during break-induced replication (BIR), causing non-reciprocal translocations (NRTs); helix-hairpin-helix protein; phosphorylation of non-catalytic subunit Mms4p by Cdc28p and Cdcp during mitotic cell cycle activates function of Mms4p-Mus81p +S000031582 CDS YDR386W 4 1246084 1247982 W 2011-02-03 1996-07-31 +S000002795 ORF Uncharacterized YDR387C CIN10 chromosome 4 4 1249821 1248154 C 2011-02-03 1996-07-31 Putative transporter; member of the sugar porter family; non-essential gene; overexpression results in elevated colony sectoring, an indicator of chromosomal instability +S000031627 CDS YDR387C 4 1249821 1248154 C 2011-02-03 1996-07-31 +S000002796 ORF Verified YDR388W RVS167 amphiphysin chromosome 4 L000001789 4 1250186 1251634 W 2011-02-03 1996-07-31 Calmodulin-binding actin-associated protein; roles in endocytic membrane tabulation and constriction, and exocytosis; N-BAR domain protein that interacts with Rvs161p to regulate actin cytoskeleton, endocytosis, and viability following starvation or osmotic stress; recruited to bud tips by Gyl1p and Gyp5p during polarized growth; homolog of mammalian amphiphysin +S000031800 CDS YDR388W 4 1250186 1251634 W 2011-02-03 1996-07-31 +S000002797 ORF Verified YDR389W SAC7 chromosome 4 L000001794 4 1252537 1254501 W 220 2011-02-03 1996-07-31 GTPase activating protein (GAP) for Rho1p; regulator of a Tor2p-mediated, Rho1p GTPase switch that controls organization of the actin cytoskeleton; negative regulator of the RHO1-PKC1-MAPK cell integrity (CWI) and membrane fluidity homeostasis signaling pathways; potential Cdc28p substrate; SAC7 has a paralog, BAG7, that arose from the whole genome duplication +S000031909 CDS YDR389W 4 1252537 1254501 W 2011-02-03 1996-07-31 +S000002798 ORF Verified YDR390C UBA2 E1 ubiquitin-activating protein UBA2|UAL1 chromosome 4 L000002404 4 1256847 1254937 C 2011-02-03 1996-07-31 Subunit of heterodimeric nuclear SUMO activating enzyme E1 with Aos1p; activates Smt3p (SUMO) before its conjugation to proteins (sumoylation), which may play a role in protein targeting; essential for viability +S000032721 CDS YDR390C 4 1256847 1254937 C 2011-02-03 1996-07-31 +S000006572 tRNA_gene tG(CCC)D SUF3 chromosome 4 L000002151|L000003777 4 1257079 1257008 C 232 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000032332 noncoding_exon tG(CCC)D 4 1257079 1257008 C 2011-02-03 2000-05-19 +S000002799 ORF Uncharacterized YDR391C chromosome 4 4 1258056 1257358 C 2011-02-03 1996-07-31 Putative protein of unknown function; possibly involved in zinc homeostasis; Bdf1p-dependent transcription induced by salt stress; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000032830 CDS YDR391C 4 1258056 1257358 C 2011-02-03 1996-07-31 +S000002800 ORF Verified YDR392W SPT3 transcriptional regulator SPT3 chromosome 4 L000002029 4 1258696 1259709 W 2011-02-03 1996-07-31 Subunit of the SAGA and SAGA-like transcriptional regulatory complexes; interacts with Spt15p to activate transcription of some RNA polymerase II-dependent genes, also functions to inhibit transcription at some promoters; relocalizes to the cytosol in response to hypoxia +S000033594 CDS YDR392W 4 1258696 1259709 W 2011-02-03 1996-07-31 +S000002801 ORF Verified YDR393W SHE9 MDM33 chromosome 4 L000002871 4 1259901 1261271 W 2011-02-03 1996-07-31 Protein required for normal mitochondrial morphology; mitochondrial inner membrane protein; may be involved in fission of the inner membrane; forms a homo-oligomeric complex +S000033681 CDS YDR393W 4 1259901 1261271 W 2011-02-03 1996-07-31 +S000002802 ORF Verified YDR394W RPT3 proteasome regulatory particle base subunit RPT3|YTA2|YNT1 chromosome 4 L000002556|L000002537 4 1261681 1262967 W 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; substrate of N-acetyltransferase B +S000033819 CDS YDR394W 4 1261681 1262967 W 2011-02-03 1996-07-31 +S000002803 ORF Verified YDR395W SXM1 KAP108 chromosome 4 L000003508 4 1263324 1266158 W 2011-02-03 1996-07-31 Nuclear transport factor (karyopherin); involved in protein transport between the cytoplasm and nucleoplasm; similar to Nmd5p, Cse1p, Lph2p, and the human cellular apoptosis susceptibility protein, CAS1 +S000034692 CDS YDR395W 4 1263324 1266158 W 2011-02-03 1996-07-31 +S000002804 ORF Dubious YDR396W chromosome 4 4 1266295 1266795 W 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; extensively overlaps essential NCB2 gene encoding the beta subunit of the NC2 dimeric histone-fold complex +S000034845 CDS YDR396W 4 1266295 1266795 W 2011-02-03 1996-07-31 +S000002805 ORF Verified YDR397C NCB2 negative cofactor 2 transcription regulator complex subunit NCB2|YDR1 chromosome 4 L000003241 4 1266898 1266366 C 2011-02-03 1996-07-31 Subunit of a heterodimeric NC2 transcription regulator complex; complex binds to TBP and can repress transcription by preventing preinitiation complex assembly or stimulate activated transcription; homologous to human NC2beta; complex also includes Bur6p +S000034923 CDS YDR397C 4 1266769 1266366 C 2011-02-03 1996-07-31 +S000034922 CDS YDR397C 4 1266898 1266862 C 2011-02-03 1996-07-31 +S000034924 intron YDR397C 4 1266861 1266770 C 2011-02-03 1996-07-31 +S000002806 ORF Verified YDR398W UTP5 chromosome 4 4 1267471 1269402 W 2011-02-03 1996-07-31 Subunit of U3-containing Small Subunit (SSU) processome complex; involved in production of 18S rRNA and assembly of small ribosomal subunit +S000035902 CDS YDR398W 4 1267471 1269402 W 2011-02-03 1996-07-31 +S000002807 ORF Verified YDR399W HPT1 hypoxanthine phosphoribosyltransferase|HGPRTase|HPRT|BRA6 chromosome 4 L000004313 4 1270068 1270733 W 2011-02-03 1996-07-31 Dimeric hypoxanthine-guanine phosphoribosyltransferase; catalyzes the transfer of the phosphoribosyl portion of 5-phosphoribosyl-alpha-1-pyrophosphate to a purine base (either guanine or hypoxanthine) to form pyrophosphate and a purine nucleotide (either guanosine monophosphate or inosine monophosphate); mutations in the human homolog HPRT1 can cause Lesch-Nyhan syndrome and Kelley-Seegmiller syndrome +S000036067 CDS YDR399W 4 1270068 1270733 W 2011-02-03 1996-07-31 +S000002808 ORF Verified YDR400W URH1 trifunctional uridine nucleosidase/nicotinamide riboside hydrolase/nicotinic acid riboside hydrolase chromosome 4 S000007492 4 1271063 1272085 W 2011-02-03 2003-09-22|1996-07-31 Uridine nucleosidase (uridine-cytidine N-ribohydrolase); cleaves N-glycosidic bonds in nucleosides; involved in the pyrimidine salvage and nicotinamide riboside salvage pathways +S000033224 CDS YDR400W 4 1271063 1272085 W 2011-02-03 2003-09-22|1996-07-31 +S000002809 ORF Dubious YDR401W chromosome 4 4 1272223 1272786 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033274 CDS YDR401W 4 1272223 1272786 W 2011-02-03 1996-07-31 +S000002810 ORF Verified YDR402C DIT2 putative cytochrome P450|CYP56 chromosome 4 L000000507 4 1273703 1272234 C 2011-02-03 1996-07-31 N-formyltyrosine oxidase; sporulation-specific microsomal enzyme involved in the production of N,N-bisformyl dityrosine required for spore wall maturation, homologous to cytochrome P-450s; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000033300 CDS YDR402C 4 1273703 1272234 C 2011-02-03 1996-07-31 +S000002811 ORF Verified YDR403W DIT1 chromosome 4 L000000506 4 1274602 1276212 W 2011-02-03 1996-07-31 Sporulation-specific enzyme required for spore wall maturation; involved in the production of a soluble LL-dityrosine-containing precursor of the spore wall; transcripts accumulate at the time of prospore enclosure +S000034267 CDS YDR403W 4 1274602 1276212 W 2011-02-03 1996-07-31 +S000118446 ARS ARS434 ARSIV-1276 chromosome 4 4 1276225 1276452 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000002812 ORF Verified YDR404C RPB7 DNA-directed RNA polymerase II subunit RPB7|B16 chromosome 4 L000001681 4 1277169 1276654 C 2011-02-03 1996-07-31 RNA polymerase II subunit B16; forms dissociable heterodimer with Rpb4p; Rpb4/7 dissociates from RNAPII as Ser2 CTD phosphorylation increases; Rpb4/7 regulates cellular lifespan via mRNA decay process; involved in recruitment of 3'-end processing factors to transcribing RNA polymerase II complex, export of mRNA to cytoplasm under stress conditions; also involved in translation initiation +S000034321 CDS YDR404C 4 1277169 1276654 C 2011-02-03 1996-07-31 +S000002813 ORF Verified YDR405W MRP20 mitochondrial 54S ribosomal protein YmL41|YmL41|MRPL41 chromosome 4 L000001158 4 1277646 1278437 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000035411 CDS YDR405W 4 1277646 1278437 W 2011-02-03 1996-07-31 +S000002814 ORF Verified YDR406W PDR15 ATP-binding cassette multidrug transporter PDR15 chromosome 4 L000002909 4 1279210 1283799 W 2011-02-03 1996-07-31 Plasma membrane ATP binding cassette (ABC) transporter; multidrug transporter and general stress response factor implicated in cellular detoxification; regulated by Pdr1p, Pdr3p and Pdr8p; promoter contains a PDR responsive element; PDR15 has a paralog, PDR5, that arose from the whole genome duplication +S000035511 CDS YDR406W 4 1279210 1283799 W 2011-02-03 1996-07-31 +S000028543 ORF Dubious YDR406W-A YDR406C-A chromosome 4 4 1283799 1284044 W 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR +S000031193 CDS YDR406W-A 4 1283799 1284044 W 2011-02-03 2003-07-29 +S000002815 ORF Verified YDR407C TRS120 chromosome 4 S000007435 4 1287938 1284069 C 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic +S000035551 CDS YDR407C 4 1287938 1284069 C 2011-02-03 1996-07-31 +S000002816 ORF Verified YDR408C ADE8 phosphoribosylglycinamide formyltransferase chromosome 4 L000000037 4 1288859 1288215 C 256 2011-02-03 1996-07-31 Phosphoribosyl-glycinamide transformylase; catalyzes a step in the 'de novo' purine nucleotide biosynthetic pathway +S000035623 CDS YDR408C 4 1288859 1288215 C 2011-02-03 1996-07-31 +S000077072 matrix_attachment_site ETC1 ETC1 chromosome 4 4 1289041 1289063 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; located between divergently transcribed genes ADE8 and SIZ1 +S000002817 ORF Verified YDR409W SIZ1 SUMO ligase SIZ1|ULL1 chromosome 4 S000007589 4 1289406 1292120 W 2011-02-03 1996-07-31 SUMO E3 ligase; promotes attachment of small ubiquitin-related modifier sumo (Smt3p) to primarily cytoplasmic proteins; regulates Rsp5p ubiquitin ligase activity and is in turn itself regulated by Rsp5p; required for sumoylation of septins and histone H3 variant Cse4p, a prerequisite for STUbL-mediated Ub-dependent degradation; localizes to the septin ring; acts as an adapter between E2, Ubc9p and substrates; tends to compensate for survival of DNA damage in absence of Nfi1p +S000036616 CDS YDR409W 4 1289406 1292120 W 2011-02-03 1996-07-31 +S000002818 ORF Verified YDR410C STE14 protein-S-isoprenylcysteine carboxyl O-methyltransferase chromosome 4 L000002121 4 1293091 1292372 C 259.47 2011-02-03 1996-07-31 Farnesyl cysteine-carboxyl methyltransferase; mediates the carboxyl methylation step during C-terminal CAAX motif processing of a-factor and RAS proteins in the endoplasmic reticulum, localizes to the ER membrane +S000037364 CDS YDR410C 4 1293091 1292372 C 2011-02-03 1996-07-31 +S000002819 ORF Verified YDR411C DFM1 chromosome 4 4 1294394 1293369 C 2011-02-03 1996-07-31 Endoplasmic reticulum (ER) localized protein; involved in ER-associated protein degradation (ERAD), ER stress, and homeostasis; interacts with components of ERAD-L and ERAD-C and Cdc48p; derlin-like family member similar to Der1p +S000037501 CDS YDR411C 4 1294394 1293369 C 2011-02-03 1996-07-31 +S000002820 ORF Verified YDR412W RRP17 chromosome 4 4 1294693 1295400 W 2011-02-03 1996-07-31 Component of the pre-60S pre-ribosomal particle; required for cell viability under standard (aerobic) conditions but not under anaerobic conditions; exonuclease required for 5' end processing of pre-60S ribosomal RNA +S000030317 CDS YDR412W 4 1294693 1295400 W 2011-02-03 1996-07-31 +S000002821 ORF Dubious YDR413C chromosome 4 4 1295411 1294836 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the essential uncharacterized ORF YDR412W that is implicated in rRNA processing +S000030389 CDS YDR413C 4 1295411 1294836 C 2011-02-03 1996-07-31 +S000002822 ORF Verified YDR414C ERD1 LDB2 chromosome 4 L000000566|L000004741 4 1296686 1295598 C 2011-02-03 1996-07-31|2011-02-03 Predicted membrane protein required for lumenal ER protein retention; mutants secrete the endogenous ER protein, BiP (Kar2p) +S000030512 CDS YDR414C 4 1296686 1295598 C 2011-02-03 1996-07-31|2011-02-03 +S000002823 ORF Uncharacterized YDR415C putative aminopeptidase chromosome 4 4 1298161 1297037 C 2011-02-03 1996-07-31 Putative aminopeptidase; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to the vacuole +S000031437 CDS YDR415C 4 1298161 1297037 C 2011-02-03 1996-07-31 +S000002824 ORF Verified YDR416W SYF1 mRNA splicing protein SYF1|NTC90 chromosome 4 L000004195 4 1298432 1301011 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); that contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; null mutant has splicing defect and arrests in G2/M; relocalizes to the cytosol in response to hypoxia; homologs in human and C. elegans +S000031649 CDS YDR416W 4 1298432 1301011 W 2011-02-03 1996-07-31 +S000002826 ORF Verified YDR418W RPL12B uL11|ribosomal 60S subunit protein L12B|L11|YL23|L15B|L12B chromosome 4 L000001711 4 1301616 1302113 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L12B; rpl12a rpl12b double mutant exhibits slow growth and slow translation; homologous to mammalian ribosomal protein L12 and bacterial L11; RPL12B has a paralog, RPL12A, that arose from the whole genome duplication +S000032701 CDS YDR418W 4 1301616 1302113 W 2011-02-03 1996-07-31 +S000002825 ORF Dubious YDR417C chromosome 4 4 1301926 1301555 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF RPL12B/YDR418W +S000031695 CDS YDR417C 4 1301926 1301555 C 2011-02-03 1996-07-31 +S000118447 ARS ARS435 ARSIV-1303 chromosome 4 4 1302689 1302768 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000002827 ORF Verified YDR419W RAD30 DNA-directed DNA polymerase eta|DBH1 chromosome 4 L000003523 4 1303174 1305072 W 2011-02-03 1996-07-31 DNA polymerase eta; involved in translesion synthesis during post-replication repair; catalyzes the synthesis of DNA opposite cyclobutane pyrimidine dimers and other lesions; involved in formation of post-replicative damage-induced genome-wide cohesion; may also have a role in protection against mitochondrial mutagenesis; mutations in human pol eta are responsible for XPV +S000032806 CDS YDR419W 4 1303174 1305072 W 2011-02-03 1996-07-31 +S000006723 tRNA_gene tS(AGA)D3 chromosome 4 L000003782 4 1305630 1305712 W 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000031657 noncoding_exon tS(AGA)D3 4 1305630 1305712 W 2011-02-03 2000-05-19 +S000130176 ARS ARS436 chromosome 4 4 1305757 1306312 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000002828 ORF Verified YDR420W HKR1 chromosome 4 L000000788 4 1306267 1311675 W 2011-02-03 1996-07-31 Mucin family member that functions as an osmosensor in the HOG pathway; large, highly glycosylated protein that functions redundantly with Msb2p in Sho1p-mediated osmostresss induction of the HOG signaling pathway; cytoplasmic domain interacts with Ahk1p a scaffold protein that prevents cross talk with the Kss1p MAPK of the filamentous growth pathway; mutant displays defects in beta-1,3 glucan synthesis and bud site selection +S000032953 CDS YDR420W 4 1306267 1311675 W 2011-02-03 1996-07-31 +S000002829 ORF Verified YDR421W ARO80 chromosome 4 4 1312040 1314892 W 2011-02-03 1996-07-31 Zinc finger transcriptional activator of the Zn2Cys6 family; activates transcription of aromatic amino acid catabolic genes in the presence of aromatic amino acids +S000033023 CDS YDR421W 4 1312040 1314892 W 2011-02-03 1996-07-31 +S000002830 ORF Verified YDR422C SIP1 chromosome 4 L000001890 4 1317773 1315326 C 2011-02-03 1996-07-31|2006-04-12 Alternate beta-subunit of the Snf1p kinase complex; may confer substrate specificity; vacuolar protein containing KIS (Kinase-Interacting Sequence) and ASC (Association with Snf1 kinase Complex) domains involved in protein interactions +S000033079 CDS YDR422C 4 1317773 1315326 C 2011-02-03 1996-07-31|2006-04-12 +S000002831 ORF Verified YDR423C CAD1 YAP2 chromosome 4 L000000206 4 1319275 1318046 C 271 2011-02-03 1996-07-31 AP-1-like basic leucine zipper (bZIP) transcriptional activator; involved in stress responses, iron metabolism, and pleiotropic drug resistance; controls a set of genes involved in stabilizing proteins; binds consensus sequence TTACTAA; CAD1 has a paralog, YAP1, that arose from the whole genome duplication +S000033829 CDS YDR423C 4 1319275 1318046 C 2011-02-03 1996-07-31 +S000002832 ORF Verified YDR424C DYN2 dynein light chain|SLC1 chromosome 4 L000003064 4 1319841 1319387 C 2011-02-03 1996-07-31 Cytoplasmic light chain dynein, microtubule motor protein; required for intracellular transport and cell division; involved in mitotic spindle positioning; forms complex with dynein intermediate chain Pac11p that promotes Dyn1p homodimerization, potentiates motor processivity; Dyn2p-Pac11p complex important for interaction of dynein motor complex with dynactin complex; acts as molecular glue to dimerize, stabilize Nup82-Nsp1-Nup159 complex module of cytoplasmic pore filaments +S000033950 CDS YDR424C 4 1319617 1319387 C 2011-02-03 1996-07-31 +S000033949 CDS YDR424C 4 1319720 1319698 C 2011-02-03 1996-07-31 +S000033948 CDS YDR424C 4 1319841 1319817 C 2011-02-03 1996-07-31 +S000033952 intron YDR424C 4 1319697 1319618 C 2011-02-03 1996-07-31 +S000033951 intron YDR424C 4 1319816 1319721 C 2011-02-03 1996-07-31 +S000002833 ORF Verified YDR425W SNX41 chromosome 4 4 1320064 1321941 W 2011-02-03 1996-07-31 Sorting nexin; involved in the retrieval of late-Golgi SNAREs from the post-Golgi endosome to the trans-Golgi network; interacts with Snx4p +S000034950 CDS YDR425W 4 1320064 1321941 W 2011-02-03 1996-07-31 +S000002834 ORF Dubious YDR426C chromosome 4 4 1322006 1321629 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SNX41 +S000035012 CDS YDR426C 4 1322006 1321629 C 2011-02-03 1996-07-31 +S000002835 ORF Verified YDR427W RPN9 proteasome regulatory particle lid subunit RPN9|NAS7 chromosome 4 L000004309 4 1322205 1323386 W 2011-02-03 1996-07-31 Non-ATPase regulatory subunit of the 26S proteasome; similar to putative proteasomal subunits in other species; null mutant is temperature sensitive and exhibits cell cycle and proteasome assembly defects; protein abundance increases in response to DNA replication stress; relocalizes to the cytosol in response to hypoxia +S000035280 CDS YDR427W 4 1322205 1323386 W 2011-02-03 1996-07-31 +S000002836 ORF Verified YDR428C BNA7 arylformamidase chromosome 4 4 1324239 1323454 C 2011-02-03 1996-07-31 Formylkynurenine formamidase; involved in the de novo biosynthesis of NAD from tryptophan via kynurenine +S000035320 CDS YDR428C 4 1324239 1323454 C 2011-02-03 1996-07-31 +S000002837 ORF Verified YDR429C TIF35 translation initiation factor eIF3 core subunit g chromosome 4 L000004253 4 1325301 1324477 C 2011-02-03 1996-07-31 eIF3g subunit of the eukaryotic translation initiation factor 3 (eIF3); subunit of the core complex of eIF3; is essential for translation; stimulates resumption of ribosomal scanning during translation reinitiation; eIF3 is also involved in programmed stop codon readthrough +S000036266 CDS YDR429C 4 1325301 1324477 C 2011-02-03 1996-07-31 +S000002839 ORF Dubious YDR431W chromosome 4 4 1328390 1328701 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029889 CDS YDR431W 4 1328390 1328701 W 2011-02-03 1996-07-31 +S000002838 ORF Verified YDR430C CYM1 MOP112 chromosome 4 4 1328470 1325501 C 2011-02-03 1996-07-31 Lysine-specific metalloprotease of the pitrilysin family; metalloprotease of the intermembrane space; degrades proteins and presequence peptides cleaved from imported proteins; required for normal mitochondrial morphology +S000037179 CDS YDR430C 4 1328470 1325501 C 2011-02-03 1996-07-31 +S000002840 ORF Verified YDR432W NPL3 mRNA-binding protein NPL3|NAB1|NOP3|MTS1|MTR13 chromosome 4 L000001270 4 1328783 1330027 W 2011-02-03 1996-07-31 RNA-binding protein; promotes elongation, regulates termination, and carries poly(A) mRNA from nucleus to cytoplasm; represses translation initiation by binding eIF4G; required for pre-mRNA splicing; interacts with E3 ubiquitin ligase Bre1p, linking histone ubiquitination to mRNA processing; may have role in telomere maintenance; dissociation from mRNAs promoted by Mtr10p; phosphorylated by Sky1p in cytoplasm; protein abundance increases in response to DNA replication stress +S000029988 CDS YDR432W 4 1328783 1330027 W 2011-02-03 1996-07-31 +S000002841 ORF Dubious YDR433W KRE22 chromosome 4 4 1329600 1330040 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030126 CDS YDR433W 4 1329600 1330040 W 2011-02-03 1996-07-31 +S000002842 ORF Verified YDR434W GPI17 GPI-anchor transamidase GPI17 chromosome 4 4 1331237 1332841 W 2011-02-03 1996-07-31 Transmembrane protein; subunit of the glycosylphosphatidylinositol transamidase complex that adds GPIs to newly synthesized proteins; human PIG-S homolog +S000031125 CDS YDR434W 4 1331237 1332841 W 2011-02-03 1996-07-31 +S000002843 ORF Verified YDR435C PPM1 leucine carboxy methyltransferase chromosome 4 4 1333969 1332983 C 2011-02-03 1996-07-31 Carboxyl methyltransferase; methylates the C terminus of the protein phosphatase 2A catalytic subunit (Pph21p or Pph22p), which is important for complex formation with regulatory subunits; required for methionine to inhibit autophagy and promote growth +S000031177 CDS YDR435C 4 1333969 1332983 C 2011-02-03 1996-07-31 +S000002844 ORF Verified YDR436W PPZ2 salt homeostasis regulator chromosome 4 L000001479 4 1334821 1336953 W 2011-02-03 1996-07-31 Serine/threonine protein phosphatase Z, isoform of Ppz1p; involved in regulation of potassium transport, which affects osmotic stability, cell cycle progression, and halotolerance +S000031349 CDS YDR436W 4 1334821 1336953 W 2011-02-03 1996-07-31 +S000002845 ORF Verified YDR437W GPI19 phosphatidylinositol N-acetylglucosaminyltransferase GPI19 chromosome 4 4 1337352 1337774 W 2011-02-03 1996-07-31 Subunit of GPI-GlcNAc transferase involved in synthesis of GlcNAc-PI; N-acetylglucosaminyl phosphatidylinositol (GlcNAc-PI) is the first intermediate in glycosylphosphatidylinositol (GPI) anchor synthesis; shares similarity with mammalian PIG-P +S000032347 CDS YDR437W 4 1337352 1337774 W 2011-02-03 1996-07-31 +S000002846 ORF Verified YDR438W THI74 chromosome 4 4 1338274 1339386 W 2011-02-03 1996-07-31 Mitochondrial transporter repressible by thiamine; THI74 has a paralog, YML018C, that arose from the whole genome duplication; shows sequence homology to human gene SLC35F3, a thiamine transporter implicated in hypertension +S000032476 CDS YDR438W 4 1338274 1339386 W 2011-02-03 1996-07-31 +S000002847 ORF Verified YDR439W LRS4 chromosome 4 L000004395 4 1339676 1340719 W 2011-02-03 1996-07-31 Nucleolar protein that forms a complex with Csm1p; and then Mam1p at kinetochores during meiosis I to mediate accurate homolog segregation; required for condensin recruitment to the replication fork barrier site and rDNA repeat segregation +S000032575 CDS YDR439W 4 1339676 1340719 W 2011-02-03 1996-07-31 +S000002848 ORF Verified YDR440W DOT1 histone methyltransferase DOT1|KMT4|PCH1 chromosome 4 L000004390|L000004273 4 1342493 1344241 W 2011-02-03 1996-07-31 Nucleosomal histone H3-Lys79 methylase; methylation is required for telomeric silencing, meiotic checkpoint control, and DNA damage response +S000033292 CDS YDR440W 4 1342493 1344241 W 2011-02-03 1996-07-31 +S000002849 ORF Verified YDR441C APT2 adenine phosphoribosyltransferase APT2 chromosome 4 L000000102 4 1345062 1344517 C 2011-02-03 1996-07-31 Potential adenine phosphoribosyltransferase; encodes a protein with similarity to adenine phosphoribosyltransferase, but artificially expressed protein exhibits no enzymatic activity; APT2 has a paralog, APT1, that arose from the whole genome duplication +S000033331 CDS YDR441C 4 1345062 1344517 C 2011-02-03 1996-07-31 +S000002850 ORF Dubious YDR442W chromosome 4 4 1345647 1346039 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034272 CDS YDR442W 4 1345647 1346039 W 2011-02-03 1996-07-31 +S000002851 ORF Verified YDR443C SSN2 SSX5|MED13|RYE3|UME2|SRB9|SCA1|NUT8 chromosome 4 L000001803|L000002088|S000029518|L000002101 4 1349938 1345676 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for stable association of Srb10p-Srb11p kinase; essential for transcriptional regulation +S000034322 CDS YDR443C 4 1349938 1345676 C 2011-02-03 1996-07-31 +S000002852 ORF Uncharacterized YDR444W putative hydrolase chromosome 4 4 1350290 1352353 W 2011-02-03 1996-07-31 Putative hydrolase acting on ester bonds +S000034446 CDS YDR444W 4 1350290 1352353 W 2011-02-03 1996-07-31 +S000006617 tRNA_gene tK(CUU)D2 chromosome 4 L000003776 4 1352538 1352466 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000035878 noncoding_exon tK(CUU)D2 4 1352538 1352466 C 2011-02-03 2000-05-19 +S000002853 ORF Dubious YDR445C chromosome 4 4 1352589 1352182 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034512 CDS YDR445C 4 1352589 1352182 C 2011-02-03 1996-07-31 +S000006877 long_terminal_repeat YDRWdelta29 chromosome 4 4 1352644 1352975 W 2011-02-03 2000-05-19 Ty1 LTR +S000006878 long_terminal_repeat YDRWdelta30 chromosome 4 4 1352976 1353226 W 2011-02-03 2000-05-19 Ty1 LTR +S000002854 ORF Verified YDR446W ECM11 chromosome 4 L000003886 4 1353725 1354633 W 2011-02-03 1996-07-31 Meiosis-specific protein; component of the Synaptonemal Complex (SC) along with Gmc2p; required for efficient crossover formation and for the efficient loading of the SC transverse filament protein, Zip1p; is SUMOlytaed in a Gmc2p manner, and SUMOylation is required for its function in meiosis; GFP fusion protein is present in discrete clusters in the nucleus throughout mitosis; may be involved in maintaining chromatin structure +S000035576 CDS YDR446W 4 1353725 1354633 W 2011-02-03 1996-07-31 +S000002855 ORF Verified YDR447C RPS17B eS17|ribosomal 40S subunit protein S17B|S17e|rp51B|S17B|RPL51B|RP51B chromosome 4 L000001670|L000001741 4 1355553 1354829 C 2011-02-03 1996-07-31 Ribosomal protein 51 (rp51) of the small (40s) subunit; homologous to mammalian ribosomal protein S17, no bacterial homolog; RPS17B has a paralog, RPS17A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000035611 CDS YDR447C 4 1355236 1354829 C 2011-02-03 1996-07-31 +S000035610 CDS YDR447C 4 1355553 1355551 C 2011-02-03 1996-07-31 +S000035612 intron YDR447C 4 1355550 1355237 C 2011-02-03 1996-07-31 +S000002856 ORF Verified YDR448W ADA2 chromatin-binding transcription regulator ADA2|SWI8 chromosome 4 L000000029 4 1356065 1357369 W 2011-02-03 1996-07-31 Transcription coactivator; component of the ADA and SAGA transcriptional adaptor/HAT (histone acetyltransferase) complexes +S000035771 CDS YDR448W 4 1356065 1357369 W 2011-02-03 1996-07-31 +S000002857 ORF Verified YDR449C UTP6 snoRNA-binding rRNA-processing protein UTP6 chromosome 4 4 1358902 1357580 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA +S000036633 CDS YDR449C 4 1358902 1357580 C 2011-02-03 1996-07-31 +S000002858 ORF Verified YDR450W RPS18A uS13|ribosomal 40S subunit protein S18A|S18A|S13 chromosome 4 L000004480 4 1359923 1360798 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S18 and bacterial S13; RPS18A has a paralog, RPS18B, that arose from the whole genome duplication; protein increases in abundance and relocalizes from cytoplasm to nuclear foci upon DNA replication stress +S000036543 CDS YDR450W 4 1359923 1359969 W 2011-02-03 1996-07-31 +S000036544 CDS YDR450W 4 1360405 1360798 W 2011-02-03 1996-07-31 +S000036545 intron YDR450W 4 1359970 1360404 W 2011-02-03 1996-07-31 +S000002859 ORF Verified YDR451C YHP1 chromosome 4 4 1362181 1361120 C 2011-02-03 1996-07-31 Homeobox transcriptional repressor; binds Mcm1p and early cell cycle box (ECB) elements of cell cycle regulated genes, thereby restricting ECB-mediated transcription to the M/G1 interval; YHP1 has a paralog, YOX1, that arose from the whole genome duplication +S000036584 CDS YDR451C 4 1362181 1361120 C 2011-02-03 1996-07-31 +S000002860 ORF Verified YDR452W PPN1 endopolyphosphatase|PHM5 chromosome 4 S000007514 4 1362878 1364902 W 2011-02-03 1996-07-31 Dual endo- and exopolyphosphatase with a role in phosphate metabolism; acts as both an endopolyphosphatase cleaving long chains of polyphosphate distributively to generate shorter polymer chains and as an exopolyphosphatase catalyzing the hydrolysis of terminal phosphate from polyphosphate; localizes to the vacuole, nucleus and cytosol; functions as a homodimer; relocalizes from vacuole to cytoplasm upon DNA replication stress +S000036745 CDS YDR452W 4 1362878 1364902 W 2011-02-03 1996-07-31 +S000002861 ORF Verified YDR453C TSA2 thioredoxin peroxidase TSA2|cTPxII chromosome 4 4 1365662 1365072 C 2011-02-03 1996-07-31 Stress inducible cytoplasmic thioredoxin peroxidase; cooperates with Tsa1p in the removal of reactive oxygen, nitrogen and sulfur species using thioredoxin as hydrogen donor; deletion enhances the mutator phenotype of tsa1 mutants; protein abundance increases in response to DNA replication stress; TSA2 has a paralog, TSA1, that arose from the whole genome duplication +S000037410 CDS YDR453C 4 1365662 1365072 C 2011-02-03 1996-07-31 +S000002862 ORF Verified YDR454C GUK1 BRA3|guanylate kinase|PUR5 chromosome 4 L000000745 4 1366827 1366264 C 2011-02-03 1996-07-31 Guanylate kinase; converts GMP to GDP; required for growth and mannose outer chain elongation of cell wall N-linked glycoproteins +S000037538 CDS YDR454C 4 1366827 1366264 C 2011-02-03 1996-07-31 +S000002864 ORF Verified YDR456W NHX1 bifunctional K:H/Na:H antiporter NHX1|VPL27|NHA2|VPS44 chromosome 4 L000004336 4 1367485 1369386 W 2011-02-03 1996-07-31 Na+/H+ and K+/H+ exchanger; required for intracellular sequestration of Na+ and K+; located in the vacuole and late endosome compartments; required for osmotolerance to acute hypertonic shock and for vacuolar fusion; ortholog of human NHE9, which is linked to autism +S000030521 CDS YDR456W 4 1367485 1369386 W 2011-02-03 1996-07-31 +S000002863 ORF Dubious YDR455C chromosome 4 4 1367681 1367373 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene YDR456W +S000037654 CDS YDR455C 4 1367681 1367373 C 2011-02-03 1996-07-31 +S000002865 ORF Verified YDR457W TOM1 E3 ubiquitin-protein ligase TOM1 chromosome 4 L000002983 4 1369790 1379596 W 2011-02-03 1996-07-31 E3 ubiquitin ligase of the hect-domain class; has a role in mRNA export from the nucleus and may regulate transcriptional coactivators; involved in degradation of excess histones; interacts with Dia2p and is required for Dia2p degradation; required to target Cdc6p for ubiquitin-mediated destruction during G1 phase +S000030634 CDS YDR457W 4 1369790 1379596 W 2011-02-03 1996-07-31 +S000130177 ARS ARS439 chromosome 4 4 1379641 1380100 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000002866 ORF Verified YDR458C HEH2 chromosome 4 4 1382046 1380055 C 2011-02-03 1996-07-31 Inner nuclear membrane (INM) protein; contains helix-extension-helix (HEH) motif, nuclear localization signal sequence; targeting to the INM requires the Srp1p-Kap95p karyopherins and the Ran cycle; HEH2 has a paralog, SRC1, that arose from the whole genome duplication +S000030675 CDS YDR458C 4 1382046 1380055 C 2011-02-03 1996-07-31 +S000002867 ORF Verified YDR459C PFA5 palmitoyltransferase PFA5 chromosome 4 4 1383443 1382319 C 2011-02-03 1996-07-31 Palmitoyltransferase with autoacylation activity; likely functions in pathway(s) outside Ras; member of a family of putative palmitoyltransferases containing an Asp-His-His-Cys-cysteine rich (DHHC-CRD) domain +S000031546 CDS YDR459C 4 1383443 1382319 C 2011-02-03 1996-07-31 +S000002868 ORF Verified YDR460W TFB3 TFIIH/NER complex subunit TFB3|RIG2 chromosome 4 L000003496 4 1383811 1384776 W 2011-02-03 1996-07-31 Subunit of TFIIH and nucleotide excision repair factor 3 complexes; involved in transcription initiation, required for nucleotide excision repair; ring finger protein similar to mammalian CAK and TFIIH subunit +S000031579 CDS YDR460W 4 1383811 1384776 W 2011-02-03 1996-07-31 +S000002869 ORF Verified YDR461W MFA1 mating pheromone a chromosome 4 L000001096 4 1385176 1385286 W 280.27 2011-02-03 1996-07-31 Mating pheromone a-factor; made by a cells; interacts with alpha cells to induce cell cycle arrest and other responses leading to mating; biogenesis involves C-terminal modification, N-terminal proteolysis, and export; also encoded by MFA2 +S000032540 CDS YDR461W 4 1385176 1385286 W 2011-02-03 1996-07-31 +S000087209 ORF Uncharacterized YDR461C-A chromosome 4 4 1385766 1385524 C 2011-02-03 2005-11-15 Putative protein of unknown function +S000087210 CDS YDR461C-A 4 1385766 1385524 C 2011-02-03 2005-11-15 +S000002870 ORF Verified YDR462W MRPL28 mitochondrial 54S ribosomal protein YmL28|YmL28 chromosome 4 L000002691 4 1386073 1386516 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; protein abundance increases in response to DNA replication stress +S000032692 CDS YDR462W 4 1386073 1386516 W 2011-02-03 1996-07-31 +S000002871 ORF Verified YDR463W STP1 SSY2|BAP1 chromosome 4 L000002132 4 1386816 1388375 W 298 2011-02-03 2003-09-22|1996-07-31 Transcription factor; contains a N-terminal regulatory motif (RI) that acts as a cytoplasmic retention determinant and as an Asi dependent degron in the nucleus; undergoes proteolytic processing by SPS (Ssy1p-Ptr3p-Ssy5p)-sensor component Ssy5p in response to extracellular amino acids; activates transcription of amino acid permease genes and may have a role in tRNA processing; STP1 has a paralog, STP2, that arose from the whole genome duplication +S000032755 CDS YDR463W 4 1386816 1388375 W 2011-02-03 2003-09-22|1996-07-31 +S000002872 ORF Verified YDR464W SPP41 chromosome 4 L000002019 4 1388872 1393179 W 297 2011-02-03 1996-07-31 Protein of unknown function; involved in negative regulation of expression of spliceosome components PRP4 and PRP3; relocalizes to the cytosol in response to hypoxia +S000033502 CDS YDR464W 4 1388872 1393179 W 2011-02-03 1996-07-31 +S000028614 ORF Dubious YDR464C-A chromosome 4 4 1392680 1392492 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031450 CDS YDR464C-A 4 1392680 1392492 C 2011-02-03 2003-07-29 +S000002873 ORF Verified YDR465C RMT2 protein-arginine N5-methyltransferase chromosome 4 L000004724 4 1394574 1393336 C 2011-02-03 1996-07-31 Arginine N5 methyltransferase; methylates ribosomal protein Rpl12 (L12) on Arg67; relative distribution to the nucleus increases upon DNA replication stress +S000033538 CDS YDR465C 4 1394574 1393336 C 2011-02-03 1996-07-31 +S000002874 ORF Verified YDR466W PKH3 protein kinase PKH3 chromosome 4 4 1395121 1397817 W 2011-02-03 1996-07-31 Protein kinase with similarity to mammalian PDK1 and yeast Pkh1p/Phk2p; yeast Pkh1p and Pkh2p are two redundant upstream activators of Pkc1p; identified as a multicopy suppressor of a pkh1 pkh2 double mutant +S000033694 CDS YDR466W 4 1395121 1397817 W 2011-02-03 1996-07-31 +S000002875 ORF Dubious YDR467C chromosome 4 4 1397909 1397583 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033742 CDS YDR467C 4 1397909 1397583 C 2011-02-03 1996-07-31 +S000002876 ORF Verified YDR468C TLG1 chromosome 4 L000004227 4 1398700 1398026 C 2011-02-03 1996-07-31 Essential t-SNARE that mediates fusion of vesicles with the late Golgi; forms a complex with Tlg2p and Vti1p; mediates fusion of endosome-derived vesicles with the late Golgi; binds the docking complex VFT (Vps fifty-three) through interaction with Vps51p +S000034625 CDS YDR468C 4 1398700 1398026 C 2011-02-03 1996-07-31 +S000002877 ORF Verified YDR469W SDC1 SAF19|CPS25 chromosome 4 4 1399015 1399542 W 2011-02-03 1996-07-31 Subunit of the COMPASS (Set1C) complex; COMPASS methylates lysine 4 of histone H3 and is required in chromatin silencing at telomeres; contains a Dpy-30 domain that mediates interaction with Bre2p; similar to C. elegans and human DPY-30 +S000034852 CDS YDR469W 4 1399015 1399542 W 2011-02-03 1996-07-31 +S000002878 ORF Verified YDR470C UGO1 chromosome 4 4 1401214 1399706 C 2011-02-03 2000-04-06|1996-07-31|2011-02-03 Outer membrane component of the mitochondrial fusion machinery; binds to Fzo1p and Mgm1p to link these two GTPases during mitochondrial fusion; involved in fusion of both the outer and inner membranes; facilitates dimerization of Fzo1p during fusion; import into the outer membrane is mediated by Tom70p and Mim1p; has similarity to carrier proteins but likely not a transporter; similar to human SLC25A46 implicated in optic atroprophy spectrum disorder +S000035822 CDS YDR470C 4 1401214 1399706 C 2011-02-03 2000-04-06|1996-07-31|2011-02-03 +S000002879 ORF Verified YDR471W RPL27B eL27|ribosomal 60S subunit protein L27B|L27e|L27B chromosome 4 L000002898 4 1401770 1402564 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L27B; homologous to mammalian ribosomal protein L27, no bacterial homolog; RPL27B has a paralog, RPL27A, that arose from the whole genome duplication +S000036787 CDS YDR471W 4 1401770 1401800 W 2011-02-03 1996-07-31 +S000036788 CDS YDR471W 4 1402185 1402564 W 2011-02-03 1996-07-31 +S000036789 intron YDR471W 4 1401801 1402184 W 2011-02-03 1996-07-31 +S000006498 snoRNA_gene snR13 SNR13 chromosome 4 L000002849 4 1402919 1403042 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions A2280 and A2281 +S000036591 noncoding_exon snR13 4 1402919 1403042 W 2011-02-03 2000-05-19 +S000002880 ORF Verified YDR472W TRS31 TRAPP subunit TRS31 chromosome 4 S000007433 4 1403322 1404173 W 2011-02-03 1996-07-31 Core component of transport protein particle (TRAPP) complexes I-III; TRAPP complexes are related multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating ER-Golgi traffic (TRAPPI), intra-Golgi traffic (TRAPPII), endosome-Golgi traffic (TRAPPII and III) and autophagy (TRAPPIII) +S000036864 CDS YDR472W 4 1403322 1404173 W 2011-02-03 1996-07-31 +S000118448 ARS ARS440 ARSIV-1404 chromosome 4 4 1404290 1404524 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178080 ARS_consensus_sequence ARS440 4 1404322 1404338 W 2014-11-18 2014-11-18 +S000002881 ORF Verified YDR473C PRP3 U4/U6-U5 snRNP complex subunit PRP3|RNA3 chromosome 4 L000001496 4 1405854 1404445 C 300 2011-02-03 1996-07-31 Splicing factor; component of the U4/U6-U5 snRNP complex +S000036886 CDS YDR473C 4 1405854 1404445 C 2011-02-03 1996-07-31 +S000002883 ORF Verified YDR475C JIP4 YDR474C chromosome 4 4 1410094 1407464 C 2011-02-03 2003-09-30|1996-07-31 Protein of unknown function; previously annotated as two separate ORFs, YDR474C and YDR475C, which were merged as a result of corrections to the systematic reference sequence; JIP4 has a paralog, YOR019W, that arose from the whole genome duplication +S000037707 CDS YDR475C 4 1410094 1407464 C 2011-02-03 2003-09-30|1996-07-31 +S000002884 ORF Uncharacterized YDR476C chromosome 4 4 1411127 1410453 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; YDR476C is not an essential gene +S000037771 CDS YDR476C 4 1411127 1410453 C 2011-02-03 1996-07-31 +S000002885 ORF Verified YDR477W SNF1 AMP-activated serine/threonine-protein kinase catalytic subunit SNF1|PAS14|HAF3|GLC2|CCR1|CAT1 chromosome 4 L000001944 4 1412373 1414274 W 304 2011-02-03 1996-07-31 AMP-activated S/T protein kinase; forms a complex with Snf4p and members of the Sip1p/Sip2p/Gal83p family; required for transcription of glucose-repressed genes, thermotolerance, sporulation, and peroxisome biogenesis; regulates nucleocytoplasmic shuttling of Hxk2p; regulates filamentous growth and acts as a non-canonical GEF, activating Arf3p during invasive growth; SUMOylation by Mms21p inhibits its function and targets Snf1p for destruction via the Slx5-Slx8 Ub ligase +S000029842 CDS YDR477W 4 1412373 1414274 W 2011-02-03 1996-07-31 +S000002886 ORF Verified YDR478W SNM1 chromosome 4 L000002825 4 1414575 1415171 W 2011-02-03 1996-07-31 Ribonuclease MRP complex subunit; ribonuclease (RNase) MRP cleaves pre-rRNA and has a role in cell cycle-regulated degradation of daughter cell-specific mRNAs; binds to the NME1 RNA subunit of RNase MRP +S000030848 CDS YDR478W 4 1414575 1415171 W 2011-02-03 1996-07-31 +S000002887 ORF Verified YDR479C PEX29 chromosome 4 4 1416874 1415210 C 2011-02-03 1996-07-31 ER-resident protein involved in peroxisomal biogenesis; ER-localized protein that associates with peroxisomes; interacts with Pex30p and reticulons Rtn1p and Yop1p to regulate peroxisome biogenesis from the ER; role in peroxisomal-destined vesicular flow from the ER; regulates peroxisomal size, number and distribution; Pex28p and Pex29p may act at steps upstream of those mediated by Pex30p, Pex31p, and Pex32p; forms ER foci upon DNA replication stress +S000030901 CDS YDR479C 4 1416874 1415210 C 2011-02-03 1996-07-31 +S000002888 ORF Verified YDR480W DIG2 RST2 chromosome 4 L000003123 4 1417399 1418370 W 2011-02-03 1996-07-31 MAP kinase-responsive inhibitor of the Ste12p transcription factor; involved in the regulation of mating-specific genes and the invasive growth pathway; related regulators Dig1p and Dig2p bind to Ste12p; DIG2 has a paralog, DIG1, that arose from the whole genome duplication +S000032009 CDS YDR480W 4 1417399 1418370 W 2011-02-03 1996-07-31 +S000002889 ORF Verified YDR481C PHO8 alkaline phosphatase PHO8|phoH chromosome 4 L000001422 4 1420250 1418550 C 306 2011-02-03 1996-07-31 Repressible vacuolar alkaline phosphatase; regulated by levels of Pi and by Pho4p, Pho9p, Pho80p, Pho81p and Pho85p; dephosphorylates phosphotyrosyl peptides; contributes to NAD+ metabolism by producing nicotinamide riboside from NMN +S000032056 CDS YDR481C 4 1420250 1418550 C 2011-02-03 1996-07-31 +S000002890 ORF Verified YDR482C CWC21 U2-type spliceosomal complex subunit CWC21 chromosome 4 4 1420838 1420431 C 2011-02-03 1996-07-31 Protein involved in RNA splicing by the spliceosome; component of a complex containing Cef1p; interacts genetically with ISY1 and BUD13; may bind RNA; has similarity to S. pombe Cwf21p +S000032970 CDS YDR482C 4 1420838 1420431 C 2011-02-03 1996-07-31 +S000002891 ORF Verified YDR483W KRE2 alpha-1,2-mannosyltransferase KRE2|MNT1 chromosome 4 L000000913 4 1421157 1422485 W 306 2011-02-03 1996-07-31 Alpha1,2-mannosyltransferase of the Golgi; involved in protein mannosylation; KRE2 has a paralog, KTR6, that arose from the whole genome duplication +S000033119 CDS YDR483W 4 1421157 1422485 W 2011-02-03 1996-07-31 +S000002892 ORF Verified YDR484W VPS52 SAC2 chromosome 4 L000001791 4 1422763 1424688 W 314 2011-02-03 1996-07-31 Component of the GARP (Golgi-associated retrograde protein) complex; GARP is required for the recycling of proteins from endosomes to the late Golgi, and for mitosis after DNA damage induced checkpoint arrest; involved in localization of actin and chitin; members of the GARP complex are Vps51p-Vps52p-Vps53p-Vps54p +S000033198 CDS YDR484W 4 1422763 1424688 W 2011-02-03 1996-07-31 +S000002893 ORF Verified YDR485C VPS72 SWC2 chromosome 4 4 1427207 1424820 C 2011-02-03 2003-09-22|1996-07-31 Htz1p-binding component of the SWR1 complex; exchanges histone variant H2AZ (Htz1p) for chromatin-bound histone H2A; may function as a lock that prevents removal of H2AZ from nucleosomes; required for vacuolar protein sorting +S000033955 CDS YDR485C 4 1427207 1424820 C 2011-02-03 2003-09-22|1996-07-31 +S000002894 ORF Verified YDR486C VPS60 CHM5|MOS10 chromosome 4 4 1428120 1427431 C 2011-02-03 2003-09-22|1996-07-31 Protein involved in late endosome to vacuole transport; cytoplasmic and vacuolar membrane protein; required for normal filament maturation during pseudohyphal growth; may function in targeting cargo proteins for degradation; interacts with Vta1p +S000034065 CDS YDR486C 4 1428120 1427431 C 2011-02-03 2003-09-22|1996-07-31 +S000002895 ORF Verified YDR487C RIB3 3,4-dihydroxy-2-butanone-4-phosphate synthase RIB3 chromosome 4 L000001635 4 1428980 1428354 C 2011-02-03 1996-07-31 3,4-dihydroxy-2-butanone-4-phosphate synthase (DHBP synthase); required for riboflavin biosynthesis from ribulose-5-phosphate, also has an unrelated function in mitochondrial respiration +S000034158 CDS YDR487C 4 1428980 1428354 C 2011-02-03 1996-07-31 +S000002896 ORF Verified YDR488C PAC11 dynein intermediate chain chromosome 4 L000001330 4 1430789 1429188 C 2011-02-03 1996-07-31 Dynein intermediate chain, microtubule motor protein; required for intracellular transport and cell division; acts in cytoplasmic dynein pathway; forms complex with dynein light chain Dyn2p that promotes Dyn1p homodimerization and potentiates motor processivity; Dyn2p-Pac11p complex is also important for interaction of dynein motor complex with dynactin complex; forms cortical cytoplasmic microtubule capture site with Num1p; essential in the absence of CIN8 +S000035100 CDS YDR488C 4 1430789 1429188 C 2011-02-03 1996-07-31 +S000002897 ORF Verified YDR489W SLD5 DNA replication protein SLD5|CDC105 chromosome 4 4 1431012 1431896 W 2011-02-03 1996-07-31 Subunit of the GINS complex (Sld5p, Psf1p, Psf2p, Psf3p); complex is localized to DNA replication origins and implicated in assembly of the DNA replication machinery +S000035299 CDS YDR489W 4 1431012 1431896 W 2011-02-03 1996-07-31 +S000002898 ORF Verified YDR490C PKH1 serine/threonine protein kinase PKH1 chromosome 4 L000004616 4 1434268 1431968 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; involved in sphingolipid-mediated signaling pathway that controls endocytosis; activates Ypk1p and Ykr2p, components of signaling cascade required for maintenance of cell wall integrity; contains a PH-like domain; redundant with Pkh2p; PKH1 has a paralog, PKH2, that arose from the whole genome duplication +S000036098 CDS YDR490C 4 1434268 1431968 C 2011-02-03 1996-07-31 +S000002900 ORF Verified YDR492W IZH1 PAQR-type receptor chromosome 4 4 1434924 1435874 W 2011-02-03 1996-07-31 Membrane protein involved in zinc ion homeostasis; member of the four-protein IZH family; transcription is regulated directly by Zap1p, expression induced by zinc deficiency and fatty acids; deletion increases sensitivity to elevated zinc; IZH1 has a paralog, IZH4, that arose from the whole genome duplication +S000031780 CDS YDR492W 4 1434924 1435874 W 2011-02-03 1996-07-31 +S000002899 ORF Dubious YDR491C chromosome 4 4 1434991 1434500 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036239 CDS YDR491C 4 1434991 1434500 C 2011-02-03 1996-07-31 +S000002901 ORF Verified YDR493W MZM1 AIM8|FMP36 chromosome 4 4 1436217 1436588 W 2011-02-03 1996-07-31 Protein required for assembly of the cytochrome bc(1) complex; acts as a chaperone for Rip1p and facilitates its insertion into the complex at a late stage of assembly; localized to the mitochondrial matrix; null mutant exhibits a respiratory growth defect and reduced mitochondrial zinc levels, which is characteristic of mutations affecting bc(1) complex assembly; member of the LYR protein family; human LYRM7 is a functional ortholog +S000031922 CDS YDR493W 4 1436217 1436588 W 2011-02-03 1996-07-31 +S000002902 ORF Verified YDR494W RSM28 mitochondrial 37S ribosomal protein RSM28 chromosome 4 4 1436930 1438015 W 2011-02-03 2002-12-17|1996-07-31 Mitochondrial ribosomal protein of the small subunit; genetic interactions suggest a possible role in promoting translation initiation +S000037424 CDS YDR494W 4 1436930 1438015 W 2011-02-03 2002-12-17|1996-07-31 +S000002903 ORF Verified YDR495C VPS3 CORVET complex subunit VPS3|VPT17|VPL3|PEP6 chromosome 4 L000002469 4 1441150 1438115 C 2011-02-03 1996-07-31 Component of CORVET membrane tethering complex; cytoplasmic protein required for the sorting and processing of soluble vacuolar proteins, acidification of the vacuolar lumen, and assembly of the vacuolar H+-ATPase +S000037459 CDS YDR495C 4 1441150 1438115 C 2011-02-03 1996-07-31 +S000002904 ORF Verified YDR496C PUF6 chromosome 4 4 1443403 1441433 C 2011-02-03 1996-07-31 Pumilio-homology domain protein; binds the 3' UTR of ASH1 mRNA and represses its translation, resulting in proper asymmetric localization of ASH1 mRNA; required at post-transcriptional step for efficient retrotransposition; absence results in decreased Ty1 Gag:GFP protein levels; co-sediments with the 60S ribosomal subunit and is required for its biogenesis +S000037553 CDS YDR496C 4 1443403 1441433 C 2011-02-03 1996-07-31 +S000002905 ORF Verified YDR497C ITR1 myo-inositol transporter ITR1 chromosome 4 L000000879 4 1445467 1443713 C 2011-02-03 1996-07-31 Myo-inositol transporter; member of the sugar transporter superfamily; expression is repressed by inositol and choline via Opi1p and derepressed via Ino2p and Ino4p; relative distribution to the vacuole increases upon DNA replication stress; ITR1 has a paralog, ITR2, that arose from the whole genome duplication +S000037634 CDS YDR497C 4 1445467 1443713 C 2011-02-03 1996-07-31 +S000002906 ORF Verified YDR498C SEC20 chromosome 4 L000001843 4 1446994 1445843 C 2011-02-03 1996-07-31 Membrane glycoprotein v-SNARE; involved in retrograde transport from the Golgi to the endoplasmic reticulum (ER); required for N- and O-glycosylation in the Golgi but not in the ER and for efficient nuclear fusion during mating; mediates Sey1p-independent homotypic ER fusion; interacts with the Dsl1p complex through Tip20p +S000030424 CDS YDR498C 4 1446994 1445843 C 2011-02-03 1996-07-31 +S000002907 ORF Verified YDR499W LCD1 PIE1|DDC2 chromosome 4 4 1447830 1450073 W 2011-02-03 1996-07-31 Essential protein required for the DNA integrity checkpoint pathways; interacts physically with Mec1p; putative homolog of S. pombe Rad26 and human ATRIP; forms nuclear foci upon DNA replication stress +S000030564 CDS YDR499W 4 1447830 1450073 W 2011-02-03 1996-07-31 +S000002908 ORF Verified YDR500C RPL37B eL37|ribosomal 60S subunit protein L37B|L37e|YL35|L43|L37B chromosome 4 L000002899 4 1450853 1450198 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L37B; required for processing of 27SB pre-rRNA and formation of stable 66S assembly intermediates; protein abundance increases in response to DNA replication stress; homologous to mammalian ribosomal protein L37, no bacterial homolog; RPL37B has a paralog, RPL37A, that arose from the whole genome duplication +S000036331 CDS YDR500C 4 1450457 1450198 C 2011-02-03 1996-07-31 +S000036330 CDS YDR500C 4 1450853 1450847 C 2011-02-03 1996-07-31 +S000036332 intron YDR500C 4 1450846 1450458 C 2011-02-03 1996-07-31 +S000002909 ORF Verified YDR501W PLM2 chromosome 4 S000007440 4 1451353 1452918 W 2011-02-03 1996-07-31 Putative transcription factor, contains Forkhead Associated domain; found associated with chromatin; target of SBF transcription factor; induced in response to DNA damaging agents and deletion of telomerase; PLM2 has a paralog, TOS4, that arose from the whole genome duplication +S000037037 CDS YDR501W 4 1451353 1452918 W 2011-02-03 1996-07-31 +S000002910 ORF Verified YDR502C SAM2 methionine adenosyltransferase SAM2|ETH2 chromosome 4 L000001799 4 1454464 1453310 C 2011-02-03 1996-07-31 S-adenosylmethionine synthetase; catalyzes transfer of the adenosyl group of ATP to the sulfur atom of methionine; comparative analysis suggests that a mitochondrially targeted form may result from translation starting at a non-canonical codon upstream of the annotated start codon +S000037058 CDS YDR502C 4 1454464 1453310 C 2011-02-03 1996-07-31 +S000130178 ARS ARS442 chromosome 4 4 1454509 1455087 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000002911 ORF Verified YDR503C LPP1 phosphatidate phosphatase LPP1 chromosome 4 L000004266 4 1455866 1455042 C 2011-02-03 1996-07-31 Lipid phosphate phosphatase; catalyzes Mg(2+)-independent dephosphorylation of phosphatidic acid (PA), lysophosphatidic acid, and diacylglycerol pyrophosphate; involved in control of the cellular levels of phosphatidylinositol and PA +S000037180 CDS YDR503C 4 1455866 1455042 C 2011-02-03 1996-07-31 +S000002912 ORF Verified YDR504C SPG3 chromosome 4 4 1456694 1456311 C 2011-02-03 1996-07-31 Protein required for high temperature survival during stationary phase; not required for growth on nonfermentable carbon sources; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000037274 CDS YDR504C 4 1456694 1456311 C 2011-02-03 1996-07-31 +S000002913 ORF Verified YDR505C PSP1 GIN5 chromosome 4 L000002881|L000002877 4 1459220 1456695 C 2011-02-03 1996-07-31|2011-02-03 Asn and gln rich protein of unknown function; high-copy suppressor of POL1 (DNA polymerase alpha) and partial suppressor of CDC2 (polymerase delta) and CDC6 (pre-RC loading factor) mutations; overexpression results in growth inhibition; PSP1 has a paralog, YLR177W, that arose from the whole genome duplication +S000029936 CDS YDR505C 4 1459220 1456695 C 2011-02-03 1996-07-31|2011-02-03 +S000002914 ORF Verified YDR506C GMC1 putative oxidoreductase chromosome 4 4 1461554 1459728 C 2011-02-03 1996-07-31 Protein involved in meiotic progression; mutants are delayed in meiotic nuclear division and are defective in synaptonemal complex assembly; possible membrane-localized protein; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000030050 CDS YDR506C 4 1461554 1459728 C 2011-02-03 1996-07-31 +S000006638 tRNA_gene tL(CAA)D chromosome 4 L000003775 4 1461829 1461715 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000033776 intron tL(CAA)D 4 1461791 1461759 C 2011-02-03 2000-05-19 +S000033775 noncoding_exon tL(CAA)D 4 1461758 1461715 C 2011-02-03 2000-05-19 +S000033774 noncoding_exon tL(CAA)D 4 1461829 1461792 C 2011-02-03 2000-05-19 +S000118449 ARS ARS443 ARSIV-1462 chromosome 4 4 1461862 1462173 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000002915 ORF Verified YDR507C GIN4 protein kinase GIN4|ERC47 chromosome 4 L000002876 4 1465786 1462358 C 2011-02-03 1996-07-31 Protein kinase involved in bud growth and assembly of the septin ring; proposed to have kinase-dependent and kinase-independent activities; undergoes autophosphorylation; similar to Hsl1p; GIN4 has a paralog, KCC4, that arose from the whole genome duplication +S000030234 CDS YDR507C 4 1465786 1462358 C 2011-02-03 1996-07-31 +S000002917 ORF Dubious YDR509W chromosome 4 4 1468226 1468573 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031352 CDS YDR509W 4 1468226 1468573 W 2011-02-03 1996-07-31 +S000002916 ORF Verified YDR508C GNP1 glutamine permease GNP1 chromosome 4 L000002806 4 1468444 1466453 C 2011-02-03 1996-07-31 High-affinity glutamine permease; also transports Leu, Ser, Thr, Cys, Met and Asn; expression is fully dependent on Grr1p and modulated by the Ssy1p-Ptr3p-Ssy5p (SPS) sensor of extracellular amino acids; GNP1 has a paralog, AGP1, that arose from the whole genome duplication +S000031178 CDS YDR508C 4 1468444 1466453 C 2011-02-03 1996-07-31 +S000002918 ORF Verified YDR510W SMT3 SUMO family protein SMT3 chromosome 4 L000001938 4 1469400 1469705 W 2011-02-03 1996-07-31 Ubiquitin-like protein of the SUMO family; conjugated to lysine residues of target proteins; associates with transcriptionally active genes; regulates chromatid cohesion, chromosome segregation, APC-mediated proteolysis, DNA replication and septin ring dynamics; human homolog SUMO1 can complement yeast null mutant +S000032284 CDS YDR510W 4 1469400 1469705 W 2011-02-03 1996-07-31 +S000028615 ORF Dubious YDR510C-A chromosome 4 4 1469811 1469695 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031452 CDS YDR510C-A 4 1469811 1469695 C 2011-02-03 2003-07-29 +S000002919 ORF Verified YDR511W SDH7 ACN9 chromosome 4 4 1470017 1470418 W 2011-02-03 1996-07-31 Mitochondrial protein involved in assembly of succinate dehydrogenase; has a role in maturation of the Sdh2p subunit; localized to the mitochondrial intermembrane space; required for acetate utilization and gluconeogenesis; mutation in Drosophila ortholog SDHAF3 causes reduced succinate dehydrogenase activity and neuronal and muscular dysfunction; member of the LYR protein family +S000032384 CDS YDR511W 4 1470017 1470418 W 2011-02-03 1996-07-31 +S000002921 ORF Verified YDR513W GRX2 dithiol glutaredoxin GRX2|TTR1 chromosome 4 L000000510|L000002386 4 1471017 1471448 W 2011-02-03 1996-07-31 Cytoplasmic glutaredoxin; thioltransferase, glutathione-dependent disulfide oxidoreductase involved in maintaining redox state of target proteins, also exhibits glutathione peroxidase activity, expression induced in response to stress; GRX2 has two in-frame start codons resulting in a shorter isoform that is retained in the cytosol and a longer form translocated to the mitochondrial matrix; GRX2 has a paralog, GRX1, that arose from the whole genome duplication +S000033294 CDS YDR513W 4 1471017 1471448 W 2011-02-03 1996-07-31 +S000002920 ORF Verified YDR512C EMI1 chromosome 4 4 1471063 1470500 C 2011-02-03 1996-07-31 Non-essential protein of unknown function; required for transcriptional induction of the early meiotic-specific transcription factor IME1, also required for sporulation; contains twin cysteine-x9-cysteine motifs; deletion affects mitochondrial morphology +S000032449 CDS YDR512C 4 1471063 1470500 C 2011-02-03 1996-07-31 +S000002922 ORF Verified YDR514C chromosome 4 4 1472999 1471548 C 2011-02-03 1996-07-31 Protein of unknown function that localizes to mitochondria; overexpression affects endocytic protein trafficking; YDR514C has a paralog, GFD2, that arose from the whole genome duplication +S000033333 CDS YDR514C 4 1472999 1471548 C 2011-02-03 1996-07-31 +S000002923 ORF Verified YDR515W SLF1 SRO99 chromosome 4 L000004191|L000002894 4 1473429 1474772 W 2011-02-03 1996-07-31 RNA binding protein that associates with polysomes; may be involved in regulating mRNA translation; involved in the copper-dependent mineralization of copper sulfide complexes on cell surface in cells cultured in copper salts; SLF1 has a paralog, SRO9, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000034278 CDS YDR515W 4 1473429 1474772 W 2011-02-03 1996-07-31 +S000002924 ORF Verified YDR516C EMI2 putative glucokinase chromosome 4 4 1476476 1474974 C 2011-02-03 1996-07-31 Non-essential protein of unknown function; required for transcriptional induction of the early meiotic-specific transcription factor IME1; required for sporulation; expression regulated by glucose-repression transcription factors Mig1/2p; EMI2 has a paralog, GLK1, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000034325 CDS YDR516C 4 1476476 1474974 C 2011-02-03 1996-07-31 +S000002925 ORF Verified YDR517W GRH1 chromosome 4 4 1477239 1478357 W 2011-02-03 1996-07-31 Acetylated cis-Golgi protein, involved in ER to Golgi transport; homolog of human GRASP65; forms a complex with the coiled-coil protein Bug1p; mutants are compromised for the fusion of ER-derived vesicles with Golgi membranes; protein abundance increases in response to DNA replication stress +S000034449 CDS YDR517W 4 1477239 1478357 W 2011-02-03 1996-07-31 +S000002926 ORF Verified YDR518W EUG1 protein disulfide isomerase EUG1 chromosome 4 L000000589 4 1478608 1480161 W 2011-02-03 1996-07-31 Protein disulfide isomerase of the endoplasmic reticulum lumen; EUG1 has a paralog, PDI1, that arose from the whole genome duplication; function overlaps with that of Pdi1p; may interact with nascent polypeptides in the ER +S000034562 CDS YDR518W 4 1478608 1480161 W 2011-02-03 1996-07-31 +S000002927 ORF Verified YDR519W FPR2 peptidylprolyl isomerase family protein FPR2|FKB2 chromosome 4 L000000613 4 1480425 1480832 W 2011-02-03 1996-07-31 Membrane-bound peptidyl-prolyl cis-trans isomerase (PPIase); binds to the drugs FK506 and rapamycin; expression pattern suggests possible involvement in ER protein trafficking; relocalizes from nucleus to vacuole upon DNA replication stress; mutation is functionally complemented by human FKBP2 +S000035584 CDS YDR519W 4 1480425 1480832 W 2011-02-03 1996-07-31 +S000002929 ORF Dubious YDR521W chromosome 4 4 1483141 1483476 W 2011-02-03 1996-07-31 Dubious ORF that overlaps YDR520C; mutant increases expression of PIS1 and RPL3 in glycerol +S000035558 CDS YDR521W 4 1483141 1483476 W 2011-02-03 1996-07-31 +S000002928 ORF Uncharacterized YDR520C URC2 RRT4 chromosome 4 S000122335 4 1483403 1481085 C 2011-02-03 1996-07-31 Putative Zn(II)2Cys6 motif containing transcription factor; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; similar to S. kluyveri Urc2p involved in uracil catabolism +S000035462 CDS YDR520C 4 1483403 1481085 C 2011-02-03 1996-07-31 +S000002930 ORF Verified YDR522C SPS2 chromosome 4 L000002025 4 1485303 1483795 C 2011-02-03 1996-07-31 Protein expressed during sporulation; SPS2 has a paralog, SPS22, that arose from the whole genome duplication; redundant with Sps22p for organization of the beta-glucan layer of the spore wall; S. pombe ortholog is a spore wall component +S000035591 CDS YDR522C 4 1485303 1483795 C 2011-02-03 1996-07-31 +S000118450 ARS ARS446 ARSIV-1487 chromosome 4 4 1486918 1487161 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178081 ARS_consensus_sequence ARS446 4 1487092 1487076 C 2014-11-18 2014-11-18 +S000002931 ORF Verified YDR523C SPS1 putative serine/threonine protein kinase SPS1 chromosome 4 L000002024 4 1487038 1485566 C 2011-02-03 1996-07-31 Putative protein serine/threonine kinase; localizes to the nucleus and cytoplasm; required for efficient spore packaging, prospore membrane development and closure and localization of enzymes involved in spore wall synthesis; interacts with and required for Ssp1p phosphorylation and turnover; member of the GCKIII subfamily of STE20 kinases; multiply phosphorylated on S/T residues; interacts with 14-3-3 proteins, Bmh1p and Bmh2p; expressed at the end of meiosis +S000036490 CDS YDR523C 4 1487038 1485566 C 2011-02-03 1996-07-31 +S000002932 ORF Verified YDR524C AGE1 SAT1 chromosome 4 S000007502 4 1488990 1487542 C 2011-02-03 1996-07-31 ADP-ribosylation factor (ARF) GTPase activating protein (GAP) effector; involved in the secretory and endocytic pathways; contains C2C2H2 cysteine/histidine motif +S000036586 CDS YDR524C 4 1488990 1487542 C 2011-02-03 1996-07-31 +S000028740 ORF Uncharacterized YDR524W-C YDR524W-A chromosome 4 4 1489403 1489492 W 2011-02-03 2003-07-29 Putative protein of unknown function; small ORF identified by SAGE; deletion strains are moderately sensitive to the radiomimetic drug bleomycin +S000033410 CDS YDR524W-C 4 1489403 1489492 W 2011-02-03 2003-07-29 +S000028739 ORF Uncharacterized YDR524C-B chromosome 4 4 1489798 1489598 C 2011-02-03 2003-07-29 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YDR524C-B has a paralog, YCL048W-A, that arose from the whole genome duplication +S000033383 CDS YDR524C-B 4 1489798 1489598 C 2011-02-03 2003-07-29 +S000002933 ORF Dubious YDR525W API2 chromosome 4 4 1489905 1490234 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 26% of ORF overlaps the dubious ORF YDR524C-A; insertion mutation in a cdc34-2 mutant background causes altered bud morphology +S000036746 CDS YDR525W 4 1489905 1490234 W 2011-02-03 1996-07-31 +S000028616 ORF Dubious YDR524C-A YDR524C-C chromosome 4 4 1489990 1489871 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031456 CDS YDR524C-A 4 1489990 1489871 C 2011-02-03 2003-07-29 +S000007236 ORF Verified YDR525W-A SNA2 chromosome 4 4 1490596 1490835 W 2011-02-03 1999-07-17 Protein of unknown function; has similarity to Pmp3p, which is involved in cation transport; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern +S000036177 CDS YDR525W-A 4 1490596 1490835 W 2011-02-03 1999-07-17 +S000002935 ORF Verified YDR527W RBA50 chromosome 4 4 1491094 1492413 W 2011-02-03 1996-07-31|2011-02-03 Protein involved in transcription; interacts with RNA polymerase II subunits Rpb2p, Rpb3, and Rpb11p; has similarity to human RPAP1 +S000037626 CDS YDR527W 4 1491094 1492413 W 2011-02-03 1996-07-31|2011-02-03 +S000002934 ORF Dubious YDR526C chromosome 4 4 1491545 1491075 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037413 CDS YDR526C 4 1491545 1491075 C 2011-02-03 1996-07-31 +S000028466 snoRNA_gene snR84 SNR84 RUF1 chromosome 4 4 1493026 1492477 C 2011-02-03 2003-03-05 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2266; overexpression confers resistance to baking-associated stress +S000030073 noncoding_exon snR84 4 1493026 1492477 C 2011-02-03 2003-03-05 +S000002936 ORF Verified YDR528W HLR1 chromosome 4 4 1494586 1495857 W 2011-02-03 1996-07-31 Protein involved in regulation of cell wall composition and integrity; also involved in cell wall response to osmotic stress; overproduction suppresses a lysis sensitive PKC mutation; HLR1 has a paralog, LRE1, that arose from the whole genome duplication +S000030394 CDS YDR528W 4 1494586 1495857 W 2011-02-03 1996-07-31 +S000002937 ORF Verified YDR529C QCR7 ubiquinol--cytochrome-c reductase subunit 7|UCR7|CRO1|COR4 chromosome 4 L000001547 4 1496548 1496165 C 2011-02-03 1996-07-31 Subunit 7 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; oriented facing the mitochondrial matrix; N-terminus appears to play a role in complex assembly +S000030475 CDS YDR529C 4 1496548 1496165 C 2011-02-03 1996-07-31 +S000002938 ORF Verified YDR530C APA2 bifunctional AP-4-A phosphorylase/ADP sulfurylase chromosome 4 L000000091 4 1497768 1496791 C 2011-02-03 1996-07-31 Diadenosine 5',5'''-P1,P4-tetraphosphate phosphorylase II; AP4A phosphorylase involved in catabolism of bis(5'-nucleosidyl) tetraphosphates; APA2 has a paralog, APA1, that arose from the whole genome duplication +S000031311 CDS YDR530C 4 1497768 1496791 C 2011-02-03 1996-07-31 +S000002939 ORF Verified YDR531W CAB1 pantothenate kinase chromosome 4 4 1498232 1499335 W 2011-02-03 1996-07-31 Pantothenate kinase, ATP:D-pantothenate 4'-phosphotransferase; catalyzes the first committed step in the universal biosynthetic pathway for synthesis of coenzyme A (CoA); transcriptionally regulated by Upc2p via a sterol response element +S000031423 CDS YDR531W 4 1498232 1499335 W 2011-02-03 1996-07-31 +S000002940 ORF Verified YDR532C KRE28 chromosome 4 4 1500553 1499396 C 2011-02-03 1996-07-31 Subunit of a kinetochore-microtubule binding complex; complex bridges centromeric heterochromatin and kinetochore MAPs and motors; required for sister chromatid bi-orientation and kinetochore binding of SAC components; complex also includes Spc105p; modified by sumoylation +S000031481 CDS YDR532C 4 1500553 1499396 C 2011-02-03 1996-07-31 +S000002941 ORF Verified YDR533C HSP31 glutathione-independent methylglyoxalase chromosome 4 4 1502160 1501447 C 2011-02-03 1996-07-31 Methylglyoxalase that converts methylglyoxal to D-lactate; involved in oxidative stress resistance, diauxic shift, and stationary phase survival; has similarity to E. coli Hsp31 and C. albicans Glx3p; member of the DJ-1/ThiJ/PfpI superfamily, which includes human DJ-1 involved in Parkinson's disease and cancer; exists as a dimer and contains a putative metal-binding site; protein abundance increases in response to DNA replication stress +S000031524 CDS YDR533C 4 1502160 1501447 C 2011-02-03 1996-07-31 +S000002942 ORF Verified YDR534C FIT1 chromosome 4 4 1504900 1503314 C 2011-02-03 1996-07-31 Mannoprotein that is incorporated into the cell wall; incorporated via a glycosylphosphatidylinositol (GPI) anchor; involved in the retention of siderophore-iron in the cell wall +S000031631 CDS YDR534C 4 1504900 1503314 C 2011-02-03 1996-07-31 +S000002943 ORF Dubious YDR535C chromosome 4 4 1507362 1506606 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YDR535C is not an essential gene +S000032613 CDS YDR535C 4 1507058 1506606 C 2011-02-03 1996-07-31 +S000032612 CDS YDR535C 4 1507362 1507315 C 2011-02-03 1996-07-31 +S000032614 intron YDR535C 4 1507314 1507059 C 2011-02-03 1996-07-31 +S000002944 ORF Verified YDR536W STL1 glucose-inactivated glycerol proton symporter STL1 chromosome 4 L000002130 4 1508005 1509714 W 2011-02-03 1996-07-31 Glycerol proton symporter of the plasma membrane; subject to glucose-induced inactivation, strongly but transiently induced when cells are subjected to osmotic shock +S000032772 CDS YDR536W 4 1508005 1509714 W 2011-02-03 1996-07-31 +S000002946 ORF Verified YDR538W PAD1 phenylacrylic acid decarboxylase PAD1|POF1 chromosome 4 L000001331 4 1510902 1511630 W 2011-02-03 1996-07-31 Phenylacrylic acid decarboxylase; confers resistance to cinnamic acid, decarboxylates aromatic carboxylic acids to the corresponding vinyl derivatives; also has mRNA binding activity; homolog of E. coli UbiX; co-overproduction of Pad1p and Fdc1p greatly increases cinnamic acid decarboxylase activity +S000033597 CDS YDR538W 4 1510902 1511630 W 2011-02-03 1996-07-31 +S000002945 ORF Dubious YDR537C chromosome 4 4 1511461 1510856 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF PAD1/YDR538W +S000032834 CDS YDR537C 4 1511461 1510856 C 2011-02-03 1996-07-31 +S000002947 ORF Verified YDR539W FDC1 putative phenylacrylic acid decarboxylase FDC1 chromosome 4 4 1512094 1513605 W 2011-02-03 1996-07-31 Ferulic acid decarboxylase, also active on p-coumaric acid; essential for decarboxylation of aromatic carboxylic acids to corresponding vinyl derivatives; co-overproduction of Pad1p and Fdc1p greatly increases cinnamic acid decarboxylase activity; structure implicates Glu285 as the general base in the nonoxidative decarboxylation reaction catalyzed by Fdc1p; homolog of E. coli UbiD; GFP-fusion protein localizes to cytoplasm +S000033698 CDS YDR539W 4 1512094 1513605 W 2011-02-03 1996-07-31 +S000002948 ORF Verified YDR540C IRC4 chromosome 4 4 1517675 1517136 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant displays increased levels of spontaneous Rad52p foci; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus +S000034746 CDS YDR540C 4 1517675 1517136 C 2011-02-03 1996-07-31 +S000006879 long_terminal_repeat YDRWdelta31 chromosome 4 4 1518484 1518807 W 2011-02-03 2000-05-19 Ty1 LTR +S000002949 ORF Verified YDR541C carbonyl reductase (NADPH-dependent) chromosome 4 4 1520698 1519664 C 2011-02-03 1996-07-31|2011-02-03 Aldehyde reductase; substrates include both aromatic and aliphatic aldehydes; uses NADPH as cofactor; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000035672 CDS YDR541C 4 1520698 1519664 C 2011-02-03 1996-07-31|2011-02-03 +S000002950 ORF Verified YDR542W PAU10 seripauperin PAU10 chromosome 4 4 1523249 1523611 W 2011-02-03 1996-07-31 Protein of unknown function; SWAT-GFP fusion protein localizes to the endoplasmic reticulum and vacuole, while mCherry fusion localizes to the vacuole; member of the seripauperin multigene family encoded mainly in subtelomeric regions +S000035788 CDS YDR542W 4 1523249 1523611 W 2011-02-03 1996-07-31 +S000028948 telomere TEL04R chromosome 4 4 1524625 1531933 W 321 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome IV; composed of an X element core sequence, X element combinatorial repeats, a short stretch of telomeric repeats, and a long Y' element +S000028949 telomeric_repeat TEL04R 4 1525371 1525466 W 2011-02-03 2003-09-09 Internal telomeric repeats on the right arm of Chromosome IV +S000028950 X_element TEL04R 4 1524625 1525089 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome IV; spans 464 bp and contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YDR543C +S000028951 X_element_combinatorial_repeat TEL04R 4 1525090 1525370 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr IV; spans 280 bp and contains repeats of the D, C, B and A types, Tbf1p binding sites, and ORF YDR544C; formerly called SubTelomeric Repeats +S000028952 Y_prime_element TEL04R 4 1525467 1531933 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome IV; contains an ARS consensus sequence, a region of 36-bp repeats, and ORFs YRF1-1/YDR545W and YDR545C-A +S000002951 ORF Dubious YDR543C chromosome 4 4 1524933 1524634 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035825 CDS YDR543C 4 1524933 1524634 C 2011-02-03 1996-07-31 +S000002952 ORF Dubious YDR544C chromosome 4 4 1525523 1525095 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035945 CDS YDR544C 4 1525523 1525095 C 2011-02-03 1996-07-31 +S000002953 ORF Verified YDR545W YRF1-1 Y' element ATP-dependent helicase protein 1 copy 1|YRF1 chromosome 4 L000004879 4 1526321 1531711 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p +S000036865 CDS YDR545W 4 1526321 1531711 W 2011-02-03 1996-07-31 +S000028617 ORF Dubious YDR545C-A chromosome 4 4 1531342 1530863 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF YRF1-1/YDR545W +S000031458 CDS YDR545C-A 4 1531342 1530863 C 2011-02-03 2003-07-29 +S000028621 ORF Dubious YEL077W-A chromosome 5 5 630 1112 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031470 CDS YEL077W-A 5 630 1112 W 2003-07-29 2003-07-29 +S000006409 ORF Uncharacterized YEL077C Y' element ATP-dependent helicase chromosome 5 5 4097 264 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element +S000034008 CDS YEL077C 5 4097 264 C 1996-07-31 1996-07-31 +S000077377 ARS ARS502 chromosome 5 5 4097 4185 2004-10-19 2004-10-19 Autonomously Replicating Sequence +S000002956 ORF Dubious YEL075W-A YEL076W-C chromosome 5 5 4870 5481 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031130 CDS YEL075W-A 5 4870 5481 W 1996-07-31 1996-07-31 +S000002955 ORF Uncharacterized YEL076C-A chromosome 5 5 5114 4185 C 1996-07-31 1996-07-31 Putative protein of unknown function +S000036122 CDS YEL076C-A 5 4322 4185 C 1996-07-31 1996-07-31 +S000036121 CDS YEL076C-A 5 5114 4602 C 1996-07-31 1996-07-31 +S000036123 intron YEL076C-A 5 4601 4323 C 1996-07-31 1996-07-31 +S000000802 ORF Uncharacterized YEL076C chromosome 5 5 5114 4464 C 1996-07-31 1996-07-31 Putative protein of unknown function +S000033207 CDS YEL076C 5 5114 4464 C 1996-07-31 1996-07-31 +S000000801 ORF Uncharacterized YEL075C chromosome 5 5 5713 5345 C 1996-07-31 1996-07-31 Putative protein of unknown function +S000033136 CDS YEL075C 5 5713 5345 C 1996-07-31 1996-07-31 +S000000800 ORF Dubious YEL074W chromosome 5 5 6126 6464 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; large scale expression analysis showed an increase in mRNA accumulation in strains mutant for exosome components +S000033091 CDS YEL074W 5 6126 6464 W 1996-07-31 1996-07-31 +S000077378 ARS ARS503 chromosome 5 5 6378 6453 2014-11-18 2004-10-19|2014-11-18 Autonomously Replicating Sequence +S000028879 telomere TEL05L chromosome 5 5 6473 1 C -52 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome V; annotated components include an X element core sequence and a long Y' element; TEL05L does have telomeric repeats (TEL05L-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly +S000028880 X_element TEL05L 5 6473 6279 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome V; contains an ARS consensus sequence and spans ORF YEL074W +S000028881 Y_prime_element TEL05L 5 6278 1 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome V; contains an ARS consensus sequence, a region of 36-bp repeats, and six ORFs (YEL075C, YEL076C, YEL076C-A, YEL077C, YEL075W-A, YEL077W-A) +S000000799 ORF Uncharacterized YEL073C chromosome 5 5 7553 7230 C 1996-07-31 1996-07-31 Putative protein of unknown function; located adjacent to ARS503 and the telomere on the left arm of chromosome V; regulated by inositol/choline +S000032128 CDS YEL073C 5 7553 7230 C 1996-07-31 1996-07-31 +S000077379 ARS ARS504 chromosome 5 5 8786 10019 2004-10-19 2004-10-19|2011-02-03 Autonomously Replicating Sequence +S000000798 ORF Verified YEL072W RMD6 chromosome 5 5 13720 14415 W 1996-07-31 1996-07-31 Protein required for sporulation +S000032092 CDS YEL072W 5 13720 14415 W 1996-07-31 1996-07-31 +S000000797 ORF Verified YEL071W DLD3 D-lactate dehydrogenase chromosome 5 5 16355 17845 W 1996-07-31 1996-07-31 2-hydroxyglutarate transhydrogenase, and minor D-lactate dehydrogenase; converts D-2-hydroxyglutarate (D-2HG), an oncometabolite, to alpha-ketoglutarate in the presence of FAD, with concomitant reduction of pyruvate to D-lactate; minor lactate dehydrogenase activity; component of the retrograde regulon that consists of genes whose expression are stimulated by damage to mitochondria and reduced in cells grown with glutamate as the sole nitrogen source; located in the cytoplasm +S000031974 CDS YEL071W 5 16355 17845 W 1996-07-31 1996-07-31 +S000000796 ORF Verified YEL070W DSF1 MAN1|mannitol dehydrogenase DSF1 chromosome 5 5 19589 21097 W 1996-07-31 1996-07-31 Mannitol dehydrogenase; deletion suppresses mutation of mpt5; DSF1 has a paralog, MAN2, that arose from a segmental duplication +S000031743 CDS YEL070W 5 19589 21097 W 1996-07-31 1996-07-31 +S000000795 ORF Verified YEL069C HXT13 HLT1|hexose transporter HXT13 chromosome 5 L000002640 5 23231 21537 C 1996-07-31 1996-07-31 Putative transmembrane polyol transporter; supports growth on and uptake of mannitol and sorbitol with moderate affinity when overexpressed in a strain deleted for hexose family members; minor hexose transport activity when overexpressed in a similar strain; induced by non-fermentable carbon sources; induced in low glucose, repressed in high glucose; HXT13 has a paralog, HXT17, that arose from a segmental duplication +S000030787 CDS YEL069C 5 23231 21537 C 1996-07-31 1996-07-31 +S000000794 ORF Uncharacterized YEL068C chromosome 5 5 25978 25646 C 1996-07-31 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; SWAT-GFP and seamless-GFP fusion proteins localize to the endoplasmic reticulum and mCherry fusion protein localizes to the vacuole +S000037857 CDS YEL068C 5 25978 25646 C 1996-07-31 1996-07-31 +S000000792 ORF Verified YEL066W HPA3 D-amino-acid N-acetyltransferase chromosome 5 L000004380 5 26667 27206 W 1996-07-31 1996-07-31 D-Amino acid N-acetyltransferase that detoxifies D-amino acids; catalyzes N-acetylation of D-amino acids through ordered bi-bi mechanism in which acetyl-CoA is first substrate bound and CoA is last product liberated; acetylates histones and polyamines, also autoacetylates +S000037723 CDS YEL066W 5 26667 27206 W 1996-07-31 1996-07-31 +S000000793 ORF Uncharacterized YEL067C chromosome 5 5 26776 26189 C 1996-07-31 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000037750 CDS YEL067C 5 26776 26189 C 1996-07-31 1996-07-31 +S000000791 ORF Verified YEL065W SIT1 siderophore transporter|ARN3 chromosome 5 5 27657 29543 W 1996-07-31 1996-07-31 Ferrioxamine B transporter; member of the ARN family of transporters that specifically recognize siderophore-iron chelates; transcription is induced during iron deprivation and diauxic shift; potentially phosphorylated by Cdc28p +S000036964 CDS YEL065W 5 27657 29543 W 1996-07-31 1996-07-31 +S000000790 ORF Verified YEL064C AVT2 chromosome 5 5 31239 29797 C 1996-07-31 1996-07-31 Putative transporter; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters +S000036881 CDS YEL064C 5 31239 29797 C 1996-07-31 1996-07-31 +S000000789 ORF Verified YEL063C CAN1 arginine permease CAN1 chromosome 5 L000000213 5 33466 31694 C -50 1996-07-31 1996-07-31 Plasma membrane arginine permease; requires phosphatidyl ethanolamine (PE) for localization, exclusively associated with lipid rafts; mutation confers canavanine resistance; CAN1 has a paralog, ALP1, that arose from the whole genome duplication +S000036793 CDS YEL063C 5 33466 31694 C 1996-07-31 1996-07-31 +S000000788 ORF Verified YEL062W NPR2 nitrogen permease regulating protein NPR2 chromosome 5 L000001274 5 34407 36254 W 2003-09-22 2003-09-22|1996-07-31 Subunit of the Iml1p/SEACIT complex; SEACIT (Iml1p-Npr2p-Npr3p) is a subcomplex of the SEA complex, a coatomer-related complex that associates dynamically with the vacuole; Npr2p may have a structural or regulatory role, supporting Iml1p function as a GAP for the Rag family GTPase Gtr1p, and resulting in inhibition of TORC1 signaling in response to amino acid deprivation; SEACIT is required for non-nitrogen-starvation-induced autophagy; homolog of human tumor suppressor NPRL2 +S000035991 CDS YEL062W 5 34407 36254 W 2003-09-22 2003-09-22|1996-07-31 +S000000787 ORF Verified YEL061C CIN8 kinesin motor protein CIN8|SDS15|KSL2 chromosome 5 L000000340 5 39537 36535 C 2003-09-22 2003-09-22|1996-07-31 Kinesin motor protein; involved in mitotic spindle assembly and chromosome segregation +S000035795 CDS YEL061C 5 39537 36535 C 2003-09-22 2003-09-22|1996-07-31 +S000000786 ORF Verified YEL060C PRB1 proteinase B|CVT1 chromosome 5 L000001480 5 41953 40046 C -48 1996-07-31 1996-07-31 Vacuolar proteinase B (yscB) with H3 N-terminal endopeptidase activity; serine protease of the subtilisin family; involved in protein degradation in the vacuole and required for full protein degradation during sporulation; activity inhibited by Pbi2p; protein abundance increases in response to DNA replication stress; PRB1 has a paralog, YSP3, that arose from the whole genome duplication +S000035710 CDS YEL060C 5 41953 40046 C 1996-07-31 1996-07-31 +S000002954 ORF Verified YEL059C-A SOM1 chromosome 5 L000003993 5 42624 42400 C 1996-07-31 1996-07-31 Subunit of the mitochondrial inner membrane peptidase (IMP); IMP is required for maturation of mitochondrial proteins of the intermembrane space; Som1p facilitates cleavage of a subset of substrates; contains twin cysteine-x9-cysteine motifs +S000035802 CDS YEL059C-A 5 42624 42400 C 1996-07-31 1996-07-31 +S000000785 ORF Dubious YEL059W HHY1 ENV6 chromosome 5 5 42652 42960 W 1996-07-31 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; mutant is hypersensitive to hygromycin B indicative of defects in vacuolar trafficking +S000034663 CDS YEL059W 5 42652 42960 W 1996-07-31 1996-07-31 +S000000784 ORF Verified YEL058W PCM1 phosphoacetylglucosamine mutase PCM1|AGM1 chromosome 5 L000001351 5 43252 44925 W 1996-07-31 1996-07-31 Essential N-acetylglucosamine-phosphate mutase; converts GlcNAc-6-P to GlcNAc-1-P, which is a precursor for the biosynthesis of chitin and for the formation of N-glycosylated mannoproteins and glycosylphosphatidylinositol anchors +S000033785 CDS YEL058W 5 43252 44925 W 1996-07-31 1996-07-31 +S000000783 ORF Verified YEL057C SDD1 chromosome 5 5 45721 45020 C 1996-07-31 1996-07-31 Protein of unknown function; overproduction suppresses lethality due to expression of the dominant PET9 allele AAC2-A128P; may have a role in telomere maintenance; target of UME6 regulation +S000033614 CDS YEL057C 5 45721 45020 C 1996-07-31 1996-07-31 +S000000782 ORF Verified YEL056W HAT2 chromosome 5 L000003400 5 47168 48373 W 1996-07-31 1996-07-31 Subunit of the Hat1p-Hat2p histone acetyltransferase complex; required for high affinity binding of the complex to free histone H4, thereby enhancing Hat1p activity; similar to human RbAp46 and 48; has a role in telomeric silencing +S000033568 CDS YEL056W 5 47168 48373 W 1996-07-31 1996-07-31 +S000000781 ORF Verified YEL055C POL5 DNA-directed DNA polymerase chromosome 5 L000004119 5 51539 48471 C 1996-07-31 1996-07-31 DNA Polymerase phi; has sequence similarity to the human MybBP1A and weak sequence similarity to B-type DNA polymerases, not required for chromosomal DNA replication; required for the synthesis of rRNA +S000032784 CDS YEL055C 5 51539 48471 C 1996-07-31 1996-07-31 +S000081374 snoRNA_gene snR80 SNR80 chromosome 5 5 52320 52150 C 2005-11-29 2005-11-29 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U776 and small subunit (SSU) rRNA at position U759 +S000113618 noncoding_exon snR80 5 52320 52150 C 2005-11-29 2005-11-29 +S000028744 ORF Dubious YEL053W-A chromosome 5 5 52908 53255 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene RPL12A/YEL054C +S000033414 CDS YEL053W-A 5 52908 53255 W 2003-07-29 2003-07-29 +S000000780 ORF Verified YEL054C RPL12A uL11|ribosomal 60S subunit protein L12A|L11|YL23|L15A|L12A chromosome 5 L000001712 5 53218 52721 C 1996-07-31 1996-07-31 Ribosomal 60S subunit protein L12A; rpl12a rpl12b double mutant exhibits slow growth and slow translation; homologous to mammalian ribosomal protein L12 and bacterial L11; RPL12A has a paralog, RPL12B, that arose from the whole genome duplication +S000032694 CDS YEL054C 5 53218 52721 C 1996-07-31 1996-07-31 +S000000779 ORF Verified YEL053C MAK10 NAA35 chromosome 5 L000000983 5 56102 53901 C -43 1996-07-31 1996-07-31 Non-catalytic subunit of the NatC N-terminal acetyltransferase; required for replication of dsRNA virus; expression is glucose-repressible; human NatC ortholog, Naa35, requires co-expression of the human catalytic subunit, Naa30, to functionally complement the null allele +S000032563 CDS YEL053C 5 56102 53901 C 1996-07-31 1996-07-31 +S000000778 ORF Verified YEL052W AFG1 chromosome 5 L000000055 5 56571 58100 W 1996-07-31 1996-07-31 Protein that may act as a chaperone for cytochrome c oxidase subunits; conserved protein; may act as a chaperone in the degradation of misfolded or unassembled cytochrome c oxidase subunits; localized to matrix face of the mitochondrial inner membrane; member of the AAA family but lacks a protease domain +S000031642 CDS YEL052W 5 56571 58100 W 1996-07-31 1996-07-31 +S000000777 ORF Verified YEL051W VMA8 H(+)-transporting V1 sector ATPase subunit D chromosome 5 L000002463 5 58378 59148 W 1996-07-31 1996-07-31 Subunit D of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; plays a role in the coupling of proton transport and ATP hydrolysis; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits +S000031545 CDS YEL051W 5 58378 59148 W 1996-07-31 1996-07-31 +S000077380 ARS ARS507 ARSV-59 chromosome 5 5 59338 59477 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000178082 ARS_consensus_sequence ARS507 5 59470 59454 C 2014-11-18 2014-11-18 +S000028545 ORF Dubious YEL050W-A chromosome 5 5 59549 59740 W 2003-07-29 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by fungal homology and RT-PCR +S000031195 CDS YEL050W-A 5 59549 59740 W 2003-07-29 2003-07-29 +S000000776 ORF Verified YEL050C RML2 mitochondrial 54S ribosomal protein RML2 chromosome 5 L000004131 5 60851 59670 C 1996-07-31 1996-07-31 Mitochondrial ribosomal protein of the large subunit (L2); has similarity to E. coli L2 ribosomal protein; mutant allele (fat21) causes inability to utilize oleate, and induce oleic acid oxidation; may interfere with activity of the Adr1p transcription factor +S000031449 CDS YEL050C 5 60851 59670 C 1996-07-31 1996-07-31 +S000006458 snoRNA_gene snR67 SNR67 chromosome 5 L000004536 5 61352 61433 W 2000-05-19 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions G2619 and U2724 +S000030853 noncoding_exon snR67 5 61352 61433 W 2000-05-19 2000-05-19 +S000006444 snoRNA_gene snR53 SNR53 chromosome 5 L000004522 5 61699 61789 W 2000-05-19 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of small subunit (SSU) rRNA at position A796 +S000030737 noncoding_exon snR53 5 61699 61789 W 2000-05-19 2000-05-19 +S000006578 tRNA_gene tG(GCC)E chromosome 5 L000003808 5 61960 61890 C 2000-05-19 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000037897 noncoding_exon tG(GCC)E 5 61960 61890 C 2000-05-19 2000-05-19 +S000006889 long_terminal_repeat YELWdelta1 chromosome 5 5 62081 62756 W 2000-05-19 2000-05-19 Ty1 LTR +S000006890 long_terminal_repeat YELWdelta2 chromosome 5 5 62142 62474 W 2000-05-19 2000-05-19 Ty1 LTR +S000000775 ORF Verified YEL049W PAU2 seripauperin PAU2 chromosome 5 L000002738 5 63728 64090 W 1996-07-31 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric region; active during alcoholic fermentation; regulated by anaerobiosis; negatively regulated by oxygen; repressed by heme +S000030708 CDS YEL049W 5 63728 64090 W 1996-07-31 1996-07-31 +S000000774 ORF Verified YEL048C TCA17 chromosome 5 5 65167 64709 C 1996-07-31 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic; promotes association of TRAPPII-specific subunits with the TRAPP core complex; sedlin related; human Sedlin mutations cause SEDT, a skeletal disorder +S000030547 CDS YEL048C 5 65167 64709 C 1996-07-31 1996-07-31 +S000000773 ORF Verified YEL047C FRD1 fumarate reductase|FRDS1 chromosome 5 5 66797 65385 C 1996-07-31 1996-07-31 Soluble fumarate reductase; required with isoenzyme Osm1p for anaerobic growth; may interact with ribosomes, based on co-purification experiments; authentic, non-tagged protein is detected in purified mitochondria in high-throughput studies; similar to Arxula adeninovorans fumarate reductase; protein abundance increases in response to DNA replication stress; FRD1 has a paralog, OSM1, that arose from the whole genome duplication +S000030396 CDS YEL047C 5 66797 65385 C 1996-07-31 1996-07-31 +S000000772 ORF Verified YEL046C GLY1 threonine aldolase GLY1 chromosome 5 L000000718 5 68792 67629 C 1996-07-31 1996-07-31 Threonine aldolase; catalyzes the cleavage of L-allo-threonine and L-threonine to glycine; involved in glycine biosynthesis +S000037630 CDS YEL046C 5 68792 67629 C 1996-07-31 1996-07-31 +S000000771 ORF Dubious YEL045C chromosome 5 5 69265 68840 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion gives MMS sensitivity, growth defect under alkaline conditions, less than optimal growth upon citric acid stress +S000037503 CDS YEL045C 5 69265 68840 C 1996-07-31 1996-07-31 +S000000770 ORF Verified YEL044W IES6 chromosome 5 5 69757 70257 W 1996-07-31 1996-07-31 Component of the INO80 chromatin remodeling complex; critical for INO80 function; involved in regulation of chromosome segregation and maintenance of normal centromeric chromatin structure; human ortholog INO80C is a member of the human INO80 complex; implicated in DNA repair based on genetic interactions with RAD52 epistasis genes +S000037449 CDS YEL044W 5 69757 70257 W 1996-07-31 1996-07-31 +S000000769 ORF Verified YEL043W chromosome 5 5 70478 73348 W 1996-07-31 1996-07-31 Predicted cytoskeleton protein involved in intracellular signaling; based on quantitative analysis of protein-protein interaction maps; may interact with ribosomes, based on co-purification studies; contains fibronectin type III domain fold +S000036714 CDS YEL043W 5 70478 73348 W 1996-07-31 1996-07-31 +S000000768 ORF Verified YEL042W GDA1 guanosine diphosphatase chromosome 5 L000000695 5 73771 75327 W 1996-07-31 1996-07-31 Guanosine diphosphatase located in the Golgi; involved in the transport of GDP-mannose into the Golgi lumen, converting GDP to GMP after mannose is transferred to substrates; null mutants are defective in sporulation and pre-meiotic S phase entry; orthologous to human ENTPD6, a meiosis-associated non-obstructive azoospermia (NOA) related gene identified in GWAS studies +S000036632 CDS YEL042W 5 73771 75327 W 1996-07-31 1996-07-31 +S000000767 ORF Verified YEL041W YEF1 NADH/NAD(+) kinase chromosome 5 5 75944 77431 W 1996-07-31 1996-07-31 ATP-NADH kinase; phosphorylates both NAD and NADH; homooctameric structure consisting of 60-kDa subunits; similar to Pos5p; overexpression complements certain pos5 phenotypes; YEF1 has a paralog, UTR1, that arose from the whole genome duplication +S000036511 CDS YEL041W 5 75944 77431 W 1996-07-31 1996-07-31 +S000000766 ORF Verified YEL040W UTR2 CRH2 chromosome 5 L000002448 5 78053 79456 W 1996-07-31 1996-07-31 Chitin transglycosylase; functions in the transfer of chitin to beta(1-6) and beta(1-3) glucans in the cell wall; similar to and functionally redundant with Crh1; glycosylphosphatidylinositol (GPI)-anchored protein localized to bud neck +S000036453 CDS YEL040W 5 78053 79456 W 1996-07-31 1996-07-31 +S000000765 ORF Verified YEL039C CYC7 cytochrome c isoform 2 chromosome 5 L000000451 5 79977 79636 C -27 1996-07-31 1996-07-31 Cytochrome c isoform 2, expressed under hypoxic conditions; also known as iso-2-cytochrome c; electron carrier of the mitochondrial intermembrane space that transfers electrons from ubiquinone-cytochrome c oxidoreductase to cytochrome c oxidase during cellular respiration; protein abundance increases in response to DNA replication stress; CYC7 has a paralog, CYC1, that arose from the whole genome duplication +S000035665 CDS YEL039C 5 79977 79636 C 1996-07-31 1996-07-31 +S000000764 ORF Verified YEL038W UTR4 putative acireductone synthase UTR4 chromosome 5 L000002449 5 80462 81145 W 2006-05-09 1996-07-31|2006-05-09 Protein with sequence similarity to acireductone synthases; involved in methionine salvage; found in both the cytoplasm and nucleus +S000035624 CDS YEL038W 5 80462 81145 W 2006-05-09 1996-07-31|2006-05-09 +S000000763 ORF Verified YEL037C RAD23 chromosome 5 L000001568 5 82603 81407 C -26 1996-07-31 1996-07-31 Protein with ubiquitin-like N terminus; subunit of Nuclear Excision Repair Factor 2 (NEF2) with Rad4p that binds damaged DNA; enhances protein deglycosylation activity of Png1p; also involved, with Rad4p, in ubiquitylated protein turnover; Rad4p-Rad23p heterodimer binds to promoters of DNA damage response genes to repress their transcription in the absence of DNA damage +S000035488 CDS YEL037C 5 82603 81407 C 1996-07-31 1996-07-31 +S000000762 ORF Verified YEL036C ANP1 MNN8|GEM3 chromosome 5 L000000089 5 84552 83050 C -26 1996-07-31 1996-07-31 Subunit of the alpha-1,6 mannosyltransferase complex; type II membrane protein; has a role in retention of glycosyltransferases in the Golgi; involved in osmotic sensitivity and resistance to aminonitrophenyl propanediol +S000034468 CDS YEL036C 5 84552 83050 C 1996-07-31 1996-07-31 +S000000761 ORF Uncharacterized YEL035C UTR5 chromosome 5 L000002450 5 85545 85045 C 1996-07-31 1996-07-31 Protein of unknown function; transcription may be regulated by Gcr1p; essential for growth under standard (aerobic) conditions but not under anaerobic conditions +S000034388 CDS YEL035C 5 85545 85045 C 1996-07-31 1996-07-31 +S000000760 ORF Verified YEL034W HYP2 translation elongation factor eIF-5A|eIF-5A|eIF5A|TIF51A chromosome 5 L000000847|L000002307 5 85676 86149 W 1996-07-31 1996-07-31 Translation elongation factor eIF-5A; required for translation of proteins containing polyproline stretches, including Bni1p, and this leads to a requirement for mating projection formation; structural homolog of bacterial EF-P; undergoes an essential hypusination modification; HYP2 has a paralog, ANB1, that arose from the whole genome duplication; human EIF5A complements the inviability of the yeast hyp2 anb1 double null mutant +S000034356 CDS YEL034W 5 85676 86149 W 1996-07-31 1996-07-31 +S000000759 ORF Uncharacterized YEL033W MTC7 chromosome 5 5 86179 86598 W 1996-07-31 1996-07-31 Protein of unknown function; predicted metabolic role based on network analysis derived from ChIP experiments, a large-scale deletion study and localization of transcription factor binding sites; null mutant is sensitive to temperature oscillation in a cdc13-1 mutant +S000033441 CDS YEL033W 5 86179 86598 W 1996-07-31 1996-07-31 +S000028743 ORF Dubious YEL034C-A chromosome 5 5 86215 85613 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps HYP2/YEL034W, a verified gene that encodes eiF-5A +S000033413 CDS YEL034C-A 5 86215 85613 C 2003-07-29 2003-07-29 +S000006724 tRNA_gene tS(AGA)E chromosome 5 L000003789 5 86604 86685 W 2000-05-19 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032362 noncoding_exon tS(AGA)E 5 86604 86685 W 2000-05-19 2000-05-19 +S000000758 ORF Verified YEL032W MCM3 MCM DNA helicase complex subunit MCM3 chromosome 5 L000001039 5 86937 89852 W -24 1996-07-31 1996-07-31 Protein involved in DNA replication; component of the Mcm2-7 hexameric helicase complex that binds chromatin as a part of the pre-replicative complex +S000033351 CDS YEL032W 5 86937 89852 W 1996-07-31 1996-07-31 +S000028620 ORF Dubious YEL032C-A chromosome 5 5 87201 87040 C 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031469 CDS YEL032C-A 5 87201 87040 C 2003-07-29 2003-07-29 +S000000757 ORF Verified YEL031W SPF1 ion-transporting P-type ATPase SPF1|PER9|PIO1|COD1 chromosome 5 L000003454 5 90258 93905 W 1996-07-31 1996-07-31 P-type ATPase, ion transporter of the ER membrane; required to maintain normal lipid composition of intracellular compartments and proper targeting of mitochondrial outer membrane tail-anchored proteins; involved in ER function and Ca2+ homeostasis; required for regulating Hmg2p degradation; confers sensitivity to a killer toxin (SMKT) produced by Pichia farinosa KK1 +S000033284 CDS YEL031W 5 90258 93905 W 1996-07-31 1996-07-31 +S000077381 ARS ARS508 ARSV-94 chromosome 5 5 93978 94218 2006-09-07 2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000178083 ARS_consensus_sequence ARS508 5 94055 94071 W 2014-11-18 2014-11-18 +S000000756 ORF Verified YEL030W ECM10 Hsp70 family ATPase ECM10|SSC3 chromosome 5 L000003885 5 94644 96578 W 1996-07-31 1996-07-31 Heat shock protein of the Hsp70 family; localized in mitochondrial nucleoids, plays a role in protein translocation, interacts with Mge1p in an ATP-dependent manner; overexpression induces extensive mitochondrial DNA aggregations; ECM10 has a paralog, SSC1, that arose from the whole genome duplication +S000033225 CDS YEL030W 5 94644 96578 W 1996-07-31 1996-07-31 +S000028619 ORF Dubious YEL030C-A chromosome 5 5 94897 94583 C 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031462 CDS YEL030C-A 5 94897 94583 C 2003-07-29 2003-07-29 +S000000755 ORF Verified YEL029C BUD16 putative pyridoxal kinase BUD16 chromosome 5 5 97796 96858 C 1996-07-31 1996-07-31 Putative pyridoxal kinase; a key enzyme involved in pyridoxal 5'-phosphate synthesis, the active form of vitamin B6; required for genome integrity; involved in bud-site selection; similarity to yeast BUD17 and human pyridoxal kinase (PDXK) +S000032366 CDS YEL029C 5 97796 96858 C 1996-07-31 1996-07-31 +S000000754 ORF Uncharacterized YEL028W chromosome 5 5 98668 99129 W 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YEL028C is not an essential gene +S000031432 CDS YEL028W 5 98668 99129 W 1996-07-31 1996-07-31 +S000006886 long_terminal_repeat YELCdelta3 chromosome 5 5 99664 99490 C 2000-05-19 2000-05-19 Ty1 LTR +S000006660 tRNA_gene tM(CAU)E IMT4 chromosome 5 L000003790 5 100133 100204 W 2000-05-19 2000-05-19 Methionine initiator tRNA (tRNA-Met); predicted by tRNAscan-SE analysis; one of four initiator methionine tRNAs in yeast that are functional for translation +S000034533 noncoding_exon tM(CAU)E 5 100133 100204 W 2000-05-19 2000-05-19 +S000000753 ORF Verified YEL027W VMA3 H(+)-transporting V0 sector ATPase subunit c|CUP5|GEF2|CLS7 chromosome 5 L000000441 5 100769 101251 W -18 1996-07-31 1996-07-31 Proteolipid subunit c of the V0 domain of vacuolar H(+)-ATPase; dicyclohexylcarbodiimide binding subunit; required for vacuolar acidification and important for copper and iron metal ion homeostasis +S000031319 CDS YEL027W 5 100769 101251 W 1996-07-31 1996-07-31 +S000000752 ORF Verified YEL026W SNU13 RNA binding protein SNU13 chromosome 5 5 101943 102323 W 1996-07-31 1996-07-31 RNA binding protein; part of U3 snoRNP involved in rRNA processing, part of U4/U6-U5 tri-snRNP involved in mRNA splicing, similar to human 15.5K protein +S000031209 CDS YEL026W 5 101943 102323 W 1996-07-31 1996-07-31 +S000000751 ORF Uncharacterized YEL025C SRI1 chromosome 5 5 106147 102581 C 1996-07-31 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000030133 CDS YEL025C 5 106147 102581 C 1996-07-31 1996-07-31 +S000000750 ORF Verified YEL024W RIP1 ubiquinol--cytochrome-c reductase catalytic subunit RIP1 chromosome 5 L000001643 5 107260 107907 W 1996-07-31 1996-07-31 Ubiquinol-cytochrome-c reductase; a Rieske iron-sulfur protein of the mitochondrial cytochrome bc1 complex; transfers electrons from ubiquinol to cytochrome c1 during respiration; during import, Rip1p is first imported into the mitochondrial matrix where it is processed, acquires its Fe-S cluster, and is folded, then is translocated into the inner membrane by the action of a homo-oligomer of Bcs1p, and finally is delivered by Bcs1p to Complex III for assembly +S000030065 CDS YEL024W 5 107260 107907 W 1996-07-31 1996-07-31 +S000000749 ORF Uncharacterized YEL023C chromosome 5 5 110552 108504 C 1996-07-31 1996-07-31 Putative protein of unknown function; expression is increased greatly during sporulation; YEL023C is not an essential gene +S000029902 CDS YEL023C 5 110552 108504 C 1996-07-31 1996-07-31 +S000000748 ORF Verified YEL022W GEA2 Arf family guanine nucleotide exchange factor GEA2 chromosome 5 L000004717 5 111421 115800 W 1996-07-31 1996-07-31 Guanine nucleotide exchange factor for ADP ribosylation factors (ARFs); involved in vesicular transport between the Golgi and ER, Golgi organization, and actin cytoskeleton organization; GEA2 has a paralog, GEA1, that arose from the whole genome duplication +S000037316 CDS YEL022W 5 111421 115800 W 1996-07-31 1996-07-31 +S000000747 ORF Verified YEL021W URA3 orotidine-5'-phosphate decarboxylase chromosome 5 L000002432 5 116167 116970 W -7 1996-07-31 1996-07-31 Orotidine-5'-phosphate (OMP) decarboxylase; catalyzes the sixth enzymatic step in the de novo biosynthesis of pyrimidines, converting OMP into uridine monophosphate (UMP); converts 5-FOA into 5-fluorouracil, a toxic compound +S000037201 CDS YEL021W 5 116167 116970 W 1996-07-31 1996-07-31 +S000007256 ORF Verified YEL020W-A TIM9 protein transporter TIM9 chromosome 5 L000004718 5 117211 117474 W 1999-07-17 1999-07-17 Essential protein of the mitochondrial intermembrane space; forms a complex with Tim10p (TIM10 complex) that delivers hydrophobic proteins to the TIM22 complex for insertion into the inner membrane +S000034788 CDS YEL020W-A 5 117211 117474 W 1999-07-17 1999-07-17 +S000028544 ORF Dubious YEL020C-B chromosome 5 5 117380 117183 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene YEL020W-A; identified by fungal homology and RT-PCR +S000031194 CDS YEL020C-B 5 117380 117183 C 2003-07-29 2003-07-29 +S000006490 ncRNA_gene RPR1 RPR1 chromosome 5 L000001748 5 118035 117667 C -6 2000-05-19 2000-05-19 RNA component of nuclear RNase P; nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; may be responsible for recognition of substrate tRNAs +S000032263 noncoding_exon RPR1 5 118035 117667 C 2000-05-19 2000-05-19 +S000006888 long_terminal_repeat YELCtau1 chromosome 5 5 118551 118230 C 2000-05-19 2000-05-19 Ty4 LTR +S000000746 ORF Verified YEL020C PXP1 putative indolepyruvate decarboxylase family protein chromosome 5 5 120299 118617 C 1996-07-31 1996-07-31 Peroxisomal matrix protein; well-conserved in fungi; contains tripartite homology domain of thiamine pyrophosphate (TPP) enzymes; targeted to peroxisomes by Pex5p; contains low sequence identity with Pdc1p; mRNA identified as translated by ribosome profiling data +S000037043 CDS YEL020C 5 120299 118617 C 1996-07-31 1996-07-31 +S000000745 ORF Verified YEL019C MMS21 SUMO ligase MMS21|PSO10|NSE2 chromosome 5 L000001125 5 121301 120498 C 1996-07-31 1996-07-31 Highly conserved SUMO E3 ligase subunit of SMC5-SMC6 complex; required for anchoring dsDNA breaks to the nuclear periphery; SMC5-SMC6 plays a key role in removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; required for efficient sister chromatid cohesion; mutants are sensitive to MMS, show increased spontaneous mutation and mitotic recombination; SUMOylates and inhibits Snf1p function; supports nucleolar function +S000035285 CDS YEL019C 5 121301 120498 C 1996-07-31 1996-07-31 +S000000744 ORF Verified YEL018W EAF5 chromosome 5 5 121471 122310 W 1996-07-31 1996-07-31 Non-essential subunit of the NuA4 acetyltransferase complex; Esa1p-associated factor; relocalizes to the cytosol in response to hypoxia +S000035234 CDS YEL018W 5 121471 122310 W 1996-07-31 1996-07-31 +S000028742 ORF Dubious YEL018C-A chromosome 5 5 121988 121455 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF EAF5/YEL018W +S000033412 CDS YEL018C-A 5 121988 121455 C 2003-07-29 2003-07-29 +S000002103 ORF Verified YEL017C-A PMP2 proteolipid ATPase chromosome 5 L000001454 5 122929 122798 C 1996-07-31 1996-07-31 Proteolipid associated with plasma membrane H(+)-ATPase (Pma1p); regulates plasma membrane H(+)-ATPase activity; protein abundance increases in response to DNA replication stress; PMP2 has a paralog, PMP1, that arose from the whole genome duplication +S000035297 CDS YEL017C-A 5 122929 122798 C 1996-07-31 1996-07-31 +S000000743 ORF Verified YEL017W GTT3 chromosome 5 5 123657 124670 W 1996-07-31 1996-07-31 Protein of unknown function may be involved in glutathione metabolism; function suggested by computational analysis of large-scale protein-protein interaction data; N- and C-terminal fusion proteins localize to the cell periphery +S000035057 CDS YEL017W 5 123657 124670 W 1996-07-31 1996-07-31 +S000000742 ORF Verified YEL016C NPP2 nucleotide diphosphatase/phosphodiesterase NPP2 chromosome 5 5 126218 124737 C 1996-07-31 1996-07-31 Nucleotide pyrophosphatase/phosphodiesterase; mediates extracellular nucleotide phosphate hydrolysis along with Npp1p and Pho5p; activity and expression enhanced during conditions of phosphate starvation; involved in spore wall assembly; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; NPP2 has a paralog, NPP1, that arose from the whole genome duplication; npp1 npp2 double mutant exhibits reduced dityrosine fluorescence relative to single mutants +S000034054 CDS YEL016C 5 126218 124737 C 1996-07-31 1996-07-31 +S000000741 ORF Verified YEL015W EDC3 LSM16|DCP3 chromosome 5 5 126629 128284 W 1996-07-31 1996-07-31 Non-essential conserved protein with a role in mRNA decapping; specifically affects the function of the decapping enzyme Dcp1p; mediates decay of the RPS28B mRNA via binding to both Rps28Bp (or Rps28Ap) and the RPS28B mRNA; mediates decay of the YRA1 mRNA by a different, translation-independent mechanism; localizes to cytoplasmic mRNA processing bodies; forms cytoplasmic foci upon DNA replication stress +S000034021 CDS YEL015W 5 126629 128284 W 1996-07-31 1996-07-31 +S000000740 ORF Dubious YEL014C chromosome 5 5 128608 128303 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033749 CDS YEL014C 5 128608 128303 C 1996-07-31 1996-07-31 +S000000739 ORF Verified YEL013W VAC8 protein anchor VAC8|YEB3 chromosome 5 L000004028 5 128825 130561 W 1996-07-31 1996-07-31 Phosphorylated and palmitoylated vacuolar membrane protein; interacts with Atg13p, required for the cytoplasm-to-vacuole targeting (Cvt) pathway; interacts with Nvj1p to form nucleus-vacuole junctions +S000033107 CDS YEL013W 5 128825 130561 W 1996-07-31 1996-07-31 +S000006697 tRNA_gene tQ(UUG)E2 chromosome 5 L000003807 5 131153 131082 C 2000-05-19 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034949 noncoding_exon tQ(UUG)E2 5 131153 131082 C 2000-05-19 2000-05-19 +S000000738 ORF Verified YEL012W UBC8 E2 ubiquitin-conjugating protein UBC8|GID3 chromosome 5 L000002410 5 131772 132551 W 2000-12-01 2000-12-01|1996-07-31 Ubiquitin-conjugating enzyme that regulates gluconeogenesis; negatively regulates gluconeogenesis by mediating the glucose-induced ubiquitination of fructose-1,6-bisphosphatase (FBPase); cytoplasmic enzyme that catalyzes the ubiquitination of histones in vitro +S000033012 CDS YEL012W 5 131772 131776 W 2000-12-01 2000-12-01 +S000033013 CDS YEL012W 5 131900 132551 W 2000-12-01 2000-12-01|1996-07-31 +S000033014 intron YEL012W 5 131777 131899 W 2000-12-01 2000-12-01 +S000000737 ORF Verified YEL011W GLC3 1,4-alpha-glucan branching enzyme|GHA1 chromosome 5 L000000705 5 133120 135234 W -2 1996-07-31 1996-07-31 Glycogen branching enzyme, involved in glycogen accumulation; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress; glycogen accumulation defect of the null mutant is functionally complemented by human GBE1, which is associated with glycogen storage disease +S000032907 CDS YEL011W 5 133120 135234 W 1996-07-31 1996-07-31 +S000006618 tRNA_gene tK(CUU)E1 chromosome 5 L000003806 5 135497 135425 C 2000-05-19 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000037790 noncoding_exon tK(CUU)E1 5 135497 135425 C 2000-05-19 2000-05-19 +S000006887 long_terminal_repeat YELCdelta4 chromosome 5 5 135939 135612 C 2000-05-19 2000-05-19 Ty1 LTR +S000000736 ORF Dubious YEL010W chromosome 5 5 136279 136629 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032835 CDS YEL010W 5 136279 136629 W 1996-07-31 1996-07-31 +S000028741 ORF Dubious YEL009C-A chromosome 5 5 136778 136371 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YEL010W +S000033411 CDS YEL009C-A 5 136778 136371 C 2003-07-29 2003-07-29 +S000006891 long_terminal_repeat YELWdelta5 chromosome 5 5 137324 137639 W 2000-05-19 2000-05-19 Ty1 LTR +S000006892 long_terminal_repeat YELWdelta6 chromosome 5 5 138221 138553 W 2000-05-19 2000-05-19 Ty1 LTR +S000006710 tRNA_gene tR(UCU)E chromosome 5 L000003791 5 138666 138737 W 2000-05-19 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000037841 noncoding_exon tR(UCU)E 5 138666 138737 W 2000-05-19 2000-05-19 +S000000735 ORF Verified YEL009C GCN4 amino acid starvation-responsive transcription factor GCN4|AAS101|ARG9|AAS3 chromosome 5 L000000683 5 139763 138918 C -3 1996-07-31 1996-07-31 bZIP transcriptional activator of amino acid biosynthetic genes; activator responds to amino acid starvation; expression is tightly regulated at both the transcriptional and translational levels +S000032641 CDS YEL009C 5 139763 138918 C 1996-07-31 1996-07-31 +S000000734 ORF Uncharacterized YEL008W chromosome 5 5 140512 140892 W 1996-07-31 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YEL008W is not an essential gene; predicted to be involved in metabolism +S000032595 CDS YEL008W 5 140512 140892 W 1996-07-31 1996-07-31 +S000028618 ORF Dubious YEL008C-A chromosome 5 5 140818 140726 C 2003-07-29 2003-07-29 Protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031461 CDS YEL008C-A 5 140818 140726 C 2003-07-29 2003-07-29 +S000000733 ORF Verified YEL007W MIT1 TOS9 chromosome 5 5 141892 143892 W 2011-02-03 1996-07-31 Transcriptional regulator of pseudohyphal growth; protein with sequence similarity to S. pombe gti1+ (gluconate transport inducer 1) and C. albicans Wor1 +S000031610 CDS YEL007W 5 141892 143892 W 2011-02-03 1996-07-31 +S000000732 ORF Verified YEL006W YEA6 NAD+ transporter|NDT2 chromosome 5 5 144327 145334 W 2011-02-03 1996-07-31 Putative mitochondrial NAD+ transporter; member of the mitochondrial carrier subfamily (see also YIA6); has putative human ortholog; YEA6 has a paralog, YIA6, that arose from the whole genome duplication +S000031480 CDS YEL006W 5 144327 145334 W 2011-02-03 1996-07-31 +S000077382 ARS ARS510 ARSV-146 chromosome 5 5 145678 145840 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000000731 ORF Verified YEL005C VAB2 VAB31 chromosome 5 5 146755 145907 C 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; interacts with Vps21p-GFP; has potential role in vacuolar function, as suggested by its ability to bind Vac8p; likely member of; Vab2p-GFP-fusion localizes to cytoplasm in punctate pattern +S000030477 CDS YEL005C 5 146755 145907 C 2011-02-03 1996-07-31 +S000000730 ORF Verified YEL004W YEA4 chromosome 5 L000004419 5 146951 147979 W 2011-02-03 1996-07-31 Uridine diphosphate-N-acetylglucosamine (UDP-GlcNAc) transporter; required for cell wall chitin synthesis; localized to the ER +S000030440 CDS YEL004W 5 146951 147979 W 2011-02-03 1996-07-31 +S000000729 ORF Verified YEL003W GIM4 tubulin-binding prefolding complex subunit GIM4|PFD2 chromosome 5 L000004368 5 148176 148599 W 2011-02-03 1996-07-31|2007-07-09 Subunit of the heterohexameric cochaperone prefoldin complex; complex binds specifically to cytosolic chaperonin and transfers target proteins to it +S000030310 CDS YEL003W 5 148176 148194 W 2011-02-03 1996-07-31|2007-07-09 +S000123269 CDS YEL003W 5 148283 148599 W 2011-02-03 2007-07-09 +S000123268 intron YEL003W 5 148195 148282 W 2011-02-03 2007-07-09 +S000000728 ORF Verified YEL002C WBP1 dolichyl-diphosphooligosaccharide-protein glycotransferase chromosome 5 L000002483 5 150014 148722 C 2011-02-03 1996-07-31 Beta subunit of the oligosaccharyl transferase glycoprotein complex; required for N-linked glycosylation of proteins in the endoplasmic reticulum; human homolog DDOST can complement yeast growth defect during down-regulation of yeast gene +S000037446 CDS YEL002C 5 150014 148722 C 2011-02-03 1996-07-31 +S000000727 ORF Verified YEL001C IRC22 chromosome 5 5 150978 150301 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion localizes to the ER; YEL001C is non-essential; null mutant displays increased levels of spontaneous Rad52p foci +S000037333 CDS YEL001C 5 150978 150301 C 2011-02-03 1996-07-31 +S000006467 centromere CEN5 CEN5 chromosome 5 L000000298 5 151987 152104 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome V centromere +S000077269 centromere_DNA_Element_I CEN5 5 151987 151996 W 2011-02-03 2004-10-04 +S000077270 centromere_DNA_Element_II CEN5 5 151997 152079 W 2011-02-03 2004-10-04 +S000077271 centromere_DNA_Element_III CEN5 5 152080 152104 W 2011-02-03 2004-10-04 +S000000803 ORF Verified YER001W MNN1 alpha-1,3-mannosyltransferase MNN1 chromosome 5 L000001126 5 153520 155808 W 0 2011-02-03 1996-07-31 Alpha-1,3-mannosyltransferase; integral membrane glycoprotein of the Golgi complex, required for addition of alpha1,3-mannose linkages to N-linked and O-linked oligosaccharides, one of five S. cerevisiae proteins of the MNN1 family +S000033040 CDS YER001W 5 153520 155808 W 2011-02-03 1996-07-31 +S000000804 ORF Verified YER002W NOP16 chromosome 5 5 156803 157498 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; involved in 60S ribosomal subunit biogenesis +S000033709 CDS YER002W 5 156803 157498 W 2011-02-03 1996-07-31 +S000000805 ORF Verified YER003C PMI40 mannose-6-phosphate isomerase PMI40|PMI chromosome 5 L000001452 5 159118 157736 C 2011-02-03 1996-07-31 Mannose-6-phosphate isomerase; catalyzes the interconversion of fructose-6-P and mannose-6-P; required for early steps in protein mannosylation +S000033753 CDS YER003C 5 158994 157736 C 2011-02-03 1996-07-31 +S000033752 CDS YER003C 5 159118 159088 C 2011-02-03 1996-07-31 +S000033754 intron YER003C 5 159087 158995 C 2011-02-03 1996-07-31 +S000000806 ORF Verified YER004W FMP52 chromosome 5 5 159580 160275 W 2011-02-03 1996-07-31 Protein of unknown function; localized to the mitochondrial outer membrane; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000033918 CDS YER004W 5 159580 160275 W 2011-02-03 1996-07-31 +S000000807 ORF Verified YER005W YND1 apyrase|YEJ5|APY1 chromosome 5 S000007428 5 160550 162442 W 2011-02-03 1996-07-31 Apyrase with wide substrate specificity; helps prevent inhibition of glycosylation by hydrolyzing nucleoside tri- and diphosphates that inhibit glycotransferases; partially redundant with Gda1p; mediates adenovirus E4orf4-induced toxicity +S000034049 CDS YER005W 5 160550 162442 W 2011-02-03 1996-07-31 +S000000808 ORF Verified YER006W NUG1 RNA-binding GTPase NUG1 chromosome 5 5 162723 164285 W 2011-02-03 1996-07-31 GTPase that associates with nuclear 60S pre-ribosomes; required for export of 60S ribosomal subunits from the nucleus +S000034937 CDS YER006W 5 162723 164285 W 2011-02-03 1996-07-31 +S000000809 ORF Verified YER007W PAC2 chromosome 5 L000001329 5 164527 166083 W 2011-02-03 1996-07-31 Microtubule effector required for tubulin heterodimer formation; binds alpha-tubulin, required for normal microtubule function, null mutant exhibits cold-sensitive microtubules and sensitivity to benomyl +S000035125 CDS YER007W 5 164527 166083 W 2011-02-03 1996-07-31 +S000028745 ORF Dubious YER006C-A chromosome 5 5 164661 164344 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF PAC2/YER007W +S000033415 CDS YER006C-A 5 164661 164344 C 2011-02-03 2003-07-29 +S000002957 ORF Verified YER007C-A TMA20 RBF20 chromosome 5 5 166885 166237 C 2011-02-03 1996-07-31 Protein of unknown function that associates with ribosomes; has a putative RNA binding domain; interacts with Tma22p; null mutant exhibits translation defects; has homology to human oncogene MCT-1; protein abundance increases in response to DNA replication stress +S000032950 CDS YER007C-A 5 166771 166237 C 2011-02-03 1996-07-31 +S000032949 CDS YER007C-A 5 166885 166875 C 2011-02-03 1996-07-31 +S000032951 intron YER007C-A 5 166874 166772 C 2011-02-03 1996-07-31 +S000006499 snRNA_gene snR14 SNR14 U4 chromosome 5 L000001965 5 167586 167427 C 2011-02-03 2000-05-19 U4 spliceosomal RNA (U4 snRNA); interacts with U6 +S000036593 noncoding_exon snR14 5 167586 167427 C 2011-02-03 2000-05-19 +S000000810 ORF Verified YER008C SEC3 GTP-Rho binding exocyst subunit SEC3|PSL1 chromosome 5 L000001829|L000001520 5 171818 167808 C 3 2011-02-03 1996-07-31 Subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to sites of exocytosis prior to SNARE-mediated fusion; PtdIns[4,5]P2-binding protein that localizes to exocytic sites in a Rho1p-dependent, actin-independent manner, targeting and anchoring the exocyst to the plasma membrane with Exo70p; direct GTP Rho1p effector; required for ER inheritance; relocalizes away from bud neck upon DNA replication stress +S000035220 CDS YER008C 5 171818 167808 C 2011-02-03 1996-07-31 +S000000811 ORF Verified YER009W NTF2 Ran GTPase-binding protein NTF2 chromosome 5 L000002863 5 172115 172492 W 2011-02-03 1996-07-31 Nuclear envelope protein; interacts with GDP-bound Gsp1p and with proteins of the nuclear pore to transport Gsp1p into the nucleus where it is an essential player in nucleocytoplasmic transport +S000036204 CDS YER009W 5 172115 172492 W 2011-02-03 1996-07-31 +S000000812 ORF Verified YER010C bifunctional 4-hydroxy-4-methyl-2-oxoglutarate aldolase/oxaloacetate decarboxylase chromosome 5 5 173338 172634 C 2011-02-03 1996-07-31 Bifunctional HMG aldolase/oxaloacetate decarboxylase; requires divalent metal ions for activity; competitively inhibited by oxalate; forms a ring-shaped homotrimer; similar to members of the prokaryotic RraA family of class II (divalent metal ion dependent) pyruvate aldolases from the meta cleavage pathways of protocatechuate and gallate +S000036925 CDS YER010C 5 173338 172634 C 2011-02-03 1996-07-31 +S000077383 ARS ARS511 ARSV-174 chromosome 5 5 173700 173864 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000178084 ARS_consensus_sequence ARS511 5 173808 173792 C 2014-11-18 2014-11-18 +S000000813 ORF Verified YER011W TIR1 GPI-anchored mannoprotein|SRP1 chromosome 5 L000002059 5 175248 176012 W 2011-02-03 1996-07-31 Cell wall mannoprotein; expression is downregulated at acidic pH and induced by cold shock and anaerobiosis; abundance is increased in cells cultured without shaking; member of the Srp1p/Tip1p family of serine-alanine-rich proteins +S000037042 CDS YER011W 5 175248 176012 W 2011-02-03 1996-07-31 +S000006912 long_terminal_repeat YERWdelta7 chromosome 5 5 176705 176856 W 2011-02-03 2000-05-19 Ty1 LTR +S000006550 tRNA_gene tE(UUC)E1 chromosome 5 L000003792 5 177099 177170 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin +S000034436 noncoding_exon tE(UUC)E1 5 177099 177170 W 2011-02-03 2000-05-19 +S000000814 ORF Verified YER012W PRE1 proteasome core particle subunit beta 4 chromosome 5 L000001483 5 177835 178431 W 2011-02-03 1996-07-31 Beta 4 subunit of the 20S proteasome; localizes to the nucleus throughout the cell cycle +S000037113 CDS YER012W 5 177835 178431 W 2011-02-03 1996-07-31 +S000000815 ORF Verified YER013W PRP22 DEAH-box ATP-dependent RNA helicase PRP22 chromosome 5 L000001508 5 178841 182278 W 2011-02-03 1996-07-31 DEAH-box RNA-dependent ATPase/ATP-dependent RNA helicase; associates with lariat intermediates before the second catalytic step of splicing; mediates ATP-dependent mRNA release from the spliceosome and unwinds RNA duplexes; required for proofreading the exon ligation reaction +S000037868 CDS YER013W 5 178841 182278 W 2011-02-03 1996-07-31 +S000000816 ORF Verified YER014W HEM14 oxygen-dependent protoporphyrinogen oxidase chromosome 5 L000003353 5 182600 184219 W 2011-02-03 1996-07-31 Protoporphyrinogen oxidase; a mitochondrial enzyme that catalyzes the seventh step in the heme biosynthetic pathway, converting protoporphyrinogen IX to protoporphyrin IX; inhibited by diphenyl ether-type herbicides +S000029903 CDS YER014W 5 182600 184219 W 2011-02-03 1996-07-31 +S000000817 ORF Verified YER015W FAA2 medium-chain fatty acid-CoA ligase FAA2|FAM1 chromosome 5 L000000595|L000000599 5 184541 186775 W 2011-02-03 1996-07-31 Medium chain fatty acyl-CoA synthetase; activates imported fatty acids; accepts a wide range of fatty acid chain lengths with a preference for medium chains, C9:0-C13:0; localized to the peroxisome; comparative analysis suggests that a mitochondrially targeted form may result from translation starting at a non-canonical codon upstream of the annotated start codon +S000030015 CDS YER015W 5 184541 186775 W 2011-02-03 1996-07-31 +S000007590 ORF Verified YER014C-A BUD25 chromosome 5 5 184700 183731 C 2011-02-03 2001-02-14 Protein involved in bud-site selection; diploid mutants display a random budding pattern instead of the wild-type bipolar pattern +S000037101 CDS YER014C-A 5 184169 183731 C 2011-02-03 2001-02-14 +S000037100 CDS YER014C-A 5 184700 184678 C 2011-02-03 2001-02-14 +S000037102 intron YER014C-A 5 184677 184170 C 2011-02-03 2001-02-14 +S000000818 ORF Verified YER016W BIM1 microtubule-binding protein BIM1|EB1|YEB1 chromosome 5 L000003272 5 188277 189311 W 2011-02-03 1996-07-31 Microtubule plus end-tracking protein; together with Kar9p makes up the cortical microtubule capture site and delays the exit from mitosis when the spindle is oriented abnormally; homolog of human end binding protein 1 (EB1) +S000031017 CDS YER016W 5 188277 189311 W 2011-02-03 1996-07-31 +S000000819 ORF Verified YER017C AFG3 AAA family ATPase AFG3|YTA10 chromosome 5 L000002562|L000000057 5 191788 189503 C 2011-02-03 1996-07-31 Mitochondrial inner membrane m-AAA protease component; mediates degradation of misfolded or unassembled proteins; also required for correct assembly of mitochondrial enzyme complexes; involved in cytoplasmic mRNA translation and aging; expression of human homolog AFG3L2 can complement yeast yta12 afg3 double mutant +S000031051 CDS YER017C 5 191788 189503 C 2011-02-03 1996-07-31 +S000000820 ORF Verified YER018C SPC25 kinetochore-associated Ndc80 complex subunit SPC25 chromosome 5 L000004695 5 192624 191959 C 2011-02-03 1996-07-31 Component of the kinetochore-associated Ndc80 complex; involved in chromosome segregation, spindle checkpoint activity, and kinetochore clustering; evolutionarily conserved; other members include Ndc80p, Nuf2p, Spc24p, and Spc25p +S000031164 CDS YER018C 5 192624 191959 C 2011-02-03 1996-07-31 +S000000821 ORF Verified YER019W ISC1 inositol phosphosphingolipid phospholipase chromosome 5 5 192797 194230 W 2011-02-03 1996-07-31 Inositol phosphosphingolipid phospholipase C; mitochondrial membrane localized; hydrolyzes complex sphingolipids to produce ceramide; activates genes required for non-fermentable carbon source metabolism during diauxic shift; activated by phosphatidylserine, cardiolipin, and phosphatidylglycerol; mediates Na+ and Li+ halotolerance; ortholog of mammalian neutral sphingomyelinase type 2 +S000032239 CDS YER019W 5 192797 194230 W 2011-02-03 1996-07-31 +S000002127 ORF Verified YER019C-A SBH2 Arf family guanine nucleotide exchange factor SBH2|SEB2 chromosome 5 L000002847|L000004138 5 194539 194273 C 2011-02-03 1996-07-31 Ssh1p-Sss1p-Sbh2p complex component; involved in protein translocation into the endoplasmic reticulum; SBH2 has a paralog, SBH1, that arose from the whole genome duplication +S000032656 CDS YER019C-A 5 194539 194273 C 2011-02-03 1996-07-31 +S000000822 ORF Verified YER020W GPA2 guanine nucleotide-binding protein subunit alpha|SSP101 chromosome 5 L000000721 5 195168 196517 W 10 2011-02-03 1996-07-31 Nucleotide binding alpha subunit of the heterotrimeric G protein; interacts with the receptor Gpr1p, has signaling role in response to nutrients; required for the recruitment of Ras-GTP at the plasma membrane and in the nucleus +S000032231 CDS YER020W 5 195168 196517 W 2011-02-03 1996-07-31 +S000000823 ORF Verified YER021W RPN3 proteasome regulatory particle lid subunit RPN3|SUN2 chromosome 5 L000003109 5 196948 198519 W 2011-02-03 1996-07-31 Essential non-ATPase regulatory subunit of the 26S proteasome lid; similar to the p58 subunit of the human 26S proteasome; temperature-sensitive alleles cause metaphase arrest, suggesting a role for the proteasome in cell cycle control +S000032304 CDS YER021W 5 196948 198519 W 2011-02-03 1996-07-31 +S000000824 ORF Verified YER022W SRB4 MED17 chromosome 5 L000002051 5 198812 200875 W 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; required for basal RNA polymerase II transcription; homozygosity of the human MED17 L371P mutation is associated with infantile cerebral and cerebellar atrophy with poor myelination +S000033166 CDS YER022W 5 198812 200875 W 2011-02-03 1996-07-31 +S000000825 ORF Verified YER023W PRO3 pyrroline-5-carboxylate reductase|ORE2 chromosome 5 L000001493 5 201076 201936 W 23 2011-02-03 1996-07-31 Delta 1-pyrroline-5-carboxylate reductase; catalyzes the last step in proline biosynthesis +S000033229 CDS YER023W 5 201076 201936 W 2011-02-03 1996-07-31 +S000028622 ORF Dubious YER023C-A chromosome 5 5 201734 201522 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene PRO3; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031472 CDS YER023C-A 5 201734 201522 C 2011-02-03 2003-07-29 +S000000826 ORF Verified YER024W YAT2 carnitine O-acetyltransferase YAT2 chromosome 5 5 202192 204963 W 2011-02-03 1996-07-31 Carnitine acetyltransferase; has similarity to Yat1p, which is a carnitine acetyltransferase associated with the mitochondrial outer membrane +S000033278 CDS YER024W 5 202192 204963 W 2011-02-03 1996-07-31 +S000000827 ORF Verified YER025W GCD11 translation initiation factor eIF2 subunit gamma|SUI4 chromosome 5 L000000677 5 205251 206834 W 14 2011-02-03 1996-07-31 Gamma subunit of the translation initiation factor eIF2; involved in the identification of the start codon; binds GTP when forming the ternary complex with GTP and tRNAi-Met; mutations in human ortholog cause X-linked intellectual disability (XLID) +S000034151 CDS YER025W 5 205251 206834 W 2011-02-03 1996-07-31 +S000006593 tRNA_gene tH(GUG)E1 chromosome 5 L000003793 5 207357 207428 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000035209 noncoding_exon tH(GUG)E1 5 207357 207428 W 2011-02-03 2000-05-19 +S000000828 ORF Verified YER026C CHO1 CDP-diacylglycerol-serine O-phosphatidyltransferase|PSS1 chromosome 5 L000000327|L000001521 5 208474 207644 C 22 2011-02-03 1996-07-31 Phosphatidylserine synthase; functions in phospholipid biosynthesis; catalyzes the reaction CDP-diaclyglycerol + L-serine = CMP + L-1-phosphatidylserine, transcriptionally repressed by myo-inositol and choline +S000034205 CDS YER026C 5 208474 207644 C 2011-02-03 1996-07-31 +S000000829 ORF Verified YER027C GAL83 SPM1 chromosome 5 L000000666 5 210232 208979 C 11 2011-02-03 1996-07-31 One of three possible beta-subunits of the Snf1 kinase complex; allows nuclear localization of the Snf1 kinase complex in the presence of a nonfermentable carbon source; necessary and sufficient for phosphorylation of the Mig2p transcription factor in response to alkaline stress; functionally redundant with SIP1 and SIP2 for the phosphorylation of Mig1p in response to glucose deprivation; contains a glycogen-binding domain +S000034334 CDS YER027C 5 210232 208979 C 2011-02-03 1996-07-31 +S000000830 ORF Verified YER028C MIG3 chromosome 5 5 211876 210692 C 2011-02-03 1996-07-31 Transcriptional regulator; partially nonfunctional in S288C strains but has a major role in catabolite repression and ethanol response in some other strains; involved in response to toxic agents; phosphorylation by Snf1p or the Mec1p pathway inactivates Mig3p, allowing induction of damage response genesenvironment +S000035341 CDS YER028C 5 211876 210692 C 2011-02-03 1996-07-31 +S000077384 ARS ARS512 ARSV-212 chromosome 5 5 212383 212631 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000178085 ARS_consensus_sequence ARS512 5 212454 212470 W 2014-11-18 2014-11-18 +S000000831 ORF Verified YER029C SMB1 mRNA splicing protein SMB1|Sm B|SmB chromosome 5 L000004361 5 213177 212587 C 2011-02-03 1996-07-31 Core Sm protein Sm B; part of heteroheptameric complex (with Smd1p, Smd2p, Smd3p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm B and Sm B' +S000035476 CDS YER029C 5 213177 212587 C 2011-02-03 1996-07-31 +S000000832 ORF Verified YER030W CHZ1 chromosome 5 5 213437 213898 W 2011-02-03 1996-07-31|2005-11-29 Histone chaperone for Htz1p/H2A-H2B dimer; required for the stabilization of the Chz1p-Htz1-H2B complex; has overlapping function with Nap1p; null mutant displays weak sensitivity to MMS and benomyl; contains a highly conserved CHZ motif; protein abundance increases in response to DNA replication stress +S000036549 CDS YER030W 5 213437 213898 W 2011-02-03 1996-07-31|2005-11-29 +S000000833 ORF Verified YER031C YPT31 Rab family GTPase YPT31|YPT8 chromosome 5 L000002545 5 214747 214076 C 2011-02-03 1996-07-31 Rab family GTPase; involved in the exocytic pathway; mediates intra-Golgi traffic or the budding of post-Golgi vesicles from the trans-Golgi; YPT31 has a paralog, YPT32, that arose from the whole genome duplication; localizes to the transitional and late Golgi +S000036578 CDS YER031C 5 214747 214076 C 2011-02-03 1996-07-31 +S000000834 ORF Verified YER032W FIR1 PIP1 chromosome 5 L000003487 5 215063 217693 W 2011-02-03 2003-09-22|1996-07-31 Protein involved in 3' mRNA processing; interacts with Ref2p; APCC(Cdh1) substrate; potential Cdc28p substrate +S000037329 CDS YER032W 5 215063 217693 W 2011-02-03 2003-09-22|1996-07-31 +S000000835 ORF Verified YER033C ZRG8 chromosome 5 S000007518 5 221287 218057 C 2011-02-03 1996-07-31 Protein of unknown function; authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; GFP-fusion protein is localized to the cytoplasm; transcription induced under conditions of zinc deficiency +S000037376 CDS YER033C 5 221287 218057 C 2011-02-03 1996-07-31 +S000000836 ORF Verified YER034W chromosome 5 5 221846 222403 W 2011-02-03 1996-07-31 Protein of unknown function; non-essential gene; expression induced upon calcium shortage; protein abundance increases in response to DNA replication stress +S000030147 CDS YER034W 5 221846 222403 W 2011-02-03 1996-07-31 +S000000837 ORF Verified YER035W EDC2 chromosome 5 5 222639 223076 W 2011-02-03 1996-07-31 RNA-binding protein that directly activates mRNA decapping; binds mRNA substrate and enhances activity of decapping proteins Dcp1p and Dcp2p; has a role in translation during heat stress; protein increases in abundance and relocalizes to nucleolus and to nuclear foci upon DNA replication stress; EDC2 has a paralog, EDC1, that arose from the whole genome duplication +S000030324 CDS YER035W 5 222639 223076 W 2011-02-03 1996-07-31 +S000000838 ORF Verified YER036C ARB1 ATP-binding cassette family ATPase ARB1 chromosome 5 5 225199 223367 C 2011-02-03 1996-07-31 ATPase of the ATP-binding cassette (ABC) family; involved in 40S and 60S ribosome biogenesis, has similarity to Gcn20p; shuttles from nucleus to cytoplasm, physically interacts with Tif6p, Lsg1p; human homolog ABCF2 can complement yeast ARB1 mutant +S000030397 CDS YER036C 5 225199 223367 C 2011-02-03 1996-07-31 +S000000839 ORF Verified YER037W PHM8 bifunctional nucleotidase/lysophosphatidic acid phosphatase chromosome 5 5 225889 226854 W 2011-02-03 1996-07-31 Lysophosphatidic acid (LPA) phosphatase, nucleotidase; principle and physiological nucleotidase working on GMP, UMP and CMP; involved in LPA hydrolysis in response to phosphate starvation and ribose salvage pathway; phosphatase activity is soluble and Mg2+ dependent; expression is induced by low phosphate levels and by inactivation of Pho85p; repressed by Gcn4p under normal conditions; PHM8 has a paralog, SDT1, that arose from the whole genome duplication +S000031397 CDS YER037W 5 225889 226854 W 2011-02-03 1996-07-31 +S000000840 ORF Verified YER038C KRE29 Smc5-Smc6 complex subunit KRE29|NSE6 chromosome 5 5 228252 226858 C 2011-02-03 1996-07-31 Subunit of the SMC5-SMC6 complex; this complex is involved in removal of X-shaped DNA structures that arise between sister chromatids during DNA replication and repair; heterozygous mutant shows haploinsufficiency in K1 killer toxin resistance +S000031448 CDS YER038C 5 228252 226858 C 2011-02-03 1996-07-31 +S000028746 ORF Uncharacterized YER038W-A FMP49 chromosome 5 5 228451 228831 W 2011-02-03 2003-07-29 Mitochondrial protein of unknown function; almost completely overlaps ORF HVG1/YER039C +S000033416 CDS YER038W-A 5 228451 228831 W 2011-02-03 2003-07-29 +S000000841 ORF Verified YER039C HVG1 putative GDP-mannose transporter|YEM9 chromosome 5 L000003907 5 229205 228456 C 2011-02-03 1996-07-31 Protein of unknown function; HVG1 has a paralog, VRG4, that arose from the whole genome duplication +S000031567 CDS YER039C 5 229205 228456 C 2011-02-03 1996-07-31 +S000007226 ORF Uncharacterized YER039C-A chromosome 5 5 229481 229263 C 2011-02-03 1999-07-17 Putative protein of unknown function; YER039C-A is not an essential gene +S000030146 CDS YER039C-A 5 229481 229263 C 2011-02-03 1999-07-17 +S000000842 ORF Verified YER040W GLN3 nitrogen-responsive transcriptional regulator GLN3 chromosome 5 L000000710 5 229795 231987 W 38 2011-02-03 1996-07-31 Transcriptional activator of genes regulated by nitrogen catabolite repression; localization and activity regulated by quality of nitrogen source and Ure2p +S000031823 CDS YER040W 5 229795 231987 W 2011-02-03 1996-07-31 +S000000843 ORF Verified YER041W YEN1 crossover junction endodeoxyribonuclease chromosome 5 5 232461 234740 W 2011-02-03 1996-07-31|2011-02-03 Holliday junction resolvase; promotes template switching during break-induced replication (BIR), causing non-reciprocal translocations (NRTs); localization is cell-cycle dependent and regulated by Cdc28p phosphorylation; homolog of human GEN1; similar to S. cerevisiae endonuclease Rth1p +S000031953 CDS YER041W 5 232461 234740 W 2011-02-03 1996-07-31|2011-02-03 +S000000844 ORF Verified YER042W MXR1 peptide-methionine-S-sulfoxide reductase|msrA chromosome 5 L000004794 5 234937 235491 W 2011-02-03 1996-07-31 Methionine-S-sulfoxide reductase; involved in the response to oxidative stress; protects iron-sulfur clusters from oxidative inactivation along with MXR2; involved in the regulation of lifespan; reduced activity of human homolog implicated in Alzheimer disease +S000032841 CDS YER042W 5 234937 235491 W 2011-02-03 1996-07-31 +S000000845 ORF Verified YER043C SAH1 adenosylhomocysteinase chromosome 5 L000002989 5 237119 235770 C 2011-02-03 1996-07-31 S-adenosyl-L-homocysteine hydrolase; catabolizes S-adenosyl-L-homocysteine which is formed after donation of the activated methyl group of S-adenosyl-L-methionine (AdoMet) to an acceptor; regulates cellular lipid homoeostasis by regulating phosphatidylcholine(PC)synthesis and triacylglycerol (TG) levels +S000032879 CDS YER043C 5 237119 235770 C 2011-02-03 1996-07-31 +S000000846 ORF Verified YER044C ERG28 BUD18 chromosome 5 5 238016 237570 C 2011-02-03 1996-07-31 Endoplasmic reticulum membrane protein; may facilitate protein-protein interactions between the Erg26p dehydrogenase and the Erg27p 3-ketoreductase and/or tether these enzymes to the ER, also interacts with Erg6p +S000032987 CDS YER044C 5 238016 237570 C 2011-02-03 1996-07-31 +S000001954 ORF Verified YER044C-A MEI4 chromosome 5 L000001060 5 239774 238460 C 41 2011-02-03 1996-07-31 Meiosis-specific protein involved in forming DSBs; involved in double-strand break (DSBs) formation during meiotic recombination; required for chromosome synapsis and production of viable spores +S000032766 CDS YER044C-A 5 239623 238460 C 2011-02-03 1996-07-31 +S000032765 CDS YER044C-A 5 239774 239712 C 2011-02-03 1996-07-31 +S000032767 intron YER044C-A 5 239711 239624 C 2011-02-03 1996-07-31 +S000000847 ORF Verified YER045C ACA1 chromosome 5 5 241501 240032 C 2011-02-03 1996-07-31 ATF/CREB family basic leucine zipper (bZIP) transcription factor; binds as a homodimer to the ATF/CREB consensus sequence TGACGTCA; important for carbon source utilization; target genes include GRE2 and COS8; ACA1 has a paralog, CST6, that arose from the whole genome duplication +S000033081 CDS YER045C 5 241501 240032 C 2011-02-03 1996-07-31 +S000000848 ORF Verified YER046W SPO73 chromosome 5 5 243180 243611 W 2011-02-03 1996-07-31 Meiosis-specific protein required for prospore membrane morphogenesis; required for the proper shape of the prospore membrane (PSM) and for spore wall formation; functions cooperatively with SPO71 in PSM elongation; physically interacts with Spo71p; genetically antagonistic to SPO1, similar to SPO71; localizes to the PSM; required for spore wall formation during sporulation; dispensable for both nuclear divisions during meiosis; dysferlin domain-only protein +S000033892 CDS YER046W 5 243180 243611 W 2011-02-03 1996-07-31 +S000028747 ORF Dubious YER046W-A chromosome 5 5 243700 244029 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SAP1/YER047C +S000033417 CDS YER046W-A 5 243700 244029 W 2011-02-03 2003-07-29 +S000000849 ORF Verified YER047C SAP1 putative AAA family ATPase SAP1 chromosome 5 L000004134 5 246503 243810 C 2011-02-03 1996-07-31 Putative ATPase of the AAA family; interacts with the Sin1p transcriptional repressor in the two-hybrid system +S000033982 CDS YER047C 5 246503 243810 C 2011-02-03 1996-07-31 +S000000850 ORF Verified YER048C CAJ1 chromosome 5 L000000210 5 248157 246982 C 2011-02-03 1996-07-31 Nuclear type II J heat shock protein of the E. coli dnaJ family; contains a leucine zipper-like motif, binds to non-native substrates for presentation to Ssa3p, may function during protein translocation, assembly and disassembly +S000034089 CDS YER048C 5 248157 246982 C 2011-02-03 1996-07-31 +S000006893 long_terminal_repeat YERCdelta8 chromosome 5 5 249331 249109 C 2011-02-03 2000-05-19|2007-04-03 Ty1 LTR +S000006913 long_terminal_repeat YERWdelta9 chromosome 5 5 249445 249752 W 2011-02-03 2000-05-19 Ty1 LTR +S000006904 long_terminal_repeat YERCsigma1 chromosome 5 5 250270 249930 C 2011-02-03 2000-05-19 Ty3 LTR +S000006696 tRNA_gene tQ(UUG)E1 chromosome 5 L000003794 5 250286 250357 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034942 noncoding_exon tQ(UUG)E1 5 250286 250357 W 2011-02-03 2000-05-19 +S000007237 ORF Verified YER048W-A ISD11 chromosome 5 5 250718 251002 W 2011-02-03 1999-07-17 Cysteine desulfurase (Nfs1p) activator; essential for the formation of the persulfide intermediate at the desulfurase active site during pyridoxal phosphate-dependent desulfuration of cysteine; required for mitochondrial iron-sulfur cluster biosynthesis; exclusive to eukaryotes, implicated as eukaryotic supplement to the bacterium-derived Fe-S cluster (ISC) assembly apparatus; involved in regulation of iron metabolism; member of the LYR protein family +S000036074 CDS YER048W-A 5 250718 251002 W 2011-02-03 1999-07-17 +S000000851 ORF Verified YER049W TPA1 oxidative DNA demethylase chromosome 5 5 251728 253662 W 2011-02-03 1996-07-31 Fe(II)/2-oxoglutarate-dependent dioxygenase family member; catalyzes the repair of methyl-base lesions in both ss and dsDNA by oxidative demethylation; Poly(rA)-binding protein involved in mRNA poly(A) tail length and mRNA stability; role in translation termination efficiency; interacts with Sup45p (eRF1), Sup35p (eRF3) and Pab1p; similar to human prolyl 4-hydroxylase OGFOD1; binds Fe(II) and 2-oxoglutarate +S000035095 CDS YER049W 5 251728 253662 W 2011-02-03 1996-07-31 +S000000852 ORF Verified YER050C RSM18 mitochondrial 37S ribosomal protein RSM18 chromosome 5 5 254387 253971 C 2011-02-03 1996-07-31|2005-11-28 Mitochondrial ribosomal protein of the small subunit; has similarity to E. coli S18 ribosomal protein +S000036333 CDS YER050C 5 254387 253971 C 2011-02-03 1996-07-31|2005-11-28 +S000000853 ORF Verified YER051W JHD1 [Histone H3]-lysine-36 demethylase|KDM2|JHDM1 chromosome 5 5 254656 256134 W 2011-02-03 1996-07-31 JmjC domain family histone demethylase specific for H3-K36; similar to proteins found in human, mouse, drosophila, X. laevis, C. elegans, and S. pombe +S000037038 CDS YER051W 5 254656 256134 W 2011-02-03 1996-07-31 +S000000854 ORF Verified YER052C HOM3 aspartate kinase|THR3|SIL4|BOR1 chromosome 5 L000000800 5 257958 256375 C 48 2011-02-03 1996-07-31 Aspartate kinase (L-aspartate 4-P-transferase); cytoplasmic enzyme that catalyzes the first step in the common pathway for methionine and threonine biosynthesis; expression regulated by Gcn4p and the general control of amino acid synthesis +S000037071 CDS YER052C 5 257958 256375 C 2011-02-03 1996-07-31 +S000077385 ARS ARS513 chromosome 5 5 257958 258737 2011-02-03 2004-10-19 Autonomously Replicating Sequence +S000000855 ORF Verified YER053C PIC2 Cu/Pi carrier chromosome 5 5 259639 258737 C 2011-02-03 1996-07-31 Mitochondrial copper and phosphate carrier; imports copper and inorganic phosphate into mitochondria; functionally redundant with Mir1p but less abundant than Mir1p under normal conditions; expression is induced at high temperature +S000037192 CDS YER053C 5 259639 258737 C 2011-02-03 1996-07-31 +S000007523 ORF Verified YER053C-A chromosome 5 5 261046 260933 C 2011-02-03 2000-07-14 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; protein abundance increases in response to DNA replication stress +S000037059 CDS YER053C-A 5 261046 260933 C 2011-02-03 2000-07-14 +S000000856 ORF Verified YER054C GIP2 chromosome 5 L000003093 5 263698 262052 C 2011-02-03 1996-07-31 Putative regulatory subunit of protein phosphatase Glc7p; involved in glycogen metabolism; contains a conserved motif (GVNK motif) that is also found in Gac1p, Pig1p, and Pig2p; GIP2 has a paralog, PIG2, that arose from the whole genome duplication +S000037276 CDS YER054C 5 263698 262052 C 2011-02-03 1996-07-31 +S000000857 ORF Verified YER055C HIS1 ATP phosphoribosyltransferase chromosome 5 L000000778 5 265785 264892 C 49 2011-02-03 1996-07-31 ATP phosphoribosyltransferase; a hexameric enzyme, catalyzes the first step in histidine biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts; transcription is regulated by general amino acid control +S000029938 CDS YER055C 5 265785 264892 C 2011-02-03 1996-07-31 +S000000858 ORF Verified YER056C FCY2 purine-cytosine permease|BRA7 chromosome 5 L000000607 5 268113 266512 C 49 2011-02-03 1996-07-31 Purine-cytosine permease; mediates purine (adenine, guanine, and hypoxanthine) and cytosine accumulation; relative distribution to the vacuole increases upon DNA replication stress +S000030053 CDS YER056C 5 268113 266512 C 2011-02-03 1996-07-31 +S000002135 ORF Verified YER056C-A RPL34A eL34|ribosomal 60S subunit protein L34A|L34e|L34A chromosome 5 L000004465 5 270185 269423 C 2011-02-03 2000-12-01|1996-07-31 Ribosomal 60S subunit protein L34A; homologous to mammalian ribosomal protein L34, no bacterial homolog; RPL34A has a paralog, RPL34B, that arose from the whole genome duplication +S000031749 CDS YER056C-A 5 269751 269423 C 2011-02-03 2000-12-01|1996-07-31 +S000031748 CDS YER056C-A 5 270185 270149 C 2011-02-03 2000-12-01|1996-07-31 +S000031750 intron YER056C-A 5 270148 269752 C 2011-02-03 2000-12-01|1996-07-31 +S000000859 ORF Verified YER057C HMF1 putative isoleucine biosynthesis protein HMF1|HIG1 chromosome 5 L000004440 5 271126 270737 C 2011-02-03 1996-07-31 Member of the p14.5 protein family; functionally complements Mmf1p function when targeted to mitochondria; heat shock inducible; high-dosage growth inhibitor; forms a homotrimer in vitro; HMF1 has a paralog, MMF1, that arose from the whole genome duplication +S000030235 CDS YER057C 5 271126 270737 C 2011-02-03 1996-07-31 +S000000860 ORF Verified YER058W PET117 chromosome 5 L000001396 5 271768 272091 W 2011-02-03 1996-07-31 Protein required for assembly of cytochrome c oxidase +S000031258 CDS YER058W 5 271768 272091 W 2011-02-03 1996-07-31 +S000000861 ORF Verified YER059W PCL6 chromosome 5 L000004038 5 272624 273886 W 2011-02-03 1996-07-31 Pho85p cyclin of the Pho80p subfamily; forms the major Glc8p kinase together with Pcl7p and Pho85p; involved in the control of glycogen storage by Pho85p; stabilized by Elongin C binding; PCL6 has a paralog, PCL7, that arose from the whole genome duplication +S000031353 CDS YER059W 5 272624 273886 W 2011-02-03 1996-07-31 +S000000862 ORF Verified YER060W FCY21 purine-cytosine permease chromosome 5 L000003373 5 274567 276153 W 2011-02-03 1996-07-31 Putative purine-cytosine permease; very similar to Fcy2p but cannot substitute for its function +S000032301 CDS YER060W 5 274567 276153 W 2011-02-03 1996-07-31 +S000178086 ARS ARS513.5 chromosome 5 5 276130 276528 2014-11-18 2014-11-18 Very weak autonomously replicating sequence +S000002958 ORF Verified YER060W-A FCY22 purine-cytosine permease chromosome 5 L000003374 5 276572 278164 W 2011-02-03 1999-07-17|1996-07-31 Putative purine-cytosine permease; very similar to Fcy2p but cannot substitute for its function +S000032822 CDS YER060W-A 5 276572 278164 W 2011-02-03 1999-07-17|1996-07-31 +S000178087 ARS ARS513.7 chromosome 5 5 278076 278357 2014-11-18 2014-11-18 Weak autonomously replicating sequence +S000178088 ARS_consensus_sequence ARS513.7 5 278177 278161 C 2014-11-18 2014-11-18 +S000000863 ORF Verified YER061C CEM1 fatty acid synthase CEM1 chromosome 5 L000000292 5 279626 278298 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial beta-keto-acyl synthase; possible role in fatty acid synthesis; required for mitochondrial respiration; human homolog OXSM can complement yeast cem1 null mutant +S000032319 CDS YER061C 5 279626 278298 C 2011-02-03 1996-07-31|2011-02-03 +S000000864 ORF Verified YER062C GPP2 HOR2|glycerol-1-phosphatase HOR2 chromosome 5 L000003979 5 280682 279930 C 2011-02-03 1996-07-31 DL-glycerol-3-phosphate phosphatase involved in glycerol biosynthesis; also known as glycerol-1-phosphatase; induced in response to hyperosmotic or oxidative stress, and during diauxic shift; GPP2 has a paralog, GPP1, that arose from the whole genome duplication +S000032451 CDS YER062C 5 280682 279930 C 2011-02-03 1996-07-31 +S000000865 ORF Verified YER063W THO1 chromosome 5 L000004712 5 281710 282366 W 2011-02-03 1996-07-31 Conserved nuclear RNA-binding protein; specifically binds to transcribed chromatin in a THO- and RNA-dependent manner, genetically interacts with shuttling hnRNP NAB2; overproduction suppresses transcriptional defect caused by hpr1 mutation +S000033296 CDS YER063W 5 281710 282366 W 2011-02-03 1996-07-31 +S000000866 ORF Verified YER064C VHR2 chromosome 5 5 284222 282705 C 2011-02-03 1996-07-31 Non-essential nuclear protein; null mutation has global effects on transcription; VHR2 has a paralog, VHR1, that arose from the whole genome duplication; relative distribution to the nucleus increases upon DNA replication stress +S000033339 CDS YER064C 5 284222 282705 C 2011-02-03 1996-07-31 +S000000867 ORF Verified YER065C ICL1 isocitrate lyase 1 chromosome 5 L000000848 5 286914 285241 C 2011-02-03 1996-07-31 Isocitrate lyase; catalyzes the formation of succinate and glyoxylate from isocitrate, a key reaction of the glyoxylate cycle; expression of ICL1 is induced by growth on ethanol and repressed by growth on glucose +S000033405 CDS YER065C 5 286914 285241 C 2011-02-03 1996-07-31 +S000077386 ARS ARS514 ARSV-288 chromosome 5 5 287552 287629 2014-11-18 2014-11-18|2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000178089 ARS_consensus_sequence ARS514 5 287565 287581 W 2014-11-18 2014-11-18 +S000006894 long_terminal_repeat YERCdelta10 chromosome 5 5 288062 287745 C 2011-02-03 2000-05-19 Ty1 LTR +S000006734 tRNA_gene tS(UGA)E SUP19 SUP20 chromosome 5 L000002192|L000003805 5 288524 288443 C 50 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000034046 noncoding_exon tS(UGA)E 5 288524 288443 C 2011-02-03 2000-05-19 +S000000868 ORF Uncharacterized YER066W RRT13 chromosome 5 5 290242 290799 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with decreased levels of rDNA transcription +S000034374 CDS YER066W 5 290242 290799 W 2011-02-03 1996-07-31 +S000000869 ORF Verified YER067W RGI1 chromosome 5 5 292066 292551 W 2011-02-03 1996-07-31 Protein of unknown function; involved in energy metabolism under respiratory conditions; protein abundance is increased upon intracellular iron depletion or in response to DNA replication stress; RGI1 has a paralog, RGI2, that arose from the whole genome duplication +S000034452 CDS YER067W 5 292066 292551 W 2011-02-03 1996-07-31 +S000002959 ORF Dubious YER066C-A chromosome 5 5 292203 291703 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps uncharacterized ORF YER067W +S000035687 CDS YER066C-A 5 292203 291703 C 2011-02-03 1996-07-31 +S000028748 ORF Dubious YER067C-A chromosome 5 5 292563 292240 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF RGI1/YER067W +S000033418 CDS YER067C-A 5 292563 292240 C 2011-02-03 2003-07-29 +S000000870 ORF Verified YER068W MOT2 CCR4-NOT core ubiquitin-protein ligase subunit MOT2|SIG1|NOT4 chromosome 5 L000001887|L000001137 5 293050 294813 W 2011-02-03 1996-07-31 Ubiquitin-protein ligase subunit of the CCR4-NOT complex; with Ubc4p, ubiquitinates nascent polypeptide-associated complex subunits and histone demethyase Jhd2p; CCR4-NOT has roles in transcription regulation, mRNA degradation, and post-transcriptional modifications; regulates levels of DNA Polymerase-{alpha} to promote efficient and accurate DNA replication +S000035479 CDS YER068W 5 293050 294813 W 2011-02-03 1996-07-31 +S000000871 ORF Verified YER069W ARG5,6 argC|argB|bifunctional acetylglutamate kinase/N-acetyl-gamma-glutamyl-phosphate reductase chromosome 5 L000000110 5 295410 298001 W 55 2011-02-03 1996-07-31 Acetylglutamate kinase and N-acetyl-gamma-glutamyl-phosphate reductase; N-acetyl-L-glutamate kinase (NAGK) catalyzes the 2nd and N-acetyl-gamma-glutamyl-phosphate reductase (NAGSA), the 3rd step in arginine biosynthesis; synthesized as a precursor which is processed in the mitochondrion to yield mature NAGK and NAGSA; enzymes form a metabolon complex with Arg2p; NAGK C-terminal domain stabilizes the enzymes, slows catalysis and is involved in feed-back inhibition by arginine +S000035588 CDS YER069W 5 295410 298001 W 2011-02-03 1996-07-31 +S000028749 ORF Dubious YER068C-A chromosome 5 5 295732 295301 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF ARG5,6/YER069W +S000033419 CDS YER068C-A 5 295732 295301 C 2011-02-03 2003-07-29 +S000000872 ORF Verified YER070W RNR1 ribonucleotide-diphosphate reductase subunit RNR1|SDS12|RIR1|CRT7 chromosome 5 L000001655 5 298950 301616 W 2011-02-03 1996-07-31 Major isoform of large subunit of ribonucleotide-diphosphate reductase; the RNR complex catalyzes rate-limiting step in dNTP synthesis, regulated by DNA replication and DNA damage checkpoint pathways via localization of small subunits; relative distribution to the nucleus increases upon DNA replication stress; RNR1 has a paralog, RNR3, that arose from the whole genome duplication +S000035499 CDS YER070W 5 298950 301616 W 2011-02-03 1996-07-31 +S000000873 ORF Uncharacterized YER071C TDA2 chromosome 5 5 302327 301947 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm in a punctate pattern; null mutant is sensitive to expression of the top1-T722A allele +S000035526 CDS YER071C 5 302327 301947 C 2011-02-03 1996-07-31 +S000000874 ORF Verified YER072W VTC1 PHM4|NRF1 chromosome 5 L000004689 5 302806 303195 W 2011-02-03 1996-07-31 Regulatory subunit of the vacuolar transporter chaperone (VTC) complex; VTC complex is involved in membrane trafficking, vacuolar polyphosphate accumulation, microautophagy and non-autophagic vacuolar fusion; also has mRNA binding activity; protein abundance increases in response to DNA replication stress +S000036469 CDS YER072W 5 302806 303195 W 2011-02-03 1996-07-31 +S000000875 ORF Verified YER073W ALD5 aldehyde dehydrogenase (NAD(P)(+)) ALD5 chromosome 5 L000004949 5 304030 305592 W 2011-02-03 1996-07-31|2011-02-03 Mitochondrial aldehyde dehydrogenase; involved in regulation or biosynthesis of electron transport chain components and acetate formation; activated by K+; utilizes NADP+ as the preferred coenzyme; constitutively expressed +S000036548 CDS YER073W 5 304030 305592 W 2011-02-03 1996-07-31|2011-02-03 +S000000876 ORF Verified YER074W RPS24A eS24|ribosomal 40S subunit protein S24A|S24e|S24A|RPS24EA chromosome 5 L000002710 5 306323 307196 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S24, no bacterial homolog; RPS24A has a paralog, RPS24B, that arose from the whole genome duplication +S000036669 CDS YER074W 5 306323 306325 W 2011-02-03 1996-07-31 +S000036670 CDS YER074W 5 306792 307196 W 2011-02-03 1996-07-31 +S000036671 intron YER074W 5 306326 306791 W 2011-02-03 1996-07-31 +S000007651 ORF Verified YER074W-A YOS1 chromosome 5 5 307653 308123 W 2011-02-03 2004-01-08|2001-06-29 Integral membrane protein required for ER to Golgi transport; localized to the Golgi, the ER, and COPII vesicles; interacts with Yip1p and Yif1p +S000037341 CDS YER074W-A 5 307653 307746 W 2011-02-03 2004-01-08|2001-06-29 +S000037342 CDS YER074W-A 5 307849 307956 W 2011-02-03 2004-01-08|2001-06-29 +S000037343 CDS YER074W-A 5 308068 308123 W 2011-02-03 2004-01-08|2001-06-29 +S000037344 intron YER074W-A 5 307747 307848 W 2011-02-03 2004-01-08|2001-06-29 +S000037345 intron YER074W-A 5 307957 308067 W 2011-02-03 2004-01-08|2001-06-29 +S000000877 ORF Verified YER075C PTP3 tyrosine protein phosphatase PTP3 chromosome 5 L000003996 5 311199 308413 C 2011-02-03 1996-07-31|2011-02-03 Phosphotyrosine-specific protein phosphatase; involved in the inactivation of mitogen-activated protein kinase (MAPK) during osmolarity sensing; dephosporylates Hog1p MAPK and regulates its localization; localized to the cytoplasm +S000036705 CDS YER075C 5 311199 308413 C 2011-02-03 1996-07-31|2011-02-03 +S000006522 tRNA_gene tA(UGC)E chromosome 5 L000003804 5 312095 312023 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine +S000034855 noncoding_exon tA(UGC)E 5 312095 312023 C 2011-02-03 2000-05-19 +S000006914 long_terminal_repeat YERWdelta11 chromosome 5 5 312274 312445 W 2011-02-03 2000-05-19 Ty1 LTR +S000028750 ORF Dubious YER076W-A chromosome 5 5 313390 313737 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YER076C +S000033444 CDS YER076W-A 5 313390 313737 W 2011-02-03 2003-07-29 +S000000878 ORF Uncharacterized YER076C chromosome 5 5 313498 312590 C 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; analysis of HA-tagged protein suggests a membrane localization +S000037415 CDS YER076C 5 313498 312590 C 2011-02-03 1996-07-31 +S000000879 ORF Uncharacterized YER077C MRX1 chromosome 5 5 316600 314534 C 2011-02-03 1996-07-31 Protein that associates with mitochondrial ribosome; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; null mutation results in a decrease in plasma membrane electron transport +S000037540 CDS YER077C 5 316600 314534 C 2011-02-03 1996-07-31 +S000077387 ARS ARS515 chromosome 5 5 316600 316807 2011-02-03 2004-10-19 Autonomously Replicating Sequence +S000000880 ORF Verified YER078C ICP55 aminopeptidase chromosome 5 5 318342 316807 C 2011-02-03 1996-07-31 Mitochondrial aminopeptidase; cleaves the N termini of at least 38 imported proteins after cleavage by the mitochondrial processing peptidase (MPP), thereby increasing their stability; member of the aminopeptidase P family +S000037656 CDS YER078C 5 318342 316807 C 2011-02-03 1996-07-31 +S000028546 ORF Uncharacterized YER078W-A chromosome 5 5 318646 318810 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031196 CDS YER078W-A 5 318646 318810 W 2011-02-03 2003-07-29 +S000000881 ORF Uncharacterized YER079W chromosome 5 5 318920 319552 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000030524 CDS YER079W 5 318920 319552 W 2011-02-03 1996-07-31 +S000000882 ORF Verified YER080W AIM9 FMP29 chromosome 5 5 319963 321846 W 2011-02-03 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays elevated frequency of mitochondrial genome loss +S000031341 CDS YER080W 5 319963 321846 W 2011-02-03 1996-07-31 +S000028751 ORF Dubious YER079C-A chromosome 5 5 320240 319902 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF AIM9/YER080W +S000033445 CDS YER079C-A 5 320240 319902 C 2011-02-03 2003-07-29 +S000029010 ncRNA_gene SRG1 SRG1 chromosome 5 5 322212 322762 W 2011-02-03 2003-10-29 Non-protein-coding RNA that regulates the transcription of SER3; expression of SRG1 RNA represses expression of its neighboring gene SER3 via a transcription-interference mechanism +S000035975 noncoding_exon SRG1 5 322212 322762 W 2011-02-03 2003-10-29 +S000000883 ORF Verified YER081W SER3 phosphoglycerate dehydrogenase SER3 chromosome 5 S000007457 5 322686 324095 W 2011-02-03 1996-07-31 3-phosphoglycerate dehydrogenase and alpha-ketoglutarate reductase; 3PG dehydrogenase that catalyzes the first step in serine and glycine biosynthesis; also functions as an alpha-ketoglutarate reductase, converting alpha-ketoglutarate to D-2-hydroxyglutarate (D-2HG); localizes to the cytoplasm; SER3 has a paralog, SER33, that arose from the whole genome duplication +S000031424 CDS YER081W 5 322686 324095 W 2011-02-03 1996-07-31 +S000000884 ORF Verified YER082C UTP7 KRE31 chromosome 5 5 325936 324272 C 2011-02-03 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA +S000031483 CDS YER082C 5 325936 324272 C 2011-02-03 1996-07-31 +S000000885 ORF Verified YER083C GET2 GET complex subunit GET2|RMD7|HUR2 chromosome 5 5 327031 326174 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the GET complex; involved in insertion of proteins into the ER membrane; required for the retrieval of HDEL proteins from the Golgi to the ER in an ERD2 dependent fashion and for meiotic nuclear division +S000031538 CDS YER083C 5 327031 326174 C 2011-02-03 2003-09-22|1996-07-31 +S000000886 ORF Uncharacterized YER084W chromosome 5 5 327065 327451 W 2011-02-03 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels +S000032559 CDS YER084W 5 327065 327451 W 2011-02-03 1996-07-31 +S000028752 ORF Dubious YER084W-A chromosome 5 5 327598 328110 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps uncharacterized ORF YER085C +S000033446 CDS YER084W-A 5 327598 328110 W 2011-02-03 2003-07-29 +S000000887 ORF Uncharacterized YER085C chromosome 5 5 328140 327619 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000032615 CDS YER085C 5 328140 327619 C 2011-02-03 1996-07-31 +S000000888 ORF Verified YER086W ILV1 threonine ammonia-lyase ILV1|ISO1 chromosome 5 L000000857 5 328477 330207 W 64 2011-02-03 1999-07-17|1996-07-31 Threonine deaminase, catalyzes first step in isoleucine biosynthesis; expression is under general amino acid control; ILV1 locus exhibits highly positioned nucleosomes whose organization is independent of known ILV1 regulation +S000032774 CDS YER086W 5 328477 330207 W 2011-02-03 1996-07-31 +S000000889 ORF Verified YER087W AIM10 putative proline--tRNA ligase AIM10 chromosome 5 5 330576 332306 W 2011-02-03 1996-07-31 Protein with similarity to tRNA synthetases; non-tagged protein is detected in purified mitochondria; null mutant is viable and displays elevated frequency of mitochondrial genome loss +S000033504 CDS YER087W 5 330576 332306 W 2011-02-03 1996-07-31 +S000028753 ORF Dubious YER087C-A chromosome 5 5 332368 331817 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF AIM10/YER087W +S000033447 CDS YER087C-A 5 332368 331817 C 2011-02-03 2003-07-29 +S000002128 ORF Verified YER087C-B SBH1 Arf family guanine nucleotide exchange factor SBH1|YER087C-A|SEB1 chromosome 5 L000002846|L000004137 5 332830 332582 C 2011-02-03 1996-07-31 Beta subunit of Sec61p ER translocation complex (Sec61p-Sss1p-Sbh1p); involved in protein translocation into the endoplasmic reticulum; interacts with the exocyst complex and also with Rtn1p; cotranslationally N-acetylated by NatA; SBH1 has a paralog, SBH2, that arose from the whole genome duplication +S000037045 CDS YER087C-B 5 332830 332582 C 2011-02-03 1996-07-31 +S000000890 ORF Verified YER088C DOT6 PBF2 chromosome 5 L000004393 5 335188 333176 C 2011-02-03 1996-07-31 Protein involved in rRNA and ribosome biogenesis; activated in stochastic pulses of nuclear localization; binds polymerase A and C motif; subunit of the RPD3L histone deacetylase complex; has chromatin specific SANT domain; involved in telomeric gene silencing and filamentation; relative distribution to the nucleus increases upon DNA replication stress +S000033553 CDS YER088C 5 335188 333176 C 2011-02-03 1996-07-31 +S000028623 ORF Dubious YER088W-B chromosome 5 5 335927 336073 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the ORF PTC2/YER089C; identified by gene-trapping, expression analysis, and homology searching +S000031475 CDS YER088W-B 5 335927 336073 W 2011-02-03 2003-07-29 +S000028754 ORF Dubious YER088C-A chromosome 5 5 336019 335696 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORFs PTC2/YER089C and YER088W-B +S000033448 CDS YER088C-A 5 336019 335696 C 2011-02-03 2003-07-29 +S000000891 ORF Verified YER089C PTC2 type 2C protein phosphatase PTC2 chromosome 5 L000003403 5 337340 335946 C 2011-02-03 1996-07-31 Type 2C protein phosphatase (PP2C); dephosphorylates Hog1p to limit maximal osmostress induced kinase activity; dephosphorylates Ire1p to downregulate the unfolded protein response; dephosphorylates Cdc28p; inactivates the DNA damage checkpoint; PTC2 has a paralog, PTC3, that arose from the whole genome duplication +S000033635 CDS YER089C 5 337340 335946 C 2011-02-03 1996-07-31 +S000000892 ORF Verified YER090W TRP2 anthranilate synthase TRP2 chromosome 5 L000002353 5 337949 339472 W 76 2011-02-03 1996-07-31 Anthranilate synthase; catalyzes the initial step of tryptophan biosynthesis, forms multifunctional hetero-oligomeric anthranilate synthase:indole-3-glycerol phosphate synthase enzyme complex with Trp3p +S000035640 CDS YER090W 5 337949 339472 W 2011-02-03 1996-07-31 +S000029725 ORF Dubious YER090C-A chromosome 5 5 338411 338322 C 2011-02-03 2004-08-27 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036876 CDS YER090C-A 5 338411 338322 C 2011-02-03 2004-08-27 +S000000893 ORF Verified YER091C MET6 5-methyltetrahydropteroyltriglutamate-homocysteine S-methyltransferase chromosome 5 L000001081 5 342167 339864 C 77 2011-02-03 1996-07-31 Cobalamin-independent methionine synthase; involved in methionine biosynthesis and regeneration; requires a minimum of two glutamates on the methyltetrahydrofolate substrate, similar to bacterial metE homologs +S000035673 CDS YER091C 5 342167 339864 C 2011-02-03 1996-07-31 +S000007238 ORF Dubious YER091C-A chromosome 5 5 342611 342390 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034939 CDS YER091C-A 5 342611 342390 C 2011-02-03 1999-07-17 +S000000894 ORF Verified YER092W IES5 chromosome 5 5 342855 343232 W 2011-02-03 1996-07-31 Non-essential INO80 chromatin remodeling complex subunit; deletion affects telomere maintenance via recombination +S000035789 CDS YER092W 5 342855 343232 W 2011-02-03 1996-07-31 +S000000895 ORF Verified YER093C TSC11 TORC2 complex subunit TSC11|AVO3 chromosome 5 5 347612 343320 C 2011-02-03 1996-07-31 Subunit of TORC2 (Tor2p-Lst8p-Avo1-Avo2-Tsc11p-Bit61p); TORC2 is a membrane-associated complex that regulates actin cytoskeletal dynamics during polarized growth and cell wall integrity; involved in sphingolipid metabolism; contains a RasGEFN domain +S000035826 CDS YER093C 5 347612 343320 C 2011-02-03 1996-07-31 +S000002960 ORF Verified YER093C-A AIM11 GEP8 chromosome 5 5 348400 347912 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant is viable but shows increased loss of mitochondrial genome and synthetic interaction with prohibitin (phb1); contains an intron; SWAT-GFP and mCherry fusion proteins localize to the mitochondria; YER093C-A has a paralog, YBL059W, that arose from the whole genome duplication +S000030866 CDS YER093C-A 5 348201 347912 C 2011-02-03 1996-07-31 +S000030865 CDS YER093C-A 5 348400 348277 C 2011-02-03 1996-07-31 +S000030867 intron YER093C-A 5 348276 348202 C 2011-02-03 1996-07-31 +S000000896 ORF Verified YER094C PUP3 proteasome core particle subunit beta 3|SCS32 chromosome 5 L000001532 5 349346 348729 C 2011-02-03 1996-07-31 Beta 3 subunit of the 20S proteasome; involved in ubiquitin-dependent catabolism; human homolog is subunit C10 +S000035946 CDS YER094C 5 349346 348729 C 2011-02-03 1996-07-31 +S000000897 ORF Verified YER095W RAD51 recombinase RAD51|MUT5 chromosome 5 L000001571 5 349980 351182 W 78 2011-02-03 1996-07-31 Strand exchange protein; forms a helical filament with DNA that searches for homology; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; homolog of Dmc1p and bacterial RecA protein +S000036878 CDS YER095W 5 349980 351182 W 2011-02-03 1996-07-31 +S000000898 ORF Verified YER096W SHC1 chromosome 5 L000001879 5 351698 353236 W 79.23 2011-02-03 1996-07-31 Sporulation-specific activator of Chs3p (chitin synthase III); required for the synthesis of the chitosan layer of ascospores; transcriptionally induced at alkaline pH; SHC1 has a paralog, SKT5, that arose from the whole genome duplication +S000036926 CDS YER096W 5 351698 353236 W 2011-02-03 1996-07-31 +S000006915 long_terminal_repeat YERWdelta12 chromosome 5 5 353399 353735 W 2011-02-03 2000-05-19 Ty1 LTR +S000077388 ARS ARS516 ARSV-354 chromosome 5 5 353578 353636 2014-11-18 2014-11-18|2004-10-19|2006-10-02 Autonomously Replicating Sequence +S000178090 ARS_consensus_sequence ARS516 5 353582 353598 W 2014-11-18 2014-11-18 +S000006916 long_terminal_repeat YERWdelta13 chromosome 5 5 354136 354850 W 2011-02-03 2000-05-19 Ty1 LTR +S000006908 long_terminal_repeat YERCtau2 chromosome 5 5 354730 354360 C 2011-02-03 2000-05-19 Ty4 LTR +S000006905 long_terminal_repeat YERCsigma2 chromosome 5 5 354917 354851 C 2011-02-03 2000-05-19 Ty3 LTR +S000006551 tRNA_gene tE(UUC)E2 chromosome 5 L000003795 5 354934 355005 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034437 noncoding_exon tE(UUC)E2 5 354934 355005 W 2011-02-03 2000-05-19 +S000000899 ORF Dubious YER097W chromosome 5 5 355140 355469 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036977 CDS YER097W 5 355140 355469 W 2011-02-03 1996-07-31 +S000000900 ORF Verified YER098W UBP9 putative ubiquitin-specific protease UBP9 chromosome 5 L000003170 5 355466 357730 W 2011-02-03 1996-07-31 Ubiquitin-specific protease that cleaves ubiquitin-protein fusions; UBP9 has a paralog, UBP13, that arose from the whole genome duplication +S000037747 CDS YER098W 5 355466 357730 W 2011-02-03 1996-07-31 +S000000901 ORF Verified YER099C PRS2 ribose phosphate diphosphokinase subunit PRS2 chromosome 5 L000001512 5 359061 358105 C 2011-02-03 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase, synthesizes PRPP; which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes; PRS2 has a paralog, PRS4, that arose from the whole genome duplication +S000037788 CDS YER099C 5 359061 358105 C 2011-02-03 1996-07-31 +S000000902 ORF Verified YER100W UBC6 E2 ubiquitin-conjugating protein UBC6|DOA2 chromosome 5 L000002409 5 359562 360314 W 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme involved in ERAD; located at the cytosolic side of the ER membrane; tail region contains a transmembrane segment at the C-terminus; substrate of the ubiquitin-proteasome pathway; ER-associated protein degradation is also known as ERAD +S000035454 CDS YER100W 5 359562 360314 W 2011-02-03 1996-07-31 +S000000903 ORF Verified YER101C AST2 chromosome 5 L000000134 5 361794 360502 C 2011-02-03 1996-07-31 Lipid raft associated protein; overexpression restores Pma1p localization to lipid rafts which is required for targeting of Pma1p to the plasma membrane; sometimes classified in the medium-chain dehydrogenase/reductases (MDRs) superfamily; AST2 has a paralog, AST1, that arose from the whole genome duplication +S000036309 CDS YER101C 5 361794 360502 C 2011-02-03 1996-07-31 +S000000904 ORF Verified YER102W RPS8B eS8|ribosomal 40S subunit protein S8B|S8e|rp19|YS9|S8B|S14B chromosome 5 L000001754 5 363100 363702 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S8, no bacterial homolog; RPS8B has a paralog, RPS8A, that arose from the whole genome duplication +S000036450 CDS YER102W 5 363100 363702 W 2011-02-03 1996-07-31 +S000122096 five_prime_UTR_intron YER102W 5 362733 363092 W 2011-02-03 2007-04-04 +S000000905 ORF Verified YER103W SSA4 Hsp70 family chaperone SSA4|YG107 chromosome 5 L000002072 5 364589 366517 W 2011-02-03 1996-07-31 Heat shock protein that is highly induced upon stress; plays a role in SRP-dependent cotranslational protein-membrane targeting and translocation; member of the HSP70 family; cytoplasmic protein that concentrates in nuclei upon starvation; SSA4 has a paralog, SSA3, that arose from the whole genome duplication +S000036552 CDS YER103W 5 364589 366517 W 2011-02-03 1996-07-31 +S000000906 ORF Verified YER104W RTT105 chromosome 5 S000007476 5 366802 367428 W 2011-02-03 1996-07-31 Protein with a role in regulation of Ty1 transposition +S000037250 CDS YER104W 5 366802 367428 W 2011-02-03 1996-07-31 +S000000907 ORF Verified YER105C NUP157 chromosome 5 L000003139 5 372013 367838 C 2011-02-03 1996-07-31 Subunit of the inner ring of the nuclear pore complex (NPC); contributes to NPC assembly and tethering of DNA to the nuclear periphery; both Nup170p and NUP157p are similar to human Nup155p; NUP157 has a paralog, NUP170, that arose from the whole genome duplication +S000037287 CDS YER105C 5 372013 367838 C 2011-02-03 1996-07-31 +S000000908 ORF Verified YER106W MAM1 chromosome 5 5 372326 373234 W 2011-02-03 1996-07-31 Monopolin; meiosis-specific kinetochore-associated protein involved in monopolar attachment of sister kinetochores to the meiotic spindle; subunit of monopolin, a complex that prevents biorientation of sister kinetochores to ensure homolog biorientation during meiosis I; regulates the conformation, enzyme kinetics and substrate specificity of the Dsn1p kinase, Hrr1p; expressed only during the first meiotic division +S000037445 CDS YER106W 5 372326 373234 W 2011-02-03 1996-07-31 +S000028755 ORF Dubious YER107W-A chromosome 5 5 374394 374714 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF GLE2/YER107C +S000033449 CDS YER107W-A 5 374394 374714 W 2011-02-03 2003-07-29 +S000000909 ORF Verified YER107C GLE2 RNA export factor GLE2|RAE1 chromosome 5 L000004084 5 374545 373448 C 2011-02-03 1996-07-31 RNA export factor associated with the nuclear pore complex (NPC); associates with NUP116p; required for polyadenylated RNA export but not for protein import; homologous to S. pombe Rae1p and human RAE1 +S000037509 CDS YER107C 5 374545 373448 C 2011-02-03 1996-07-31 +S000000911 blocked_reading_frame YER109C FLO8 transcription factor FLO8|STA10|YER108C|PHD5 chromosome 5 L000003202|S000000910|S000029523|L000004208 5 377614 375215 C 2011-02-03 1999-07-17|1996-07-31 Transcription factor; required for flocculation, diploid filamentous growth, and haploid invasive growth; forms a heterodimer with Mss1p that interacts with the Swi/Snf complex during transcriptional activation of FLO1, FLO11, and STA1; S. cerevisiae genome reference strain S288C contains an internal in-frame stop at codon 142, which in other strains encodes tryptophan +S000030400 CDS YER109C 5 377614 375215 C 2011-02-03 1999-07-17|1996-07-31 +S000000912 ORF Verified YER110C KAP123 YRB4 chromosome 5 L000003445|L000003466 5 382103 378762 C 2011-02-03 1996-07-31 Karyopherin beta; mediates nuclear import of ribosomal proteins prior to assembly into ribosomes and import of histones H3 and H4; localizes to the nuclear pore, nucleus, and cytoplasm; exhibits genetic interactions with RAI1 +S000030722 CDS YER110C 5 382103 378762 C 2011-02-03 1996-07-31 +S000000913 ORF Verified YER111C SWI4 SBF complex DNA-binding subunit SWI4|ART1 chromosome 5 L000000124|L000002252 5 385876 382595 C 2011-02-03 1996-07-31 DNA binding component of the SBF complex (Swi4p-Swi6p); a transcriptional activator that in concert with MBF (Mbp1-Swi6p) regulates late G1-specific transcription of targets including cyclins and genes required for DNA synthesis and repair; Slt2p-independent regulator of cold growth; acetylation at two sites, K1016 and K1066, regulates interaction with Swi6p +S000031559 CDS YER111C 5 385876 382595 C 2011-02-03 1996-07-31 +S000000914 ORF Verified YER112W LSM4 U6 snRNA complex subunit LSM4|USS1|SDB23 chromosome 5 L000002447 5 387232 387795 W 2011-02-03 1996-07-31 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA; forms cytoplasmic foci upon DNA replication stress +S000031681 CDS YER112W 5 387232 387795 W 2011-02-03 1996-07-31 +S000000915 ORF Verified YER113C TMN3 chromosome 5 5 390052 387932 C 2011-02-03 1996-07-31 Protein with a role in cellular adhesion and filamentous growth; similar to Emp70p and Tmn2p; member of Transmembrane Nine family with 9 transmembrane segments; localizes to Golgi; induced by 8-methoxypsoralen plus UVA irradiation +S000031762 CDS YER113C 5 390052 387932 C 2011-02-03 1996-07-31 +S000000916 ORF Verified YER114C BOI2 BEB1 chromosome 5 L000000166|L000002916 5 393712 390590 C 2011-02-03 1996-07-31 Protein implicated in polar growth, functionally redundant with Boi1p; interacts with bud-emergence protein Bem1p; contains an SH3 (src homology 3) domain and a PH (pleckstrin homology) domain; BOI2 has a paralog, BOI1, that arose from the whole genome duplication +S000031880 CDS YER114C 5 393712 390590 C 2011-02-03 1996-07-31 +S000000917 ORF Verified YER115C SPR6 chromosome 5 L000002023 5 394867 394292 C 93 2011-02-03 1996-07-31 Protein of unknown function; expressed during sporulation; not required for sporulation, but gene exhibits genetic interactions with other genes required for sporulation +S000032791 CDS YER115C 5 394867 394292 C 2011-02-03 1996-07-31 +S000000918 ORF Verified YER116C SLX8 SUMO-targeted ubiquitin ligase complex subunit SLX8 chromosome 5 5 396172 395348 C 2011-02-03 1996-07-31 Subunit of Slx5-Slx8 SUMO-targeted ubiquitin ligase (STUbL) complex; role in proteolysis of spindle positioning protein Kar9, DNA repair proteins Rad52p and Rad57p; stimulated by SUMO-modified substrates; contains a C-terminal RING domain; forms nuclear foci upon DNA replication stress; required for maintenance of genome integrity like human ortholog RNF +S000032881 CDS YER116C 5 396172 395348 C 2011-02-03 1996-07-31 +S000000919 ORF Verified YER117W RPL23B uL14|ribosomal 60S subunit protein L23B|L14|YL32|L23B|L17aB chromosome 5 L000001717 5 396769 397653 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L23B; homologous to mammalian ribosomal protein L23 and bacterial L14; RPL23B has a paralog, RPL23A, that arose from the whole genome duplication +S000033044 CDS YER117W 5 396769 396810 W 2011-02-03 1996-07-31 +S000033045 CDS YER117W 5 397282 397653 W 2011-02-03 1996-07-31 +S000033046 intron YER117W 5 396811 397281 W 2011-02-03 1996-07-31 +S000000920 ORF Verified YER118C SHO1 osmosensor SHO1|SSU81 chromosome 5 L000002632|L000002823 5 399055 397952 C 2011-02-03 1996-07-31 Transmembrane osmosensor for filamentous growth and HOG pathways; involved in activation of the Cdc42p- and MAP kinase-dependent filamentous growth pathway and the high-osmolarity glycerol (HOG) response pathway; phosphorylated by Hog1p; interacts with Pbs2p, Msb2p, Hkr1p, and Ste11p +S000033082 CDS YER118C 5 399055 397952 C 2011-02-03 1996-07-31 +S000000921 ORF Verified YER119C AVT6 aspartate/glutamate transporter chromosome 5 5 400842 399496 C 2011-02-03 1996-07-31 Vacuolar aspartate and glutamate exporter; member of a family of seven genes (AVT1-7) related to vesicular GABA-glycine transporters; involved in compartmentalizing acidic amino acids in response to nitrogen starvation; AVT6 has a paralog, AVT5, that arose from the whole genome duplication +S000033839 CDS YER119C 5 400842 399496 C 2011-02-03 1996-07-31 +S000000922 ORF Verified YER120W SCS2 phosphatidylinositol-binding protein SCS2 chromosome 5 L000002629 5 401135 401869 W 2011-02-03 1996-07-31 Integral ER membrane protein, regulates phospholipid metabolism; one of 6 proteins (Ist2p, Scs2p, Scs22p, Tcb1p, Tcb2p, Tcb3p) that connect ER to plasma membrane (PM) and regulate PI4P levels by controlling access of Sac1p phosphatase to substrate PI4P in the PM; interacts with FFAT motifs in Opi1p, Swh1p, Osh2p, and Osh3p; involved in telomeric silencing; VAP homolog; SCS2 has a paralog, SCS22, that arose from the whole genome duplication +S000036090 CDS YER120W 5 401135 401869 W 2011-02-03 1996-07-31 +S000002961 ORF Dubious YER119C-A chromosome 5 5 401238 400867 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion mutation blocks replication of Brome mosaic virus in S. cerevisiae, but this is likely due to effects on the overlapping gene SCS2 +S000033092 CDS YER119C-A 5 401238 400867 C 2011-02-03 1996-07-31 +S000000923 ORF Uncharacterized YER121W chromosome 5 5 402375 402719 W 2011-02-03 1996-07-31 Putative protein of unknown function; may be involved in phosphatase regulation and/or generation of precursor metabolites and energy +S000036211 CDS YER121W 5 402375 402719 W 2011-02-03 1996-07-31 +S000000924 ORF Verified YER122C GLO3 ADP-ribosylation factor GTPase-activating protein chromosome 5 L000000713 5 404352 402871 C 2011-02-03 1996-07-31 ADP-ribosylation factor GTPase activating protein (ARF GAP); involved in ER-Golgi transport; shares functional similarity with Gcs1p +S000036231 CDS YER122C 5 404352 402871 C 2011-02-03 1996-07-31 +S000000925 ORF Verified YER123W YCK3 casein kinase YCK3|CKI3 chromosome 5 L000002915 5 404813 406387 W 2011-02-03 2000-03-16|1996-07-31 Palmitoylated vacuolar membrane-localized casein kinase I isoform; negatively regulates vacuole fusion during hypertonic stress via phosphorylation of Vps41p; shares essential functions with Hrr25p; regulates vesicle fusion in AP-3 pathway +S000036985 CDS YER123W 5 404813 406387 W 2011-02-03 2000-03-16|1996-07-31 +S000077389 ARS ARS517 ARSV-407 chromosome 5 5 406752 406953 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000000926 ORF Verified YER124C DSE1 chromosome 5 5 409063 407342 C 2011-02-03 1996-07-31 Daughter cell-specific protein; may regulate cross-talk between the mating and filamentation pathways; deletion affects cell separation after division and sensitivity to alpha-factor and drugs affecting the cell wall; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000037009 CDS YER124C 5 409063 407342 C 2011-02-03 1996-07-31 +S000000927 ORF Verified YER125W RSP5 NEDD4 family E3 ubiquitin-protein ligase|SMM1|UBY1|NPI1|MUT2|MDP1 chromosome 5 L000001054|L000001779|L000001220 5 410189 412618 W 2011-02-03 1996-07-31 NEDD4 family E3 ubiquitin ligase; regulates processes including: MVB sorting, the heat shock response, transcription, endocytosis and ribosome stability; ubiquitinates Sec23p, Sna3p, Ste4p, Nfi1p, Rpo21p and Sem1p; autoubiquitinates; deubiquitinated by Ubp2p; regulated by SUMO ligase Siz1p, in turn regulates Siz1p SUMO ligase activity; required for efficient Golgi-to-ER trafficking in COPI mutants; mutant tolerates aneuploidy; human homolog implicated in Liddle syndrome +S000037135 CDS YER125W 5 410189 412618 W 2011-02-03 1996-07-31 +S000000928 ORF Verified YER126C NSA2 rRNA-processing protein NSA2 chromosome 5 5 414179 413394 C 2011-02-03 1996-07-31 Protein constituent of 66S pre-ribosomal particles; contributes to processing of the 27S pre-rRNA; recruited by ribosomal proteins L17, L35, and L37 to assembling ribosomes after 27SB pre-rRNA is generated, immediately preceding removal of ITS2 +S000037193 CDS YER126C 5 414179 413394 C 2011-02-03 1996-07-31 +S000000929 ORF Verified YER127W LCP5 chromosome 5 L000004265 5 414481 415554 W 2011-02-03 1996-07-31 Essential protein involved in maturation of 18S rRNA; depletion leads to inhibited pre-rRNA processing and reduced polysome levels; localizes primarily to the nucleolus +S000029893 CDS YER127W 5 414481 415554 W 2011-02-03 1996-07-31 +S000000930 ORF Verified YER128W VFA1 chromosome 5 5 415859 416470 W 2011-02-03 1996-07-31 Protein that interacts with Vps4p and has a role in vacuolar sorting; stimulates the ATPase activity of Vps4; localizes to endosomes in a Vps4-dependent manner; overexpression causes canavanine sensitivity and confers a partial class D vacuole morphology +S000030007 CDS YER128W 5 415859 416470 W 2011-02-03 1996-07-31 +S000000931 ORF Verified YER129W SAK1 serine/threonine protein kinase SAK1|PAK1 chromosome 5 L000001333 5 417281 420709 W 2011-02-03 1996-07-31 Upstream serine/threonine kinase for the SNF1 complex; plays a role in pseudohyphal groth; partially redundant with Elm1p and Tos3p; members of this family have functional orthology with LKB1, a mammalian kinase associated with Peutz-Jeghers cancer-susceptibility syndrome; SAK1 has a paralog, TOS3, that arose from the whole genome duplication +S000030128 CDS YER129W 5 417281 420709 W 2011-02-03 1996-07-31 +S000000932 ORF Verified YER130C COM2 chromosome 5 5 422446 421115 C 2011-02-03 1996-07-31 Transcription factor that binds IME1 Upstream Activation Signal (UAS)ru; COM2 transcription is regulated by Haa1p, Sok2p and Zap1p transcriptional activators; may bind the IME1 promoter under all growth conditions to negatively regulate its transcription in the absence of a positive regulator that binds more effectively; repressor activity may depend on phosphorylation by PKA; C. albicans homolog (MNL1) plays a role in adaptation to stress +S000031102 CDS YER130C 5 422446 421115 C 2011-02-03 1996-07-31 +S000000933 ORF Verified YER131W RPS26B eS26|ribosomal 40S subunit protein S26B|S26e|S26B chromosome 5 L000001763 5 423952 424311 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S26, no bacterial homolog; RPS26B has a paralog, RPS26A, that arose from the whole genome duplication; human homolog can partially complement an RPS26A, RPS26B double null mutant; mutations in the human gene are associated with Diamond-Blackfan anemia +S000031231 CDS YER131W 5 423952 424311 W 2011-02-03 1996-07-31 +S000122097 five_prime_UTR_intron YER131W 5 423591 423951 W 2011-02-03 2007-04-04 +S000006493 snoRNA_gene snR4 SNR4 chromosome 5 L000001959 5 424698 424883 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA) but not shown to be active; no target site is predicted within the ribosomal RNAs +S000034305 noncoding_exon snR4 5 424698 424883 W 2011-02-03 2000-05-19 +S000000934 ORF Verified YER132C PMD1 chromosome 5 L000003968 5 430449 425188 C 2011-02-03 1996-07-31 Protein with an N-terminal kelch-like domain; putative negative regulator of early meiotic gene expression; required, with Mds3p, for growth under alkaline conditions; PMD1 has a paralog, MDS3, that arose from the whole genome duplication +S000032160 CDS YER132C 5 430449 425188 C 2011-02-03 1996-07-31 +S000006443 snoRNA_gene snR52 SNR52 chromosome 5 L000004521 5 431220 431129 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position U2921 and small subunit (SSU) rRNA at position A420 +S000030733 noncoding_exon snR52 5 431220 431129 C 2011-02-03 2000-05-19 +S000006895 long_terminal_repeat YERCdelta14 chromosome 5 5 431822 431490 C 2011-02-03 2000-05-19 Ty1 LTR +S000000935 ORF Verified YER133W GLC7 type 1 serine/threonine-protein phosphatase catalytic subunit GLC7|DIS2S1|PP1|DIS2|CID1 chromosome 5 L000000706 5 432495 433958 W 2011-02-03 1996-07-31 Type 1 S/T protein phosphatase (PP1) catalytic subunit; involved in glycogen metabolism, sporulation and mitotic progression; interacts with multiple regulatory subunits; regulates actomyosin ring formation; subunit of CPF; recruited to mating projections by Afr1p interaction; regulates nucleocytoplasmic shuttling of Hxk2p; import into the nucleus is inhibited during spindle assembly checkpoint arrest; involved in dephosphorylating Rps6a/b and Bnr1p +S000032307 CDS YER133W 5 432495 432671 W 2011-02-03 1996-07-31 +S000032308 CDS YER133W 5 433197 433958 W 2011-02-03 1996-07-31 +S000032309 intron YER133W 5 432672 433196 W 2011-02-03 1996-07-31 +S000006594 tRNA_gene tH(GUG)E2 chromosome 5 L000003803 5 434612 434541 C 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000035212 noncoding_exon tH(GUG)E2 5 434612 434541 C 2011-02-03 2000-05-19 +S000006906 long_terminal_repeat YERCsigma3 chromosome 5 5 434971 434631 C 2011-02-03 2000-05-19 Ty3 LTR +S000006896 long_terminal_repeat YERCdelta15 chromosome 5 5 435447 435128 C 2011-02-03 2000-05-19 Ty1 LTR +S000006619 tRNA_gene tK(CUU)E2 chromosome 5 L000003802 5 435824 435752 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000037795 noncoding_exon tK(CUU)E2 5 435824 435752 C 2011-02-03 2000-05-19 +S000006897 long_terminal_repeat YERCdelta16 chromosome 5 5 436277 435946 C 2011-02-03 2000-05-19 Ty1 LTR +S000006909 long_terminal_repeat YERCtau3 chromosome 5 5 436605 436279 C 2011-02-03 2000-05-19 Ty4 LTR +S000028756 ORF Dubious YER133W-A chromosome 5 5 437191 437532 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF YER134C +S000033450 CDS YER133W-A 5 437191 437532 W 2011-02-03 2003-07-29 +S000000936 ORF Verified YER134C Mg-dependent acid phosphatase|MDP-1 chromosome 5 5 437803 437267 C 2011-02-03 1996-07-31 Magnesium-dependent acid phosphatase; member of the haloacid dehalogenase superfamily; non-essential gene +S000032339 CDS YER134C 5 437803 437267 C 2011-02-03 1996-07-31 +S000000937 ORF Uncharacterized YER135C chromosome 5 5 438344 437952 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YER135C is not an essential gene +S000032452 CDS YER135C 5 438344 437952 C 2011-02-03 1996-07-31 +S000006753 tRNA_gene tV(AAC)E1 chromosome 5 L000003796 5 438700 438773 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000035942 noncoding_exon tV(AAC)E1 5 438700 438773 W 2011-02-03 2000-05-19 +S000077390 ARS ARS518 ARSV-439 chromosome 5 5 438934 439182 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence +S000178091 ARS_consensus_sequence ARS518 5 439102 439086 C 2014-11-18 2014-11-18 +S000000938 ORF Verified YER136W GDI1 SEC19 chromosome 5 L000000699 5 439616 440971 W 2011-02-03 1996-07-31 GDP dissociation inhibitor; regulates vesicle traffic in secretory pathways by regulating the dissociation of GDP from the Sec4/Ypt/rab family of GTP binding proteins +S000033298 CDS YER136W 5 439616 440971 W 2011-02-03 1996-07-31 +S000028757 ORF Dubious YER137W-A chromosome 5 5 441575 441880 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YER137C +S000033451 CDS YER137W-A 5 441575 441880 W 2011-02-03 2003-07-29 +S000000939 ORF Uncharacterized YER137C chromosome 5 5 441819 441373 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000033341 CDS YER137C 5 441819 441373 C 2011-02-03 1996-07-31 +S000006491 ncRNA_gene SCR1 SCR1 chromosome 5 L000001818 5 441987 442508 W 2011-02-03 2000-05-19|2004-10-08 RNA subunit of the Signal Recognition Particle (SRP) +S000034550 noncoding_exon SCR1 5 441987 442508 W 2011-02-03 2000-05-19|2004-10-08 +S000077391 ARS ARS519 chromosome 5 5 442416 442735 2011-02-03 2004-10-19 Autonomously Replicating Sequence +S000006917 long_terminal_repeat YERWdelta17 chromosome 5 5 442734 443072 W 2011-02-03 2000-05-19 Ty1 LTR +S000006602 tRNA_gene tI(AAU)E1 chromosome 5 L000003801 5 443275 443202 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000037353 noncoding_exon tI(AAU)E1 5 443275 443202 C 2011-02-03 2000-05-19 +S000006898 long_terminal_repeat YERCdelta19 chromosome 5 5 443733 443397 C 2011-02-03 2000-05-19 Ty1 LTR +S000006919 long_terminal_repeat YERWdelta21 chromosome 5 5 444834 445139 W 2011-02-03 2000-05-19 Ty1 LTR +S000000940 transposable_element_gene YER138C gag-pol fusion protein chromosome 5 5 449024 443756 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000033407 CDS YER138C 5 447721 443756 C 2011-02-03 1996-07-31 +S000033406 CDS YER138C 5 449024 447723 C 2011-02-03 1996-07-31 +S000033408 plus_1_translational_frameshift YER138C 5 447722 447722 C 2011-02-03 1996-07-31 +S000007402 transposable_element_gene YER137C-A gag protein chromosome 5 5 449024 447702 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000034807 CDS YER137C-A 5 449024 447702 C 2011-02-03 1999-07-17 +S000006910 LTR_retrotransposon YERCTy1-1 Ty1 chromosome 5 5 449320 443397 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006899 long_terminal_repeat YERCdelta20 chromosome 5 5 449320 448984 C 2011-02-03 2000-05-19 Ty1 LTR +S000007239 ORF Uncharacterized YER138W-A chromosome 5 5 449474 449578 W 2011-02-03 1999-07-17 Putative protein of unknown function; YER138W-A has a paralog, YBL107W-A, that arose from a single-locus duplication +S000030980 CDS YER138W-A 5 449474 449578 W 2011-02-03 1999-07-17 +S000000941 ORF Verified YER139C RTR1 RNA polymerase II subunit B1 CTD phosphatase RTR1 chromosome 5 5 451243 450563 C 2011-02-03 1996-07-31 CTD phosphatase; dephosphorylates S5-P in the C-terminal domain of Rpo21p; has a cysteine-rich motif required for function and conserved in eukaryotes; shuttles between the nucleus and cytoplasm; RTR1 has a paralog, RTR2, that arose from the whole genome duplication +S000034331 CDS YER139C 5 451243 450563 C 2011-02-03 1996-07-31 +S000000942 ORF Verified YER140W EMP65 chromosome 5 5 451565 453235 W 2011-02-03 1996-07-31 Integral membrane protein of the ER; forms an ER-membrane associated protein complex with Slp1p; identified along with SLP1 in a screen for mutants defective in the unfolded protein response (UPR); proposed to function in the folding of integral membrane proteins; interacts genetically with MPS3; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000035305 CDS YER140W 5 451565 453235 W 2011-02-03 1996-07-31 +S000000943 ORF Verified YER141W COX15 chromosome 5 L000002578 5 453459 454919 W 2011-02-03 1996-07-31 Protein required for the hydroxylation of heme O to form heme A; heme A is an essential prosthetic group for cytochrome c oxidase +S000035366 CDS YER141W 5 453459 454919 W 2011-02-03 1996-07-31 +S000000944 ORF Verified YER142C MAG1 MMS5 chromosome 5 L000000976 5 456036 455146 C 110 2011-02-03 1996-07-31 3-methyl-adenine DNA glycosylase; involved in protecting DNA against alkylating agents; initiates base excision repair by removing damaged bases to create abasic sites that are subsequently repaired; protein abundance increases in response to DNA replication stress +S000035403 CDS YER142C 5 456036 455146 C 2011-02-03 1996-07-31 +S000000945 ORF Verified YER143W DDI1 VSM1 chromosome 5 L000004257 5 456319 457605 W 2011-02-03 1996-07-31 DNA damage-inducible v-SNARE binding protein; role in suppression of protein secretion; may play a role in S-phase checkpoint control; has ubiquitin-associated (UBA), ubiquitin-like (UBL), and retroviral-like proteinase (RVP) domains +S000035500 CDS YER143W 5 456319 457605 W 2011-02-03 1996-07-31 +S000000946 ORF Verified YER144C UBP5 putative ubiquitin-specific protease UBP5 chromosome 5 L000002419 5 460223 457806 C 2011-02-03 1996-07-31 Putative ubiquitin-specific protease; concentrates at the bud neck; UBP5 has a paralog, DOA4, that arose from the whole genome duplication +S000035528 CDS YER144C 5 460223 457806 C 2011-02-03 1996-07-31 +S000000947 ORF Verified YER145C FTR1 high-affinity iron permease FTR1 chromosome 5 L000003066 5 461740 460526 C 2011-02-03 1996-07-31 High affinity iron permease; involved in the transport of iron across the plasma membrane; forms complex with Fet3p; expression is regulated by iron; protein abundance increases in response to DNA replication stress +S000035592 CDS YER145C 5 461740 460526 C 2011-02-03 1996-07-31 +S000000948 ORF Verified YER146W LSM5 RNA-binding protein LSM5 chromosome 5 L000004684 5 462585 462866 W 2011-02-03 1996-07-31 Lsm (Like Sm) protein; part of heteroheptameric complexes (Lsm2p-7p and either Lsm1p or 8p): cytoplasmic Lsm1p complex involved in mRNA decay; nuclear Lsm8p complex part of U6 snRNP and possibly involved in processing tRNA, snoRNA, and rRNA +S000036550 CDS YER146W 5 462585 462866 W 2011-02-03 1996-07-31 +S000028758 ORF Dubious YER145C-A chromosome 5 5 462823 462386 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF LSM5/YER146W +S000033452 CDS YER145C-A 5 462823 462386 C 2011-02-03 2003-07-29 +S000000949 ORF Verified YER147C SCC4 cohesin-loading factor complex subunit SCC4 chromosome 5 5 464842 462968 C 2011-02-03 1996-07-31 Subunit of cohesin loading factor (Scc2p-Scc4p); complex is required for the loading of cohesin complexes onto chromosomes; involved in establishing sister chromatid cohesion during double-strand break repair via phosphorylated histone H2AX +S000036587 CDS YER147C 5 464842 462968 C 2011-02-03 1996-07-31 +S000000950 ORF Verified YER148W SPT15 TATA-binding protein|TBP|TBP1|BTF1 chromosome 5 L000002037 5 465303 466025 W 110 2011-02-03 1996-07-31 TATA-binding protein (TBP); general transcription factor that interacts with other factors to form the preinitiation complex at promoters; essential for viability, highly conserved; yeast gene can complement mutations in human homolog TBP +S000037378 CDS YER148W 5 465303 466025 W 2011-02-03 1996-07-31 +S000028759 ORF Dubious YER147C-A chromosome 5 5 465613 465203 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SPT15/YER148W +S000033453 CDS YER147C-A 5 465613 465203 C 2011-02-03 2003-07-29 +S000028760 ORF Dubious YER148W-A chromosome 5 5 466185 466763 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF PEA2/YER149C +S000033464 CDS YER148W-A 5 466185 466763 W 2011-02-03 2003-07-29 +S000000951 ORF Verified YER149C PEA2 PPF2|DFG9 chromosome 5 L000003143 5 467470 466208 C 2011-02-03 1996-07-31 Coiled-coil 12S polarisome subunit; required for polarity establishment, apical bud growth, shmoo formation, filamentous differentiation; involved in Bni1p localization at sites of polarized growth, controlling polarized assembly of actin cables; role in apical growth affects diploid-specific bipolar bud site selection; retains Slt2p at bud tip to regulate ER inheritance; role in Ca2+ influx, cell fusion; S288C allele encoding Leu409 rather than Met linked with non-invasion +S000037418 CDS YER149C 5 467470 466208 C 2011-02-03 1996-07-31 +S000000952 ORF Verified YER150W SPI1 chromosome 5 L000004852 5 468370 468816 W 2011-02-03 1996-07-31 GPI-anchored cell wall protein involved in weak acid resistance; basal expression requires Msn2p/Msn4p; expression is induced under conditions of stress and during the diauxic shift; SPI1 has a paralog, SED1, that arose from the whole genome duplication +S000030182 CDS YER150W 5 468370 468816 W 2011-02-03 1996-07-31 +S000006754 tRNA_gene tV(AAC)E2 chromosome 5 L000003797 5 469457 469530 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000035943 noncoding_exon tV(AAC)E2 5 469457 469530 W 2011-02-03 2000-05-19 +S000000953 ORF Verified YER151C UBP3 mRNA-binding ubiquitin-specific protease UBP3|BLM3 chromosome 5 L000002417|S000086717 5 472424 469686 C 2011-02-03 1996-07-31 Ubiquitin-specific protease involved in transport and osmotic response; negatively regulates Ras/PKA signaling; interacts with Bre5p to coregulate anterograde, retrograde transport between ER and Golgi; involved in transcription elongation in response to osmostress through phosphorylation at Ser695 by Hog1p; inhibitor of gene silencing; role in ribophagy; cleaves ubiquitin fusions but not polyubiquitin; protein abundance increases in response to DNA replication stress +S000030288 CDS YER151C 5 472424 469686 C 2011-02-03 1996-07-31 +S000028761 ORF Dubious YER152W-A chromosome 5 5 473485 474051 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YER152C +S000033465 CDS YER152W-A 5 473485 474051 W 2011-02-03 2003-07-29 +S000000954 ORF Verified YER152C 2-aminoadipate transaminase chromosome 5 5 473988 472657 C 2011-02-03 1996-07-31 Protein with 2-aminoadipate transaminase activity; shares amino acid similarity with the aminotransferases Aro8p and Aro9p; YER152C is not an essential gene +S000030401 CDS YER152C 5 473988 472657 C 2011-02-03 1996-07-31 +S000000955 ORF Verified YER153C PET122 chromosome 5 L000001397 5 474805 474041 C 118 2011-02-03 1996-07-31 Mitochondrial translational activator specific for the COX3 mRNA; acts together with Pet54p and Pet494p; located in the mitochondrial inner membrane +S000031314 CDS YER153C 5 474805 474041 C 2011-02-03 1996-07-31 +S000000956 ORF Verified YER154W OXA1 membrane insertase OXA1|PET1402 chromosome 5 L000001318 5 475020 476228 W 112 2011-02-03 1996-07-31 Mitochondrial inner membrane insertase; mediates the insertion of both mitochondrial- and nuclear-encoded proteins from the matrix into the inner membrane; also has a role in insertion of carrier proteins into the inner membrane; acts as a voltage-gated ion channel, activated by substrate peptides; interacts with mitochondrial ribosomes; conserved from bacteria to animals +S000031446 CDS YER154W 5 475020 476228 W 2011-02-03 1996-07-31 +S000000957 ORF Verified YER155C BEM2 TSL1|SUP9|IPL2 chromosome 5 L000000168 5 482848 476345 C 119 2011-02-03 1996-07-31 Rho GTPase activating protein (RhoGAP); involved in the control of cytoskeleton organization and cellular morphogenesis; required for bud emergence; potential GAP for Rho4p +S000031485 CDS YER155C 5 482848 476345 C 2011-02-03 1996-07-31 +S000000958 ORF Uncharacterized YER156C chromosome 5 5 484341 483325 C 2011-02-03 1996-07-31 Putative protein of unknown function; interacts with Hsp82p and copurifies with Ipl1p; expression is copper responsive and downregulated in strains deleted for MAC1, a copper-responsive transcription factor; similarity to mammalian MYG1 +S000031540 CDS YER156C 5 484341 483325 C 2011-02-03 1996-07-31 +S000000959 ORF Verified YER157W COG3 Golgi transport complex subunit COG3|SEC34|GRD20 chromosome 5 L000004876 5 484788 487193 W 2011-02-03 1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000032561 CDS YER157W 5 484788 487193 W 2011-02-03 1996-07-31 +S000006552 tRNA_gene tE(UUC)E3 chromosome 5 L000003800 5 487402 487331 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin +S000034442 noncoding_exon tE(UUC)E3 5 487402 487331 C 2011-02-03 2000-05-19 +S000006920 long_terminal_repeat YERWdelta22 chromosome 5 5 487834 488165 W 2011-02-03 2000-05-19 Ty1 LTR +S000000960 ORF Uncharacterized YER158C chromosome 5 5 490578 488857 C 2011-02-03 1996-07-31 Protein of unknown function; potentially phosphorylated by Cdc28p; YER158C has a paralog, AFR1, that arose from the whole genome duplication +S000032616 CDS YER158C 5 490578 488857 C 2011-02-03 1996-07-31 +S000028624 ORF Dubious YER158W-A chromosome 5 5 491487 491702 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031478 CDS YER158W-A 5 491487 491702 W 2011-02-03 2003-07-29 +S000000961 ORF Verified YER159C BUR6 negative cofactor 2 transcription regulator complex subunit BUR6|NCB1 chromosome 5 L000003240 5 491958 491530 C 2011-02-03 1996-07-31 Subunit of a heterodimeric NC2 transcription regulator complex; complex binds to TBP and can repress transcription by preventing preinitiation complex assembly or stimulate activated transcription; homologous to human NC2alpha; complex also includes Ncb2p; bur6 ncb2 double mutation is functionally complemented by coexpression of human DRAP1 and DR1, although the single bur6 mutation is not complemented by its ortholog DRAP1 +S000032723 CDS YER159C 5 491958 491530 C 2011-02-03 1996-07-31 +S000006701 tRNA_gene tR(ACG)E chromosome 5 L000003799 5 492424 492352 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 6 nuclear tRNA genes containing the tDNA-anticodon ACG (converted to ICG in the mature tRNA), decodes CGU, CGC, and probably CGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000030371 noncoding_exon tR(ACG)E 5 492424 492352 C 2011-02-03 2000-05-19 +S000006900 long_terminal_repeat YERCdelta23 chromosome 5 5 492833 492695 C 2011-02-03 2000-05-19 Ty1 LTR +S000000962 transposable_element_gene YER160C gag-pol fusion protein chromosome 5 5 498124 492856 C 2011-02-03 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000034492 CDS YER160C 5 496821 492856 C 2011-02-03 1996-07-31 +S000034491 CDS YER160C 5 498124 496823 C 2011-02-03 1996-07-31 +S000034493 plus_1_translational_frameshift YER160C 5 496822 496822 C 2011-02-03 1996-07-31 +S000007403 transposable_element_gene YER159C-A gag protein chromosome 5 5 498124 496802 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000030149 CDS YER159C-A 5 498124 496802 C 2011-02-03 1999-07-17 +S000006911 LTR_retrotransposon YERCTy1-2 Ty1 chromosome 5 5 498421 492695 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006901 long_terminal_repeat YERCdelta24 chromosome 5 5 498421 498084 C 2011-02-03 2000-05-19 Ty1 LTR +S000077392 ARS ARS520 chromosome 5 5 498884 499182 2014-11-18 2004-10-19|2014-11-18 Autonomously Replicating Sequence +S000178092 ARS_consensus_sequence ARS520 5 498884 498900 W 2014-11-18 2014-11-18 +S000000963 ORF Verified YER161C SPT2 EXA1|SIN1 chromosome 5 L000002028 5 500348 499347 C 127 2011-02-03 1996-07-31 Protein involved in negative regulation of transcription; required for RNA polyadenylation; exhibits regulated interactions with both histones and SWI-SNF components; relocalizes to the cytosol in response to hypoxia; similar to mammalian HMG1 proteins +S000034600 CDS YER161C 5 500348 499347 C 2011-02-03 1996-07-31 +S000000964 ORF Verified YER162C RAD4 chromosome 5 L000001558 5 502894 500630 C 128 2011-02-03 1996-07-31|2011-02-03 Protein that recognizes and binds damaged DNA (with Rad23p) during NER; subunit of Nuclear Excision Repair Factor 2 (NEF2); also involved, with Rad23p, in turnover of ubiquitylated proteins; Rad4p-Rad23p heterodimer binds to promoters of DNA damage response genes to repress their transcription in the absence of DNA damage; NER stands for nucleotide excision repair +S000034668 CDS YER162C 5 502894 500630 C 2011-02-03 1996-07-31|2011-02-03 +S000000965 ORF Verified YER163C GCG1 gamma-glutamylcyclotransferase chromosome 5 5 503782 503084 C 2011-02-03 1996-07-31 Gamma-glutamyl cyclotransferase; cleaves the gamma-glutamyl bond of glutathione to yield 5-oxoproline and a Cys-Gly dipeptide; similar to mammalian pro-apoptotic protein ChaC1; expression of mouse ChaC1 in yeast increases apoptosis; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; periodically expressed during the metabolic cycle +S000034748 CDS YER163C 5 503782 503084 C 2011-02-03 1996-07-31 +S000000966 ORF Verified YER164W CHD1 chromatin-remodeling ATPase CHD1 chromosome 5 L000003467 5 505392 509798 W 2011-02-03 1996-07-31 Chromatin remodeler that regulates various aspects of transcription; acts in in conjunction with Isw1b to regulate chromatin structure and maintain chromatin integrity during transcription elongation by RNAP II by preventing trans-histone exchange over coding regions; contains a chromo domain, a helicase domain and a DNA-binding domain; component of both the SAGA and SLIK complexes +S000035707 CDS YER164W 5 505392 509798 W 2011-02-03 1996-07-31 +S000000967 ORF Verified YER165W PAB1 polyadenylate-binding protein chromosome 5 L000001327 5 510373 512106 W 2011-02-03 1996-07-31 Poly(A) binding protein; part of the 3'-end RNA-processing complex, mediates interactions between the 5' cap structure and the 3' mRNA poly(A) tail, involved in control of poly(A) tail length, interacts with translation factor eIF-4G; stimulates, but is not required for the deadenylation activity of the Pan2p-Pan3p poly(A)-ribonuclease complex +S000035793 CDS YER165W 5 510373 512106 W 2011-02-03 1996-07-31 +S000000968 ORF Verified YER166W DNF1 aminophospholipid-translocating P4-type ATPase DNF1 chromosome 5 5 512744 517459 W 2011-02-03 1996-07-31 Aminophospholipid translocase (flippase); type 4 P-type ATPase; involved in phospholipid translocation, contributing to endocytosis, protein transport, and cellular polarization; localizes primarily to the plasma membrane; localizes to the shmoo tip where it has a redundant role in the cellular response to mating pheromone; DNF1 has a paralog, DNF2, that arose from the whole genome duplication +S000035898 CDS YER166W 5 512744 517459 W 2011-02-03 1996-07-31 +S000028762 ORF Dubious YER165C-A chromosome 5 5 512983 512627 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene DNF1/YER166W +S000033466 CDS YER165C-A 5 512983 512627 C 2011-02-03 2003-07-29 +S000000969 ORF Verified YER167W BCK2 CTR7 chromosome 5 L000000163 5 518216 520771 W 2011-02-03 1996-07-31 Serine/threonine-rich protein involved in PKC1 signaling pathway; protein kinase C (PKC1) signaling pathway controls cell integrity; overproduction suppresses pkc1 mutations +S000036791 CDS YER167W 5 518216 520771 W 2011-02-03 1996-07-31 +S000077393 ARS ARS521 chromosome 5 5 520772 521030 2011-02-03 2004-10-19 Autonomously Replicating Sequence +S000000970 ORF Verified YER168C CCA1 tRNA adenylyltransferase|TNT1 chromosome 5 L000000232 5 522669 521029 C 2011-02-03 1996-07-31 ATP (CTP):tRNA-specific tRNA nucleotidyltransferase; different forms targeted to the nucleus, cytosol, and mitochondrion are generated via the use of multiple transcriptional and translational start sites; human homolog TRNT1 complements yeast null mutant +S000036817 CDS YER168C 5 522669 521029 C 2011-02-03 1996-07-31 +S000000971 ORF Verified YER169W RPH1 KDM4 chromosome 5 L000004504 5 523369 525759 W 2011-02-03 1996-07-31 JmjC domain-containing histone demethylase; targets tri- and dimethylated H3K36; associates with actively transcribed regions and promotes elongation; repressor of autophagy-related genes in nutrient-replete conditions; damage-responsive repressor of PHR1; phosphorylated by the Rad53p-dependent DNA damage checkpoint pathway and by a Rim1p-mediated event during starvation; target of stress-induced hormesis; RPH1 has a paralog, GIS1, that arose from the whole genome duplication +S000036928 CDS YER169W 5 523369 525759 W 2011-02-03 1996-07-31 +S000000972 ORF Verified YER170W ADK2 adenylate kinase ADK2|PAK3|AKY3 chromosome 5 L000000047 5 525974 526651 W 146 2011-02-03 1996-07-31 Mitochondrial adenylate kinase; catalyzes the reversible synthesis of GTP and AMP from GDP and ADP; may serve as a back-up for synthesizing GTP or ADP depending on metabolic conditions; 3' sequence of ADK2 varies with strain background +S000036684 CDS YER170W 5 525974 526651 W 2011-02-03 1996-07-31 +S000000973 ORF Verified YER171W RAD3 TFIIH/NER complex ATP-dependent 5'-3' DNA helicase subunit RAD3|REM1 chromosome 5 L000001557 5 527082 529418 W 146 2011-02-03 1996-07-31 5' to 3' DNA helicase; involved in nucleotide excision repair and transcription; subunit of RNA polII initiation factor TFIIH and of Nucleotide Excision Repair Factor 3 (NEF3); homolog of human XPD protein; mutant has aneuploidy tolerance; protein abundance increases in response to DNA replication stress +S000036770 CDS YER171W 5 527082 529418 W 2011-02-03 1996-07-31 +S000000974 ORF Verified YER172C BRR2 ATP-dependent RNA helicase BRR2|PRP44|SNU246|SLT22|RSS1 chromosome 5 L000003100|L000003283 5 536021 529530 C 2011-02-03 1996-07-31 RNA-dependent ATPase RNA helicase (DEIH box); required for disruption of U4/U6 base-pairing in native snRNPs to activate the spliceosome for catalysis; homologous to human U5-200kD +S000030569 CDS YER172C 5 536021 529530 C 2011-02-03 1996-07-31 +S000000975 ORF Verified YER173W RAD24 RS1 chromosome 5 L000001777 5 536300 538279 W 147 2011-02-03 1996-07-31 Checkpoint protein; involved in the activation of the DNA damage and meiotic pachytene checkpoints; subunit of a clamp loader that loads Rad17p-Mec3p-Ddc1p onto DNA; homolog of human and S. pombe Rad17 protein +S000030767 CDS YER173W 5 536300 538279 W 2011-02-03 1996-07-31 +S000028763 ORF Dubious YER172C-A chromosome 5 5 536655 536275 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF RAD24/YER173W +S000033467 CDS YER172C-A 5 536655 536275 C 2011-02-03 2003-07-29 +S000000976 ORF Verified YER174C GRX4 monothiol glutaredoxin GRX4 chromosome 5 S000007445 5 539168 538434 C 2011-02-03 1996-07-31 Glutathione-dependent oxidoreductase; hydroperoxide and superoxide-radical responsive; monothiol glutaredoxin subfamily member along with Grx3p and Grx5p; protects cells from oxidative damage; with Grx3p, binds to Aft1p in iron-replete conditions, promoting its dissociation from promoters; mutant has increased aneuploidy tolerance; transcription regulated by Yap5p; GRX4 has a paralog, GRX3, that arose from the whole genome duplication +S000030799 CDS YER174C 5 539168 538434 C 2011-02-03 1996-07-31 +S000000977 ORF Verified YER175C TMT1 TAM1 chromosome 5 5 540363 539464 C 2011-02-03 1996-07-31 Trans-aconitate methyltransferase; cytosolic enzyme that catalyzes the methyl esterification of 3-isopropylmalate, an intermediate of the leucine biosynthetic pathway, and trans-aconitate, which inhibits the citric acid cycle +S000031738 CDS YER175C 5 540363 539464 C 2011-02-03 1996-07-31 +S000028625 ORF Uncharacterized YER175W-A chromosome 5 5 540650 540814 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031479 CDS YER175W-A 5 540650 540814 W 2011-02-03 2003-07-29 +S000000978 ORF Verified YER176W ECM32 MTT1|HEL1 chromosome 5 L000003934 5 541690 545055 W 2011-02-03 1996-07-31 DNA dependent ATPase/DNA helicase; helicase belonging to the Dna2p- and Nam7p-like family of helicases that is involved in modulating translation termination; interacts with the translation termination factors, localized to polysomes +S000032015 CDS YER176W 5 541690 545055 W 2011-02-03 1996-07-31 +S000000979 ORF Verified YER177W BMH1 14-3-3 family protein BMH1|APR6 chromosome 5 L000000185 5 545611 546414 W 148 2011-02-03 1996-07-31 14-3-3 protein, major isoform; controls proteome at post-transcriptional level, binds proteins and DNA, involved in regulation of exocytosis, vesicle transport, Ras/MAPK and rapamycin-sensitive signaling, aggresome formation, spindle position checkpoint; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress; antiapoptotic gene similar to human 14-3-3; BMH1 has a paralog, BMH2, that arose from whole genome duplication +S000032121 CDS YER177W 5 545611 546414 W 2011-02-03 1996-07-31 +S000000980 ORF Verified YER178W PDA1 pyruvate dehydrogenase (acetyl-transferring) subunit E1 alpha chromosome 5 L000001352 5 546817 548079 W 143 2011-02-03 2003-09-22|1996-07-31 E1 alpha subunit of the pyruvate dehydrogenase (PDH) complex; catalyzes the direct oxidative decarboxylation of pyruvate to acetyl-CoA; phosphorylated; regulated by glucose; PDH complex is concentrated in spots within the mitochondrial matrix, often near the ERMES complex and near peroxisomes +S000033032 CDS YER178W 5 546817 548079 W 2011-02-03 2003-09-22|1996-07-31 +S000000981 ORF Verified YER179W DMC1 recombinase DMC1|ISC2 chromosome 5 L000000509 5 548421 549517 W 2011-02-03 1996-07-31 Meiosis-specific recombinase required for double-strand break repair; also required for pairing between homologous chromosomes; required for the normal morphogenesis of synaptonemal complex; homolog of Rad51p and the bacterial RecA protein; binds ssDNA and dsDNA, forms helical filaments; stimulated by Rdh54p +S000033128 CDS YER179W 5 548421 548552 W 2011-02-03 1996-07-31 +S000033129 CDS YER179W 5 548645 549517 W 2011-02-03 1996-07-31 +S000033130 intron YER179W 5 548553 548644 W 2011-02-03 1996-07-31 +S000077394 ARS ARS522 ARSV-550|ARS501 chromosome 5 5 549566 549814 2011-02-03 2004-10-19|2006-09-07 Autonomously Replicating Sequence; active origin of replication near the right end of Chromosome V that is activated late in S phase, late activation appears to result from telomeric proximity +S000000982 ORF Verified YER180C ISC10 chromosome 5 L000000876 5 550527 549724 C 2011-02-03 1996-07-31 Protein required for sporulation; transcript is induced 7.5 hours after induction of meiosis, expected to play significant role in the formation of reproductive cells +S000032813 CDS YER180C 5 550527 549724 C 2011-02-03 1996-07-31 +S000028437 ORF Verified YER180C-A SLO1 chromosome 5 S000028475 5 551122 550865 C 2011-02-03 2003-03-07 Protein interacting with Arl3p; Arl3p is a GTPase of the Ras superfamily involved in vesicle-tethering at the Golgi; putative ortholog of human SCOCO +S000030116 CDS YER180C-A 5 551122 550865 C 2011-02-03 2003-03-07 +S000006603 tRNA_gene tI(AAU)E2 chromosome 5 L000003798 5 551358 551285 C 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000037354 noncoding_exon tI(AAU)E2 5 551358 551285 C 2011-02-03 2000-05-19 +S000006921 long_terminal_repeat YERWdelta25 chromosome 5 5 551442 551773 W 2011-02-03 2000-05-19 Ty1 LTR +S000000983 ORF Verified YER181C chromosome 5 5 551796 551473 C 2011-02-03 1996-07-31 Mitochondrial protein of unknown function; conserved among S. cerevisiae strains; extensively overlaps a Ty1 LTR; YER181C is not an essential gene +S000032942 CDS YER181C 5 551796 551473 C 2011-02-03 1996-07-31 +S000006902 long_terminal_repeat YERCdelta26 chromosome 5 5 552267 552040 C 2011-02-03 2000-05-19 Ty1 LTR +S000000984 ORF Uncharacterized YER182W FMP10 chromosome 5 5 552525 553259 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000034960 CDS YER182W 5 552525 553259 W 2011-02-03 1996-07-31 +S000000985 ORF Verified YER183C FAU1 5-formyltetrahydrofolate cyclo-ligase chromosome 5 5 553969 553334 C 2011-02-03 1996-07-31 5,10-methenyltetrahydrofolate synthetase; involved in folic acid biosynthesis +S000035021 CDS YER183C 5 553969 553334 C 2011-02-03 1996-07-31 +S000000986 ORF Verified YER184C TOG1 chromosome 5 5 558680 556296 C 2011-02-03 1996-07-31 Transcriptional activator of oleate genes; regulates genes involved in fatty acid utilization; zinc cluster protein; deletion confers sensitivity to Calcufluor white, and prevents growth on glycerol or lactate as sole carbon source +S000035120 CDS YER184C 5 558680 556296 C 2011-02-03 1996-07-31 +S000000987 ORF Verified YER185W PUG1 chromosome 5 5 559454 560365 W 2011-02-03 1996-07-31 Plasma membrane protein involved in protoprophyrin and heme transport; roles in the uptake of protoprophyrin IX and the efflux of heme; expression is induced under both low-heme and low-oxygen conditions; member of the fungal lipid-translocating exporter (LTE) family of proteins +S000036056 CDS YER185W 5 559454 560365 W 2011-02-03 1996-07-31 +S000000988 ORF Uncharacterized YER186C chromosome 5 5 562625 561705 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000036102 CDS YER186C 5 562625 561705 C 2011-02-03 1996-07-31 +S000006903 long_terminal_repeat YERComega1 chromosome 5 5 564024 563928 C 2011-02-03 2000-05-19 Ty5 LTR +S000000989 ORF Uncharacterized YER187W chromosome 5 5 566230 566655 W 2011-02-03 1996-07-31 Putative protein of unknown function; induced in respiratory-deficient cells +S000031676 CDS YER187W 5 566230 566655 W 2011-02-03 1996-07-31 +S000000990 ORF Dubious YER188W chromosome 5 5 568040 568759 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; large-scale analyses show mRNA expression increases under anaerobic conditions and two-hybrid interactions with Sst2p +S000031818 CDS YER188W 5 568040 568759 W 2011-02-03 1996-07-31 +S000006922 long_terminal_repeat YERWomega2 chromosome 5 5 568791 569024 W 2011-02-03 2000-05-19 Ty5 LTR +S000028953 telomere TEL05R chromosome 5 5 569599 576874 W 151 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome V; annotated components include an X element core sequence, X element combinatorial repeats, and a long Y' element; TEL05R does have telomeric repeats (TEL05R-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly +S000028954 X_element TEL05R 5 569599 570060 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome V; contains an ARS consensus sequence, an Abf1p binding site consensus sequence, and ORF YER188C-A +S000028955 X_element_combinatorial_repeat TEL05R 5 570061 570329 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr V; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; Formerly called SubTelomeric Repeats +S000028956 Y_prime_element TEL05R 5 570330 576874 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome V; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs (YRF1-2/YER190W, YER189W, YER190C-A, YER190C-B) +S000077395 ARS ARS523 chromosome 5 5 569618 569695 2014-11-18 2014-11-18|2004-10-19 Autonomously Replicating Sequence +S000178093 ARS_consensus_sequence ARS523 5 569629 569645 W 2014-11-18 2014-11-18 +S000028764 ORF Uncharacterized YER188C-A chromosome 5 5 569907 569608 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000033468 CDS YER188C-A 5 569907 569608 C 2011-02-03 2003-07-29 +S000000991 ORF Uncharacterized YER189W chromosome 5 5 571155 571523 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000031933 CDS YER189W 5 571155 571523 W 2011-02-03 1996-07-31 +S000000992 ORF Verified YER190W YRF1-2 Y' element ATP-dependent helicase protein 1 copy 2|YRF1 chromosome 5 5 571480 576525 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000036410 CDS YER190W 5 571480 576525 W 2011-02-03 1996-07-31 +S000028626 ORF Dubious YER190C-A chromosome 5 5 575379 574804 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF YRF1-2/YER190W; identified by gene-trapping, expression analysis, and homology +S000031482 CDS YER190C-A 5 575379 574804 C 2011-02-03 2003-07-29 +S000028627 ORF Uncharacterized YER190C-B chromosome 5 5 576162 575680 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031484 CDS YER190C-B 5 576162 575680 C 2011-02-03 2003-07-29 +S000001826 ORF Uncharacterized YFL068W chromosome 6 6 53 535 W 1996-07-31 1996-07-31 Putative protein of unknown function; SWAT-GFP and mCherry fusion proteins localize to the cytosol +S000030466 CDS YFL068W 6 53 535 W 1996-07-31 1996-07-31 +S000001827 ORF Uncharacterized YFL067W chromosome 6 6 836 1363 W 1996-07-31 1996-07-31 Protein of unknown function; down-regulated at low calcium levels; mCherry fusion protein localizes to the vacuole +S000037641 CDS YFL067W 6 836 1363 W 1996-07-31 1996-07-31 +S000001828 ORF Uncharacterized YFL066C Y' element ATP-dependent helicase chromosome 6 6 2615 1437 C 1996-07-31 1996-07-31 Helicase-like protein encoded within the telomeric Y' element; induced by treatment with 8-methoxypsoralen and UVA irradiation; SWAT-GFP and mCherry fusion proteins localize to the nucleus +S000037520 CDS YFL066C 6 2615 1437 C 1996-07-31 1996-07-31 +S000001829 ORF Uncharacterized YFL065C chromosome 6 6 3338 3030 C 1996-07-31 1996-07-31 Putative protein of unknown function; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000037426 CDS YFL065C 6 3338 3030 C 1996-07-31 1996-07-31 +S000001830 ORF Uncharacterized YFL064C chromosome 6 6 3846 3322 C 1996-07-31 1996-07-31 Putative protein of unknown function +S000031930 CDS YFL064C 6 3846 3322 C 1996-07-31 1996-07-31 +S000001831 ORF Dubious YFL063W chromosome 6 6 5066 5521 W 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031881 CDS YFL063W 6 5066 5521 W 1996-07-31 1996-07-31 +S000029653 ARS ARS600 ARS600 ARS600.1|ARS120 chromosome 6 L000000123 6 5426 5529 2014-11-18 2014-11-18|2006-03-02 Subtelomeric Autonomously Replicating Sequence; originally published as ARS120 +S000114519 ARS_consensus_sequence ARS600 6 5492 5482 C 2006-03-02 2006-03-02 +S000028882 telomere TEL06L chromosome 6 6 5530 1 C -60 2003-09-09 2003-09-09|2011-02-03 Telomeric region on the left arm of Chromosome VI; composed of an X element core sequence, X element combinatorial repeats, a stretch of telomeric repeats, and a short Y' element +S000028883 telomeric_repeat TEL06L 6 4819 4685 C 2003-09-09 2003-09-09 Internal telomeric repeats on the left arm of Chromosome VI +S000028884 X_element TEL06L 6 5530 5068 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome VI; contains an ARS consensus sequence, an Abf1p binding site consensus sequence and ORF YFL063W +S000028885 X_element_combinatorial_repeat TEL06L 6 5067 4820 C 2003-09-09 2003-09-09|2011-02-03 Telomeric X element combinatorial repeat on the left arm of Chr VI; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000028886 Y_prime_element TEL06L 6 4684 1 C 2003-09-09 2003-09-09 Telomeric short Y' element on the left arm of Chromosome VI; contains a region of 36-bp repeats and five ORFs (YFL064C, YFL065C, YFL066C, YFL067W, YFL068W) +S000001832 ORF Verified YFL062W COS4 chromosome 6 L000004062 6 6426 7565 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000031765 CDS YFL062W 6 6426 7565 W 1996-07-31 1996-07-31 +S000001833 ORF Verified YFL061W DDI2 cyanamide hydratase chromosome 6 6 9545 10222 W 1996-07-31 1996-07-31 Cyanamide hydratase that detoxifies cyanamide; member of the HD domain metalloprotein superfamily; expression is induced over 100-fold by cyanamide and by SN2-type DNA alkylating agents such as MMS and DMA; induction decreased in rad6 and rad18 mutants; gene and protein are identical to DDI3 and Ddi3p +S000036244 CDS YFL061W 6 9545 10222 W 1996-07-31 1996-07-31 +S000001834 ORF Verified YFL060C SNO3 putative pyridoxal 5'-phosphate synthase chromosome 6 L000003453 6 10969 10301 C 1996-07-31 1996-07-31 Protein of unknown function; nearly identical to Sno2p; expression is induced before the diauxic shift and also in the absence of thiamin +S000036055 CDS YFL060C 6 10969 10301 C 1996-07-31 1996-07-31 +S000001835 ORF Verified YFL059W SNZ3 pyridoxine biosynthesis protein SNZ3 chromosome 6 L000002577 6 11363 12259 W 1996-07-31 1996-07-31 Member of a stationary phase-induced gene family; expressed in the presence of galactose; transcription of SNZ3 is induced prior to diauxic shift, and also in the absence of thiamin in a Thi2p-dependent manner; forms a coregulated gene pair with SNO3 +S000035247 CDS YFL059W 6 11363 12259 W 1996-07-31 1996-07-31 +S000001836 ORF Verified YFL058W THI5 4-amino-5-hydroxymethyl-2-methylpyrimidine phosphate synthase chromosome 6 L000002850 6 12929 13951 W 1996-07-31 1996-07-31 Protein involved in synthesis of the thiamine precursor HMP; member of a subtelomeric gene family including THI5, THI11, THI12, and THI13; hydroxymethylpyrimidine is also known as HMP +S000035156 CDS YFL058W 6 12929 13951 W 1996-07-31 1996-07-31 +S000001838 pseudogene YFL056C AAD6 YFL057C chromosome 6 L000004638 6 15431 14305 C 2014-11-18 1996-07-31|2014-11-18 Putative aryl-alcohol dehydrogenase; involved in oxidative stress response; similar to P. chrysosporium aryl-alcohol dehydrogenase; ORFs AAD6/YFL056C and AAD16/YFL057C are displaced from one another by -1 frameshift; members of the AAD gene family comprise three pairs (AAD3 + AAD15, AAD6/AAD16 + AAD4, AAD10 + AAD14) whose two genes are more related to one another than to other members of the family; expression induced in cells treated with the mycotoxin patulin +S000034007 CDS YFL056C 6 15431 14305 C 2014-11-18 1996-07-31|2014-11-18 +S000001839 ORF Verified YFL055W AGP3 chromosome 6 L000003948 6 17004 18680 W 1996-07-31 1996-07-31 Low-affinity amino acid permease; may act to supply the cell with amino acids as nitrogen source in nitrogen-poor conditions; transcription is induced under conditions of sulfur limitation; plays a role in regulating Ty1 transposition +S000033961 CDS YFL055W 6 17004 18680 W 1996-07-31 1996-07-31 +S000178094 ARS ARS600.4 chromosome 6 6 20702 20900 2014-11-18 2014-11-18 Strong autonomously replicating sequence +S000001840 ORF Uncharacterized YFL054C AQY3 chromosome 6 6 22787 20847 C 1996-07-31 1996-07-31 Putative channel-like protein; similar to Fps1p; mediates passive diffusion of glycerol in the presence of ethanol +S000033120 CDS YFL054C 6 22787 20847 C 1996-07-31 1996-07-31 +S000001841 ORF Verified YFL053W DAK2 dihydroxyacetone kinase chromosome 6 L000004204 6 23423 25198 W 1996-07-31 1996-07-31 Dihydroxyacetone kinase; required for detoxification of dihydroxyacetone (DHA); involved in stress adaptation +S000033090 CDS YFL053W 6 23423 25198 W 1996-07-31 1996-07-31 +S000001842 ORF Verified YFL052W ZNF1 DNA-binding domain containing protein|ROP1 chromosome 6 6 28232 29629 W 1996-07-31 1996-07-31 Zinc cluster transcription factor that regulates respiratory growth; binds to promoters of genes involved in respiration, gluconeogenesis, and the glyoxylate shunt; required for normal carbon source utilization and stress response +S000032997 CDS YFL052W 6 28232 29629 W 1996-07-31 1996-07-31 +S000001843 ORF Uncharacterized YFL051C chromosome 6 6 30540 30058 C 1996-07-31 1996-07-31 Putative protein of unknown function; SWAT-GFP fusion protein localizes to the cell periphery while mCherry fusion protein localizes to both the cell periphery and vacuole; YFL051C is not an essential gene +S000032013 CDS YFL051C 6 30540 30058 C 1996-07-31 1996-07-31 +S000007633 ARS ARS601 ARS601 chromosome 6 6 32473 32995 2001-03-02 2001-03-02 Autonomously replicating sequence on Chromosome VI; overlaps ARS602, ARS601/ARS602 together appear to be activated during the second half of S phase in ~32% of cell cycles +S000121262 ARS_consensus_sequence ARS601 6 32708 32718 W 2007-03-08 2007-03-08 +S000007634 ARS ARS602 ARS602 chromosome 6 6 32667 33247 2001-03-02 2001-03-02 Autonomously replicating sequence on Chromosome VI; overlaps ARS601, ARS601/ARS602 together appear to be activated during the second half of S phase in ~32% of cell cycles +S000121263 ARS_consensus_sequence ARS602 6 32970 32960 C 2007-03-08 2007-03-08 +S000001844 ORF Verified YFL050C ALR2 putative Mg(2+) transporter ALR2 chromosome 6 L000002888 6 35848 33272 C 1996-07-31 1996-07-31 Probable Mg(2+) transporter; overexpression confers increased tolerance to Al(3+) and Ga(3+) ions; plays a role in regulating Ty1 transposition +S000031839 CDS YFL050C 6 35848 33272 C 1996-07-31 1996-07-31 +S000001845 ORF Verified YFL049W SWP82 chromosome 6 6 36803 38674 W 1996-07-31 1996-07-31 Member of the SWI/SNF chromatin remodeling complex; has an as yet unidentified role in the complex; has identifiable counterparts in closely related yeast species; abundantly expressed in many growth conditions; paralog of Npl6p; relocates to the cytosol under hypoxic conditions +S000030907 CDS YFL049W 6 36803 38674 W 1996-07-31 1996-07-31 +S000001846 ORF Verified YFL048C EMP47 chromosome 6 L000002804 6 40180 38843 C 1996-07-31 1996-07-31 Integral membrane component of ER-derived COPII-coated vesicles; functionS in ER to Golgi transport; EMP47 has a paralog, EMP46, that arose from the whole genome duplication +S000030785 CDS YFL048C 6 40180 38843 C 1996-07-31 1996-07-31 +S000001847 ORF Verified YFL047W RGD2 chromosome 6 6 40421 42565 W 1996-07-31 1996-07-31 GTPase-activating protein (RhoGAP) for Cdc42p and Rho5p; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000037893 CDS YFL047W 6 40421 42565 W 1996-07-31 1996-07-31 +S000001848 ORF Verified YFL046W FMP32 chromosome 6 6 42815 43438 W 1996-07-31 1996-07-31 Putative assembly factor for cytochrome c oxidase; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; has similarity to human MCUR1/CCDC90A +S000037798 CDS YFL046W 6 42815 43438 W 1996-07-31 1996-07-31 +S000001849 ORF Verified YFL045C SEC53 phosphomannomutase SEC53|ALG4 chromosome 6 L000001849 6 44392 43628 C 1996-07-31 1996-07-31 Phosphomannomutase; involved in synthesis of GDP-mannose and dolichol-phosphate-mannose; required for folding and glycosylation of secretory proteins in the ER lumen +S000037699 CDS YFL045C 6 44392 43628 C 1996-07-31 1996-07-31 +S000001850 ORF Verified YFL044C OTU1 ubiquitin-specific protease OTU1|YOD1 chromosome 6 6 45560 44655 C 1996-07-31 1996-07-31 Deubiquitylation enzyme that binds to the chaperone-ATPase Cdc48p; may contribute to regulation of protein degradation by deubiquitylating substrates that have been ubiquitylated by Ufd2p; member of the Ovarian Tumor (OTU) family; protein abundance increases in response to DNA replication stress +S000036927 CDS YFL044C 6 45560 44655 C 1996-07-31 1996-07-31 +S000001852 ORF Verified YFL042C LAM5 LTC2|YFL043C chromosome 6 6 47744 45720 C 2001-05-29 2001-05-29|1996-07-31 Putative sterol transfer protein; one of six StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes; has both GRAM and StART-like (VASt) domains; localizes to membrane contact sites throughout the cell, including nucleus-vacuole junctions and ER-mitochondrial contact sites +S000036790 CDS YFL042C 6 47744 45720 C 2001-05-29 2001-05-29|1996-07-31 +S000028547 ORF Uncharacterized YFL041W-A chromosome 6 6 48734 48925 W 2003-07-29 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031197 CDS YFL041W-A 6 48734 48925 W 2003-07-29 2003-07-29 +S000001853 ORF Verified YFL041W FET5 ferroxidase FET5 chromosome 6 L000002773 6 49139 51007 W 2001-05-29 1996-07-31 Multicopper oxidase; integral membrane protein with similarity to Fet3p; may have a role in iron transport +S000035986 CDS YFL041W 6 49139 51007 W 2001-05-29 1996-07-31 +S000001854 ORF Uncharacterized YFL040W chromosome 6 6 51350 52972 W 2001-05-29 1996-07-31 Putative transporter; member of the sugar porter family; YFL040W is not an essential gene; may have a role in intracellular sterol transport +S000035851 CDS YFL040W 6 51350 52972 W 2001-05-29 1996-07-31 +S000001855 ORF Verified YFL039C ACT1 actin|ABY1|END7 chromosome 6 L000000025 6 54696 53260 C -59 2011-02-03 1996-07-31|2011-02-03 Actin; structural protein involved in cell polarization, endocytosis, and other cytoskeletal functions +S000034732 CDS YFL039C 6 54377 53260 C 2001-05-29 1996-07-31 +S000034731 CDS YFL039C 6 54696 54687 C 2011-02-03 1996-07-31 +S000034733 intron YFL039C 6 54686 54378 C 2011-02-03 1996-07-31|2011-02-03 +S000001856 ORF Verified YFL038C YPT1 Rab family GTPase YPT1|YP2 chromosome 6 L000002543 6 55986 55366 C -59 2011-02-03 1996-07-31 Rab family GTPase; involved in the ER-to-Golgi step of the secretory pathway; complex formation with the Rab escort protein Mrs6p is required for prenylation of Ypt1p by type II protein geranylgeranyltransferase (Bet2p-Bet4p); binds to unspliced HAC1 mRNA; regulates the unfolded protein response (UPR) by promoting the decay of HAC1 RNA; localizes to the early Golgi, the transitional Golgi and ER membranes, pre-autophagosomal structures, and cytoplasmic vesicles +S000033828 CDS YFL038C 6 55986 55366 C 2011-02-03 1996-07-31 +S000001857 ORF Verified YFL037W TUB2 beta-tubulin|SHE8|ARM10 chromosome 6 L000002388 6 56336 57709 W -59 2011-02-03 1996-07-31 Beta-tubulin; associates with alpha-tubulin (Tub1p and Tub3p) to form tubulin dimer, which polymerizes to form microtubules; mutation in human ortholog is associated with congenital fibrosis of the extraocular muscles (CFEOM) with polymicrogyria +S000033779 CDS YFL037W 6 56336 57709 W 2011-02-03 1996-07-31 +S000130129 ncRNA_gene RUF21 RUF21 chromosome 6 6 58521 57815 C 2011-02-03 2009-05-04|2011-02-03 RNA of Unknown Function +S000130130 noncoding_exon RUF21 6 58521 57815 C 2011-02-03 2009-05-04|2011-02-03 +S000001858 ORF Verified YFL036W RPO41 DNA-directed RNA polymerase chromosome 6 L000001747 6 58782 62837 W 2011-02-03 1996-07-31 Mitochondrial RNA polymerase; single subunit enzyme similar to those of T3 and T7 bacteriophages; requires a specificity subunit encoded by MTF1 for promoter recognition; Mtf1p interacts with and stabilizes the Rpo41p-promoter complex, enhancing DNA bending and melting to facilitate pre-initiation open complex formation; Rpo41p also synthesizes RNA primers for mitochondrial DNA replication +S000033655 CDS YFL036W 6 58782 62837 W 2011-02-03 1996-07-31 +S000001859 ORF Verified YFL034C-B MOB2 YFL035C-A|YFL035C chromosome 6 L000003535|S000007658|S000002966 6 63993 63016 C 2011-02-03 1996-07-31 Activator of Cbk1p kinase; component of the RAM signaling network that regulates cellular polarity and morphogenesis; activation of Cbk1p facilitates the Ace2p-dependent daughter cell-specific transcription of genes involved in cell separation; similar to Mob1p +S000036508 CDS YFL034C-B 6 63859 63016 C 2011-02-03 1996-07-31 +S000036507 CDS YFL034C-B 6 63993 63974 C 2011-02-03 1996-07-31 +S000036509 intron YFL034C-B 6 63973 63860 C 2011-02-03 1996-07-31 +S000006436 ORF Verified YFL034C-A RPL22B eL22|ribosomal 60S subunit protein L22B|L22e|rp4|l1c|YL31|L22B|YFL035C-B chromosome 6 L000004513|S000002967 6 64932 64243 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L22A; required for translation of long 5' UTR of IME1 mRNA and meiotic entry; homologous to mammalian ribosomal protein L22, no bacterial homolog; RPL22B has a paralog, RPL22A, that arose from the whole genome duplication +S000036495 CDS YFL034C-A 6 64599 64243 C 2011-02-03 1996-07-31 +S000036494 CDS YFL034C-A 6 64932 64921 C 2011-02-03 1996-07-31 +S000036496 intron YFL034C-A 6 64920 64600 C 2011-02-03 1996-07-31 +S000001860 ORF Uncharacterized YFL034W MIL1 chromosome 6 6 65477 68698 W 2011-02-03 1996-07-31|2011-02-03 Predicted lipase; binds variant medium clathrin chain Apm2p and contributes to its membrane recruitment; putative integral membrane protein that interacts with Rpp0p component of ribosomal stalk +S000032866 CDS YFL034W 6 65477 68698 W 2011-02-03 1996-07-31|2011-02-03 +S000007635 ARS ARS603 ARS603 chromosome 6 6 68759 68861 2014-11-18 2001-03-02|2014-11-18 Highly-efficient autonomously replicating sequence on Chromosome VI; activated during the second half of S phase in ~67% of cell cycles +S000121268 ARS_consensus_sequence ARS603 6 68829 68839 W 2011-02-03 2007-03-08 +S000121269 ARS_consensus_sequence ARS603 6 68855 68845 C 2011-02-03 2007-03-08 +S000001861 ORF Verified YFL033C RIM15 protein kinase RIM15|TAK1 chromosome 6 L000003524|L000003204 6 74427 69115 C 2011-02-03 1996-07-31 Protein kinase involved in cell proliferation in response to nutrients; glucose-repressible; involved in signal transduction during cell proliferation in response to nutrients, specifically the establishment of stationary phase; identified as a regulator of IME2; phosphorylates Igo1p and Igo2p; substrate of Pho80p-Pho85p kinase +S000032693 CDS YFL033C 6 74427 69115 C 2011-02-03 1996-07-31 +S000001862 ORF Dubious YFL032W chromosome 6 6 74872 75192 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene HAC1/YFL031W; YFL032W is not an essential gene +S000032655 CDS YFL032W 6 74872 75192 W 2011-02-03 1996-07-31 +S000001863 ORF Verified YFL031W HAC1 transcription factor HAC1|IRE15|ERN4 chromosome 6 L000002611 6 75179 76147 W 2011-02-03 2001-05-29|1996-07-31 Basic leucine zipper (bZIP) transcription factor (ATF/CREB1 homolog); regulates the unfolded protein response, via UPRE binding, and membrane biogenesis; ER stress-induced splicing pathway facilitates efficient Hac1p synthesis; two functional forms of Hac1p are produced; translation initiation is repressed under non-stress conditions; protein abundance increases in response to DNA replication stress +S000031638 CDS YFL031W 6 75179 75839 W 2011-02-03 2001-05-29|1996-07-31 +S000031639 CDS YFL031W 6 76092 76147 W 2011-02-03 2001-05-29 +S000031640 intron YFL031W 6 75840 76091 W 2011-02-03 2001-05-29 +S000028629 ORF Dubious YFL031C-A YFL030C-A chromosome 6 6 76115 76014 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps HAC1/YFL031W; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000031489 CDS YFL031C-A 6 76115 76014 C 2011-02-03 2003-07-29 +S000001864 ORF Verified YFL030W AGX1 alanine--glyoxylate transaminase chromosome 6 6 76831 77988 W 2011-02-03 1996-07-31 Alanine:glyoxylate aminotransferase (AGT); catalyzes the synthesis of glycine from glyoxylate, which is one of three pathways for glycine biosynthesis in yeast; similar to mammalian and plant alanine:glyoxylate aminotransferases; human homolog AGXT complements yeast null mutant +S000031544 CDS YFL030W 6 76831 77988 W 2011-02-03 1996-07-31 +S000001865 ORF Verified YFL029C CAK1 cyclin-dependent protein kinase-activating kinase CAK1|CIV1 chromosome 6 L000003177 6 79161 78055 C 2011-02-03 1996-07-31 Cyclin-dependent kinase-activating kinase; required for passage through the cell cycle; phosphorylates and activates Cdc28p; nucleotide-binding pocket differs significantly from those of most other protein kinases +S000031499 CDS YFL029C 6 79161 78055 C 2011-02-03 1996-07-31 +S000001866 ORF Verified YFL028C CAF16 putative ATP-binding cassette family ATPase CAF16 chromosome 6 L000003418 6 80213 79344 C 2011-02-03 1996-07-31 Part of evolutionarily-conserved CCR4-NOT regulatory complex; contains single ABC-type ATPase domain but no transmembrane domain; interacts with several subunits of Mediator +S000030636 CDS YFL028C 6 80213 79344 C 2011-02-03 1996-07-31 +S000001867 ORF Verified YFL027C GYP8 chromosome 6 6 81912 80419 C 2011-02-03 1996-07-31 GTPase-activating protein for yeast Rab family members; Ypt1p is the preferred in vitro substrate but also acts on Sec4p, Ypt31p and Ypt32p; involved in the regulation of ER to Golgi vesicle transport +S000030523 CDS YFL027C 6 81912 80419 C 2011-02-03 1996-07-31 +S000001868 ORF Verified YFL026W STE2 alpha-factor pheromone receptor STE2 chromosome 6 L000002112 6 82580 83875 W -37 2011-02-03 1996-07-31|2011-02-03 Receptor for alpha-factor pheromone; seven transmembrane-domain GPCR that interacts with both pheromone and a heterotrimeric G protein to initiate the signaling response that leads to mating between haploid a and alpha cells +S000030488 CDS YFL026W 6 82580 83875 W 2011-02-03 1996-07-31|2011-02-03 +S000001869 ORF Verified YFL025C BST1 PER17 chromosome 6 L000004294 6 87234 84145 C 2011-02-03 1996-07-31 GPI inositol deacylase of the endoplasmic reticulum (ER); negatively regulates COPII vesicle formation; prevents production of vesicles with defective subunits; required for proper discrimination between resident ER proteins and Golgi-bound cargo molecules; functional ortholog of human PGAP1, mutation of which is associated with intellectual disability and encephalopathy +S000037627 CDS YFL025C 6 87234 84145 C 2011-02-03 1996-07-31 +S000001870 ORF Verified YFL024C EPL1 chromosome 6 L000004576 6 90345 87847 C 2011-02-03 1996-07-31 Subunit of NuA4, an essential histone H4/H2A acetyltransferase complex; conserved region at N-terminus is essential for interaction with the NPC (nucleosome core particle); required for autophagy; homologous to Drosophila Enhancer of Polycomb; coding sequence contains length polymorphisms in different strains +S000037484 CDS YFL024C 6 90345 87847 C 2011-02-03 1996-07-31 +S000001871 ORF Verified YFL023W BUD27 URI1 chromosome 6 S000007647 6 90986 93376 W 2011-02-03 1996-07-31 Unconventional prefoldin protein involved in translation initiation; required for correct assembly of RNAP I, II, and III in an Rpb5p-dependent manner; shuttles between nucleus and cytoplasm; mutants have inappropriate expression of nutrient sensitive genes due to translational derepression of Gcn4p transcription factor; diploid mutants show random budding; ortholog of human URI/RMP +S000037447 CDS YFL023W 6 90986 93376 W 2011-02-03 1996-07-31 +S000001872 ORF Verified YFL022C FRS2 phenylalanine--tRNA ligase subunit alpha chromosome 6 L000000630 6 95010 93499 C 2011-02-03 1996-07-31|2011-02-03 Alpha subunit of cytoplasmic phenylalanyl-tRNA synthetase; forms a tetramer with Frs1p to form active enzyme; evolutionarily distant from mitochondrial phenylalanyl-tRNA synthetase based on protein sequence, but substrate binding is similar +S000036666 CDS YFL022C 6 95010 93499 C 2011-02-03 1996-07-31|2011-02-03 +S000001873 ORF Verified YFL021W GAT1 MEP80|NIL1 chromosome 6 L000002835 6 95966 97498 W 2011-02-03 1996-07-31 Transcriptional activator of nitrogen catabolite repression genes; contains a GATA-1-type zinc finger DNA-binding motif; activity and localization regulated by nitrogen limitation and Ure2p; different translational starts produce two major and two minor isoforms that are differentially regulated and localized +S000036630 CDS YFL021W 6 95966 97498 W 2011-02-03 1996-07-31 +S000028766 ORF Dubious YFL021C-A chromosome 6 6 96615 95761 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF GAT1/YFL021W +S000033470 CDS YFL021C-A 6 96615 95761 C 2011-02-03 2003-07-29 +S000001874 ORF Verified YFL020C PAU5 seripauperin PAU5 chromosome 6 L000002815 6 99599 99231 C 2011-02-03 1996-07-31 Member of the seripauperin multigene family; encoded mainly in subtelomeric regions; induced during alcoholic fermentation; induced by low temperature and also by anaerobic conditions; negatively regulated by oxygen and repressed by heme +S000036468 CDS YFL020C 6 99599 99231 C 2011-02-03 1996-07-31 +S000006924 long_terminal_repeat YFLWdelta1 chromosome 6 6 100581 100901 W 2011-02-03 2000-05-19 Ty1 LTR +S000001875 ORF Dubious YFL019C chromosome 6 6 100605 100252 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YFL019C is not an essential gene +S000035776 CDS YFL019C 6 100605 100252 C 2011-02-03 1996-07-31 +S000006681 tRNA_gene tP(UGG)F SUF9 chromosome 6 L000002157|L000003809 6 101376 101478 W -13 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in proline codons +S000035980 intron tP(UGG)F 6 101412 101442 W 2011-02-03 2000-05-19 +S000035978 noncoding_exon tP(UGG)F 6 101376 101411 W 2011-02-03 2000-05-19 +S000035979 noncoding_exon tP(UGG)F 6 101443 101478 W 2011-02-03 2000-05-19 +S000001876 ORF Verified YFL018C LPD1 dihydrolipoyl dehydrogenase|HPD1 chromosome 6 L000000951 6 103127 101628 C 2011-02-03 1996-07-31 Dihydrolipoamide dehydrogenase; the lipoamide dehydrogenase component (E3) of the pyruvate dehydrogenase and 2-oxoglutarate dehydrogenase multi-enzyme complexes; PDH complex is concentrated in spots within the mitochondrial matrix, often near the ERMES complex and near peroxisomes; LPD1 has a paralog, IRC15, that arose from the whole genome duplication +S000035657 CDS YFL018C 6 103127 101628 C 2011-02-03 1996-07-31 +S000002965 ORF Verified YFL017W-A SMX2 mRNA splicing protein SMX2|Sm G|SmG|YFL018W-A|SNP2 chromosome 6 L000001955 6 103699 103932 W 2011-02-03 1996-07-31 Core Sm protein Sm G; part of heteroheptameric complex (with Smb1p, Smd1p, Smd2p, Smd3p, Sme1p, and Smx3p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; homolog of human Sm G +S000037748 CDS YFL017W-A 6 103699 103932 W 2011-02-03 1996-07-31 +S000001877 ORF Verified YFL017C GNA1 glucosamine 6-phosphate N-acetyltransferase|PAT1 chromosome 6 L000004865 6 104462 103983 C 2011-02-03 1996-07-31 Glucosamine-6-phosphate acetyltransferase; evolutionarily conserved; required for multiple cell cycle events including passage through START, DNA synthesis, and mitosis; involved in UDP-N-acetylglucosamine synthesis, forms GlcNAc6P from AcCoA +S000035587 CDS YFL017C 6 104462 103983 C 2011-02-03 1996-07-31 +S000178095 ARS ARS603.1 chromosome 6 6 104463 104701 2014-11-18 2014-11-18 Very weak autonomously replicating sequence +S000001878 ORF Verified YFL016C MDJ1 chromosome 6 L000001048 6 106236 104701 C 2011-02-03 1996-07-31 Co-chaperone that stimulates HSP70 protein Ssc1p ATPase activity; involved in protein folding/refolding in the mitochodrial matrix; required for proteolysis of misfolded proteins; member of the HSP40 (DnaJ) family of chaperones +S000035478 CDS YFL016C 6 106236 104701 C 2011-02-03 1996-07-31 +S000028765 ORF Dubious YFL015W-A chromosome 6 6 106415 106732 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF YFL015C +S000033469 CDS YFL015W-A 6 106415 106732 W 2011-02-03 2003-07-29 +S000001879 ORF Dubious YFL015C chromosome 6 6 106963 106469 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious ORF YFL015W-A; YFL015C is not an essential gene +S000034451 CDS YFL015C 6 106963 106469 C 2011-02-03 1996-07-31 +S000001880 ORF Verified YFL014W HSP12 lipid-binding protein HSP12|HOR5|GLP1 chromosome 6 L000000816 6 107256 107585 W 2011-02-03 1996-07-31 Plasma membrane protein involved in maintaining membrane organization; involved in maintaining organization during stress conditions; induced by heat shock, oxidative stress, osmostress, stationary phase, glucose depletion, oleate and alcohol; protein abundance increased in response to DNA replication stress and dietary restriction; regulated by the HOG and Ras-Pka pathways; required for dietary restriction-induced lifespan extension +S000034418 CDS YFL014W 6 107256 107585 W 2011-02-03 1996-07-31 +S000028628 ORF Dubious YFL013W-A chromosome 6 6 107799 108602 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps IES1/YFL013C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000031487 CDS YFL013W-A 6 107799 108602 W 2011-02-03 2003-07-29 +S000002964 ORF Dubious YFL012W-A YFL013W-A chromosome 6 6 109810 110184 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene IES1/YFL013C +S000029905 CDS YFL012W-A 6 109810 110184 W 2011-02-03 1996-07-31 +S000001881 ORF Verified YFL013C IES1 chromosome 6 6 109930 107852 C 2011-02-03 1996-07-31 Subunit of the INO80 chromatin remodeling complex; relocalizes to the cytosol in response to hypoxia +S000034280 CDS YFL013C 6 109930 107852 C 2011-02-03 1996-07-31 +S000001882 ORF Uncharacterized YFL012W chromosome 6 6 110647 111093 W 2011-02-03 1996-07-31 Putative protein of unknown function; transcribed during sporulation; null mutant exhibits increased resistance to rapamycin +S000033440 CDS YFL012W 6 110647 111093 W 2011-02-03 1996-07-31 +S000001883 ORF Verified YFL011W HXT10 hexose transporter HXT10 chromosome 6 L000000844 6 112345 113985 W 2011-02-03 1996-07-31 Putative hexose transporter; expressed at low levels and expression is repressed by glucose +S000033350 CDS YFL011W 6 112345 113985 W 2011-02-03 1996-07-31 +S000001955 ORF Verified YFL010W-A AUA1 YFL011W-A chromosome 6 L000000156 6 114990 115274 W 2011-02-03 1999-07-17 Protein required for the negative regulation by ammonia of Gap1p; Gap1p is a general amino acid permease +S000031553 CDS YFL010W-A 6 114990 115274 W 2011-02-03 1999-07-17 +S000001884 ORF Verified YFL010C WWM1 chromosome 6 6 115743 115108 C 2011-02-03 1996-07-31 WW domain containing protein of unknown function; binds to Mca1p, a caspase-related protease that regulates H2O2-induced apoptosis; overexpression causes G1 phase growth arrest and clonal death that is suppressed by overexpression of MCA1 +S000033237 CDS YFL010C 6 115743 115108 C 2011-02-03 1996-07-31 +S000001885 ORF Verified YFL009W CDC4 SCF ubiquitin ligase complex subunit CDC4 chromosome 6 L000000244 6 116145 118484 W -9 2011-02-03 1996-07-31 F-box protein required for both the G1/S and G2/M phase transitions; modular substrate specificity factor which associates with core SCF (Cdc53p, Skp1p and Hrt1p/Rbx1p) to form the SCFCdc4 complex; SCFCdc4 acts as a ubiquitin-protein ligase directing ubiquitination of cyclin-dependent kinase (CDK) phosphorylated substrates, such as: Sic1p, Far1p, Cdc6p, Clb6p, and Cln3p +S000032546 CDS YFL009W 6 116145 118484 W 2011-02-03 1996-07-31 +S000007645 ARS ARS603.5 ARS603.5 chromosome 6 6 118637 118957 2011-02-03 2001-03-15 Autonomously replicating sequence on Chromosome VI; activated early in S phase in ~50% of cell cycles +S000121270 ARS_consensus_sequence ARS603.5 6 118688 118678 C 2011-02-03 2007-03-08 +S000001886 ORF Verified YFL008W SMC1 cohesin subunit SMC1|CHL10 chromosome 6 L000001926 6 119429 123106 W -10 2011-02-03 1996-07-31 Subunit of the multiprotein cohesin complex; essential protein involved in chromosome segregation and in double-strand DNA break repair; SMC chromosomal ATPase family member, binds DNA with a preference for DNA with secondary structure +S000032447 CDS YFL008W 6 119429 123106 W 2011-02-03 1996-07-31 +S000001887 ORF Verified YFL007W BLM10 YFL006W chromosome 6 S000007437 6 123479 129910 W 2011-02-03 2003-09-26|1996-07-31 Proteasome activator; binds the core proteasome (CP) and stimulates proteasome-mediated protein degradation by inducing gate opening; required for sequestering CP into proteasome storage granule (PSG) during quiescent phase and for nuclear import of CP in proliferating cells; required for resistance to bleomycin, may be involved in protecting against oxidative damage; similar to mammalian PA200 +S000031431 CDS YFL007W 6 123479 129910 W 2011-02-03 2003-09-26|1996-07-31 +S000007636 ARS ARS604 ARS604 chromosome 6 6 127751 128071 2011-02-03 2001-03-02 Extremely inefficient ARS on Chromosome VI +S000121271 ARS_consensus_sequence ARS604 6 127869 127879 W 2011-02-03 2007-03-08 +S000001889 ORF Verified YFL005W SEC4 Rab family GTPase SEC4|SRO6 chromosome 6 L000001830 6 130334 130981 W -6 2011-02-03 1996-07-31 Rab family GTPase; essential for vesicle-mediated exocytic secretion and autophagy; associates with the exocyst component Sec15p and may regulate polarized delivery of transport vesicles to the exocyst at the plasma membrane +S000031208 CDS YFL005W 6 130334 130981 W 2011-02-03 1996-07-31 +S000130127 ncRNA_gene RUF20 RUF20 chromosome 6 6 131503 131061 C 2011-02-03 2009-05-04 RNA of Unknown Function +S000130128 noncoding_exon RUF20 6 131503 131061 C 2011-02-03 2009-05-04 +S000001890 ORF Verified YFL004W VTC2 vacuolar transporter chaperone|PHM1 chromosome 6 S000007511 6 131810 134296 W 2011-02-03 1996-07-31 Regulatory subunit of the vacuolar transporter chaperone (VTC) complex; involved in membrane trafficking, vacuolar polyphosphate accumulation, microautophagy and non-autophagic vacuolar fusion; VTC2 has a paralog, VTC3, that arose from the whole genome duplication +S000031094 CDS YFL004W 6 131810 134296 W 2011-02-03 1996-07-31 +S000007637 ARS ARS605 ARS605 chromosome 6 6 135985 136085 2011-02-03 2001-03-02 Autonomously replicating sequence on Chromosome VI; activated early in S phase in ~27% of cell cycles; inactive during premeiotic S phase +S000121274 ARS_consensus_sequence ARS605 6 136047 136037 C 2011-02-03 2007-03-08 +S000001891 ORF Verified YFL003C MSH4 MutS family protein MSH4 chromosome 6 L000001192 6 137157 134521 C 2011-02-03 1996-07-31 Protein involved in meiotic recombination; required for normal levels of crossing over, colocalizes with Zip2p to discrete foci on meiotic chromosomes, has homology to bacterial MutS protein +S000030006 CDS YFL003C 6 137157 134521 C 2011-02-03 1996-07-31 +S000006669 tRNA_gene tN(GUU)F chromosome 6 L000003818 6 137559 137486 C 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000030707 noncoding_exon tN(GUU)F 6 137559 137486 C 2011-02-03 2000-05-19 +S000006925 long_terminal_repeat YFLWdelta2 chromosome 6 6 137663 137912 W 2011-02-03 2000-05-19 Ty1 LTR +S000006926 long_terminal_repeat YFLWdelta3 chromosome 6 6 137913 138240 W 2011-02-03 2000-05-19 Ty2 LTR +S000006930 LTR_retrotransposon YFLWTy2-1 Ty2 chromosome 6 6 137913 143871 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007404 transposable_element_gene YFL002W-B gag protein chromosome 6 6 138204 139520 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000031732 CDS YFL002W-B 6 138204 139520 W 2011-02-03 1999-07-17 +S000002962 transposable_element_gene YFL002W-A gag-pol fusion protein chromosome 6 6 138204 143517 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000031719 CDS YFL002W-A 6 138204 139496 W 2011-02-03 1999-07-17 +S000031720 CDS YFL002W-A 6 139498 143517 W 2011-02-03 1999-07-17 +S000031721 plus_1_translational_frameshift YFL002W-A 6 139497 139497 W 2011-02-03 1999-07-17 +S000006927 long_terminal_repeat YFLWdelta4 chromosome 6 6 143540 143871 W 2011-02-03 2000-05-19 Ty2 LTR +S000006928 long_terminal_repeat YFLWdelta5 chromosome 6 6 143872 143947 W 2011-02-03 2000-05-19 Ty1 LTR +S000006929 long_terminal_repeat YFLWtau1 chromosome 6 6 144203 144523 W 2011-02-03 2000-05-19 Ty4 LTR +S000006923 long_terminal_repeat YFLCdelta6 chromosome 6 6 144822 144524 C 2011-02-03 2000-05-19 Ty1 LTR +S000001894 ORF Verified YFL002C SPB4 putative ATP-dependent RNA helicase SPB4 chromosome 6 L000001991 6 146934 145114 C 2011-02-03 1996-07-31 Putative ATP-dependent RNA helicase; nucleolar protein required for synthesis of 60S ribosomal subunits at a late step in the pathway; sediments with 66S pre-ribosomes in sucrose gradients +S000029891 CDS YFL002C 6 146934 145114 C 2011-02-03 1996-07-31 +S000001895 ORF Verified YFL001W DEG1 pseudouridine synthase DEG1|HRM3|PUS3 chromosome 6 L000000501 6 147131 148459 W -1 2011-02-03 1996-07-31 tRNA:pseudouridine synthase; introduces pseudouridines at position 38 or 39 in tRNA; also responsible for pseudouracil modification of some mRNAs; important for maintenance of translation efficiency and normal cell growth, localizes to both the nucleus and cytoplasm; non-essential for viability +S000037314 CDS YFL001W 6 147131 148459 W 2011-02-03 1996-07-31 +S000001896 centromere CEN6 CEN6 chromosome 6 L000000299 6 148510 148627 W 0 2011-02-03 2000-05-19|2006-05-08 Chromosome VI centromere +S000077272 centromere_DNA_Element_I CEN6 6 148510 148519 W 2011-02-03 2004-10-04 +S000077273 centromere_DNA_Element_II CEN6 6 148520 148602 W 2011-02-03 2004-10-04 +S000077274 centromere_DNA_Element_III CEN6 6 148603 148627 W 2011-02-03 2004-10-04 +S000001897 ORF Verified YFR001W LOC1 chromosome 6 6 149110 149724 W 2011-02-03 1996-07-31 Nuclear protein involved in asymmetric localization of ASH1 mRNA; binds double-stranded RNA in vitro; constituent of 66S pre-ribosomal particles; required at post-transcriptional step for efficient retrotransposition; absence results in decreased Ty1 Gag:GFP protein levels; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000033165 CDS YFR001W 6 149110 149724 W 2011-02-03 1996-07-31 +S000001898 ORF Verified YFR002W NIC96 linker nucleoporin NIC96 chromosome 6 L000001250 6 150016 152535 W 2011-02-03 1996-07-31 Linker nucleoporin component of the nuclear pore complex (NPC); also part of the NPC nuclear basket; contributes to nucleocytoplasmic transport and NPC biogenesis; forms stable associations with three FG-nucleoporins (Nsp1p, Nup57p, and Nup49p) +S000033226 CDS YFR002W 6 150016 152535 W 2011-02-03 1996-07-31 +S000001899 ORF Verified YFR003C YPI1 type 1 protein phosphatase-activating protein YPI1 chromosome 6 6 153124 152657 C 2011-02-03 1996-07-31 Regulatory subunit of the type I protein phosphatase (PP1) Glc7p; Glc7p participates in the regulation of a variety of metabolic processes including mitosis and glycogen metabolism; in vitro evidence suggests Ypi1p is an inhibitor of Glc7p while in vivo evidence suggests it is an activator; overproduction causes decreased cellular content of glycogen; partial depletion causes lithium sensitivity, while overproduction confers lithium-tolerance +S000033251 CDS YFR003C 6 153124 152657 C 2011-02-03 1996-07-31 +S000001900 ORF Verified YFR004W RPN11 proteasome regulatory particle lid subunit RPN11|MPR1 chromosome 6 L000002976|L000002965 6 153393 154313 W 2011-02-03 1996-07-31 Metalloprotease subunit of 19S regulatory particle; part of 26S proteasome lid; couples the deubiquitination and degradation of proteasome substrates; involved, independent of catalytic activity, in fission of mitochondria and peroxisomes; protein abundance increases in response to DNA replication stress +S000034135 CDS YFR004W 6 153393 154313 W 2011-02-03 1996-07-31 +S000001901 ORF Verified YFR005C SAD1 mRNA splicing protein SAD1 chromosome 6 L000001795 6 155873 154527 C 2011-02-03 1996-07-31 Conserved zinc-finger domain protein involved in pre-mRNA splicing; critical for splicing of nearly all intron-containing genes; required for assembly of U4 snRNA into the U4/U6 particle +S000034191 CDS YFR005C 6 155873 154527 C 2011-02-03 1996-07-31 +S000001902 ORF Uncharacterized YFR006W putative Xaa-Pro dipeptidase chromosome 6 6 156145 157752 W 2011-02-03 1996-07-31 Putative X-Pro aminopeptidase; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YFR006W is not an essential gene +S000034389 CDS YFR006W 6 156145 157752 W 2011-02-03 1996-07-31 +S000006564 tRNA_gene tF(GAA)F chromosome 6 L000003817 6 158007 157916 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035384 intron tF(GAA)F 6 157970 157952 C 2011-02-03 2000-05-19 +S000035383 noncoding_exon tF(GAA)F 6 157951 157916 C 2011-02-03 2000-05-19 +S000035382 noncoding_exon tF(GAA)F 6 158007 157971 C 2011-02-03 2000-05-19 +S000006933 long_terminal_repeat YFRWdelta7 chromosome 6 6 158376 158686 W 2011-02-03 2000-05-19 Ty1 LTR +S000001903 ORF Verified YFR007W YFH7 AIM12 chromosome 6 6 159299 160360 W 2011-02-03 1996-07-31 Putative kinase with similarity to the PRK/URK/PANK kinase subfamily; the PRK/URK/PANK subfamily of P-loop kinases is also known as phosphoribulokinase/uridine kinase/bacterial pantothenate kinase +S000035412 CDS YFR007W 6 159299 160360 W 2011-02-03 1996-07-31 +S000001904 ORF Verified YFR008W FAR7 chromosome 6 6 160535 161200 W 2011-02-03 1996-07-31 Protein involved in recovery from pheromone-induced cell cycle arrest; acts in a Far1p-independent pathway; interacts with Far3p, Far8p, Far9p, Far10p, and Far11p; protein abundance increases in response to DNA replication stress +S000035513 CDS YFR008W 6 160535 161200 W 2011-02-03 1996-07-31 +S000006931 long_terminal_repeat YFRCdelta8 chromosome 6 6 162135 161804 C 2011-02-03 2000-05-19 Ty1 LTR +S000006579 tRNA_gene tG(GCC)F1 SUF20 chromosome 6 L000002167|L000003810 6 162228 162298 W 6 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000031966 noncoding_exon tG(GCC)F1 6 162228 162298 W 2011-02-03 2000-05-19 +S000001905 ORF Verified YFR009W GCN20 putative AAA family ATPase GCN20 chromosome 6 L000000689 6 162488 164746 W 2011-02-03 1996-07-31 Positive regulator of the Gcn2p kinase activity; forms a complex with Gcn1p; proposed to stimulate Gcn2p activation by an uncharged tRNA +S000035605 CDS YFR009W 6 162488 164746 W 2011-02-03 1996-07-31 +S000028823 ORF Dubious YFR009W-A chromosome 6 6 163875 164132 W 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified gene YFR009W; identified by expression profiling and mass spectrometry +S000033643 CDS YFR009W-A 6 163875 164132 W 2011-02-03 2003-08-07|2003-07-29 +S000001906 ORF Verified YFR010W UBP6 ubiquitin-specific protease UBP6 chromosome 6 L000004586 6 165067 166566 W 2011-02-03 1996-07-31 Ubiquitin-specific protease; situated in the base subcomplex of the 26S proteasome, releases free ubiquitin from branched polyubiquitin chains en bloc, rather than from the distal tip of the chain; negatively regulates degradation of ubiquitinated proteins by the proteasome; works in opposition to Hul5p polyubiquitin elongation activity; mutant has aneuploidy tolerance; human homolog UBP14 complements yeast null mutant +S000037248 CDS YFR010W 6 165067 166566 W 2011-02-03 1996-07-31 +S000028824 ORF Dubious YFR010W-A chromosome 6 6 166728 166916 W 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene YFR011C; identified by expression profiling and mass spectrometry +S000033645 CDS YFR010W-A 6 166728 166916 W 2011-02-03 2003-08-07|2003-07-29 +S000001907 ORF Verified YFR011C MIC19 AIM13|MCS19 chromosome 6 6 167258 166746 C 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; Mic19p is peripheral to the inner membrane and may connect Mic60p with the Mic10p-Mic12p-Mic27p subcomplex; both yeast and human Mic19p become oxidized, and oxidation may regulate MICOS +S000037259 CDS YFR011C 6 167258 166746 C 2011-02-03 1996-07-31 +S000006779 tRNA_gene tY(GUA)F1 SUP11 chromosome 6 L000003811|L000002188 6 167437 167525 W 4 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000030879 intron tY(GUA)F1 6 167476 167489 W 2011-02-03 2000-05-19 +S000030877 noncoding_exon tY(GUA)F1 6 167437 167475 W 2011-02-03 2000-05-19 +S000030878 noncoding_exon tY(GUA)F1 6 167490 167525 W 2011-02-03 2000-05-19 +S000007638 ARS ARS606 ARS606 chromosome 6 6 167547 167801 2014-11-18 2001-03-06|2014-11-18 Highly-efficient autonomously replicating sequence on Chromosome VI; activated early in S phase in ~74% of cell cycles; replication capacity dependent upon Sum1p +S000121275 ARS_consensus_sequence ARS606 6 167736 167726 C 2011-02-03 2007-03-08 +S000001908 ORF Verified YFR012W DCV1 chromosome 6 6 167888 168496 W 2011-02-03 1996-07-31 Protein of unknown function; deletion mutant shows strong genetic interaction with cdc28-as1 mutant in the presence of 1-NM-PP1; DCV1 has a paralog, YOL019W, that arose from the whole genome duplication +S000037437 CDS YFR012W 6 167888 168496 W 2011-02-03 1996-07-31 +S000007606 ORF Uncharacterized YFR012W-A chromosome 6 6 169224 169310 W 2011-02-03 2001-02-26 Putative protein of unknown function; identified by homology +S000037183 CDS YFR012W-A 6 169224 169310 W 2011-02-03 2001-02-26 +S000001909 ORF Verified YFR013W IOC3 chromosome 6 6 169922 172285 W 2011-02-03 1996-07-31 Subunit of the Isw1a complex; Isw1a has nucleosome-stimulated ATPase activity and represses transcription initiation by specific positioning of a promoter proximal dinucleosome; promotes nucleosome shifts in the 5 prime direction; IOC3 has a paralog, ESC8, that arose from the whole genome duplication +S000037546 CDS YFR013W 6 169922 172285 W 2011-02-03 1996-07-31 +S000001910 ORF Verified YFR014C CMK1 calmodulin-dependent protein kinase CMK1 chromosome 6 L000000366 6 173877 172537 C 2011-02-03 1996-07-31|2011-02-03 Calmodulin-dependent protein kinase; may play a role in stress response, many Ca++/calmodulin dependent phosphorylation substrates demonstrated in vitro, amino acid sequence similar to mammalian Cam Kinase II; CMK1 has a paralog, CMK2, that arose from the whole genome duplication +S000030207 CDS YFR014C 6 173877 172537 C 2011-02-03 1996-07-31|2011-02-03 +S000001911 ORF Verified YFR015C GSY1 glycogen (starch) synthase GSY1 chromosome 6 L000000739 6 176391 174265 C 2011-02-03 1996-07-31 Glycogen synthase; expression induced by glucose limitation, nitrogen starvation, environmental stress, and entry into stationary phase; GSY1 has a paralog, GSY2, that arose from the whole genome duplication; relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000030390 CDS YFR015C 6 176391 174265 C 2011-02-03 1996-07-31 +S000001912 ORF Verified YFR016C chromosome 6 6 180743 177042 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and bud; interacts with Spa2p; YFR016C is not an essential gene +S000030514 CDS YFR016C 6 180743 177042 C 2011-02-03 1996-07-31 +S000006580 tRNA_gene tG(GCC)F2 chromosome 6 L000003816 6 181044 180974 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000031970 noncoding_exon tG(GCC)F2 6 181044 180974 C 2011-02-03 2000-05-19 +S000001913 ORF Verified YFR017C IGD1 chromosome 6 6 182861 182274 C 2011-02-03 1996-07-31 Cytoplasmic protein that inhibits Gdb1p glycogen debranching activity; required for normal intracellular accumulation of glycogen; phosphorylated in vivo; expression increases during wine fermentation; protein abundance increases in response to DNA replication stress; IGD1 has a paralog, YOL024W, that arose from the whole genome duplication +S000031438 CDS YFR017C 6 182861 182274 C 2011-02-03 1996-07-31 +S000001914 ORF Uncharacterized YFR018C chromosome 6 6 184222 183131 C 2011-02-03 1996-07-31 Putative protein of unknown function; SWAT-GFP and seamless GFP fusion proteins localize to the endoplasmic reticulum and mCherry fusion protein localizes to the vacuole +S000031539 CDS YFR018C 6 184222 183131 C 2011-02-03 1996-07-31 +S000001915 ORF Verified YFR019W FAB1 1-phosphatidylinositol-3-phosphate 5-kinase|SVL7 chromosome 6 L000000597 6 184502 191338 W 2011-02-03 1996-07-31|2011-02-03 1-phosphatidylinositol-3-phosphate 5-kinase; vacuolar membrane kinase that generates phosphatidylinositol (3,5)P2, which is involved in vacuolar sorting and homeostasis +S000032628 CDS YFR019W 6 184502 191338 W 2011-02-03 1996-07-31|2011-02-03 +S000006731 tRNA_gene tS(GCU)F chromosome 6 L000003815 6 191613 191513 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000037442 intron tS(GCU)F 6 191576 191558 C 2011-02-03 2000-05-19 +S000037441 noncoding_exon tS(GCU)F 6 191557 191513 C 2011-02-03 2000-05-19 +S000037440 noncoding_exon tS(GCU)F 6 191613 191577 C 2011-02-03 2000-05-19 +S000006932 long_terminal_repeat YFRCdelta9 chromosome 6 6 191854 191685 C 2011-02-03 2000-05-19 Ty1 LTR +S000001916 ORF Verified YFR020W CSS2 chromosome 6 6 192737 193435 W 2011-02-03 1996-07-31 Protein of unknown function, secreted when constitutively expressed; SWAT-GFP fusion protein localizes to the endoplasmic reticulum (ER) and extracellular region, while mCherry fusion protein localizes to the ER and vacuole; mRNA identified as translated by ribosome profiling data; CSS2 is a non-essential gene +S000031952 CDS YFR020W 6 192737 193435 W 2011-02-03 1996-07-31 +S000001917 ORF Verified YFR021W ATG18 phosphoinositide binding protein ATG18|SVP1|AUT10|CVT18|NMR1 chromosome 6 6 194812 196314 W 2011-02-03 1996-07-31 Phosphoinositide binding protein; required for vesicle formation in autophagy and the cytoplasm-to-vacuole targeting (Cvt) pathway; binds both phosphatidylinositol (3,5)-bisphosphate and phosphatidylinositol 3-phosphate; WD-40 repeat protein; relocalizes from vacuole to cytoplasm upon DNA replication stress; has 4 mammalian homologs WIPI1, WIPI2, WIPI3 and WIPI4/WDR45; mutations in human WDR45 cause static encephalopathy of childhood with neurodegeneration in adulthood +S000032840 CDS YFR021W 6 194812 196314 W 2011-02-03 1996-07-31 +S000001918 ORF Verified YFR022W ROG3 ART7 chromosome 6 6 196833 199034 W 2011-02-03 1996-07-31 Alpha-arrestin involved in ubiquitin-dependent endocytosis; contributes to desensitization of agonist-occupied alpha-factor receptor Ste2p by Rsp5p-independent internalization; PPXY motif-mediated binding of the ubiquitin ligase Rsp5p is not required for adaptation; mutation suppresses the temperature sensitivity of an mck1 rim11 double mutant; SWAT-GFP and mCherry fusion proteins localize to the cytosol; ROG3 has a paralog, ROD1, that arose from the whole genome duplication +S000032952 CDS YFR022W 6 196833 199034 W 2011-02-03 1996-07-31 +S000007639 ARS ARS607 ARS607 chromosome 6 6 199395 199505 2011-02-03 2001-03-06 Highly-efficient autonomously replicating sequence on Chromosome VI; activated very early in S phase in >85% of cell cycles +S000121276 ARS_consensus_sequence ARS607 6 199416 199426 W 2011-02-03 2007-03-08 +S000130131 ncRNA_gene RUF22 RUF22 chromosome 6 6 199813 199299 C 2011-02-03 2009-05-04 RNA of Unknown Function; precise location of 3' end uncertain; RUF22 may be longer than currently annotated +S000130132 noncoding_exon RUF22 6 199813 199299 C 2011-02-03 2009-05-04 +S000001919 ORF Verified YFR023W PES4 chromosome 6 L000001381 6 199874 201709 W 2011-02-03 1996-07-31 Poly(A) binding protein, suppressor of DNA polymerase epsilon mutation; PES4 has a paralog, MIP6, that arose from the whole genome duplication +S000033022 CDS YFR023W 6 199874 201709 W 2011-02-03 1996-07-31 +S000002968 ORF Verified YFR024C-A LSB3 YFR024C chromosome 6 6 203433 201960 C 2011-02-03 1996-07-31|2008-06-02 Protein containing a C-terminal SH3 domain; binds Las17p, which is a homolog of human Wiskott-Aldrich Syndrome protein involved in actin patch assembly and actin polymerization; protein abundance increases in response to DNA replication stress; LSB3 has a paralog, YSC84, that arose from the whole genome duplication +S000035055 CDS YFR024C-A 6 203292 201960 C 2011-02-03 1996-07-31|2008-06-02 +S000035054 CDS YFR024C-A 6 203433 203387 C 2011-02-03 1996-07-31 +S000035056 intron YFR024C-A 6 203386 203293 C 2011-02-03 1996-07-31|2008-06-02 +S000001921 ORF Verified YFR025C HIS2 histidinol-phosphatase chromosome 6 L000000779 6 204750 203743 C 32 2011-02-03 1996-07-31 Histidinolphosphatase; catalyzes the eighth step in histidine biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts; transcription is regulated by general amino acid control +S000033826 CDS YFR025C 6 204750 203743 C 2011-02-03 1996-07-31 +S000006511 tRNA_gene tA(AGC)F chromosome 6 L000003814 6 204996 204924 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032277 noncoding_exon tA(AGC)F 6 204996 204924 C 2011-02-03 2000-05-19 +S000001922 ORF Verified YFR026C ULI1 chromosome 6 6 206257 205748 C 2011-02-03 1996-07-31 Protein of unknown function; involved in and induced by the endoplasmic reticulum unfolded protein response (UPR); SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000033947 CDS YFR026C 6 206257 205748 C 2011-02-03 1996-07-31 +S000006934 long_terminal_repeat YFRWdelta10 chromosome 6 6 206922 207138 W 2011-02-03 2000-05-19 Ty1 LTR +S000001923 ORF Verified YFR027W ECO1 CTF7 chromosome 6 L000004789 6 207452 208297 W 2011-02-03 1996-07-31 Acetyltransferase; required for establishment of sister chromatid cohesion; acetylates Mps3p to regulate nuclear organization; modifies Smc3p at replication forks and Mcd1p in response to dsDNA breaks; phosphorylated by three kinases (Cdc28p, Cdc7p, Mck1p) to generate pair of phosphates spaced precisely for recognition by ubiquitin ligase SCF-Cdc4; mutations in human homolog ESCO2 cause Roberts syndrome; relative distribution to nucleus increases upon DNA replication stress +S000034947 CDS YFR027W 6 207452 208297 W 2011-02-03 1996-07-31 +S000001924 ORF Verified YFR028C CDC14 phosphoprotein phosphatase CDC14|OAF3 chromosome 6 L000000254 6 210068 208413 C 36 2011-02-03 1996-07-31 Protein phosphatase required for mitotic exit; required for rDNA segregation, cytokinesis, meiosis I spindle disassembly, environmental stress response; held in nucleolus by Cdc55p in early meiosis, liberated by FEAR and Mitotic Exit Network in anaphase, enabling it to effect a decrease in CDK/B-cyclin activity and mitotic exit; sequestered in metaphase II, released upon entry into anaphase II; human homolog CDC14A can complement thermosensitivity of yeast cdc14-1 mutant +S000035011 CDS YFR028C 6 210068 208413 C 2011-02-03 1996-07-31 +S000006780 tRNA_gene tY(GUA)F2 SUP6 chromosome 6 L000003813|L000002185 6 210707 210619 C 38 2011-02-03 2000-05-19 Tyrosine tRNA (tRNA-Tyr), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000030888 intron tY(GUA)F2 6 210668 210655 C 2011-02-03 2000-05-19 +S000030887 noncoding_exon tY(GUA)F2 6 210654 210619 C 2011-02-03 2000-05-19 +S000030886 noncoding_exon tY(GUA)F2 6 210707 210669 C 2011-02-03 2000-05-19 +S000001925 ORF Verified YFR029W PTR3 RAA2|SSY3 chromosome 6 L000003185|L000003493|S000029400|L000001554 6 210937 212973 W 46 2011-02-03 1996-07-31 Component of the SPS plasma membrane amino acid sensor system; senses external amino acid concentration and transmits intracellular signals that result in regulation of expression of amino acid permease genes; other members are Ssy1p, Ptr3p, and Ssy5p +S000035279 CDS YFR029W 6 210937 212973 W 2011-02-03 1996-07-31 +S000001926 ORF Verified YFR030W MET10 sulfite reductase subunit alpha chromosome 6 L000001084 6 213312 216419 W 41 2011-02-03 1996-07-31 Subunit alpha of assimilatory sulfite reductase; complex converts sulfite into sulfide +S000037036 CDS YFR030W 6 213312 216419 W 2011-02-03 1996-07-31 +S000007640 ARS ARS608 ARS608 chromosome 6 6 216357 216704 2011-02-03 2001-03-06 Extremely inefficient autonomously replicating sequence on Chr VI; activated early in S phase in <10% of cell cycles +S000121280 ARS_consensus_sequence ARS608 6 216484 216494 W 2011-02-03 2007-03-08 +S000001927 ORF Verified YFR031C SMC2 condensin subunit SMC2 chromosome 6 L000001927 6 220106 216594 C 2011-02-03 1996-07-31|2011-02-03 Subunit of the condensin complex; condensin reorganizes chromosomes during both mitosis and meiosis; essential SMC chromosomal ATPase family member that forms a subcomplex with Smc2p that has ATP-hydrolyzing and DNA-binding activity, but other condensin subunits are required for chromatin binding; required for clustering of tRNA genes at the nucleolus +S000037057 CDS YFR031C 6 220106 216594 C 2011-02-03 1996-07-31|2011-02-03 +S000002104 ORF Verified YFR031C-A RPL2A uL2|ribosomal 60S subunit protein L2A|L2|rp8|YL6|L5A|L2A|RPL5B chromosome 6 L000003147 6 221418 220507 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L2A; homologous to mammalian ribosomal protein L2 and bacterial L2; RPL2A has a paralog, RPL2B, that arose from the whole genome duplication +S000032329 CDS YFR031C-A 6 221267 220507 C 2011-02-03 1996-07-31 +S000032328 CDS YFR031C-A 6 221418 221415 C 2011-02-03 1996-07-31 +S000032330 intron YFR031C-A 6 221414 221268 C 2011-02-03 1996-07-31 +S000130133 ncRNA_gene RUF23 RUF23 chromosome 6 6 221714 221967 W 2011-02-03 2009-05-04 RNA of Unknown Function; precise location of 3' end uncertain; RUF23 may be longer than currently annotated +S000130134 noncoding_exon RUF23 6 221714 221967 W 2011-02-03 2009-05-04 +S000001928 ORF Uncharacterized YFR032C RRT5 chromosome 6 6 222959 222090 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; expressed at high levels during sporulation +S000037177 CDS YFR032C 6 222959 222090 C 2011-02-03 1996-07-31 +S000006437 ORF Verified YFR032C-A RPL29 eL29|ribosomal 60S subunit protein L29|L29e|YL43|L29 chromosome 6 L000004514 6 223437 223258 C 2011-02-03 1999-07-17 Ribosomal 60S subunit protein L29; not essential for translation, but required for proper joining of large and small ribosomal subunits and for normal translation rate; homologous to mammalian ribosomal protein L29, no bacterial homolog +S000034020 CDS YFR032C-A 6 223437 223258 C 2011-02-03 1999-07-17 +S000122098 five_prime_UTR_intron YFR032C-A 6 223771 223441 C 2011-02-03 2007-04-04 +S000028630 ORF Uncharacterized YFR032C-B chromosome 6 6 223973 223710 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032386 CDS YFR032C-B 6 223973 223710 C 2011-02-03 2003-07-29 +S000001929 ORF Verified YFR033C QCR6 ubiquinol--cytochrome-c reductase subunit 6|UCR6|COR3 chromosome 6 L000001546 6 224769 224326 C 2011-02-03 1996-07-31 Subunit 6 of the ubiquinol cytochrome-c reductase complex; the complex, also known as the cytochrome bc(1) complex or Complex III, is a component of the mitochondrial inner membrane electron transport chain; highly acidic protein; required for maturation of cytochrome c1; may be loosely associated with the complex since it is easily released into the intermembrane space +S000037271 CDS YFR033C 6 224769 224326 C 2011-02-03 1996-07-31 +S000001930 ORF Verified YFR034C PHO4 phosphate-sensing transcription factor PHO4|phoD chromosome 6 L000001420 6 225958 225020 C 47 2011-02-03 1996-07-31 Basic helix-loop-helix (bHLH) transcription factor of the myc-family; activates transcription cooperatively with Pho2p in response to phosphate limitation; binding to 'CACGTG' motif is regulated by chromatin restriction, competitive binding of Cbf1p to the same DNA binding motif and cooperation with Pho2p; function is regulated by phosphorylation at multiple sites and by phosphate availability +S000029931 CDS YFR034C 6 225958 225020 C 2011-02-03 1996-07-31 +S000028631 ORF Dubious YFR034W-A chromosome 6 6 226022 226309 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps YFR035C; identified by gene-trapping, microarray expression analysis, and genome-wide homology searching +S000032387 CDS YFR034W-A 6 226022 226309 W 2011-02-03 2003-07-29 +S000001931 ORF Uncharacterized YFR035C chromosome 6 6 226465 226121 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant exhibits synthetic phenotype with alpha-synuclein +S000030041 CDS YFR035C 6 226465 226121 C 2011-02-03 1996-07-31 +S000006620 tRNA_gene tK(CUU)F chromosome 6 L000003812 6 226760 226688 C 2011-02-03 2000-05-19|2011-02-03 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000036006 noncoding_exon tK(CUU)F 6 226760 226688 C 2011-02-03 2000-05-19|2011-02-03 +S000001932 ORF Verified YFR036W CDC26 anaphase promoting complex subunit CDC26|SCD26|HIT3 chromosome 6 L000000265|L000001809 6 226963 227337 W 52 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); which is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition; relocalizes to the cytosol in response to hypoxia +S000031122 CDS YFR036W 6 226963 227337 W 2011-02-03 1996-07-31 +S000028767 ORF Dubious YFR036W-A chromosome 6 6 227451 228101 W 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps verified ORF RSC8/YFR037C +S000033471 CDS YFR036W-A 6 227451 228101 W 2011-02-03 2003-08-07|2003-07-29 +S000001933 ORF Verified YFR037C RSC8 SWH3 chromosome 6 L000003458|L000003393 6 229186 227513 C 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; essential for viability and mitotic growth; homolog of SWI/SNF subunit Swi3p, but unlike Swi3p, does not activate transcription of reporters +S000031163 CDS YFR037C 6 229186 227513 C 2011-02-03 1996-07-31 +S000001934 ORF Verified YFR038W IRC5 putative ATPase chromosome 6 6 229380 231941 W 2011-02-03 2004-02-05|1996-07-31 Putative ATPase containing the DEAD/H helicase-related sequence motif; null mutant displays increased levels of spontaneous Rad52p foci; SWAT-GFP and mCherry fusion proteins localize to the nucleus +S000031348 CDS YFR038W 6 229380 231941 W 2011-02-03 2004-02-05|1996-07-31 +S000001935 ORF Verified YFR039C OSW7 chromosome 6 6 233544 232012 C 2011-02-03 1996-07-31 Protein involved in outer spore wall assembly; likely involved directly in dityrosine layer assembly; may be involved in response to high salt and changes in carbon source; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; deletion mutant has decreased spore survival in Drosophila feces; OSW7 has a paralog, SHE10, that arose from the whole genome duplication; paralogs are redundant for spore wall dityrosine assembly +S000031395 CDS YFR039C 6 233544 232012 C 2011-02-03 1996-07-31 +S000001936 ORF Verified YFR040W SAP155 chromosome 6 L000002598 6 234242 237250 W 2011-02-03 2003-09-26|1996-07-31|2011-02-03 Protein required for function of the Sit4p protein phosphatase; forms a complex with Sit4p; member of a family of similar proteins including Sap4p, Sap185p, and Sap190p; protein abundance increases in response to DNA replication stress; SAP155 has a paralog, SAP4, that arose from the whole genome duplication +S000032382 CDS YFR040W 6 234242 237250 W 2011-02-03 2003-09-26|1996-07-31|2011-02-03 +S000001937 ORF Verified YFR041C ERJ5 chromosome 6 6 238255 237368 C 2011-02-03 1996-07-31 Type I membrane protein with a J domain; required to preserve the folding capacity of the endoplasmic reticulum; loss of the non-essential ERJ5 gene leads to a constitutively induced unfolded protein response +S000032446 CDS YFR041C 6 238255 237368 C 2011-02-03 1996-07-31 +S000001938 ORF Verified YFR042W KEG1 chromosome 6 6 238458 239060 W 2011-02-03 1996-07-31 Integral membrane protein of the ER; physically interacts with Kre6p; has a role in the synthesis of beta-1,6-glucan in the cell wall; required for cell viability +S000033287 CDS YFR042W 6 238458 239060 W 2011-02-03 1996-07-31 +S000001939 ORF Verified YFR043C IRC6 chromosome 6 6 239827 239114 C 2011-02-03 1996-07-31 Clathrin coat accessory factor; involved in clathrin-mediated vesicle trafficking; may function to link the AP-1 clathrin adaptor complex with the Rab GTPase Ypt31p; has structural similarity to G-proteins; mouse homolog Aagab (p34) functionally complements irc6 null mutation; null mutant displays increased levels of spontaneous Rad52p foci +S000033328 CDS YFR043C 6 239827 239114 C 2011-02-03 1996-07-31 +S000001940 ORF Verified YFR044C DUG1 metallodipeptidase chromosome 6 6 241437 239992 C 2011-02-03 1996-07-31 Cys-Gly metallo-di-peptidase; forms a complex with Dug2p and Dug3p to degrade glutathione (GSH) and other peptides containing a gamma-glu-X bond in an alternative pathway to GSH degradation by gamma-glutamyl transpeptidase (Ecm38p); human homolog CNDP2 can complement yeast dug1 mutant +S000033403 CDS YFR044C 6 241437 239992 C 2011-02-03 1996-07-31 +S000001941 ORF Uncharacterized YFR045W chromosome 6 6 241998 242999 W 2011-02-03 2004-02-05|2007-04-04|1996-07-31 Putative mitochondrial transport protein; null mutant is viable, exhibits decreased levels of chitin and normal resistance to calcofluor white +S000122078 CDS YFR045W 6 241998 242009 W 2011-02-03 2007-04-04 +S000034370 CDS YFR045W 6 242082 242999 W 2011-02-03 2004-02-05|2007-04-04|1996-07-31 +S000122079 intron YFR045W 6 242010 242081 W 2011-02-03 2007-04-04 +S000001942 ORF Verified YFR046C CNN1 centromere-binding protein CNN1 chromosome 6 6 244159 243074 C 2011-02-03 1996-07-31 Kinetochore protein; associated with the essential kinetochore proteins Nnf1p and Spc24p; phosphorylated by Clb5-Cdk1, Mps1p, Ipl1p and to a lesser extent by Clb2-Cdk1; localizes to the lower region of the Ndc80 complex during anaphase and regulates KMN activity by inhibiting the Mtw1 and Spc105 complexes from binding to the Ndc80 complex; similar to metazoan CENP-T +S000034403 CDS YFR046C 6 244159 243074 C 2011-02-03 1996-07-31 +S000001943 ORF Verified YFR047C BNA6 nicotinate-nucleotide diphosphorylase (carboxylating)|QPT1 chromosome 6 6 245166 244279 C 2011-02-03 1996-07-31 Quinolinate phosphoribosyl transferase; required for the de novo biosynthesis of NAD from tryptophan via kynurenine; expression regulated by Hst1p +S000034510 CDS YFR047C 6 245166 244279 C 2011-02-03 1996-07-31 +S000001944 ORF Verified YFR048W RMD8 chromosome 6 6 246146 248134 W 2011-02-03 1996-07-31 Cytosolic protein required for sporulation +S000035572 CDS YFR048W 6 246146 248134 W 2011-02-03 1996-07-31 +S000001945 ORF Verified YFR049W YMR31 KGD4|mitochondrial 37S ribosomal protein YMR31 chromosome 6 L000002726 6 248523 248894 W 2011-02-03 1996-07-31 Subunit of the mitochondrial alpha-ketoglutarate dehydrogenase; recruits E3 subunit (Lpd1p) to the E1-E2 (Kgd1p, Kgd2p) core; has similarity to human mitochondrial ribosomal protein MRP-S36 +S000035651 CDS YFR049W 6 248523 248894 W 2011-02-03 1996-07-31 +S000001946 ORF Verified YFR050C PRE4 proteasome core particle subunit beta 7 chromosome 6 L000001486 6 249866 249066 C 2011-02-03 1996-07-31 Beta 7 subunit of the 20S proteasome +S000035525 CDS YFR050C 6 249866 249066 C 2011-02-03 1996-07-31 +S000001947 ORF Verified YFR051C RET2 coatomer subunit delta chromosome 6 L000004127 6 251803 250163 C 2011-02-03 1996-07-31 Delta subunit of the coatomer complex (COPI); COPI coats Golgi-derived transport vesicles; involved in retrograde transport between Golgi and ER +S000035589 CDS YFR051C 6 251803 250163 C 2011-02-03 1996-07-31 +S000001948 ORF Verified YFR052W RPN12 proteasome regulatory particle lid subunit RPN12|NIN1 chromosome 6 L000001251 6 252505 253329 W 2011-02-03 1996-07-31 Subunit of the 19S regulatory particle of the 26S proteasome lid; synthetically lethal with RPT1, which is an ATPase component of the 19S regulatory particle; physically interacts with Nob1p and Rpn3p; protein abundance increases in response to DNA replication stress +S000036541 CDS YFR052W 6 252505 253329 W 2011-02-03 1996-07-31 +S000028768 ORF Dubious YFR052C-A chromosome 6 6 253734 253429 C 2011-02-03 2003-08-07|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF HXK1/YFR053C +S000033472 CDS YFR052C-A 6 253734 253429 C 2011-02-03 2003-08-07|2003-07-29 +S000001949 ORF Verified YFR053C HXK1 hexokinase 1 chromosome 6 L000000833 6 255049 253592 C 70 2011-02-03 1996-07-31 Hexokinase isoenzyme 1; a cytosolic protein that catalyzes phosphorylation of glucose during glucose metabolism; expression is highest during growth on non-glucose carbon sources; glucose-induced repression involves hexokinase Hxk2p; HXK1 has a paralog, HXK2, that arose from the whole genome duplication +S000036582 CDS YFR053C 6 255049 253592 C 2011-02-03 1996-07-31 +S000007641 ARS ARS609 ARS609 chromosome 6 6 256277 256431 2011-02-03 2001-03-06 Autonomously replicating sequence on Chromosome VI; activated very late in S phase in ~37% of cell cycles; this origin is specifically fired in the absence of RAD53 in the presence of hydroxyurea +S000121281 ARS_consensus_sequence ARS609 6 256385 256375 C 2011-02-03 2007-03-08 +S000001950 ORF Dubious YFR054C chromosome 6 6 259433 258855 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000036701 CDS YFR054C 6 259433 258855 C 2011-02-03 1996-07-31 +S000001952 ORF Verified YFR055W IRC7 cysteine-S-conjugate beta-lyase IRC7 chromosome 6 6 264204 265226 W 2011-02-03 1996-07-31 Beta-lyase involved in the production of thiols; null mutant displays increased levels of spontaneous Rad52p foci; expression induced by nitrogen limitation in a GLN3, GAT1-dependent manner and by copper levels in a Mac1-dependent manner +S000037482 CDS YFR055W 6 264204 265226 W 2011-02-03 1996-07-31 +S000001951 ORF Dubious YFR056C chromosome 6 6 264325 263957 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized gene YFR055W +S000037536 CDS YFR056C 6 264325 263957 C 2011-02-03 1996-07-31 +S000001953 ORF Uncharacterized YFR057W chromosome 6 6 269061 269516 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000030392 CDS YFR057W 6 269061 269516 W 2011-02-03 1996-07-31 +S000121260 ARS ARS610 ARS610 ARSVI-270 chromosome 6 6 269417 270035 2011-02-03 2007-03-08 Autonomously Replicating Sequence +S000028957 telomere TEL06R chromosome 6 6 269731 270161 W 73 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome VI; composed of an X element core sequence and a short terminal stretch of telomeric repeats +S000028958 telomeric_repeat TEL06R 6 270113 270161 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome VI +S000028959 X_element TEL06R 6 269731 270112 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome VI; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000029680 gene_group MAL1 MAL1 chromosome 7 L000001000 7 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL13 trans-acting MAL-activator, MAL11 maltose permease, and MAL12 maltase +S000028887 telomere TEL07L chromosome 7 7 781 1 C -172 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome VII; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028888 telomeric_repeat TEL07L 7 34 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome VII +S000028889 X_element TEL07L 7 781 318 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome VII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028890 X_element_combinatorial_repeat TEL07L 7 317 35 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr VII; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000006948 long_terminal_repeat YGLWomega1 chromosome 7 7 838 1079 W 2000-05-19 2000-05-19 Ty5 LTR +S000003232 ORF Verified YGL263W COS12 chromosome 7 L000004069 7 2790 3932 W 1996-07-31 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000031687 CDS YGL263W 7 2790 3932 W 1996-07-31 1996-07-31 +S000003231 ORF Uncharacterized YGL262W chromosome 7 7 5312 5839 W 1996-07-31 1996-07-31 Putative protein of unknown function; null mutant displays elevated sensitivity to expression of a mutant huntingtin fragment or of alpha-synuclein; YGL262W is not an essential gene +S000031603 CDS YGL262W 7 5312 5839 W 1996-07-31 1996-07-31 +S000003230 ORF Uncharacterized YGL261C PAU11 seripauperin PAU11 chromosome 7 7 6652 6290 C 1996-07-31 1996-07-31 Putative protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; mRNA expression appears to be regulated by SUT1 and UPC2 +S000030725 CDS YGL261C 7 6652 6290 C 1996-07-31 1996-07-31 +S000003229 ORF Uncharacterized YGL260W chromosome 7 7 6860 7090 W 1996-07-31 1996-07-31 Putative protein of unknown function; transcription is significantly increased in a NAP1 deletion background; deletion mutant has increased accumulation of nickel and selenium +S000030684 CDS YGL260W 7 6860 7090 W 1996-07-31 1996-07-31 +S000003228 ORF Uncharacterized YGL259W YPS5 chromosome 7 L000004385 7 8470 8967 W 1996-07-31 1996-07-31 Protein with similarity to GPI-anchored aspartic proteases; such proteases are Yap1p and Yap3p; mCherry fusion protein localizes to the vacuole +S000030354 CDS YGL259W 7 8470 8967 W 1996-07-31 1996-07-31 +S000007607 ORF Uncharacterized YGL258W-A chromosome 7 7 9162 9395 W 2001-02-26 2001-02-26 Putative protein of unknown function +S000037184 CDS YGL258W-A 7 9162 9395 W 2001-02-26 2001-02-26 +S000003227 ORF Verified YGL258W VEL1 chromosome 7 7 11110 11730 W 1996-07-31 1996-07-31 Protein of unknown function; highly induced in zinc-depleted conditions and has increased expression in NAP1 deletion mutants; VEL1 has a paralog, YOR387C, that arose from a single-locus duplication +S000030158 CDS YGL258W 7 11110 11730 W 1996-07-31 1996-07-31 +S000003226 ORF Verified YGL257C MNT2 alpha-1,3-mannosyltransferase MNT2 chromosome 7 S000007417 7 14157 12481 C 1996-07-31 1996-07-31 Mannosyltransferase; involved in adding the 4th and 5th mannose residues of O-linked glycans +S000037390 CDS YGL257C 7 14157 12481 C 1996-07-31 1996-07-31 +S000003225 ORF Verified YGL256W ADH4 alcohol dehydrogenase ADH4|ZRG5|NRC465 chromosome 7 L000000044 7 15159 16307 W -169 2008-06-02 1996-07-31|2008-06-02 Alcohol dehydrogenase isoenzyme type IV; dimeric enzyme demonstrated to be zinc-dependent despite sequence similarity to iron-activated alcohol dehydrogenases; transcription is induced in response to zinc deficiency +S000037356 CDS YGL256W 7 15159 16307 W 2008-06-02 1996-07-31|2008-06-02 +S000003224 ORF Verified YGL255W ZRT1 high-affinity Zn(2+) transporter ZRT1 chromosome 7 L000003260 7 20978 22108 W 1996-07-31 1996-07-31 High-affinity zinc transporter of the plasma membrane; responsible for the majority of zinc uptake; transcription is induced under low-zinc conditions by the Zap1p transcription factor +S000037251 CDS YGL255W 7 20978 22108 W 1996-07-31 1996-07-31 +S000003223 ORF Verified YGL254W FZF1 SUL1|RSU1|NRC299 chromosome 7 L000001781|L000000656 7 22304 23203 W 1996-07-31 1996-07-31 Transcription factor involved in sulfite metabolism; sole identified regulatory target is SSU1; overexpression suppresses sulfite-sensitivity of many unrelated mutants due to hyperactivation of SSU1, contains five zinc fingers; protein abundance increases in response to DNA replication stress +S000036566 CDS YGL254W 7 22304 23203 W 1996-07-31 1996-07-31 +S000003222 ORF Verified YGL253W HXK2 hexokinase 2|SCI2|HKB|HEX1 chromosome 7 L000000834 7 23935 25395 W -167 1996-07-31 1996-07-31 Hexokinase isoenzyme 2; phosphorylates glucose in cytosol; predominant hexokinase during growth on glucose; represses expression of HXK1, GLK1, induces expression of its own gene; antiapoptotic; phosphorylation/dephosphorylation at Ser14 by kinase Snf1p, phosphatase Glc7p-Reg1p regulates nucleocytoplasmic shuttling of Hxk2p; functions downstream of Sit4p in control of cell cycle, mitochondrial function, oxidative stress resistance, chronological lifespan; has paralog HXK1 +S000036456 CDS YGL253W 7 23935 25395 W 1996-07-31 1996-07-31 +S000003221 ORF Verified YGL252C RTG2 chromosome 7 L000001784 7 27484 25718 C 1996-07-31 1996-07-31 Sensor of mitochondrial dysfunction; regulates the subcellular location of Rtg1p and Rtg3p, transcriptional activators of the retrograde (RTG) and TOR pathways; Rtg2p is inhibited by the phosphorylated form of Mks1p +S000036310 CDS YGL252C 7 27484 25718 C 1996-07-31 1996-07-31 +S000003220 ORF Verified YGL251C HFM1 MER3 chromosome 7 L000002581 7 31636 27921 C 2000-07-14 2000-07-14|1996-07-31 Meiosis specific DNA helicase; involved in the conversion of double-stranded breaks to later recombination intermediates and in crossover control; catalyzes the unwinding of Holliday junctions; has ssDNA and dsDNA stimulated ATPase activity +S000035419 CDS YGL251C 7 31426 27921 C 2000-07-14 2000-07-14|1996-07-31 +S000035418 CDS YGL251C 7 31636 31579 C 2000-07-14 2000-07-14 +S000035420 intron YGL251C 7 31578 31427 C 2000-07-14 2000-07-14 +S000003219 ORF Verified YGL250W RMR1 chromosome 7 7 31910 32635 W 2003-09-22 2003-09-22|1996-07-31 Protein required for meiotic recombination and gene conversion; null mutant displays reduced PIS1 expression and growth defects on non-fermentable carbon sources and minimal media; GFP-fusion protein localizes to both cytoplasm and nucleus +S000035397 CDS YGL250W 7 31910 32635 W 2003-09-22 2003-09-22|1996-07-31 +S000003218 ORF Verified YGL249W ZIP2 chromosome 7 L000003536 7 33098 35212 W 1996-07-31 1996-07-31 Meiosis-specific protein; involved in normal synaptonemal complex formation and pairing between homologous chromosomes during meiosis; relocalizes from mitochondrion to cytoplasm upon DNA replication stress +S000034159 CDS YGL249W 7 33098 35212 W 1996-07-31 1996-07-31 +S000144910 ncRNA_gene RME3 RME3 SUT534 chromosome 7 7 35013 33109 C 2014-11-18 2014-11-18 Antisense transcript that represses the meiosis-specific ZIP2 gene; expressed in haploid cells under sporulation inducing conditions; regulates ZIP2 in a cis-dependent manner; RME3 is repressed by the MAT a1/alpha2 complex in diploid cells +S000178099 noncoding_exon RME3 7 35013 33109 C 2014-11-18 2014-11-18 +S000003217 ORF Verified YGL248W PDE1 3',5'-cyclic-nucleotide phosphodiesterase PDE1 chromosome 7 L000001358 7 35653 36762 W 1996-07-31 1996-07-31 Low-affinity cyclic AMP phosphodiesterase; controls glucose and intracellular acidification-induced cAMP signaling, target of the cAMP-protein kinase A (PKA) pathway; glucose induces transcription and inhibits translation +S000033288 CDS YGL248W 7 35653 36762 W 1996-07-31 1996-07-31 +S000003216 ORF Verified YGL247W BRR6 chromosome 7 7 36933 37526 W 1996-07-31 1996-07-31 Essential nuclear envelope integral membrane protein; interacts and functions with Apq12p and Brl1p in lipid homeostasis; mutants are defective in nuclear pore complex biogenesis, nuclear envelope morphology, mRNA nuclear export, and are sensitive to sterol biosynthesis inhibitors and membrane fluidizing agents; exhibits synthetic lethal genetic interactions with genes involved in lipid metabolism; homologous to Brl1p +S000033240 CDS YGL247W 7 36933 37526 W 1996-07-31 1996-07-31 +S000003215 ORF Verified YGL246C RAI1 decapping nuclease chromosome 7 S000007430 7 38780 37617 C 1996-07-31 1996-07-31 Nuclear protein with decapping endonuclease activity; targets mRNAs with unmethylated 7-methylguanosine cap structures and 5'-triphosphates; binds to and stabilizes the exoribonuclease Rat1p; required for pre-rRNA processing; relocalizes to the cytosol in response to hypoxia; homologous to human DOM3Z +S000033150 CDS YGL246C 7 38780 37617 C 1996-07-31 1996-07-31 +S000003214 ORF Verified YGL245W GUS1 glutamate--tRNA ligase GUS1|GluRS|GSN1 chromosome 7 7 39023 41149 W 2003-09-22 2003-09-22|1996-07-31 Glutamyl-tRNA synthetase (GluRS); forms a complex with methionyl-tRNA synthetase (Mes1p) and Arc1p; complex formation increases the catalytic efficiency of both tRNA synthetases and ensures their correct localization to the cytoplasm; protein abundance increases in response to DNA replication stress +S000033122 CDS YGL245W 7 39023 41149 W 2003-09-22 2003-09-22|1996-07-31 +S000003213 ORF Verified YGL244W RTF1 CSL3 chromosome 7 L000001782 7 41498 43174 W 1999-07-17 1999-07-17|1996-07-31 Subunit of RNAPII-associated chromatin remodeling Paf1 complex; regulates gene expression by directing cotranscriptional histone modification, influences transcription and chromatin structure through several independent functional domains; directly or indirectly regulates DNA-binding properties of Spt15p and relative activities of different TATA elements; involved in transcription elongation as demonstrated by the G-less-based run-on (GLRO) assay +S000032242 CDS YGL244W 7 41498 43174 W 1999-07-17 1999-07-17|1996-07-31 +S000003212 ORF Verified YGL243W TAD1 tRNA-specific adenosine deaminase chromosome 7 L000004621 7 43307 44509 W 1996-07-31 1996-07-31 tRNA-specific adenosine deaminase; deaminates adenosine-37 to inosine in tRNA-Ala +S000032159 CDS YGL243W 7 43307 44509 W 1996-07-31 1996-07-31 +S000003211 ORF Verified YGL242C chromosome 7 7 45197 44652 C 1996-07-31 1996-07-31 Protein of unknown function; N-terminally propionylated in vivo; deletion mutant is viable +S000032036 CDS YGL242C 7 45197 44652 C 1996-07-31 1996-07-31 +S000003210 ORF Verified YGL241W KAP114 chromosome 7 L000004867 7 45445 48459 W 1996-07-31 1996-07-31 Karyopherin, responsible for nuclear import of specific proteins; cargoes include Spt15p, Sua7p, histones H2A and H2B, and Nap1p; amino terminus shows similarity to those of other importins, particularly Cse1p; localization is primarily nuclear; function is regulated by sumoylation; protein abundance increases in response to DNA replication stress +S000032007 CDS YGL241W 7 45445 48459 W 1996-07-31 1996-07-31 +S000003209 ORF Verified YGL240W DOC1 anaphase promoting complex subunit DOC1|APC10 chromosome 7 L000004350 7 48613 49365 W 2003-09-22 2003-09-22|1996-07-31 Processivity factor; required for the ubiquitination activity of the anaphase promoting complex (APC), mediates the activity of the APC by contributing to substrate recognition; involved in cyclin proteolysis; contains a conserved DOC1 homology domain +S000031054 CDS YGL240W 7 48613 49365 W 2003-09-22 2003-09-22|1996-07-31 +S000003207 ORF Verified YGL238W CSE1 importin-alpha export receptor|KAP109 chromosome 7 L000000425 7 49552 52434 W 1996-07-31 1996-07-31 Nuclear envelope protein that acts as a recycling factor; mediates the nuclear export of Srp1p (importin alpha) back to the cytoplasm after its import substrates have been released into the nucleoplasm, thereby allowing the participation of Srp1p in multiple rounds of nuclear import; required for accurate chromosome segregation; homolog of metazoan CAS and human CSE1L, overexpression of which is implicated in cancer progression +S000029914 CDS YGL238W 7 49552 52434 W 1996-07-31 1996-07-31 +S000003208 ORF Dubious YGL239C chromosome 7 7 49745 49431 C 1996-07-31 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified gene CSE1 +S000029968 CDS YGL239C 7 49745 49431 C 1996-07-31 1996-07-31 +S000003206 ORF Verified YGL237C HAP2 chromosome 7 L000000752 7 53528 52731 C -148 1996-07-31 1996-07-31 Subunit of the Hap2p/3p/4p/5p CCAAT-binding complex; complex is heme-activated and glucose-repressed; complex is a transcriptional activator and global regulator of respiratory gene expression; contains sequences sufficient for both complex assembly and DNA binding; respiratory defect of the null mutant is functionally complemented by human NFYA +S000037826 CDS YGL237C 7 53528 52731 C 1996-07-31 1996-07-31 +S000003204 ORF Uncharacterized YGL235W chromosome 7 7 55279 55815 W 2004-07-15 1996-07-31 Putative protein of unknown function; potential Cdc28p substrate; null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2 +S000037051 CDS YGL235W 7 55279 55815 W 2004-07-15 1996-07-31 +S000003205 ORF Verified YGL236C MTO1 tRNA modification protein MTO1|IPS1 chromosome 7 7 55796 53787 C 2004-07-15 2004-07-15|1996-07-31 Mitochondrial protein; forms heterodimer complex with Mss1p that performs 5-carboxymethylaminomethyl modification of the wobble uridine base in mitochondrial tRNAs; required for respiration in paromomycin-resistant 15S rRNA mutants; human homolog MTO1 can complement yeast null mutant +S000037073 CDS YGL236C 7 55796 53787 C 2004-07-15 2004-07-15|1996-07-31 +S000003203 ORF Verified YGL234W ADE5,7 bifunctional aminoimidazole ribotide synthase/glycinamide ribotide synthase chromosome 7 L000000035 7 56482 58890 W -152 2004-07-15 1996-07-31 Enzyme of the 'de novo' purine nucleotide biosynthetic pathway; contains aminoimidazole ribotide synthetase and glycinamide ribotide synthetase activities +S000036969 CDS YGL234W 7 56482 58890 W 2004-07-15 1996-07-31 +S000003202 ORF Verified YGL233W SEC15 Rab GTPase-binding exocyst subunit SEC15 chromosome 7 L000001840 7 59122 61854 W 2004-07-15 1996-07-31 Essential 113 kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis prior to SNARE-mediated fusion; interacts with and functions as a downstream effector of active, GTP-bound Sec4p, a Rab family GTPase +S000036914 CDS YGL233W 7 59122 61854 W 2004-07-15 1996-07-31 +S000003201 ORF Verified YGL232W TAN1 putative tRNA acetyltransferase chromosome 7 7 62075 63002 W 2004-07-15 1996-07-31 Putative tRNA acetyltransferase; RNA-binding protein required for the formation of the modified nucleoside N(4)-acetylcytidine in serine and leucine tRNAs but not required for the same modification in 18S rRNA; protein abundance increases in response to DNA replication stress +S000036130 CDS YGL232W 7 62075 62131 W 2004-07-15 1996-07-31 +S000036131 CDS YGL232W 7 62190 63002 W 2004-07-15 1996-07-31 +S000036132 intron YGL232W 7 62132 62189 W 2004-07-15 1996-07-31 +S000003200 ORF Verified YGL231C EMC4 chaperone EMC4 chromosome 7 7 63620 63048 C 2004-07-15 1996-07-31 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response; homologous to worm ZK616.6/EMC-4 and fly CG11137; mutation is functionally complemented by human EMC4 +S000035888 CDS YGL231C 7 63620 63048 C 2004-07-15 1996-07-31 +S000003199 ORF Uncharacterized YGL230C chromosome 7 7 64215 63772 C 2004-07-15 1996-07-31 Putative protein of unknown function; non-essential gene +S000034975 CDS YGL230C 7 64215 63772 C 2004-07-15 1996-07-31 +S000118451 ARS ARS702 ARSVII-64 chromosome 7 7 64360 64464 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000119018 ARS_consensus_sequence ARS702 7 64458 64444 C 2006-10-03 2006-10-03 +S000003198 ORF Verified YGL229C SAP4 chromosome 7 L000003341 7 66959 64503 C 2004-07-15 1996-07-31 Protein required for function of the Sit4p protein phosphatase; member of a family of similar proteins that form complexes with Sit4p, including Sap155p, Sap185p, and Sap190p; SAP4 has a paralog, SAP155, that arose from the whole genome duplication +S000034012 CDS YGL229C 7 66959 64503 C 2004-07-15 1996-07-31 +S000003197 ORF Verified YGL228W SHE10 chromosome 7 L000002872 7 67598 69331 W 2004-07-15 1996-07-31 Protein involved in outer spore wall assembly; likely involved directly in dityrosine layer assembly; putative GPI-anchored protein; overexpression causes growth arrest;; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; SHE10 has a paralog, OSW7/YFR039C, that arose from the whole genome duplication; paralogs are redundant for spore wall dityrosine assembly +S000033924 CDS YGL228W 7 67598 69331 W 2004-07-15 1996-07-31 +S000003196 ORF Verified YGL227W VID30 glucose-induced degradation complex subunit VID30|GID1 chromosome 7 L000004008 7 69671 72547 W 2004-07-15 1996-07-31 Central component of GID Complex, involved in FBPase degradation; interacts strongly with Gid8p to serve as a scaffold for other GID Complex subunits; contains SPRY domain and 3 domains that are also found in Gid8p - LisH, CTLH, and CRA; required for association of Vid vesicles and actin patches in vacuole import and degradation pathway; shifts the balance of nitrogen metabolism toward glutamate production; localizes to the nucleus and the cytoplasm +S000033846 CDS YGL227W 7 69671 72547 W 2004-07-15 1996-07-31 +S000003194 ORF Verified YGL226C-A OST5 dolichyl-diphosphooligosaccharide--protein glycotransferase subunit chromosome 7 L000002944 7 73158 72749 C 2011-02-03 1996-07-31 Zeta subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins +S000037108 CDS YGL226C-A 7 72988 72749 C 2011-02-03 1996-07-31 +S000037107 CDS YGL226C-A 7 73158 73138 C 2011-02-03 1996-07-31 +S000037109 intron YGL226C-A 7 73137 72989 C 2011-02-03 1996-07-31 +S000003195 ORF Verified YGL226W MTC3 chromosome 7 7 73340 73711 W 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion; mtc3 is synthetically sick with cdc13-1 +S000033716 CDS YGL226W 7 73340 73711 W 2011-02-03 1996-07-31 +S000006757 tRNA_gene tV(AAC)G3 chromosome 7 L000003854 7 73902 73829 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000036907 noncoding_exon tV(AAC)G3 7 73902 73829 C 2011-02-03 2000-05-19 +S000003193 ORF Verified YGL225W VRG4 GDP-mannose transporter|VIG4|LDB3|GOG5|VAN2 chromosome 7 L000000719 7 76894 77907 W 2011-02-03 1996-07-31 Golgi GDP-mannose transporter; regulates Golgi function and glycosylation in Golgi; VRG4 has a paralog, HVG1, that arose from the whole genome duplication +S000033042 CDS YGL225W 7 76894 77907 W 2011-02-03 1996-07-31 +S000003192 ORF Verified YGL224C SDT1 nucleotidase|SSM1 chromosome 7 L000003406 7 78857 78015 C 2011-02-03 1996-07-31 Pyrimidine nucleotidase; responsible for production of nicotinamide riboside and nicotinic acid riboside; overexpression suppresses the 6-AU sensitivity of transcription elongation factor S-II, as well as resistance to other pyrimidine derivatives; SDT1 has a paralog, PHM8, that arose from the whole genome duplication +S000032898 CDS YGL224C 7 78857 78015 C 2011-02-03 1996-07-31 +S000003191 ORF Verified YGL223C COG1 Golgi transport complex subunit COG1|SEC36|LDB11|COD3 chromosome 7 7 80365 79112 C 2011-02-03 1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000032824 CDS YGL223C 7 80365 79112 C 2011-02-03 1996-07-31 +S000003190 ORF Verified YGL222C EDC1 chromosome 7 7 81186 80659 C 2011-02-03 1996-07-31 RNA-binding protein that activates mRNA decapping directly; binds to mRNA substrate and enhances activity of decapping proteins Dcp1p and Dcp2p; has a role in translation during heat stress; protein becomes more abundant and forms cytoplasmic foci in response to DNA replication stress; EDC1 has a paralog, EDC2, that arose from the whole genome duplication +S000031900 CDS YGL222C 7 81186 80659 C 2011-02-03 1996-07-31 +S000003189 ORF Verified YGL221C NIF3 hypothetical protein chromosome 7 L000003316 7 82292 81426 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Listeria monocytogenes major sigma factor (rpoD gene product); the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000031759 CDS YGL221C 7 82292 81426 C 2011-02-03 1996-07-31 +S000003188 ORF Verified YGL220W BOL2 FRA2|AIM15 chromosome 7 7 82374 82736 W 2011-02-03 1996-07-31 Cytosolic protein involved in repression of iron regulon transcription; forms an iron-independent complex with Fra1p, Grx3p, and Grx4p; null mutant fails to repress the iron regulon and is sensitive to nickel; sequence similarity to human BOLA family member, BOLA2 +S000031708 CDS YGL220W 7 82374 82736 W 2011-02-03 1996-07-31 +S000003186 ORF Dubious YGL218W SRF1 chromosome 7 7 83650 84300 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 93% of ORF overlaps the verified gene MDM34; deletion in cyr1 mutant results in loss of stress resistance +S000030779 CDS YGL218W 7 83650 84300 W 2011-02-03 1996-07-31 +S000003187 ORF Verified YGL219C MDM34 ERMES complex subunit MDM34|MMM2 chromosome 7 7 84257 82878 C 2011-02-03 1996-07-31 Mitochondrial component of the ERMES complex; links the ER to mitochondria and may promote inter-organellar calcium and phospholipid exchange as well as coordinating mitochondrial DNA replication and growth; required for mitophagy; ERMES complex is often co-localized with peroxisomes and with concentrated areas of pyruvate dehydrogenase +S000030809 CDS YGL219C 7 84257 82878 C 2011-02-03 1996-07-31 +S000003184 ORF Verified YGL216W KIP3 tubulin-dependent ATPase KIP3 chromosome 7 L000003911 7 84885 87302 W 2011-02-03 1996-07-31 Kinesin-related antiparallel sliding motor protein; involved in mitotic spindle positioning; sliding activity promotes bipolar spindle assembly and maintenance of genome stability; inhibits spindle elongation, destabilizing late anaphase spindle microtubules that polymerize beyond the midzone +S000037780 CDS YGL216W 7 84885 87302 W 2011-02-03 1996-07-31 +S000003185 ORF Dubious YGL217C chromosome 7 7 85180 84839 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF KIP3/YGL216W +S000030618 CDS YGL217C 7 85180 84839 C 2011-02-03 1996-07-31 +S000003183 ORF Verified YGL215W CLG1 chromosome 7 L000000356 7 87981 89339 W 2011-02-03 1996-07-31 Cyclin-like protein that interacts with Pho85p; has sequence similarity to G1 cyclins PCL1 and PCL2 +S000037731 CDS YGL215W 7 87981 89339 W 2011-02-03 1996-07-31 +S000003182 ORF Dubious YGL214W chromosome 7 7 90010 90495 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; deletion mutation phenotype is likely due to the overlapping verified ORF SKI8/YGL213C +S000037674 CDS YGL214W 7 90010 90495 W 2011-02-03 1996-07-31|2011-02-03 +S000003181 ORF Verified YGL213C SKI8 SKI complex subunit WD repeat protein SKI8|REC103 chromosome 7 L000001906 7 91247 90054 C -149 2011-02-03 1996-07-31 Ski complex component and WD-repeat protein; mediates 3'-5' RNA degradation by the cytoplasmic exosome; also required for meiotic double-strand break recombination; null mutants have superkiller phenotype +S000037570 CDS YGL213C 7 91247 90054 C 2011-02-03 1996-07-31 +S000003180 ORF Verified YGL212W VAM7 VPL24|VPS43 chromosome 7 L000002452 7 91432 92382 W 2011-02-03 1996-07-31 Vacuolar SNARE protein; functions with Vam3p in vacuolar protein trafficking; has an N-terminal PX domain (phosphoinositide-binding module) that binds PtdIns-3-P and mediates membrane binding; SNAP-25 homolog; protein abundance increases in response to DNA replication stress +S000036874 CDS YGL212W 7 91432 92382 W 2011-02-03 1996-07-31 +S000003179 ORF Verified YGL211W NCS6 TUC1|YGL210W-A chromosome 7 7 92512 93591 W 2011-02-03 2004-07-20|1996-07-31 Protein required for uridine thiolation of Gln, Lys, and Glu tRNAs; required for the thiolation of uridine at the wobble position of Gln, Lys, and Glu tRNAs; has a role in urmylation and in invasive and pseudohyphal growth; inhibits replication of Brome mosaic virus in S. cerevisiae +S000036823 CDS YGL211W 7 92512 93591 W 2011-02-03 2004-07-20|1996-07-31 +S000003178 ORF Verified YGL210W YPT32 Rab family GTPase YPT32 chromosome 7 L000002897 7 93792 94460 W 2011-02-03 1996-07-31 Rab family GTPase involved in the exocytic pathway; mediates intra-Golgi traffic or the budding of post-Golgi vesicles from the trans-Golgi; protein abundance increases in response to DNA replication stress; YPT32 has a paralog, YPT31, that arose from the whole genome duplication +S000036765 CDS YGL210W 7 93792 94460 W 2011-02-03 1996-07-31 +S000003177 ORF Verified YGL209W MIG2 MLZ1 chromosome 7 L000003254 7 95858 97006 W 2011-02-03 1996-07-31 Zinc finger transcriptional repressor; cooperates with Mig1p in glucose-induced gene repression; under low glucose conditions relocalizes to mitochondrion, where it interacts with Ups1p, antagonizes mitochondrial fission factor Dnm1p, indicative of a role in mitochondrial fusion or regulating morphology; regulates filamentous growth in response to glucose depletion; activated in stochastic pulses of nuclear localization in response to low glucose +S000035806 CDS YGL209W 7 95858 97006 W 2011-02-03 1996-07-31 +S000003176 ORF Verified YGL208W SIP2 SPM2 chromosome 7 L000001891|L000001998 7 97338 98585 W 2011-02-03 1996-07-31|2011-02-03 One of three beta subunits of the Snf1 kinase complex; involved in the response to glucose starvation; null mutants exhibit accelerated aging; N-myristoylprotein localized to the cytoplasm and the plasma membrane; SIP2 has a paralog, GAL83, that arose from the whole genome duplication +S000035685 CDS YGL208W 7 97338 98585 W 2011-02-03 1996-07-31|2011-02-03 +S000003175 ORF Verified YGL207W SPT16 chromatin-remodeling protein SPT16|SSF1|CDC68 chromosome 7 L000002038 7 98969 102076 W -134 2011-02-03 1996-07-31 Subunit of the heterodimeric FACT complex (Spt16p-Pob3p); FACT associates with chromatin via interaction with Nhp6Ap and Nhp6Bp, and reorganizes nucleosomes to facilitate access to DNA by RNA and DNA polymerases; specifically required for diauxic shift-induced H2B deposition onto rDNA genes; mutations cause reduced nucleosome occupancy over highly transcribed regions; coregulates transcription with Mot1p through preinitiation complex assembly and nucleosome organization +S000034683 CDS YGL207W 7 98969 102076 W 2011-02-03 1996-07-31 +S000003174 ORF Verified YGL206C CHC1 clathrin heavy chain|SWA5 chromosome 7 L000000317 7 107504 102543 C -133 2011-02-03 1996-07-31 Clathrin heavy chain; subunit of the major coat protein involved in intracellular protein transport and endocytosis; the clathrin triskelion is a trimeric molecule composed of three heavy chains that radiate from a vertex and three light chains which bind noncovalently near the vertex of the triskelion; the light chain (CLC1) is thought to regulate function +S000034547 CDS YGL206C 7 107504 102543 C 2011-02-03 1996-07-31 +S000003173 ORF Verified YGL205W POX1 acyl-CoA oxidase|FOX1 chromosome 7 L000001467 7 108158 110404 W 2011-02-03 1996-07-31 Fatty-acyl coenzyme A oxidase; involved in the fatty acid beta-oxidation pathway; localized to the peroxisomal matrix +S000034502 CDS YGL205W 7 108158 110404 W 2011-02-03 1996-07-31 +S000006595 tRNA_gene tH(GUG)G1 chromosome 7 L000003822 7 110696 110625 C 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000036197 noncoding_exon tH(GUG)G1 7 110696 110625 C 2011-02-03 2000-05-19 +S000006950 long_terminal_repeat YGLWtau1 chromosome 7 7 110855 111225 W 2011-02-03 2000-05-19 Ty4 LTR +S000006935 long_terminal_repeat YGLCdelta1 chromosome 7 7 111505 111226 C 2011-02-03 2000-05-19 Ty1 LTR +S000006940 long_terminal_repeat YGLWdelta2 chromosome 7 7 111506 111698 W 2011-02-03 2000-05-19 Ty1 LTR +S000003172 ORF Uncharacterized YGL204C chromosome 7 7 112005 111700 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000033547 CDS YGL204C 7 112005 111700 C 2011-02-03 1996-07-31 +S000118452 ARS ARS704 ARSVII-112 chromosome 7 7 112079 112317 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119019 ARS_consensus_sequence ARS704 7 112125 112139 W 2011-02-03 2006-10-03 +S000003171 ORF Verified YGL203C KEX1 serine-type carboxypeptidase chromosome 7 L000000895 7 114664 112475 C -131 2011-02-03 1996-07-31 Cell death protease essential for hypochlorite-induced apoptosis; involved in the processing of killer toxin and alpha factor precursor; cleaves Lys and Arg residues from the C-terminus of peptides and proteins +S000033480 CDS YGL203C 7 114664 112475 C 2011-02-03 1996-07-31 +S000006941 long_terminal_repeat YGLWdelta3 chromosome 7 7 114939 115269 W 2011-02-03 2000-05-19 Ty1 LTR +S000006630 tRNA_gene tK(UUU)G1 chromosome 7 L000003819 7 115488 115583 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000033672 intron tK(UUU)G1 7 115525 115547 W 2011-02-03 2000-05-19 +S000033670 noncoding_exon tK(UUU)G1 7 115488 115524 W 2011-02-03 2000-05-19 +S000033671 noncoding_exon tK(UUU)G1 7 115548 115583 W 2011-02-03 2000-05-19 +S000003170 ORF Verified YGL202W ARO8 bifunctional 2-aminoadipate transaminase/aromatic-amino-acid:2-oxoglutarate transaminase chromosome 7 L000003949 7 116059 117561 W 2011-02-03 1996-07-31 Aromatic aminotransferase I; expression is regulated by general control of amino acid biosynthesis +S000033459 CDS YGL202W 7 116059 117561 W 2011-02-03 1996-07-31 +S000114845 ARS ARS706 ARS706 ARO8 ARS chromosome 7 7 117561 117854 2011-02-03 2006-04-12 Autonomously Replicating Sequence +S000003169 ORF Verified YGL201C MCM6 MCM DNA helicase complex subunit MCM6 chromosome 7 L000004104 7 120907 117854 C 2011-02-03 2004-01-23|1996-07-31 Protein involved in DNA replication; component of the Mcm2-7 hexameric helicase complex that binds chromatin as a part of the pre-replicative complex; forms a subcomplex with Mcm4p and Mcm7p +S000033344 CDS YGL201C 7 120907 117854 C 2011-02-03 2004-01-23|1996-07-31 +S000006621 tRNA_gene tK(CUU)G1 chromosome 7 L000003820 7 122269 122341 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000029888 noncoding_exon tK(CUU)G1 7 122269 122341 W 2011-02-03 2000-05-19 +S000003168 ORF Verified YGL200C EMP24 BST2 chromosome 7 L000000549 7 123305 122694 C 2011-02-03 1996-07-31 Component of the p24 complex; role in misfolded protein quality control; binds to GPI anchor proteins and mediates their efficient transport from the ER to the Golgi; integral membrane protein that associates with endoplasmic reticulum-derived COPII-coated vesicles +S000032658 CDS YGL200C 7 123305 122694 C 2011-02-03 1996-07-31 +S000003166 ORF Verified YGL198W YIP4 chromosome 7 7 123591 124298 W 2011-02-03 2004-01-23|1996-07-31 Protein that interacts with Rab GTPases; localized to late Golgi vesicles; computational analysis of large-scale protein-protein interaction data suggests a possible role in vesicle-mediated transport +S000034057 CDS YGL198W 7 123591 124298 W 2011-02-03 2004-01-23|1996-07-31 +S000003167 ORF Dubious YGL199C chromosome 7 7 124042 123572 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YIP4/YGL198W +S000034896 CDS YGL199C 7 124042 123572 C 2011-02-03 1996-07-31 +S000003165 ORF Verified YGL197W MDS3 chromosome 7 L000003960 7 124698 129161 W 2011-02-03 1996-07-31|2011-02-03 Putative component of the TOR regulatory pathway; negative regulator of early meiotic gene expression; required, with Pmd1p, for growth under alkaline conditions; has an N-terminal kelch-like domain; MDS3 has a paralog, PMD1, that arose from the whole genome duplication +S000033900 CDS YGL197W 7 124698 129161 W 2011-02-03 1996-07-31|2011-02-03 +S000003164 ORF Verified YGL196W DSD1 D-serine ammonia-lyase DSD1 chromosome 7 7 129883 131169 W 2011-02-03 2004-07-19|1996-07-31 D-serine dehydratase (aka D-serine ammonia-lyase); converts D-serine to pyruvate and ammonia by a reaction dependent on pyridoxal 5'-phosphate and zinc; may play a role in D-serine detoxification; L-serine is not a substrate +S000033780 CDS YGL196W 7 129883 131169 W 2011-02-03 2004-07-19|1996-07-31 +S000003163 ORF Verified YGL195W GCN1 AAS103|NDR1 chromosome 7 L000000680 7 131525 139543 W 2011-02-03 1996-07-31 Positive regulator of the Gcn2p kinase activity; forms a complex with Gcn20p; proposed to stimulate Gcn2p activation by an uncharged tRNA +S000033049 CDS YGL195W 7 131525 139543 W 2011-02-03 1996-07-31 +S000087160 ORF Uncharacterized YGL194C-A chromosome 7 7 139961 139719 C 2011-02-03 2005-11-10 Putative protein of unknown function; identified based on comparisons of the genome sequences of six Saccharomyces species; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000087161 CDS YGL194C-A 7 139961 139719 C 2011-02-03 2005-11-10 +S000003162 ORF Verified YGL194C HOS2 histone deacetylase HOS2|RTL1 chromosome 7 L000004092|L000003448 7 141726 140368 C 2011-02-03 1996-07-31 Histone deacetylase and subunit of Set3 and Rpd3L complexes; required for gene activation via specific deacetylation of lysines in H3 and H4 histone tails; subunit of the Set3 complex, a meiotic-specific repressor of sporulation specific genes that contains deacetylase activity; co-localizes with Cmr1p in nuclear foci in response to DNA damage by MMS +S000032901 CDS YGL194C 7 141726 140368 C 2011-02-03 1996-07-31 +S000003161 ORF Uncharacterized YGL193C chromosome 7 7 142227 141916 C 2011-02-03 1996-07-31 Haploid-specific gene repressed by a1-alpha2; turned off in sir3 null strains, absence enhances the sensitivity of rad52-327 cells to campothecin almost 100-fold +S000032793 CDS YGL193C 7 142227 141916 C 2011-02-03 1996-07-31 +S000003160 ORF Verified YGL192W IME4 mRNA (N6-adenosine)-methyltransferase|SPO8 chromosome 7 L000000863|L000002001 7 142246 144048 W -130 2011-02-03 1996-07-31 mRNA N6-adenosine methyltransferase required for entry into meiosis; mediates N6-adenosine methylation of bulk mRNA during the induction of sporulation which includes the meiotic regulators IME1, IME2 and IME4 itself; repressed in haploids via production of antisense IME4 transcripts; transcribed in diploid cells where antisense transcription is repressed; orthologous to human METTL3 (MT-A70) +S000031956 CDS YGL192W 7 142246 144048 W 2011-02-03 1996-07-31 +S000144908 ncRNA_gene RME2 RME2 IME4-AS chromosome 7 7 144120 141898 C 2014-11-18 2014-11-18 Antisense transcript initiated from the 3' end of the IME4 locus; expressed in haploids and interferes with IME4 expression through a cis-acting mechanism; RME2 expression is repressed by the MAT a1/alpha2 repressor complex +S000178098 noncoding_exon RME2 7 144120 141898 C 2014-11-18 2014-11-18 +S000003159 ORF Verified YGL191W COX13 cytochrome c oxidase subunit VIa chromosome 7 L000000397 7 144808 145197 W 2011-02-03 1996-07-31 Subunit VIa of cytochrome c oxidase; present in a subclass of cytochrome c oxidase complexes that may have a role in mimimizing generation of reactive oxygen species; not essential for cytochrome c oxidase activity but may modulate activity in response to ATP; required for assembly of Rcf2p into cytochrome c oxidase - cytochrome bc1 supercomplexes +S000031830 CDS YGL191W 7 144808 145197 W 2011-02-03 1996-07-31 +S000003158 ORF Verified YGL190C CDC55 TMR4|protein phosphatase 2A regulatory subunit CDC55 chromosome 7 L000000282|S000029602|L000003191 7 147389 145809 C -125 2011-02-03 1996-07-31 Regulatory subunit B of protein phosphatase 2A (PP2A); Zds1p/2p-dependent localization to cytoplasm promotes mitotic entry; localization to nucleus prevents mitotic exit; required for correct nuclear division, chromosome segregation during achiasmate meiosis; maintains nucleolar sequestration of Cdc14p during early meiosis; limits formation of PP2A-Rts1p holocomplexes to ensure timely dissolution of sister chromosome cohesion; homolog of mammalian B55 +S000031647 CDS YGL190C 7 147389 145809 C 2011-02-03 1996-07-31 +S000003157 ORF Verified YGL189C RPS26A eS26|ribosomal 40S subunit protein S26A|S26e|S26A|RPS26 chromosome 7 L000003256|L000001762 7 148588 148229 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S26, no bacterial homolog; RPS26A has a paralog, RPS26B, that arose from the whole genome duplication; human homolog can partially complement an RPS26A, RPS26B double null mutant; mutations in the human gene are associated with Diamond-Blackfan anemia +S000031468 CDS YGL189C 7 148588 148229 C 2011-02-03 1996-07-31 +S000122100 five_prime_UTR_intron YGL189C 7 148966 148599 C 2011-02-03 2007-04-04 +S000028635 ORF Uncharacterized YGL188C-A chromosome 7 7 148964 148824 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000032391 CDS YGL188C-A 7 148964 148824 C 2011-02-03 2003-07-29 +S000003156 ORF Dubious YGL188C chromosome 7 7 149516 149343 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030546 CDS YGL188C 7 149516 149343 C 2011-02-03 1996-07-31 +S000003155 ORF Verified YGL187C COX4 cytochrome c oxidase subunit IV chromosome 7 L000000386 7 150171 149704 C 2011-02-03 1996-07-31 Subunit IV of cytochrome c oxidase; the terminal member of the mitochondrial inner membrane electron transport chain; precursor N-terminal 25 residues are cleaved during mitochondrial import; phosphorylated; spermidine enhances translation +S000030404 CDS YGL187C 7 150171 149704 C 2011-02-03 1996-07-31 +S000122089 five_prime_UTR_intron YGL187C 7 150525 150184 C 2011-02-03 2007-03-28 +S000003154 ORF Verified YGL186C TPN1 chromosome 7 7 152776 151037 C 2011-02-03 1996-07-31 Plasma membrane pyridoxine (vitamin B6) transporter; member of the purine-cytosine permease subfamily within the major facilitator superfamily; proton symporter with similarity to Fcy21p, Fcy2p, and Fcy22p +S000030268 CDS YGL186C 7 152776 151037 C 2011-02-03 1996-07-31 +S000003153 ORF Uncharacterized YGL185C putative hydroxyacid dehydrogenase chromosome 7 7 154306 153167 C 2011-02-03 1996-07-31 Putative protein with sequence similar to hydroxyacid dehydrogenases; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000037513 CDS YGL185C 7 154306 153167 C 2011-02-03 1996-07-31 +S000003152 ORF Verified YGL184C STR3 cystathionine beta-lyase STR3 chromosome 7 7 156012 154615 C 2011-02-03 1996-07-31 Peroxisomal cystathionine beta-lyase; converts cystathionine into homocysteine; may be redox regulated by Gto1p; involved in the release of the aromatic thiol 3-mercaptohexanol during wine fermentation +S000037385 CDS YGL184C 7 156012 154615 C 2011-02-03 1996-07-31 +S000003151 ORF Verified YGL183C MND1 chromosome 7 7 157285 156543 C 2011-02-03 2003-01-07|1996-07-31 Protein required for recombination and meiotic nuclear division; forms a complex with Hop2p, which is involved in chromosome pairing and repair of meiotic double-strand breaks +S000037289 CDS YGL183C 7 157199 156543 C 2011-02-03 2003-01-07|1996-07-31 +S000037288 CDS YGL183C 7 157285 157283 C 2011-02-03 2003-01-07 +S000037290 intron YGL183C 7 157282 157200 C 2011-02-03 2003-01-07 +S000003150 ORF Dubious YGL182C chromosome 7 7 157596 157273 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MND1/YGL183C +S000036583 CDS YGL182C 7 157596 157273 C 2011-02-03 1996-07-31 +S000003149 ORF Verified YGL181W GTS1 LSR1|FHT1 chromosome 7 L000000743 7 157906 159096 W 2011-02-03 1996-07-31 Protein involved in Arf3p regulation and in transcription regulation; localizes to the nucleus and to endocytic patches; contains an N-terminal Zn-finger and ArfGAP homology domain, a C-terminal glutamine-rich region, and a UBA (ubiquitin associated) domain; gts1 mutations affect budding, cell size, heat tolerance, sporulation, life span, ultradian rhythms, endocytosis; expression oscillates in a pattern similar to metabolic oscillations +S000036556 CDS YGL181W 7 157906 159096 W 2011-02-03 1996-07-31 +S000003148 ORF Verified YGL180W ATG1 serine/threonine protein kinase ATG1|APG1|CVT10|AUT3 chromosome 7 L000003955|S000028502|L000004761 7 160065 162758 W 2011-02-03 1996-07-31 Protein serine/threonine kinase; required for vesicle formation in autophagy and the cytoplasm-to-vacuole targeting (Cvt) pathway; structurally required for phagophore assembly site formation; during autophagy forms a complex with Atg13p and Atg17p; essential for cell cycle progression from G2/M to G1 under nitrogen starvation +S000036454 CDS YGL180W 7 160065 162758 W 2011-02-03 1996-07-31 +S000118453 ARS ARS707 ARSVII-163 chromosome 7 7 163218 163318 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000119020 ARS_consensus_sequence ARS707 7 163236 163250 W 2011-02-03 2006-10-03 +S000003147 ORF Verified YGL179C TOS3 serine/threonine protein kinase TOS3 chromosome 7 7 165091 163409 C 2011-02-03 1996-07-31 Protein kinase; related to and functionally redundant with Elm1p and Sak1p for the phosphorylation and activation of Snf1p; functionally orthologous to LKB1, a mammalian kinase associated with Peutz-Jeghers cancer-susceptibility syndrome; TOS3 has a paralog, SAK1, that arose from the whole genome duplication +S000035343 CDS YGL179C 7 165091 163409 C 2011-02-03 1996-07-31 +S000003146 ORF Verified YGL178W MPT5 UTH4|PUF5|HTR1 chromosome 7 L000001146 7 167352 170571 W 2011-02-03 1996-07-31 mRNA-binding protein of the PUF family; binds to specific mRNAs, often in the 3' UTR; has broad specificity and binds to more than 1000 mRNAs (16% of the transcriptome); recruits the CCR4-NOT deadenylase complex to mRNAs along with Dhh1p and Dcp1p to promote deadenylation, decapping, and decay; also interacts with the Caf20p translational initiation repressor, affecting its mRNA target specificity +S000034396 CDS YGL178W 7 167352 167354 W 2011-02-03 1996-07-31 +S000034397 CDS YGL178W 7 167995 170571 W 2011-02-03 1996-07-31 +S000034398 intron YGL178W 7 167355 167994 W 2011-02-03 1996-07-31 +S000003145 ORF Dubious YGL177W chromosome 7 7 167559 167906 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034289 CDS YGL177W 7 167559 167906 W 2011-02-03 1996-07-31 +S000003144 ORF Uncharacterized YGL176C chromosome 7 7 173079 171415 C 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant is viable and has no detectable phenotype +S000033315 CDS YGL176C 7 173079 171415 C 2011-02-03 1996-07-31 +S000003143 ORF Verified YGL175C SAE2 ssDNA endodeoxyribonuclease SAE2|COM1 chromosome 7 L000002892 7 174322 173285 C 2011-02-03 1996-07-31 Endonuclease required for telomere elongation; required for telomeric 5' C-rich strand resection; involved in ds-break repair and processing hairpin DNA structures with the MRX complex; function requires sumoylation and phosphorylation; exists as inactive oligomers that are transiently released into smaller active units by phosphorylation; DNA damage triggers Sae2p removal, so active Sae2p is present only transiently; sequence and functional similarity with human CtIP/RBBP8 +S000033258 CDS YGL175C 7 174322 173285 C 2011-02-03 1996-07-31 +S000003142 ORF Verified YGL174W BUD13 CWC26 chromosome 7 7 174545 175345 W 2011-02-03 1996-07-31 Subunit of the RES complex; RES complex is required for nuclear pre-mRNA retention and splicing; involved in bud-site selection; diploid mutants display a unipolar budding pattern instead of the wild-type bipolar pattern due to a specific defect in MATa1 pre-mRNA splicing which leads to haploid gene expression in diploids +S000033236 CDS YGL174W 7 174545 175345 W 2011-02-03 1996-07-31 +S000003141 ORF Verified YGL173C XRN1 chromatin-binding exonuclease XRN1|KEM1|SKI1|SEP1|RAR5|DST2 chromosome 7 L000000891|L000001902 7 180113 175527 C -111 2011-02-03 1996-07-31 Evolutionarily-conserved 5'-3' exonuclease; component of cytoplasmic processing (P) bodies involved in mRNA decay; also enters the nucleus and positively regulates transcription initiation and elongation; plays a role in microtubule-mediated processes, filamentous growth, ribosomal RNA maturation, and telomere maintenance; activated by the scavenger decapping enzyme Dcs1p +S000033145 CDS YGL173C 7 180113 175527 C 2011-02-03 1996-07-31 +S000003140 ORF Verified YGL172W NUP49 FG-nucleoporin NUP49|NSP49 chromosome 7 L000001290 7 180700 182118 W 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier; found in stable complex with Nic96p and two other FG-nucleoproteins (Nsp1p and Nup57p) +S000032312 CDS YGL172W 7 180700 182118 W 2011-02-03 1996-07-31 +S000003139 ORF Verified YGL171W ROK1 RNA-dependent ATPase ROK1 chromosome 7 L000003005 7 182390 184084 W 2011-02-03 1996-07-31 RNA-dependent ATPase; involved in pre-rRNA processing at sites A0, A1, and A2, and in control of cell cycle progression; contains two upstream open reading frames (uORFs) in 5' untranslated region which regulate translation +S000032238 CDS YGL171W 7 182390 184084 W 2011-02-03 1996-07-31 +S000003138 ORF Verified YGL170C SPO74 chromosome 7 7 185394 184153 C 2011-02-03 1996-07-31 Component of the meiotic outer plaque of the spindle pole body; involved in modifying the meiotic outer plaque that is required prior to prospore membrane formation +S000032119 CDS YGL170C 7 185394 184153 C 2011-02-03 1996-07-31 +S000006622 tRNA_gene tK(CUU)G2 chromosome 7 L000003852 7 185786 185714 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000029890 noncoding_exon tK(CUU)G2 7 185786 185714 C 2011-02-03 2000-05-19 +S000003137 ORF Verified YGL169W SUA5 threonylcarbamoyladenylate synthase chromosome 7 L000002140 7 186059 187339 W -104.06 2011-02-03 1996-07-31 Protein involved in threonylcarbamoyl adenosine biosynthesis; Sua5p and Qri7p are necessary and sufficient for RNA t6A modification in vitro; null mutant lacks N6-threonylcarbamoyl adenosine (t6A) modification in the anticodon loop of ANN-decoding tRNA; member of conserved YrdC/Sua5 family; binds single-stranded telomeric DNA and null mutant has abnormal telomere length +S000031262 CDS YGL169W 7 186059 187339 W 2011-02-03 1996-07-31 +S000003136 ORF Verified YGL168W HUR1 chromosome 7 7 187464 187796 W 2011-02-03 1996-07-31 Protein of unknown function; reported null mutant phenotype of hydroxyurea sensitivity may be due to effects on overlapping PMR1 gene +S000031124 CDS YGL168W 7 187464 187796 W 2011-02-03 1996-07-31 +S000130163 ARS ARS709 chromosome 7 7 187464 187796 2011-02-03 2009-05-07 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000003135 ORF Verified YGL167C PMR1 Ca(2+)/Mn(2+)-transporting P-type ATPase PMR1|SSC1|LDB1|BSD1 chromosome 7 L000004740|L000001455 7 190468 187616 C -104 2011-02-03 1996-07-31 High affinity Ca2+/Mn2+ P-type ATPase; required for Ca2+ and Mn2+ transport into Golgi; involved in Ca2+ dependent protein sorting, processing; D53A mutant (Mn2+ transporting) is rapamycin sensitive, Q783A mutant (Ca2+ transporting) is rapamycin resistant; Mn2+ transport into Golgi lumen required for rapamycin sensitivity; mutations in human homolog ATP2C1 cause acantholytic skin condition Hailey-Hailey disease; human ATP2C1 can complement yeast null mutant +S000030956 CDS YGL167C 7 190468 187616 C 2011-02-03 1996-07-31 +S000003134 ORF Verified YGL166W CUP2 ACE1 chromosome 7 L000000439 7 191129 191806 W -101 2011-02-03 1996-07-31 Copper-binding transcription factor; activates transcription of the metallothionein genes CUP1-1 and CUP1-2 in response to elevated copper concentrations; required for regulation of copper genes in response to DNA-damaging reagents; CUP2 has a paralog, HAA1, that arose from the whole genome duplication +S000030040 CDS YGL166W 7 191129 191806 W 2011-02-03 1996-07-31 +S000003133 ORF Dubious YGL165C chromosome 7 7 191976 191398 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF CUP2/YGL166W +S000029838 CDS YGL165C 7 191976 191398 C 2011-02-03 1996-07-31 +S000003132 ORF Verified YGL164C YRB30 chromosome 7 7 193300 191978 C 2011-02-03 1996-07-31 RanGTP-binding protein; inhibits RanGAP1 (Rna1p)-mediated GTP hydrolysis of RanGTP (Gsp1p); shares similarity to proteins in other fungi but not in higher eukaryotes +S000037824 CDS YGL164C 7 193300 191978 C 2011-02-03 1996-07-31 +S000003131 ORF Verified YGL163C RAD54 DNA-dependent ATPase RAD54|XRS1 chromosome 7 L000001574 7 196403 193707 C -111 2011-02-03 1996-07-31 DNA-dependent ATPase that stimulates strand exchange; modifies the topology of double-stranded DNA; involved in the recombinational repair of double-strand breaks in DNA during vegetative growth and meiosis; member of the SWI/SNF family of DNA translocases; forms nuclear foci upon DNA replication stress +S000037069 CDS YGL163C 7 196403 193707 C 2011-02-03 1996-07-31 +S000003130 ORF Verified YGL162W SUT1 chromosome 7 L000003483 7 198138 199037 W 2011-02-03 1996-07-31 Zn(II)2Cys6 family transcription factor; positively regulates sterol uptake genes under anaerobic conditions; involved in hypoxic gene expression; represses filamentation-inducing genes during vegetative growth; positively regulates mating with SUT2 by repressing expression of genes that act as mating inhibitors; repressed by STE12; relocalizes from the nucleus to the cytoplasm upon DNA replication stress; SUT1 has a paralog, SUT2, that arose from the whole genome duplication +S000037047 CDS YGL162W 7 198138 199037 W 2011-02-03 1996-07-31 +S000003129 ORF Verified YGL161C YIP5 chromosome 7 7 200142 199210 C 2011-02-03 1996-07-31 Protein that interacts with Rab GTPases; localized to late Golgi vesicles; computational analysis of large-scale protein-protein interaction data suggests a possible role in vesicle-mediated transport +S000036937 CDS YGL161C 7 200142 199210 C 2011-02-03 1996-07-31 +S000003128 ORF Verified YGL160W AIM14 putative metalloreductase|YNO1 chromosome 7 7 200561 202273 W 2011-02-03 1996-07-31 NADPH oxidase localized to the perinuclear ER; produces superoxide from NADPH; overexpression causes MCA1 dependent apoptosis; likely involved in superoxide-mediated regulation of the actin cytoskeleton; member of a conserved superfamily of NADPH oxidases (NOX enzymes); has similarity to iron/copper reductases (FRE1-8), particularly Fre8p +S000036910 CDS YGL160W 7 200561 202273 W 2011-02-03 1996-07-31 +S000003127 ORF Uncharacterized YGL159W chromosome 7 7 202721 203833 W 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant has no detectable phenotype +S000036059 CDS YGL159W 7 202721 203833 W 2011-02-03 1996-07-31 +S000118454 ARS ARS710 ARSVII-204 chromosome 7 7 203914 204155 2011-02-03 2006-08-30|2011-02-03 Autonomously Replicating Sequence +S000119021 ARS_consensus_sequence ARS710 7 203972 203986 W 2011-02-03 2006-10-03 +S000006951 long_terminal_repeat YGLWtau2 chromosome 7 7 204982 205337 W 2011-02-03 2000-05-19 Ty4 LTR +S000006639 tRNA_gene tL(CAA)G1 chromosome 7 L000003821 7 205521 205634 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000034236 intron tL(CAA)G1 7 205559 205590 W 2011-02-03 2000-05-19 +S000034234 noncoding_exon tL(CAA)G1 7 205521 205558 W 2011-02-03 2000-05-19 +S000034235 noncoding_exon tL(CAA)G1 7 205591 205634 W 2011-02-03 2000-05-19 +S000003126 ORF Verified YGL158W RCK1 putative serine/threonine protein kinase RCK1 chromosome 7 L000001592 7 207033 208571 W 2011-02-03 1996-07-31 Protein kinase involved in oxidative stress response; promotes pseudohyphal growth via activation of Ubp3p phosphorylation; identified as suppressor of S. pombe cell cycle checkpoint mutations; RCK1 has a paralog, RCK2, that arose from the whole genome duplication +S000035130 CDS YGL158W 7 207033 208571 W 2011-02-03 1996-07-31 +S000003125 ORF Verified YGL157W ARI1 carbonyl reductase (NADPH-dependent) ARI1 chromosome 7 7 209006 210049 W 2011-02-03 1996-07-31 NADPH-dependent aldehyde reductase; utilizes aromatic and alophatic aldehyde substrates; member of the short-chain dehydrogenase/reductase superfamily +S000034964 CDS YGL157W 7 209006 210049 W 2011-02-03 1996-07-31 +S000003124 ORF Verified YGL156W AMS1 alpha-mannosidase chromosome 7 L000000084 7 210416 213667 W -98 2011-02-03 1996-07-31 Vacuolar alpha mannosidase; involved in free oligosaccharide (fOS) degradation; delivered to the vacuole in a novel pathway separate from the secretory pathway +S000034834 CDS YGL156W 7 210416 213667 W 2011-02-03 1996-07-31 +S000003123 ORF Verified YGL155W CDC43 protein geranylgeranyltransferase type I subunit CDC43|CAL1 chromosome 7 L000000277 7 214081 215211 W -99 2011-02-03 1996-07-31 Beta subunit of geranylgeranyltransferase type I; subunit of the Ram2p-Cdc43p heterodimer that catalyzes the geranylgeranylation of the cysteine residue in proteins containing a C-terminal CaaX sequence ending in Leu or Phe; has substrates important for morphogenesis +S000033923 CDS YGL155W 7 214081 215211 W 2011-02-03 1996-07-31 +S000003122 ORF Verified YGL154C LYS5 holo-[acyl-carrier-protein] synthase chromosome 7 L000000967 7 216096 215278 C -97 2011-02-03 1996-07-31 Phosphopantetheinyl transferase involved in lysine biosynthesis; converts inactive apo-form of Lys2p (alpha-aminoadipate reductase) into catalytically active holo-form by posttranslational addition of phosphopantetheine +S000033755 CDS YGL154C 7 216096 215278 C 2011-02-03 1996-07-31 +S000003121 ORF Verified YGL153W PEX14 chromosome 7 L000004118 7 216273 217298 W 2011-02-03 1996-07-31 Central component of the peroxisomal importomer complex; peroxisomal protein import machinery docking complex component; interacts with both PTS1 (Pex5p) and PTS2 (Pex7p) peroxisomal matrix protein signal recognition factors and membrane receptor Pex13p +S000033715 CDS YGL153W 7 216273 217298 W 2011-02-03 1996-07-31 +S000003120 ORF Dubious YGL152C chromosome 7 7 217369 216692 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF PEX14/YGL153W +S000033004 CDS YGL152C 7 217369 216692 C 2011-02-03 1996-07-31 +S000003119 ORF Verified YGL151W NUT1 SSX4|MED5 chromosome 7 L000003073|S000029517|L000002100 7 217524 220922 W 2011-02-03 1996-07-31 Component of the RNA polymerase II mediator complex; mediator is required for transcriptional activation and also has a role in basal transcription +S000032975 CDS YGL151W 7 217524 220922 W 2011-02-03 1996-07-31 +S000003117 ORF Uncharacterized YGL149W chromosome 7 7 225572 225877 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGL149W is not an essential gene +S000032110 CDS YGL149W 7 225572 225877 W 2011-02-03 1996-07-31 +S000003118 ORF Verified YGL150C INO80 chromatin-remodeling ATPase INO80 chromosome 7 L000004543 7 225573 221104 C 2011-02-03 1996-07-31 ATPase and nucleosome spacing factor; subunit of complex containing actin and actin-related proteins that has chromatin remodeling activity and 3' to 5' DNA helicase activity in vitro; promotes nucleosome shifts in the 3 prime direction; has a role in modulating stress gene transcription +S000032821 CDS YGL150C 7 225573 221104 C 2011-02-03 1996-07-31 +S000003116 ORF Verified YGL148W ARO2 bifunctional chorismate synthase/riboflavin reductase [NAD(P)H] ARO2 chromosome 7 L000000117 7 226399 227529 W -90 2011-02-03 1996-07-31 Bifunctional chorismate synthase and flavin reductase; catalyzes the conversion of 5-enolpyruvylshikimate 3-phosphate (EPSP) to form chorismate, which is a precursor to aromatic amino acids; protein abundance increases in response to DNA replication stress +S000031990 CDS YGL148W 7 226399 227529 W 2011-02-03 1996-07-31 +S000003115 ORF Verified YGL147C RPL9A uL6|ribosomal 60S subunit protein L9A|L6|rp24|YL11|L9A|L8A chromosome 7 L000001708 7 228329 227754 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L9A; homologous to mammalian ribosomal protein L9 and bacterial L6; RPL9A has a paralog, RPL9B, that arose from a single-locus duplication +S000031756 CDS YGL147C 7 228329 227754 C 2011-02-03 1996-07-31 +S000003114 ORF Uncharacterized YGL146C RRT6 chromosome 7 7 229686 228751 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene identified in a screen for mutants with increased levels of rDNA transcription; contains two putative transmembrane spans, but no significant homology to other known proteins +S000030808 CDS YGL146C 7 229686 228751 C 2011-02-03 1996-07-31 +S000003113 ORF Verified YGL145W TIP20 TIP1 chromosome 7 L000002756 7 230243 232348 W 2011-02-03 1996-07-31|2011-02-03 Peripheral membrane protein required for COPI vesicle fusion to the ER; mediates Sey1p-independent homotypic ER fusion; prohibits back-fusion of COPII vesicles with the ER; forms a tethering complex with Sec39p and Dsl1p that interacts with ER SNAREs Sec20p and Use1p +S000030778 CDS YGL145W 7 230243 232348 W 2011-02-03 1996-07-31|2011-02-03 +S000007642 ARS ARS701 ARS137 chromosome 7 7 231907 231981 2011-02-03 2001-03-06 ARS containing only an imperfect match to the core consensus sequence +S000003112 ORF Verified YGL144C ROG1 putative lipase ROG1 chromosome 7 7 234507 232450 C 2011-02-03 1996-07-31 Lipase with specificity for monoacylglycerol; preferred substrate is 1-oleoylglycerol; null mutation affects lipid droplet morphology and overexpression causes increased accumulation of reactive oxygen species +S000030591 CDS YGL144C 7 234507 232450 C 2011-02-03 1996-07-31 +S000003111 ORF Verified YGL143C MRF1 chromosome 7 L000001150 7 235958 234717 C 2011-02-03 1996-07-31 Mitochondrial translation release factor; involved in stop codon recognition and hydrolysis of the peptidyl-tRNA bond during mitochondrial translation; lack of MRF1 causes mitochondrial genome instability +S000037757 CDS YGL143C 7 235958 234717 C 2011-02-03 1996-07-31 +S000003110 ORF Verified YGL142C GPI10 putative glycosylphosphatidylinositol-alpha 1,2 mannosyltransferase chromosome 7 L000004297 7 238119 236269 C 2011-02-03 1996-07-31 Integral membrane protein involved in GPI anchor synthesis; putative alpha 1,2 mannosyltransferase required for addition of the third mannose onto the glycosylphosphatidylinositol (GPI) core structure; human PIG-Bp is a functional homolog +S000037696 CDS YGL142C 7 238119 236269 C 2011-02-03 1996-07-31 +S000003109 ORF Verified YGL141W HUL5 ubiquitin-ubiquitin ligase HUL5 chromosome 7 7 238353 241085 W 2011-02-03 1996-07-31 Multiubiquitin chain assembly factor (E4); proteasome processivity factor that elongates polyUb chains on substrates, opposing Ubp6p, a branched polyubiquitin protease; required for retrograde transport of misfolded proteins during ERAD; required for ubiquitination of a subset of cytosolic misfolded proteins upon heat shock +S000037673 CDS YGL141W 7 238353 241085 W 2011-02-03 1996-07-31 +S000130164 ARS ARS712 chromosome 7 7 241085 241353 2011-02-03 2009-05-07 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000003108 ORF Uncharacterized YGL140C chromosome 7 7 245012 241353 C 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; contains multiple predicted transmembrane domains +S000037564 CDS YGL140C 7 245012 241353 C 2011-02-03 1996-07-31 +S000003107 ORF Verified YGL139W FLC3 putative flavin adenine dinucleotide transporter|HUF3 chromosome 7 7 245716 248124 W 2011-02-03 1996-07-31 Putative FAD transporter, similar to Flc1p and Flc2p; localized to the ER; FLC3 has a paralog, FLC1, that arose from the whole genome duplication +S000037900 CDS YGL139W 7 245716 248124 W 2011-02-03 1996-07-31 +S000003106 ORF Uncharacterized YGL138C chromosome 7 7 249531 248494 C 2011-02-03 1996-07-31 Putative protein of unknown function; has no significant sequence similarity to any known protein +S000036000 CDS YGL138C 7 249531 248494 C 2011-02-03 1996-07-31 +S000003105 ORF Verified YGL137W SEC27 coatomer subunit beta' chromosome 7 L000001848 7 249869 252738 W 2011-02-03 1996-07-31 Essential beta'-coat protein of the COPI coatomer; involved in ER-to-Golgi and Golgi-to-ER transport; contains WD40 domains that mediate cargo selective interactions; 45% sequence identity to mammalian beta'-COP +S000035921 CDS YGL137W 7 249869 249886 W 2011-02-03 1996-07-31 +S000035922 CDS YGL137W 7 250087 252738 W 2011-02-03 1996-07-31 +S000035923 intron YGL137W 7 249887 250086 W 2011-02-03 1996-07-31 +S000003104 ORF Verified YGL136C MRM2 21S rRNA (uridine2791-2'-O) methyltransferase chromosome 7 7 253859 252897 C 2011-02-03 1996-07-31 Mitochondrial 2' O-ribose methyltransferase; required for methylation of U(2791) in 21S rRNA; MRM2 deletion confers thermosensitive respiration and loss of mitochondrial DNA; has similarity to Spb1p and Trm7p, and to E. coli FtsJ/RrmJ +S000035725 CDS YGL136C 7 253859 252897 C 2011-02-03 1996-07-31 +S000003103 ORF Verified YGL135W RPL1B uL1|ribosomal 60S subunit protein L1B|L1|L1B|SSM2 chromosome 7 L000002658 7 254641 255294 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L1B; N-terminally acetylated; homologous to mammalian ribosomal protein L10A and bacterial L1; RPL1B has a paralog, RPL1A, that arose from the whole genome duplication; rpl1a rpl1b double null mutation is lethal +S000035683 CDS YGL135W 7 254641 255294 W 2011-02-03 1996-07-31 +S000003102 ORF Verified YGL134W PCL10 chromosome 7 L000004042 7 255663 256964 W 2011-02-03 1996-07-31 Pho85p cyclin; recruits, activates, and targets Pho85p cyclin-dependent protein kinase to its substrate; PCL10 has a paralog, PCL8, that arose from the whole genome duplication +S000034682 CDS YGL134W 7 255663 256964 W 2011-02-03 1996-07-31 +S000003101 ORF Verified YGL133W ITC1 chromosome 7 7 257707 261501 W 2011-02-03 1996-07-31 Subunit of ATP-dependent Isw2p-Itc1p chromatin remodeling complex; required for repression of a-specific genes, repression of early meiotic genes during mitotic growth, and repression of INO1; similar to mammalian Acf1p, the regulatory subunit of the mammalian ATP-utilizing chromatin assembly and modifying factor (ACF) complex; ITC1 has a paralog, YPL216W, that arose from the whole genome duplication +S000034589 CDS YGL133W 7 257707 261501 W 2011-02-03 1996-07-31 +S000003100 ORF Dubious YGL132W chromosome 7 7 261580 261915 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene SNT2/YGL131C +S000034500 CDS YGL132W 7 261580 261915 W 2011-02-03 1996-07-31 +S000003099 ORF Verified YGL131C SNT2 DNA-binding E3 ubiquitin-protein ligase SNT2 chromosome 7 7 265859 261648 C 2011-02-03 1996-07-31 Subunit of Snt2C complex, RING finger ubiquitin ligase (E3); physically associates with Ecm5p and Rpd3p; along with Ecm5p, recruits Rpd3p to small number of promoters; colocalizes with Ecm5p, independently of Rpd3p, to promoters of stress response genes upon oxidative stress; involved in ubiquitination, degradation of excess histones; interacts with Ubc4p; role in regulating genes encoding amine transporters; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000033546 CDS YGL131C 7 265859 261648 C 2011-02-03 1996-07-31 +S000003098 ORF Verified YGL130W CEG1 mRNA guanylyltransferase chromosome 7 L000000291 7 266145 267524 W 2011-02-03 1996-07-31 Guanylyltransferase involved in mRNA 5' capping; subunit of mRNA capping enzyme, which is a heterotetramer composed of two molecules of Ceg1p and a homodimer of Cet1p, the mRNA 5'-triphosphatase subunit; nuclear import of Ceg1p requires interaction with Cet1p; mammalian capping enzyme is a single bifunctional polypeptide; human homolog RNGTT can complement yeast ceg1 null mutant +S000033518 CDS YGL130W 7 266145 267524 W 2011-02-03 1996-07-31 +S000003097 ORF Verified YGL129C RSM23 mitochondrial 37S ribosomal protein RSM23 chromosome 7 7 269075 267723 C 2011-02-03 1996-07-31|2011-02-03 Mitochondrial ribosomal protein of the small subunit; has similarity to mammalian apoptosis mediator proteins; null mutation prevents induction of apoptosis by overproduction of metacaspase Mca1p +S000033944 CDS YGL129C 7 269075 267723 C 2011-02-03 1996-07-31|2011-02-03 +S000003096 ORF Verified YGL128C CWC23 U2-type spliceosomal complex subunit CWC23 chromosome 7 7 270144 269293 C 2011-02-03 2003-09-22|1996-07-31 Component of a complex containing Cef1p; putatively involved in pre-mRNA splicing; has similarity to E. coli DnaJ and other DnaJ-like proteins and to S. pombe Cwf23p +S000033837 CDS YGL128C 7 270144 269293 C 2011-02-03 2003-09-22|1996-07-31 +S000003095 ORF Verified YGL127C SOH1 MED31 chromosome 7 L000001982 7 270775 270392 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; involved in telomere maintenance; conserved with other metazoan MED31 subunits +S000033696 CDS YGL127C 7 270775 270392 C 2011-02-03 1996-07-31 +S000003094 ORF Verified YGL126W SCS3 FIT2B chromosome 7 L000002845 7 270997 272139 W 2011-02-03 1996-07-31 Protein required for inositol prototrophy; required for normal ER membrane biosynthesis; ortholog of the FIT family of proteins involved in triglyceride droplet biosynthesis and homologous to human FIT2; disputed role in the synthesis of inositol phospholipids from inositol +S000033638 CDS YGL126W 7 270997 272139 W 2011-02-03 1996-07-31 +S000003093 ORF Verified YGL125W MET13 methylenetetrahydrofolate reductase (NAD(P)H) MET13|MRPL45|MET11 chromosome 7 L000003570|L000001085 7 272520 274322 W -77 2011-02-03 2003-01-06|1996-07-31 Major isozyme of methylenetetrahydrofolate reductase; catalyzes the reduction of 5,10-methylenetetrahydrofolate to 5-methyltetrahydrofolate in the methionine biosynthesis pathway +S000030346 CDS YGL125W 7 272520 274322 W 2011-02-03 2003-01-06|1996-07-31 +S000003092 ORF Verified YGL124C MON1 AUT12 chromosome 7 7 276714 274780 C 2011-02-03 1996-07-31|2011-02-03 Subunit of a heterodimeric guanine nucleotide exchange factor (GEF); subunit of the Mon1-Ccz1 GEF complex which stimulates nucleotide exchange and activation of Ypt7p, a Rab family GTPase involved in membrane tethering and fusion events at the late endosome and vacuole; GEF activity is stimulated by membrane association and anionic phospholipids; role in localizing Ypt7p to the vacuolar membrane; required for autophagy, the CVT pathway and mitophagy; potential Cdc28 substrate +S000030087 CDS YGL124C 7 276714 274780 C 2011-02-03 1996-07-31|2011-02-03 +S000003091 ORF Verified YGL123W RPS2 uS5|ribosomal 40S subunit protein S2|rp12|Ys5|S5|S4|S2|SUP138|SUP44|SUP38|RPS4 chromosome 7 L000002205 7 277617 278381 W -72 2011-02-03 1996-07-31 Protein component of the small (40S) subunit; essential for control of translational accuracy; phosphorylation by C-terminal domain kinase I (CTDK-I) enhances translational accuracy; methylated on one or more arginine residues by Hmt1p; homologous to mammalian ribosomal protein S2 and bacterial S5 +S000030054 CDS YGL123W 7 277617 278381 W 2011-02-03 1996-07-31 +S000028634 ORF Dubious YGL123C-A chromosome 7 7 277864 277634 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene RPS2/YGL123W +S000032390 CDS YGL123C-A 7 277864 277634 C 2011-02-03 2003-07-29 +S000003090 ORF Verified YGL122C NAB2 mRNA-binding protein NAB2 chromosome 7 L000001227 7 280523 278946 C 2011-02-03 1996-07-31 Nuclear polyadenylated RNA-binding protein; required for nuclear mRNA export and poly(A) tail length control; stimulates RNA polymerase III transcription by enhancing TFIIIB binding to promoters; protects mRNA against decay by the nuclear exosome in a poly(A)-tail-dependent manner; involved in forming export-competent mRNPs in the nucleus; autoregulates mRNA levels; NLS binds Kap104p; protein abundance increases under DNA replication stress; related to human hnRNPs +S000037370 CDS YGL122C 7 280523 278946 C 2011-02-03 1996-07-31 +S000003089 ORF Verified YGL121C GPG1 chromosome 7 7 281157 280777 C 2011-02-03 1996-07-31 Proposed gamma subunit of the heterotrimeric G protein; interacts with the receptor Gpr1p; involved in regulation of pseudohyphal growth; requires Gpb1p or Gpb2p to interact with Gpa2p; overproduction causes prion curing +S000037311 CDS YGL121C 7 281157 280777 C 2011-02-03 1996-07-31 +S000003088 ORF Verified YGL120C PRP43 DEAH-box ATP-dependent RNA helicase PRP43|JA1 chromosome 7 L000003359 7 283937 281634 C 2011-02-03 1996-07-31 RNA helicase in the DEAH-box family; functions in both RNA polymerase I and polymerase II transcript metabolism; catalyzes removal of U2, U5, and U6 snRNPs from the postsplicing lariat-intron ribonucleoprotein complex; required for efficient biogenesis of both small- and large-subunit rRNAs; acts with Sqs1p to promote 20S to 18S rRNA processing catalyzed by endonuclease Nob1p +S000037207 CDS YGL120C 7 283937 281634 C 2011-02-03 1996-07-31 +S000003087 ORF Verified YGL119W COQ8 protein kinase COQ8|ABC1 chromosome 7 L000000010 7 284442 285947 W 2011-02-03 1996-07-31 ATPase required for ubiquinone biosynthesis and respiratory growth; maintains levels of CoQ biosynthetic proteins; binds to CoQ biosynthesis intermediates; UbiB protein kinase-like family member that lacks canonical protein kinase activity; similar to prokaryotic proteins involved in ubiquinone biosynthesis; human homolog ADCK3 complements a coq8 null, is associated with CoQ and respiratory-chain deficiencies, and is mutated in autosomal-recessive cerebellar ataxia type 2 +S000037639 CDS YGL119W 7 284442 285947 W 2011-02-03 1996-07-31 +S000118455 ARS ARS714 ARSVII-286 chromosome 7 7 285991 286081 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000119022 ARS_consensus_sequence ARS714 7 286004 286018 W 2011-02-03 2006-10-03 +S000006771 tRNA_gene tW(CCA)G1 chromosome 7 L000003851 7 287455 287350 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis +S000032524 intron tW(CCA)G1 7 287419 287386 C 2011-02-03 2000-05-19 +S000032523 noncoding_exon tW(CCA)G1 7 287385 287350 C 2011-02-03 2000-05-19 +S000032522 noncoding_exon tW(CCA)G1 7 287455 287420 C 2011-02-03 2000-05-19 +S000003086 ORF Uncharacterized YGL118C chromosome 7 7 288451 288014 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGL118C is not an essential gene +S000037518 CDS YGL118C 7 288451 288014 C 2011-02-03 1996-07-31 +S000130165 ARS ARS715 chromosome 7 7 288451 288512 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000003085 ORF Uncharacterized YGL117W chromosome 7 7 288512 289309 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000037461 CDS YGL117W 7 288512 289309 W 2011-02-03 1996-07-31 +S000003084 ORF Verified YGL116W CDC20 ubiquitin-protein transferase activating protein CDC20|PAC5 chromosome 7 L000000259 7 289809 291641 W -70 2011-02-03 1996-07-31 Activator of anaphase-promoting complex/cyclosome (APC/C); APC/C is required for metaphase/anaphase transition; directs ubiquitination of mitotic cyclins, Pds1p, and other anaphase inhibitors; cell-cycle regulated; potential Cdc28p substrate; relative distribution to the nucleus increases upon DNA replication stress +S000032000 CDS YGL116W 7 289809 291641 W 2011-02-03 1996-07-31 +S000003083 ORF Verified YGL115W SNF4 AMP-activated serine/threonine-protein kinase regulatory subunit SNF4|SCI1|CAT3 chromosome 7 L000001947 7 292033 293001 W 2011-02-03 1996-07-31 Activating gamma subunit of the AMP-activated Snf1p kinase complex; additional subunits of the complex are Snf1p and a Sip1p/Sip2p/Gal83p family member; activates glucose-repressed genes, represses glucose-induced genes; role in sporulation, and peroxisome biogenesis; protein abundance increases in response to DNA replication stress +S000031879 CDS YGL115W 7 292033 293001 W 2011-02-03 1996-07-31 +S000003082 ORF Uncharacterized YGL114W OPT3 chromosome 7 7 293460 295637 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted member of the oligopeptide transporter (OPT) family of membrane transporters +S000031734 CDS YGL114W 7 293460 295637 W 2011-02-03 1996-07-31 +S000003081 ORF Verified YGL113W SLD3 chromosome 7 7 295932 297938 W 2011-02-03 1996-07-31 Protein involved in the initiation of DNA replication; required for proper assembly of replication proteins at the origins of replication; interacts with Cdc45p; localizes to nuclear foci that become diffuse upon DNA replication stress; homologous to the human Treslin/Ticrr protein +S000036243 CDS YGL113W 7 295932 297938 W 2011-02-03 1996-07-31 +S000003080 ORF Verified YGL112C TAF6 TafII60|TAF60 chromosome 7 L000002828 7 299728 298178 C 2011-02-03 1996-07-31 Subunit (60 kDa) of TFIID and SAGA complexes; involved in transcription initiation of RNA polymerase II and in chromatin modification, similar to histone H4; relocalizes to the cytosol in response to hypoxia +S000036054 CDS YGL112C 7 299728 298178 C 2011-02-03 1996-07-31 +S000003079 ORF Verified YGL111W NSA1 ribosome biosynthesis protein NSA1 chromosome 7 7 299978 301369 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; involved in 60S ribosomal subunit biogenesis +S000035260 CDS YGL111W 7 299978 301369 W 2011-02-03 1996-07-31 +S000003078 ORF Verified YGL110C CUE3 chromosome 7 7 303411 301537 C 2011-02-03 1996-07-31 Protein of unknown function; has a CUE domain that binds ubiquitin, which may facilitate intramolecular monoubiquitination +S000035107 CDS YGL110C 7 303411 301537 C 2011-02-03 1996-07-31 +S000003077 ORF Dubious YGL109W chromosome 7 7 303513 303836 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the uncharacterized gene YGL108C +S000034172 CDS YGL109W 7 303513 303836 W 2011-02-03 1996-07-31|2011-02-03 +S000003076 ORF Verified YGL108C chromosome 7 7 304071 303649 C 2011-02-03 1996-07-31 Protein of unknown function, predicted to be palmitoylated; SWAT-GFP, seamless-GFP and mCherry C-terminal fusion proteins localize to the cytosol, while N-terminal GFP fusion protein localizes to the cell periphery; protein abundance increases in response to DNA replication stress +S000034006 CDS YGL108C 7 304071 303649 C 2011-02-03 1996-07-31 +S000003075 ORF Verified YGL107C RMD9 chromosome 7 7 306273 304333 C 2011-02-03 1996-07-31 Mitochondrial protein required for respiratory growth; mutant phenotype and genetic interactions suggest a role in delivering mt mRNAs to ribosomes; located on matrix face of the inner membrane and loosely associated with mitoribosomes; RMD9 has a paralog, YBR238C, that arose from the whole genome duplication +S000033204 CDS YGL107C 7 306273 304333 C 2011-02-03 1996-07-31 +S000003074 ORF Verified YGL106W MLC1 chromosome 7 L000004170 7 306560 307009 W 2011-02-03 1996-07-31 Essential light chain for Myo1p; light chain for Myo2p; stabilizes Myo2p by binding to the neck region; interacts with Myo1p, Iqg1p, and Myo2p to coordinate formation and contraction of the actomyosin ring with targeted membrane deposition +S000033181 CDS YGL106W 7 306560 307009 W 2011-02-03 1996-07-31 +S000003073 ORF Verified YGL105W ARC1 chromosome 7 L000003553 7 307437 308567 W 2011-02-03 1996-07-31 Protein that binds tRNA and methionyl- and glutamyl-tRNA synthetases; involved in tRNA delivery, stimulating catalysis, and ensuring localization; also binds quadruplex nucleic acids; protein abundance increases in response to DNA replication stress; methionyl-tRNA synthetase is Mes1p; glutamyl-tRNA synthetase is Gus1p +S000033089 CDS YGL105W 7 307437 308567 W 2011-02-03 1996-07-31 +S000003072 ORF Verified YGL104C VPS73 putative sugar transporter chromosome 7 7 310173 308713 C 2011-02-03 1996-07-31 Mitochondrial protein; mutation affects vacuolar protein sorting; putative transporter; member of the sugar porter family; VPS73 has a paralog, YBR241C, that arose from the whole genome duplication +S000032120 CDS YGL104C 7 310173 308713 C 2011-02-03 1996-07-31 +S000003071 ORF Verified YGL103W RPL28 uL15|ribosomal 60S subunit protein L28|L15|rp44|YL24|L29|L28|CYH2 chromosome 7 L000000454 7 310967 311927 W -64 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L28; homologous to mammalian ribosomal protein L27A and bacterial L15; may have peptidyl transferase activity; can mutate to cycloheximide resistance +S000032088 CDS YGL103W 7 310967 311015 W 2011-02-03 1996-07-31 +S000032089 CDS YGL103W 7 311527 311927 W 2011-02-03 1996-07-31 +S000032090 intron YGL103W 7 311016 311526 W 2011-02-03 1996-07-31 +S000003070 ORF Dubious YGL102C chromosome 7 7 311933 311505 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 3' end of essential RPL28 gene encoding a large subunit ribosomal protein +S000031837 CDS YGL102C 7 311933 311505 C 2011-02-03 1996-07-31 +S000003069 ORF Uncharacterized YGL101W chromosome 7 7 312193 312840 W 2011-02-03 1996-07-31 Protein of unknown function; non-essential gene; interacts with the DNA helicase Hpr5p; YGL101W has a paralog, YBR242W, that arose from the whole genome duplication +S000031742 CDS YGL101W 7 312193 312840 W 2011-02-03 1996-07-31 +S000003068 ORF Verified YGL100W SEH1 chromosome 7 L000003153 7 313234 314283 W 2011-02-03 1996-07-31 Subunit of the Nup84 nuclear pore and SEACAT subcomplexes; involved in nucleocytoplasmic transport and NPC biogenesis in the nuclear pore subcomplex; subunit of SEACAT, a subcomplex of the SEA complex that inhibits the TORC1 inhibitory role of SEACIT (Iml1p-Npr2p-Npr3p), a GAP for Gtr1p in response to amino acid limitation, thereby resulting in activation of TORC1 signaling; SEA is a coatomer-related complex that associates dynamically with the vacuole; human SEH1 homolog +S000030802 CDS YGL100W 7 313234 314283 W 2011-02-03 1996-07-31 +S000003067 ORF Verified YGL099W LSG1 putative GTPase LSG1|KRE35 chromosome 7 7 314631 316553 W 2011-02-03 1996-07-31 Putative GTPase involved in 60S ribosomal subunit biogenesis; required for the release of Nmd3p from 60S subunits in the cytoplasm +S000032465 CDS YGL099W 7 314631 316553 W 2011-02-03 1996-07-31 +S000028467 snoRNA_gene snR82 SNR82 RUF2 chromosome 7 7 316788 317055 W 2011-02-03 2003-03-06 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at positions U1110, U2349, and U2351 +S000030074 noncoding_exon snR82 7 316788 317055 W 2011-02-03 2003-03-06 +S000003066 ORF Verified YGL098W USE1 SNAP receptor USE1|SLT1 chromosome 7 7 317342 318079 W 2011-02-03 1996-07-31 Essential SNARE protein localized to the ER; involved in retrograde traffic from the Golgi to the ER and Sey1p-independent homotypic ER fusion; required for efficient nuclear fusion during mating; forms a complex with the SNAREs Sec22p, Sec20p and Ufe1p +S000032364 CDS YGL098W 7 317342 318079 W 2011-02-03 1996-07-31 +S000006942 long_terminal_repeat YGLWdelta4 chromosome 7 7 318697 318860 W 2011-02-03 2000-05-19 Ty1 LTR +S000006936 long_terminal_repeat YGLCdelta5 chromosome 7 7 319341 319009 C 2011-02-03 2000-05-19 Ty1 LTR +S000006937 long_terminal_repeat YGLCsigma1 chromosome 7 7 319762 319423 C 2011-02-03 2000-05-19 Ty3 LTR +S000006596 tRNA_gene tH(GUG)G2 chromosome 7 L000003853 7 319781 319852 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000036200 noncoding_exon tH(GUG)G2 7 319781 319852 W 2011-02-03 2000-05-19 +S000006939 long_terminal_repeat YGLCtau3 chromosome 7 7 320707 320355 C 2011-02-03 2000-05-19 Ty4 LTR +S000003065 ORF Verified YGL097W SRM1 Ran guanyl-nucleotide exchange factor|TSM437|PRP20|MTR1 chromosome 7 L000002058|L000001216|S000029621|L000002370 7 321782 323230 W 2011-02-03 1996-07-31 Nucleotide exchange factor for Gsp1p; localizes to the nucleus, required for nucleocytoplasmic trafficking of macromolecules; suppressor of the pheromone response pathway; potentially phosphorylated by Cdc28p; human homolog of the RAN GEF, RCC1, can complement a temperature sensitive point mutant +S000032259 CDS YGL097W 7 321782 323230 W 2011-02-03 1996-07-31 +S000003064 ORF Verified YGL096W TOS8 chromosome 7 7 325331 326161 W 2011-02-03 1996-07-31 Homeodomain-containing protein and putative transcription factor; found associated with chromatin; target of SBF transcription factor; induced during meiosis and under cell-damaging conditions; TOS8 has a paralog, CUP9, that arose from the whole genome duplication +S000031260 CDS YGL096W 7 325331 326161 W 2011-02-03 1996-07-31 +S000006943 long_terminal_repeat YGLWdelta6 chromosome 7 7 327904 328224 W 2011-02-03 2000-05-19 Ty1 LTR +S000006553 tRNA_gene tE(UUC)G1 SOE1 chromosome 7 L000003823|L000001980 7 328583 328654 W -63 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; can mutate to become a missense suppressor tRNA that inserts glutamate residues at lysine codons; target of K. lactis zymocin +S000034645 noncoding_exon tE(UUC)G1 7 328583 328654 W 2011-02-03 2000-05-19 +S000003063 ORF Verified YGL095C VPS45 VPL28|STT10 chromosome 7 L000002478 7 330607 328874 C 2011-02-03 1996-07-31 Protein of the Sec1p/Munc-18 family; essential for vacuolar protein sorting; required for the function of Pep12p and the early endosome/late Golgi SNARE Tlg2p; essential for fusion of Golgi-derived vesicles with the prevacuolar compartment +S000031062 CDS YGL095C 7 330607 328874 C 2011-02-03 1996-07-31 +S000003062 ORF Verified YGL094C PAN2 poly(A)-specific ribonuclease chromosome 7 L000003115 7 334465 331118 C 2011-02-03 1996-07-31 Catalytic subunit of the Pan2p-Pan3p poly(A)-ribonuclease complex; complex acts to control poly(A) tail length and regulate the stoichiometry and activity of postreplication repair complexes +S000030953 CDS YGL094C 7 334465 331118 C 2011-02-03 1996-07-31 +S000003061 ORF Verified YGL093W SPC105 chromosome 7 L000004697 7 334886 337639 W 2011-02-03 1996-07-31 Subunit of a kinetochore-microtubule binding complex; complex bridges centromeric heterochromatin and kinetochore MAPs and motors; required for sister chromatid bi-orientation and kinetochore binding of SAC components; complex also includes Kre28p; modified by sumoylation +S000030038 CDS YGL093W 7 334886 337639 W 2011-02-03 1996-07-31 +S000003060 ORF Verified YGL092W NUP145 nucleocytoplasmic transporter NUP145|RAT10 chromosome 7 L000001294 7 337906 341859 W 2011-02-03 1996-07-31 Essential protein with distinct roles in two nuclear pore subcomplexes; catalyzes its own proteolytic cleavage in vivo to generate a C-terminal fragment that is a structural component of the Nup84p subcomplex (with roles in NPC biogenesis and localization of genes to the nuclear periphery), and an N-terminal fragment that is one of several FG-nucleoporins within the NPC central core directly responsible for nucleocytoplasmic transport; homologous to human NUP98 +S000029907 CDS YGL092W 7 337906 341859 W 2011-02-03 1996-07-31 +S000003059 ORF Verified YGL091C NBP35 Fe-S cluster-binding ATPase chromosome 7 L000003338 7 343042 342056 C 2011-02-03 1996-07-31 Essential cytoplasmic iron-sulfur cluster binding protein; forms a complex with Cfd1p that is involved in iron-sulfur protein assembly in the cytosol; similar to P-loop NTPases +S000037170 CDS YGL091C 7 343042 342056 C 2011-02-03 1996-07-31 +S000003058 ORF Verified YGL090W LIF1 chromosome 7 L000004541 7 343319 344584 W 2011-02-03 1996-07-31 Component of the DNA ligase IV complex; this complex mediates nonhomologous end joining in DNA double-strand break repair; physically interacts with Dnl4p and Nej1p; homologous to mammalian XRCC4 protein +S000037116 CDS YGL090W 7 343319 344584 W 2011-02-03 1996-07-31 +S000003057 ORF Verified YGL089C MF(ALPHA)2 chromosome 7 L000001095 7 345153 344791 C -58 2011-02-03 1996-07-31 Mating pheromone alpha-factor, made by alpha cells; interacts with mating type a cells to induce cell cycle arrest and other responses leading to mating; also encoded by MF(ALPHA)1, which is more highly expressed; binds copper(II) ions +S000036327 CDS YGL089C 7 345153 344791 C 2011-02-03 1996-07-31 +S000003056 ORF Dubious YGL088W chromosome 7 7 345836 346201 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps snR10, a snoRNA required for preRNA processing +S000036288 CDS YGL088W 7 345836 346201 W 2011-02-03 1996-07-31 +S000007499 snoRNA_gene snR10 SNR10 chromosome 7 7 345986 346230 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); essential gene required for for preRNA processing, specifically for cleavage at sites A1 and A2; also guides pseudouridylation of large subunit (LSU) rRNA at position U2923 +S000036589 noncoding_exon snR10 7 345986 346230 W 2011-02-03 2000-05-19 +S000003055 ORF Verified YGL087C MMS2 E2 ubiquitin-conjugating protein MMS2 chromosome 7 L000004015 7 346904 346406 C 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme variant; involved in error-free postreplication repair; forms a heteromeric complex with Ubc13p, an active ubiquitin-conjugating enzyme; cooperates with chromatin-associated RING finger proteins, Rad18p and Rad5p; protein abundance increases in response to DNA replication stress +S000036106 CDS YGL087C 7 346808 346406 C 2011-02-03 1996-07-31 +S000036105 CDS YGL087C 7 346904 346894 C 2011-02-03 1996-07-31 +S000036107 intron YGL087C 7 346893 346809 C 2011-02-03 1996-07-31 +S000003054 ORF Verified YGL086W MAD1 coiled-coil domain-containing protein MAD1 chromosome 7 L000000974 7 347119 349368 W 2011-02-03 1996-07-31 Coiled-coil protein involved in spindle-assembly checkpoint; required for inhibition of karyopherin/importin Pse1p (aka Kap121p) upon spindle assembly checkpoint arrest; phosphorylated by Mps1p upon checkpoint activation which leads to inhibition of anaphase promoting complex activity; forms a complex with Mad2p; gene dosage imbalance between MAD1 and MAD2 leads to chromosome instability +S000035277 CDS YGL086W 7 347119 349368 W 2011-02-03 1996-07-31 +S000003053 ORF Uncharacterized YGL085W LCL3 chromosome 7 7 349616 350440 W 2011-02-03 1996-07-31 Putative protein of unknown function; mutant has long chronological lifespan; has homology to Staphylococcus aureus nuclease; GFP-fusion protein localizes to mitochondria; is induced in response to the DNA-damaging agent MMS +S000035126 CDS YGL085W 7 349616 350440 W 2011-02-03 1996-07-31 +S000003052 ORF Verified YGL084C GUP1 O-acyltransferase chromosome 7 L000004739 7 352298 350616 C 2011-02-03 1996-07-31 Plasma membrane protein involved in remodeling GPI anchors; member of the MBOAT family of putative membrane-bound O-acyltransferases; role in misfolded protein quality control; proposed to be involved in glycerol transport; homolog of the mammalian Hedgehog pathway modulator HHATL; GUP1 has a paralog, GUP2, that arose from the whole genome duplication +S000034877 CDS YGL084C 7 352298 350616 C 2011-02-03 1996-07-31 +S000118456 ARS ARS716 ARSVII-353 chromosome 7 7 352760 352906 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178100 ARS_consensus_sequence ARS716 7 352865 352849 C 2014-11-18 2014-11-18 +S000003051 ORF Verified YGL083W SCY1 chromosome 7 L000003258 7 353058 355472 W 2011-02-03 1996-07-31 Putative kinase; suppressor of GTPase mutant; similar to bovine rhodopsin kinase; may have a role in intracellular sterol transport +S000034832 CDS YGL083W 7 353058 355472 W 2011-02-03 1996-07-31 +S000003050 ORF Uncharacterized YGL082W chromosome 7 7 355827 356972 W 2011-02-03 1996-07-31 Putative protein of unknown function; predicted prenylation/proteolysis target of Afc1p and Rce1p; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and nucleus; not an essential gene; YGL082W has a paralog, YPL191C, that arose from the whole genome duplication +S000033922 CDS YGL082W 7 355827 356972 W 2011-02-03 1996-07-31 +S000003049 ORF Uncharacterized YGL081W chromosome 7 7 357377 358339 W 2011-02-03 1996-07-31 Putative protein of unknown function; non-essential gene; interacts genetically with CHS5, a gene involved in chitin biosynthesis +S000033825 CDS YGL081W 7 357377 358339 W 2011-02-03 1996-07-31 +S000003048 ORF Verified YGL080W MPC1 pyruvate transporter MPC1|FMP37 chromosome 7 7 358636 359028 W 2011-02-03 1996-07-31 Highly conserved subunit of mitochondrial pyruvate carrier (MPC); MPC is a mitochondrial inner membrane complex that mediates pyruvate uptake and comprises Mpc1p and Mpc2p during fermentative growth, or Mcp1p and Mpc3p during respiratory growth; null mutant displays slow growth that is complemented by expression of human or mouse ortholog; mutation in human ortholog MPC1 is associated with lactic acidosis and hyperpyruvatemia +S000033711 CDS YGL080W 7 358636 359028 W 2011-02-03 1996-07-31 +S000003047 ORF Verified YGL079W KXD1 KIB1 chromosome 7 7 359444 360100 W 2011-02-03 1996-07-31 Subunit of the BLOC-1 complex involved in endosomal maturation; null mutant is sensitive to drug inducing secretion of vacuolar cargo; GFP-fusion protein localizes to the endosome +S000034302 CDS YGL079W 7 359444 360100 W 2011-02-03 1996-07-31 +S000003046 ORF Verified YGL078C DBP3 RNA-dependent ATPase DBP3 chromosome 7 L000000494 7 361859 360288 C 2011-02-03 1996-07-31 RNA-Dependent ATPase, member of DExD/H-box family; involved in cleavage of site A3 within the ITS1 spacer during rRNA processing; not essential for growth, but deletion causes severe slow-growth phenotype +S000034146 CDS YGL078C 7 361859 360288 C 2011-02-03 1996-07-31 +S000003045 ORF Verified YGL077C HNM1 CTR1 chromosome 7 L000000433|L000000795 7 363916 362225 C 2011-02-03 1996-07-31 Plasma membrane transporter for choline, ethanolamine, and carnitine; involved in the uptake of nitrogen mustard and the uptake of glycine betaine during hypersaline stress; co-regulated with phospholipid biosynthetic genes and negatively regulated by choline and myo-inositol +S000034066 CDS YGL077C 7 363916 362225 C 2011-02-03 1996-07-31 +S000007302 snoRNA_gene snR39 SNR39 chromosome 7 L000003054 7 365251 365163 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A807 +S000036769 noncoding_exon snR39 7 365251 365163 C 2011-02-03 2000-05-19 +S000003044 ORF Verified YGL076C RPL7A uL30|ribosomal 60S subunit protein L7A|YL8|L7A|L6A|L30|rp11 chromosome 7 L000002704|L000003255 7 365996 364335 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L7A; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; contains a conserved C-terminal Nucleic acid Binding Domain (NDB2); binds to Domain II of 25S and 5.8S rRNAs; homologous to mammalian ribosomal protein L7 and bacterial L30; RPL7A has a paralog, RPL7B, that arose from the whole genome duplication +S000032065 CDS YGL076C 7 364964 364335 C 2011-02-03 1996-07-31 +S000032064 CDS YGL076C 7 365526 365433 C 2011-02-03 1996-07-31 +S000032063 CDS YGL076C 7 365996 365986 C 2011-02-03 1996-07-31 +S000032067 intron YGL076C 7 365432 364965 C 2011-02-03 1996-07-31 +S000032066 intron YGL076C 7 365985 365527 C 2011-02-03 1996-07-31 +S000007303 snoRNA_gene snR39B SNR39B chromosome 7 L000003494 7 366469 366374 C 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position G805 +S000030654 noncoding_exon snR39B 7 366469 366374 C 2011-02-03 2000-05-19 +S000003043 ORF Verified YGL075C MPS2 MMC1 chromosome 7 L000004546|L000004250 7 368088 366925 C 2011-02-03 1996-07-31 Essential membrane protein localized at nuclear envelope and SPBs; required for insertion of the newly duplicated spindle pole body into the nuclear envelope; potentially phosphorylated by Cdc28p; MPS2 has a paralog, CSM4, that arose from the whole genome duplication +S000031904 CDS YGL075C 7 368088 366925 C 2011-02-03 1996-07-31 +S000003041 ORF Verified YGL073W HSF1 stress-responsive transcription factor HSF1|MAS3|EXA3 chromosome 7 L000000814 7 368753 371254 W 2011-02-03 1996-07-31 Trimeric heat shock transcription factor; activates multiple genes in response to highly diverse stresses; recognizes variable heat shock elements (HSEs) consisting of inverted NGAAN repeats; monitors translational status of cell through an RQC (Ribosomal Quality Control)-mediated translation-stress signal; involved in diauxic shift; posttranslationally regulated; human homolog HSF1 with linker region mutations can complement yeast hsf1 mutant +S000030864 CDS YGL073W 7 368753 371254 W 2011-02-03 1996-07-31 +S000003042 ORF Dubious YGL074C chromosome 7 7 368922 368596 C 2011-02-03 1996-07-31 Dubious open reading frame unlikely to encode a functional protein; overlaps 5' end of essential HSF1 gene encoding heat shock transcription factor +S000031746 CDS YGL074C 7 368922 368596 C 2011-02-03 1996-07-31 +S000003040 ORF Dubious YGL072C chromosome 7 7 371362 371003 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified gene HSF1; null mutant displays increased resistance to antifungal agents gliotoxin, cycloheximide and H2O2 +S000030701 CDS YGL072C 7 371362 371003 C 2011-02-03 1996-07-31 +S000003039 ORF Verified YGL071W AFT1 DNA-binding transcription factor AFT1|RCS1 chromosome 7 L000002660|L000001594 7 372012 374084 W 2011-02-03 1996-07-31 Transcription factor involved in iron utilization and homeostasis; binds consensus site PyPuCACCCPu and activates transcription in response to changes in iron availability; in iron-replete conditions localization is regulated by Grx3p, Grx4p, and Fra2p, and promoter binding is negatively regulated via Grx3p-Grx4p binding; AFT1 has a paralog, AFT2, that arose from the whole genome duplication; relative distribution to the nucleus increases upon DNA replication stress +S000030658 CDS YGL071W 7 372012 374084 W 2011-02-03 1996-07-31 +S000003038 ORF Verified YGL070C RPB9 DNA-directed RNA polymerase II core subunit RPB9|B12.6|SSU73|SHI chromosome 7 L000001683|L000001880 7 374827 374459 C 2011-02-03 1996-07-31 RNA polymerase II subunit B12.6; contacts DNA; mutations affect transcription start site selection and fidelity of transcription +S000037754 CDS YGL070C 7 374827 374459 C 2011-02-03 1996-07-31 +S000003036 ORF Verified YGL068W MNP1 mitochondrial nucleoid protein MNP1 chromosome 7 7 375087 375671 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; has similarity to E. coli L7/L12 and human MRPL7 ribosomal proteins; associates with the mitochondrial nucleoid; required for normal respiratory growth +S000030909 CDS YGL068W 7 375087 375671 W 2011-02-03 1996-07-31 +S000003037 ORF Dubious YGL069C SRF3 chromosome 7 7 375514 375050 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; 92% of ORF overlaps the uncharacterized ORF YGL068W; deletion in cyr1 mutant results in loss of stress resistance +S000030942 CDS YGL069C 7 375514 375050 C 2011-02-03 1996-07-31 +S000003035 ORF Verified YGL067W NPY1 NAD(+) diphosphatase chromosome 7 S000007505 7 376101 377255 W 2011-02-03 1996-07-31 NADH diphosphatase (pyrophosphatase); hydrolyzes the pyrophosphate linkage in NADH and related nucleotides; localizes to peroxisomes; nudix hydrolase family member +S000029896 CDS YGL067W 7 376101 377255 W 2011-02-03 1996-07-31 +S000003034 ORF Verified YGL066W SGF73 deubiquitination module subunit SGF73|SCA7 chromosome 7 7 377609 379582 W 2011-02-03 1996-07-31 Subunit of DUBm module of SAGA and SLIK; has roles in anchoring deubiquitination module (DUBm) into SAGA and SLIK complexes, maintaining organization and ubiquitin-binding conformation of Ubp8p, thereby contributing to overall DUBm activity; involved in preinitiation complex assembly at promoters; relocalizes to cytosol under hypoxia; human homolog ATXN7 implicated in spinocerebellar ataxia, and can complement yeast null mutant +S000037894 CDS YGL066W 7 377609 379582 W 2011-02-03 1996-07-31 +S000003033 ORF Verified YGL065C ALG2 GDP-Man:Man(1)GlcNAc(2)-PP-dolichol alpha-1,3-mannosyltransferase chromosome 7 L000002798 7 381271 379760 C 2011-02-03 1996-07-31 Mannosyltransferase in the N-linked glycosylation pathway; catalyzes two consecutive steps in the N-linked glycosylation pathway; alg2 mutants exhibit temperature-sensitive growth and abnormal accumulation of the lipid-linked oligosaccharide Man2GlcNAc2-PP-Dol; human ALG2 complements the temperature sensitivity and dolichol-linked oligosaccharide biosynthesis defect of the alg2-1 mutant, but mutant form from a patient with CDG-Ii fails to complement +S000035998 CDS YGL065C 7 381271 379760 C 2011-02-03 1996-07-31 +S000003032 ORF Verified YGL064C MRH4 ATP-dependent RNA helicase chromosome 7 7 383208 381523 C 2011-02-03 1996-07-31 Mitochondrial ATP-dependent RNA helicase of the DEAD-box family; required for assembly of the large subunit of mitochondrial ribosomes; binds to the large subunit rRNA, 21S_rRNA; localizes to the matrix face of the mitochondrial inner membrane and associates with the large subunit precursor and with mature ribosomes +S000035835 CDS YGL064C 7 383208 381523 C 2011-02-03 1996-07-31 +S000003031 ORF Verified YGL063W PUS2 pseudouridine synthase PUS2 chromosome 7 L000003361 7 383654 384766 W 2011-02-03 1996-07-31|2011-02-03 Mitochondrial tRNA:pseudouridine synthase; acts at positions 27 and 28, but not at position 72; efficiently and rapidly targeted to mitochondria, specifically dedicated to mitochondrial tRNA modification; mutation also affects pseudouridylation of some nuclear-encoded mRNAs; PUS2 has a paralog, PUS1, that arose from the whole genome duplication +S000035805 CDS YGL063W 7 383654 384766 W 2011-02-03 1996-07-31|2011-02-03 +S000028633 ORF Dubious YGL063C-A chromosome 7 7 384651 384502 C 2011-02-03 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032389 CDS YGL063C-A 7 384651 384502 C 2011-02-03 2003-07-29 +S000003030 ORF Verified YGL062W PYC1 pyruvate carboxylase 1 chromosome 7 L000001542 7 385196 388732 W 2011-02-03 1996-07-31 Pyruvate carboxylase isoform; cytoplasmic enzyme that converts pyruvate to oxaloacetate; differentially regulated than isoform Pyc2p; mutations in the human homolog are associated with lactic acidosis; PYC1 has a paralog, PYC2, that arose from the whole genome duplication +S000035682 CDS YGL062W 7 385196 388732 W 2011-02-03 1996-07-31 +S000118457 ARS ARS717 ARSVII-389 chromosome 7 7 388658 388891 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119023 ARS_consensus_sequence ARS717 7 388846 388832 C 2011-02-03 2006-10-03 +S000003029 ORF Verified YGL061C DUO1 chromosome 7 L000004421 7 389711 388968 C 2011-02-03 1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); cooperates with Dam1p to connect the DASH complex with microtubules (MT); couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; is transferred to the kinetochore prior to mitosis +S000034613 CDS YGL061C 7 389711 388968 C 2011-02-03 1996-07-31 +S000003028 ORF Verified YGL060W YBP2 YBH1 chromosome 7 7 390065 391990 W 2011-02-03 1996-07-31 Central kinetochore associated protein; mediates mitotic progression; interacts with several central kinetochore proteins and centromeric histone Cse4p; role in resistance to oxidative stress; similar to Slk19p; YBP2 has a paralog, YBP1, that arose from the whole genome duplication +S000034586 CDS YGL060W 7 390065 391990 W 2011-02-03 1996-07-31 +S000003027 ORF Verified YGL059W PKP2 protein kinase PKP2 chromosome 7 7 392223 393698 W 2011-02-03 2003-01-02|1996-07-31|2011-02-03 Mitochondrial protein kinase; negatively regulates activity of the pyruvate dehydrogenase complex by phosphorylating the ser-133 residue of the Pda1p subunit; acts in concert with kinase Pkp1p and phosphatases Ptc5p and Ptc6p; relocalizes from mitochondrion to cytoplasm upon DNA replication stress +S000035146 CDS YGL059W 7 392223 393698 W 2011-02-03 2003-01-02|1996-07-31|2011-02-03 +S000003026 ORF Verified YGL058W RAD6 E2 ubiquitin-conjugating protein RAD6|PSO8|UBC2 chromosome 7 L000001560 7 393986 394504 W -44 2011-02-03 1996-07-31 Ubiquitin-conjugating enzyme (E2); involved in postreplication repair as a heterodimer with Rad18p, regulation of K63 polyubiquitination in response to oxidative stress, DSBR and checkpoint control as a heterodimer with Bre1p, ubiquitin-mediated N-end rule protein degradation as a heterodimer with Ubr1p, ERAD with Ubr1p in the absence of canonical ER membrane ligases, and Rpn4p turnover as part of proteasome homeostasis, in complex with Ubr2p and Mub1p +S000035031 CDS YGL058W 7 393986 394504 W 2011-02-03 1996-07-31 +S000003025 ORF Verified YGL057C GEP7 chromosome 7 7 395829 394966 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant exhibits a respiratory growth defect and synthetic interactions with prohibitin (phb1) and gem1; authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000034817 CDS YGL057C 7 395829 394966 C 2011-02-03 1996-07-31 +S000003024 ORF Verified YGL056C SDS23 chromosome 7 L000004692 7 397618 396035 C 2011-02-03 1996-07-31|2011-02-03 Protein involved in cell separation during budding; one of two S. cerevisiae homologs (Sds23p and Sds24p) of the S. pombe Sds23 protein, which is implicated in APC/cyclosome regulation; SDS23 has a paralog, SDS24, that arose from the whole genome duplication +S000033939 CDS YGL056C 7 397618 396035 C 2011-02-03 1996-07-31|2011-02-03 +S000003023 ORF Verified YGL055W OLE1 stearoyl-CoA 9-desaturase|MDM2 chromosome 7 L000001052|L000001297 7 398628 400160 W -37 2011-02-03 1996-07-31 Delta(9) fatty acid desaturase; required for monounsaturated fatty acid synthesis and for normal distribution of mitochondria +S000033893 CDS YGL055W 7 398628 400160 W 2011-02-03 1996-07-31 +S000003022 ORF Verified YGL054C ERV14 cornichon family protein chromosome 7 L000004816 7 401287 400871 C 2011-02-03 1996-07-31 COPII-coated vesicle protein; involved in vesicle formation and incorporation of specific secretory cargo; required for the delivery of bud-site selection protein Axl2p and Nha1p antiporter to cell surface; related to Drosophila cornichon; ERV14 has a paralog, ERV15, that arose from the whole genome duplication +S000033689 CDS YGL054C 7 401287 400871 C 2011-02-03 1996-07-31 +S000006554 tRNA_gene tE(UUC)G2 chromosome 7 L000003850 7 401598 401527 C 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000034647 noncoding_exon tE(UUC)G2 7 401598 401527 C 2011-02-03 2000-05-19 +S000006949 long_terminal_repeat YGLWsigma2 chromosome 7 7 401616 401894 W 2011-02-03 2000-05-19 Ty3 LTR +S000006944 long_terminal_repeat YGLWdelta7 chromosome 7 7 401959 402290 W 2011-02-03 2000-05-19 Ty1 LTR +S000003021 ORF Verified YGL053W PRM8 pheromone-regulated DUP240 family protein PRM8 chromosome 7 7 402589 403302 W 2011-02-03 1996-07-31 Pheromone-regulated protein; contains with 2 predicted transmembrane segments and an FF sequence, a motif involved in COPII binding; forms a complex with Prp9p in the ER; member of DUP240 gene family; PRM8 has a paralog, PRM9, that arose from a segmental duplication +S000033637 CDS YGL053W 7 402589 403302 W 2011-02-03 1996-07-31 +S000003020 ORF Dubious YGL052W chromosome 7 7 403437 403742 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MST27 +S000030345 CDS YGL052W 7 403437 403742 W 2011-02-03 1996-07-31 +S000003019 ORF Verified YGL051W MST27 DUP240 family protein MST27 chromosome 7 7 403687 404391 W 2011-02-03 1996-07-31 Putative integral membrane protein, involved in vesicle formation; forms complex with Mst28p; member of DUP240 gene family; binds COPI and COPII vesicles; MST27 has a paralog, MST28, that arose from a segmental duplication +S000030145 CDS YGL051W 7 403687 404391 W 2011-02-03 1996-07-31 +S000006945 long_terminal_repeat YGLWdelta8 chromosome 7 7 405004 405145 W 2011-02-03 2000-05-19 Ty1 LTR +S000006946 long_terminal_repeat YGLWdelta9 chromosome 7 7 405146 405207 W 2011-02-03 2000-05-19 Ty1 LTR +S000006938 long_terminal_repeat YGLCsigma3 chromosome 7 7 405453 405208 C 2011-02-03 2000-05-19 Ty3 LTR +S000006711 tRNA_gene tR(UCU)G1 chromosome 7 L000003824 7 405470 405541 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000037328 noncoding_exon tR(UCU)G1 7 405470 405541 W 2011-02-03 2000-05-19 +S000003018 ORF Verified YGL050W TYW3 tRNA methyltransferase TYW3 chromosome 7 7 405776 406597 W 2011-02-03 1996-07-31 tRNA methyltransferase required for synthesis of wybutosine; a modified guanosine found at the 3'-position adjacent to the anticodon of phenylalanine tRNA which supports reading frame maintenance by stabilizing codon-anticodon interactions +S000030037 CDS YGL050W 7 405776 406597 W 2011-02-03 1996-07-31 +S000003017 ORF Verified YGL049C TIF4632 translation initiation factor eIF4G|eIF4G2 chromosome 7 L000002310 7 409604 406860 C 2011-02-03 1996-07-31 Translation initiation factor eIF4G; subunit of the mRNA cap-binding protein complex (eIF4F) that also contains eIF4E (Cdc33p); associates with the poly(A)-binding protein Pab1p, also interacts with eIF4A (Tif1p); TIF4632 has a paralog, TIF4631, that arose from the whole genome duplication +S000030563 CDS YGL049C 7 409604 406860 C 2011-02-03 1996-07-31 +S000003016 ORF Verified YGL048C RPT6 proteasome regulatory particle base subunit RPT6|SUG1|SCB68|CRL3|CIM3 chromosome 7 L000002174|L000000406|L000002265 7 411286 410069 C -43 2011-02-03 1996-07-31 ATPase of the 19S regulatory particle of the 26S proteasome; one of six ATPases of the regulatory particle; involved in the degradation of ubiquitinated substrates; bound by ubiquitin-protein ligases Ubr1p and Ufd4p; localized mainly to the nucleus throughout the cell cycle; protein abundance increases in response to DNA replication stress +S000030499 CDS YGL048C 7 411286 410069 C 2011-02-03 1996-07-31 +S000003015 ORF Verified YGL047W ALG13 N-acetylglucosaminyldiphosphodolichol N-acetylglucosaminyltransferase catalytic subunit ALG13 chromosome 7 7 411552 412160 W 2011-02-03 1996-07-31 Catalytic component of UDP-GlcNAc transferase; required for the second step of dolichyl-linked oligosaccharide synthesis; anchored to the ER membrane via interaction with Alg14p; similar to bacterial and human glycosyltransferases; protein abundance increases in response to DNA replication stress; both human homologs ALG13 and ALG14 are required to complement yeast alg13 mutant +S000030465 CDS YGL047W 7 411552 412160 W 2011-02-03 1996-07-31 +S000006755 tRNA_gene tV(AAC)G1 chromosome 7 L000003849 7 412367 412294 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000036903 noncoding_exon tV(AAC)G1 7 412367 412294 C 2011-02-03 2000-05-19 +S000006947 long_terminal_repeat YGLWdelta10 chromosome 7 7 412456 412725 W 2011-02-03 2000-05-19 Ty1 LTR +S000003013 ORF Verified YGL045W RIM8 ART9|YGL046W|PAL3 chromosome 7 L000004171 7 414102 415730 W 2011-02-03 2003-01-09|1996-07-31 Protein involved in proteolytic activation of Rim101p; part of response to alkaline pH; interacts with ESCRT-1 subunits Stp22p and Vps28p; essential for anaerobic growth; member of the arrestin-related trafficking adaptor family +S000037558 CDS YGL045W 7 414102 415730 W 2011-02-03 2003-01-09|1996-07-31 +S000003012 ORF Verified YGL044C RNA15 chromosome 7 L000001651 7 417036 416146 C 2011-02-03 1996-07-31 Component of the cleavage and polyadenylation factor I (CF I); CF 1, composed of the CF 1A complex (Rna14p, Rna15p, Clp1p, Pcf11p) and Hrp1, is involved in cleavage and polyadenylation of mRNA 3' ends; interacts with the A-rich polyadenylation signal in complex with Rna14p and Hrp1p; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay; required for gene looping and maintenance of genome stability +S000037423 CDS YGL044C 7 417036 416146 C 2011-02-03 1996-07-31 +S000003011 ORF Verified YGL043W DST1 SII|S-II|TFIIS|P37|PPR2 chromosome 7 L000001476|L000000530 7 417483 418412 W 24 2011-02-03 1996-07-31 General transcription elongation factor TFIIS; enables RNA polymerase II to read through blocks to elongation by stimulating cleavage of nascent transcripts stalled at transcription arrest sites; maintains RNAPII elongation activity on ribosomal protein genes during conditions of transcriptional stress +S000031998 CDS YGL043W 7 417483 418412 W 2011-02-03 1996-07-31 +S000003010 ORF Dubious YGL042C chromosome 7 7 418593 418288 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; deletion mutation blocks replication of Brome mosaic virus in S. cerevisiae, but this is likely due to effects on the overlapping gene DST1 +S000031778 CDS YGL042C 7 418593 418288 C 2011-02-03 1996-07-31 +S000028826 ORF Uncharacterized YGL041W-A chromosome 7 7 418825 419289 W 2011-02-03 2003-07-29|2011-02-03 Putative protein of unknown function; conserved in fungi; identified by expression profiling and mass spectrometry +S000033650 CDS YGL041W-A 7 418825 419289 W 2011-02-03 2003-07-29|2011-02-03 +S000028548 ORF Uncharacterized YGL041C-B chromosome 7 7 418886 418704 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000031198 CDS YGL041C-B 7 418886 418704 C 2011-02-03 2003-07-29 +S000003009 ORF Dubious YGL041C chromosome 7 7 419225 419022 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029877 CDS YGL041C 7 419225 419022 C 2011-02-03 1996-07-31|2011-02-03 +S000003008 ORF Verified YGL040C HEM2 porphobilinogen synthase HEM2|OLE4|SLU1 chromosome 7 L000000761 7 420555 419527 C 2011-02-03 1996-07-31 Aminolevulinate dehydratase; a homo-octameric enzyme, catalyzes the conversion of 5-aminolevulinate to porphobilinogen, the second step in heme biosynthesis; enzymatic activity is zinc-dependent; localizes to the cytoplasm and nucleus; human homolog ALAD can complement yeast hem2 mutant +S000036193 CDS YGL040C 7 420555 419527 C 2011-02-03 1996-07-31 +S000118458 ARS ARS718 ARSVII-421 chromosome 7 7 421171 421279 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000119024 ARS_consensus_sequence ARS718 7 421279 421265 C 2011-02-03 2006-10-03 +S000006640 tRNA_gene tL(CAA)G2 SUP54 chromosome 7 L000003825|L000002211 7 423092 423205 W -24 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; can mutate to suppress amber nonsense mutations +S000034245 intron tL(CAA)G2 7 423130 423161 W 2011-02-03 2000-05-19 +S000034243 noncoding_exon tL(CAA)G2 7 423092 423129 W 2011-02-03 2000-05-19 +S000034244 noncoding_exon tL(CAA)G2 7 423162 423205 W 2011-02-03 2000-05-19 +S000003007 ORF Verified YGL039W carbonyl reductase (NADPH-dependent) chromosome 7 7 423961 425007 W 2011-02-03 1996-07-31 Aldehyde reductase; reduces aliphatic aldehyde substrates using NADH as cofactor; shown to reduce carbonyl compounds to chiral alcohols +S000035325 CDS YGL039W 7 423961 425007 W 2011-02-03 1996-07-31 +S000003006 ORF Verified YGL038C OCH1 LDB12|NGD29 chromosome 7 L000001295 7 426804 425362 C -31.86 2011-02-03 1996-07-31 Mannosyltransferase of the cis-Golgi apparatus; initiates the polymannose outer chain elongation of N-linked oligosaccharides of glycoproteins +S000035173 CDS YGL038C 7 426804 425362 C 2011-02-03 1996-07-31 +S000003005 ORF Verified YGL037C PNC1 nicotinamidase chromosome 7 7 427947 427297 C 2011-02-03 1996-07-31 Nicotinamidase that converts nicotinamide to nicotinic acid; part of the NAD(+) salvage pathway; required for life span extension by calorie restriction; lacks a peroxisomal targeting signal but is imported into peroxisomes via binding to Gpd1p; PNC1 expression responds to all known stimuli that extend replicative life span; protein increases in abundance and relative distribution to cytoplasmic foci decreases upon DNA replication stress +S000034206 CDS YGL037C 7 427947 427297 C 2011-02-03 1996-07-31 +S000003004 ORF Uncharacterized YGL036W chromosome 7 L000003392 7 428601 431330 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; YGL036W is not an essential gene +S000034168 CDS YGL036W 7 428601 431330 W 2011-02-03 1996-07-31 +S000003003 ORF Verified YGL035C MIG1 transcription factor MIG1|TDS22|SSN1|CAT4 chromosome 7 L000001110 7 433062 431548 C -27 2011-02-03 1996-07-31 Transcription factor involved in glucose repression; sequence specific DNA binding protein containing two Cys2His2 zinc finger motifs; regulated by the SNF1 kinase and the GLC7 phosphatase; regulates filamentous growth along with Mig2p in response to glucose depletion; activated in stochastic pulses of nuclear localization, shuttling between cytosol and nucleus depending on external glucose levels and its phosphorylation state +S000034005 CDS YGL035C 7 433062 431548 C 2011-02-03 1996-07-31 +S000003002 ORF Uncharacterized YGL034C chromosome 7 7 433579 433214 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGL034C is not an essential gene +S000033200 CDS YGL034C 7 433579 433214 C 2011-02-03 1996-07-31 +S000003001 ORF Verified YGL033W HOP2 chromosome 7 L000004230 7 435625 436401 W 2014-11-18 2000-12-01|2014-11-18|1996-07-31 Meiosis-specific protein that localizes to chromosomes; prevents synapsis between nonhomologous chromosomes and ensures synapsis between homologs; complexes with Mnd1p to promote homolog pairing and meiotic double-strand break repair; heterodimer of Hop2p-Mnd1p stimulates the Dmc1p-mediated strand invasion +S000033177 CDS YGL033W 7 435625 435679 W 2011-02-03 2000-12-01|1996-07-31 +S000033178 CDS YGL033W 7 435750 436312 W 2014-11-18 2000-12-01|2014-11-18|1996-07-31 +S000178097 CDS YGL033W 7 436375 436401 W 2014-11-18 2014-11-18 +S000033179 intron YGL033W 7 435680 435749 W 2011-02-03 2000-12-01|1996-07-31 +S000178096 intron YGL033W 7 436313 436374 W 2014-11-18 2014-11-18 +S000003000 ORF Verified YGL032C AGA2 chromosome 7 L000000062 7 436833 436570 C -23.06 2011-02-03 1996-07-31 Adhesion subunit of a-agglutinin of a-cells; C-terminal sequence acts as a ligand for alpha-agglutinin (Sag1p) during agglutination, modified with O-linked oligomannosyl chains, linked to anchorage subunit Aga1p via two disulfide bonds +S000033030 CDS YGL032C 7 436833 436570 C 2011-02-03 1996-07-31 +S000002999 ORF Verified YGL031C RPL24A eL24|ribosomal 60S subunit protein L24A|L24e|rp29|YL21|L30A|L24A|RPL30A chromosome 7 L000001724 7 437934 437467 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L24A; not essential for translation but may be required for normal translation rate; homologous to mammalian ribosomal protein L24, no bacterial homolog; RPL24A has a paralog, RPL24B, that arose from the whole genome duplication +S000032115 CDS YGL031C 7 437934 437467 C 2011-02-03 1996-07-31 +S000122099 five_prime_UTR_intron YGL031C 7 438397 437942 C 2011-02-03 2007-04-04 +S000002998 ORF Verified YGL030W RPL30 eL30|ribosomal 60S subunit protein L30|L30e|rp73|YL38|L32|L30 chromosome 7 L000001726 7 439091 439638 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L30; involved in pre-rRNA processing in the nucleolus; autoregulates splicing of its transcript; homologous to mammalian ribosomal protein L30, no bacterial homolog +S000032082 CDS YGL030W 7 439091 439093 W 2011-02-03 1996-07-31 +S000032083 CDS YGL030W 7 439324 439638 W 2011-02-03 1996-07-31 +S000032084 intron YGL030W 7 439094 439323 W 2011-02-03 1996-07-31 +S000002997 ORF Verified YGL029W CGR1 chromosome 7 S000007411 7 440063 440425 W 2011-02-03 1996-07-31 Protein involved in nucleolar integrity and processing of pre-rRNA; has a role in processing rRNA for the 60S ribosome subunit; transcript is induced in response to cytotoxic stress but not genotoxic stress; relocalizes from nucleus to nucleolus upon DNA replication stress +S000030962 CDS YGL029W 7 440063 440425 W 2011-02-03 1996-07-31 +S000006565 tRNA_gene tF(GAA)G chromosome 7 L000003848 7 440807 440716 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000035389 intron tF(GAA)G 7 440770 440752 C 2011-02-03 2000-05-19 +S000035388 noncoding_exon tF(GAA)G 7 440751 440716 C 2011-02-03 2000-05-19 +S000035387 noncoding_exon tF(GAA)G 7 440807 440771 C 2011-02-03 2000-05-19 +S000002996 ORF Verified YGL028C SCW11 putative glucan endo-1,3-beta-D-glucosidase chromosome 7 7 442909 441281 C 2011-02-03 1996-07-31 Cell wall protein with similarity to glucanases; may play a role in conjugation during mating based on its regulation by Ste12p +S000030849 CDS YGL028C 7 442909 441281 C 2011-02-03 1996-07-31 +S000002995 ORF Verified YGL027C CWH41 DER7|GLS1 chromosome 7 L000003121|L000000715 7 446143 443642 C 2011-02-03 1996-07-31 Processing alpha glucosidase I; ER type II integral membrane N-glycoprotein involved in assembly of cell wall beta 1,6 glucan and asparagine-linked protein glycosylation; also involved in ER protein quality control and sensing of ER stress +S000029845 CDS YGL027C 7 446143 443642 C 2011-02-03 1996-07-31 +S000002994 ORF Verified YGL026C TRP5 tryptophan synthase TRP5 chromosome 7 L000002356 7 448535 446412 C -22 2011-02-03 1996-07-31 Tryptophan synthase; catalyzes the last step of tryptophan biosynthesis; regulated by the general control system of amino acid biosynthesis +S000037836 CDS YGL026C 7 448535 446412 C 2011-02-03 1996-07-31 +S000002992 ORF Dubious YGL024W SST3 chromosome 7 7 449788 450123 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially/completely overlaps the verified ORF PGD1/YGL025C +S000037721 CDS YGL024W 7 449788 450123 W 2011-02-03 1996-07-31 +S000002993 ORF Verified YGL025C PGD1 MED3|HRS1 chromosome 7 L000000811|L000001408 7 449957 448764 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for basal and activated transcription; direct target of Cyc8p-Tup1p transcriptional corepressor +S000037746 CDS YGL025C 7 449957 448764 C 2011-02-03 2003-09-22|1996-07-31 +S000002991 ORF Verified YGL023C PIB2 chromosome 7 S000007475 7 452104 450197 C 2011-02-03 1996-07-31 Protein of unknown function; contains FYVE domain; similar to Fab1 and Vps27 +S000036924 CDS YGL023C 7 452104 450197 C 2011-02-03 1996-07-31 +S000002990 ORF Verified YGL022W STT3 dolichyl-diphosphooligosaccharide--protein glycosyltransferase subunit STT3 chromosome 7 L000002716 7 452404 454560 W 2011-02-03 1996-07-31 Subunit of the oligosaccharyltransferase complex of the ER lumen; complex catalyzes asparagine-linked glycosylation of newly synthesized proteins; forms a subcomplex with Ost3p and Ost4p and is directly involved in catalysis +S000036896 CDS YGL022W 7 452404 454560 W 2011-02-03 1996-07-31 +S000002989 ORF Verified YGL021W ALK1 protein kinase ALK1 chromosome 7 L000002852 7 454785 457067 W 2011-02-03 1996-07-31 Protein kinase; along with its paralog, ALK2, required for proper spindle positioning and nuclear segregation following mitotic arrest, proper organization of cell polarity factors in mitosis, proper localization of formins and polarity factors, and survival in cells that activate spindle assembly checkpoint; phosphorylated in response to DNA damage; ALK1 has a paralog, ALK2, that arose from the whole genome duplication; similar to mammalian haspins +S000036836 CDS YGL021W 7 454785 457067 W 2011-02-03 1996-07-31 +S000002988 ORF Verified YGL020C GET1 GET complex subunit GET1|MDM39 chromosome 7 7 457870 457163 C 2011-02-03 1996-07-31 Subunit of the GET complex; involved in insertion of proteins into the ER membrane; required for the retrieval of HDEL proteins from the Golgi to the ER in an ERD2 dependent fashion and for normal mitochondrial morphology and inheritance +S000035892 CDS YGL020C 7 457870 457163 C 2011-02-03 1996-07-31 +S000002987 ORF Verified YGL019W CKB1 casein kinase 2 regulatory subunit CKB1 chromosome 7 L000002856 7 458156 458992 W 2011-02-03 1996-07-31 Beta regulatory subunit of casein kinase 2 (CK2); a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerases +S000034946 CDS YGL019W 7 458156 458992 W 2011-02-03 1996-07-31 +S000002986 ORF Verified YGL018C JAC1 J-type chaperone JAC1 chromosome 7 L000003591 7 459664 459110 C 2011-02-03 1996-07-31 Specialized J-protein that functions in Fe-S cluster biogenesis; functions with Hsp70 in Fe-S cluster biogenesis in mitochondria; involved in iron metabolism; contains a J domain typical to J-type chaperones; localizes to the mitochondrial matrix +S000034703 CDS YGL018C 7 459664 459110 C 2011-02-03 1996-07-31 +S000002985 ORF Verified YGL017W ATE1 arginyltransferase chromosome 7 L000000137 7 459854 461365 W -12 2011-02-03 1996-07-31 Arginyl-tRNA-protein transferase; catalyzes post-translational conjugation of arginine to the amino termini of acceptor proteins which are then subject to degradation via the N-end rule pathway +S000034655 CDS YGL017W 7 459854 461365 W 2011-02-03 1996-07-31 +S000002984 ORF Verified YGL016W KAP122 PDR6 chromosome 7 L000001366 7 461666 464911 W -10 2011-02-03 1996-07-31 Karyopherin beta; responsible for import of the Toa1p-Toa2p complex into the nucleus; binds to nucleoporins Nup1p and Nup2p; may play a role in regulation of pleiotropic drug resistance +S000033773 CDS YGL016W 7 461666 464911 W 2011-02-03 1996-07-31 +S000002983 ORF Uncharacterized YGL015C chromosome 7 7 465435 465043 C 2011-02-03 1996-07-31 Putative protein of unknown function; null mutants accumulate cargo in the Golgi +S000033596 CDS YGL015C 7 465435 465043 C 2011-02-03 1996-07-31 +S000002982 ORF Verified YGL014W PUF4 YGL023 chromosome 7 7 466141 468807 W 2011-02-03 1996-07-31 Member of the PUF protein family; PUF family is defined by the presence of Pumilio homology domains that confer RNA binding activity; preferentially binds mRNAs encoding nucleolar ribosomal RNA-processing factors +S000033567 CDS YGL014W 7 466141 468807 W 2011-02-03 1996-07-31 +S000028825 ORF Dubious YGL014C-A chromosome 7 7 466398 466237 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by expression profiling and mass spectrometry +S000033647 CDS YGL014C-A 7 466398 466237 C 2011-02-03 2003-07-29 +S000002981 ORF Verified YGL013C PDR1 drug-responsive transcription factor PDR1|TPE3|TPE1|TIL1|SMR2|NRA2|CYH3|BOR2|ANT1|AMY1 chromosome 7 L000002984|L000003503|L000001361 7 472298 469092 C -8 2011-02-03 1996-07-31 Transcription factor that regulates the pleiotropic drug response; zinc cluster protein that is a master regulator involved in recruiting other zinc cluster proteins to pleiotropic drug response elements (PDREs) to fine tune the regulation of multidrug resistance genes; relocalizes to the cytosol in response to hypoxia; PDR1 has a paralog, PDR3, that arose from the whole genome duplication +S000032756 CDS YGL013C 7 472298 469092 C 2011-02-03 1996-07-31 +S000002980 ORF Verified YGL012W ERG4 delta(24(24(1)))-sterol reductase chromosome 7 L000000571 7 472855 474276 W 2011-02-03 1996-07-31 C-24(28) sterol reductase; catalyzes the final step in ergosterol biosynthesis; mutants are viable, but lack ergosterol +S000032737 CDS YGL012W 7 472855 474276 W 2011-02-03 1996-07-31 +S000002979 ORF Verified YGL011C SCL1 proteasome core particle subunit alpha 1|PRC2 chromosome 7 L000001812 7 475247 474489 C -8 2011-02-03 1996-07-31 Alpha 1 subunit of the 20S proteasome; involved in the degradation of ubiquitinated substrates; 20S proteasome is the core complex of the 26S proteasome; essential for growth; detected in the mitochondria +S000032541 CDS YGL011C 7 475247 474489 C 2011-02-03 1996-07-31 +S000002978 ORF Verified YGL010W MPO1 chromosome 7 7 475545 476069 W 2011-02-03 1996-07-31 Protein involved in metabolism of phytosphingosine; not an essential gene +S000031636 CDS YGL010W 7 475545 476069 W 2011-02-03 1996-07-31 +S000002977 ORF Verified YGL009C LEU1 3-isopropylmalate dehydratase LEU1 chromosome 7 L000000942 7 478652 476313 C -5 2011-02-03 1996-07-31 Isopropylmalate isomerase; catalyzes the second step in the leucine biosynthesis pathway +S000031584 CDS YGL009C 7 478652 476313 C 2011-02-03 1996-07-31 +S000002976 ORF Verified YGL008C PMA1 H(+)-exporting P2-type ATPase PMA1|KTI10 chromosome 7 L000001449 7 482666 479910 C -2 2011-02-03 1996-07-31 Plasma membrane P2-type H+-ATPase; pumps protons out of cell; major regulator of cytoplasmic pH and plasma membrane potential; long-lived protein asymmetrically distributed at plasma membrane between mother cells and buds; accumulates at high levels in mother cells during aging, buds emerge with very low levels of Pma1p, newborn cells have low levels of Pma1p; Hsp30p plays a role in Pma1p regulation; interactions with Std1p appear to propagate [GAR+] +S000030720 CDS YGL008C 7 482666 479910 C 2011-02-03 1996-07-31 +S000028632 ORF Uncharacterized YGL007C-A chromosome 7 7 483027 482941 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; deletion exhibits slow-growth phenotype; computationally predicted to have a role in cell budding +S000032388 CDS YGL007C-A 7 483027 482941 C 2011-02-03 2003-07-29 +S000002975 ORF Uncharacterized YGL007W BRP1 chromosome 7 7 483260 483637 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; located in the upstream region of PMA1; deletion leads to polyamine resistance due to downregulation of PMA1 +S000030678 CDS YGL007W 7 483260 483637 W 2011-02-03 1996-07-31 +S000118459 ARS ARS719 ARSVII-485 chromosome 7 7 484930 485157 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119025 ARS_consensus_sequence ARS719 7 485110 485096 C 2011-02-03 2006-10-03 +S000028769 ORF Uncharacterized YGL006W-A chromosome 7 7 485423 485533 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by SAGE +S000033473 CDS YGL006W-A 7 485423 485533 W 2011-02-03 2003-07-29 +S000002974 ORF Verified YGL006W PMC1 calcium-transporting ATPase PMC1 chromosome 7 L000001451 7 485921 489442 W 2011-02-03 1996-07-31 Vacuolar Ca2+ ATPase involved in depleting cytosol of Ca2+ ions; prevents growth inhibition by activation of calcineurin in the presence of elevated concentrations of calcium; similar to mammalian PMCA1a +S000030624 CDS YGL006W 7 485921 489442 W 2011-02-03 1996-07-31 +S000002973 ORF Verified YGL005C COG7 Golgi transport complex subunit COG7|COD5 chromosome 7 7 490547 489708 C 2011-02-03 1996-07-31 Component of the conserved oligomeric Golgi complex; a cytosolic tethering complex (Cog1p through Cog8p) that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments +S000030391 CDS YGL005C 7 490547 489708 C 2011-02-03 1996-07-31 +S000002972 ORF Verified YGL004C RPN14 chromosome 7 7 491956 490703 C 2011-02-03 1996-07-31 Evolutionarily conserved 19S regulatory particle assembly-chaperone; proteasome-interacting protein involved in the assembly of the base subcomplex of the 19S proteasome regulatory particle (RP); null mutants accumulate ubiquitinated Gcn4p and display decreased 26S proteasome stability; interacts with Rpt5p +S000037620 CDS YGL004C 7 491956 490703 C 2011-02-03 1996-07-31 +S000002971 ORF Verified YGL003C CDH1 HCT1 chromosome 7 L000004229 7 494174 492474 C 2011-02-03 1996-07-31 Activator of anaphase-promoting complex/cyclosome (APC/C); antagonist of the spindle assembly checkpoint; directs ubiquitination of cyclins resulting in mitotic exit; targets the APC/C to specific substrates including: Cdc20p, Ase1p, Cin8p, Fin1p and Clb5p; partially active in metaphase, and fully active in anaphase; cell-cycle regulated +S000037480 CDS YGL003C 7 494174 492474 C 2011-02-03 1996-07-31 +S000002970 ORF Verified YGL002W ERP6 chromosome 7 L000004683 7 494517 495167 W 2011-02-03 1996-07-31 Member of the p24 family involved in ER to Golgi transport; similar to Emp24p and Erv25p; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; ERP6 has a paralog, ERP1, that arose from the whole genome duplication +S000037443 CDS YGL002W 7 494517 495167 W 2011-02-03 1996-07-31 +S000002969 ORF Verified YGL001C ERG26 sterol-4-alpha-carboxylate 3-dehydrogenase (decarboxylating) chromosome 7 7 496502 495453 C 2011-02-03 1996-07-31 C-3 sterol dehydrogenase; catalyzes the second of three steps required to remove two C-4 methyl groups from an intermediate in ergosterol biosynthesis; human homolog NSDHL implicated in CK syndrome, and can complement yeast null mutant; molecular target of natural product and antifungal compound FR171456 +S000036649 CDS YGL001C 7 496502 495453 C 2011-02-03 1996-07-31 +S000006468 centromere CEN7 CEN7 chromosome 7 L000000300 7 497038 496920 C 0 2011-02-03 2000-05-19|2004-10-08|2006-05-09 Chromosome VII centromere +S000077293 centromere_DNA_Element_I CEN7 7 497038 497029 C 2011-02-03 2004-10-08 +S000077294 centromere_DNA_Element_II CEN7 7 497028 496945 C 2011-02-03 2004-10-08 +S000077295 centromere_DNA_Element_III CEN7 7 496944 496920 C 2011-02-03 2004-10-08 +S000003233 ORF Verified YGR001C EFM5 protein-lysine N-methyltransferase|AML1 chromosome 7 7 498034 497133 C 2011-02-03 2000-07-14|1996-07-31 S-adenosylmethionine-dependent lysine methyltransferase; involved in the trimethylation of eEF1A (Tef1p/Tef2p) at lysine 79; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; required for replication of Brome mosaic virus in budding yeast; expresses a circular RNA; originally misclassified as a N-6-adenine specific DNA methyltransferase based on sequence similarity; both Efm5p and human ortholog N6AMT2 can methylate eEF1a from either species in vitro +S000032873 CDS YGR001C 7 497365 497133 C 2011-02-03 1996-07-31 +S000032872 CDS YGR001C 7 497937 497459 C 2011-02-03 2000-07-14|1996-07-31 +S000032871 CDS YGR001C 7 498034 498000 C 2011-02-03 2000-07-14 +S000032875 intron YGR001C 7 497458 497366 C 2011-02-03 1996-07-31 +S000032874 intron YGR001C 7 497999 497938 C 2011-02-03 2000-07-14 +S000003234 ORF Verified YGR002C SWC4 GOD1|EAF2 chromosome 7 7 499906 498476 C 2011-02-03 1996-07-31 Component of the Swr1p complex that incorporates Htz1p into chromatin; component of the NuA4 histone acetyltransferase complex +S000032986 CDS YGR002C 7 499906 498476 C 2011-02-03 1996-07-31 +S000003235 ORF Verified YGR003W CUL3 cullin CUL3|CULLIN B|CULB chromosome 7 7 500132 502366 W 2011-02-03 1996-07-31 Ubiquitin-protein ligase; forms a complex with Elc1p that polyubiquitylates monoubiquitylated RNA polymerase II to trigger its proteolysis; cullin family member with similarity to Cdc53p and human CUL3 +S000033740 CDS YGR003W 7 500132 502366 W 2011-02-03 1996-07-31 +S000003236 ORF Verified YGR004W PEX31 peroxisome biogenesis protein chromosome 7 7 502938 504326 W 2011-02-03 1996-07-31 Peroxisomal integral membrane protein; involved in negative regulation of peroxisome size; partially functionally redundant with Pex30p and Pex32p; probably acts at a step downstream of steps mediated by Pex28p and Pex29p; PEX31 has a paralog, PEX30, that arose from the whole genome duplication +S000033874 CDS YGR004W 7 502938 504326 W 2011-02-03 1996-07-31 +S000003237 ORF Verified YGR005C TFG2 transcription factor IIF subunit TFG2 chromosome 7 L000002633 7 505859 504657 C 2011-02-03 1996-07-31 TFIIF (Transcription Factor II) middle subunit; involved in both transcription initiation and elongation of RNA polymerase II; homologous to human RAP30 +S000033942 CDS YGR005C 7 505859 504657 C 2011-02-03 1996-07-31 +S000003238 ORF Verified YGR006W PRP18 mRNA splicing protein PRP18 chromosome 7 L000001505 7 506070 506825 W 2011-02-03 2004-01-22|1996-07-31 Splicing factor and component of snRNP U5; factor involved in the positioning of the 3' splice site during the second catalytic step of splicing; interacts with Slu7p +S000034938 CDS YGR006W 7 506070 506825 W 2011-02-03 2004-01-22|1996-07-31 +S000003239 ORF Verified YGR007W ECT1 ethanolamine-phosphate cytidylyltransferase|MUQ1 chromosome 7 L000001218 7 506969 507940 W 2011-02-03 1996-07-31 Ethanolamine-phosphate cytidylyltransferase; catalyzes the second step of phosphatidylethanolamine biosynthesis; involved in the maintenance of plasma membrane; similar to mammalian CTP: phosphocholine cytidylyl-transferases; inability of the null mutant to synthesize phosphatidylethanolamine and phosphatidylcholine from ethanolamine is functionally complemented by human PCYT2 +S000035086 CDS YGR007W 7 506969 507940 W 2011-02-03 1996-07-31 +S000003240 ORF Verified YGR008C STF2 ATPase-stabilizing factor family protein chromosome 7 L000002127 7 508364 508110 C 2011-02-03 1996-07-31 Protein involved in resistance to desiccation stress; Stf2p exhibits antioxidant properties, and its overexpression prevents ROS accumulation and apoptosis; binds to F0 sector of mitochondrial F1F0 ATPase in vitro and may modulate the inhibitory action of Inh1p and Stf1p; protein abundance increases in response to DNA replication stress; STF2 has a paralog, TMA10, that arose from the whole genome duplication +S000035152 CDS YGR008C 7 508364 508110 C 2011-02-03 1996-07-31 +S000118460 ARS ARS720 ARSVII-509 chromosome 7 7 508729 508977 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178101 ARS_consensus_sequence ARS720 7 508909 508893 C 2014-11-18 2014-11-18 +S000003241 ORF Verified YGR009C SEC9 HSS7 chromosome 7 L000001835 7 511002 509047 C 2011-02-03 1996-07-31 t-SNARE protein required for secretory vesicle-plasma membrane fusion; similar to but not functionally redundant with Spo20p; interacts non-exocyst bound Sec6p; SNAP-25 homolog +S000035315 CDS YGR009C 7 511002 509047 C 2011-02-03 1996-07-31 +S000003242 ORF Verified YGR010W NMA2 nicotinamide-nucleotide adenylyltransferase NMA2 chromosome 7 7 511545 512732 W 2011-02-03 1996-07-31 Nicotinic acid mononucleotide adenylyltransferase; catalyzes the transfer of the adenylyl moiety of ATP to nicotinamide mononucleotide to form NAD; involved in de novo and salvage synthesis of NAD(+); homolog of human NMNAT; NMA2 has a paralog, NMA1, that arose from the whole genome duplication +S000037117 CDS YGR010W 7 511545 512732 W 2011-02-03 1996-07-31 +S000003243 ORF Dubious YGR011W chromosome 7 7 512497 512823 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037223 CDS YGR011W 7 512497 512823 W 2011-02-03 1996-07-31 +S000003244 ORF Verified YGR012W MCY1 putative cysteine synthase chromosome 7 7 513159 514340 W 2011-02-03 1996-07-31 Putative cysteine synthase; localized to the mitochondrial outer membrane +S000029879 CDS YGR012W 7 513159 514340 W 2011-02-03 1996-07-31 +S000003245 ORF Verified YGR013W SNU71 chromosome 7 L000004363 7 514554 516416 W 2011-02-03 1996-07-31 Component of U1 snRNP required for mRNA splicing via spliceosome; yeast specific, no metazoan counterpart +S000029977 CDS YGR013W 7 514554 516416 W 2011-02-03 1996-07-31 +S000003246 ORF Verified YGR014W MSB2 chromosome 7 L000001185 7 516943 520863 W 2 2011-02-03 1996-07-31 Mucin family member involved in various signaling pathways; functions as osmosensor in the Sho1p-mediated HOG pathway; functions in Cdc42p- and MAP kinase-dependent filamentous growth signaling pathway; processed into secreted and cell-associated forms by aspartyl protease Yps1p; potential Cdc28p substrate +S000030086 CDS YGR014W 7 516943 520863 W 2011-02-03 1996-07-31 +S000003247 ORF Uncharacterized YGR015C putative hydrolase chromosome 7 7 522076 521090 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the mitochondrion +S000030196 CDS YGR015C 7 522076 521090 C 2011-02-03 1996-07-31 +S000003248 ORF Uncharacterized YGR016W chromosome 7 7 522261 522833 W 2011-02-03 1996-07-31 Putative protein of unknown function +S000031230 CDS YGR016W 7 522261 522833 W 2011-02-03 1996-07-31 +S000003249 ORF Uncharacterized YGR017W chromosome 7 7 523787 524680 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the nucleus and the cytoplasm +S000031323 CDS YGR017W 7 523787 524680 W 2011-02-03 1996-07-31 +S000003250 ORF Uncharacterized YGR018C chromosome 7 7 524694 524365 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data; partially overlaps the uncharacterized ORF YGR017W +S000031392 CDS YGR018C 7 524694 524365 C 2011-02-03 1996-07-31 +S000003251 ORF Verified YGR019W UGA1 4-aminobutyrate transaminase chromosome 7 L000002422 7 525229 526644 W 2011-02-03 1996-07-31 Gamma-aminobutyrate (GABA) transaminase; also known as 4-aminobutyrate aminotransferase; involved in the 4-aminobutyrate and glutamate degradation pathways; required for normal oxidative stress tolerance and nitrogen utilization; protein abundance increases in response to DNA replication stress +S000032468 CDS YGR019W 7 525229 526644 W 2011-02-03 1996-07-31 +S000003252 ORF Verified YGR020C VMA7 H(+)-transporting V1 sector ATPase subunit F chromosome 7 L000002462 7 527329 526973 C 2011-02-03 1996-07-31 Subunit F of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; required for the V1 domain to assemble onto the vacuolar membrane; the V1 peripheral membrane domain of vacuolar H+-ATPase (V-ATPase) has eight subunits +S000032415 CDS YGR020C 7 527329 526973 C 2011-02-03 1996-07-31 +S000003253 ORF Uncharacterized YGR021W HAH1 chromosome 7 7 527632 528504 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033286 CDS YGR021W 7 527632 528504 W 2011-02-03 1996-07-31 +S000003255 ORF Verified YGR023W MTL1 chromosome 7 L000004649 7 529264 530919 W 2011-02-03 1996-07-31 Putative plasma membrane sensor; involved in cell integrity signaling and stress response during glucose starvation and oxidative stress; has structural and functional similarity to Mid2p; MTL1 has a paralog, MID2, that arose from the whole genome duplication +S000034269 CDS YGR023W 7 529264 530919 W 2011-02-03 1996-07-31 +S000003254 ORF Dubious YGR022C chromosome 7 7 529586 529257 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps almost completely with the verified ORF MTL1/YGR023W +S000033318 CDS YGR022C 7 529586 529257 C 2011-02-03 1996-07-31 +S000006532 tRNA_gene tD(GUC)G1 chromosome 7 L000003826 7 531610 531681 W 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000036686 noncoding_exon tD(GUC)G1 7 531610 531681 W 2011-02-03 2000-05-19 +S000003256 ORF Verified YGR024C THG1 tRNA guanylyltransferase chromosome 7 7 532596 531883 C 2011-02-03 1996-07-31 tRNAHis guanylyltransferase; adds a guanosine residue to the 5' end of tRNAH is after transcription and RNase P cleavage; can also catalyze reverse (3'-5') polymerization with certain substrates in a template-dependent reaction; couples nuclear division and migration to cell budding and cytokinesis; essential enzyme conserved among eukaryotes +S000034310 CDS YGR024C 7 532596 531883 C 2011-02-03 1996-07-31 +S000003257 ORF Dubious YGR025W chromosome 7 7 532639 532941 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034440 CDS YGR025W 7 532639 532941 W 2011-02-03 1996-07-31 +S000003258 ORF Uncharacterized YGR026W chromosome 7 7 532985 533821 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery +S000034561 CDS YGR026W 7 532985 533821 W 2011-02-03 1996-07-31 +S000003259 ORF Verified YGR027C RPS25A eS25|ribosomal 40S subunit protein S25A|S25e|rp45|YS23|S31A|S25A|RPS31A chromosome 7 L000003257 7 534458 534132 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S25, no bacterial homolog; RPS25A has a paralog, RPS25B, that arose from the whole genome duplication +S000035521 CDS YGR027C 7 534458 534132 C 2011-02-03 1996-07-31 +S000122101 five_prime_UTR_intron YGR027C 7 534785 534474 C 2011-02-03 2007-04-04 +S000006965 long_terminal_repeat YGRWdelta11 chromosome 7 7 535211 535542 W 2011-02-03 2000-05-19 Ty1 LTR +S000006952 long_terminal_repeat YGRCdelta12 chromosome 7 7 535759 535607 C 2011-02-03 2000-05-19 Ty1 LTR +S000006966 long_terminal_repeat YGRWdelta13 chromosome 7 7 535760 536097 W 2011-02-03 2000-05-19 Ty1 LTR +S000006982 LTR_retrotransposon YGRWTy1-1 Ty1 chromosome 7 7 535760 541685 W 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007405 transposable_element_gene YGR027W-A gag protein chromosome 7 7 536057 537379 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000036251 CDS YGR027W-A 7 536057 537379 W 2011-02-03 1999-07-17 +S000007406 transposable_element_gene YGR027W-B gag-pol fusion protein chromosome 7 S000029013 7 536057 541325 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000036253 CDS YGR027W-B 7 536057 537361 W 2011-02-03 1999-07-17 +S000036254 CDS YGR027W-B 7 537363 541325 W 2011-02-03 1999-07-17 +S000036255 plus_1_translational_frameshift YGR027W-B 7 537362 537362 W 2011-02-03 1999-07-17 +S000006967 long_terminal_repeat YGRWdelta14 chromosome 7 7 541348 541685 W 2011-02-03 2000-05-19 Ty1 LTR +S000006555 tRNA_gene tE(UUC)G3 chromosome 7 L000003827 7 541850 541921 W 2011-02-03 2000-05-19 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p; target of K. lactis zymocin +S000034674 noncoding_exon tE(UUC)G3 7 541850 541921 W 2011-02-03 2000-05-19 +S000003260 ORF Verified YGR028W MSP1 YTA4 chromosome 7 L000001200|L000002558 7 542203 543291 W 2011-02-03 1996-07-31 Highly-conserved N-terminally anchored AAA-ATPase; distributed in the mitochondrial outer membrane and peroxisomes; involved in mitochondrial protein sorting; functions as an extraction engine in local organelle surveillance to remove and initiate degradation of mistargeted proteins, ensuring fidelity of organelle-specific localization of tail-anchored proteins; contains an N-terminal transmembrane domain and C-terminal cytoplasmic ATPase domain +S000035635 CDS YGR028W 7 542203 543291 W 2011-02-03 1996-07-31 +S000003261 ORF Verified YGR029W ERV1 flavin-linked sulfhydryl oxidase chromosome 7 L000000583 7 543553 544205 W 2011-02-03 2000-07-14|1996-07-31 Flavin-linked sulfhydryl oxidase of the mitochondrial IMS; N-terminus is an intrinsically disordered domain that in the cytosol helps target Erv1p to mitochondria, and in the intermembrane space oxidizes Mia40p as part of a disulfide relay system that promotes intermembrane space retention of imported proteins; functional ortholog of human GFER (ALR); human GFER carrying N-terminal 21 amino acids of Erv1p functionally complements the lethality of the erv1 null mutation +S000035763 CDS YGR029W 7 543553 543638 W 2011-02-03 2000-07-14 +S000035764 CDS YGR029W 7 543722 544205 W 2011-02-03 2000-07-14|1996-07-31 +S000035765 intron YGR029W 7 543639 543721 W 2011-02-03 2000-07-14 +S000006533 tRNA_gene tD(GUC)G2 chromosome 7 L000003847 7 544648 544577 C 2011-02-03 2000-05-19 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000036692 noncoding_exon tD(GUC)G2 7 544648 544577 C 2011-02-03 2000-05-19 +S000006506 snoRNA_gene snR46 SNR46 chromosome 7 L000003413 7 545370 545566 W 2011-02-03 2000-05-19|2007-05-08 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2865 +S000030619 noncoding_exon snR46 7 545370 545566 W 2011-02-03 2000-05-19|2007-05-08 +S000003262 ORF Verified YGR030C POP6 ribonuclease P/MRP protein subunit POP6 chromosome 7 L000004302 7 546157 545681 C 2011-02-03 1996-07-31 Subunit of RNase MRP, nuclear RNase P and telomerase; forms a soluble heterodimer with Pop7p that binds P3 domain of RNase MRP and RNase P RNAs; RNase MRP cleaves pre-rRNA, nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs, while telomerase replenishes telomeric DNA; relocalizes to the cytosol in response to hypoxia +S000035582 CDS YGR030C 7 546157 545681 C 2011-02-03 1996-07-31 +S000003263 ORF Verified YGR031W IMO32 chromosome 7 7 546441 547469 W 2011-02-03 1996-07-31 Conserved mitochondrial protein of unknown function; processed by both mitochondrial processing peptidase and mitochondrial octapeptidyl aminopeptidase; gene contains the nested antisense gene NAG1 +S000036524 CDS YGR031W 7 546441 547469 W 2011-02-03 1996-07-31 +S000028636 ORF Verified YGR031C-A NAG1 chromosome 7 7 547300 546809 C 2011-02-03 2003-07-29 Protein involved in yeast cell wall biogenesis; localizes to the cell periphery; production of Nag1p is dependent upon the presence of Slt2p and Rlm1p; gene is nested within and antisense to IMO32 +S000032392 CDS YGR031C-A 7 547300 546809 C 2011-02-03 2003-07-29 +S000003264 ORF Verified YGR032W GSC2 1,3-beta-glucan synthase GSC2|FKS2 chromosome 7 L000000716|L000000733 7 548264 553951 W 2011-02-03 1996-07-31 Catalytic subunit of 1,3-beta-glucan synthase; involved in formation of the inner layer of the spore wall; activity positively regulated by Rho1p and negatively by Smk1p; GSC2 has a paralog, FKS1, that arose from the whole genome duplication +S000036645 CDS YGR032W 7 548264 553951 W 2011-02-03 1996-07-31 +S000003265 ORF Verified YGR033C TIM21 FMP17 chromosome 7 7 554967 554248 C 2011-02-03 1996-07-31 Nonessential component of the TIM23 complex; interacts with the Translocase of the Outer Mitochondrial membrane (TOM complex) and with respiratory enzymes; may regulate the Translocase of the Inner Mitochondrial membrane (TIM23 complex) activity +S000036681 CDS YGR033C 7 554967 554248 C 2011-02-03 1996-07-31 +S000003266 ORF Verified YGR034W RPL26B uL24|ribosomal 60S subunit protein L26B|L24|YL33|L33B|L26B chromosome 7 L000004462 7 555812 556672 W 2011-02-03 1996-07-31|2006-10-05 Ribosomal 60S subunit protein L26B; binds to 5.8S rRNA; non-essential even when paralog is also deleted; deletion has minimal affections on ribosome biosynthesis; homologous to mammalian ribosomal protein L26 and bacterial L24; RPL26B has a paralog, RPL26A, that arose from the whole genome duplication +S000037472 CDS YGR034W 7 555812 555830 W 2011-02-03 1996-07-31|2006-10-05 +S000037473 CDS YGR034W 7 556308 556672 W 2011-02-03 1996-07-31 +S000037474 intron YGR034W 7 555831 556307 W 2011-02-03 1996-07-31|2006-10-05 +S000003267 ORF Uncharacterized YGR035C chromosome 7 7 557422 557072 C 2011-02-03 1996-07-31 Putative protein of unknown function, potential Cdc28p substrate; transcription is activated by paralogous transcription factors Yrm1p and Yrr1p along with genes involved in multidrug resistance; YGR035C has a paralog, YLR346C, that arose from the whole genome duplication +S000037516 CDS YGR035C 7 557422 557072 C 2011-02-03 1996-07-31 +S000028827 ORF Uncharacterized YGR035W-A chromosome 7 7 557565 557786 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000033652 CDS YGR035W-A 7 557565 557786 W 2011-02-03 2003-07-29 +S000003268 ORF Verified YGR036C CAX4 CWH8 chromosome 7 L000002917 7 558868 558149 C 2011-02-03 1996-07-31 Dolichyl pyrophosphate (Dol-P-P) phosphatase; has a luminally oriented active site in the ER; cleaves the anhydride linkage in Dol-P-P; required for Dol-P-P-linked oligosaccharide intermediate synthesis and protein N-glycosylation +S000037649 CDS YGR036C 7 558868 558149 C 2011-02-03 1996-07-31 +S000003269 ORF Verified YGR037C ACB1 long-chain fatty acid transporter ACB1 chromosome 7 L000000016 7 559994 559731 C 2011-02-03 1996-07-31 Acyl-CoA-binding protein; transports newly synthesized acyl-CoA esters from fatty acid synthetase (Fas1p-Fas2p) to acyl-CoA-consuming processes; subject to starvation-induced, Grh1p-mediated unconventional secretion; protein abundance increases in response to DNA replication stress +S000030442 CDS YGR037C 7 559994 559731 C 2011-02-03 1996-07-31 +S000003270 ORF Verified YGR038W ORM1 sphingolipid homeostasis protein ORM1 chromosome 7 L000003422 7 560682 561350 W 2011-02-03 1996-07-31 Protein that mediates sphingolipid homeostasis; evolutionarily conserved, required for resistance to agents that induce unfolded protein response; Orm1p and Orm2p together control membrane biogenesis by coordinating lipid homeostasis with protein quality control; ORM1 has a paralog, ORM2, that arose from the whole genome duplication +S000030632 CDS YGR038W 7 560682 561350 W 2011-02-03 1996-07-31 +S000006725 tRNA_gene tS(AGA)G chromosome 7 L000003846 7 561743 561662 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032368 noncoding_exon tS(AGA)G 7 561743 561662 C 2011-02-03 2000-05-19 +S000006953 long_terminal_repeat YGRCdelta15 chromosome 7 7 562176 561843 C 2011-02-03 2000-05-19 Ty1 LTR +S000007408 transposable_element_gene YGR038C-B gag-pol fusion protein chromosome 7 7 567467 562199 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000031864 CDS YGR038C-B 7 566161 562199 C 2011-02-03 1999-07-17 +S000031863 CDS YGR038C-B 7 567467 566163 C 2011-02-03 1999-07-17 +S000031865 plus_1_translational_frameshift YGR038C-B 7 566162 566162 C 2011-02-03 1999-07-17 +S000007407 transposable_element_gene YGR038C-A gag protein chromosome 7 7 567467 566145 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000031828 CDS YGR038C-A 7 567467 566145 C 2011-02-03 1999-07-17 +S000006962 LTR_retrotransposon YGRCTy1-2 Ty1 chromosome 7 7 567760 561843 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006954 long_terminal_repeat YGRCdelta16 chromosome 7 7 567760 567427 C 2011-02-03 2000-05-19 Ty1 LTR +S000118461 ARS ARS721 ARSVII-569 chromosome 7 7 568490 568737 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119026 ARS_consensus_sequence ARS721 7 568660 568646 C 2011-02-03 2006-10-03 +S000006955 long_terminal_repeat YGRCdelta17 chromosome 7 7 569072 568740 C 2011-02-03 2000-05-19 Ty2 LTR +S000118462 ARS ARS722 ARSVII-575 chromosome 7 7 574622 574915 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178102 ARS_consensus_sequence ARS722 7 574701 574717 W 2014-11-18 2014-11-18 +S000006964 LTR_retrotransposon YGRCTy2-1 Ty2 chromosome 7 7 574700 568740 C 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; mutated in S288C +S000006956 long_terminal_repeat YGRCdelta18 chromosome 7 7 574700 574369 C 2011-02-03 2000-05-19 Ty2 LTR +S000003271 ORF Uncharacterized YGR039W chromosome 7 7 574888 575199 W 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YGR039W is not an essential gene +S000030717 CDS YGR039W 7 574888 575199 W 2011-02-03 1996-07-31 +S000003272 ORF Verified YGR040W KSS1 mitogen-activated serine/threonine-protein kinase KSS1 chromosome 7 L000000922 7 575398 576504 W 2011-02-03 1996-07-31 Mitogen-activated protein kinase (MAPK); involved in signal transduction pathways that control filamentous growth and pheromone response; regulates septum assembly, and may directly phosphorylate Bni4p; the KSS1 gene is nonfunctional in S288C strains and functional in W303 strains +S000031506 CDS YGR040W 7 575398 576504 W 2011-02-03 1996-07-31 +S000130166 ARS ARS723 chromosome 7 7 575484 576346 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000003273 ORF Verified YGR041W BUD9 chromosome 7 L000003939 7 577487 579130 W 2011-02-03 1996-07-31 Protein involved in bud-site selection; mutant has increased aneuploidy tolerance; diploid mutants display a unipolar budding pattern instead of the wild-type bipolar pattern, and bud at the distal pole; BUD9 has a paralog, BUD8, that arose from the whole genome duplication +S000031558 CDS YGR041W 7 577487 579130 W 2011-02-03 1996-07-31 +S000003274 ORF Verified YGR042W MTE1 chromosome 7 7 579476 580291 W 2011-02-03 1996-07-31 Protein of unknown function; involved in maintenance of proper telomere length; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus; forms nuclear foci upon DNA replication stress +S000032536 CDS YGR042W 7 579476 580291 W 2011-02-03 1996-07-31 +S000003275 ORF Verified YGR043C NQM1 sedoheptulose-7-phosphate:D-glyceraldehyde-3-phosphate transaldolase NQM1 chromosome 7 7 581436 580435 C 2011-02-03 1996-07-31 Transaldolase of unknown function; transcription is repressed by Mot1p and induced by alpha-factor and during diauxic shift; NQM1 has a paralog, TAL1, that arose from the whole genome duplication +S000032607 CDS YGR043C 7 581436 580435 C 2011-02-03 1996-07-31 +S000130167 ARS ARS724 chromosome 7 7 581436 582213 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000003276 ORF Verified YGR044C RME1 CSP1 chromosome 7 L000001648 7 583892 582990 C 14 2011-02-03 1996-07-31 Zinc finger protein involved in control of meiosis; prevents meiosis by repressing IME1 expression and promotes mitosis by activating CLN2 expression; directly repressed by a1-alpha2 regulator; mediates cell type control of sporulation; relocalizes from nucleus to cytoplasm upon DNA replication stress +S000032718 CDS YGR044C 7 583892 582990 C 2011-02-03 1996-07-31 +S000003277 ORF Dubious YGR045C chromosome 7 7 584296 583934 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032825 CDS YGR045C 7 584296 583934 C 2011-02-03 1996-07-31 +S000003278 ORF Verified YGR046W TAM41 putative phosphatidate cytidylyltransferase|MMP37 chromosome 7 7 584895 586052 W 2011-02-03 1996-07-31 Mitochondrial phosphatidate cytidylyltransferase (CDP-DAG synthase); required for cardiolipin biosynthesis; viability of null mutant is strain-dependent; mRNA is targeted to the bud; mutant displays defect in mitochondrial protein import, likely due to altered membrane lipid composition +S000033590 CDS YGR046W 7 584895 586052 W 2011-02-03 1996-07-31 +S000003279 ORF Verified YGR047C TFC4 transcription factor TFIIIC subunit TFC4|tau 131|PCF1 chromosome 7 L000001348|L000002288 7 589469 586392 C 2011-02-03 1996-07-31 Subunit of RNA polymerase III transcription initiation factor complex; one of six subunits of RNA polymerase III transcription initiation factor complex (TFIIIC); part of the TauA domain of TFIIIC that binds BoxA DNA promoter sites of tRNA and similar genes; has TPR motifs; human homolog is TFIIIC-102 +S000033631 CDS YGR047C 7 589469 586392 C 2011-02-03 1996-07-31 +S000003280 ORF Verified YGR048W UFD1 polyubiquitin-binding protein UFD1 chromosome 7 L000002787 7 589826 590911 W 2011-02-03 1996-07-31 Substrate-recruiting cofactor of the Cdc48p-Npl4p-Ufd1p segregase; polyubiquitin binding protein that assists in the dislocation of misfolded, ERAD substrates that are subsequently delivered to the proteasome for degradation; involved in regulated destruction of ER membrane proteins such as HMG-CoA reductase (Hmg1/2p) and cytoplasmic proteins (Fbp1p); involved in mobilizing membrane bound transcription factors by regulated Ub/proteasome-dependent processing (RUP) +S000033814 CDS YGR048W 7 589826 590911 W 2011-02-03 1996-07-31 +S000003281 ORF Verified YGR049W SCM4 chromosome 7 L000001814 7 591314 591877 W 2011-02-03 1996-07-31 Mitochondrial outer membrane protein of unknown function; predicted to have 4 transmembrane segments; import is mediated by Tom70p and Mim1p; interacts genetically with a cdc4 mutation; SCM4 has a paralog, ATG33, that arose from the whole genome duplication +S000034690 CDS YGR049W 7 591314 591877 W 2011-02-03 1996-07-31 +S000003282 ORF Uncharacterized YGR050C chromosome 7 7 592442 592086 C 2011-02-03 1996-07-31 Protein of unknown function; mRNA identified as translated by ribosome profiling data +S000035714 CDS YGR050C 7 592442 592086 C 2011-02-03 1996-07-31 +S000003283 ORF Dubious YGR051C chromosome 7 7 593229 592906 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YGR051C is not an essential gene +S000035801 CDS YGR051C 7 593229 592906 C 2011-02-03 1996-07-31 +S000003284 ORF Uncharacterized YGR052W FMP48 protein kinase FMP48 chromosome 7 7 593596 594705 W 2011-02-03 1996-07-31 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000036785 CDS YGR052W 7 593596 594705 W 2011-02-03 1996-07-31 +S000003285 ORF Uncharacterized YGR053C chromosome 7 7 595837 594986 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000036816 CDS YGR053C 7 595837 594986 C 2011-02-03 1996-07-31 +S000003286 ORF Verified YGR054W chromosome 7 7 596693 598621 W 2011-02-03 1996-07-31|2011-02-03 Eukaryotic initiation factor eIF2A; associates specifically with both 40S subunits and 80 S ribosomes, and interacts genetically with both eIF5b and eIF4E; homologous to mammalian eIF2A +S000036916 CDS YGR054W 7 596693 598621 W 2011-02-03 1996-07-31|2011-02-03 +S000003287 ORF Verified YGR055W MUP1 chromosome 7 L000003071 7 599417 601141 W 2011-02-03 1996-07-31 High affinity methionine permease; integral membrane protein with 13 putative membrane-spanning regions; also involved in cysteine uptake +S000036973 CDS YGR055W 7 599417 601141 W 2011-02-03 1996-07-31 +S000003288 ORF Verified YGR056W RSC1 RSC subunit protein RSC1 chromosome 7 L000004024 7 601661 604447 W 2011-02-03 1996-07-31 Component of the RSC chromatin remodeling complex; required for expression of mid-late sporulation-specific genes; contains two essential bromodomains, a bromo-adjacent homology (BAH) domain, and an AT hook; RSC1 has a paralog, RSC2, that arose from the whole genome duplication +S000037741 CDS YGR056W 7 601661 604447 W 2011-02-03 1996-07-31 +S000003289 ORF Verified YGR057C LST7 chromosome 7 L000004355 7 605501 604773 C 2011-02-03 2003-09-22|1996-07-31 Subunit of the Lst4p-Lst7p GTPase activating protein complex for Gtr2p; stimulates the GTPase activity of Rag family GTPase Gtr2p, within the context of the Gtr1p-Gtr2p heterodimer, after amino acid stimulation; required for activation of TORC1 in response to amino acid stimulation; recruited to the vacuolar membrane during amino acid starvation and released from the membrane by TORC1; required for the transport of amino acid permease Gap1p from the Golgi to the cell surface +S000037768 CDS YGR057C 7 605501 604773 C 2011-02-03 2003-09-22|1996-07-31 +S000003290 ORF Verified YGR058W PEF1 chromosome 7 7 606136 607143 W 2011-02-03 1996-07-31|2011-02-03 Penta-EF-hand protein; required for polar bud growth and cell wall abscission; binds calcium and zinc with different affinity; localizes to bud site in G1, bud neck in G2; binds to Sec31p and modulates COPII coat assembly +S000029835 CDS YGR058W 7 606136 607143 W 2011-02-03 1996-07-31|2011-02-03 +S000003291 ORF Verified YGR059W SPR3 septin SPR3 chromosome 7 L000002022 7 607563 609101 W 2011-02-03 1996-07-31 Sporulation-specific homolog of the CDC3/10/11/12 family of genes; septin protein involved in sporulation; regulated by ABFI; the yeast CDC3/10/11/12 family is a family of bud neck microfilament genes +S000030838 CDS YGR059W 7 607563 609101 W 2011-02-03 1996-07-31 +S000006440 snoRNA_gene snR48 SNR48 chromosome 7 L000004518 7 609584 609696 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at positions G2791 and G2793 +S000030651 noncoding_exon snR48 7 609584 609696 W 2011-02-03 2000-05-19 +S000003292 ORF Verified YGR060W ERG25 methylsterol monooxygenase chromosome 7 L000003089 7 610564 611493 W 2011-02-03 1996-07-31 C-4 methyl sterol oxidase; catalyzes the first of three steps required to remove two C-4 methyl groups from an intermediate in ergosterol biosynthesis; mutants accumulate the sterol intermediate 4,4-dimethylzymosterol; human MSMO1 functionally complements the growth defect caused by repression of ERG25 expression +S000031788 CDS YGR060W 7 610564 611493 W 2011-02-03 1996-07-31 +S000003293 ORF Verified YGR061C ADE6 phosphoribosylformylglycinamidine synthase chromosome 7 L000000036 7 615965 611889 C 39 2011-02-03 1996-07-31 Formylglycinamidine-ribonucleotide (FGAM)-synthetase; catalyzes a step in the 'de novo' purine nucleotide biosynthetic pathway +S000031938 CDS YGR061C 7 615965 611889 C 2011-02-03 1996-07-31 +S000003294 ORF Verified YGR062C COX18 membrane insertase COX18|OXA2 chromosome 7 L000003308 7 617278 616328 C 2011-02-03 1996-07-31 Protein required for membrane insertion of C-terminus of Cox2p; mitochondrial integral inner membrane protein; interacts genetically and physically with Mss2p and Pnt1p; similar to S. cerevisiae Oxa1, N. crassa Oxa2p, and E. coli YidC; respiratory defect of the null mutant is functionally complemented by human COX18 carrying the N-terminal 54 amino acids of S. cerevisiae Cox18p +S000032054 CDS YGR062C 7 617278 616328 C 2011-02-03 1996-07-31 +S000003296 ORF Dubious YGR064W chromosome 7 7 617621 617989 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SPT4/YGR063C +S000033116 CDS YGR064W 7 617621 617989 W 2011-02-03 1996-07-31 +S000003295 ORF Verified YGR063C SPT4 transcription elongation factor SPT4 chromosome 7 L000002030 7 617824 617516 C 40 2011-02-03 1996-07-31 Spt4p/5p (DSIF) transcription elongation factor complex subunit; the Spt4/5 complex binds to ssRNA in a sequence-specific manner, and along with RNAP I and II has multiple roles regulating transcriptional elongation, RNA processing, quality control, and transcription-coupled repair; localizes to kinetochores and heterochromatin, influencing chromosomal dynamics and silencing; required for transcription through long trinucleotide repeats in ORFs and non-protein coding regions +S000032968 CDS YGR063C 7 617824 617516 C 2011-02-03 1996-07-31 +S000003297 ORF Verified YGR065C VHT1 chromosome 7 S000007487 7 619858 618077 C 2011-02-03 1996-07-31 High-affinity plasma membrane H+-biotin (vitamin H) symporter; mutation results in fatty acid auxotrophy; 12 transmembrane domain containing major facilitator subfamily member; mRNA levels negatively regulated by iron deprivation and biotin +S000033152 CDS YGR065C 7 619858 618077 C 2011-02-03 1996-07-31 +S000003298 ORF Uncharacterized YGR066C chromosome 7 7 621799 620921 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000033915 CDS YGR066C 7 621799 620921 C 2011-02-03 1996-07-31 +S000003299 ORF Uncharacterized YGR067C chromosome 7 7 624786 622372 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; contains a zinc finger motif similar to that of Adr1p +S000034061 CDS YGR067C 7 624786 622372 C 2011-02-03 1996-07-31|2011-02-03 +S000028637 ORF Dubious YGR068W-A chromosome 7 7 626294 626389 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps with the uncharacterized ORF YGR068C +S000032393 CDS YGR068W-A 7 626294 626389 W 2011-02-03 2003-07-29 +S000003301 ORF Dubious YGR069W chromosome 7 7 627083 627418 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035169 CDS YGR069W 7 627083 627418 W 2011-02-03 1996-07-31 +S000003300 ORF Verified YGR068C ART5 chromosome 7 7 627084 625324 C 2011-02-03 1996-07-31 Protein proposed to regulate endocytosis of plasma membrane proteins; regulates by recruiting the ubiquitin ligase Rsp5p to its target in the plasma membrane; SWAT-GFP and mCherry fusion proteins localize to the cytosol +S000034144 CDS YGR068C 7 627084 625324 C 2011-02-03 1996-07-31 +S000003302 ORF Verified YGR070W ROM1 Rho family guanine nucleotide exchange factor ROM1|SKC1 chromosome 7 L000003181 7 627806 631273 W 2011-02-03 1996-07-31|2011-02-03 Guanine nucleotide exchange factor (GEF) for Rho1p; mutations are synthetically lethal with mutations in rom2, which also encodes a GEP; ROM1 has a paralog, ROM2, that arose from the whole genome duplication +S000036051 CDS YGR070W 7 627806 631273 W 2011-02-03 1996-07-31|2011-02-03 +S000003303 ORF Verified YGR071C ENV11 chromosome 7 7 634063 631481 C 2011-02-03 1996-07-31 Protein proposed to be involved in vacuolar functions; mutant shows defect in CPY processing and fragmented vacuoles; deletion mutant has increased glycogen accumulation and displays elongated buds; green fluorescent protein (GFP)-fusion protein localizes to the nucleus; ENV11 has a paralog, VID22, that arose from the whole genome duplication +S000036097 CDS YGR071C 7 634063 631481 C 2011-02-03 1996-07-31 +S000003304 ORF Verified YGR072W UPF3 SUP112|SUA6 chromosome 7 L000003057|S000029549|L000002231 7 634304 635467 W 32 2011-02-03 1996-07-31 Component of the nonsense-mediated mRNA decay (NMD) pathway; along with Nam7p and Nmd2p; involved in decay of mRNA containing nonsense codons; involved in telomere maintenance +S000029860 CDS YGR072W 7 634304 635467 W 2011-02-03 1996-07-31 +S000003306 ORF Verified YGR074W SMD1 mRNA splicing protein SMD1|SPP92 chromosome 7 L000001928 7 635712 636152 W 2011-02-03 1996-07-31 Core Sm protein Sm D1; part of heteroheptameric complex (with Smb1p, Smd2p, Smd3p, Sme1p, Smx3p, and Smx2p) that is part of the spliceosomal U1, U2, U4, and U5 snRNPs; relocalizes to the cytosol in response to hypoxia; homolog of human Sm D1; protein abundance increases in response to DNA replication stress +S000031921 CDS YGR074W 7 635712 636152 W 2011-02-03 1996-07-31 +S000003305 ORF Dubious YGR073C chromosome 7 7 635986 635615 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; extensively overlaps essential SMD1 gene encoding a U6 snRNP protein +S000031714 CDS YGR073C 7 635986 635615 C 2011-02-03 1996-07-31 +S000003307 ORF Verified YGR075C PRP38 U4/U6-U5 snRNP complex subunit PRP38 chromosome 7 L000001510 7 636875 636147 C 2011-02-03 1996-07-31 Unique component of the U4/U6.U5 tri-snRNP particle; tri-snRNP is required for conformational changes which result in the catalytic activation of the spliceosome; dispensable for spliceosome assembly +S000031968 CDS YGR075C 7 636875 636147 C 2011-02-03 1996-07-31 +S000003308 ORF Verified YGR076C MRPL25 mitochondrial 54S ribosomal protein YmL25|AFO1|YmL25|YMR26 chromosome 7 L000002532 7 637577 637104 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit; mutation confers increased replicative lifespan +S000037456 CDS YGR076C 7 637577 637104 C 2011-02-03 1996-07-31 +S000003309 ORF Verified YGR077C PEX8 PAS6 chromosome 7 L000004222|L000003962 7 639513 637744 C 2011-02-03 1996-07-31 Intraperoxisomal organizer of the peroxisomal import machinery; organizes the formation of the importomer complex, bridging the docking complex with the RING finger complex; tightly associated with the lumenal face of the peroxisomal membrane; essential for peroxisome biogenesis; binds PTS1-signal receptor Pex5p, and PTS2-signal receptor Pex7p +S000037552 CDS YGR077C 7 639513 637744 C 2011-02-03 1996-07-31 +S000003310 ORF Verified YGR078C PAC10 tubulin-binding prefolding complex subunit PAC10|RKS2|PFD3|GIM2 chromosome 7 L000002864 7 640371 639772 C 2011-02-03 1996-07-31 Part of the heteromeric co-chaperone GimC/prefoldin complex; complex promotes efficient protein folding +S000037609 CDS YGR078C 7 640371 639772 C 2011-02-03 1996-07-31 +S000003311 ORF Uncharacterized YGR079W chromosome 7 7 640720 641832 W 2011-02-03 1996-07-31 Putative protein of unknown function; YGR079W is not an essential gene +S000030491 CDS YGR079W 7 640720 641832 W 2011-02-03 1996-07-31 +S000003312 ORF Verified YGR080W TWF1 chromosome 7 L000004372 7 642010 643008 W 2011-02-03 1996-07-31 Twinfilin; highly conserved actin monomer-sequestering protein involved in regulation of the cortical actin cytoskeleton; coordinates actin filament severing and monomer sequestering at sites of rapid actin turnover; composed of two cofilin-like regions, stimulates actin depolymerization as does the mouse homolog, mTwf1 +S000037367 CDS YGR080W 7 642010 643008 W 2011-02-03 1996-07-31 +S000003313 ORF Verified YGR081C SLX9 chromosome 7 7 643780 643148 C 2011-02-03 1996-07-31 Protein required for pre-rRNA processing; associated with the 90S pre-ribosome and 43S small ribosomal subunit precursor; interacts with U3 snoRNA; deletion mutant has synthetic fitness defect with an sgs1 deletion mutant +S000037394 CDS YGR081C 7 643780 643148 C 2011-02-03 1996-07-31 +S000003314 ORF Verified YGR082W TOM20 MOM19|MAS20 chromosome 7 L000001029 7 644044 644595 W 2011-02-03 1996-07-31 Component of the TOM (translocase of outer membrane) complex; responsible for recognition and initial import steps for all mitochondrially directed proteins; acts as a receptor for incoming precursor proteins +S000030069 CDS YGR082W 7 644044 644595 W 2011-02-03 1996-07-31 +S000003315 ORF Verified YGR083C GCD2 translation initiation factor eIF2B subunit delta|GCD12 chromosome 7 L000000671 7 646815 644860 C 54 2011-02-03 1996-07-31 Delta subunit of the translation initiation factor eIF2B; the guanine-nucleotide exchange factor for eIF2; activity subsequently regulated by phosphorylated eIF2; first identified as a negative regulator of GCN4 expression +S000030132 CDS YGR083C 7 646815 644860 C 2011-02-03 1996-07-31 +S000003316 ORF Verified YGR084C MRP13 mitochondrial 37S ribosomal protein YmS-A chromosome 7 L000001142|L000001157 7 648142 647123 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000030307 CDS YGR084C 7 648142 647123 C 2011-02-03 1996-07-31 +S000003317 ORF Verified YGR085C RPL11B uL5|ribosomal 60S subunit protein L11B|rp39B|YL22|L5|L16A|L11B chromosome 7 L000001730|L000001713 7 648907 648383 C 56 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L11B; expressed at half the level of Rpl11Ap; involved in ribosomal assembly; depletion causes degradation of 60S proteins and RNA; homologous to mammalian ribosomal protein L11 and bacterial L5; RPL11B has a paralog, RPL11A, that arose from the whole genome duplication +S000033620 CDS YGR085C 7 648907 648383 C 2011-02-03 1996-07-31 +S000003318 ORF Verified YGR086C PIL1 lipid-binding protein PIL1 chromosome 7 7 650617 649598 C 2011-02-03 1996-07-31 Eisosome core component; eisosomes are large immobile cell cortex structures associated with endocytosis; detected in phosphorylated state in mitochondria; phosphorylated on Thr233 upon Pkc1p hyperactivation in a Slt2p MAPK-dependent fashion; null mutant shows activation of Pkc1p/Ypk1p stress resistance pathways; member of BAR domain family; protein increases in abundance and relocalizes from plasma membrane to cytoplasm upon DNA replication stress +S000033727 CDS YGR086C 7 650617 649598 C 2011-02-03 1996-07-31 +S000003319 ORF Verified YGR087C PDC6 indolepyruvate decarboxylase 6 chromosome 7 L000001357 7 652981 651290 C 2011-02-03 1996-07-31 Minor isoform of pyruvate decarboxylase; decarboxylates pyruvate to acetaldehyde, involved in amino acid catabolism; transcription is glucose- and ethanol-dependent, and is strongly induced during sulfur limitation +S000033866 CDS YGR087C 7 652981 651290 C 2011-02-03 1996-07-31 +S000003320 ORF Verified YGR088W CTT1 catalase T|SPS101 chromosome 7 L000000435 7 654634 656322 W 2011-02-03 1996-07-31|2006-01-23 Cytosolic catalase T; has a role in protection from oxidative damage by hydrogen peroxide +S000034811 CDS YGR088W 7 654634 656322 W 2011-02-03 1996-07-31|2006-01-23 +S000003321 ORF Verified YGR089W NNF2 chromosome 7 7 656960 659770 W 2011-02-03 1996-07-31 Protein that exhibits physical and genetic interactions with Rpb8p; Rpb8p is a subunit of RNA polymerases I, II, and III; computational analysis of large-scale protein-protein interaction data suggests a role in chromosome segregation +S000034943 CDS YGR089W 7 656960 659770 W 2011-02-03 1996-07-31 +S000118463 ARS ARS727 ARSVII-660 chromosome 7 7 659907 660002 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000119027 ARS_consensus_sequence ARS727 7 660000 659986 C 2011-02-03 2006-10-03 +S000006749 tRNA_gene tT(UGU)G1 chromosome 7 L000003828 7 661749 661820 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000030910 noncoding_exon tT(UGU)G1 7 661749 661820 W 2011-02-03 2000-05-19 +S000003322 ORF Verified YGR090W UTP22 rRNA-processing protein UTP22 chromosome 7 7 662358 666071 W 2011-02-03 1996-07-31 Component of the small-subunit processome; required for nuclear export of tRNAs; may facilitate binding of Utp8p to aminoacylated tRNAs and their delivery to Los1p for export; conserved from yeast to mammals +S000033602 CDS YGR090W 7 662358 666071 W 2011-02-03 1996-07-31 +S000003323 ORF Verified YGR091W PRP31 U4/U6-U5 snRNP complex subunit PRP31 chromosome 7 L000002947 7 666341 667825 W 2011-02-03 1996-07-31 Splicing factor; component of the U4/U6-U5 snRNP complex +S000034543 CDS YGR091W 7 666341 667825 W 2011-02-03 1996-07-31 +S000003324 ORF Verified YGR092W DBF2 serine/threonine-protein kinase DBF2 chromosome 7 L000000487 7 668189 669907 W 28 2011-02-03 1996-07-31 Ser/Thr kinase involved in transcription and stress response; functions as part of a network of genes in exit from mitosis; localization is cell cycle regulated; activated by Cdc15p during the exit from mitosis; also plays a role in regulating the stability of SWI5 and CLB2 mRNAs; phosphorylates Chs2p to regulate primary septum formation and Hof1p to regulate cytokinesis; DBF2 has a paralog, DBF20, that arose from the whole genome duplication +S000034610 CDS YGR092W 7 668189 669907 W 2011-02-03 1996-07-31 +S000003325 ORF Verified YGR093W DRN1 chromosome 7 7 670388 671911 W 2011-02-03 1996-07-31 Splicing factor that modulates turnover of branched RNAs by Dbr1p; interacts with spliceosomal components and branched RNA splicing products; enhances Dbr1p debranching in vitro; conserved protein with domain organization identical from yeast to human; N-terminal homology to Dbr1p N-terminus, but Dbr1p catalytic residues not conserved; relocalizes to the cytosol in response to hypoxia +S000034725 CDS YGR093W 7 670388 671911 W 2011-02-03 1996-07-31 +S000003326 ORF Verified YGR094W VAS1 valine--tRNA ligase chromosome 7 L000002457 7 672186 675500 W 2011-02-03 1996-07-31 Mitochondrial and cytoplasmic valyl-tRNA synthetase; human homolog VARS2 implicated in mitochondrial diseases, can partially complement yeast null mutant +S000035718 CDS YGR094W 7 672186 675500 W 2011-02-03 1996-07-31 +S000003327 ORF Verified YGR095C RRP46 exosome non-catalytic core subunit RRP46 chromosome 7 L000004579 7 676342 675671 C 2011-02-03 2003-09-22|1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp46p (EXOSC5) +S000035767 CDS YGR095C 7 676342 675671 C 2011-02-03 2003-09-22|1996-07-31 +S000003328 ORF Verified YGR096W TPC1 thiamine transporter TPC1 chromosome 7 7 676621 677565 W 2011-02-03 1996-07-31 Mitochondrial membrane transporter; mediates uptake of the essential cofactor thiamine pyrophosphate (ThPP) into mitochondria; expression appears to be regulated by carbon source; member of the mitochondrial carrier family +S000035962 CDS YGR096W 7 676621 677565 W 2011-02-03 1996-07-31 +S000003329 ORF Verified YGR097W ASK10 RGC2 chromosome 7 L000002770 7 678695 682135 W 2011-02-03 1996-07-31 Regulator of the Fps1p glycerol channel; under nonstress conditions, binds to Fps1p to positively regulate glycerol transport; under osmotic stress, multiple phosphorylation by Hog1p causes Ask10p to dissociate from Fps1p; forms homodimers and heterodimerizes with paralog Rgc1p; phosphorylated in response to oxidative stress; has a role in destruction of Ssn8p; associates with RNA polymerase II holoenzyme +S000037821 CDS YGR097W 7 678695 682135 W 2011-02-03 1996-07-31 +S000003330 ORF Verified YGR098C ESP1 separase chromosome 7 L000000584 7 687458 682566 C 60 2011-02-03 1996-07-31 Separase, a caspase-like cysteine protease; promotes sister chromatid separation by mediating dissociation of the cohesin Scc1p from chromatin; inhibits protein phosphatase 2A-Cdc55p to promote mitotic exit; inhibited by Pds1p; relative distribution to the nucleus increases upon DNA replication stress +S000037871 CDS YGR098C 7 687458 682566 C 2011-02-03 1996-07-31 +S000003331 ORF Verified YGR099W TEL2 chromosome 7 L000002913 7 687899 689965 W 2011-02-03 1996-07-31 Subunit of the ASTRA complex, involved in chromatin remodeling; subunit of the telomere cap complex DNA-binding protein specific to single-stranded yeast telomeric DNA repeats, required for telomere length regulation and telomere position effect; involved in the stability or biogenesis of PIKKs such as TORC1 +S000029946 CDS YGR099W 7 687899 689965 W 2011-02-03 1996-07-31 +S000003332 ORF Verified YGR100W MDR1 GYP2|MIC1 chromosome 7 L000003270 7 690245 693097 W 2011-02-03 1996-07-31 Cytoplasmic GTPase-activating protein; activates Ypt/Rab transport GTPases Ypt6p, Ypt31p and Sec4p; involved in recycling of internalized proteins and regulation of Golgi secretory function +S000035442 CDS YGR100W 7 690245 693097 W 2011-02-03 1996-07-31 +S000003333 ORF Verified YGR101W PCP1 rhomboid protease PCP1|RBD1|MDM37 chromosome 7 7 693363 694403 W 2011-02-03 1996-07-31 Mitochondrial serine protease; required for the processing of various mitochondrial proteins and maintenance of mitochondrial DNA and morphology; belongs to the rhomboid-GlpG superfamily of intramembrane peptidases +S000035497 CDS YGR101W 7 693363 694403 W 2011-02-03 1996-07-31 +S000003334 ORF Verified YGR102C GTF1 glutamyl-tRNA(Gln) amidotransferase subunit F chromosome 7 7 695135 694584 C 2011-02-03 1996-07-31 Subunit of the trimeric GatFAB AmidoTransferase(AdT) complex; involved in the formation of Q-tRNAQ; transposon insertion mutant is salt sensitive and null mutant has growth defects; non-tagged protein is detected in purified mitochondria +S000035523 CDS YGR102C 7 695135 694584 C 2011-02-03 1996-07-31 +S000003335 ORF Verified YGR103W NOP7 mRNA-binding ribosome synthesis protein NOP7|YPH1 chromosome 7 S000007661 7 695417 697234 W 2011-02-03 1996-07-31 Component of several different pre-ribosomal particles; forms a complex with Ytm1p and Erb1p that is required for maturation of the large ribosomal subunit; required for exit from G0 and the initiation of cell proliferation +S000036462 CDS YGR103W 7 695417 697234 W 2011-02-03 1996-07-31 +S000003336 ORF Verified YGR104C SRB5 MED18 chromosome 7 L000002052 7 698368 697445 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; required for proper termination of transcription for some genes; involved in telomere maintenance +S000036489 CDS YGR104C 7 698368 697445 C 2011-02-03 1996-07-31 +S000003337 ORF Verified YGR105W VMA21 chromosome 7 L000002466 7 698599 698832 W 2011-02-03 1996-07-31 Integral membrane protein required for V-ATPase function; not an actual component of the vacuolar H+-ATPase (V-ATPase) complex; diverged ortholog of human XMEA (X-linked Myopathy with Excessive Autophagy); functions in the assembly of the V-ATPase; localized to the yeast endoplasmic reticulum (ER) +S000036647 CDS YGR105W 7 698599 698832 W 2011-02-03 1996-07-31 +S000003338 ORF Verified YGR106C VOA1 chromosome 7 7 699786 698989 C 2011-02-03 1996-07-31 ER protein that functions in assembly of the V0 sector of V-ATPase; functions with other assembly factors; null mutation enhances the vacuolar ATPase (V-ATPase) deficiency of a vma21 mutant impaired in endoplasmic reticulum (ER) retrieval +S000036683 CDS YGR106C 7 699786 698989 C 2011-02-03 1996-07-31 +S000006646 tRNA_gene tL(GAG)G chromosome 7 L000003829 7 700675 700756 W 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis; not essential for viability even though this is the only tRNA that decodes GAG codons +S000031926 noncoding_exon tL(GAG)G 7 700675 700756 W 2011-02-03 2000-05-19 +S000006631 tRNA_gene tK(UUU)G2 chromosome 7 L000003845 7 701048 700953 C 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000033693 intron tK(UUU)G2 7 701011 700989 C 2011-02-03 2000-05-19 +S000033692 noncoding_exon tK(UUU)G2 7 700988 700953 C 2011-02-03 2000-05-19 +S000033691 noncoding_exon tK(UUU)G2 7 701048 701012 C 2011-02-03 2000-05-19 +S000006968 long_terminal_repeat YGRWdelta19 chromosome 7 7 701104 701350 W 2011-02-03 2000-05-19 Ty1 LTR +S000003339 ORF Dubious YGR107W chromosome 7 7 702667 703116 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037476 CDS YGR107W 7 702667 703116 W 2011-02-03 1996-07-31 +S000003340 ORF Verified YGR108W CLB1 B-type cyclin CLB1|SCB1 chromosome 7 L000000349 7 703636 705051 W 2011-02-03 1996-07-31 B-type cyclin involved in cell cycle progression; activates Cdc28p to promote the transition from G2 to M phase; accumulates during G2 and M, then targeted via a destruction box motif for ubiquitin-mediated degradation by the proteasome; CLB1 has a paralog, CLB2, that arose from the whole genome duplication +S000037604 CDS YGR108W 7 703636 705051 W 2011-02-03 1996-07-31 +S000003341 ORF Verified YGR109C CLB6 B-type cyclin CLB6 chromosome 7 L000000354 7 706501 705359 C 2011-02-03 1996-07-31 B-type cyclin involved in DNA replication during S phase; activates Cdc28p to promote initiation of DNA synthesis; functions in formation of mitotic spindles along with Clb3p and Clb4p; most abundant during late G1; CLB6 has a paralog, CLB5, that arose from the whole genome duplication +S000037653 CDS YGR109C 7 706501 705359 C 2011-02-03 1996-07-31 +S000006527 tRNA_gene tC(GCA)G chromosome 7 L000003844 7 707179 707108 C 2011-02-03 2000-05-19 Cysteine tRNA (tRNA-Cys), predicted by tRNAscan-SE analysis +S000035213 noncoding_exon tC(GCA)G 7 707179 707108 C 2011-02-03 2000-05-19 +S000006978 long_terminal_repeat YGRWsigma4 chromosome 7 7 707195 707534 W 2011-02-03 2000-05-19 Ty3 LTR +S000006984 LTR_retrotransposon YGRWTy3-1 Ty3 chromosome 7 7 707195 712545 W 2011-02-03 2000-05-19 Ty3 element, LTR retrotransposon of the Gypsy (Metaviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; transposition is induced upon exposure to mating pheromone +S000007346 transposable_element_gene YGR109W-A gag protein chromosome 7 7 707610 708482 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000033102 CDS YGR109W-A 7 707610 708482 W 2011-02-03 1999-07-17 +S000007347 transposable_element_gene YGR109W-B gag-pol fusion protein chromosome 7 7 707610 712254 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000033103 CDS YGR109W-B 7 707610 708459 W 2011-02-03 1999-07-17 +S000033104 CDS YGR109W-B 7 708461 712254 W 2011-02-03 1999-07-17 +S000033105 plus_1_translational_frameshift YGR109W-B 7 708460 708460 W 2011-02-03 1999-07-17 +S000006979 long_terminal_repeat YGRWsigma5 chromosome 7 7 712206 712545 W 2011-02-03 2000-05-19 Ty3 LTR +S000006957 long_terminal_repeat YGRCdelta20 chromosome 7 7 713384 713084 C 2011-02-03 2000-05-19 Ty1 LTR +S000003342 ORF Verified YGR110W CLD1 carboxylic ester hydrolase chromosome 7 7 713709 715046 W 2011-02-03 1996-07-31 Mitochondrial cardiolipin-specific phospholipase; functions upstream of Taz1p to generate monolyso-cardiolipin; transcription increases upon genotoxic stress; involved in restricting Ty1 transposition; has homology to mammalian CGI-58 +S000030464 CDS YGR110W 7 713709 715046 W 2011-02-03 1996-07-31 +S000118464 ARS ARS728 ARSVII-715 chromosome 7 7 715312 715377 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000119028 ARS_consensus_sequence ARS728 7 715315 715329 W 2011-02-03 2006-10-03 +S000003343 ORF Uncharacterized YGR111W chromosome 7 7 715828 717030 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000031339 CDS YGR111W 7 715828 717030 W 2011-02-03 1996-07-31 +S000003344 ORF Verified YGR112W SHY1 chromosome 7 L000004140 7 717358 718527 W 2011-02-03 1996-07-31 Mitochondrial inner membrane protein required for complex IV assembly; associates with complex IV assembly intermediates and complex III/complex IV supercomplexes; similar to human SURF1 involved in Leigh Syndrome; complex IV is also known as cytochrome c oxidase +S000031421 CDS YGR112W 7 717358 718527 W 2011-02-03 1996-07-31 +S000003345 ORF Verified YGR113W DAM1 chromosome 7 L000004420 7 718893 719924 W 2011-02-03 2001-05-31|1996-07-31 Essential subunit of the Dam1 complex (aka DASH complex); cooperates with Duo1p to connect the DASH complex with the microtubules (MT); couples kinetochores to the force produced by MT depolymerization thereby aiding in chromosome segregation; Ipl1p target for regulating kinetochore-MT attachments +S000031509 CDS YGR113W 7 718893 719924 W 2011-02-03 2001-05-31|1996-07-31 +S000003348 ORF Verified YGR116W SPT6 chromatin-remodeling histone chaperone SPT6|SSN20|CRE2 chromosome 7 L000002032 7 720409 724764 W 87.64 2011-02-03 1996-07-31 Nucleosome remodeling protein; functions in various aspects of transcription, chromatin maintenance, and RNA processing; required for the maintenance of chromatin structure during transcription in order to inhibit transcription from promoters within the coding region; required for H3K36 trimethylation but not dimethylation by Set2p +S000032690 CDS YGR116W 7 720409 724764 W 2011-02-03 1996-07-31 +S000003346 ORF Dubious YGR114C chromosome 7 7 720654 720265 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; open reading frame overlaps 5' end of the essential gene SPT6 +S000031522 CDS YGR114C 7 720654 720265 C 2011-02-03 1996-07-31 +S000003347 ORF Dubious YGR115C chromosome 7 7 721151 720372 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified and essential ORF SPT6/YGR115C +S000031629 CDS YGR115C 7 721151 720372 C 2011-02-03 1996-07-31 +S000003349 ORF Uncharacterized YGR117C chromosome 7 7 726479 725049 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000032722 CDS YGR117C 7 726479 725049 C 2011-02-03 1996-07-31 +S000003350 ORF Verified YGR118W RPS23A uS12|ribosomal 40S subunit protein S23A|rp37|YS14|S28A|S23A|S12 chromosome 7 L000001764 7 726974 727730 W 2011-02-03 1996-07-31|2011-02-03 Ribosomal protein 28 (rp28) of the small (40S) ribosomal subunit; required for translational accuracy; homologous to mammalian ribosomal protein S23 and bacterial S12; RPS23A has a paralog, RPS23B, that arose from the whole genome duplication; deletion of both RPS23A and RPS23B is lethal +S000033494 CDS YGR118W 7 726974 727038 W 2011-02-03 1996-07-31 +S000033495 CDS YGR118W 7 727358 727730 W 2011-02-03 1996-07-31 +S000033496 intron YGR118W 7 727039 727357 W 2011-02-03 1996-07-31|2011-02-03 +S000003351 ORF Verified YGR119C NUP57 FG-nucleoporin NUP57 chromosome 7 L000002619 7 729671 728046 C 2011-02-03 1996-07-31 FG-nucleoporin component of central core of the nuclear pore complex; contributes directly to nucleocytoplasmic transport and maintenance of the nuclear pore complex (NPC) permeability barrier; found in stable complex with Nic96p and two other FG-nucleoproteins (Nsp1p and Nup49p) +S000033534 CDS YGR119C 7 729671 728046 C 2011-02-03 1996-07-31 +S000003352 ORF Verified YGR120C COG2 Golgi transport complex subunit COG2|SEC35 chromosome 7 L000004877 7 730821 730033 C 2011-02-03 2003-09-22|1996-07-31 Essential component of the conserved oligomeric Golgi complex; a cytosolic tethering complex that functions in protein trafficking to mediate fusion of transport vesicles to Golgi compartments; the components of the Golgi complex are Gog1p through Cog8p +S000034667 CDS YGR120C 7 730821 730033 C 2011-02-03 2003-09-22|1996-07-31 +S000006670 tRNA_gene tN(GUU)G chromosome 7 L000003830 7 731137 731210 W 2011-02-03 2000-05-19 Asparagine tRNA (tRNA-Asn), predicted by tRNAscan-SE analysis +S000030710 noncoding_exon tN(GUU)G 7 731137 731210 W 2011-02-03 2000-05-19 +S000003353 ORF Verified YGR121C MEP1 ammonium permease MEP1|AMT1 chromosome 7 L000001073 7 732927 731449 C 2011-02-03 1996-07-31 Ammonium permease; belongs to a ubiquitous family of cytoplasmic membrane proteins that transport only ammonium (NH4+); expression is under the nitrogen catabolite repression regulation; human homolog RHCG complements yeast null mutant; mutations in human homolog RHCG implicated in metabolic acidosis; MEP1 has a paralog, MEP3, that arose from the whole genome duplication +S000034743 CDS YGR121C 7 732927 731449 C 2011-02-03 1996-07-31 +S000028550 ORF Uncharacterized YGR121W-A chromosome 7 7 733412 733627 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000031236 CDS YGR121W-A 7 733412 733627 W 2011-02-03 2003-07-29 +S000003354 ORF Verified YGR122W chromosome 7 7 733935 735143 W 2011-02-03 1996-07-31 Protein that may be involved in pH regulation; probable ortholog of A. nidulans PalC, which is involved in pH regulation and binds to the ESCRT-III complex; null mutant does not properly process Rim101p and has decreased resistance to rapamycin; GFP-fusion protein is cytoplasmic; relative distribution to cytoplasm increases upon DNA replication stress +S000035706 CDS YGR122W 7 733935 735143 W 2011-02-03 1996-07-31 +S000006969 long_terminal_repeat YGRWdelta21 chromosome 7 7 735542 735872 W 2011-02-03 2000-05-19 Ty1 LTR +S000007240 ORF Dubious YGR122C-A chromosome 7 7 735758 735630 C 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; similar to YLR334C and YOL106W +S000032623 CDS YGR122C-A 7 735758 735630 C 2011-02-03 1999-07-17 +S000006980 long_terminal_repeat YGRWsigma6 chromosome 7 7 735982 736322 W 2011-02-03 2000-05-19 Ty3 LTR +S000006713 tRNA_gene tR(UCU)G3 chromosome 7 L000003831 7 736340 736411 W 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000037332 noncoding_exon tR(UCU)G3 7 736340 736411 W 2011-02-03 2000-05-19 +S000003355 ORF Verified YGR123C PPT1 protein serine/threonine phosphatase chromosome 7 L000002624 7 738203 736662 C 2011-02-03 1996-07-31 Protein serine/threonine phosphatase; regulates Hsp90 chaperone by affecting its ATPase and cochaperone binding activities; has similarity to human phosphatase PP5; present in both the nucleus and cytoplasm; expressed during logarithmic growth +S000035715 CDS YGR123C 7 738203 736662 C 2011-02-03 1996-07-31 +S000006604 tRNA_gene tI(AAU)G chromosome 7 L000003832 7 739122 739195 W 2011-02-03 2000-05-19 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000030407 noncoding_exon tI(AAU)G 7 739122 739195 W 2011-02-03 2000-05-19 +S000003356 ORF Verified YGR124W ASN2 asparagine synthase (glutamine-hydrolyzing) 2 chromosome 7 L000003156 7 739944 741662 W 2011-02-03 1996-07-31 Asparagine synthetase; catalyzes the synthesis of L-asparagine from L-aspartate in the asparagine biosynthetic pathway; ASN2 has a paralog, ASN1, that arose from the whole genome duplication +S000035868 CDS YGR124W 7 739944 741662 W 2011-02-03 1996-07-31 +S000003357 ORF Uncharacterized YGR125W chromosome 7 7 742325 745435 W 2011-02-03 1996-07-31 Putative protein of unknown function; deletion mutant has decreased rapamycin resistance but normal wormannin resistance; green fluorescent protein (GFP)-fusion protein localizes to the vacuole +S000036786 CDS YGR125W 7 742325 745435 W 2011-02-03 1996-07-31 +S000003358 ORF Uncharacterized YGR126W chromosome 7 7 745835 746527 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus and is induced in response to the DNA-damaging agent MMS +S000036861 CDS YGR126W 7 745835 746527 W 2011-02-03 1996-07-31 +S000003359 ORF Uncharacterized YGR127W chromosome 7 7 746798 747736 W 2011-02-03 1996-07-31 Putative protein of unknown function; expression is regulated by Msn2p/Msn4p, indicating a possible role in stress response +S000036917 CDS YGR127W 7 746798 747736 W 2011-02-03 1996-07-31 +S000003360 ORF Verified YGR128C UTP8 chromosome 7 7 750091 747950 C 2011-02-03 1996-07-31 Nucleolar protein required for export of tRNAs from the nucleus; also copurifies with the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA +S000036949 CDS YGR128C 7 750091 747950 C 2011-02-03 1996-07-31 +S000003361 ORF Verified YGR129W SYF2 NTC31 chromosome 7 L000004196 7 750400 751047 W 2011-02-03 1996-07-31 Member of the NineTeen Complex (NTC); NTC contains Prp19p and stabilizes U6 snRNA in catalytic forms of the spliceosome containing U2, U5, and U6 snRNAs; relocalizes to the cytosol in response to hypoxia; isy1 syf2 cells have defective spindles activiating cell cycle arrest +S000037743 CDS YGR129W 7 750400 751047 W 2011-02-03 1996-07-31 +S000003362 ORF Verified YGR130C chromosome 7 7 753844 751394 C 2011-02-03 1996-07-31 Component of the eisosome with unknown function; GFP-fusion protein localizes to the cytoplasm; specifically phosphorylated in vitro by mammalian diphosphoinositol pentakisphosphate (IP7) +S000030568 CDS YGR130C 7 753844 751394 C 2011-02-03 1996-07-31 +S000003363 ORF Verified YGR131W FHN1 chromosome 7 7 754726 755250 W 2011-02-03 1996-07-31 Protein of unknown function; induced by ketoconazole; promoter region contains sterol regulatory element motif, which has been identified as a Upc2p-binding site; overexpression complements function of Nce102p in NCE102 deletion strain; FHN1 has a paralog, NCE102, that arose from the whole genome duplication +S000030762 CDS YGR131W 7 754726 755250 W 2011-02-03 1996-07-31 +S000003364 ORF Verified YGR132C PHB1 prohibitin subunit PHB1 chromosome 7 L000001416|L000001415 7 756452 755589 C 2011-02-03 1996-07-31 Subunit of the prohibitin complex (Phb1p-Phb2p); prohibitin is a 1.2 MDa ring-shaped inner mitochondrial membrane chaperone that stabilizes newly synthesized proteins; determinant of replicative life span; involved in mitochondrial segregation; prohibitin deficiency induces a mitochondrial unfolded protein response (mtUPR) +S000030798 CDS YGR132C 7 756452 755589 C 2011-02-03 1996-07-31 +S000003365 ORF Verified YGR133W PEX4 E2 ubiquitin-protein ligase peroxin 4|UBC10|PAS2 chromosome 7 L000001338 7 756896 757447 W 2011-02-03 1996-07-31 Peroxisomal ubiquitin conjugating enzyme; required for peroxisomal matrix protein import and peroxisome biogenesis +S000031790 CDS YGR133W 7 756896 757447 W 2011-02-03 1996-07-31 +S000003366 ORF Verified YGR134W CAF130 CCR4-NOT core subunit CAF130 chromosome 7 7 757770 761138 W 2011-02-03 1996-07-31 Subunit of the CCR4-NOT transcriptional regulatory complex; CCR4-NOT complex is evolutionarily-conserved and involved in controlling mRNA initiation, elongation, and degradation +S000031982 CDS YGR134W 7 757770 761138 W 2011-02-03 1996-07-31 +S000003367 ORF Verified YGR135W PRE9 proteasome core particle subunit alpha 3 chromosome 7 L000002701 7 761392 762168 W 2011-02-03 1996-07-31 Alpha 3 subunit of the 20S proteasome; the only nonessential 20S subunit; may be replaced by the alpha 4 subunit (Pre6p) under stress conditions to create a more active proteasomal isoform +S000032101 CDS YGR135W 7 761392 762168 W 2011-02-03 1996-07-31 +S000003368 ORF Verified YGR136W LSB1 chromosome 7 7 762428 763153 W 2011-02-03 1996-07-31 Negative regulator of actin nucleation-promoting factor activity; interacts with Las17p, a homolog of human Wiskott-Aldrich Syndrome protein (WASP), via an N-terminal SH3 domain, and along with PIN3 cooperatively inhibits the nucleation of actin filaments; overexpression blocks receptor-mediated endocytosis; protein increases in abundance and forms nuclear foci in response to DNA replication stress; LSB1 has a paralog, PIN3, that arose from the whole genome duplication +S000033027 CDS YGR136W 7 762428 763153 W 2011-02-03 1996-07-31 +S000003369 ORF Dubious YGR137W chromosome 7 7 762888 763262 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033117 CDS YGR137W 7 762888 763262 W 2011-02-03 1996-07-31 +S000003370 ORF Verified YGR138C TPO2 spermine transporter chromosome 7 7 765606 763762 C 2011-02-03 1996-07-31 Polyamine transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; specific for spermine; localizes to the plasma membrane; transcription of TPO2 is regulated by Haa1p; TPO2 has a paralog, TPO3, that arose from the whole genome duplication +S000033153 CDS YGR138C 7 765606 763762 C 2011-02-03 1996-07-31 +S000003371 ORF Dubious YGR139W chromosome 7 7 765726 766064 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034004 CDS YGR139W 7 765726 766064 W 2011-02-03 1996-07-31 +S000003372 ORF Verified YGR140W CBF2 CSL5|NDC10|CTF14|CEP2|CBF3A chromosome 7 L000000430|L000001238|L000000221 7 767429 770299 W 2011-02-03 1996-07-31 Essential kinetochore protein; component of the CBF3 multisubunit complex that binds to the CDEIII region of the centromere; Cbf2p also binds to the CDEII region possibly forming a different multimeric complex, ubiquitinated in vivo; sumoylated in an Mms21p-dependent manner; relative distribution to the spindle pole body decreases upon DNA replication stress +S000034959 CDS YGR140W 7 767429 770299 W 2011-02-03 1996-07-31 +S000003373 ORF Verified YGR141W VPS62 chromosome 7 7 770569 771972 W 2011-02-03 1996-07-31 Vacuolar protein sorting (VPS) protein; required for cytoplasm to vacuole targeting of proteins; VPS62 has a paralog, TDA6, that arose from the whole genome duplication +S000035068 CDS YGR141W 7 770569 771972 W 2011-02-03 1996-07-31 +S000003374 ORF Verified YGR142W BTN2 chromosome 7 7 772454 773686 W 2011-02-03 1996-07-31 v-SNARE binding protein; facilitates specific protein retrieval from a late endosome to the Golgi; modulates arginine uptake, possible role in mediating pH homeostasis between the vacuole and plasma membrane H(+)-ATPase; contributes to prion curing; preferentially expressed after severe ethanol stress +S000035175 CDS YGR142W 7 772454 773686 W 2011-02-03 1996-07-31 +S000006970 long_terminal_repeat YGRWdelta22 chromosome 7 7 774040 774162 W 2011-02-03 2000-05-19 Ty1 LTR +S000006512 tRNA_gene tA(AGC)G chromosome 7 L000003833 7 774349 774421 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032279 noncoding_exon tA(AGC)G 7 774349 774421 W 2011-02-03 2000-05-19 +S000003375 ORF Verified YGR143W SKN1 beta-glucan synthesis-associated protein SKN1 chromosome 7 L000001907 7 775193 777508 W 88.14 2011-02-03 1996-07-31 Protein involved in sphingolipid biosynthesis; type II membrane protein; SKN1 has a paralog, KRE6, that arose from the whole genome duplication +S000036052 CDS YGR143W 7 775193 777508 W 2011-02-03 1996-07-31 +S000118465 ARS ARS729 ARSVII-778 chromosome 7 7 777966 778214 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119029 ARS_consensus_sequence ARS729 7 778014 778028 W 2011-02-03 2006-10-03 +S000178103 ARS_consensus_sequence ARS729 7 778196 778180 C 2014-11-18 2014-11-18 +S000006971 long_terminal_repeat YGRWdelta23 chromosome 7 7 778784 779112 W 2011-02-03 2000-05-19 Ty1 LTR +S000006972 long_terminal_repeat YGRWdelta24 chromosome 7 7 779116 779224 W 2011-02-03 2000-05-19 Ty1 LTR +S000006958 long_terminal_repeat YGRCdelta25 chromosome 7 7 779515 779225 C 2011-02-03 2000-05-19 Ty1 LTR +S000006590 tRNA_gene tG(UCC)G SUF4 chromosome 7 L000002152|L000003834 7 779616 779687 W 105 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis; can mutate to suppress +1 frameshift mutations in glycine codons +S000037534 noncoding_exon tG(UCC)G 7 779616 779687 W 2011-02-03 2000-05-19 +S000003376 ORF Verified YGR144W THI4 thiamine thiazole synthase|MOL1|ESP35 chromosome 7 L000001133|L000000585 7 780399 781379 W 2011-02-03 1996-07-31 Thiazole synthase; abundant protein involved in the formation of the thiazole moiety of thiamine during thiamine biosynthesis; acts more as a co-substrate rather than an enzyme by providing the sulphur source for thiazole formation; undergoes a single turnover only; required for mitochondrial genome stability in response to DNA damaging agents +S000036192 CDS YGR144W 7 780399 781379 W 2011-02-03 1996-07-31 +S000003377 ORF Verified YGR145W ENP2 ribosome biosynthesis protein ENP2 chromosome 7 7 781767 783890 W 2011-02-03 1996-07-31|2011-02-03 Component of the SSU; required for pre-18S rRNA processing, biogenesis of the small ribosomal subunit; interacts with U3 snoRNA, Mpp10p and Bfr2p; contains WD repeats, and has homology to Spb1p +S000029871 CDS YGR145W 7 781767 783890 W 2011-02-03 1996-07-31|2011-02-03 +S000003378 ORF Verified YGR146C ECL1 chromosome 7 7 784858 784223 C 2011-02-03 1996-07-31 Protein of unknown function; mitochondrial-dependent role in the extension of chronological lifespan; overexpression increases oxygen consumption and respiratory activity while deletion results in reduced oxygen consumption under conditions of caloric restriction; induced by iron homeostasis transcription factor Aft2p; multicopy suppressor of temperature sensitive hsf1 mutant; induced by treatment with 8-methoxypsoralen and UVA irradiation +S000031718 CDS YGR146C 7 784858 784223 C 2011-02-03 1996-07-31 +S000028638 ORF Uncharacterized YGR146C-A chromosome 7 7 785437 785276 C 2011-02-03 2003-07-29 Putative protein of unknown function +S000032394 CDS YGR146C-A 7 785437 785276 C 2011-02-03 2003-07-29 +S000003379 ORF Verified YGR147C NAT2 chromosome 7 L000001233 7 786920 786054 C 2011-02-03 1996-07-31 Protein of unknown function; has an apparent role in acetylation of N-terminal methionine residues +S000031870 CDS YGR147C 7 786920 786054 C 2011-02-03 1996-07-31 +S000003380 ORF Verified YGR148C RPL24B eL24|ribosomal 60S subunit protein L24B|L24e|rp29|YL21|L30B|L24B|RPL30B chromosome 7 L000001725 7 787779 787312 C 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L24B; not essential for translation but may be required for normal translation rate; homologous to mammalian ribosomal protein L24, no bacterial homolog; RPL24B has a paralog, RPL24A, that arose from the whole genome duplication +S000031971 CDS YGR148C 7 787779 787312 C 2011-02-03 1996-07-31 +S000122102 five_prime_UTR_intron YGR148C 7 788178 787787 C 2011-02-03 2007-04-04 +S000003381 ORF Verified YGR149W GPC1 chromosome 7 7 789031 790329 W 2011-02-03 1996-07-31 Glycerophosphocholine acyltransferase (GPCAT); involved in in phosphatidylcholine (PC) synthesis; uses acetyl-CoA to acylate glycero-3-phosphocholine to yield lyso-PC; also catalyzes acylation of glycerophosphoethanolamine with acyl-CoA; predicted to be an integal membrane protein +S000037495 CDS YGR149W 7 789031 790329 W 2011-02-03 1996-07-31 +S000003382 ORF Verified YGR150C CCM1 DMR1|RRG2 chromosome 7 7 793053 790459 C 2011-02-03 1996-07-31 Mitochondrial 15S rRNA-binding protein; required for intron removal of COB and COX1 pre-mRNAs; has separable roles in stabilizing mitochondrial 15S rRNA and in maturation of the COB and COX1 mRNAs; contains pentatricopeptide repeat (PPR) motifs; mutant is respiratory deficient and has defective plasma membrane electron transport +S000036478 CDS YGR150C 7 793053 790459 C 2011-02-03 1996-07-31 +S000006973 long_terminal_repeat YGRWdelta26 chromosome 7 7 793237 793559 W 2011-02-03 2000-05-19 Ty1 LTR +S000006523 tRNA_gene tA(UGC)G chromosome 7 L000003835 7 794417 794489 W 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 5 nuclear tRNA genes containing the tDNA-anticodon TGC (mature tRNA may be UGC or may contain modified bases), decodes GCA and probably GCG codons into alanine, one of 16 nuclear tRNAs for alanine +S000034874 noncoding_exon tA(UGC)G 7 794417 794489 W 2011-02-03 2000-05-19 +S000003383 ORF Dubious YGR151C chromosome 7 7 794990 794655 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps almost completely with the verified ORF RSR1/BUD1/YGR152C; relative distribution to the nucleus increases upon DNA replication stress +S000037176 CDS YGR151C 7 794990 794655 C 2011-02-03 1996-07-31 +S000003384 ORF Verified YGR152C RSR1 Ras family GTPase RSR1|BUD1 chromosome 7 L000001780 7 795492 794674 C 98 2011-02-03 1996-07-31 GTP-binding protein of the Ras superfamily; required for bud site selection, morphological changes in response to mating pheromone, and efficient cell fusion; localized to the plasma membrane; significantly similar to mammalian Rap GTPases +S000037247 CDS YGR152C 7 795492 794674 C 2011-02-03 1996-07-31 +S000003385 ORF Uncharacterized YGR153W TOS10 chromosome 7 7 796092 796745 W 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function +S000037368 CDS YGR153W 7 796092 796745 W 2011-02-03 1996-07-31|2011-02-03 +S000003386 ORF Verified YGR154C GTO1 omega-class glutathione transferase chromosome 7 7 797868 796798 C 2011-02-03 1996-07-31 Omega-class glutathione transferase; induced under oxidative stress; putative peroxisomal localization +S000037395 CDS YGR154C 7 797868 796798 C 2011-02-03 1996-07-31 +S000003387 ORF Verified YGR155W CYS4 cystathionine beta-synthase CYS4|VMA41|STR4|NHS5 chromosome 7 L000001248|L000000471 7 798543 800066 W 87.14 2011-02-03 1996-07-31 Cystathionine beta-synthase; catalyzes synthesis of cystathionine from serine and homocysteine, the first committed step in cysteine biosynthesis; responsible for hydrogen sulfide generation; advances passage through START by promoting cell growth which requires catalytic activity, and reducing critical cell size independent of catalytic activity; mutations in human ortholog CBS cause homocystinuria; human CBS can complement yeast null mutant +S000030070 CDS YGR155W 7 798543 800066 W 2011-02-03 1996-07-31 +S000003388 ORF Verified YGR156W PTI1 cleavage polyadenylation factor subunit PTI1 chromosome 7 7 800546 801823 W 2011-02-03 1996-07-31 Essential component of CPF (cleavage and polyadenylation factor); involved in 3' end formation of snoRNA and mRNA; interacts directly with Pta1p; relocalizes to the cytosol in response to hypoxia; similar to mammalian Cleavage-Stimulation Factor CstF-64 +S000030236 CDS YGR156W 7 800546 801823 W 2011-02-03 1996-07-31 +S000003389 ORF Verified YGR157W CHO2 phosphatidylethanolamine N-methyltransferase|PEM1 chromosome 7 L000000328 7 802440 805049 W 2011-02-03 1996-07-31 Phosphatidylethanolamine methyltransferase (PEMT); catalyzes the first step in the conversion of phosphatidylethanolamine to phosphatidylcholine during the methylation pathway of phosphatidylcholine biosynthesis +S000030380 CDS YGR157W 7 802440 805049 W 2011-02-03 1996-07-31 +S000003390 ORF Verified YGR158C MTR3 exosome non-catalytic core subunit MTR3 chromosome 7 L000003982 7 806021 805269 C 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hMtr3p (EXOSC6) +S000033622 CDS YGR158C 7 806021 805269 C 2011-02-03 1996-07-31 +S000003392 ORF Dubious YGR160W chromosome 7 7 807073 807684 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033399 CDS YGR160W 7 807073 807684 W 2011-02-03 1996-07-31 +S000003391 ORF Verified YGR159C NSR1 SHE5 chromosome 7 L000001278 7 807656 806412 C 2011-02-03 1996-07-31 Nucleolar protein that binds nuclear localization sequences; required for pre-rRNA processing and ribosome biogenesis; binds to single stranded telomeric DNA and mRNA; methylated by Hmt1p; interaction with Top1p and nucleolar localization are negatively regulated by polyphosphorylation +S000033736 CDS YGR159C 7 807656 806412 C 2011-02-03 1996-07-31 +S000003393 ORF Uncharacterized YGR161C RTS3 chromosome 7 7 809420 808629 C 2011-02-03 1996-07-31 Putative component of the protein phosphatase type 2A complex +S000033431 CDS YGR161C 7 809420 808629 C 2011-02-03 1996-07-31 +S000029726 ORF Uncharacterized YGR161W-C chromosome 7 7 810227 810505 W 2011-02-03 2004-08-27 Putative protein of unknown function; identified by sequence comparison with hemiascomycetous yeast species +S000036877 CDS YGR161W-C 7 810227 810505 W 2011-02-03 2004-08-27 +S000006974 long_terminal_repeat YGRWdelta27 chromosome 7 7 811447 811778 W 2011-02-03 2000-05-19 Ty2 LTR +S000006983 LTR_retrotransposon YGRWTy2-2 Ty2 chromosome 7 7 811447 817397 W 2011-02-03 2000-05-19 Ty2 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007369 transposable_element_gene YGR161W-A gag protein chromosome 7 7 811738 813054 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000030119 CDS YGR161W-A 7 811738 813054 W 2011-02-03 1999-07-17 +S000007370 transposable_element_gene YGR161W-B gag-pol fusion protein chromosome 7 S000029014 7 811738 817051 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000030122 CDS YGR161W-B 7 811738 813030 W 2011-02-03 1999-07-17 +S000030123 CDS YGR161W-B 7 813032 817051 W 2011-02-03 1999-07-17 +S000030124 plus_1_translational_frameshift YGR161W-B 7 813031 813031 W 2011-02-03 1999-07-17 +S000006975 long_terminal_repeat YGRWdelta28 chromosome 7 7 817074 817397 W 2011-02-03 2000-05-19 Ty2 LTR +S000006959 long_terminal_repeat YGRCdelta29 chromosome 7 7 817724 817393 C 2011-02-03 2000-05-19 Ty1 LTR +S000007368 transposable_element_gene YGR161C-D gag-pol fusion protein chromosome 7 7 823015 817747 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000036390 CDS YGR161C-D 7 821709 817747 C 2011-02-03 1999-07-17 +S000036389 CDS YGR161C-D 7 823015 821711 C 2011-02-03 1999-07-17 +S000036391 plus_1_translational_frameshift YGR161C-D 7 821710 821710 C 2011-02-03 1999-07-17 +S000007367 transposable_element_gene YGR161C-C gag protein chromosome 7 7 823015 821693 C 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000036388 CDS YGR161C-C 7 823015 821693 C 2011-02-03 1999-07-17 +S000006963 LTR_retrotransposon YGRCTy1-3 Ty1 chromosome 7 7 823306 817393 C 2011-02-03 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000006960 long_terminal_repeat YGRCdelta30 chromosome 7 7 823306 822975 C 2011-02-03 2000-05-19 Ty1 LTR +S000006756 tRNA_gene tV(AAC)G2 chromosome 7 L000003836 7 823482 823555 W 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000036904 noncoding_exon tV(AAC)G2 7 823482 823555 W 2011-02-03 2000-05-19 +S000003394 ORF Verified YGR162W TIF4631 translation initiation factor eIF4G|eiF4G1 chromosome 7 L000002309 7 824059 826917 W 2011-02-03 1996-07-31 Translation initiation factor eIF4G; subunit of the mRNA cap-binding protein complex (eIF4F) that also contains eIF4E (Cdc33p); interacts with Pab1p and with eIF4A (Tif1p); also has a role in biogenesis of the large ribosomal subunit; TIF4631 has a paralog, TIF4632, that arose from the whole genome duplication +S000033543 CDS YGR162W 7 824059 826917 W 2011-02-03 1996-07-31 +S000003395 ORF Verified YGR163W GTR2 chromosome 7 L000004611 7 827552 828577 W 2011-02-03 1996-07-31 Subunit of a TORC1-stimulating GTPase complex; subunit of the Gtr1-Gtr2 GTPase complex that stimulates TORC1 in response to amino acid stimulation; stimulates the GTPase activity of Gtr1p; negatively regulates the Ran/Tc4 GTPase cycle; activates transcription; tethered to the vacuolar membrane as part of the EGO complex (EGOC); required for sorting of Gap1p; activated by the the Lst4p-Lst7p GAP complex; localizes to cytoplasm and to chromatin; homolog of human RagC and +S000033603 CDS YGR163W 7 827552 828577 W 2011-02-03 1996-07-31 +S000003396 ORF Dubious YGR164W chromosome 7 7 828625 828960 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034546 CDS YGR164W 7 828625 828960 W 2011-02-03 1996-07-31 +S000006712 tRNA_gene tR(UCU)G2 chromosome 7 L000003843 7 828794 828723 C 2011-02-03 2000-05-19 Arginine tRNA (tRNA-Arg), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon UCU (converted to mcm5-UCU in the mature tRNA), decodes AGA codons into arginine, one of 19 nuclear tRNAs for arginine +S000037330 noncoding_exon tR(UCU)G2 7 828794 828723 C 2011-02-03 2000-05-19 +S000003397 ORF Verified YGR165W MRPS35 mitochondrial 37S ribosomal protein MRPS35 chromosome 7 7 829116 830153 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit; null mutant does not grow on glycerol, is sensitive to 2,4-dichlorophenol, and accumulates large lipid droplets +S000034612 CDS YGR165W 7 829116 830153 W 2011-02-03 1996-07-31 +S000003398 ORF Verified YGR166W TRS65 KRE11 chromosome 7 L000000918 7 830515 832197 W 154.34 2011-02-03 1996-07-31 Component of transport protein particle (TRAPP) complex II; TRAPPII is a multimeric guanine nucleotide-exchange factor for the GTPase Ypt1p, regulating intra-Golgi and endosome-Golgi traffic; role in cell wall beta-glucan biosynthesis and the stress response +S000034756 CDS YGR166W 7 830515 832197 W 2011-02-03 1996-07-31 +S000003399 ORF Verified YGR167W CLC1 SCD4 chromosome 7 L000000355 7 832456 833157 W 2011-02-03 1996-07-31 Clathrin light chain; subunit of the major coat protein involved in intracellular protein transport and endocytosis; regulates endocytic progression; thought to regulate clathrin function; the clathrin triskelion is a trimeric molecule composed of three heavy chains that radiate from a vertex and three light chains which bind noncovalently near the vertex of the triskelion +S000035721 CDS YGR167W 7 832456 833157 W 2011-02-03 1996-07-31 +S000003400 ORF Uncharacterized YGR168C chromosome 7 7 834482 833352 C 2011-02-03 1996-07-31 Putative protein of unknown function; YGR168C is not an essential gene +S000035768 CDS YGR168C 7 834482 833352 C 2011-02-03 1996-07-31 +S000118466 ARS ARS731 ARSVII-835 chromosome 7 7 834491 834734 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119030 ARS_consensus_sequence ARS731 7 834664 834650 C 2011-02-03 2006-10-03 +S000003401 ORF Verified YGR169C PUS6 pseudouridine synthase PUS6 chromosome 7 7 835903 834689 C 2011-02-03 1996-07-31 tRNA:pseudouridine synthase; catalyzes the conversion of uridine to pseudouridine at position 31 in cytoplasmic and mitochondrial tRNAs; mutation of Asp168 to Ala abolishes enzyme activity; not essential for viability +S000035880 CDS YGR169C 7 835903 834689 C 2011-02-03 1996-07-31 +S000028521 ORF Verified YGR169C-A LSO2 YGR169C-C chromosome 7 7 836665 836387 C 2011-02-03 2003-07-29 Protein with a potential role in response to iron deprivation; localizes to nucleus and cytoplasm, and nuclear localization is enhanced under iron-replete conditions; null mutant exhibits slow growth during iron deprivation; LSO2 has a paralog, LSO1, that arose from the whole genome duplication +S000030316 CDS YGR169C-A 7 836665 836387 C 2011-02-03 2003-07-29 +S000003402 ORF Verified YGR170W PSD2 phosphatidylserine decarboxylase 2 chromosome 7 L000002817 7 837142 840558 W 2011-02-03 1996-07-31 Phosphatidylserine decarboxylase of the Golgi and vacuolar membranes; converts phosphatidylserine to phosphatidylethanolamine; controls vacuolar membrane phospholipid content by regulating phospholipids in compartments that will eventually give rise to the vacuole; loss of Psd2p causes a specific reduction in vacuolar membrane PE levels while total PE levels are not significantly affected +S000036827 CDS YGR170W 7 837142 840558 W 2011-02-03 1996-07-31 +S000003403 ORF Verified YGR171C MSM1 methionine--tRNA ligase MSM1 chromosome 7 L000001196 7 842551 840824 C 2011-02-03 1996-07-31 Mitochondrial methionyl-tRNA synthetase (MetRS); functions as a monomer in mitochondrial protein synthesis; functions similarly to cytoplasmic MetRS although the cytoplasmic form contains a zinc-binding domain not found in Msm1p +S000036868 CDS YGR171C 7 842551 840824 C 2011-02-03 1996-07-31 +S000003404 ORF Verified YGR172C YIP1 transporter YIP1 chromosome 7 L000003259 7 843591 842845 C 2011-02-03 1996-07-31 Integral membrane protein; required for the biogenesis of ER-derived COPII transport vesicles; interacts with Yif1p and Yos1p; localizes to the Golgi, the ER, and COPII vesicles; human homolog YIPF5 can complement yeast yip1 mutant +S000037595 CDS YGR172C 7 843591 842845 C 2011-02-03 1996-07-31 +S000003405 ORF Verified YGR173W RBG2 GIR1 chromosome 7 7 843854 844960 W 2011-02-03 1996-07-31 Protein with a role in translation; forms a complex with Gir2p; has similarity to mammalian developmentally regulated GTP-binding protein +S000037694 CDS YGR173W 7 843854 844960 W 2011-02-03 1996-07-31 +S000006981 long_terminal_repeat YGRWsigma7 chromosome 7 7 845281 845602 W 2011-02-03 2000-05-19 Ty3 LTR +S000006581 tRNA_gene tG(GCC)G1 chromosome 7 L000003837 7 845649 845719 W 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000037454 noncoding_exon tG(GCC)G1 7 845649 845719 W 2011-02-03 2000-05-19 +S000003406 ORF Verified YGR174C CBP4 chromosome 7 L000000227 7 846405 845893 C 2011-02-03 1996-07-31 Mitochondrial protein required for assembly of cytochrome bc1 complex; interacts with the Cbp3p-Cbp6p complex and newly synthesized cytochrome b (Cobp) to promote assembly of Cobp into the cytochrome bc1 complex +S000037715 CDS YGR174C 7 846405 845893 C 2011-02-03 1996-07-31 +S000028639 ORF Uncharacterized YGR174W-A chromosome 7 7 846655 846741 W 2011-02-03 2003-07-29 Putative protein of unknown function; predicted to have a role in cell budding based on computational "guilt by association" analysis +S000032395 CDS YGR174W-A 7 846655 846741 W 2011-02-03 2003-07-29 +S000003407 ORF Verified YGR175C ERG1 squalene monooxygenase chromosome 7 L000000568 7 848423 846933 C 2011-02-03 1996-07-31 Squalene epoxidase; catalyzes the epoxidation of squalene to 2,3-oxidosqualene; plays an essential role in the ergosterol-biosynthesis pathway and is the specific target of the antifungal drug terbinafine; human SQLE functionally complements the lethality of the erg1 null mutation +S000037776 CDS YGR175C 7 848423 846933 C 2011-02-03 1996-07-31 +S000003408 ORF Dubious YGR176W chromosome 7 7 848720 849067 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030672 CDS YGR176W 7 848720 849067 W 2011-02-03 1996-07-31 +S000003409 ORF Verified YGR177C ATF2 alcohol O-acetyltransferase chromosome 7 L000003345 7 850436 848829 C 2011-02-03 1996-07-31 Alcohol acetyltransferase; may play a role in steroid detoxification; forms volatile esters during fermentation, which is important for brewing and winemaking +S000030746 CDS YGR177C 7 850436 848829 C 2011-02-03 1996-07-31 +S000003410 ORF Verified YGR178C PBP1 MRS16 chromosome 7 L000003967 7 853215 851047 C 2011-02-03 1996-07-31 Component of glucose deprivation induced stress granules; involved in P-body-dependent granule assembly; similar to human ataxin-2; interacts with Pab1p to regulate mRNA polyadenylation; interacts with Mkt1p to regulate HO translation; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress +S000030834 CDS YGR178C 7 853215 851047 C 2011-02-03 1996-07-31 +S000003411 ORF Verified YGR179C OKP1 chromosome 7 7 854895 853675 C 2011-02-03 1996-07-31 Outer kinetochore protein required for accurate chromosome segregation; component of COMA (Ctf19p, Okp1p, Mcm21p, Ame1p) a kinetochore sub-complex which functions as a platform for kinetochore assembly; orthologous to human centromere constitutive-associated network (CCAN) subunit CENP-Q and fission yeast fta7 +S000031845 CDS YGR179C 7 854895 853675 C 2011-02-03 1996-07-31 +S000003412 ORF Verified YGR180C RNR4 ribonucleotide-diphosphate reductase subunit RNR4|PSO3|CRT3 chromosome 7 L000002819|S000029396|L000004184 7 856301 855264 C 2011-02-03 1996-07-31 Ribonucleotide-diphosphate reductase (RNR) small subunit; the RNR complex catalyzes the rate-limiting step in dNTP synthesis and is regulated by DNA replication and DNA damage checkpoint pathways via localization of the small subunits; relocalizes from nucleus to cytoplasm upon DNA replication stress; RNR4 has a paralog, RNR2, that arose from the whole genome duplication +S000031850 CDS YGR180C 7 856301 855264 C 2011-02-03 1996-07-31 +S000006641 tRNA_gene tL(CAA)G3 chromosome 7 L000003842 7 857491 857378 C 2011-02-03 2000-05-19 Leucine tRNA (tRNA-Leu), predicted by tRNAscan-SE analysis +S000034251 intron tL(CAA)G3 7 857453 857422 C 2011-02-03 2000-05-19 +S000034250 noncoding_exon tL(CAA)G3 7 857421 857378 C 2011-02-03 2000-05-19 +S000034249 noncoding_exon tL(CAA)G3 7 857491 857454 C 2011-02-03 2000-05-19 +S000003413 ORF Verified YGR181W TIM13 protein translocase subunit TIM13 chromosome 7 7 858287 858604 W 2011-02-03 1996-07-31 Mitochondrial intermembrane space protein; forms a complex with Tim8p that delivers a subset of hydrophobic proteins to the TIM22 complex for insertion into the inner membrane +S000032812 CDS YGR181W 7 858287 858604 W 2011-02-03 1996-07-31 +S000003414 ORF Dubious YGR182C chromosome 7 7 858904 858551 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF TIM13/YGR181W +S000032855 CDS YGR182C 7 858904 858551 C 2011-02-03 1996-07-31 +S000003415 ORF Verified YGR183C QCR9 ubiquinol--cytochrome-c reductase subunit 9|UCR9 chromosome 7 L000001549 7 859476 859063 C 148 2011-02-03 1996-07-31 Subunit 9 of ubiquinol cytochrome-c reductase (Complex III); Complex III is a component of the mitochondrial inner membrane electron transport chain; required for electron transfer at the ubiquinol oxidase site of the complex +S000032944 CDS YGR183C 7 859260 859063 C 2011-02-03 1996-07-31 +S000032943 CDS YGR183C 7 859476 859474 C 2011-02-03 1996-07-31 +S000032945 intron YGR183C 7 859473 859261 C 2011-02-03 1996-07-31 +S000003416 ORF Verified YGR184C UBR1 E3 ubiquitin-protein ligase UBR1|PTR1 chromosome 7 L000002420 7 865753 859901 C 2011-02-03 1996-07-31 E3 ubiquitin ligase (N-recognin); heterodimerizes with Rad6p to recognize and ubiquitinate substrates of the N-end rule pathway; role in endoplasmic reticulum-associated protein degradation (ERAD) in the absence of canonical ER membrane ligases or after stress; major role in targeting misfolded cytosolic proteins for degradation; regulates peptide transport via Cup9p ubiquitination; mutation in human UBR1 causes Johansson-Blizzard Syndrome (JBS) +S000033034 CDS YGR184C 7 865753 859901 C 2011-02-03 1996-07-31 +S000003417 ORF Verified YGR185C TYS1 tyrosine--tRNA ligase TYS1|TyrRS|TTS1 chromosome 7 L000001105 7 867520 866336 C 2011-02-03 1996-07-31 Cytoplasmic tyrosyl-tRNA synthetase; required for cytoplasmic protein synthesis; interacts with positions 34 and 35 of the tRNATyr anticodon; mutations in human ortholog YARS are associated with Charcot-Marie-Tooth (CMT) neuropathies; human ortholog YARS functionally complements the heat sensitivity of a ts allele; protein abundance increases in response to DNA replication stress +S000033686 CDS YGR185C 7 867520 866336 C 2011-02-03 1996-07-31 +S000003418 ORF Verified YGR186W TFG1 transcription factor IIF subunit TFG1|RAP74|SSU71 chromosome 7 L000002594 7 867774 869981 W 2011-02-03 1996-07-31 TFIIF (Transcription Factor II) largest subunit; involved in both transcription initiation and elongation of RNA polymerase II; homologous to human RAP74 +S000033854 CDS YGR186W 7 867774 869981 W 2011-02-03 1996-07-31 +S000003419 ORF Verified YGR187C HGH1 chromosome 7 L000003003 7 871416 870232 C 2011-02-03 1996-07-31 Nonessential protein of unknown function; predicted to be involved in ribosome biogenesis; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; similar to mammalian BRP16 (Brain protein 16); relative distribution to the nucleus increases upon DNA replication stress +S000033880 CDS YGR187C 7 871416 870232 C 2011-02-03 1996-07-31 +S000003420 ORF Verified YGR188C BUB1 protein kinase BUB1 chromosome 7 L000000196 7 875109 872044 C 150 2011-02-03 1996-07-31 Protein kinase involved in the cell cycle checkpoint into anaphase; in complex with Mad1p and Bub3p, prevents progression into anaphase in presence of spindle damage; Cdc28p-mediated phosphorylation at Bub1p-T566 is important for degradation in anaphase and adaptation of checkpoint to prolonged mitotic arrest; associates with centromere DNA via Skp1p; involved in Sgo1p relocalization in response to sister kinetochore tension; paralog MAD3 arose from whole genome duplication +S000034040 CDS YGR188C 7 875109 872044 C 2011-02-03 1996-07-31 +S000006976 long_terminal_repeat YGRWdelta31 chromosome 7 7 875951 876279 W 2011-02-03 2000-05-19 Ty1 LTR +S000006623 tRNA_gene tK(CUU)G3 chromosome 7 L000003838 7 876394 876466 W 2011-02-03 2000-05-19 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000029892 noncoding_exon tK(CUU)G3 7 876394 876466 W 2011-02-03 2000-05-19 +S000003421 ORF Verified YGR189C CRH1 transglycosylase chromosome 7 S000007423 7 878192 876669 C 2011-02-03 1996-07-31 Chitin transglycosylase; functions in the transfer of chitin to beta(1-6) and beta(1-3) glucans in the cell wall; similar and functionally redundant to Utr2; localizes to sites of polarized growth; expression induced by cell wall stress +S000034926 CDS YGR189C 7 878192 876669 C 2011-02-03 1996-07-31 +S000006772 tRNA_gene tW(CCA)G2 chromosome 7 L000003841 7 878815 878710 C 2011-02-03 2000-05-19 Tryptophan tRNA (tRNA-Trp), predicted by tRNAscan-SE analysis +S000032530 intron tW(CCA)G2 7 878779 878746 C 2011-02-03 2000-05-19 +S000032529 noncoding_exon tW(CCA)G2 7 878745 878710 C 2011-02-03 2000-05-19 +S000032528 noncoding_exon tW(CCA)G2 7 878815 878780 C 2011-02-03 2000-05-19 +S000003423 ORF Verified YGR191W HIP1 histidine permease chromosome 7 L000000775 7 880420 882231 W 146 2011-02-03 1996-07-31 High-affinity histidine permease; also involved in the transport of manganese ions +S000036175 CDS YGR191W 7 880420 882231 W 2011-02-03 1996-07-31 +S000003422 ORF Dubious YGR190C chromosome 7 7 880661 880296 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene HIP1/YGR191W +S000035932 CDS YGR190C 7 880661 880296 C 2011-02-03 1996-07-31 +S000003424 ORF Verified YGR192C TDH3 glyceraldehyde-3-phosphate dehydrogenase (phosphorylating) TDH3|GAPDH|GPD|SSS2|HSP36|HSP35|GLD1 chromosome 7 L000002274 7 883810 882812 C 2011-02-03 1996-07-31 Glyceraldehyde-3-phosphate dehydrogenase (GAPDH), isozyme 3; involved in glycolysis and gluconeogenesis; tetramer that catalyzes the reaction of glyceraldehyde-3-phosphate to 1,3 bis-phosphoglycerate; detected in the cytoplasm and cell wall; GAPDH-derived antimicrobial peptides secreted by S. cerevisiae are active against a wide variety of wine-related yeasts and bacteria; binds AU-rich RNA +S000036226 CDS YGR192C 7 883810 882812 C 2011-02-03 1996-07-31 +S000003425 ORF Verified YGR193C PDX1 chromosome 7 L000001369 7 885741 884509 C 2011-02-03 1996-07-31 E3-binding protein of the mitochondrial pyruvate dehydrogenase complex; plays a structural role in the complex by binding and positioning dihydrolipoamide dehydrogenase (E3) to the dihydrolipoamide acetyltransferase (E2) core +S000036958 CDS YGR193C 7 885741 884509 C 2011-02-03 1996-07-31 +S000003426 ORF Verified YGR194C XKS1 xylulokinase chromosome 7 7 887875 886073 C 2011-02-03 1996-07-31 Xylulokinase; converts D-xylulose and ATP to xylulose 5-phosphate and ADP; rate limiting step in fermentation of xylulose; required for xylose fermentation by recombinant S. cerevisiae strains +S000037017 CDS YGR194C 7 887875 886073 C 2011-02-03 1996-07-31 +S000119032 ARS ARS737 ARSVII-888|ARS731.5 chromosome 7 7 888413 888493 2014-11-18 2014-11-18|2006-10-03 Autonomously Replicating Sequence +S000119033 ARS_consensus_sequence ARS737 7 888414 888430 W 2014-11-18 2014-11-18|2006-10-03 +S000003427 ORF Verified YGR195W SKI6 exosome non-catalytic core subunit SKI6|RRP41|ECM20 chromosome 7 L000003895|L000004426 7 888882 889622 W 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; has similarity to E. coli RNase PH and to human hRrp41p (EXOSC4) +S000037164 CDS YGR195W 7 888882 889622 W 2011-02-03 1996-07-31 +S000003428 ORF Verified YGR196C FYV8 chromosome 7 7 892186 889733 C 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin +S000037853 CDS YGR196C 7 892186 889733 C 2011-02-03 1996-07-31 +S000003429 ORF Verified YGR197C SNG1 chromosome 7 L000002747 7 894140 892497 C 2011-02-03 1996-07-31 Protein involved in resistance to nitrosoguanidine and 6-azauracil; expression is regulated by transcription factors involved in multidrug resistance; SNG1 has a paralog, YJR015W, that arose from the whole genome duplication +S000029875 CDS YGR197C 7 894140 892497 C 2011-02-03 1996-07-31 +S000003430 ORF Verified YGR198W YPP1 chromosome 7 7 894693 897146 W 2011-02-03 1996-07-31 Cargo-transport protein involved in endocytosis; interacts with phosphatidylinositol-4-kinase Stt4p; is required, along with Efr3p, for the assembly and recruitment of multiple copies of the kinase into phosphoinositide kinase (PIK) patches at the plasma membrane; positively regulates Stt4p; GFP-fusion protein localizes to the cytoplasm; YGR198W is an essential gene +S000030951 CDS YGR198W 7 894693 897146 W 2011-02-03 1996-07-31 +S000003431 ORF Verified YGR199W PMT6 dolichyl-phosphate-mannose-protein mannosyltransferase PMT6 chromosome 7 L000004009|L000004020 7 897502 899781 W 2011-02-03 1996-07-31 Protein O-mannosyltransferase; transfers mannose from dolichyl phosphate-D-mannose to protein serine/threonine residues of secretory proteins; reaction is essential for cell wall rigidity; member of a family of mannosyltransferases +S000031053 CDS YGR199W 7 897502 899781 W 2011-02-03 1996-07-31 +S000003432 ORF Verified YGR200C ELP2 Elongator subunit ELP2|KTI3|TOT2 chromosome 7 7 902270 899904 C 2011-02-03 1996-07-31 Subunit of Elongator complex; binds to microtubules via conserved alkaline residues; has two seven-bladed WD40 β propellers; Elongator complex is required for modification of wobble nucleosides in tRNA; target of Kluyveromyces lactis zymocin +S000036532 CDS YGR200C 7 902270 899904 C 2011-02-03 1996-07-31 +S000003433 ORF Uncharacterized YGR201C chromosome 7 7 903197 902520 C 2011-02-03 2003-09-22|1996-07-31 Putative protein of unknown function +S000036618 CDS YGR201C 7 903197 902520 C 2011-02-03 2003-09-22|1996-07-31 +S000003434 ORF Verified YGR202C PCT1 choline-phosphate cytidylyltransferase|CCT1|BSR2 chromosome 7 L000000240 7 904748 903474 C 2011-02-03 1996-07-31 Cholinephosphate cytidylyltransferase; a rate-determining enzyme of the CDP-choline pathway for phosphatidylcholine synthesis, inhibited by Sec14p, activated upon lipid-binding; contains an element within the regulatory domain involved in both silencing and activation of enzymatic activity +S000036716 CDS YGR202C 7 904748 903474 C 2011-02-03 1996-07-31 +S000003435 ORF Verified YGR203W YCH1 phosphatase YCH1 chromosome 7 7 905237 905683 W 2011-02-03 1996-07-31 Phosphatase with sequence similarity to Cdc25p; Arr2p and Mih1p; member of the single-domain rhodanese homology superfamily; green fluorescent protein (GFP)-fusion protein localizes to both the cytoplasm and the nucleus +S000030650 CDS YGR203W 7 905237 905683 W 2011-02-03 1996-07-31 +S000003436 ORF Verified YGR204W ADE3 trifunctional formate-tetrahydrofolate ligase/methenyltetrahydrofolate cyclohydrolase/methylenetetrahydrofolate dehydrogenase ADE3 chromosome 7 L000000033 7 905934 908774 W 159 2011-02-03 1996-07-31 Cytoplasmic trifunctional enzyme C1-tetrahydrofolate synthase; involved in single carbon metabolism and required for biosynthesis of purines, thymidylate, methionine, and histidine; null mutation causes auxotrophy for adenine and histidine +S000030764 CDS YGR204W 7 905934 908774 W 2011-02-03 1996-07-31 +S000028640 ORF Uncharacterized YGR204C-A chromosome 7 7 909174 909061 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032416 CDS YGR204C-A 7 909174 909061 C 2011-02-03 2003-07-29 +S000003437 ORF Verified YGR205W TDA10 putative ATP-dependent kinase chromosome 7 7 909213 910085 W 2011-02-03 1996-07-31 ATP-binding protein of unknown function; crystal structure resembles that of E.coli pantothenate kinase and other small kinases; null mutant is sensitive to expression of the top1-T722A allele +S000030854 CDS YGR205W 7 909213 910085 W 2011-02-03 1996-07-31 +S000003438 ORF Verified YGR206W MVB12 ubiquitin-binding ESCRT-I subunit protein MVB12 chromosome 7 7 910432 910737 W 2011-02-03 1996-07-31 ESCRT-I subunit required to stabilize ESCRT-I core complex oligomers; the ESCRT-I core complex (Stp22p, Vps28p, Srn2p) is involved in ubiquitin-dependent sorting of proteins into the endosome; deletion mutant is sensitive to rapamycin and nystatin +S000031833 CDS YGR206W 7 910432 910737 W 2011-02-03 1996-07-31 +S000003439 ORF Verified YGR207C CIR1 chromosome 7 7 911628 910843 C 2011-02-03 1996-07-31 Mitochondrial protein that interacts with frataxin (Yfh1p); putative ortholog of mammalian electron transfer flavoprotein complex subunit ETF-beta; may have a role in oxidative stress response +S000031940 CDS YGR207C 7 911628 910843 C 2011-02-03 1996-07-31 +S000003440 ORF Verified YGR208W SER2 phosphoserine phosphatase chromosome 7 L000001866 7 911883 912812 W 168 2011-02-03 1996-07-31 Phosphoserine phosphatase of the phosphoglycerate pathway; involved in serine and glycine biosynthesis, expression is regulated by the available nitrogen source +S000032117 CDS YGR208W 7 911883 912812 W 2011-02-03 1996-07-31 +S000003441 ORF Verified YGR209C TRX2 thioredoxin TRX2|LMA1 chromosome 7 L000002358 7 913227 912913 C 161 2011-02-03 1996-07-31 Cytoplasmic thioredoxin isoenzyme; part of thioredoxin system which protects cells against oxidative and reductive stress; forms LMA1 complex with Pbi2p; acts as a cofactor for Tsa1p; required for ER-Golgi transport and vacuole inheritance; with Trx1p, facilitates mitochondrial import of small Tims Tim9p, Tim10p, Tim13p by maintaining them in reduced form; abundance increases under DNA replication stress; TRX2 has a paralog, TRX1, that arose from the whole genome duplication +S000032991 CDS YGR209C 7 913227 912913 C 2011-02-03 1996-07-31 +S000003442 ORF Uncharacterized YGR210C chromosome 7 7 914738 913503 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000032713 CDS YGR210C 7 914738 913503 C 2011-02-03 1996-07-31 +S000003443 ORF Verified YGR211W ZPR1 zinc finger-containing protein ZPR1 chromosome 7 L000004700 7 915241 916701 W 2011-02-03 1996-07-31 Essential protein with two zinc fingers; present in nucleus of growing cells, relocates to cytoplasm in starved cells via a process mediated by Cpr1p; binds translation elongation factor eEF-1 (Tef1p); relative distribution to nucleus increases upon DNA replication stress; human ZPR1 gene can complement yeast by allowing growth during down-regulation of yeast zpr1 +S000032885 CDS YGR211W 7 915241 916701 W 2011-02-03 1996-07-31 +S000003444 ORF Verified YGR212W SLI1 N-acetyltransferase chromosome 7 7 917040 918446 W 2011-02-03 1996-07-31 N-acetyltransferase; confers resistance to the sphingolipid biosynthesis inhibitor myriocin (ISP-1) by converting it into N-acetyl-myriocin, co-operates with Ypk1p in mediating resistance to myriocin +S000034830 CDS YGR212W 7 917040 918446 W 2011-02-03 1996-07-31 +S000003445 ORF Verified YGR213C RTA1 chromosome 7 L000003245 7 919465 918512 C 2011-02-03 1996-07-31 Protein involved in 7-aminocholesterol resistance; has seven potential membrane-spanning regions; expression is induced under both low-heme and low-oxygen conditions; member of the fungal lipid-translocating exporter (LTE) family of protein; RTA1 has a paralog, YLR046C, that arose from the whole genome duplication +S000034869 CDS YGR213C 7 919465 918512 C 2011-02-03 1996-07-31 +S000003446 ORF Verified YGR214W RPS0A uS2|ribosomal 40S subunit protein S0A|S2|S0A|YST1|NAB1A|NAB1 chromosome 7 L000001226|L000001225 7 920575 921788 W 2011-02-03 1996-07-31 Ribosomal 40S subunit protein S0A; required for maturation of 18S rRNA along with Rps0Bp; deletion of either RPS0 gene reduces growth rate, deletion of both genes is lethal; homologous to human ribosomal protein SA and bacterial S2; RPS0A has a paralog, RPS0B, that arose from the whole genome duplication; +S000035102 CDS YGR214W 7 920575 920664 W 2011-02-03 1996-07-31 +S000035103 CDS YGR214W 7 921120 921788 W 2011-02-03 1996-07-31 +S000035104 intron YGR214W 7 920665 921119 W 2011-02-03 1996-07-31 +S000003447 ORF Verified YGR215W RSM27 mitochondrial 37S ribosomal protein RSM27 chromosome 7 7 922175 922507 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000035176 CDS YGR215W 7 922175 922507 W 2011-02-03 1996-07-31 +S000003448 ORF Verified YGR216C GPI1 phosphatidylinositol N-acetylglucosaminyltransferase chromosome 7 L000000725 7 924462 922633 C 2011-02-03 1996-07-31 Membrane protein involved in the synthesis of GlcNAc-PI; N-acetylglucosaminyl phosphatidylinositol (GlcNAc-PI) is the first intermediate in the synthesis of glycosylphosphatidylinositol (GPI) anchors; human and mouse GPI1p are functional homologs +S000035248 CDS YGR216C 7 924462 922633 C 2011-02-03 1996-07-31 +S000003449 ORF Verified YGR217W CCH1 chromosome 7 L000003440 7 924696 930815 W 2011-02-03 1996-07-31 Voltage-gated high-affinity calcium channel; involved in calcium influx in response to some environmental stresses as well as exposure to mating pheromones; interacts and partially co-localizes with Mid1p; however, evidence suggests CCH1 is not required for Mid1p function +S000036194 CDS YGR217W 7 924696 930815 W 2011-02-03 1996-07-31 +S000006582 tRNA_gene tG(GCC)G2 chromosome 7 L000003840 7 931023 930953 C 2011-02-03 2000-05-19 Glycine tRNA (tRNA-Gly), predicted by tRNAscan-SE analysis +S000037457 noncoding_exon tG(GCC)G2 7 931023 930953 C 2011-02-03 2000-05-19 +S000006961 long_terminal_repeat YGRCtau3 chromosome 7 7 931540 931171 C 2011-02-03 2000-05-19 Ty4 LTR +S000006977 long_terminal_repeat YGRWdelta32 chromosome 7 7 931688 932019 W 2011-02-03 2000-05-19 Ty1 LTR +S000003450 ORF Verified YGR218W CRM1 exportin CRM1|XPO1|KAP124 chromosome 7 L000000420 7 932541 935795 W 2011-02-03 1996-07-31 Major karyopherin; involved in export of proteins, RNAs, and ribosomal subunits from the nucleus; exportin +S000029874 CDS YGR218W 7 932541 935795 W 2011-02-03 1996-07-31 +S000003451 ORF Dubious YGR219W chromosome 7 7 936035 936376 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MRPL9/YGR220C +S000031776 CDS YGR219W 7 936035 936376 W 2011-02-03 1996-07-31 +S000003452 ORF Verified YGR220C MRPL9 mitochondrial 54S ribosomal protein YmL9|YmL9 chromosome 7 L000001163|L000002525 7 936883 936074 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000036227 CDS YGR220C 7 936883 936074 C 2011-02-03 1996-07-31 +S000003453 ORF Verified YGR221C TOS2 chromosome 7 7 938992 937124 C 2011-02-03 1996-07-31|2011-02-03 Protein involved in localization of Cdc24p to the site of bud growth; may act as a membrane anchor; localizes to the bud neck and bud tip; potentially phosphorylated by Cdc28p; TOS2 has a paralog, SKG6, that arose from the whole genome duplication +S000036329 CDS YGR221C 7 938992 937124 C 2011-02-03 1996-07-31|2011-02-03 +S000006495 snRNA_gene snR7-L SNR7-L U5L|SNR7 chromosome 7 7 939672 939459 C 2011-02-03 2004-03-30 U5 spliceosomal RNA (U5 snRNA), long form; associated with spliceosome +S000033299 noncoding_exon snR7-L 7 939672 939459 C 2011-02-03 2004-03-30 +S000006496 snRNA_gene snR7-S SNR7-S U5S|SNR7 chromosome 7 7 939672 939494 C 2011-02-03 2004-04-01 U5 spliceosomal RNA (U5 snRNA), short form; derived from SNR7-L by 3' end processing; associated with spliceosome +S000033320 noncoding_exon snR7-S 7 939672 939494 C 2011-02-03 2004-04-01 +S000003454 ORF Verified YGR222W PET54 chromosome 7 L000001391 7 939923 940804 W 174 2011-02-03 1996-07-31 Mitochondrial inner membrane protein; binds to the 5' UTR of the COX3 mRNA to activate its translation together with Pet122p and Pet494p; also binds to the COX1 Group I intron AI5 beta to facilitate exon ligation during splicing +S000036470 CDS YGR222W 7 939923 940804 W 2011-02-03 1996-07-31 +S000003455 ORF Verified YGR223C HSV2 chromosome 7 7 942215 940869 C 2011-02-03 1996-07-31 Phosphatidylinositol 3,5-bisphosphate-binding protein; plays a role in micronucleophagy; belongs to the PROPPIN family of proteins; predicted to fold as a seven-bladed beta-propeller; displays punctate cytoplasmic localization +S000036479 CDS YGR223C 7 942215 940869 C 2011-02-03 1996-07-31 +S000003456 ORF Verified YGR224W AZR1 azole transporter chromosome 7 7 942806 944647 W 2011-02-03 1996-07-31 Plasma membrane transporter of the major facilitator superfamily; involved in resistance to azole drugs such as ketoconazole and fluconazole +S000037202 CDS YGR224W 7 942806 944647 W 2011-02-03 1996-07-31 +S000003457 ORF Verified YGR225W AMA1 SPO70 chromosome 7 L000004668 7 945145 947019 W 2011-02-03 2000-12-01|1996-07-31|2005-11-29 Activator of meiotic anaphase promoting complex (APC/C); Cdc20p family member; required for initiation of spore wall assembly; required for Clb1p degradation during meiosis; prevents premature assembly of the meiosis I spindle, required for DSB induced prophase I arrest +S000037306 CDS YGR225W 7 945145 946327 W 2011-02-03 2000-12-01|1996-07-31 +S000037307 CDS YGR225W 7 946421 947019 W 2011-02-03 2000-12-01|2005-11-29 +S000037308 intron YGR225W 7 946328 946420 W 2011-02-03 2000-12-01 +S000003458 ORF Dubious YGR226C chromosome 7 7 947001 946792 C 2011-02-03 1996-07-31|2005-11-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; overlaps significantly with a verified ORF, AMA1/YGR225W +S000037323 CDS YGR226C 7 947001 946792 C 2011-02-03 1996-07-31|2005-11-29 +S000003459 ORF Verified YGR227W DIE2 dolichyl-P-Glc:Glc(2)Man(9)GlcNAc(2)-PP-dolichol alpha-1,2- glucosyltransferase|ALG10 chromosome 7 L000002802 7 947420 948997 W 2011-02-03 1996-07-31|2011-02-03 Dolichyl-phosphoglucose-dependent alpha-1,2-glucosyltransferase; located in the ER; functions in pathway that synthesizes the dolichol-linked oligosaccharide precursor for N-linked protein glycosylation; has a role in regulation of ITR1 and INO1; human homolog ALG10B can complement yeast die2 null mutant +S000029996 CDS YGR227W 7 947420 948997 W 2011-02-03 1996-07-31|2011-02-03 +S000003460 ORF Dubious YGR228W chromosome 7 7 949365 949709 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF SMI1/YGR229C +S000030071 CDS YGR228W 7 949365 949709 W 2011-02-03 1996-07-31 +S000003461 ORF Verified YGR229C SMI1 KNR4 chromosome 7 L000000909 7 950899 949382 C 2011-02-03 1996-07-31 Protein involved in the regulation of cell wall synthesis; proposed to be involved in coordinating cell cycle progression with cell wall integrity +S000030134 CDS YGR229C 7 950899 949382 C 2011-02-03 1996-07-31 +S000003462 ORF Verified YGR230W BNS1 chromosome 7 L000004859 7 951894 952307 W 2011-02-03 1996-07-31 Protein of unknown function; overexpression bypasses need for Spo12p, but not required for meiosis; BNS1 has a paralog, SPO12, that arose from the whole genome duplication +S000032548 CDS YGR230W 7 951894 952307 W 2011-02-03 1996-07-31 +S000003463 ORF Verified YGR231C PHB2 prohibitin subunit PHB2 chromosome 7 L000004019 7 953480 952548 C 2011-02-03 2004-07-15|1996-07-31 Subunit of the prohibitin complex (Phb1p-Phb2p); prohibitin is a 1.2 MDa ring-shaped inner mitochondrial membrane chaperone that stabilizes newly synthesized proteins; determinant of replicative life span; involved in mitochondrial segregation; prohibitin deficiency induces a mitochondrial unfolded protein response (mtUPR) +S000032579 CDS YGR231C 7 953480 952548 C 2011-02-03 2004-07-15|1996-07-31 +S000003464 ORF Verified YGR232W NAS6 chromosome 7 7 953960 954646 W 2011-02-03 1996-07-31 Evolutionarily conserved 19S regulatory particle assembly-chaperone; proteasome-interacting protein involved in the assembly of the base subcomplex of the 19S proteasomal regulatory particle (RP); ortholog of human oncoprotein gankyrin, also known as p28, which interacts with the Rb tumor suppressor and CDK4/6 +S000033340 CDS YGR232W 7 953960 954646 W 2011-02-03 1996-07-31 +S000003465 ORF Verified YGR233C PHO81 VAC6|phoS chromosome 7 L000001427|S000029634|L000004050 7 958210 954674 C 2011-02-03 1996-07-31 Cyclin-dependent kinase (CDK) inhibitor; regulates Pho80p-Pho85p and Pcl7p-Pho85p cyclin-CDK complexes in response to phosphate levels; inhibitory activity for Pho80p-Pho85p requires myo-D-inositol heptakisphosphate (IP7) generated by Vip1p; relative distribution to the nucleus increases upon DNA replication stress +S000033365 CDS YGR233C 7 958210 954674 C 2011-02-03 1996-07-31 +S000003466 ORF Verified YGR234W YHB1 flavohemoglobin|YHB4 chromosome 7 L000002510 7 959904 961103 W 2011-02-03 1996-07-31 Nitric oxide oxidoreductase; flavohemoglobin that plays role in oxidative and nitrosative stress responses; protects against nitration of cellular targets and against cell growth inhibition under aerobic or anaerobic conditions; yeast flavohemoglobin Yhb1p and human homolog neuroglobin NGB protect cells against alpha-synuclein cytotoxicity and aggregate formation; protein increases in abundance, relocalizes from nucleus to cytoplasmic foci upon DNA replication stress +S000033479 CDS YGR234W 7 959904 961103 W 2011-02-03 1996-07-31 +S000003467 ORF Verified YGR235C MIC26 MOS2|MCS29|MIO27 chromosome 7 7 962061 961360 C 2011-02-03 1996-07-31 Component of the MICOS complex; MICOS (formerly MINOS or MitOS) is a mitochondrial inner membrane complex that extends into the intermembrane space and has a role in the maintenance of crista junctions, inner membrane architecture, and formation of contact sites to the outer membrane; Mic26p is a non-essential component of the complex +S000033513 CDS YGR235C 7 962061 961360 C 2011-02-03 1996-07-31 +S000003468 ORF Verified YGR236C SPG1 chromosome 7 7 962817 962530 C 2011-02-03 1996-07-31|2005-11-22 Protein required for high temperature survival during stationary phase; not required for growth on nonfermentable carbon sources; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000033575 CDS YGR236C 7 962817 962530 C 2011-02-03 1996-07-31|2005-11-22 +S000003469 ORF Uncharacterized YGR237C chromosome 7 7 965655 963298 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000034450 CDS YGR237C 7 965655 963298 C 2011-02-03 1996-07-31 +S000003470 ORF Verified YGR238C KEL2 chromosome 7 L000003593 7 968687 966039 C 2011-02-03 1996-07-31 Protein that negatively regulates mitotic exit; forms a complex with Kel1p and Bud14p that regulates Bnr1p (formin) to affect actin cable assembly, cytokinesis, and polarized growth; functions in a complex with Kel1p, interacts with Tem1p and Lte1p; localizes to regions of polarized growth; potential Cdc28p substrate +S000034584 CDS YGR238C 7 968687 966039 C 2011-02-03 1996-07-31 +S000003471 ORF Verified YGR239C PEX21 chromosome 7 L000004797 7 970053 969187 C 2011-02-03 1996-07-31 Peroxin required for peroxisomal matrix protein targeting; acts on proteins containing the PTS2 targeting sequence; interacts with Pex7p; constitutively expressed; partially redundant with Pex18p; required for import of the Gpd1p-Pnc1p heterodimer in which only Gpd1p has a peroxisomal targeting signal; relative distribution to cytoplasmic foci increases upon DNA replication stress +S000034676 CDS YGR239C 7 970053 969187 C 2011-02-03 1996-07-31 +S000003472 ORF Verified YGR240C PFK1 6-phosphofructokinase subunit alpha chromosome 7 L000001404 7 973734 970771 C 184 2011-02-03 1996-07-31 Alpha subunit of heterooctameric phosphofructokinase; involved in glycolysis, indispensable for anaerobic growth, activated by fructose-2,6-bisphosphate and AMP, mutation inhibits glucose induction of cell cycle-related genes +S000036620 CDS YGR240C 7 973734 970771 C 2011-02-03 1996-07-31 +S000028551 ORF Uncharacterized YGR240C-A chromosome 7 7 974777 974577 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031237 CDS YGR240C-A 7 974777 974577 C 2011-02-03 2003-07-29 +S000003474 ORF Dubious YGR242W chromosome 7 7 976415 976723 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF YAP1802/YGR241C +S000036776 CDS YGR242W 7 976415 976723 W 2011-02-03 1996-07-31 +S000003473 ORF Verified YGR241C YAP1802 chromosome 7 L000004199 7 976581 974875 C 2011-02-03 1996-07-31 Protein of the AP180 family, involved in clathrin cage assembly; binds Pan1p and clathrin; YAP1802 has a paralog, YAP1801, that arose from the whole genome duplication +S000036696 CDS YGR241C 7 976581 974875 C 2011-02-03 1996-07-31 +S000003475 ORF Verified YGR243W MPC3 mitochondrial pyruvate carrier|FMP43 chromosome 7 7 977336 977776 W 2011-02-03 1996-07-31 Highly conserved subunit of the mitochondrial pyruvate carrier (MPC); expressed during growth on nonfermentable carbon sources, and heterodimerizes with Mpc1p to form the respiratory isoform of MPC; MPC localizes to the mitochondrial inner membrane and mediates pyruvate uptake; MPC3 paralog, MPC2, heterodimerizes with Mpc1p to form the fermentative MPC isoform; protein abundance increases in response to DNA replication stress +S000036844 CDS YGR243W 7 977336 977776 W 2011-02-03 1996-07-31 +S000118467 ARS ARS733 ARSVII-978 chromosome 7 7 977728 977976 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000119031 ARS_consensus_sequence ARS733 7 977905 977891 C 2011-02-03 2006-10-03 +S000003476 ORF Verified YGR244C LSC2 succinate--CoA ligase (GDP-forming) subunit beta chromosome 7 L000004592 7 979319 978036 C 2011-02-03 1996-07-31 Beta subunit of succinyl-CoA ligase; succinyl-CoA ligase is a mitochondrial enzyme of the TCA cycle that catalyzes the nucleotide-dependent conversion of succinyl-CoA to succinate +S000036869 CDS YGR244C 7 979319 978036 C 2011-02-03 1996-07-31 +S000003477 ORF Verified YGR245C SDA1 chromosome 7 7 982068 979765 C 2011-02-03 1996-07-31 Protein required for actin organization and passage through Start; highly conserved nuclear protein; required for actin cytoskeleton organization; plays a critical role in G1 events; binds Nap1p; involved in 60S ribosome biogenesis +S000037596 CDS YGR245C 7 982068 979765 C 2011-02-03 1996-07-31 +S000003478 ORF Verified YGR246C BRF1 transcription factor TFIIIB subunit BRF1|TFIIIB70|TDS4|PCF4 chromosome 7 L000000193 7 984272 982482 C 2011-02-03 1996-07-31 TFIIIB B-related factor; one of three subunits of RNA polymerase III transcription initiation factor TFIIIB, binds TFIIIC and TBP and recruits RNA pol III to promoters, amino-terminal half is homologous to TFIIB; mutations in human homolog are associated with autosomal recessive cerebellar-facial-dental syndrome +S000037668 CDS YGR246C 7 984272 982482 C 2011-02-03 1996-07-31 +S000003479 ORF Verified YGR247W CPD1 2',3'-cyclic-nucleotide 3'-phosphodiesterase chromosome 7 7 984966 985685 W 2011-02-03 1996-07-31 Cyclic nucleotide phosphodiesterase; hydrolyzes ADP-ribose 1'', 2''-cyclic phosphate to ADP-ribose 1''-phosphate; may have a role in tRNA splicing; no detectable phenotype is conferred by null mutation or by overexpression; protein abundance increases in response to DNA replication stress +S000037753 CDS YGR247W 7 984966 985685 W 2011-02-03 1996-07-31 +S000003480 ORF Verified YGR248W SOL4 6-phosphogluconolactonase SOL4 chromosome 7 L000003365 7 985972 986739 W 2011-02-03 1996-07-31 6-phosphogluconolactonase; protein abundance increases in response to DNA replication stress; SOL4 has a paralog, SOL3, that arose from the whole genome duplication +S000030588 CDS YGR248W 7 985972 986739 W 2011-02-03 1996-07-31 +S000003481 ORF Verified YGR249W MGA1 chromosome 7 L000001100 7 988049 989419 W 2011-02-03 1996-07-31 Protein similar to heat shock transcription factor; multicopy suppressor of pseudohyphal growth defects of ammonium permease mutants +S000030700 CDS YGR249W 7 988049 989419 W 2011-02-03 1996-07-31 +S000003482 ORF Verified YGR250C RIE1 chromosome 7 7 993521 991176 C 2011-02-03 1996-07-31 Putative RNA binding protein; localizes to stress granules induced by glucose deprivation; interacts with Rbg1p in a two-hybrid assay; protein abundance increases in response to DNA replication stress +S000031515 CDS YGR250C 7 993521 991176 C 2011-02-03 1996-07-31 +S000003483 ORF Verified YGR251W NOP19 DHI1 chromosome 7 7 995639 996229 W 2011-02-03 1996-07-31 Ribosome biogenesis factor; nucleolar protein associated with pre-rRNA components of the 90S preribosome, required for cleavage of pre-rRNA at A0, A1 and A2 sites; interacts with RNA helicase Dhr2p and RNA helicase-like protein Utp25p; required for incorporation of Utp25p into preribosomes +S000031667 CDS YGR251W 7 995639 996229 W 2011-02-03 1996-07-31 +S000003484 ORF Verified YGR252W GCN5 histone acetyltransferase GCN5|AAS104|KAT2|SWI9|ADA4 chromosome 7 L000000684 7 996869 998188 W 2011-02-03 1996-07-31 Catalytic subunit of ADA and SAGA histone acetyltransferase complexes; modifies N-terminal lysines on histones H2B and H3; acetylates Rsc4p, a subunit of the RSC chromatin-remodeling complex, altering replication stress tolerance; relocalizes to the cytosol in response to hypoxia; mutant displays reduced transcription elongation in the G-less-based run-on (GLRO) assay; greater involvement in repression of RNAPII-dependent transcription than in activation +S000031757 CDS YGR252W 7 996869 998188 W 2011-02-03 1996-07-31 +S000003485 ORF Verified YGR253C PUP2 proteasome core particle subunit alpha 5|DOA5 chromosome 7 L000001531 7 999140 998358 C 2011-02-03 1996-07-31 Alpha 5 subunit of the 20S proteasome; involved in ubiquitin-dependent catabolism; human homolog is subunit zeta +S000031854 CDS YGR253C 7 999140 998358 C 2011-02-03 1996-07-31 +S000118468 ARS ARS734 ARSVII-999 chromosome 7 7 999456 999576 2014-11-18 2014-11-18|2006-08-30|2011-02-03 Autonomously Replicating Sequence +S000178104 ARS_consensus_sequence ARS734 7 999504 999520 W 2014-11-18 2014-11-18 +S000003486 ORF Verified YGR254W ENO1 phosphopyruvate hydratase ENO1|HSP48 chromosome 7 L000000559 7 1000927 1002240 W 2011-02-03 1996-07-31 Enolase I, a phosphopyruvate hydratase; catalyzes conversion of 2-phosphoglycerate to phosphoenolpyruvate during glycolysis and the reverse reaction during gluconeogenesis; expression repressed in response to glucose; protein abundance increases in response to DNA replication stress; N-terminally propionylated in vivo; ENO1 has a paralog, ENO2, that arose from the whole genome duplication +S000032820 CDS YGR254W 7 1000927 1002240 W 2011-02-03 1996-07-31 +S000130168 ARS ARS735 chromosome 7 7 1002239 1002522 2011-02-03 2009-05-07 Replication origin; identified in multiple array studies, confirmed by plasmid-based recombinational ARS assay +S000003487 ORF Verified YGR255C COQ6 putative N,N-dimethylaniline monooxygenase COQ6 chromosome 7 L000003876 7 1003962 1002523 C 2011-02-03 1996-07-31 Flavin-dependent monooxygenase involved in ubiquinone biosynthesis; responsible for hydroxylation at position C5 and deamination at C4 during ubiquinone (Coenzyme Q) biosynthesis; localizes to matrix face of mitochondrial inner membrane in a large complex with other ubiquinone biosynthetic enzymes; human homolog COQ6 can complement yeast null mutant and is implicated in steroid-resistant nephrotic syndrome (SRNS) +S000032856 CDS YGR255C 7 1003962 1002523 C 2011-02-03 1996-07-31 +S000006750 tRNA_gene tT(UGU)G2 chromosome 7 L000003839 7 1004216 1004287 W 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000030915 noncoding_exon tT(UGU)G2 7 1004216 1004287 W 2011-02-03 2000-05-19 +S000003488 ORF Verified YGR256W GND2 phosphogluconate dehydrogenase (decarboxylating) GND2 chromosome 7 L000003352 7 1004624 1006102 W 2011-02-03 1996-07-31 6-phosphogluconate dehydrogenase (decarboxylating); catalyzes an NADPH regenerating reaction in the pentose phosphate pathway; required for growth on D-glucono-delta-lactone; GND2 has a paralog, GND1, that arose from the whole genome duplication +S000033003 CDS YGR256W 7 1004624 1006102 W 2011-02-03 1996-07-31 +S000003489 ORF Verified YGR257C MTM1 chromosome 7 7 1007305 1006205 C 2011-02-03 1996-07-31 Mitochondrial protein of the mitochondrial carrier family; high affinity pyridoxal 5'-phosphate (PLP) transporter, important for delivery of PLP cofactor to mitochondrial enzymes; involved in mitochondrial iron homeostasis and in activating mitochondrial Sod2p by facilitating insertion of an essential manganese cofactor +S000033036 CDS YGR257C 7 1007305 1006205 C 2011-02-03 1996-07-31 +S000003490 ORF Verified YGR258C RAD2 ssDNA endodeoxyribonuclease RAD2 chromosome 7 L000001556 7 1010766 1007671 C 192 2011-02-03 1996-07-31 Single-stranded DNA endonuclease; cleaves single-stranded DNA during nucleotide excision repair to excise damaged DNA; subunit of Nucleotide Excision Repair Factor 3 (NEF3); homolog of human XPG protein +S000033688 CDS YGR258C 7 1010766 1007671 C 2011-02-03 1996-07-31 +S000077075 matrix_attachment_site ETC4 ETC4 chromosome 7 7 1010927 1010949 W 2014-11-18 2014-11-18 Chromosome-organizing-clamp; tethers chromosomal regions to the nuclear periphery; binds TFIIIC transcription factor but does not recruit RNA Polymerase III; can act as a transcription-blocking insulator or as a heterochromatin barrier element; remains predominantly localized to the nuclear periphery throughout cell cycle; located between divergently transcribed genes RAD2 and TNA1 +S000003492 ORF Verified YGR260W TNA1 chromosome 7 7 1012485 1014089 W 2011-02-03 1996-07-31 High affinity nicotinic acid plasma membrane permease; responsible for uptake of low levels of nicotinic acid; expression of the gene increases in the absence of extracellular nicotinic acid or para-aminobenzoate (PABA) +S000034815 CDS YGR260W 7 1012485 1014089 W 2011-02-03 1996-07-31 +S000003491 ORF Dubious YGR259C chromosome 7 7 1012921 1012481 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps almost completely with the verified ORF TNA1/YGR260W +S000033805 CDS YGR259C 7 1012921 1012481 C 2011-02-03 1996-07-31 +S000003493 ORF Verified YGR261C APL6 YKS5 chromosome 7 L000003034 7 1016750 1014321 C 2011-02-03 1996-07-31 Beta3-like subunit of the yeast AP-3 complex; functions in transport of alkaline phosphatase to the vacuole via the alternate pathway; exists in both cytosolic and peripherally associated membrane-bound pools +S000034880 CDS YGR261C 7 1016750 1014321 C 2011-02-03 1996-07-31 +S000003494 ORF Verified YGR262C BUD32 serine/threonine protein kinase BUD32|LDB14 chromosome 7 7 1017759 1016974 C 2011-02-03 1996-07-31 Protein kinase; component of the EKC/KEOPS complex with Kae1p, Cgi121p, Pcc1p, and Gon7p; Pyrococcus Bud32 ortholog functions as a P-loop ATPase rather than a protein kinase in the context of the complex; EKC/KEOPS complex is required for t6A tRNA modification and telomeric TG1-3 recombination; may have role in transcription; mutation is functionally complemented by human TP53RK +S000034994 CDS YGR262C 7 1017759 1016974 C 2011-02-03 1996-07-31 +S000003495 ORF Verified YGR263C SAY1 steryl deacetylase chromosome 7 7 1019241 1017967 C 2011-02-03 1996-07-31 Sterol deacetylase; component of the sterol acetylation/deacetylation cycle along with Atf2p; active both in the endoplasmic reticulum (ER) and in lipid droplets; integral membrane protein with active site in the ER lumen; green fluorescent protein (GFP)-fusion protein localizes to the ER +S000035935 CDS YGR263C 7 1019241 1017967 C 2011-02-03 1996-07-31 +S000003497 ORF Dubious YGR265W chromosome 7 7 1021648 1022058 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF MES1/YGR264C, which encodes methionyl-tRNA synthetase +S000036929 CDS YGR265W 7 1021648 1022058 W 2011-02-03 1996-07-31 +S000003496 ORF Verified YGR264C MES1 methionine--tRNA ligase MES1|MetRS|MESI chromosome 7 L000001075 7 1021853 1019598 C 204 2011-02-03 1996-07-31 Methionyl-tRNA synthetase; forms a complex with glutamyl-tRNA synthetase (Gus1p) and Arc1p, which increases the catalytic efficiency of both tRNA synthetases; also has a role in nuclear export of tRNAs; mutations in human ortholog MARS are associated with pediatric pulmonary alveolar proteinosis +S000036088 CDS YGR264C 7 1021853 1019598 C 2011-02-03 1996-07-31 +S000003498 ORF Verified YGR266W chromosome 7 7 1022656 1024761 W 2011-02-03 1996-07-31 Protein of unknown function; predicted to contain a single transmembrane domain; mutant has increased aneuploidy tolerance; localized to both the mitochondrial outer membrane and the plasma membrane; protein abundance increases in response to DNA replication stress +S000036991 CDS YGR266W 7 1022656 1024761 W 2011-02-03 1996-07-31 +S000003499 ORF Verified YGR267C FOL2 GTP cyclohydrolase I chromosome 7 L000000621 7 1025735 1025004 C 215 2011-02-03 1996-07-31 GTP-cyclohydrolase I, catalyzes first step in folic acid biosynthesis; human homolog GCH1 is implicated in dopa-responsive dystonia (DRD), and can complement yeast null mutant +S000037019 CDS YGR267C 7 1025735 1025004 C 2011-02-03 1996-07-31 +S000003501 ORF Dubious YGR269W chromosome 7 7 1026636 1026962 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF HUA1/YGR268C +S000029827 CDS YGR269W 7 1026636 1026962 W 2011-02-03 1996-07-31 +S000003500 ORF Verified YGR268C HUA1 chromosome 7 7 1026653 1026057 C 2011-02-03 1996-07-31 Cytoplasmic protein containing a zinc finger domain; sequence similarity to that of Type I J-proteins; computational analysis of large-scale protein-protein interaction data suggests a possible role in actin patch assembly +S000037084 CDS YGR268C 7 1026653 1026057 C 2011-02-03 1996-07-31 +S000003502 ORF Verified YGR270W YTA7 chromosome 7 L000002561 7 1027370 1031509 W 2011-02-03 1996-07-31 Protein that localizes to chromatin; has a role in regulation of histone gene expression; has a bromodomain-like region that interacts with the N-terminal tail of histone H3, and an ATPase domain; relocalizes to the cytosol in response to hypoxia; potentially phosphorylated by Cdc28p +S000030911 CDS YGR270W 7 1027370 1031509 W 2011-02-03 1996-07-31 +S000028641 ORF Dubious YGR270C-A chromosome 7 7 1027600 1027382 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the verified ORF YTA7/YGR270W +S000032417 CDS YGR270C-A 7 1027600 1027382 C 2011-02-03 2003-07-29 +S000003503 ORF Verified YGR271W SLH1 putative RNA helicase chromosome 7 7 1031791 1037694 W 2011-02-03 1996-07-31|2011-02-03 Putative RNA helicase related to Ski2p; involved in translation inhibition of non-poly(A) mRNAs; required for repressing propagation of dsRNA viruses +S000030983 CDS YGR271W 7 1031791 1037694 W 2011-02-03 1996-07-31|2011-02-03 +S000007608 ORF Verified YGR271C-A EFG1 YGR272C chromosome 7 7 1038501 1037800 C 2011-02-03 2001-02-26|2007-12-11 Essential protein required for maturation of 18S rRNA; null mutant is sensitive to hydroxyurea and is delayed in recovering from alpha-factor arrest; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus +S000037185 CDS YGR271C-A 7 1038501 1037800 C 2011-02-03 2001-02-26|2007-12-11 +S000003505 ORF Uncharacterized YGR273C IBI1 chromosome 7 7 1039239 1038715 C 2011-02-03 1996-07-31 Putative protein of unknown function; expression downregulated by treatment with 8-methoxypsoralen plus UVA irradiation; not an essential gene; YGR273C has a paralog, YMR295C, that arose from the whole genome duplication +S000031075 CDS YGR273C 7 1039239 1038715 C 2011-02-03 1996-07-31 +S000003506 ORF Verified YGR274C TAF1 KAT4|TafII145|TafII130|TAF145|TAF130 chromosome 7 L000002748 7 1043095 1039895 C 2011-02-03 1996-07-31|2011-02-03 TFIID subunit, involved in RNA pol II transcription initiation; possesses in vitro histone acetyltransferase activity but its role in vivo appears to be minor; involved in promoter binding and G1/S progression; relocalizes to the cytosol in response to hypoxia +S000032074 CDS YGR274C 7 1043095 1039895 C 2011-02-03 1996-07-31|2011-02-03 +S000003507 ORF Verified YGR275W RTT102 chromosome 7 L000004851 7 1043276 1043749 W 2011-02-03 2003-09-22|1996-07-31 Component of both the SWI/SNF and RSC chromatin remodeling complexes; suggested role in chromosome maintenance; possible weak regulator of Ty1 transposition; protein abundance increases in response to DNA replication stress +S000032191 CDS YGR275W 7 1043276 1043749 W 2011-02-03 2003-09-22|1996-07-31 +S000003508 ORF Verified YGR276C RNH70 RNA82|REX1 chromosome 7 L000004048 7 1045480 1043819 C 2011-02-03 1996-07-31 3'-5' exoribonuclease; required for maturation of 3' ends of 5S rRNA and tRNA-Arg3 from dicistronic transcripts +S000032221 CDS YGR276C 7 1045480 1043819 C 2011-02-03 1996-07-31 +S000003509 ORF Verified YGR277C CAB4 putative pantetheine-phosphate adenylyltransferase chromosome 7 7 1046561 1045644 C 2011-02-03 1996-07-31 Subunit of the CoA-Synthesizing Protein Complex (CoA-SPC); subunits of this complex are: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p; probable pantetheine-phosphate adenylyltransferase (PPAT); PPAT catalyzes the fourth step in the biosynthesis of coenzyme A from pantothenate; null mutant lethality is complemented by E. coli coaD (encoding PPAT) and by human COASY +S000032280 CDS YGR277C 7 1046561 1045644 C 2011-02-03 1996-07-31 +S000003510 ORF Verified YGR278W CWC22 U2-type spliceosomal complex subunit CWC22 chromosome 7 7 1046731 1048464 W 2011-02-03 1996-07-31 Spliceosome-associated protein that is required for pre-mRNA splicing; necessary for Prp2p function at the first catalytic step of splicing; has similarity to S. pombe Cwf22p; CWC22 is an essential protein +S000033193 CDS YGR278W 7 1046731 1048464 W 2011-02-03 1996-07-31 +S000003511 ORF Verified YGR279C SCW4 putative family 17 glucosidase chromosome 7 L000004565 7 1049958 1048798 C 2011-02-03 1996-07-31 Cell wall protein with similarity to glucanases; scw4 scw10 double mutants exhibit defects in mating; SCW4 has a paralog, SCW10, that arose from the whole genome duplication +S000033219 CDS YGR279C 7 1049958 1048798 C 2011-02-03 1996-07-31 +S000003512 ORF Verified YGR280C PXR1 telomerase inhibitor|PinX1|GNO1 chromosome 7 S000007659 7 1051725 1050910 C 2011-02-03 1996-07-31 Essential protein involved in rRNA and snoRNA maturation; competes with TLC1 RNA for binding to Est2p, suggesting a role in negative regulation of telomerase; human homolog inhibits telomerase; contains a G-patch RNA interacting domain +S000035203 CDS YGR280C 7 1051725 1050910 C 2011-02-03 1996-07-31 +S000003513 ORF Verified YGR281W YOR1 ATP-binding cassette transporter YOR1|YRS1 chromosome 7 L000003083 7 1052824 1057257 W 2011-02-03 1996-07-31 Plasma membrane ATP-binding cassette (ABC) transporter; multidrug transporter mediates export of many different organic anions including oligomycin; homolog of human cystic fibrosis transmembrane receptor (CFTR) +S000035335 CDS YGR281W 7 1052824 1057257 W 2011-02-03 1996-07-31 +S000003514 ORF Verified YGR282C BGL2 glucan 1,3-beta-glucosidase|SCW9 chromosome 7 L000000175|S000029440|L000004570 7 1058724 1057783 C 2011-02-03 1996-07-31 Endo-beta-1,3-glucanase; major protein of the cell wall, involved in cell wall maintenance; involved in incorporation of newly synthesized mannoprotein molecules into the cell wall +S000035378 CDS YGR282C 7 1058724 1057783 C 2011-02-03 1996-07-31 +S000003515 ORF Verified YGR283C putative methyltransferase chromosome 7 7 1060040 1059015 C 2011-02-03 1996-07-31 Putative methyltransferase; may interact with ribosomes, based on co-purification experiments; predicted to be involved in ribosome biogenesis; null mutant is resistant to fluconazole; GFP-fusion protein localizes to the nucleolus; YGR283C has a paralog, YMR310C, that arose from the whole genome duplication +S000035443 CDS YGR283C 7 1060040 1059015 C 2011-02-03 1996-07-31 +S000003516 ORF Verified YGR284C ERV29 chromosome 7 7 1061590 1060658 C 2011-02-03 1996-07-31 Protein localized to COPII-coated vesicles; involved in vesicle formation and incorporation of specific secretory cargo; protein abundance increases in response to DNA replication stress +S000036349 CDS YGR284C 7 1061590 1060658 C 2011-02-03 1996-07-31 +S000003517 ORF Verified YGR285C ZUO1 zuotin chromosome 7 L000002571 7 1063153 1061852 C 2011-02-03 1996-07-31 Ribosome-associated chaperone; zuotin functions in ribosome biogenesis and as a chaperone for nascent polypeptide chains in partnership with Ssz1p and SSb1/2; contains a DnaJ domain and functions as a J-protein partner for Ssb1p and Ssb2p; human gene DNAJC2 can partially complement yeast zuo1 null mutant +S000036447 CDS YGR285C 7 1063153 1061852 C 2011-02-03 1996-07-31 +S000003518 ORF Verified YGR286C BIO2 biotin synthase chromosome 7 L000000181 7 1064940 1063813 C 2011-02-03 1996-07-31 Biotin synthase; catalyzes the conversion of dethiobiotin to biotin, which is the last step of the biotin biosynthesis pathway; complements E. coli bioB mutant +S000036536 CDS YGR286C 7 1064940 1063813 C 2011-02-03 1996-07-31 +S000003519 ORF Verified YGR287C IMA1 oligo-1,6-glucosidase IMA1 chromosome 7 7 1068991 1067222 C 2011-02-03 1996-07-31 Major isomaltase (alpha-1,6-glucosidase/alpha-methylglucosidase); required for isomaltose utilization; preferred specificity for isomaltose, alpha-methylglucoside, and palatinose, but also exhibits alpha-1,2 glucosidase activity on sucrose and kojibiose, and can cleave the 1,3-alpha linkage of nigerose and turanose and the alpha-1,5 linkage of leucrose in vitro; member of the IMA isomaltase family +S000036609 CDS YGR287C 7 1068991 1067222 C 2011-02-03 1996-07-31 +S000003520 ORF Verified YGR288W MAL13 transcription factor MAL13|MALR chromosome 7 L000001010 7 1070293 1071714 W 2011-02-03 1996-07-31 MAL-activator protein; part of complex locus MAL1; nonfunctional in genomic reference strain S288C +S000037379 CDS YGR288W 7 1070293 1071714 W 2011-02-03 1996-07-31 +S000003522 ORF Dubious YGR290W chromosome 7 7 1075482 1075925 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; putative HLH protein; partially overlaps the verified ORF MAL11/YGR289C (a high-affinity maltose transporter) +S000030534 CDS YGR290W 7 1075482 1075925 W 2011-02-03 1996-07-31 +S000003521 ORF Verified YGR289C MAL11 alpha-glucoside permease|MALT|AGT1 chromosome 7 L000002978 7 1075813 1073963 C 2011-02-03 1996-07-31 High-affinity maltose transporter (alpha-glucoside transporter); inducible; encoded in the MAL1 complex locus; broad substrate specificity that includes maltotriose; required for isomaltose utilization +S000037432 CDS YGR289C 7 1075813 1073963 C 2011-02-03 1996-07-31 +S000003523 ORF Dubious YGR291C chromosome 7 7 1076504 1076283 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030599 CDS YGR291C 7 1076504 1076283 C 2011-02-03 1996-07-31 +S000003524 ORF Verified YGR292W MAL12 alpha-glucosidase MAL12|MALS chromosome 7 L000001009 7 1076599 1078353 W 226 2011-02-03 1996-07-31 Maltase (alpha-D-glucosidase); inducible protein involved in maltose catabolism; encoded in the MAL1 complex locus; hydrolyzes the disaccharides maltose, turanose, maltotriose, and sucrose +S000030723 CDS YGR292W 7 1076599 1078353 W 2011-02-03 1996-07-31 +S000003526 ORF Verified YGR294W PAU12 seripauperin PAU12 chromosome 7 7 1080306 1080668 W 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP fusion protein localizes to both the endoplasmic reticulum and vacuole +S000031646 CDS YGR294W 7 1080306 1080668 W 2011-02-03 1996-07-31 +S000003525 ORF Dubious YGR293C chromosome 7 7 1080346 1079885 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YGR294W +S000030754 CDS YGR293C 7 1080346 1079885 C 2011-02-03 1996-07-31 +S000003527 ORF Verified YGR295C COS6 chromosome 7 L000004064 7 1082729 1081584 C 2011-02-03 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000031677 CDS YGR295C 7 1082729 1081584 C 2011-02-03 1996-07-31 +S000028960 telomere TEL07R chromosome 7 7 1083635 1090940 W 231 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome VII; annotated components include an X element core sequence, X element combinatorial repeats, and a long Y' element; TEL07R does have telomeric repeats (TEL07R-TR), but they are missing from the genome annotation due to difficulties encountered during sequencing and/or assembly +S000028961 X_element TEL07R 7 1083635 1084092 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome VII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028962 X_element_combinatorial_repeat TEL07R 7 1084093 1084346 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr VII; contains repeats of the D, C, and B types; formerly called SubTelomeric Repeats +S000028963 Y_prime_element TEL07R 7 1084347 1090940 W 2011-02-03 2003-09-09 Telomeric long Y' element on the right arm of Chromosome VII; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YRF1-3/YGR296W, YGR296C-A, YGR296C-B) +S000130170 ARS ARS736 chromosome 7 7 1083795 1084863 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000003528 ORF Verified YGR296W YRF1-3 Y' element ATP-dependent helicase protein 1 copy 3|YRF1 chromosome 7 7 1084864 1090591 W 2011-02-03 1996-07-31 Helicase encoded by the Y' element of subtelomeric regions; highly expressed in the mutants lacking the telomerase component TLC1; potentially phosphorylated by Cdc28p +S000031882 CDS YGR296W 7 1084864 1084882 W 2011-02-03 1996-07-31 +S000031883 CDS YGR296W 7 1085031 1090591 W 2011-02-03 1996-07-31 +S000031884 intron YGR296W 7 1084883 1085030 W 2011-02-03 1996-07-31 +S000028642 ORF Dubious YGR296C-A chromosome 7 7 1089445 1088870 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps TEL07R +S000032418 CDS YGR296C-A 7 1089445 1088870 C 2011-02-03 2003-07-29 +S000028643 ORF Dubious YGR296C-B chromosome 7 7 1090228 1089746 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; contained completely within TEL07R +S000032419 CDS YGR296C-B 7 1090228 1089746 C 2011-02-03 2003-07-29 +S000028644 ORF Dubious YHL050W-A chromosome 8 8 811 1293 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032420 CDS YHL050W-A 8 811 1293 W 2003-07-29 2003-07-29 +S000001042 ORF Uncharacterized YHL050C chromosome 8 8 3311 445 C 2011-02-03 1996-07-31|2011-02-03 Putative protein of unknown function; potential Cdc28p substrate +S000030583 CDS YHL050C 8 1897 445 C 1996-07-31 1996-07-31 +S000030582 CDS YHL050C 8 3311 2671 C 2011-02-03 1996-07-31 +S000030584 intron YHL050C 8 2670 1898 C 2011-02-03 1996-07-31|2011-02-03 +S000001041 ORF Uncharacterized YHL049C chromosome 8 8 4541 3726 C 2011-02-03 1996-07-31 Putative protein of unknown function +S000031013 CDS YHL049C 8 4541 3726 C 2011-02-03 1996-07-31 +S000130145 ARS ARS801 chromosome 8 8 5471 6401 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028891 telomere TEL08L chromosome 8 8 5505 1 C -40 2011-02-03 2003-09-09|2011-02-03 Telomeric region on the left arm of Chromosome VIII; composed of an X element core sequence, an X element combinatorial repeat, a short Y' element, and a short terminal stretch of telomeric repeats +S000028892 telomeric_repeat TEL08L 8 34 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome VIII +S000028893 X_element TEL08L 8 5505 5052 C 2011-02-03 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome VIII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028894 X_element_combinatorial_repeat TEL08L 8 5051 4952 C 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr VIII; contains a D-type repeat; formerly called SubTelomeric Repeats +S000028895 Y_prime_element TEL08L 8 4951 35 C 2011-02-03 2003-09-09|2011-02-03 Telomeric short Y' element on the left arm of Chromosome VIII; contains an ARS consensus sequence, a region of 36-bp repeats, and three ORFs (YHL049C, YHL050C, YHL050W-A) +S000028829 ORF Uncharacterized YHL048C-A chromosome 8 8 5797 5663 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000033659 CDS YHL048C-A 8 5797 5663 C 2011-02-03 2003-07-29 +S000001040 ORF Verified YHL048W COS8 chromosome 8 L000004066 8 6401 7546 W 2011-02-03 1996-07-31 Endosomal protein involved in turnover of plasma membrane proteins; member of the DUP380 subfamily of conserved, often subtelomeric COS genes; required for the multivesicular vesicle body sorting pathway that internalizes plasma membrane proteins for degradation; Cos proteins provide ubiquitin in trans for nonubiquitinated cargo proteins +S000030997 CDS YHL048W 8 6401 7546 W 2011-02-03 1996-07-31 +S000118356 ARS ARS802 ARSVIII-8 chromosome 8 8 7702 7767 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178105 ARS_consensus_sequence ARS802 8 7755 7739 C 2014-11-18 2014-11-18 +S000006986 long_terminal_repeat YHLComega1 chromosome 8 8 8225 7994 C 2011-02-03 2000-05-19 Ty5 LTR +S000028775 ORF Dubious YHL046W-A chromosome 8 8 9981 10307 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF ARN2/YHL047C +S000033493 CDS YHL046W-A 8 9981 10307 W 2011-02-03 2003-07-29 +S000001039 ORF Verified YHL047C ARN2 siderophore transporter|TAF1 chromosome 8 8 10213 8351 C 2011-02-03 1996-07-31|2011-02-03 Transporter; member of the ARN family of transporters that specifically recognize siderophore-iron chelates; responsible for uptake of iron bound to the siderophore triacetylfusarinine C +S000029944 CDS YHL047C 8 10213 8351 C 2011-02-03 1996-07-31|2011-02-03 +S000001038 ORF Verified YHL046C PAU13 seripauperin PAU13 chromosome 8 8 12285 11923 C 2011-02-03 1996-07-31 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; expression is induced after ethanol shock; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000029841 CDS YHL046C 8 12285 11923 C 2011-02-03 1996-07-31 +S000001037 ORF Dubious YHL045W chromosome 8 8 12502 12849 W 2011-02-03 1996-07-31 Putative protein of unknown function; not an essential gene +S000037882 CDS YHL045W 8 12502 12849 W 2011-02-03 1996-07-31 +S000001036 ORF Uncharacterized YHL044W DUP240 family protein chromosome 8 8 13565 14272 W 2011-02-03 1996-07-31 Putative integral membrane protein; member of DUP240 gene family; green fluorescent protein (GFP)-fusion protein localizes to the plasma membrane in a punctate pattern +S000037802 CDS YHL044W 8 13565 14272 W 2011-02-03 1996-07-31 +S000001035 ORF Verified YHL043W ECM34 chromosome 8 L000003903 8 14901 15413 W 2011-02-03 1996-07-31 Protein of unknown function; member of the DUP380 subfamily of conserved, often subtelomerically-encoded proteins; SWAT-GFP, seamless-GFP and mCherry C-terminal fusion proteins localize to the cytosol +S000035918 CDS YHL043W 8 14901 15413 W 2011-02-03 1996-07-31 +S000001034 ORF Uncharacterized YHL042W chromosome 8 8 15667 16119 W 2011-02-03 1996-07-31 Protein of unknown function; member of the DUP380 subfamily of conserved, often subtelomerically-encoded proteins; SWAT-GFP and mCherry fusion proteins localize to the vacuole +S000035803 CDS YHL042W 8 15667 16119 W 2011-02-03 1996-07-31 +S000001033 ORF Dubious YHL041W chromosome 8 8 17392 17841 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035678 CDS YHL041W 8 17392 17841 W 2011-02-03 1996-07-31 +S000001032 ORF Verified YHL040C ARN1 siderophore transporter chromosome 8 8 20971 19088 C 2011-02-03 1996-07-31 ARN family transporter for siderophore-iron chelates; responsible for uptake of iron bound to ferrirubin, ferrirhodin, and related siderophores; protein increases in abundance and relocalizes to the vacuole upon DNA replication stress +S000034609 CDS YHL040C 8 20971 19088 C 2011-02-03 1996-07-31 +S000001031 ORF Verified YHL039W EFM1 protein-lysine N-methyltransferase chromosome 8 8 21783 23540 W 2011-02-03 1996-07-31 Lysine methyltransferase; involved in the monomethylation of eEF1A (Tef1p/Tef2p); SET-domain family member; predicted involvement in ribosome biogenesis; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm +S000036027 CDS YHL039W 8 21783 23540 W 2011-02-03 1996-07-31 +S000001030 ORF Verified YHL038C CBP2 chromosome 8 L000000225 8 25509 23617 C 2011-02-03 1996-07-31 Required for splicing of the group I intron bI5 of the COB pre-mRNA; nuclear-encoded mitochondrial protein that binds to the RNA to promote splicing; also involved in but not essential for splicing of the COB bI2 intron and the intron in the 21S rRNA gene +S000035079 CDS YHL038C 8 25509 23617 C 2011-02-03 1996-07-31 +S000001029 ORF Dubious YHL037C chromosome 8 8 26179 25778 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034940 CDS YHL037C 8 26179 25778 C 2011-02-03 1996-07-31|2011-02-03 +S000001028 ORF Verified YHL036W MUP3 chromosome 8 L000003357 8 26241 27881 W 2011-02-03 1996-07-31 Low affinity methionine permease; similar to Mup1p +S000034885 CDS YHL036W 8 26241 27881 W 2011-02-03 1996-07-31 +S000001027 ORF Verified YHL035C VMR1 putative ATP-binding cassette multidrug transporter VMR1 chromosome 8 8 32756 27978 C 2011-02-03 1996-07-31 Vacuolar membrane protein; involved in multiple drug resistance and metal sensitivity; ATP-binding cassette (ABC) family member involved in drug transport; potential Cdc28p substrate; induced under respiratory conditions; VMR1 has a paralog, YBT1, that arose from the whole genome duplication +S000033937 CDS YHL035C 8 32756 27978 C 2011-02-03 1996-07-31 +S000028774 ORF Dubious YHL034W-A chromosome 8 8 33176 33637 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF SBP1/YHL034C +S000033492 CDS YHL034W-A 8 33176 33637 W 2011-02-03 2003-07-29 +S000001026 ORF Verified YHL034C SBP1 SSB1|SSBR1 chromosome 8 L000002628|L000002076 8 34077 33193 C 2011-02-03 1996-07-31 Protein that binds eIF4G and has a role in repression of translation; has an RGG motif; found in cytoplasmic P bodies; binds to mRNAs under glucose starvation stress, most often in the 5' UTR; found associated with small nucleolar RNAs snR10 and snR11; SBP1 has a paralog, RNP1, that arose from the whole genome duplication +S000033834 CDS YHL034C 8 34077 33193 C 2011-02-03 1996-07-31 +S000001025 ORF Verified YHL033C RPL8A eL8|ribosomal 60S subunit protein L8A|L8e|rp6|YL5|L8A|L4A|MAK7 chromosome 8 L000000981|L000001704 8 36025 35255 C -38 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L8A; required for processing of 27SA3 pre-rRNA to 27SB pre-rRNA during assembly of large ribosomal subunit; depletion leads to a turnover of pre-rRNA; L8 binds to Domain I of 25S and 5.8 S rRNAs; mutation results in decreased amounts of free 60S subunits; homologous to mammalian ribosomal protein L7A, no bacterial homolog; RPL8A has a paralog, RPL8B, that arose from the whole genome duplication +S000033669 CDS YHL033C 8 36025 35255 C 2011-02-03 1996-07-31 +S000001024 ORF Verified YHL032C GUT1 glycerol kinase chromosome 8 L000000746 8 38508 36379 C 2011-02-03 1996-07-31 Glycerol kinase; converts glycerol to glycerol-3-phosphate; glucose repression of expression is mediated by Adr1p and Ino2p-Ino4p; derepression of expression on non-fermentable carbon sources is mediated by Opi1p and Rsf1p +S000030379 CDS YHL032C 8 38508 36379 C 2011-02-03 1996-07-31 +S000028773 ORF Dubious YHL030W-A chromosome 8 8 39074 39535 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene GOS1/YHL031C +S000033490 CDS YHL030W-A 8 39074 39535 W 2011-02-03 2003-07-29 +S000001023 ORF Verified YHL031C GOS1 chromosome 8 L000004085 8 39486 38815 C 2011-02-03 1996-07-31 v-SNARE protein involved in Golgi transport; homolog of the mammalian protein GOS-28/GS28 +S000030199 CDS YHL031C 8 39486 38815 C 2011-02-03 1996-07-31 +S000001022 ORF Verified YHL030W ECM29 chromosome 8 L000003899 8 40084 45690 W 2011-02-03 1996-07-31 Scaffold protein; assists in association of the proteasome core particle with the regulatory particle; inhibits proteasomal ATPase activity; degraded by the mature proteasome after assembly; contains HEAT-like repeats; protein increases in abundance and relocalizes from nucleus to cytoplasm upon DNA replication stress +S000030143 CDS YHL030W 8 40084 45690 W 2011-02-03 1996-07-31 +S000001021 ORF Uncharacterized YHL029C OCA5 chromosome 8 8 47968 45929 C 2011-02-03 1996-07-31 Cytoplasmic protein required for replication of Brome mosaic virus; S. cerevisiae is a model system for studying replication of positive-strand RNA viruses in their natural hosts +S000030645 CDS YHL029C 8 47968 45929 C 2011-02-03 1996-07-31 +S000001020 ORF Verified YHL028W WSC4 YFW1|YHC8 chromosome 8 L000004219 8 48763 50580 W 2011-02-03 1996-07-31 Endoplasmic reticulum (ER) membrane protein; involved in the translocation of soluble secretory proteins and insertion of membrane proteins into the ER membrane; may also have a role in the stress response but has only partial functional overlap with WSC1-3 +S000030604 CDS YHL028W 8 48763 50580 W 2011-02-03 1996-07-31 +S000001019 ORF Verified YHL027W RIM101 alkaline-responsive transcriptional regulator RIM101|RIM1 chromosome 8 L000002818 8 51111 52988 W 2011-02-03 1996-07-31 Cys2His2 zinc-finger transcriptional repressor; involved in alkaline responsive gene repression as part of adaptation to alkaline conditions; involved in cell wall assembly; required for alkaline pH-stimulated haploid invasive growth and sporulation; activated by alkaline-dependent proteolytic processing which results in removal of the C-terminal tail; similar to A. nidulans PacC +S000030530 CDS YHL027W 8 51111 52988 W 2011-02-03 1996-07-31 +S000001018 ORF Uncharacterized YHL026C chromosome 8 8 54166 53219 C 2011-02-03 1996-07-31|2005-11-07 Putative protein of unknown function; transcriptionally regulated by Upc2p via an upstream sterol response element; SWAT-GFP fusion protein localizes to the cell periphery, while mCherry fusion localizes to both the cell periphery and vacuole; YHL026C is not an essential gene; in 2005 the start site was moved 141 nt upstream (see Locus History) +S000037665 CDS YHL026C 8 54166 53219 C 2011-02-03 1996-07-31|2005-11-07 +S000001017 ORF Verified YHL025W SNF6 chromosome 8 L000001949 8 54851 55849 W 2011-02-03 1996-07-31 Subunit of the SWI/SNF chromatin remodeling complex; involved in transcriptional regulation; functions interdependently in transcriptional activation with Snf2p and Snf5p; relocates to the cytosol under hypoxic conditions +S000037635 CDS YHL025W 8 54851 55849 W 2011-02-03 1996-07-31 +S000001016 ORF Verified YHL024W RIM4 chromosome 8 L000004288|L000004795 8 56649 58790 W 2011-02-03 1996-07-31 Putative RNA-binding protein; required for the expression of early and middle sporulation genes +S000037557 CDS YHL024W 8 56649 58790 W 2011-02-03 1996-07-31 +S000001015 ORF Verified YHL023C NPR3 RMD11 chromosome 8 8 62563 59123 C 2011-02-03 1996-07-31 Subunit of the Iml1p/SEACIT complex; SEACIT (Iml1p-Npr2p-Npr3p) is a subcomplex of SEAC, a coatomer-related complex that associates dynamically with the vacuole; Npr3p may have a structural or regulatory role, supporting Iml1p function as a GAP for the Rag family GTPase Gtr1p, and leading to inhibition of TORC1 signaling in response to amino acid deprivation; SEACIT is required for non-nitrogen-starvation-induced autophagy; null mutant has meiotic defects; human NPRL3 homolog +S000037421 CDS YHL023C 8 62563 59123 C 2011-02-03 1996-07-31 +S000006597 tRNA_gene tH(GUG)H chromosome 8 L000003855 8 62755 62826 W 2011-02-03 2000-05-19 Histidine tRNA (tRNA-His), predicted by tRNAscan-SE analysis +S000033884 noncoding_exon tH(GUG)H 8 62755 62826 W 2011-02-03 2000-05-19 +S000001014 ORF Verified YHL022C SPO11 chromosome 8 L000002002 8 64157 62961 C -23 2011-02-03 1996-07-31 Meiosis-specific protein that initiates meiotic recombination; initiates meiotic recombination by catalyzing the formation of double-strand breaks in DNA via a transesterification reaction; required for homologous chromosome pairing and synaptonemal complex formation +S000031919 CDS YHL022C 8 64157 62961 C 2011-02-03 1996-07-31 +S000114849 ARS ARS805 ARS805 ARSVIII-64|SPO11 ARS chromosome 8 8 64296 64371 2014-11-18 2014-11-18|2006-04-13|2006-09-07|2011-02-03 Autonomously Replicating Sequence +S000178106 ARS_consensus_sequence ARS805 8 64299 64315 W 2014-11-18 2014-11-18 +S000001013 ORF Verified YHL021C AIM17 FMP12 chromosome 8 8 65859 64462 C 2011-02-03 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays reduced frequency of mitochondrial genome loss +S000031775 CDS YHL021C 8 65859 64462 C 2011-02-03 1996-07-31 +S000001012 ORF Verified YHL020C OPI1 transcriptional regulator OPI1 chromosome 8 L000001303 8 67456 66242 C 2011-02-03 1996-07-31 Transcriptional regulator of a variety of genes; phosphorylation by protein kinase A stimulates Opi1p function in negative regulation of phospholipid biosynthetic genes; involved in telomere maintenance; null exhibits disrupted mitochondrial metabolism and low cardiolipin content, strongly correlated with overproduction of inositol; binds to phosphatidic acid +S000029857 CDS YHL020C 8 67456 66242 C 2011-02-03 1996-07-31 +S000028772 ORF Dubious YHL019W-A chromosome 8 8 67711 68304 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene APM2/YHL019C +S000033486 CDS YHL019W-A 8 67711 68304 W 2011-02-03 2003-07-29 +S000001011 ORF Verified YHL019C APM2 chromosome 8 L000000095 8 69548 67731 C 2011-02-03 1996-07-31 Protein of unknown function; homologous to the medium chain of mammalian clathrin-associated protein complex; involved in vesicular transport +S000035353 CDS YHL019C 8 69548 67731 C 2011-02-03 1996-07-31 +S000001010 ORF Uncharacterized YHL018W 4a-hydroxytetrahydrobiopterin dehydratase chromosome 8 8 69708 70070 W 2011-02-03 1996-07-31 Putative 4a-hydroxytetrahydrobiopterin dehydratase; green fluorescent protein (GFP)-fusion protein localizes to mitochondria and is induced in response to the DNA-damaging agent MMS +S000035323 CDS YHL018W 8 69708 70070 W 2011-02-03 1996-07-31 +S000001009 ORF Uncharacterized YHL017W chromosome 8 8 70276 71874 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein co-localizes with clathrin-coated vesicles; YHL017W has a paralog, PTM1, that arose from the whole genome duplication +S000035245 CDS YHL017W 8 70276 71874 W 2011-02-03 1996-07-31 +S000001008 ORF Verified YHL016C DUR3 chromosome 8 L000000534 8 74244 72037 C -13 2011-02-03 1996-07-31 Plasma membrane transporter for both urea and polyamines; expression is highly sensitive to nitrogen catabolite repression and induced by allophanate, the last intermediate of the allantoin degradative pathway +S000034197 CDS YHL016C 8 74244 72037 C 2011-02-03 1996-07-31 +S000028828 ORF Uncharacterized YHL015W-A chromosome 8 8 74699 74782 W 2011-02-03 2003-07-29 Putative protein of unknown function +S000033654 CDS YHL015W-A 8 74699 74782 W 2011-02-03 2003-07-29 +S000001007 ORF Verified YHL015W RPS20 uS10|ribosomal 40S subunit protein S20|S10|URP2 chromosome 8 L000002442 8 75412 75777 W 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; overproduction suppresses mutations affecting RNA polymerase III-dependent transcription; homologous to mammalian ribosomal protein S20 and bacterial S10 +S000034165 CDS YHL015W 8 75412 75777 W 2011-02-03 1996-07-31 +S000001006 ORF Verified YHL014C YLF2 YLF1 chromosome 8 L000002519 8 77314 76097 C 2011-02-03 1996-07-31 Protein of unknown function; has weak similarity to E. coli GTP-binding protein gtp1; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000034003 CDS YHL014C 8 77314 76097 C 2011-02-03 1996-07-31 +S000001005 ORF Verified YHL013C OTU2 chromosome 8 8 78353 77430 C 2011-02-03 1996-07-31 Protein of unknown function; may interact with ribosomes, based on co-purification experiments; member of the ovarian tumor-like (OTU) superfamily of predicted cysteine proteases; shows cytoplasmic localization; protein abundance increases in response to DNA replication stress +S000033190 CDS YHL013C 8 78353 77430 C 2011-02-03 1996-07-31 +S000001004 ORF Uncharacterized YHL012W UTP--glucose-1-phosphate uridylyltransferase chromosome 8 8 78936 80417 W 2011-02-03 1996-07-31 Putative UTP glucose-1-phosphate uridylyltransferase; YHL012W has a paralog, UGP1, that arose from the whole genome duplication +S000033163 CDS YHL012W 8 78936 80417 W 2011-02-03 1996-07-31 +S000001003 ORF Verified YHL011C PRS3 ribose phosphate diphosphokinase subunit PRS3 chromosome 8 L000001514 8 81616 80654 C 2011-02-03 1996-07-31 5-phospho-ribosyl-1(alpha)-pyrophosphate synthetase; synthesizes PRPP, which is required for nucleotide, histidine, and tryptophan biosynthesis; one of five related enzymes, which are active as heteromultimeric complexes +S000033025 CDS YHL011C 8 81616 80654 C 2011-02-03 1996-07-31 +S000001002 ORF Verified YHL010C ETP1 BRP2 chromosome 8 8 83721 81964 C 2011-02-03 1996-07-31 Protein of unknown function required for growth on ethanol; contains a zinc finger region and has homology to human BRAP2, which is a cytoplasmic protein that binds nuclear localization sequences +S000032099 CDS YHL010C 8 83721 81964 C 2011-02-03 1996-07-31 +S000001001 ORF Verified YHL009C YAP3 chromosome 8 L000004382 8 85060 84068 C 2011-02-03 1996-07-31 Basic leucine zipper (bZIP) transcription factor +S000030991 CDS YHL009C 8 85060 84068 C 2011-02-03 1996-07-31 +S000006758 tRNA_gene tV(AAC)H chromosome 8 L000003865 8 85371 85298 C 2011-02-03 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000032130 noncoding_exon tV(AAC)H 8 85371 85298 C 2011-02-03 2000-05-19 +S000006987 long_terminal_repeat YHLCsigma1 chromosome 8 8 85538 85388 C 2011-02-03 2000-05-19 Ty3 LTR +S000006989 long_terminal_repeat YHLWtau1 chromosome 8 8 85539 85909 W 2011-02-03 2000-05-19 Ty4 LTR +S000006991 LTR_retrotransposon YHLWTy4-1 Ty4 chromosome 8 8 85539 91761 W 2011-02-03 2000-05-19 Ty4 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007371 transposable_element_gene YHL009W-A gag protein chromosome 8 8 85909 87150 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000032880 CDS YHL009W-A 8 85909 87150 W 2011-02-03 1999-07-17 +S000007372 transposable_element_gene YHL009W-B gag-pol fusion protein chromosome 8 S000029015 8 85909 91318 W 2011-02-03 1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000032882 CDS YHL009W-B 8 85909 86994 W 2011-02-03 1999-07-17 +S000032883 CDS YHL009W-B 8 86996 91318 W 2011-02-03 1999-07-17 +S000032884 plus_1_translational_frameshift YHL009W-B 8 86995 86995 W 2011-02-03 1999-07-17 +S000006990 long_terminal_repeat YHLWtau2 chromosome 8 8 91391 91761 W 2011-02-03 2000-05-19 Ty4 LTR +S000006985 long_terminal_repeat YHLCdelta1 chromosome 8 8 92099 91772 C 2011-02-03 2000-05-19 Ty1 LTR +S000006988 long_terminal_repeat YHLWdelta2 chromosome 8 8 92240 92390 W 2011-02-03 2000-05-19 Ty1 LTR +S000001000 ORF Uncharacterized YHL008C chromosome 8 8 94510 92627 C 2011-02-03 1996-07-31 Putative protein of unknown function; may be involved in the uptake of chloride ions; does not appear to be involved in monocarboxylic acid transport; green fluorescent protein (GFP)-fusion protein localizes to the vacuole +S000030923 CDS YHL008C 8 94510 92627 C 2011-02-03 1996-07-31 +S000028771 ORF Dubious YHL006W-A chromosome 8 8 97732 98085 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF STE20/YHL007C +S000033485 CDS YHL006W-A 8 97732 98085 W 2011-02-03 2003-07-29 +S000000999 ORF Verified YHL007C STE20 mitogen-activated protein kinase kinase kinase kinase STE20 chromosome 8 L000002123 8 97937 95118 C 2011-02-03 1996-07-31 Cdc42p-activated signal transducing kinase; involved in pheromone response, pseudohyphal/invasive growth, vacuole inheritance, down-regulation of sterol uptake; GBB motif binds Ste4p; member of the PAK (p21-activated kinase) family +S000030840 CDS YHL007C 8 97937 95118 C 2011-02-03 1996-07-31 +S000000998 ORF Verified YHL006C SHU1 chromosome 8 8 98795 98343 C 2011-02-03 2004-01-29|1996-07-31 Component of Shu complex (aka PCSS complex); Shu complex also includes Psy3, Csm2, Shu2, and promotes error-free DNA repair, mediates inhibition of Srs2p function; essential for promoting the establishment of homolog bias during meiotic homologous recombination; promotes both crossover (CO) and non-crossover (NCO) pathways of meiotic recombination and formation of Rad51p filaments +S000029837 CDS YHL006C 8 98795 98343 C 2011-02-03 2004-01-29|1996-07-31 +S000000996 ORF Verified YHL004W MRP4 mitochondrial 37S ribosomal protein MRP4 chromosome 8 L000001154 8 99219 100403 W 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the small subunit +S000037796 CDS YHL004W 8 99219 100403 W 2011-02-03 1996-07-31 +S000000997 ORF Uncharacterized YHL005C chromosome 8 8 99220 98828 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YHL005C is not an essential gene +S000037818 CDS YHL005C 8 99220 98828 C 2011-02-03 1996-07-31 +S000000995 ORF Verified YHL003C LAG1 sphingosine N-acyltransferase LAG1 chromosome 8 L000000928 8 101883 100648 C 2011-02-03 1996-07-31 Ceramide synthase component; involved in synthesis of ceramide from C26(acyl)-coenzyme A and dihydrosphingosine or phytosphingosine, functionally equivalent to Lac1p; forms ER foci upon DNA replication stress; homolog of human CERS2, a tumor metastasis suppressor gene whose silencing enhances invasion/metastasis of prostate cancer cells; LAG1 has a paralog, LAC1, that arose from the whole genome duplication +S000036974 CDS YHL003C 8 101883 100648 C 2011-02-03 1996-07-31 +S000000994 ORF Verified YHL002W HSE1 ESCRT-0 subunit protein HSE1 chromosome 8 8 102612 103970 W 2011-02-03 1996-07-31 Subunit of the endosomal Vps27p-Hse1p complex; complex is required for sorting of ubiquitinated membrane proteins into intralumenal vesicles prior to vacuolar degradation, as well as for recycling of Golgi proteins and formation of lumenal membranes +S000036957 CDS YHL002W 8 102612 103970 W 2011-02-03 1996-07-31 +S000028770 ORF Dubious YHL002C-A chromosome 8 8 103075 102587 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF HSE1/YHL002W +S000033484 CDS YHL002C-A 8 103075 102587 C 2011-02-03 2003-07-29 +S000000993 ORF Verified YHL001W RPL14B eL14|ribosomal 60S subunit protein L14B|L14e|L14B chromosome 8 L000002707 8 104277 105091 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L14B; homologous to mammalian ribosomal protein L14, no bacterial homolog; RPL14B has a paralog, RPL14A, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000036892 CDS YHL001W 8 104277 104405 W 2011-02-03 1996-07-31 +S000036893 CDS YHL001W 8 104804 105091 W 2011-02-03 1996-07-31 +S000036894 intron YHL001W 8 104406 104803 W 2011-02-03 1996-07-31 +S000006469 centromere CEN8 CEN8 chromosome 8 L000000301 8 105703 105586 C 0 2011-02-03 2000-05-19|2004-10-08 Chromosome VIII centromere +S000077284 centromere_DNA_Element_I CEN8 8 105703 105694 C 2011-02-03 2004-10-08 +S000077285 centromere_DNA_Element_II CEN8 8 105693 105611 C 2011-02-03 2004-10-08 +S000077286 centromere_DNA_Element_III CEN8 8 105610 105586 C 2011-02-03 2004-10-08 +S000001043 ORF Verified YHR001W OSH7 oxysterol-binding protein related protein OSH7 chromosome 8 8 106055 107368 W 2011-02-03 1996-07-31 Oxysterol-binding protein; part of family with seven members in S. cerevisiae; family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; OSH7 has a paralog, OSH6, that arose from the whole genome duplication +S000033353 CDS YHR001W 8 106055 107368 W 2011-02-03 1996-07-31 +S000003529 ORF Verified YHR001W-A QCR10 ubiquinol--cytochrome-c reductase subunit 10 chromosome 8 L000001550 8 107826 108122 W 2011-02-03 1996-07-31 Subunit of the ubiqunol-cytochrome c oxidoreductase complex; this complex comprises part of the mitochondrial respiratory chain; members include Cobp, Rip1p, Cyt1p, Cor1p, Qcr2p, Qcr6p, Qcr7p, Qcr8p, Qcr9p, and Qcr10p and comprises part of the mitochondrial respiratory chain +S000035662 CDS YHR001W-A 8 107826 107831 W 2011-02-03 1996-07-31 +S000035663 CDS YHR001W-A 8 107895 108122 W 2011-02-03 1996-07-31 +S000035664 intron YHR001W-A 8 107832 107894 W 2011-02-03 1996-07-31 +S000001044 ORF Verified YHR002W LEU5 coenzyme A transporter chromosome 8 L000000946 8 108812 109885 W 0 2011-02-03 1996-07-31 Mitochondrial carrier protein; involved in the accumulation of CoA in the mitochondrial matrix; homolog of human Graves disease protein SLC25A16, which complements yeast null mutant; does not encode an isozyme of Leu4p, as first hypothesized +S000034263 CDS YHR002W 8 108812 109885 W 2011-02-03 1996-07-31 +S000001045 ORF Verified YHR003C TCD1 tRNA threonylcarbamoyladenosine dehydratase chromosome 8 8 111317 110028 C 2011-02-03 1996-07-31 tRNA threonylcarbamoyladenosine dehydratase; required for the ct6A tRNA base modification, where an adenosine at position 37 is modified to form a cyclized active ester with an oxazolone ring; localized to the mitochondrial outer membrane; TCD1 has a paralog, TCD2, that arose from the whole genome duplication +S000034299 CDS YHR003C 8 111317 110028 C 2011-02-03 1996-07-31 +S000001046 ORF Verified YHR004C NEM1 Nem1-Spo7 phosphatase catalytic subunit NEM1 chromosome 8 8 113094 111754 C 2011-02-03 1996-07-31 Probable catalytic subunit of Nem1p-Spo7p phosphatase holoenzyme; regulates nuclear growth by controlling phospholipid biosynthesis, required for normal nuclear envelope morphology and sporulation; homolog of the human protein Dullard +S000034400 CDS YHR004C 8 113094 111754 C 2011-02-03 1996-07-31 +S000001047 ORF Verified YHR005C GPA1 guanine nucleotide-binding protein subunit alpha|SCG1|DAC1|CDC70 chromosome 8 L000000720 8 114917 113499 C 3 2011-02-03 1996-07-31 Subunit of the G protein involved in pheromone response; GTP-binding alpha subunit of the heterotrimeric G protein; negatively regulates the mating pathway by sequestering G(beta)gamma and by triggering an adaptive response; activates Vps34p at the endosome; protein abundance increases in response to DNA replication stress +S000034477 CDS YHR005C 8 114917 113499 C 2011-02-03 1996-07-31 +S000003530 ORF Verified YHR005C-A TIM10 protein transporter TIM10|MRS11 chromosome 8 L000003574 8 115901 115620 C 2011-02-03 1999-07-17 Essential protein of the mitochondrial intermembrane space; forms a complex with Tim9p (TIM10 complex) that delivers hydrophobic proteins to the TIM22 complex for insertion into the inner membrane +S000033460 CDS YHR005C-A 8 115901 115620 C 2011-02-03 1999-07-17 +S000006740 tRNA_gene tT(AGU)H chromosome 8 L000003864 8 116179 116107 C 2011-02-03 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000032165 noncoding_exon tT(AGU)H 8 116179 116107 C 2011-02-03 2000-05-19 +S000130146 ARS ARS806 chromosome 8 8 116179 116421 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006992 long_terminal_repeat YHRCdelta3 chromosome 8 8 116752 116421 C 2011-02-03 2000-05-19 Ty1 LTR +S000006993 long_terminal_repeat YHRCdelta4 chromosome 8 8 117061 116763 C 2011-02-03 2000-05-19 Ty1 LTR +S000001048 ORF Verified YHR006W STP2 chromosome 8 L000003370 8 117814 119439 W 2011-02-03 1996-07-31 Transcription factor; activated by proteolytic processing in response to signals from the SPS sensor system for external amino acids; activates transcription of amino acid permease genes; STP2 has a paralog, STP1, that arose from the whole genome duplication +S000035553 CDS YHR006W 8 117814 119439 W 2011-02-03 1996-07-31 +S000001049 ORF Verified YHR007C ERG11 sterol 14-demethylase|CYP51 chromosome 8 L000000577 8 121683 120091 C 12 2011-02-03 1996-07-31 Lanosterol 14-alpha-demethylase; catalyzes C-14 demethylation of lanosterol to form 4,4''-dimethyl cholesta-8,14,24-triene-3-beta-ol in ergosterol biosynthesis pathway; transcriptionally down-regulated when ergosterol is in excess; member of cytochrome P450 family; associated and coordinately regulated with the P450 reductase Ncp1p; human CYP51A1 functionally complements the lethality of the erg11 null mutation +S000035603 CDS YHR007C 8 121683 120091 C 2011-02-03 1996-07-31 +S000028830 ORF Uncharacterized YHR007C-A chromosome 8 8 122765 122550 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry; SWAT-GFP fusion protein localizes to the nucleus +S000034480 CDS YHR007C-A 8 122765 122550 C 2011-02-03 2003-07-29 +S000001050 ORF Verified YHR008C SOD2 superoxide dismutase SOD2 chromosome 8 L000001979 8 123590 122889 C 12 2011-02-03 1996-07-31 Mitochondrial manganese superoxide dismutase; protects cells against oxygen toxicity and oxidative stress; human mitochondrial SOD2 can complement a yeast null mutant and human cytoplasmic SOD1 can also complement when targeted to the mitochondrial matrix +S000035694 CDS YHR008C 8 123590 122889 C 2011-02-03 1996-07-31 +S000001051 ORF Verified YHR009C TDA3 BTN3 chromosome 8 8 125680 124109 C 2011-02-03 1996-07-31 Putative oxidoreductase involved in late endosome to Golgi transport; physical and genetical interactions with Btn2p; null mutant is viable, has extended S phase, and sensitive to expression of top1-T722A allele; similar to human FOXRED1 +S000036628 CDS YHR009C 8 125680 124109 C 2011-02-03 1996-07-31 +S000001052 ORF Verified YHR010W RPL27A eL27|ribosomal 60S subunit protein L27A|L27e|L27A|RPL27 chromosome 8 L000002708 8 126521 127492 W 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L27A; homologous to mammalian ribosomal protein L27, no bacterial homolog; RPL27A has a paralog, RPL27B, that arose from the whole genome duplication +S000036518 CDS YHR010W 8 126521 126551 W 2011-02-03 1996-07-31 +S000036519 CDS YHR010W 8 127113 127492 W 2011-02-03 1996-07-31 +S000036520 intron YHR010W 8 126552 127112 W 2011-02-03 1996-07-31 +S000001053 ORF Verified YHR011W DIA4 putative serine--tRNA ligase DIA4 chromosome 8 8 127780 129120 W 2011-02-03 1996-07-31 Probable mitochondrial seryl-tRNA synthetase; mutant displays increased invasive and pseudohyphal growth +S000036641 CDS YHR011W 8 127780 129120 W 2011-02-03 1996-07-31 +S000001054 ORF Verified YHR012W VPS29 retromer subunit VPS29|VPT6|PEP11 chromosome 8 L000002840 8 129481 130448 W 2011-02-03 1996-07-31 Subunit of the membrane-associated retromer complex; endosomal protein; essential for endosome-to-Golgi retrograde transport; forms a subcomplex with Vps35p and Vps26p that selects cargo proteins for endosome-to-Golgi retrieval +S000036738 CDS YHR012W 8 129481 129528 W 2011-02-03 1996-07-31 +S000036739 CDS YHR012W 8 129648 130448 W 2011-02-03 1996-07-31 +S000036740 intron YHR012W 8 129529 129647 W 2011-02-03 1996-07-31 +S000001055 ORF Verified YHR013C ARD1 peptide alpha-N-acetyltransferase complex A subunit ARD1|NAA10 chromosome 8 L000000103 8 131446 130730 C 10 2011-02-03 1996-07-31 Subunit of protein N-terminal acetyltransferase NatA; NatA comprises Nat1p, Ard1p, Nat5p; acetylates many proteins to influence telomeric silencing, cell cycle, heat-shock resistance, mating, sporulation, early stages of mitophagy; protein abundance increases under DNA replication stress; mutations in human homolog X-linked NAA10 lead to Ogden syndrome (S37P) and intellectual disability (R116W); expression of human NAA10 and NAA15 can complement ard1 nat1 double mutant +S000037391 CDS YHR013C 8 131446 130730 C 2011-02-03 1996-07-31 +S000001056 ORF Verified YHR014W SPO13 chromosome 8 L000002004 8 132047 132922 W 11 2011-02-03 1996-07-31 Meiotic regulator; involved in maintaining sister chromatid cohesion during meiosis I as well as promoting proper attachment of kinetochores to the spindle during meiosis I and meiosis II; anaphase-promoting complex (APC) substrate that is degraded during anaphase I; expressed only in meiotic cells +S000037600 CDS YHR014W 8 132047 132922 W 2011-02-03 1996-07-31 +S000006726 tRNA_gene tS(AGA)H chromosome 8 L000003863 8 133107 133026 C 2011-02-03 2000-05-19 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis +S000032372 noncoding_exon tS(AGA)H 8 133107 133026 C 2011-02-03 2000-05-19 +S000118357 ARS ARS807 ARSVIII-134 chromosome 8 8 133438 133539 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178107 ARS_consensus_sequence ARS807 8 133530 133514 C 2014-11-18 2014-11-18 +S000006994 long_terminal_repeat YHRCdelta5 chromosome 8 8 133442 133201 C 2011-02-03 2000-05-19 Ty1 LTR +S000006995 long_terminal_repeat YHRCdelta6 chromosome 8 8 133684 133565 C 2011-02-03 2000-05-19 Ty1 LTR +S000007007 long_terminal_repeat YHRWdelta7 chromosome 8 8 133685 134009 W 2011-02-03 2000-05-19 Ty1 LTR +S000006698 tRNA_gene tQ(UUG)H chromosome 8 L000003856 8 134321 134392 W 2011-02-03 2000-05-19 Glutamine tRNA (tRNA-Gln), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000031701 noncoding_exon tQ(UUG)H 8 134321 134392 W 2011-02-03 2000-05-19 +S000001057 ORF Verified YHR015W MIP6 chromosome 8 L000004334 8 134554 136533 W 2011-02-03 1996-07-31 Putative RNA-binding protein; interacts with Mex67p, which is a component of the nuclear pore involved in nuclear mRNA export; MIP6 has a paralog, PES4, that arose from the whole genome duplication +S000030365 CDS YHR015W 8 134554 136533 W 2011-02-03 1996-07-31 +S000001058 ORF Verified YHR016C YSC84 LSB4 chromosome 8 L000003175 8 138455 136881 C 2011-02-03 1996-07-31 Actin-binding protein; involved in bundling of actin filaments and endocytosis of actin cortical patches; activity stimulated by Las17p; contains SH3 domain similar to Rvs167p; YSC84 has a paralog, LSB3, that arose from the whole genome duplication +S000030436 CDS YHR016C 8 138240 136881 C 2011-02-03 1996-07-31 +S000030435 CDS YHR016C 8 138455 138409 C 2011-02-03 1996-07-31 +S000030437 intron YHR016C 8 138408 138241 C 2011-02-03 1996-07-31 +S000001059 ORF Verified YHR017W YSC83 chromosome 8 L000002830 8 138694 139851 W 2011-02-03 1996-07-31 Non-essential mitochondrial protein of unknown function; mRNA induced during meiosis, peaking between mid to late prophase of meiosis I; similar to S. douglasii YSD83 +S000030626 CDS YHR017W 8 138694 139851 W 2011-02-03 1996-07-31 +S000029042 ARS ARS808 ARS2 chromosome 8 L000000122 8 140349 141274 2011-02-03 2006-04-13 Autonomously Replicating Sequence +S000001060 ORF Verified YHR018C ARG4 argininosuccinate lyase ARG4 chromosome 8 L000000109 8 141402 140011 C 12 2011-02-03 1996-07-31 Argininosuccinate lyase; catalyzes the final step in the arginine biosynthesis pathway +S000030670 CDS YHR018C 8 141402 140011 C 2011-02-03 1996-07-31 +S000001061 ORF Verified YHR019C DED81 asparagine--tRNA ligase DED81 chromosome 8 L000002734 8 143558 141894 C 2011-02-03 1996-07-31 Cytosolic asparaginyl-tRNA synthetase; required for protein synthesis, catalyzes the specific attachment of asparagine to its cognate tRNA +S000031533 CDS YHR019C 8 143558 141894 C 2011-02-03 1996-07-31 +S000001062 ORF Verified YHR020W proline--tRNA ligase chromosome 8 8 143996 146062 W 2011-02-03 1996-07-31 Prolyl-tRNA synthetase; N-terminal domain shows weak homology to prokaryotic posttransfer editing domain, but does not possess posttransfer editing activity; may interact with ribosomes, based on co-purification experiments +S000031552 CDS YHR020W 8 143996 146062 W 2011-02-03 1996-07-31 +S000006513 tRNA_gene tA(AGC)H chromosome 8 L000003862 8 146314 146242 C 2011-02-03 2000-05-19 Alanine tRNA (tRNA-Ala), predicted by tRNAscan-SE analysis; one of 11 nuclear tRNA genes containing the tDNA-anticodon AGC (converted to IGC in the mature tRNA), decodes GCU and GCC codons into alanine, one of 16 nuclear tRNAs for alanine +S000032282 noncoding_exon tA(AGC)H 8 146314 146242 C 2011-02-03 2000-05-19 +S000007003 long_terminal_repeat YHRCsigma2 chromosome 8 8 146671 146331 C 2011-02-03 2000-05-19 Ty3 LTR +S000007010 long_terminal_repeat YHRWtau3 chromosome 8 8 146844 147114 W 2011-02-03 2000-05-19 Ty4 LTR +S000001063 ORF Verified YHR021C RPS27B eS27|ribosomal 40S subunit protein S27B|S27e|rp61|YS20|S27B chromosome 8 L000002713 8 148669 147871 C 2011-02-03 1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S27, no bacterial homolog; RPS27B has a paralog, RPS27A, that arose from the whole genome duplication +S000031620 CDS YHR021C 8 148116 147871 C 2011-02-03 1996-07-31 +S000031619 CDS YHR021C 8 148669 148667 C 2011-02-03 1996-07-31 +S000031621 intron YHR021C 8 148666 148117 C 2011-02-03 1996-07-31 +S000003531 ORF Uncharacterized YHR021W-A ECM12 chromosome 8 L000003887 8 149225 149680 W 2011-02-03 1999-07-17 Putative protein of unknown function; may contribute to cell wall biosynthesis, mutants display zymolyase hypersensitivity +S000034210 CDS YHR021W-A 8 149225 149680 W 2011-02-03 1999-07-17 +S000001064 ORF Uncharacterized YHR022C chromosome 8 8 150345 149575 C 2011-02-03 1996-07-31 Putative protein of unknown function; YHR022C is not an essential gene +S000032603 CDS YHR022C 8 150345 149575 C 2011-02-03 1996-07-31 +S000028645 ORF Uncharacterized YHR022C-A chromosome 8 8 151306 151217 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032421 CDS YHR022C-A 8 151306 151217 C 2011-02-03 2003-07-29 +S000001065 ORF Verified YHR023W MYO1 myosin 1 chromosome 8 L000001222 8 151666 157452 W 2011-02-03 1996-07-31 Type II myosin heavy chain; required for wild-type cytokinesis and cell separation; localizes to the actomyosin ring; binds to myosin light chains Mlc1p and Mlc2p through its IQ1 and IQ2 motifs respectively +S000032750 CDS YHR023W 8 151666 157452 W 2011-02-03 1996-07-31 +S000001066 ORF Verified YHR024C MAS2 mitochondrial-processing protease subunit alpha|MIF2 chromosome 8 L000001027 8 159192 157744 C 26 2011-02-03 1996-07-31 Alpha subunit of the mitochondrial processing protease (MPP); essential processing enzyme that cleaves the N-terminal targeting sequences from mitochondrially imported proteins +S000032823 CDS YHR024C 8 159192 157744 C 2011-02-03 1996-07-31 +S000001067 ORF Verified YHR025W THR1 homoserine kinase chromosome 8 L000002298 8 159438 160511 W 26 2011-02-03 1996-07-31 Homoserine kinase; conserved protein required for threonine biosynthesis; long-lived protein that is preferentially retained in mother cells and forms cytoplasmic filaments; expression is regulated by the GCN4-mediated general amino acid control pathway +S000033588 CDS YHR025W 8 159438 160511 W 2011-02-03 1996-07-31 +S000001068 ORF Verified YHR026W VMA16 H(+)-transporting V0 sector ATPase subunit c''|PPA1 chromosome 8 L000001468 8 160844 161485 W 27 2011-02-03 1996-07-31 Subunit c'' of the vacuolar ATPase; v-ATPase functions in acidification of the vacuole; one of three proteolipid subunits of the V0 domain +S000033662 CDS YHR026W 8 160844 161485 W 2011-02-03 1996-07-31 +S000001069 ORF Verified YHR027C RPN1 proteasome regulatory particle base subunit RPN1|NAS1|HRD2 chromosome 8 L000003039 8 164711 161730 C 2011-02-03 1996-07-31 Non-ATPase base subunit of the 19S RP of the 26S proteasome; may participate in the recognition of several ligands of the proteasome; contains a leucine-rich repeat (LRR) domain, a site for protein-protein interactions; RP is the acronym for regulatory particle +S000033726 CDS YHR027C 8 164711 161730 C 2011-02-03 1996-07-31 +S000028776 ORF Dubious YHR028W-A chromosome 8 8 167352 167672 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF DAP2/YHR028C +S000033498 CDS YHR028W-A 8 167352 167672 W 2011-02-03 2003-07-29 +S000001070 ORF Verified YHR028C DAP2 DPP2 chromosome 8 L000000483 8 167434 164978 C 2011-02-03 1996-07-31 Dipeptidyl aminopeptidase; synthesized as a glycosylated precursor; localizes to the vacuolar membrane; similar to Ste13p +S000034620 CDS YHR028C 8 167434 164978 C 2011-02-03 1996-07-31 +S000118358 ARS ARS809 ARSVIII-169 chromosome 8 8 168549 168723 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000001071 ORF Verified YHR029C YHI9 chromosome 8 8 168561 167677 C 2011-02-03 1996-07-31 Protein of unknown function; null mutant is defective in unfolded protein response; possibly involved in a membrane regulation metabolic pathway; member of the PhzF superfamily, though most likely not involved in phenazine production +S000034772 CDS YHR029C 8 168561 167677 C 2011-02-03 1996-07-31 +S000001072 ORF Verified YHR030C SLT2 mitogen-activated serine/threonine-protein kinase SLT2|LYT2|SLK2|MPK1|BYC2 chromosome 8 L000001919 8 170344 168890 C 2011-02-03 1996-07-31 Serine/threonine MAP kinase; coordinates expression of all 19S regulatory particle assembly-chaperones (RACs) to control proteasome abundance; involved in regulating maintenance of cell wall integrity, cell cycle progression, nuclear mRNA retention in heat shock, septum assembly; required for mitophagy, pexophagy; affects recruitment of mitochondria to phagophore assembly site; plays role in adaptive response of cells to cold; regulated by the PKC1-mediated signaling pathway +S000035799 CDS YHR030C 8 170344 168890 C 2011-02-03 1996-07-31 +S000001073 ORF Verified YHR031C RRM3 RTT104 chromosome 8 S000007420 8 172970 170799 C 2011-02-03 1996-07-31 DNA helicase involved in rDNA replication and Ty1 transposition; binds to and suppresses DNA damage at G4 motifs in vivo; relieves replication fork pauses at telomeric regions; structurally and functionally related to Pif1p +S000035940 CDS YHR031C 8 172970 170799 C 2011-02-03 1996-07-31 +S000001074 ORF Verified YHR032W ERC1 chromosome 8 8 173344 175089 W 2011-02-03 1996-07-31 Member of the multi-drug and toxin extrusion (MATE) family; the MATE family is part of the multidrug/oligosaccharidyl-lipid/polysaccharide (MOP) exporter superfamily; overproduction confers ethionine resistance and accumulation of S-adenosylmethionine +S000036858 CDS YHR032W 8 173344 175089 W 2011-02-03 1996-07-31 +S000028831 ORF Dubious YHR032W-A chromosome 8 8 175195 175374 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YHR032C-A +S000034481 CDS YHR032W-A 8 175195 175374 W 2011-02-03 2003-07-29 +S000028646 ORF Dubious YHR032C-A chromosome 8 8 175394 175275 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the dubious ORF YHR032W-A +S000032422 CDS YHR032C-A 8 175394 175275 C 2011-02-03 2003-07-29 +S000001075 ORF Uncharacterized YHR033W putative glutamate 5-kinase chromosome 8 8 175548 176819 W 2011-02-03 1996-07-31 Putative protein of unknown function; epitope-tagged protein localizes to the cytoplasm; YHR033W has a paralog, PRO1, that arose from the whole genome duplication +S000036911 CDS YHR033W 8 175548 176819 W 2011-02-03 1996-07-31 +S000001076 ORF Verified YHR034C PIH1 NOP17 chromosome 8 8 177999 176965 C 2011-02-03 1996-07-31 Component of the conserved R2TP complex (Rvb1-Rvb2-Tah1-Pih1); R2TP complex interacts with Hsp90 (Hsp82p and Hsc82p) to mediate assembly large protein complexes such as box C/D snoRNPs and RNA polymerase II +S000036943 CDS YHR034C 8 177999 176965 C 2011-02-03 1996-07-31 +S000001077 ORF Verified YHR035W NEL1 chromosome 8 8 178219 180111 W 2011-02-03 1996-07-31 Activator of Sar1p GTPase activity; paralog of Sec23 but does not associate with the COPII components; not an essential gene +S000037726 CDS YHR035W 8 178219 180111 W 2011-02-03 1996-07-31 +S000001078 ORF Verified YHR036W BRL1 chromosome 8 8 180345 181760 W 2011-02-03 1996-07-31 Essential nuclear envelope/ER integral membrane protein; interacts and functions with Apq12p and Brr6p in lipid homeostasis; mutants are defective in nuclear pore complex biogenesis, mRNA nuclear export and are sensitive to sterol biosynthesis inhibitors and membrane fluidizing agents; identified as a dosage suppressor of a temperature sensitive mutation in the major karyopherin, CRM1; homologous to Brr6p +S000037810 CDS YHR036W 8 180345 181760 W 2011-02-03 1996-07-31 +S000001079 ORF Verified YHR037W PUT2 1-pyrroline-5-carboxylate dehydrogenase chromosome 8 L000001536 8 181977 183704 W 24 2011-02-03 1996-07-31 Delta-1-pyrroline-5-carboxylate dehydrogenase; nuclear-encoded mitochondrial protein involved in utilization of proline as sole nitrogen source; deficiency of human homolog ALDH4A1 causes type II hyperprolinemia (HPII), an autosomal recessive inborn error of metabolism; human homolog ALDH4A1 can complement yeast null mutant +S000037908 CDS YHR037W 8 181977 183704 W 2011-02-03 1996-07-31 +S000001080 ORF Verified YHR038W RRF1 FIL1|KIM4 chromosome 8 L000004366 8 184066 184758 W 2011-02-03 1996-07-31 Mitochondrial ribosome recycling factor; essential for mitochondrial protein synthesis and for the maintenance of the respiratory function of mitochondria +S000030835 CDS YHR038W 8 184066 184758 W 2011-02-03 1996-07-31 +S000001081 ORF Verified YHR039C MSC7 meiotic recombination directing protein chromosome 8 8 186809 184875 C 2011-02-03 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum; msc7 mutants are defective in directing meiotic recombination events to homologous chromatids +S000030880 CDS YHR039C 8 186809 184875 C 2011-02-03 1996-07-31 +S000002100 ORF Verified YHR039C-A VMA10 H(+)-transporting V1 sector ATPase subunit G|YHR039BC|YHR039C-B chromosome 8 L000002954 8 187679 187173 C 2011-02-03 1996-07-31 Subunit G of the V1 peripheral membrane domain of V-ATPase; part of the electrogenic proton pump found throughout the endomembrane system; involved in vacuolar acidification; the V1 peripheral membrane domain of the vacuolar H+-ATPase (V-ATPase) has eight subunits +S000035240 CDS YHR039C-A 8 187514 187173 C 2011-02-03 1996-07-31 +S000035239 CDS YHR039C-A 8 187679 187677 C 2011-02-03 1996-07-31 +S000035241 intron YHR039C-A 8 187676 187515 C 2011-02-03 1996-07-31 +S000001082 ORF Verified YHR040W BCD1 chromosome 8 8 187924 189024 W 2011-02-03 1996-07-31 Essential protein required for the accumulation of box C/D snoRNA +S000031978 CDS YHR040W 8 187924 189024 W 2011-02-03 1996-07-31 +S000001083 ORF Verified YHR041C SRB2 MED20|HRS2 chromosome 8 L000002050|L000003586 8 189864 189131 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; general transcription factor involved in telomere maintenance +S000032051 CDS YHR041C 8 189749 189131 C 2011-02-03 1996-07-31 +S000032050 CDS YHR041C 8 189864 189851 C 2011-02-03 1996-07-31 +S000032052 intron YHR041C 8 189850 189750 C 2011-02-03 1996-07-31 +S000001084 ORF Verified YHR042W NCP1 CPR1 chromosome 8 L000001482 8 190543 192618 W 2011-02-03 1996-07-31 NADP-cytochrome P450 reductase; involved in ergosterol biosynthesis; associated and coordinately regulated with Erg11p +S000033000 CDS YHR042W 8 190543 192618 W 2011-02-03 1996-07-31 +S000001085 ORF Verified YHR043C DOG2 2-deoxyglucose-6-phosphatase chromosome 8 L000000516 8 193545 192805 C 2011-02-03 1996-07-31 2-deoxyglucose-6-phosphate phosphatase; member of a family of low molecular weight phosphatases, induced by oxidative and osmotic stress, confers 2-deoxyglucose resistance when overexpressed; DOG2 has a paralog, DOG1, that arose from a single-locus duplication; the last half of DOG1 and DOG2 are subject to gene conversions among S. cerevisiae, S. paradoxus, and S. mikatae +S000033060 CDS YHR043C 8 193545 192805 C 2011-02-03 1996-07-31 +S000001086 ORF Verified YHR044C DOG1 2-deoxyglucose-6-phosphatase chromosome 8 L000000515 8 194808 194068 C 2011-02-03 1996-07-31 2-deoxyglucose-6-phosphate phosphatase; member of a family of low molecular weight phosphatases; confers 2-deoxyglucose resistance when overexpressed; DOG1 has a paralog, DOG2, that arose from a single-locus duplication; the last half of DOG1 and DOG2 are subject to gene conversions among S. cerevisiae, S. paradoxus, and S. mikatae +S000033147 CDS YHR044C 8 194808 194068 C 2011-02-03 1996-07-31 +S000001087 ORF Uncharacterized YHR045W chromosome 8 8 195551 197233 W 2011-02-03 1996-07-31 Putative protein of unknown function; possible role in iron metabolism and/or amino acid and carbohydrate metabolism; green fluorescent protein (GFP)-fusion protein localizes to the endoplasmic reticulum +S000033998 CDS YHR045W 8 195551 197233 W 2011-02-03 1996-07-31 +S000001088 ORF Verified YHR046C INM1 inositol monophosphate 1-phosphatase INM1 chromosome 8 8 198285 197398 C 2011-02-03 1996-07-31 Inositol monophosphatase; involved in biosynthesis of inositol and in phosphoinositide second messenger signaling; INM1 expression increases in the presence of inositol and decreases upon exposure to antibipolar drugs lithium and valproate +S000034037 CDS YHR046C 8 198285 197398 C 2011-02-03 1996-07-31 +S000001089 ORF Verified YHR047C AAP1 arginine/alanine aminopeptidase|AAP1' chromosome 8 L000000006 8 201310 198740 C 2011-02-03 1996-07-31 Arginine/alanine amino peptidase; overproduction stimulates glycogen accumulation; AAP1 has a paralog, APE2, that arose from the whole genome duplication +S000034139 CDS YHR047C 8 201310 198740 C 2011-02-03 1996-07-31 +S000001090 ORF Uncharacterized YHR048W YHK8 chromosome 8 8 204607 206151 W 2011-02-03 1996-07-31 Presumed antiporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; expression of gene is up-regulated in cells exhibiting reduced susceptibility to azoles +S000035165 CDS YHR048W 8 204607 206151 W 2011-02-03 1996-07-31 +S000001091 ORF Verified YHR049W FSH1 putative serine hydrolase chromosome 8 8 206462 207193 W 2011-02-03 1996-07-31 Putative serine hydrolase; localizes to both the nucleus and cytoplasm; sequence is similar to S. cerevisiae Fsh2p and Fsh3p and the human candidate tumor suppressor OVCA2 +S000035291 CDS YHR049W 8 206462 207193 W 2011-02-03 1996-07-31 +S000003532 ORF Dubious YHR049C-A chromosome 8 8 207530 207234 C 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031834 CDS YHR049C-A 8 207530 207234 C 2011-02-03 1996-07-31|2011-02-03 +S000001092 ORF Verified YHR050W SMF2 divalent metal ion transporter SMF2 chromosome 8 L000001932|L000001870 8 207654 209303 W 2011-02-03 1996-07-31 Divalent metal ion transporter involved in manganese homeostasis; has broad specificity for di-valent and tri-valent metals; post-translationally regulated by levels of metal ions; member of the Nramp family of metal transport proteins +S000036147 CDS YHR050W 8 207654 209303 W 2011-02-03 1996-07-31 +S000028832 ORF Uncharacterized YHR050W-A chromosome 8 8 209475 209645 W 2011-02-03 2003-07-29 Protein of unknown function; identified by expression profiling and mass spectrometry +S000034482 CDS YHR050W-A 8 209475 209645 W 2011-02-03 2003-07-29 +S000001093 ORF Verified YHR051W COX6 cytochrome c oxidase subunit VI chromosome 8 L000000390 8 209705 210151 W 2011-02-03 1996-07-31 Subunit VI of cytochrome c oxidase (Complex IV); Complex IV is the terminal member of the mitochondrial inner membrane electron transport chain; expression is regulated by oxygen levels +S000029851 CDS YHR051W 8 209705 210151 W 2011-02-03 1996-07-31 +S000001094 ORF Verified YHR052W CIC1 NSA3 chromosome 8 8 210848 211978 W 2011-02-03 1996-07-31 Essential protein that interacts with proteasome components; has a potential role in proteasome substrate specificity; also copurifies with 66S pre-ribosomal particles +S000031769 CDS YHR052W 8 210848 211978 W 2011-02-03 1996-07-31 +S000028470 ncRNA_gene RUF5-1 RUF5-1 RUF5 chromosome 8 8 212409 213118 W 2011-02-03 2004-04-01 RNA of Unknown Function +S000030107 noncoding_exon RUF5-1 8 212409 213118 W 2011-02-03 2004-04-01 +S000028647 ORF Dubious YHR052W-A chromosome 8 8 212510 212704 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps CUP1-1 +S000032423 CDS YHR052W-A 8 212510 212704 W 2011-02-03 2003-07-29 +S000001095 ORF Verified YHR053C CUP1-1 metallothionein CUP1|CUP1 chromosome 8 L000000436 8 212720 212535 C 2011-02-03 1996-07-31 Metallothionein; binds copper and mediates resistance to high concentrations of copper and cadmium; locus is variably amplified in different strains, with two copies, CUP1-1 and CUP1-2, in the genomic sequence reference strain S288C; CUP1-1 has a paralog, CUP1-2, that arose from a segmental duplication +S000031831 CDS YHR053C 8 212720 212535 C 2011-02-03 1996-07-31 +S000130147 ARS ARS810 chromosome 8 8 212720 213185 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001096 ORF Uncharacterized YHR054C chromosome 8 8 214249 213185 C 2011-02-03 1996-07-31 Putative protein of unknown function; partial duplicate of RSC30/YHR056C, truncated remnant of segmental duplication +S000031964 CDS YHR054C 8 214249 213185 C 2011-02-03 1996-07-31 +S000028474 ncRNA_gene RUF5-2 RUF5-2 RUF5 chromosome 8 8 214407 215116 W 2011-02-03 2004-04-01 RNA of Unknown Function +S000030115 noncoding_exon RUF5-2 8 214407 215116 W 2011-02-03 2004-04-01 +S000028648 ORF Dubious YHR054W-A chromosome 8 8 214508 214702 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps CUP1-2 +S000032424 CDS YHR054W-A 8 214508 214702 W 2011-02-03 2003-07-29 +S000001097 ORF Verified YHR055C CUP1-2 metallothionein CUP1|CUP1 chromosome 8 8 214718 214533 C 2011-02-03 1996-07-31 Metallothionein; binds copper and mediates resistance to high concentrations of copper and cadmium; locus is variably amplified in different strains, with two copies, CUP1-1 and CUP1-2, in the genomic sequence reference strain S288C; CUP1-2 has a paralog, CUP1-1, that arose from a segmental duplication +S000037453 CDS YHR055C 8 214718 214533 C 2011-02-03 1996-07-31 +S000130148 ARS ARS811 chromosome 8 8 214718 215183 2011-02-03 2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028777 ORF Dubious YHR056W-A chromosome 8 8 217406 217840 W 2011-02-03 2004-01-29|2011-02-03|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps ORF RSC30/YHR056C +S000033500 CDS YHR056W-A 8 217406 217840 W 2011-02-03 2004-01-29|2003-07-29|2011-02-03 +S000001098 ORF Verified YHR056C RSC30 chromosome 8 8 217834 215183 C 2011-02-03 2004-01-29|1996-07-31|2011-02-03 Component of the RSC chromatin remodeling complex; non-essential gene required for regulation of ribosomal protein genes and the cell wall/stress response; null mutants are osmosensitive; RSC30 has a paralog, RSC3, that arose from the whole genome duplication +S000037529 CDS YHR056C 8 217834 215183 C 2011-02-03 2004-01-29|1996-07-31|2011-02-03 +S000001099 ORF Verified YHR057C CPR2 peptidylprolyl isomerase CPR2|CYP2 chromosome 8 L000000463 8 218843 218226 C 2011-02-03 1996-07-31 Peptidyl-prolyl cis-trans isomerase (cyclophilin); catalyzes the cis-trans isomerization of peptide bonds N-terminal to proline residues; potential role in the secretory pathway; seamless-GFP and mCherry fusion proteins localize to the vacuole, while SWAT-GFP fusion localizes to both the endoplasmic reticulum and vacuole; suppresses toxicity of slow-folding human Z-type alpha1-antitrypsin variant associated with liver cirrhosis and emphysema +S000037607 CDS YHR057C 8 218843 218226 C 2011-02-03 1996-07-31 +S000001100 ORF Verified YHR058C MED6 mediator complex subunit MED6 chromosome 8 L000003569 8 219884 218997 C 2011-02-03 1996-07-31 Subunit of the RNA polymerase II mediator complex; associates with core polymerase subunits to form the RNA polymerase II holoenzyme; essential for transcriptional regulation; protein abundance increases in response to DNA replication stress +S000037687 CDS YHR058C 8 219884 218997 C 2011-02-03 1996-07-31 +S000001101 ORF Verified YHR059W FYV4 chromosome 8 8 220108 220500 W 2011-02-03 1996-07-31 Protein of unknown function; required for survival upon exposure to K1 killer toxin +S000030557 CDS YHR059W 8 220108 220500 W 2011-02-03 1996-07-31 +S000001102 ORF Verified YHR060W VMA22 VPH6|CEV1 chromosome 8 L000002789 8 220725 221270 W 2011-02-03 1996-07-31 Protein that is required for vacuolar H+-ATPase (V-ATPase) function; peripheral membrane protein; not an actual component of the V-ATPase complex; functions in the assembly of the V-ATPase; localized to the yeast endoplasmic reticulum (ER) +S000029986 CDS YHR060W 8 220725 221270 W 2011-02-03 1996-07-31 +S000001103 ORF Verified YHR061C GIC1 chromosome 8 L000003313 8 222478 221534 C 2011-02-03 1996-07-31 Protein involved in initiation of budding and cellular polarization; interacts with Cdc42p via the Cdc42/Rac-interactive binding (CRIB) domain; relocalizes from bud neck to nucleus upon DNA replication stress; GIC1 has a paralog, GIC2, that arose from the whole genome duplication +S000030028 CDS YHR061C 8 222478 221534 C 2011-02-03 1996-07-31 +S000001104 ORF Verified YHR062C RPP1 RNA-binding RNA processing protein RPP1 chromosome 8 L000004007 8 223758 222877 C 2011-02-03 1996-07-31 Subunit of both RNase MRP and nuclear RNase P; RNase MRP cleaves pre-rRNA, while nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; relocalizes to the cytosol in response to hypoxia +S000030103 CDS YHR062C 8 223758 222877 C 2011-02-03 1996-07-31 +S000001105 ORF Verified YHR063C PAN5 2-dehydropantoate 2-reductase PAN5 chromosome 8 8 225169 224030 C 2011-02-03 1996-07-31 2-dehydropantoate 2-reductase; part of the pantothenic acid pathway, structurally homologous to E. coli panE +S000030303 CDS YHR063C 8 225169 224030 C 2011-02-03 1996-07-31 +S000028778 ORF Dubious YHR063W-A chromosome 8 8 225442 225777 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SSZ1/YHR064C +S000033501 CDS YHR063W-A 8 225442 225777 W 2011-02-03 2003-07-29 +S000001106 ORF Verified YHR064C SSZ1 PDR13 chromosome 8 L000004029 8 227141 225525 C 2011-02-03 2003-09-22|1996-07-31 Hsp70 protein that interacts with Zuo1p (a DnaJ homolog); interacts with Zuo1p to form a ribosome-associated complex that binds the ribosome via the Zuo1p subunit; also involved in pleiotropic drug resistance via sequential activation of PDR1 and PDR5; binds ATP +S000030385 CDS YHR064C 8 227141 225525 C 2011-02-03 2003-09-22|1996-07-31 +S000001107 ORF Verified YHR065C RRP3 RNA-dependent ATPase RRP3 chromosome 8 L000004225 8 229037 227532 C 2011-02-03 2003-09-22|1996-07-31 Protein involved in rRNA processing; required for maturation of the 35S primary transcript of pre-rRNA and for cleavage leading to mature 18S rRNA; homologous to eIF-4a, which is a DEAD box RNA-dependent ATPase with helicase activity +S000033722 CDS YHR065C 8 229037 227532 C 2011-02-03 2003-09-22|1996-07-31 +S000001108 ORF Verified YHR066W SSF1 rRNA-binding ribosome biosynthesis protein chromosome 8 L000002080 8 229335 230696 W 2011-02-03 1996-07-31 Constituent of 66S pre-ribosomal particles; required for ribosomal large subunit maturation; functionally redundant with Ssf2p; member of the Brix family; SSF1 has a paralog, SSF2, that arose from the whole genome duplication +S000033935 CDS YHR066W 8 229335 230696 W 2011-02-03 1996-07-31 +S000001109 ORF Verified YHR067W HTD2 hydroxyacyl-thioester dehydratase HTD2|RMD12 chromosome 8 8 230970 231812 W 2011-02-03 1996-07-31 Mitochondrial 3-hydroxyacyl-thioester dehydratase; involved in fatty acid biosynthesis, required for respiratory growth and for normal mitochondrial morphology +S000034794 CDS YHR067W 8 230970 231812 W 2011-02-03 1996-07-31 +S000001110 ORF Verified YHR068W DYS1 deoxyhypusine synthase chromosome 8 L000003346 8 232133 233296 W 2011-02-03 1996-07-31 Deoxyhypusine synthase; catalyzes formation of deoxyhypusine, the first step in hypusine biosynthesis; triggers posttranslational hypusination of translation elongation factor eIF-5A and regulates its intracellular levels; tetrameric; human homolog DHPS allows growth of yeast haploid dys1 null mutant after sporulation of heterozygous diploid +S000034934 CDS YHR068W 8 232133 233296 W 2011-02-03 1996-07-31 +S000001111 ORF Verified YHR069C RRP4 exosome non-catalytic core subunit RRP4 chromosome 8 L000003549 8 234658 233579 C 2011-02-03 1996-07-31 Exosome non-catalytic core component; involved in 3'-5' RNA processing and degradation in both the nucleus and the cytoplasm; predicted to contain RNA binding domains; has similarity to human hRrp4p (EXOSC2) +S000034980 CDS YHR069C 8 234658 233579 C 2011-02-03 1996-07-31 +S000001112 ORF Verified YHR070W TRM5 tRNA (guanine) methyltransferase chromosome 8 8 234881 236380 W 2011-02-03 1996-07-31 tRNA(m(1)G37)methyltransferase; methylates a tRNA base adjacent to the anticodon that has a role in prevention of frameshifting; localized to both cytoplasm and mitochondria, and modifies both cytoplasmic and mitochondrial tRNAs; mutations in human ortholog TRMT5 are associated with skeletal muscle respiratory chain deficiencies, and trm5 mutations analogous to disease mutations decrease respiration +S000034511 CDS YHR070W 8 234881 236380 W 2011-02-03 1996-07-31 +S000028779 ORF Dubious YHR069C-A chromosome 8 8 235236 234874 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps ORF TRM5/YHR070W +S000033503 CDS YHR069C-A 8 235236 234874 C 2011-02-03 2003-07-29 +S000028780 ORF Dubious YHR070C-A chromosome 8 8 236512 236102 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene TRM5/YHR070W +S000033520 CDS YHR070C-A 8 236512 236102 C 2011-02-03 2003-07-29 +S000001113 ORF Verified YHR071W PCL5 chromosome 8 L000004037 8 237004 237693 W 2011-02-03 1996-07-31 Cyclin; interacts with and phosphorylated by Pho85p cyclin-dependent kinase (Cdk), induced by Gcn4p at level of transcription, specifically required for Gcn4p degradation, may be sensor of cellular protein biosynthetic capacity +S000034608 CDS YHR071W 8 237004 237693 W 2011-02-03 1996-07-31 +S000006566 tRNA_gene tF(GAA)H1 chromosome 8 L000003861 8 237939 237848 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000032801 intron tF(GAA)H1 8 237902 237884 C 2011-02-03 2000-05-19 +S000032800 noncoding_exon tF(GAA)H1 8 237883 237848 C 2011-02-03 2000-05-19 +S000032799 noncoding_exon tF(GAA)H1 8 237939 237903 C 2011-02-03 2000-05-19 +S000001114 ORF Verified YHR072W ERG7 lanosterol synthase ERG7 chromosome 8 L000000573 8 239098 241293 W 2011-02-03 1996-07-31|2011-02-03 Lanosterol synthase; an essential enzyme that catalyzes the cyclization of squalene 2,3-epoxide, a step in ergosterol biosynthesis; human LSS functionally complements the lethality of the erg7 null mutation +S000034721 CDS YHR072W 8 239098 241293 W 2011-02-03 1996-07-31|2011-02-03 +S000028781 ORF Dubious YHR071C-A chromosome 8 8 239230 238910 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the verified ORF ERG7/YHR072W +S000033521 CDS YHR071C-A 8 239230 238910 C 2011-02-03 2003-07-29 +S000007455 ORF Verified YHR072W-A NOP10 snoRNP complex protein NOP10 chromosome 8 8 241664 241840 W 2011-02-03 2000-12-01 Subunit of box H/ACA snoRNP complex; required for pseudouridylation and processing of pre-18S rRNA +S000036439 CDS YHR072W-A 8 241664 241840 W 2011-02-03 2000-12-01 +S000001115 ORF Verified YHR073W OSH3 oxysterol-binding protein related protein OSH3 chromosome 8 8 242582 245572 W 2011-02-03 1996-07-31 Member of an oxysterol-binding protein family; this family has seven members in S. cerevisiae; family members have overlapping, redundant functions in sterol metabolism and collectively perform a function essential for viability; contains FFAT motif; interacts with ER anchor Scs2p at patches at the plasma membrane; regulated by sterol binding +S000035693 CDS YHR073W 8 242582 245572 W 2011-02-03 1996-07-31 +S000028834 ORF Dubious YHR073W-A chromosome 8 8 242868 243044 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF YHR073W; identified by expression profiling and mass spectrometry +S000034484 CDS YHR073W-A 8 242868 243044 W 2011-02-03 2003-07-29 +S000028833 ORF Dubious YHR073C-B chromosome 8 8 245502 245422 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF YHR073W; identified by expression profiling and mass spectrometry +S000034483 CDS YHR073C-B 8 245502 245422 C 2011-02-03 2003-07-29 +S000118359 ARS ARS813 ARSVIII-246 chromosome 8 8 245773 245847 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178108 ARS_consensus_sequence ARS813 8 245789 245805 W 2014-11-18 2014-11-18 +S000001116 ORF Verified YHR074W QNS1 glutamine-dependent NAD(+) synthetase chromosome 8 S000007569 8 246193 248337 W 2011-02-03 1996-07-31 Glutamine-dependent NAD(+) synthetase; essential for the formation of NAD(+) from nicotinic acid adenine dinucleotide +S000035833 CDS YHR074W 8 246193 248337 W 2011-02-03 1996-07-31 +S000001117 ORF Verified YHR075C PPE1 carboxylesterase-mitochondrial 37S ribosomal protein YmS2|YmS2|MRPS2 chromosome 8 8 249641 248439 C 2011-02-03 1996-07-31 Protein with carboxyl methyl esterase activity; may have a role in demethylation of the phosphoprotein phosphatase catalytic subunit; also identified as a small subunit mitochondrial ribosomal protein +S000035876 CDS YHR075C 8 249641 248439 C 2011-02-03 1996-07-31 +S000001118 ORF Verified YHR076W PTC7 type 2C protein phosphatase PTC7 chromosome 8 8 251101 252225 W 2011-02-03 1996-07-31|2007-07-09 Type 2C serine/threonine protein phosphatase (PP2C); alternatively spliced to create two mRNA isoforms; protein from spliced form localizes to the mitochondria while the one from the unspliced form is localized to the nuclear envelope; activates coenzyme Q6 biosynthesis by dephosphorylation of demethoxy-Q6 hydroxylase Coq7p +S000037820 CDS YHR076W 8 251101 251155 W 2011-02-03 1996-07-31|2007-07-09 +S000123271 CDS YHR076W 8 251249 252225 W 2011-02-03 2007-07-09 +S000123270 intron YHR076W 8 251156 251248 W 2011-02-03 2007-07-09 +S000001119 ORF Verified YHR077C NMD2 SUP111|UPF2|SUA1|IFS1 chromosome 8 L000001257|S000029548|L000002230 8 255756 252374 C 51 2011-02-03 1999-11-17|1996-07-31 Protein involved in the nonsense-mediated mRNA decay (NMD) pathway; interacts with Nam7p and Upf3p; involved in telomere maintenance +S000037864 CDS YHR077C 8 255637 252374 C 2011-02-03 1999-11-17 +S000037863 CDS YHR077C 8 255756 255751 C 2011-02-03 1999-11-17|1996-07-31 +S000037865 intron YHR077C 8 255750 255638 C 2011-02-03 1999-11-17 +S000001120 ORF Uncharacterized YHR078W chromosome 8 8 256360 258018 W 2011-02-03 1996-07-31 High osmolarity-regulated gene of unknown function +S000029926 CDS YHR078W 8 256360 258018 W 2011-02-03 1996-07-31 +S000001121 ORF Verified YHR079C IRE1 bifunctional endoribonuclease/protein kinase IRE1|ERN1 chromosome 8 L000000875 8 261591 258244 C 2011-02-03 1996-07-31 Serine-threonine kinase and endoribonuclease; transmembrane protein that mediates the unfolded protein response (UPR) by regulating Hac1p synthesis through HAC1 mRNA splicing; role in homeostatic adaptation to ER stress; Kar2p binds inactive Ire1p and releases from it upon ER stress +S000029980 CDS YHR079C 8 261591 258244 C 2011-02-03 1996-07-31 +S000001957 ORF Verified YHR079C-A SAE3 YHR079BC|YHR079C-B chromosome 8 L000002893 8 262553 262192 C 2011-02-03 1996-07-31|2005-11-03 Meiosis-specific protein involved in meiotic recombination; involved in DMC1-dependent meiotic recombination; forms heterodimer with Mei5p; proposed to be an assembly factor for Dmc1p +S000087058 CDS YHR079C-A 8 262354 262192 C 2011-02-03 2005-11-03 +S000034792 CDS YHR079C-A 8 262553 262441 C 2011-02-03 1996-07-31|2005-11-03 +S000087057 intron YHR079C-A 8 262440 262355 C 2011-02-03 2005-11-03 +S000001122 ORF Verified YHR080C LAM4 LTC3 chromosome 8 8 266838 262801 C 2011-02-03 1996-07-31 Sterol-binding protein that localizes to puncta in the cortical ER; sterol binding occurs via two StART-like domains; one of six StART-like domain-containing proteins in yeast that may be involved in intracellular sterol transfer between membranes; conserved across eukaryotes; has both GRAM and StART-like (VASt) domains; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies +S000037712 CDS YHR080C 8 266838 262801 C 2011-02-03 1996-07-31 +S000001123 ORF Verified YHR081W LRP1 RRP47|YC1D chromosome 8 8 267538 268092 W 2011-02-03 1996-07-31 Nuclear exosome-associated nucleic acid binding protein; involved in RNA processing, surveillance, degradation, tethering, and export; forms a stable heterodimer with Rrp6p and regulates its exonucleolytic activity; rapidly degraded by the proteasome in the absence of Rrp6p; homolog of mammalian nuclear matrix protein C1D involved in regulation of DNA repair and recombination +S000030578 CDS YHR081W 8 267538 268092 W 2011-02-03 1996-07-31 +S000001124 ORF Verified YHR082C KSP1 putative serine/threonine protein kinase KSP1 chromosome 8 L000000921 8 271548 268459 C 2011-02-03 1996-07-31 Serine/threonine protein kinase; associates with TORC1 and likely involved in TOR signaling cascades; negative regulator of autophagy; nuclear translocation required for haploid filamentous growth; regulates filamentous growth induced nuclear translocation of Bcy1p, Fus3p, and Sks1p; overproduction causes allele-specific suppression of prp20-10; protein abundance increases in response to DNA replication stress +S000030628 CDS YHR082C 8 271548 268459 C 2011-02-03 1996-07-31 +S000001125 ORF Verified YHR083W SAM35 SAM complex subunit SAM35|TOM38|TOB38|FMP20 chromosome 8 8 272627 273616 W 2011-02-03 1996-07-31 Component of the sorting and assembly machinery (SAM) complex; the SAM (or TOB) complex is located in the mitochondrial outer membrane; the complex binds precursors of beta-barrel proteins and facilitates their insertion into the outer membrane +S000030804 CDS YHR083W 8 272627 273616 W 2011-02-03 1996-07-31 +S000001126 ORF Verified YHR084W STE12 homeodomain family transcription factor STE12 chromosome 8 L000002119 8 274174 276240 W 65.64 2011-02-03 1996-07-31 Transcription factor that is activated by a MAPK signaling cascade; activates genes involved in mating or pseudohyphal/invasive growth pathways; cooperates with Tec1p transcription factor to regulate genes specific for invasive growth +S000030898 CDS YHR084W 8 274174 276240 W 2011-02-03 1996-07-31 +S000001127 ORF Verified YHR085W IPI1 chromosome 8 8 276764 277768 W 2011-02-03 1996-07-31 Component of the Rix1 complex and possibly pre-replicative complexes; required for processing of ITS2 sequences from 35S pre-rRNA; component of the pre-60S ribosomal particle with the dynein-related AAA-type ATPase Mdn1p; required for pre-replicative complex (pre-RC) formation and maintenance during DNA replication licensing; relocalizes to the cytosol in response to hypoxia; essential gene +S000031899 CDS YHR085W 8 276764 277768 W 2011-02-03 1996-07-31 +S000001128 ORF Verified YHR086W NAM8 MUD15|MRE2 chromosome 8 L000001147|L000001230 8 278153 279724 W 2011-02-03 1996-07-31 RNA binding protein, component of the U1 snRNP protein; mutants are defective in meiotic recombination and in formation of viable spores, involved in the formation of DSBs through meiosis-specific splicing of REC107 pre-mRNA; Nam8p regulon embraces the meiotic pre-mRNAs of REC107, HFM1, AMA1 SPO22 and PCH2; the putative RNA binding domains RRM2 and RRM3 are required for Nam8p meiotic function +S000032027 CDS YHR086W 8 278153 279724 W 2011-02-03 1996-07-31 +S000028552 ORF Uncharacterized YHR086W-A chromosome 8 8 280231 280392 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR; SWAT-GFP and mCherry fusion proteins localize to the endoplasmic reticulum and vacuole respectively +S000031238 CDS YHR086W-A 8 280231 280392 W 2011-02-03 2003-07-29 +S000001129 ORF Verified YHR087W RTC3 HGI1 chromosome 8 8 280820 281155 W 2011-02-03 1996-07-31 Protein of unknown function involved in RNA metabolism; has structural similarity to SBDS, the human protein mutated in Shwachman-Diamond Syndrome (the yeast SBDS ortholog = SDO1); null mutation suppresses cdc13-1 temperature sensitivity; protein abundance increases in response to DNA replication stress +S000032137 CDS YHR087W 8 280820 281155 W 2011-02-03 1996-07-31 +S000001130 ORF Verified YHR088W RPF1 rRNA-binding ribosome biosynthesis protein RPF1 chromosome 8 8 281495 282382 W 2011-02-03 1996-07-31 Protein involved in assembly and export of the large ribosomal subunit; nucleolar protein; constituent of 66S pre-ribosomal particles; contains a sigma(70)-like motif, which is thought to bind RNA +S000034136 CDS YHR088W 8 281495 282382 W 2011-02-03 1996-07-31 +S000001131 ORF Verified YHR089C GAR1 H/ACA snoRNP pseudouridylase subunit GAR1 chromosome 8 L000000668 8 283298 282681 C 2011-02-03 1996-07-31 Protein component of the H/ACA snoRNP pseudouridylase complex; involved in the modification and cleavage of the 18S pre-rRNA +S000034183 CDS YHR089C 8 283298 282681 C 2011-02-03 1996-07-31 +S000001132 ORF Verified YHR090C YNG2 histone acetyltransferase YNG2|EAF4|NBN1 chromosome 8 L000004452 8 284625 283777 C 2011-02-03 1996-07-31 Subunit of NuA4, an essential histone acetyltransferase complex; positions Piccolo NuA4 for efficient acetylation of histone H4 or histone H2A; relocalizes to the cytosol in response to hypoxia; similar to human tumor suppressor ING1 and its isoforms ING4 and ING5 +S000033033 CDS YHR090C 8 284625 283777 C 2011-02-03 1996-07-31 +S000001133 ORF Verified YHR091C MSR1 arginine--tRNA ligase MSR1 chromosome 8 L000002618 8 286770 284839 C 2011-02-03 1996-07-31 Mitochondrial arginyl-tRNA synthetase; mutations in human ortholog are associated with pontocerebellar hypoplasia type 6; MSR1 has a paralog, YDR341C, that arose from the whole genome duplication +S000033677 CDS YHR091C 8 286770 284839 C 2011-02-03 1996-07-31 +S000130149 ARS ARS814 chromosome 8 8 286770 287128 2011-02-03 2009-05-06|2011-02-03 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001134 ORF Verified YHR092C HXT4 hexose transporter HXT4|RAG1|LGT1 chromosome 8 L000000838 8 288811 287081 C 2011-02-03 1996-07-31|2011-02-03 High-affinity glucose transporter; member of the major facilitator superfamily, expression is induced by low levels of glucose and repressed by high levels of glucose; HXT4 has a paralog, HXT7, that arose from the whole genome duplication +S000033772 CDS YHR092C 8 288811 287081 C 2011-02-03 1996-07-31|2011-02-03 +S000001135 ORF Dubious YHR093W AHT1 chromosome 8 L000000065 8 289142 289690 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; not conserved in closely related Saccharomyces species; multicopy suppressor of glucose transport defects, likely due to the presence of an HXT4 regulatory element in the region +S000033970 CDS YHR093W 8 289142 289690 W 2011-02-03 1996-07-31 +S000001136 ORF Verified YHR094C HXT1 hexose transporter HXT1|HOR4 chromosome 8 L000000835 8 292625 290913 C 66.54 2011-02-03 1996-07-31 Low-affinity glucose transporter of the major facilitator superfamily; expression is induced by Hxk2p in the presence of glucose and repressed by Rgt1p when glucose is limiting; HXT1 has a paralog, HXT6, what arose from the whole genome duplication +S000034018 CDS YHR094C 8 292625 290913 C 2011-02-03 1996-07-31 +S000001137 ORF Dubious YHR095W chromosome 8 8 292943 293437 W 2011-02-03 1996-07-31|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035020 CDS YHR095W 8 292943 293437 W 2011-02-03 1996-07-31|2011-02-03 +S000001138 ORF Verified YHR096C HXT5 hexose transporter HXT5 chromosome 8 L000000839 8 296447 294669 C 2011-02-03 1996-07-31 Hexose transporter with moderate affinity for glucose; induced in the presence of non-fermentable carbon sources, induced by a decrease in growth rate, contains an extended N-terminal domain relative to other HXTs; HXT5 has a paralog, HXT3, that arose from the whole genome duplication +S000035072 CDS YHR096C 8 296447 294669 C 2011-02-03 1996-07-31 +S000130150 ARS ARS815 chromosome 8 8 297060 297179 2014-11-18 2014-11-18|2009-05-06 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001139 ORF Uncharacterized YHR097C chromosome 8 8 298609 297385 C 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and the nucleus; YHR097C has a paralog, PAL1, that arose from the whole genome duplication +S000035267 CDS YHR097C 8 298360 297385 C 2011-02-03 1996-07-31 +S000035266 CDS YHR097C 8 298609 298485 C 2011-02-03 1996-07-31 +S000035268 intron YHR097C 8 298484 298361 C 2011-02-03 1996-07-31 +S000001140 ORF Verified YHR098C SFB3 LST1 chromosome 8 L000004659 8 301934 299145 C 2011-02-03 1996-07-31 Component of the Sec23p-Sfb3p heterodimer of the COPII vesicle coat; COPII coat is required for cargo selection during vesicle formation in ER to Golgi transport; scaffolding function of Lst1p required to generate vesicles that can accommodate difficult cargo proteins that include large oligomeric assemblies and asymmetrically distributed membrane proteins; homologous to Sec24p and Sfb2p +S000036156 CDS YHR098C 8 301934 299145 C 2011-02-03 1996-07-31 +S000001141 ORF Verified YHR099W TRA1 histone acetyltransferase TRA1 chromosome 8 L000003945 8 302761 313995 W 2011-02-03 1996-07-31 Subunit of SAGA and NuA4 histone acetyltransferase complexes; interacts with acidic activators (e.g., Gal4p) which leads to transcription activation; similar to human TRRAP, which is a cofactor for c-Myc mediated oncogenic transformation +S000036322 CDS YHR099W 8 302761 313995 W 2011-02-03 1996-07-31 +S000001142 ORF Verified YHR100C GEP4 phosphatidylglycerophosphatase chromosome 8 8 314673 314116 C 2011-02-03 1996-07-31 Mitochondrial phosphatidylglycerophosphatase (PGP phosphatase); dephosphorylates phosphatidylglycerolphosphate to generate phosphatidylglycerol, an essential step during cardiolipin biosynthesis; null mutant is sensitive to tunicamycin, DTT +S000034711 CDS YHR100C 8 314673 314116 C 2011-02-03 1996-07-31 +S000001143 ORF Verified YHR101C BIG1 chromosome 8 L000003416 8 315968 314874 C 2011-02-03 1996-07-31 Integral membrane protein of the endoplasmic reticulum; required for normal content of cell wall beta-1,6-glucan +S000035670 CDS YHR101C 8 315771 314874 C 2011-02-03 1996-07-31 +S000035669 CDS YHR101C 8 315968 315859 C 2011-02-03 1996-07-31 +S000035671 intron YHR101C 8 315858 315772 C 2011-02-03 1996-07-31 +S000001144 ORF Verified YHR102W KIC1 putative serine/threonine protein kinase KIC1|NRK1 chromosome 8 L000001276 8 316572 319814 W 2011-02-03 1996-07-31 Protein kinase of the PAK/Ste20 family, required for cell integrity; physically interacts with Cdc31p (centrin), which is a component of the spindle pole body; part of the RAM network that regulates cellular polarity and morphogenesis +S000035759 CDS YHR102W 8 316572 319814 W 2011-02-03 1996-07-31 +S000001145 ORF Verified YHR103W SBE22 chromosome 8 L000003101 8 320414 322972 W 2011-02-03 1996-07-31 Protein involved in bud growth; involved in the transport of cell wall components from the Golgi to the cell surface; similar in structure and functionally redundant with Sbe2p; SBE22 has a paralog, SBE2, that arose from the whole genome duplication +S000035866 CDS YHR103W 8 320414 322972 W 2011-02-03 1996-07-31 +S000001146 ORF Verified YHR104W GRE3 trifunctional aldehyde reductase/xylose reductase/glucose 1-dehydrogenase (NADP(+)) chromosome 8 L000004178 8 323409 324392 W 2011-02-03 1996-07-31 Aldose reductase; involved in methylglyoxal, d-xylose, arabinose, and galactose metabolism; stress induced (osmotic, ionic, oxidative, heat shock, starvation and heavy metals); regulated by the HOG pathway; protein abundance increases in response to DNA replication stress +S000036784 CDS YHR104W 8 323409 324392 W 2011-02-03 1996-07-31 +S000001147 ORF Verified YHR105W YPT35 chromosome 8 8 324766 325410 W 2011-02-03 1996-07-31 Endosomal protein of unknown function; contains a phox (PX) homology domain; binds to both phosphatidylinositol-3-phosphate (PtdIns(3)P) and proteins involved in ER-Golgi or vesicular transport +S000036859 CDS YHR105W 8 324766 325410 W 2011-02-03 1996-07-31 +S000001148 ORF Verified YHR106W TRR2 thioredoxin-disulfide reductase TRR2 chromosome 8 L000003954 8 325598 326626 W 2011-02-03 1996-07-31 Mitochondrial thioredoxin reductase; involved in protection against oxidative stress, required with Glr1p to maintain the redox state of Trx3p; contains active-site motif (CAVC) present in prokaryotic orthologs; binds NADPH and FAD; TRR2 has a paralog, TRR1, that arose from the whole genome duplication +S000036915 CDS YHR106W 8 325598 326626 W 2011-02-03 1996-07-31 +S000001149 ORF Verified YHR107C CDC12 septin CDC12|PSL7|CLA10 chromosome 8 L000000348|L000000252 8 328036 326813 C 68.14 2011-02-03 1996-07-31 Component of the septin ring that is required for cytokinesis; septins are GTP-binding proteins that assemble into rod-like hetero-oligomers that can associate with other rods to form filaments; septin rings at the mother-bud neck act as scaffolds for recruiting cell division factors and as barriers to prevent diffusion of specific proteins between mother and daughter cells +S000036947 CDS YHR107C 8 328036 326813 C 2011-02-03 1996-07-31 +S000001150 ORF Verified YHR108W GGA2 phosphatidylinositol 4-phosphate-binding protein chromosome 8 S000007494 8 328303 330060 W 2011-02-03 1996-07-31 Protein that regulates Arf1p, Arf2p to facilitate Golgi trafficking; binds phosphatidylinositol 4-phosphate, which plays a role in TGN localization; has homology to gamma-adaptin; GGA2 has a paralog, GGA1, that arose from the whole genome duplication +S000037727 CDS YHR108W 8 328303 330060 W 2011-02-03 1996-07-31 +S000001151 ORF Verified YHR109W CTM1 cytochrome c lysine N-methyltransferase chromosome 8 S000007504 8 330310 332067 W 2011-02-03 1996-07-31 Cytochrome c lysine methyltransferase; trimethylates residue 72 of apo-cytochrome c (Cyc1p) in the cytosol; not required for normal respiratory growth +S000037814 CDS YHR109W 8 330310 332067 W 2011-02-03 1996-07-31 +S000001152 ORF Verified YHR110W ERP5 chromosome 8 L000004682 8 332282 332920 W 2011-02-03 1996-07-31 Protein with similarity to Emp24p and Erv25p; member of the p24 family involved in ER to Golgi transport +S000030739 CDS YHR110W 8 332282 332920 W 2011-02-03 1996-07-31 +S000001153 ORF Verified YHR111W UBA4 YHR1 chromosome 8 8 333072 334394 W 2011-02-03 1996-07-31 E1-like protein that activates Urm1p before urmylation; also acts in thiolation of the wobble base of cytoplasmic tRNAs by adenylating and then thiolating Urm1p; receives sulfur from Tum1p +S000030847 CDS YHR111W 8 333072 334394 W 2011-02-03 1996-07-31 +S000001154 ORF Verified YHR112C putative cystathionine beta-lyase chromosome 8 8 335663 334527 C 2011-02-03 1996-07-31 Protein of unknown function; localizes to the cytoplasm and nucleus; overexpression affects protein trafficking through the endocytic pathway +S000031735 CDS YHR112C 8 335663 334527 C 2011-02-03 1996-07-31 +S000001155 ORF Verified YHR113W APE4 aspartyl aminopeptidase chromosome 8 8 336337 337809 W 2011-02-03 1996-07-31 Cytoplasmic aspartyl aminopeptidase with possible vacuole function; Cvt pathway cargo protein; cleaves unblocked N-terminal acidic amino acids from peptide substrates; forms a 12-subunit homo-oligomer; M18 metalloprotease family +S000031980 CDS YHR113W 8 336337 337809 W 2011-02-03 1996-07-31 +S000001156 ORF Verified YHR114W BZZ1 LSB7 chromosome 8 8 338083 339984 W 2011-02-03 1996-07-31 SH3 domain protein implicated in regulating actin polymerization; able to recruit actin polymerization machinery through its SH3 domains; colocalizes with cortical actin patches and Las17p; interacts with type I myosins +S000032098 CDS YHR114W 8 338083 339984 W 2011-02-03 1996-07-31 +S000001157 ORF Verified YHR115C DMA1 ubiquitin-conjugating protein DMA1|CHF1 chromosome 8 S000029719 8 341359 340109 C 2011-02-03 1996-07-31 Ubiquitin-protein ligase (E3); controls septin dynamics, spindle position checkpoint (SPOC) with ligase Dma2p by regulating recruitment of Elm1p to bud neck; regulates levels of eIF2 subunit Gcd11p, as well as abundance, localization, and ubiquitination of Cdk inhibitory kinase Swe1p; ubiquitinates cyclin Pcl1p; ortholog of human RNF8, similar to human Chfr; contains FHA, RING fingers; DMA1 has a paralog, DMA2, that arose from the whole genome duplication +S000032967 CDS YHR115C 8 341359 340109 C 2011-02-03 1996-07-31 +S000001158 ORF Verified YHR116W COX23 chromosome 8 8 341665 342120 W 2011-02-03 1996-07-31 Protein that functions in mitochondrial copper homeostasis; mitochondrial intermembrane space protein; essential for functional cytochrome oxidase expression; homologous to Cox17p; contains twin cysteine-x9-cysteine motifs +S000033114 CDS YHR116W 8 341665 342120 W 2011-02-03 1996-07-31 +S000001159 ORF Verified YHR117W TOM71 protein channel TOM71|TOM72 chromosome 8 L000003252 8 342349 344268 W 2011-02-03 1996-07-31 Mitochondrial outer membrane protein; probable minor component of the TOM (translocase of outer membrane) complex responsible for recognition and import of mitochondrially directed proteins; TOM71 has a paralog, TOM70, that arose from the whole genome duplication +S000033188 CDS YHR117W 8 342349 344268 W 2011-02-03 1996-07-31 +S000001160 ORF Verified YHR118C ORC6 origin recognition complex subunit 6 chromosome 8 L000001306 8 345628 344321 C 2011-02-03 1996-07-31 Subunit of the origin recognition complex (ORC); ORC directs DNA replication by binding to replication origins and is also involved in transcriptional silencing; phosphorylated by Cdc28p; mutation in the human Orc6p is linked to Meier-Gorlin syndrome +S000033913 CDS YHR118C 8 345628 344321 C 2011-02-03 1996-07-31 +S000001161 ORF Verified YHR119W SET1 histone methyltransferase SET1|KMT2|YTX1 chromosome 8 L000003286 8 346043 349285 W 2011-02-03 1996-07-31 Histone methyltransferase, subunit of the COMPASS (Set1C) complex; COMPASS methylates histone H3K4; Set1p-dependent H3K4 trimethylation recruits Nrd1p, allowing efficient termination of snoRNAs and cryptic unstable transcripts (CUTs) by Nrd1p-Nab3p-Sen1p pathway; modulates histone acetylation levels in promoter proximal regions to ensure efficient Nrd1p-dependent termination; required in transcriptional silencing near telomeres and at silent mating type loci; has a SET domain +S000034097 CDS YHR119W 8 346043 349285 W 2011-02-03 1996-07-31 +S000001162 ORF Verified YHR120W MSH1 mismatch repair ATPase MSH1 chromosome 8 L000001189 8 349574 352453 W 70.44 2011-02-03 1996-07-31 DNA-binding protein of the mitochondria; involved in repair of mitochondrial DNA; has ATPase activity and binds to DNA mismatches; has homology to E. coli MutS; transcription is induced during meiosis +S000035066 CDS YHR120W 8 349574 352453 W 2011-02-03 1996-07-31 +S000001163 ORF Verified YHR121W LSM12 chromosome 8 8 352756 353319 W 2011-02-03 1996-07-31 Protein of unknown function that may function in RNA processing; interacts with Pbp1p and Pbp4p and associates with ribosomes; contains an RNA-binding LSM domain and an AD domain; GFP-fusion protein is induced by the DNA-damaging agent MMS; relative distribution to the nucleus increases upon DNA replication stress +S000035174 CDS YHR121W 8 352756 353319 W 2011-02-03 1996-07-31 +S000001164 ORF Verified YHR122W CIA2 iron-sulfur cluster assembly protein CIA2 chromosome 8 8 353625 354320 W 2011-02-03 1996-07-31 Component of cytosolic iron-sulfur protein assembly (CIA) machinery; acts at a late step of Fe-S cluster assembly; forms the CIA targeting complex with Cia1p and Met18p that directs Fe-S cluster incorporation into a subset of proteins involved in methionine biosynthesis, DNA replication and repair, transcription, and telomere maintenance; ortholog of human FAM96B +S000036050 CDS YHR122W 8 353625 354320 W 2011-02-03 1996-07-31 +S000001165 ORF Verified YHR123W EPT1 bifunctional diacylglycerol cholinephosphotransferase/ethanolaminephosphotransferase chromosome 8 L000000563 8 354815 356081 W 2011-02-03 1996-07-31 sn-1,2-diacylglycerol ethanolamine- and cholinephosphotranferase; not essential for viability; EPT1 has a paralog, CPT1, that arose from the whole genome duplication +S000036151 CDS YHR123W 8 354815 354864 W 2011-02-03 1996-07-31 +S000036152 CDS YHR123W 8 354956 356081 W 2011-02-03 1996-07-31 +S000036153 intron YHR123W 8 354865 354955 W 2011-02-03 1996-07-31 +S000001166 ORF Verified YHR124W NDT80 transcription factor NDT80 chromosome 8 L000003016 8 356561 358444 W 2011-02-03 1996-07-31 Meiosis-specific transcription factor; required for exit from pachytene and for full meiotic recombination; activates middle sporulation genes; competes with Sum1p for binding to promoters containing middle sporulation elements (MSE) +S000029855 CDS YHR124W 8 356561 358444 W 2011-02-03 1996-07-31 +S000006567 tRNA_gene tF(GAA)H2 chromosome 8 L000003860 8 358569 358478 C 2011-02-03 2000-05-19 Phenylalanine tRNA (tRNA-Phe), predicted by tRNAscan-SE analysis +S000032804 intron tF(GAA)H2 8 358532 358514 C 2011-02-03 2000-05-19 +S000032803 noncoding_exon tF(GAA)H2 8 358513 358478 C 2011-02-03 2000-05-19 +S000032802 noncoding_exon tF(GAA)H2 8 358569 358533 C 2011-02-03 2000-05-19 +S000006996 long_terminal_repeat YHRCdelta8 chromosome 8 8 358850 358672 C 2011-02-03 2000-05-19 Ty1 LTR +S000001167 ORF Dubious YHR125W chromosome 8 8 358858 359163 W 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031773 CDS YHR125W 8 358858 359163 W 2011-02-03 1996-07-31 +S000007005 long_terminal_repeat YHRCtau4 chromosome 8 8 359067 358850 C 2011-02-03 2000-05-19 Ty4 LTR +S000007008 long_terminal_repeat YHRWdelta9 chromosome 8 8 359079 359372 W 2011-02-03 2000-05-19 Ty1 LTR +S000001168 ORF Uncharacterized YHR126C ANS1 chromosome 8 8 360181 359702 C 2011-02-03 1996-07-31 Putative GPI protein; SWAT-GFP and mCherry fusion proteins localize to the vacuole; transcription dependent upon Azf1p +S000031832 CDS YHR126C 8 360181 359702 C 2011-02-03 1996-07-31 +S000001169 ORF Verified YHR127W HSN1 chromosome 8 L000004353 8 360913 361644 W 2011-02-03 1996-07-31 Protein of unknown function; localizes to the nucleus; required for asymmetric localization of Kar9p during mitosis +S000032038 CDS YHR127W 8 360913 361644 W 2011-02-03 1996-07-31 +S000001170 ORF Verified YHR128W FUR1 uracil phosphoribosyltransferase chromosome 8 L000000651 8 362115 362765 W 91 2011-02-03 2003-09-22|1996-07-31 Uracil phosphoribosyltransferase; synthesizes UMP from uracil; involved in the pyrimidine salvage pathway +S000037493 CDS YHR128W 8 362115 362765 W 2011-02-03 2003-09-22|1996-07-31 +S000001171 ORF Verified YHR129C ARP1 actin-related protein 1|ACT5 chromosome 8 L000000028 8 364153 362999 C 2011-02-03 1996-07-31 Actin-related protein of the dynactin complex; required for spindle orientation and nuclear migration; forms actin-like short filament composed of 9 or 10 Arp1p monomers; putative ortholog of mammalian centractin +S000037551 CDS YHR129C 8 364153 362999 C 2011-02-03 1996-07-31 +S000001172 ORF Uncharacterized YHR130C chromosome 8 8 365300 364965 C 2011-02-03 1996-07-31 Putative protein of unknown function; conserved among S. cerevisiae strains; YHR130C is not an essential gene +S000037165 CDS YHR130C 8 365300 364965 C 2011-02-03 1996-07-31 +S000028782 ORF Dubious YHR131W-A chromosome 8 8 367747 367992 W 2011-02-03 2004-07-26|2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YHR131C +S000033522 CDS YHR131W-A 8 367747 367992 W 2011-02-03 2004-07-26|2003-07-29 +S000001173 ORF Uncharacterized YHR131C chromosome 8 8 367892 365340 C 2011-02-03 2004-07-26|1996-07-31 Putative protein of unknown function; GFP-fusion protein localizes to the cytoplasm; overexpression causes cell cycle delay or arrest; contains a PH domain and binds phosphatidylinositols and other lipids in a large-scale study; YHR131C has a paralog, YNL144C, that arose from the whole genome duplication +S000037245 CDS YHR131C 8 367892 365340 C 2011-02-03 2004-07-26|1996-07-31 +S000001174 ORF Verified YHR132C ECM14 putative metallocarboxypeptidase chromosome 8 L000003889 8 369794 368502 C 2011-02-03 1996-07-31 Putative metalloprotease with similarity to zinc carboxypeptidases; required for normal cell wall assembly +S000037322 CDS YHR132C 8 369794 368502 C 2011-02-03 1996-07-31 +S000007496 ORF Verified YHR132W-A IGO2 phosphatase regulator chromosome 8 8 370054 370449 W 2011-02-03 2000-01-21 Protein required for initiation of G0 program; prevents degradation of nutrient-regulated mRNAs via the 5'-3' mRNA decay pathway; phosphorylated by Rim15p; GFP protein localizes to the cytoplasm and nucleus; IGO2 has a paralog, IGO1, that arose from the whole genome duplication +S000032170 CDS YHR132W-A 8 370054 370449 W 2011-02-03 2000-01-21 +S000001175 ORF Verified YHR133C NSG1 chromosome 8 8 371597 370722 C 2011-02-03 1996-07-31 Protein involved in regulation of sterol biosynthesis; specifically stabilizes Hmg2p, one of two HMG-CoA isoenzymes that catalyze the rate-limiting step in sterol biosynthesis; forms foci at the nuclear periphery upon DNA replication stress; relocalizes to the cytosol in response to hypoxia; homolog of mammalian INSIG proteins; NSG1 has a paralog, NSG2, that arose from the whole genome duplication +S000037393 CDS YHR133C 8 371597 370722 C 2011-02-03 1996-07-31 +S000001176 ORF Verified YHR134W WSS1 metalloendopeptidase WSS1 chromosome 8 8 371749 372558 W 2011-02-03 1996-07-31 Metalloprotease involved in DNA repair, removes DNA-protein crosslinks at stalled replication forks during replication of damaged DNA; localizes to a single spot on the nuclear periphery of mother cells but not daughters; interacts genetically with SMT3; activated by DNA binding +S000030068 CDS YHR134W 8 371749 372558 W 2011-02-03 1996-07-31 +S000001177 ORF Verified YHR135C YCK1 serine/threonine protein kinase YCK1|CKI2 chromosome 8 L000002500 8 374310 372694 C 2011-02-03 1996-07-31 Palmitoylated plasma membrane-bound casein kinase I (CK1) isoform; shares redundant functions with Yck2p in morphogenesis, proper septin assembly, endocytic trafficking, and glucose sensing; stabilized by Sod1p binding in the presence of glucose and oxygen, causing glucose repression of respiratory metabolism; involved in the phosphorylation and regulation of glucose sensor Rgt2p; YCK1 has a paralog, YCK2, that arose from the whole genome duplication +S000030130 CDS YHR135C 8 374310 372694 C 2011-02-03 1996-07-31 +S000001178 ORF Verified YHR136C SPL2 chromosome 8 L000004174 8 375100 374654 C 2011-02-03 1996-07-31 Protein with similarity to cyclin-dependent kinase inhibitors; downregulates low-affinity phosphate transport during phosphate limitation by targeting Pho87p to the vacuole; upstream region harbors putative hypoxia response element (HRE) cluster; overproduction suppresses a plc1 null mutation; promoter shows an increase in Snf2p occupancy after heat shock; GFP-fusion protein localizes to the cytoplasm +S000030305 CDS YHR136C 8 375100 374654 C 2011-02-03 1996-07-31 +S000001179 ORF Verified YHR137W ARO9 aromatic-amino-acid:2-oxoglutarate transaminase chromosome 8 L000003950 8 375709 377250 W 2011-02-03 1996-07-31 Aromatic aminotransferase II; catalyzes the first step of tryptophan, phenylalanine, and tyrosine catabolism +S000033667 CDS YHR137W 8 375709 377250 W 2011-02-03 1996-07-31 +S000028649 ORF Dubious YHR137C-A chromosome 8 8 376388 375738 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene ARO9/YHR137W; identified by gene-trapping, expression analysis, and genome-wide homology searching +S000032425 CDS YHR137C-A 8 376388 375738 C 2011-02-03 2003-07-29 +S000001180 ORF Verified YHR138C chromosome 8 8 377699 377355 C 2011-02-03 1996-07-31 Protein of unknown function; similar to Pbi2p; double null mutant lacking Pbi2p and Yhr138cp exhibits highly fragmented vacuoles; protein abundance increases in response to DNA replication stress +S000033725 CDS YHR138C 8 377699 377355 C 2011-02-03 1996-07-31 +S000001181 ORF Verified YHR139C SPS100 chromosome 8 L000002027 8 379199 378219 C 2011-02-03 1996-07-31 Protein required for spore wall maturation; expressed during sporulation; may be a component of the spore wall; expression also induced in cells treated with the mycotoxin patulin; SPS100 has a paralog, YGP1, that arose from the whole genome duplication +S000033864 CDS YHR139C 8 379199 378219 C 2011-02-03 1996-07-31 +S000003533 ORF Dubious YHR139C-A chromosome 8 8 380419 380108 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035738 CDS YHR139C-A 8 380419 380108 C 2011-02-03 1996-07-31 +S000001182 ORF Uncharacterized YHR140W chromosome 8 8 380572 381291 W 2011-02-03 1996-07-31 Putative integral membrane protein of unknown function +S000033477 CDS YHR140W 8 380572 381291 W 2011-02-03 1996-07-31 +S000007297 snoRNA_gene snR32 SNR32 chromosome 8 L000001970 8 381540 381727 W 2011-02-03 2000-05-19 H/ACA box small nucleolar RNA (snoRNA); guides pseudouridylation of large subunit (LSU) rRNA at position U2191 +S000036759 noncoding_exon snR32 8 381540 381727 W 2011-02-03 2000-05-19 +S000001183 ORF Verified YHR141C RPL42B eL42|ribosomal 60S subunit protein L42B|L44e|YP44|YL27|L42B|L41B|MAK18 chromosome 8 L000001732|L000000990 8 382751 381990 C 95 2011-02-03 1996-07-31 Ribosomal 60S subunit protein L42B; required for propagation of the killer toxin-encoding M1 double-stranded RNA satellite of the L-A double-stranded RNA virus; homologous to mammalian ribosomal protein L36A, no bacterial homolog; RPL42B has a paralog, RPL42A, that arose from the whole genome duplication +S000033511 CDS YHR141C 8 382306 381990 C 2011-02-03 1996-07-31 +S000033510 CDS YHR141C 8 382751 382748 C 2011-02-03 1996-07-31 +S000033512 intron YHR141C 8 382747 382307 C 2011-02-03 1996-07-31 +S000001184 ORF Verified YHR142W CHS7 chromosome 8 S000007442 8 383538 384488 W 2011-02-03 1996-07-31 Protein of unknown function; may be involved in chitin biosynthesis by regulation of Chs3p export from the ER; relocalizes from bud neck to ER upon DNA replication stress +S000033600 CDS YHR142W 8 383538 384488 W 2011-02-03 1996-07-31 +S000001186 ORF Verified YHR143W DSE2 chromosome 8 8 385510 386487 W 2011-02-03 1996-07-31 Daughter cell-specific secreted protein with similarity to glucanases; degrades cell wall from the daughter side causing daughter to separate from mother; expression is repressed by cAMP +S000034514 CDS YHR143W 8 385510 386487 W 2011-02-03 1996-07-31 +S000001185 ORF Verified YHR143W-A RPC10 DNA-directed RNA polymerase core subunit RPC10|ABC10-alpha|RPB12 chromosome 8 L000001686 8 387233 387445 W 2011-02-03 1996-07-31 RNA polymerase subunit ABC10-alpha, found in RNA pol I, II, and III; relocalizes from nucleolus to cytoplasm upon DNA replication stress +S000036603 CDS YHR143W-A 8 387233 387445 W 2011-02-03 1996-07-31 +S000001187 ORF Verified YHR144C DCD1 deoxycytidine monophosphate deaminase chromosome 8 L000000496 8 388726 387788 C 2011-02-03 1996-07-31 Deoxycytidine monophosphate (dCMP) deaminase; involved in dUMP and dTMP biosynthesis; expression is NOT cell cycle regulated +S000034581 CDS YHR144C 8 388726 387788 C 2011-02-03 1996-07-31 +S000006682 tRNA_gene tP(UGG)H SUF8 chromosome 8 L000002156|L000003859 8 388995 388893 C 82 2011-02-03 2000-05-19 Proline tRNA (tRNA-Pro), predicted by tRNAscan-SE analysis; target of K. lactis zymocin; can mutate to suppress +1 frameshift mutations in proline codons +S000035984 intron tP(UGG)H 8 388959 388929 C 2011-02-03 2000-05-19 +S000035983 noncoding_exon tP(UGG)H 8 388928 388893 C 2011-02-03 2000-05-19 +S000035982 noncoding_exon tP(UGG)H 8 388995 388960 C 2011-02-03 2000-05-19 +S000001188 ORF Dubious YHR145C chromosome 8 8 389337 388981 C 2011-02-03 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034646 CDS YHR145C 8 389337 388981 C 2011-02-03 1996-07-31 +S000006997 long_terminal_repeat YHRCdelta10 chromosome 8 8 389509 389177 C 2011-02-03 2000-05-19 Ty2 LTR +S000006998 long_terminal_repeat YHRCdelta11 chromosome 8 8 389845 389613 C 2011-02-03 2000-05-19 Ty1 LTR +S000001189 ORF Verified YHR146W CRP1 chromosome 8 8 390300 391697 W 2011-02-03 1996-07-31 Protein that binds to cruciform DNA structures; CRP1 has a paralog, MDG1, that arose from the whole genome duplication +S000035695 CDS YHR146W 8 390300 391697 W 2011-02-03 1996-07-31 +S000118360 ARS ARS818 ARSVIII-392 chromosome 8 8 392180 392395 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178109 ARS_consensus_sequence ARS818 8 392249 392233 C 2014-11-18 2014-11-18 +S000001190 ORF Verified YHR147C MRPL6 mitochondrial 54S ribosomal protein YmL16|YmL16 chromosome 8 L000001161 8 393283 392639 C 2011-02-03 1996-07-31 Mitochondrial ribosomal protein of the large subunit +S000035761 CDS YHR147C 8 393283 392639 C 2011-02-03 1996-07-31 +S000001191 ORF Verified YHR148W IMP3 snoRNA-binding rRNA-processing protein IMP3 chromosome 8 S000007425 8 393534 394085 W 2011-02-03 1996-07-31 Component of the SSU processome; SSU processome is required for pre-18S rRNA processing, essential protein that interacts with Mpp10p and mediates interactions of Imp4p and Mpp10p with U3 snoRNA +S000035958 CDS YHR148W 8 393534 394085 W 2011-02-03 1996-07-31 +S000001192 ORF Verified YHR149C SKG6 chromosome 8 8 396659 394455 C 2011-02-03 1996-07-31 Integral membrane protein; localizes primarily to growing sites such as the bud tip or the cell periphery; potential Cdc28p substrate; Skg6p interacts with Zds1p and Zds2p; SKG6 has a paralog, TOS2, that arose from the whole genome duplication +S000037794 CDS YHR149C 8 396659 394455 C 2011-02-03 1996-07-31 +S000001193 ORF Verified YHR150W PEX28 chromosome 8 8 397251 398990 W 2011-02-03 1996-07-31 Peroxisomal integral membrane peroxin; involved in the regulation of peroxisomal size, number and distribution; genetic interactions suggest that Pex28p and Pex29p act at steps upstream of those mediated by Pex30p, Pex31p, and Pex32p +S000037560 CDS YHR150W 8 397251 398990 W 2011-02-03 1996-07-31 +S000001194 ORF Verified YHR151C MTC6 chromosome 8 8 400848 399268 C 2011-02-03 1996-07-31 Protein of unknown function; mtc6 is synthetically sick with cdc13-1; SWAT-GFP and mCherry fusion proteins localize to the vacuole while SWAT-GFP fusion also localizes to the endoplasmic reticulum +S000037592 CDS YHR151C 8 400848 399268 C 2011-02-03 1996-07-31 +S000001195 ORF Verified YHR152W SPO12 SDB21 chromosome 8 L000002003|S000029441|L000001821 8 401434 401955 W 83 2011-02-03 1996-07-31 Nucleolar protein of unknown function; positive regulator of mitotic exit; involved in regulating release of Cdc14p from the nucleolus in early anaphase, may play similar role in meiosis; SPO12 has a paralog, BNS1, that arose from the whole genome duplication +S000037692 CDS YHR152W 8 401434 401955 W 2011-02-03 1996-07-31 +S000001196 ORF Verified YHR153C SPO16 chromosome 8 L000002007 8 402682 402086 C 83 2011-02-03 1996-07-31 Meiosis-specific protein involved in synaptonemal complex assembly; implicated in regulation of crossover formation; required for sporulation +S000037713 CDS YHR153C 8 402682 402086 C 2011-02-03 1996-07-31 +S000001197 ORF Verified YHR154W RTT107 ESC4 chromosome 8 L000004424 8 402966 406178 W 2011-02-03 1996-07-31 Protein implicated in Mms22-dependent DNA repair during S phase; involved in recruiting the SMC5/6 complex to double-strand breaks; DNA damage induces phosphorylation by Mec1p at one or more SQ/TQ motifs; interacts with Mms22p and Slx4p; has four BRCT domains; has a role in regulation of Ty1 transposition; relative distribution to nuclear foci increases upon DNA replication stress +S000030580 CDS YHR154W 8 402966 406178 W 2011-02-03 1996-07-31 +S000001198 ORF Verified YHR155W LAM1 YSP1 chromosome 8 8 407103 410789 W 2011-02-03 1996-07-31 Putative sterol transfer protein; localizes to puncta in the cortical ER; probable role in retrograde transport of sterols from the plasma membrane to the ER; one of six StART-like domain-containing proteins in yeast that may be involved in sterol transfer between intracellular membranes; conserved across eukaryotes; contains GRAM, StART-like (VASt) and two PH-like domains +S000030669 CDS YHR155W 8 407103 410789 W 2011-02-03 1996-07-31 +S000006462 snoRNA_gene snR71 SNR71 chromosome 8 L000004540 8 411228 411317 W 2011-02-03 2000-05-19 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2946 +S000031782 noncoding_exon snR71 8 411228 411317 W 2011-02-03 2000-05-19 +S000001199 ORF Verified YHR156C LIN1 U5 snRNP complex subunit LIN1|SNU40 chromosome 8 8 412406 411384 C 2011-02-03 1996-07-31 Non-essential component of U5 snRNP; nuclear protein; physically interacts with Irr1p of cohesin complex; may link together proteins involved in chromosome segregation, mRNA splicing and DNA replication +S000030744 CDS YHR156C 8 412406 411384 C 2011-02-03 1996-07-31 +S000001200 ORF Verified YHR157W REC104 chromosome 8 L000001605 8 412907 413455 W 107 2011-02-03 1996-07-31 Protein involved in early stages of meiotic recombination; required for meiotic crossing over; forms a complex with Rec102p and Spo11p necessary during the initiation of recombination +S000030900 CDS YHR157W 8 412907 413455 W 2011-02-03 1996-07-31 +S000001201 ORF Verified YHR158C KEL1 chromosome 8 L000003592 8 417179 413685 C 2011-02-03 1996-07-31 Protein required for proper cell fusion and cell morphology; forms a complex with Bud14p and Kel2p that regulates Bnr1p (formin) to affect actin cable assembly, cytokinesis, and polarized growth; functions in a complex with Kel2p to negatively regulate mitotic exit, interacts with Tem1p and Lte1p; localizes to regions of polarized growth; potential Cdc28p substrate +S000031842 CDS YHR158C 8 417179 413685 C 2011-02-03 1996-07-31 +S000001202 ORF Uncharacterized YHR159W TDA11 chromosome 8 8 417549 419063 W 2011-02-03 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; potential Cdc28p substrate; null mutant is sensitive to expression of the top1-T722A allele +S000032058 CDS YHR159W 8 417549 419063 W 2011-02-03 1996-07-31 +S000001203 ORF Verified YHR160C PEX18 chromosome 8 L000004796 8 420072 419221 C 2011-02-03 1996-07-31 Peroxin; required for targeting of peroxisomal matrix proteins containing PTS2; interacts with Pex7p; partially redundant with Pex21p; primarily responsible for peroxisomal import during growth on oleate, and expression is induced during oleate growth +S000031912 CDS YHR160C 8 420072 419221 C 2011-02-03 1996-07-31 +S000001204 ORF Verified YHR161C YAP1801 chromosome 8 L000004198 8 422286 420373 C 2011-02-03 1996-07-31 Protein of the AP180 family, involved in clathrin cage assembly; binds Pan1p and clathrin; YAP1801 has a paralog, YAP1802, that arose from the whole genome duplication +S000032851 CDS YHR161C 8 422286 420373 C 2011-02-03 1996-07-31 +S000001205 ORF Verified YHR162W MPC2 mitochondrial pyruvate carrier chromosome 8 8 423072 423461 W 2011-02-03 1996-07-31 Highly conserved subunit of the mitochondrial pyruvate carrier (MPC); expressed during growth on fermentable carbon sources, and heterodimerizes with Mpc1p to form the fermentative isoform of MPC; MPC localizes to the mitochondrial inner membrane and mediates pyruvate uptake; MPC2 paralog, MPC3, heterodimerizes with Mpc1p to form the respiratory MPC isoform +S000033001 CDS YHR162W 8 423072 423461 W 2011-02-03 1996-07-31 +S000001206 ORF Verified YHR163W SOL3 6-phosphogluconolactonase SOL3 chromosome 8 L000003117 8 423724 424473 W 2011-02-03 1996-07-31|2005-11-07 6-phosphogluconolactonase; catalyzes the second step of the pentose phosphate pathway; weak multicopy suppressor of los1-1 mutation; homologous to Sol2p and Sol1p; SOL3 has a paralog, SOL4, that arose from the whole genome duplication +S000033074 CDS YHR163W 8 423724 424473 W 2011-02-03 1996-07-31|2005-11-07 +S000001207 ORF Verified YHR164C DNA2 bifunctional ATP-dependent DNA helicase/ssDNA endodeoxyribonuclease DNA2|WEB2 chromosome 8 L000003158 8 429178 424610 C 2011-02-03 1996-07-31 Tripartite DNA replication factor; single-stranded DNA-dependent ATPase, ATP-dependent nuclease, helicase; tracking protein for flap cleavage during Okazaki fragment maturation; involved in DNA repair/processing of meiotic DNA double strand breaks; component of telomeric chromatin with cell-cycle dependent localization; required for telomerase-dependent telomere synthesis; forms nuclear foci upon DNA replication stress; human homolog DNA2 complements yeast dna2 mutant +S000033680 CDS YHR164C 8 429178 424610 C 2011-02-03 1996-07-31 +S000028783 ORF Dubious YHR165W-A chromosome 8 8 436647 436958 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps ORF PRP8/YHR165C +S000033524 CDS YHR165W-A 8 436647 436958 W 2011-02-03 2003-07-29 +S000001208 ORF Verified YHR165C PRP8 U4/U6-U5 snRNP complex subunit PRP8|USA2|SLT21|RNA8|DNA39|DBF3 chromosome 8 L000001500|L000003226 8 436948 429707 C 2011-02-03 1996-07-31 Component of U4/U6-U5 snRNP complex; involved in second catalytic step of splicing; participates in spliceosomal assembly through its interaction with U1 snRNA; largest and most evolutionarily conserved protein of the spliceosome; mutations in human ortholog, PRPF8, cause Retinitis pigmentosa and missplicing in Myelodysplastic syndrome; mouse ortholog interacts with androgen receptor and may have a role in prostate cancer +S000033804 CDS YHR165C 8 436948 429707 C 2011-02-03 1996-07-31 +S000001209 ORF Verified YHR166C CDC23 anaphase promoting complex subunit CDC23 chromosome 8 L000000261 8 439050 437170 C 2011-02-03 1996-07-31 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); APC/C is a ubiquitin-protein ligase required for degradation of anaphase inhibitors, including mitotic cyclins, during the metaphase/anaphase transition +S000033878 CDS YHR166C 8 439050 437170 C 2011-02-03 1996-07-31 +S000001210 ORF Verified YHR167W THP2 chromosome 8 8 439342 440127 W 2011-02-03 1996-07-31 Subunit of the THO and TREX complexes; THO connects transcription elongation and mitotic recombination, and TREX is recruited to activated genes and couples transcription to mRNA export; involved in telomere maintenance +S000034871 CDS YHR167W 8 439342 440127 W 2011-02-03 1996-07-31 +S000001211 ORF Verified YHR168W MTG2 putative GTPase MTG2 chromosome 8 8 440377 441933 W 2011-02-03 1996-07-31|2011-02-03 Putative GTPase; member of the Obg family; peripheral protein of the mitochondrial inner membrane that associates with the large ribosomal subunit; required for mitochondrial translation, possibly via a role in ribosome assembly +S000035023 CDS YHR168W 8 440377 441933 W 2011-02-03 1996-07-31|2011-02-03 +S000001212 ORF Verified YHR169W DBP8 ATP-dependent RNA helicase DBP8 chromosome 8 L000004248 8 442181 443476 W 2011-02-03 1996-07-31 ATPase, putative RNA helicase of the DEAD-box family; component of 90S preribosome complex involved in production of 18S rRNA and assembly of 40S small ribosomal subunit; ATPase activity stimulated by association with Esf2p +S000035188 CDS YHR169W 8 442181 443476 W 2011-02-03 1996-07-31 +S000001213 ORF Verified YHR170W NMD3 ribosome-binding protein NMD3|SRC5 chromosome 8 L000002937 8 443828 445384 W 2011-02-03 1996-07-31 Protein involved in nuclear export of the large ribosomal subunit; acts as a Crm1p-dependent adapter protein for export of nascent ribosomal subunits through the nuclear pore complex +S000036170 CDS YHR170W 8 443828 445384 W 2011-02-03 1996-07-31 +S000001214 ORF Verified YHR171W ATG7 APG11|APG7|CVT2 chromosome 8 L000004701|S000029035|L000004786 8 445713 447605 W 2005-11-07 1996-07-31 Autophagy-related protein and dual specificity member of the E1 family; mediates the attachment of Atg12p to Atg5p and Atg8p to phosphatidylethanolamine which are required steps in autophagosome formation; E1 enzymes are also known as ubiquitin-activating enzymes; involved in methionine restriction extension of chronological lifespan in an autophagy-dependent manner +S000036922 CDS YHR171W 8 445713 447605 W 2005-11-07 1996-07-31 +S000118361 ARS ARS820 ARSVIII-448 chromosome 8 8 447714 447795 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178110 ARS_consensus_sequence ARS820 8 447793 447777 C 2014-11-18 2014-11-18 +S000001215 ORF Verified YHR172W SPC97 chromosome 8 L000003543 8 448335 450806 W 2005-11-07 1996-07-31 Component of the microtubule-nucleating Tub4p (gamma-tubulin) complex; interacts with Spc110p at the spindle pole body (SPB) inner plaque and with Spc72p at the SPB outer plaque +S000036987 CDS YHR172W 8 448335 450806 W 2005-11-07 1996-07-31 +S000001216 ORF Uncharacterized YHR173C chromosome 8 8 451153 450815 C 2005-11-07 1996-07-31 Protein of unknown function; expressed at both mRNA and protein levels; SWAT-GFP and mCherry fusion proteins localize to the vacuole +S000037013 CDS YHR173C 8 451153 450815 C 2005-11-07 1996-07-31 +S000001217 ORF Verified YHR174W ENO2 phosphopyruvate hydratase ENO2 chromosome 8 L000000560 8 451327 452640 W 2005-11-07 1996-07-31 Enolase II, a phosphopyruvate hydratase; catalyzes conversion of 2-phosphoglycerate to phosphoenolpyruvate during glycolysis and the reverse reaction during gluconeogenesis; expression induced in response to glucose; ENO2 has a paralog, ENO1, that arose from the whole genome duplication +S000037161 CDS YHR174W 8 451327 452640 W 2005-11-07 1996-07-31 +S000001218 ORF Verified YHR175W CTR2 low-affinity Cu transporter chromosome 8 L000004070 8 452872 453441 W 2005-11-07 1996-07-31 Low-affinity copper transporter of the vacuolar membrane; mutation confers resistance to toxic copper concentrations, while overexpression confers resistance to copper starvation; regulated by nonsense-mediated mRNA decay pathway +S000029818 CDS YHR175W 8 452872 453441 W 2005-11-07 1996-07-31 +S000028553 ORF Uncharacterized YHR175W-A chromosome 8 8 453558 453707 W 2005-11-07 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031239 CDS YHR175W-A 8 453558 453707 W 2005-11-07 2003-07-29 +S000001219 ORF Verified YHR176W FMO1 N,N-dimethylaniline monooxygenase chromosome 8 8 454229 455527 W 2005-11-07 2004-01-29|1996-07-31 Flavin-containing monooxygenase; localized to the cytoplasmic face of the ER membrane; catalyzes oxidation of biological thiols to maintain the ER redox buffer ratio for correct folding of disulfide-bonded proteins +S000029937 CDS YHR176W 8 454229 455527 W 2005-11-07 2004-01-29|1996-07-31 +S000001220 ORF Verified YHR177W GON3 chromosome 8 8 456591 457952 W 2005-11-07 1996-07-31 Putative transcription factor containing a WOPR domain; binds DNA in vitro; similar to C. albicans Wor1p transcription factor that regulates white-opaque switching; overexpression causes a cell cycle delay or arrest +S000030949 CDS YHR177W 8 456591 457952 W 2005-11-07 1996-07-31 +S000001221 ORF Verified YHR178W STB5 chromosome 8 L000003368 8 459299 461530 W 2005-11-07 1996-07-31 Transcription factor; involved in regulating multidrug resistance and oxidative stress response; forms a heterodimer with Pdr1p; contains a Zn(II)2Cys6 zinc finger domain that interacts with a pleiotropic drug resistance element in vitro +S000031050 CDS YHR178W 8 459299 461530 W 2005-11-07 1996-07-31 +S000001222 ORF Verified YHR179W OYE2 NADPH dehydrogenase chromosome 8 L000001325 8 462502 463704 W 2005-11-07 1996-07-31 Conserved NADPH oxidoreductase containing flavin mononucleotide (FMN); responsible for geraniol reduction into citronellol during fermentation; homologous to Oye3p with different ligand binding and catalytic properties; may be involved in sterol metabolism, oxidative stress response, and programmed cell death; protein abundance increases in response to DNA replication stress +S000031157 CDS YHR179W 8 462502 463704 W 2005-11-07 1996-07-31 +S000006999 long_terminal_repeat YHRCdelta12 chromosome 8 8 464147 463920 C 2005-11-07 2000-05-19 Ty1 LTR +S000001223 ORF Dubious YHR180W chromosome 8 8 465178 465669 W 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000032113 CDS YHR180W 8 465178 465669 W 2005-11-07 1996-07-31 +S000007009 long_terminal_repeat YHRWdelta13 chromosome 8 8 466549 466863 W 2005-11-07 2000-05-19 Ty1 LTR +S000028555 ORF Dubious YHR180W-A chromosome 8 8 466932 467114 W 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps dubious ORF YHR180C-B and long terminal repeat YHRCsigma3 +S000031241 CDS YHR180W-A 8 466932 467114 W 2005-11-07 2003-07-29 +S000007004 long_terminal_repeat YHRCsigma3 chromosome 8 8 466975 466884 C 2005-11-07 2000-05-19 Ty3 LTR +S000006751 tRNA_gene tT(UGU)H chromosome 8 L000003857 8 466990 467061 W 2005-11-07 2000-05-19 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000036268 noncoding_exon tT(UGU)H 8 466990 467061 W 2005-11-07 2000-05-19 +S000028554 ORF Dubious YHR180C-B chromosome 8 8 467062 466958 C 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the dubious ORF YHR180W-A +S000031240 CDS YHR180C-B 8 467062 466958 C 2005-11-07 2003-07-29 +S000001224 ORF Verified YHR181W SVP26 ERV26 chromosome 8 8 467228 467914 W 2005-11-07 1996-07-31 Integral membrane protein of the early Golgi apparatus and ER; involved in COP II vesicle transport; may also function to promote retention of proteins in the early Golgi compartment +S000032177 CDS YHR181W 8 467228 467914 W 2005-11-07 1996-07-31 +S000001225 ORF Verified YHR182W chromosome 8 8 468219 470576 W 2005-11-07 1996-07-31 Protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery and cytoplasm; relocalizes from bud neck to cytoplasm upon DNA replication stress +S000032262 CDS YHR182W 8 468219 470576 W 2005-11-07 1996-07-31 +S000001226 ORF Verified YHR183W GND1 phosphogluconate dehydrogenase (decarboxylating) GND1 chromosome 8 L000003125 8 470960 472429 W 2005-11-07 1996-07-31 6-phosphogluconate dehydrogenase (decarboxylating); catalyzes an NADPH regenerating reaction in the pentose phosphate pathway; required for growth on D-glucono-delta-lactone and adaptation to oxidative stress; GND1 has a paralog, GND2, that arose from the whole genome duplication +S000033135 CDS YHR183W 8 470960 472429 W 2005-11-07 1996-07-31 +S000028784 ORF Dubious YHR182C-A chromosome 8 8 471412 470939 C 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF GND1/YHR183W +S000033525 CDS YHR182C-A 8 471412 470939 C 2005-11-07 2003-07-29 +S000001227 ORF Verified YHR184W SSP1 SPO3 chromosome 8 L000004410|L000004488 8 472744 474459 W 2005-11-07 1996-07-31 Protein involved in the control of meiotic nuclear division; involved in the coordination of meiosis with spore formation; subunit of the leading edge protein (LEP) complex (Ssp1-Ady3-Don1-Irc10) that forms a ring-like structure at the leading edge of the prospore membrane during meiosis II; required for assembly of the leading edge coat and both prospore membrane shaping and organization; transcription is induced midway through meiosis +S000033191 CDS YHR184W 8 472744 474459 W 2005-11-07 1996-07-31 +S000001228 ORF Verified YHR185C PFS1 ADY1 chromosome 8 L000004781 8 475340 474627 C 2005-11-07 1996-07-31 Sporulation protein required for prospore membrane formation; required for prospore membrane formation at selected spindle poles; ensures functionality of all four spindle pole bodies during meiosis II; not required for meiotic recombination or meiotic chromosome segregation +S000033215 CDS YHR185C 8 475340 474627 C 2005-11-07 1996-07-31 +S000006768 tRNA_gene tV(CAC)H chromosome 8 L000003858 8 475778 475706 C 2005-11-07 2000-05-19 Valine tRNA (tRNA-Val), predicted by tRNAscan-SE analysis +S000030621 noncoding_exon tV(CAC)H 8 475778 475706 C 2005-11-07 2000-05-19 +S000001229 ORF Verified YHR186C KOG1 ubiquitin-binding TORC1 subunit KOG1|LAS24 chromosome 8 8 480672 475999 C 2005-11-07 1996-07-31 Subunit of TORC1; TORC1 is a rapamycin-sensitive complex involved in growth control that contains Tor1p or Tor2p, Lst8p and Tco89p; contains four HEAT repeats and seven WD-40 repeats; may act as a scaffold protein to couple TOR and its effectors +S000033270 CDS YHR186C 8 480672 475999 C 2005-11-07 1996-07-31 +S000001230 ORF Verified YHR187W IKI1 Elongator subunit IKI1|HAP2|ELP5|TOT5 chromosome 8 L000003562 8 480990 481919 W 2005-11-07 1996-07-31 Subunit of hexameric RecA-like ATPase Elp456 Elongator subcomplex; which is required for modification of wobble nucleosides in tRNA; iki1 mutations confer resistance to the K. lactis toxin zymocin +S000034195 CDS YHR187W 8 480990 481919 W 2005-11-07 1996-07-31 +S000001231 ORF Verified YHR188C GPI16 GPI-anchor transamidase subunit GPI16 chromosome 8 8 483837 482005 C 2005-11-07 1996-07-31 Subunit of the glycosylphosphatidylinositol transamidase complex; transmembrane protein; adds GPIs to newly synthesized proteins; human PIG-Tp homolog +S000034241 CDS YHR188C 8 483837 482005 C 2005-11-07 1996-07-31 +S000001232 ORF Verified YHR189W PTH1 aminoacyl-tRNA hydrolase|PTH chromosome 8 8 484028 484600 W 2005-11-07 1996-07-31 One of two mitochondrially-localized peptidyl-tRNA hydrolases; dispensable for respiratory growth on rich medium, but required for respiratory growth on minimal medium; see also PTH2 +S000034422 CDS YHR189W 8 484028 484600 W 2005-11-07 1996-07-31 +S000001233 ORF Verified YHR190W ERG9 bifunctional farnesyl-diphosphate farnesyltransferase/squalene synthase chromosome 8 L000000575 8 484845 486179 W 2005-11-07 1996-07-31 Farnesyl-diphosphate farnesyl transferase (squalene synthase); joins two farnesyl pyrophosphate moieties to form squalene in the sterol biosynthesis pathway +S000036394 CDS YHR190W 8 484845 486179 W 2005-11-07 1996-07-31 +S000001234 ORF Verified YHR191C CTF8 chromosome 8 L000003309 8 486631 486230 C 2005-11-07 1996-07-31 Subunit of a complex with Ctf18p; shares some subunits with Replication Factor C; required for sister chromatid cohesion +S000036427 CDS YHR191C 8 486631 486230 C 2005-11-07 1996-07-31 +S000001235 ORF Verified YHR192W LNP1 chromosome 8 8 486826 487662 W 2005-11-07 1996-07-31 Lunapark family member involved in ER network formation; regulates the ER asymmetry-induced inheritance block during ER stress; localizes to ER junctions and this localization is regulated by the yeast atlastin ortholog Sey1p; interacts with the reticulon protein Rtn1p; induced in response to the DNA-damaging agent MMS +S000036575 CDS YHR192W 8 486826 487662 W 2005-11-07 1996-07-31 +S000001236 ORF Verified YHR193C EGD2 chromosome 8 L000000546|L000002606 8 488236 487712 C 2005-11-07 1996-07-31 Alpha subunit of the nascent polypeptide-associated complex (NAC); involved in protein sorting and translocation; associated with cytoplasmic ribosomes +S000036606 CDS YHR193C 8 488236 487712 C 2005-11-07 1996-07-31 +S000001237 ORF Verified YHR194W MDM31 chromosome 8 8 488657 490396 W 2005-11-07 1996-07-31 Mitochondrial protein that may have a role in phospholipid metabolism; inner membrane protein with similarity to Mdm32p; required for normal mitochondrial morphology and inheritance; interacts genetically with MMM1, MMM2, MDM10, MDM12, and MDM34 +S000037365 CDS YHR194W 8 488657 490396 W 2005-11-07 1996-07-31 +S000028785 ORF Dubious YHR193C-A chromosome 8 8 489027 488653 C 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified ORF MDM31/YHR194W +S000033528 CDS YHR193C-A 8 489027 488653 C 2005-11-07 2003-07-29 +S000001238 ORF Verified YHR195W NVJ1 VAB36 chromosome 8 8 490747 491712 W 2005-11-07 1996-07-31 Nuclear envelope protein; anchored to the nuclear inner membrane, that interacts with the vacuolar membrane protein Vac8p to promote formation of nucleus-vacuole junctions during piecemeal microautophagy of the nucleus (PMN) +S000037505 CDS YHR195W 8 490747 491712 W 2005-11-07 1996-07-31 +S000001239 ORF Verified YHR196W UTP9 chromosome 8 8 491931 493658 W 2005-11-07 1996-07-31 Nucleolar protein; component of the small subunit (SSU) processome containing the U3 snoRNA that is involved in processing of pre-18S rRNA +S000030211 CDS YHR196W 8 491931 493658 W 2005-11-07 1996-07-31 +S000001240 ORF Verified YHR197W RIX1 IPI2 chromosome 8 8 493896 496187 W 2005-11-07 1996-07-31|2011-02-03 Component of the Rix1 complex and possibly pre-replicative complexes; required for processing of ITS2 sequences from 35S pre-rRNA; component of the pre-60S ribosomal particle with the dynein-related AAA-type ATPase Mdn1p; required for pre-replicative complex (pre-RC) formation and maintenance during DNA replication licensing; relocalizes to the cytosol in response to hypoxia; essential gene +S000030393 CDS YHR197W 8 493896 496187 W 2005-11-07 1996-07-31|2011-02-03 +S000001241 ORF Verified YHR198C AIM18 FMP22 chromosome 8 8 497280 496315 C 2005-11-07 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays elevated frequency of mitochondrial genome loss +S000030441 CDS YHR198C 8 497280 496315 C 2005-11-07 1996-07-31 +S000001242 ORF Verified YHR199C AIM46 FMP34 chromosome 8 8 498422 497490 C 2005-11-07 1996-07-31 Protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; null mutant displays elevated frequency of mitochondrial genome loss +S000031364 CDS YHR199C 8 498422 497490 C 2005-11-07 1996-07-31 +S000029704 ORF Verified YHR199C-A NBL1 MCL1 chromosome 8 8 498859 498571 C 2005-11-07 2004-02-20 Subunit of the conserved chromosomal passenger complex (CPC); complex regulates mitotic chromosome segregation; not required for the kinase activity of the complex; mediates the interaction of Sli15p and Bir1p; other complex members are Ipl1p, Sli15p, and Bir1p +S000036811 CDS YHR199C-A 8 498719 498571 C 2005-11-07 2004-02-20 +S000036810 CDS YHR199C-A 8 498859 498787 C 2005-11-07 2004-02-20 +S000036812 intron YHR199C-A 8 498786 498720 C 2005-11-07 2004-02-20 +S000001243 ORF Verified YHR200W RPN10 proteasome regulatory particle base subunit RPN10|SUN1|MCB1 chromosome 8 L000003108 8 499079 499885 W 2005-11-07 1996-07-31 Non-ATPase base subunit of the 19S RP of the 26S proteasome; N-terminus plays a role in maintaining the structural integrity of the regulatory particle (RP); binds selectively to polyubiquitin chains; homolog of the mammalian S5a protein +S000036384 CDS YHR200W 8 499079 499885 W 2005-11-07 1996-07-31 +S000001244 ORF Verified YHR201C PPX1 exopolyphosphatase chromosome 8 L000001477 8 501143 499950 C 2005-11-07 1996-07-31 Exopolyphosphatase; hydrolyzes inorganic polyphosphate (poly P) into Pi residues; located in the cytosol, plasma membrane, and mitochondrial matrix +S000036416 CDS YHR201C 8 501143 499950 C 2005-11-07 1996-07-31 +S000118362 ARS ARS822 ARSVIII-502 chromosome 8 8 501756 501996 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000001245 ORF Uncharacterized YHR202W chromosome 8 8 502388 504196 W 2005-11-07 1996-07-31 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole, while HA-tagged protein is found in the soluble fraction, suggesting cytoplasmic localization +S000037129 CDS YHR202W 8 502388 504196 W 2005-11-07 1996-07-31 +S000001246 ORF Verified YHR203C RPS4B eS4|ribosomal 40S subunit protein S4B|S4e|rp5|YS6|S7B|S4B chromosome 8 L000001750 8 505530 504476 C 2005-11-07 1999-07-17|1996-07-31 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S4, no bacterial homolog; RPS4B has a paralog, RPS4A, that arose from the whole genome duplication +S000037172 CDS YHR203C 8 505247 504476 C 2005-11-07 1999-07-17|1996-07-31 +S000037171 CDS YHR203C 8 505530 505517 C 2005-11-07 1999-07-17|1996-07-31 +S000037173 intron YHR203C 8 505516 505248 C 2005-11-07 1999-07-17|1996-07-31 +S000001247 ORF Verified YHR204W MNL1 alpha-1,2-mannosidase MNL1|HTM1 chromosome 8 8 506319 508709 W 2005-11-07 1996-07-31 Alpha-1,2-specific exomannosidase of the endoplasmic reticulum; involved in glycan trimming of both folded and misfolded glycoproteins; complexes with Pdi1p, and trims a mannose from Man8GlcNac2 glycans to generate Man7GlcNac2, an oligosaccharide signal on glycoproteins destined for ER-associated protein degradation; requires Pdi1p for stability and substrate recognition; human homolog EDEM1 can complement yeast null mutant +S000037304 CDS YHR204W 8 506319 508709 W 2005-11-07 1996-07-31 +S000001248 ORF Verified YHR205W SCH9 serine/threonine protein kinase SCH9|HRM2|KOM1 chromosome 8 L000001810 8 509363 511837 W 2005-11-07 1996-07-31 AGC family protein kinase; functional ortholog of mammalian S6 kinase; phosphorylated by Tor1p and required for TORC1-mediated regulation of ribosome biogenesis, translation initiation, and entry into G0 phase; involved in transactivation of osmostress-responsive genes; regulates G1 progression, cAPK activity and nitrogen activation of the FGM pathway; integrates nutrient signals and stress signals from sphingolipids to regulate lifespan +S000037366 CDS YHR205W 8 509363 511837 W 2005-11-07 1996-07-31 +S000001249 ORF Verified YHR206W SKN7 kinase-regulated stress-responsive transcription factor SKN7|POS9|BRY1 chromosome 8 L000001908 8 512732 514600 W 2005-11-07 1996-07-31 Nuclear response regulator and transcription factor; physically interacts with the Tup1-Cyc8 complex and recruits Tup1p to its targets; part of a branched two-component signaling system; required for optimal induction of heat-shock genes in response to oxidative stress; involved in osmoregulation; relocalizes to the cytosol in response to hypoxia; SKN7 has a paralog, HMS2, that arose from the whole genome duplication +S000029994 CDS YHR206W 8 512732 514600 W 2005-11-07 1996-07-31 +S000001250 ORF Verified YHR207C SET5 S-adenosylmethionine-dependent methyltransferase chromosome 8 8 516485 514905 C 2005-11-07 1996-07-31 Methyltransferase involved in methylation of histone H4 Lys5, -8, -12; S-adenosylmethionine-dependent; zinc-finger protein, contains one canonical and two unusual fingers in unusual arrangements; deletion enhances replication of positive-strand RNA virus +S000030030 CDS YHR207C 8 516485 514905 C 2005-11-07 1996-07-31 +S000001251 ORF Verified YHR208W BAT1 branched-chain-amino-acid transaminase BAT1|TWT1|ECA39 chromosome 8 L000002396 8 517532 518713 W 2005-11-07 1996-07-31 Mitochondrial branched-chain amino acid (BCAA) aminotransferase; preferentially involved in BCAA biosynthesis; homolog of murine ECA39; highly expressed during logarithmic phase and repressed during stationary phase; BAT1 has a paralog, BAT2, that arose from the whole genome duplication +S000030198 CDS YHR208W 8 517532 518713 W 2005-11-07 1996-07-31 +S000001252 ORF Verified YHR209W CRG1 S-adenosylmethionine-dependent methyltransferase chromosome 8 8 519437 520312 W 2005-11-07 1996-07-31 S-AdoMet-dependent methyltransferase involved in lipid homeostasis; mediates resistance to a drug cantharidin +S000030378 CDS YHR209W 8 519437 520312 W 2005-11-07 1996-07-31 +S000001253 ORF Uncharacterized YHR210C aldose 1-epimerase superfamily protein chromosome 8 8 521737 520712 C 2005-11-07 1996-07-31 Putative aldose 1-epimerase superfamily protein; non-essential gene; highly expressed under anaeorbic conditions +S000032576 CDS YHR210C 8 521737 520712 C 2005-11-07 1996-07-31 +S000001254 ORF Verified YHR211W FLO5 flocculin FLO5 chromosome 8 L000000618 8 525392 528619 W 2005-11-07 1996-07-31 Lectin-like cell wall protein (flocculin) involved in flocculation; binds mannose chains on the surface of other cells, confers floc-forming ability that is chymotrypsin resistant but heat labile; important for co-flocculation with other yeasts, mediating interaction with specific species; FLO5 has a paralog, FLO1, that arose from a segmental duplication +S000033338 CDS YHR211W 8 525392 528619 W 2005-11-07 1996-07-31 +S000007000 long_terminal_repeat YHRCdelta14 chromosome 8 8 530379 530049 C 2005-11-07 2000-05-19 Ty1 LTR +S000001255 ORF Dubious YHR212C chromosome 8 8 538094 537759 C 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; YHR212C has a paralog, YAR060C, that arose from a segmental duplication +S000033360 CDS YHR212C 8 538094 537759 C 2005-11-07 1996-07-31 +S000028650 ORF Uncharacterized YHR212W-A chromosome 8 8 538742 538945 W 2005-11-07 2003-07-29 Pseudogenic fragment with similarity to flocculins; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum; YHR212W-A has a paralog, YAR061W, that arose from a segmental duplication +S000032453 CDS YHR212W-A 8 538742 538945 W 2005-11-07 2003-07-29 +S000001256 ORF Uncharacterized YHR213W chromosome 8 8 539151 539747 W 2005-11-07 1996-07-31 Pseudogenic fragment with similarity to flocculins; YHR213W has a paralog, YAR062W, that arose from a segmental duplication +S000033478 CDS YHR213W 8 539151 539747 W 2005-11-07 1996-07-31 +S000028651 ORF Uncharacterized YHR213W-A chromosome 8 8 540549 540782 W 2005-11-07 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032454 CDS YHR213W-A 8 540549 540782 W 2005-11-07 2003-07-29 +S000028652 ORF Uncharacterized YHR213W-B chromosome 8 8 540800 541099 W 2005-11-07 2003-07-29 Pseudogenic fragment with similarity to flocculins; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; YHR213W-B has a paralog, YAR064W, that arose from a segmental duplication +S000032455 CDS YHR213W-B 8 540800 541099 W 2005-11-07 2003-07-29 +S000001257 ORF Uncharacterized YHR214W chromosome 8 8 541651 542262 W 2005-11-07 1996-07-31 Putative protein of unknown function; predicted to be a glycosylphosphatidylinositol-modified (GPI) protein; YHR214W has a paralog, YAR066W, that arose from a segmental duplication +S000033542 CDS YHR214W 8 541651 542262 W 2005-11-07 1996-07-31 +S000003535 ORF Dubious YHR214W-A chromosome 8 8 543008 543493 W 2005-11-07 1996-07-31 Dubious open reading frame; induced by zinc deficiency; YHR214W-A has a paralog, YAR068W, that arose from a segmental duplication +S000035568 CDS YHR214W-A 8 543008 543493 W 2005-11-07 1996-07-31 +S000007001 long_terminal_repeat YHRCdelta15 chromosome 8 8 543941 543610 C 2005-11-07 2000-05-19 Ty1 LTR +S000003534 transposable_element_gene YHR214C-B gag-pol fusion protein chromosome 8 8 549346 543964 C 2005-11-07 1996-07-31 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes; YHR214C-B has a paralog, YAR070C, that arose from a segmental duplication +S000035139 CDS YHR214C-B 8 547929 543964 C 2005-11-07 1996-07-31 +S000035138 CDS YHR214C-B 8 549346 547931 C 2005-11-07 1996-07-31 +S000035140 plus_1_translational_frameshift YHR214C-B 8 547930 547930 C 2005-11-07 1996-07-31 +S000007421 transposable_element_gene YHR214C-C gag protein chromosome 8 8 549346 547910 C 2005-11-07 1999-07-17 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000035142 CDS YHR214C-C 8 549346 547910 C 2005-11-07 1999-07-17 +S000007006 LTR_retrotransposon YHRCTy1-1 Ty1 chromosome 8 8 549637 543610 C 2005-11-07 2000-05-19 Ty1 element, LTR retrotransposon of the Copia (Pseudoviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats +S000007002 long_terminal_repeat YHRCdelta16 chromosome 8 8 549637 549306 C 2005-11-07 2000-05-19 Ty1 LTR +S000028653 ORF Uncharacterized YHR214C-D chromosome 8 8 550941 550648 C 2005-11-07 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; SWAT-GFP and mCherry fusion proteins localize to the nucleus and endoplasmic reticulum respectively; YHR214C-D has a paralog, YAR069C, that arose from a segmental duplication +S000032456 CDS YHR214C-D 8 550941 550648 C 2005-11-07 2003-07-29 +S000028654 ORF Uncharacterized YHR214C-E chromosome 8 8 551499 551200 C 2005-11-07 2003-07-29 Putative protein of unknown function; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032457 CDS YHR214C-E 8 551499 551200 C 2005-11-07 2003-07-29 +S000001258 ORF Verified YHR215W PHO12 acid phosphatase PHO12|PHO10 chromosome 8 L000001424 8 552099 553502 W 2005-11-07 1996-07-31 One of three repressible acid phosphatases; glycoprotein that is transported to the cell surface by the secretory pathway; pregulated by phosphate starvation; PHO12 has a paralog, PHO11, that arose from a segmental duplication +S000033601 CDS YHR215W 8 552099 553502 W 2005-11-07 1996-07-31 +S000001259 ORF Verified YHR216W IMD2 IMP dehydrogenase IMD2|PUR5 chromosome 8 8 554396 555967 W 2005-11-07 1996-07-31 Inosine monophosphate dehydrogenase; catalyzes the rate-limiting step in GTP biosynthesis, expression is induced by mycophenolic acid resulting in resistance to the drug, expression is repressed by nutrient limitation; IMD2 has a paralog, YAR073W/YAR075W, that arose from a segmental duplication +S000034515 CDS YHR216W 8 554396 555967 W 2005-11-07 1996-07-31 +S000118363 ARS ARS824 ARSVIII-556 chromosome 8 8 556001 556331 2006-08-30 2006-08-30 Autonomously Replicating Sequence +S000028964 telomere TEL08R chromosome 8 8 556105 562643 W 131 2005-11-07 2003-09-09 Telomeric region on the right arm of Chromosome VIII; composed of an X element core sequence, X element combinatorial repeats, an internal stretch of telomeric repeats, a short Y' element, and a terminal stretch of telomeric repeats +S000028966 telomeric_repeat TEL08R 8 556832 556985 W 2005-11-07 2003-09-09 Internal telomeric repeats on the right arm of Chromosome VIII +S000028965 telomeric_repeat TEL08R 8 562457 562643 W 2005-11-07 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome VIII +S000028967 X_element TEL08R 8 556105 556575 W 2005-11-07 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome VIII; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028968 X_element_combinatorial_repeat TEL08R 8 556576 556831 W 2005-11-07 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr VIII; contains repeats of the D, C, and B types; formerly called SubTelomeric Repeats +S000028969 Y_prime_element TEL08R 8 556986 562456 W 2005-11-07 2003-09-09 Telomeric short Y' element on the right arm of Chromosome VIII; contains an ARS consensus sequence, a region of 36-bp repeats, and four ORFs (YHR218W, YHR219W, YHR218W-A, YHR219C-A) +S000001260 ORF Dubious YHR217C chromosome 8 8 557042 556581 C 2005-11-07 1996-07-31 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; located in the telomeric region TEL08R +S000034583 CDS YHR217C 8 557042 556581 C 2005-11-07 1996-07-31 +S000001261 ORF Uncharacterized YHR218W chromosome 8 8 558014 559924 W 2005-11-07 1996-07-31 Helicase-like protein encoded within the telomeric Y' element +S000034722 CDS YHR218W 8 558014 558615 W 2005-11-07 1996-07-31 +S000034723 CDS YHR218W 8 558715 559924 W 2005-11-07 1996-07-31 +S000034724 intron YHR218W 8 558616 558714 W 2005-11-07 1996-07-31 +S000028786 ORF Dubious YHR218W-A chromosome 8 8 559932 560249 W 2005-11-07 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely within telomere TEL08L +S000033530 CDS YHR218W-A 8 559932 560249 W 2005-11-07 2003-07-29 +S000001262 ORF Uncharacterized YHR219W chromosome 8 8 560173 562047 W 2005-11-07 1996-07-31 Putative protein of unknown function with similarity to helicases; located in the telomere region on the right arm of chromosome VIII +S000035716 CDS YHR219W 8 560173 562047 W 2005-11-07 1996-07-31 +S000028655 ORF Dubious YHR219C-A chromosome 8 8 561681 561199 C 2005-11-07 2003-07-29 Dubious open reading frame unlikely to encode a functional protein; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching +S000032458 CDS YHR219C-A 8 561681 561199 C 2005-11-07 2003-07-29 +S000028658 ORF Dubious YIL177W-A chromosome 9 9 846 1328 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the uncharacterized gene YIL177C +S000032462 CDS YIL177W-A 9 846 1328 W 2003-07-29 2003-07-29 +S000001439 ORF Uncharacterized YIL177C Y' element ATP-dependent helicase chromosome 9 9 6147 483 C 1994-12-10 1994-12-10 Putative Y' element ATP-dependent helicase +S000034517 CDS YIL177C 9 4598 483 C 1994-12-10 1994-12-10 +S000034516 CDS YIL177C 9 6147 4987 C 1994-12-10 1994-12-10 +S000034518 intron YIL177C 9 4986 4599 C 1994-12-10 1994-12-10 +S000130156 ARS ARS902 chromosome 9 9 7470 8793 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028896 telomere TEL09L chromosome 9 9 7784 1 C -155 2003-09-09 2003-09-09 Telomeric region on the left arm of Chromosome IX; composed of an X element core sequence, X element combinatorial repeats, a long Y' element, and a short terminal stretch of telomeric repeats +S000028897 telomeric_repeat TEL09L 9 77 1 C 2003-09-09 2003-09-09 Terminal telomeric repeats on the left arm of Chromosome IX +S000028898 X_element TEL09L 9 7784 7322 C 2003-09-09 2003-09-09 Telomeric X element Core sequence on the left arm of Chromosome IX; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028899 X_element_combinatorial_repeat TEL09L 9 7321 6949 C 2003-09-09 2003-09-09 Telomeric X element combinatorial repeat on the left arm of Chr IX; contains a repeat of the D type with a group I mitochondrial bI4 intron insertion; formerly called SubTelomeric Repeats +S000028900 Y_prime_element TEL09L 9 6948 78 C 2003-09-09 2003-09-09 Telomeric long Y' element on the left arm of Chromosome IX; contains an ARS consensus sequence, a region of 36-bp repeats, and two ORFs YIL177C and YIL177W-A +S000001438 ORF Uncharacterized YIL176C PAU14 seripauperin PAU14 chromosome 9 9 9155 8793 C 1994-12-10 1994-12-10 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; identical to Pau1p +S000034408 CDS YIL176C 9 9155 8793 C 1994-12-10 1994-12-10 +S000001437 pseudogene YIL175W chromosome 9 9 9183 9500 W 1994-12-10 1994-12-10 Hypothetical protein; classified as pseudogene because there is no ATG at the beginning of this ORF +S000034372 CDS YIL175W 9 9183 9500 W 1994-12-10 1994-12-10 +S000001436 pseudogene YIL174W chromosome 9 9 9469 9696 W 1994-12-10 1994-12-10 Hypothetical protein +S000034275 CDS YIL174W 9 9469 9696 W 1994-12-10 1994-12-10 +S000001435 ORF Verified YIL173W VTH1 signal sequence-binding protein chromosome 9 9 11492 16141 W 1994-12-10 1994-12-10 Putative membrane glycoprotein; has strong similarity to Vth2p and Pep1p/Vps10p; may be involved in vacuolar protein sorting +S000033367 CDS YIL173W 9 11492 16141 W 1994-12-10 1994-12-10 +S000130157 ARS ARS904 chromosome 9 9 16141 16784 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028798 ORF Dubious YIL171W-A chromosome 9 9 18260 18712 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF IMA3/YIL172C +S000033565 CDS YIL171W-A 9 18260 18712 W 2003-07-29 2003-07-29 +S000001434 ORF Verified YIL172C IMA3 oligo-1,6-glucosidase IMA3 chromosome 9 9 18553 16784 C 1994-12-10 1994-12-10 Alpha-glucosidase; weak, but broad substrate specificity for alpha-1,4- and alpha-1,6-glucosides; member of IMA isomaltase family; not required for isomaltose utilization, but Ima3p overexpression allows the ima1 null mutant to grow on isomaltose; lower activitiy and thermostability in vitro than Ima2p despite sequence difference of only 3 amino acids; cleaves alpha-1,3 linkage of nigerose and turanose, but not alpha-1,5 of leucrose; identical to IMA4 +S000033269 CDS YIL172C 9 18553 16784 C 1994-12-10 1994-12-10 +S000001433 pseudogene YIL171W HXT12 chromosome 9 L000002639 9 19515 19844 W 1994-12-10 1994-12-10 Possible pseudogene in strain S288C; YIL171W and the adjacent ORF, YIL170W/HXT12, together encode a non-functional member of the hexose transporter family +S000033235 CDS YIL171W 9 19515 19844 W 1994-12-10 1994-12-10 +S000001432 pseudogene YIL170W HXT12 chromosome 9 9 19847 21220 W 1994-12-10 1994-12-10 Possible pseudogene in strain S288C; YIL170W/HXT12 and the adjacent ORF, YIL171W, together encode a non-functional member of the hexose transporter family +S000032383 CDS YIL170W 9 19847 21220 W 1994-12-10 1994-12-10 +S000001431 ORF Verified YIL169C CSS1 HPF1' chromosome 9 9 26106 23119 C 1994-12-10 1994-12-10 Protein of unknown function, secreted when constitutively expressed; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the cell periphery, SWAT-GFP fusion also localizes to the extracellular region, and mCherry fusion also localizes to the vacuole; S/T rich and highly similar to YOL155C, a putative glucan alpha-1,4-glucosidase; transcript is induced in both high and low pH environments; non-essential gene +S000031425 CDS YIL169C 9 26106 23119 C 1994-12-10 1994-12-10 +S000001429 blocked_reading_frame YIL167W SDL1 YIL168W chromosome 9 9 29032 30048 W 2014-11-18 1994-12-10|2014-11-18 Blocked reading frame otherwise encoding L-serine dehydratase +S000031256 CDS YIL167W 9 29032 30048 W 2014-11-18 1994-12-10|2014-11-18 +S000001428 ORF Uncharacterized YIL166C chromosome 9 9 32566 30938 C 1994-12-10 1994-12-10 Putative protein with similarity to allantoate permease; similar to the allantoate permease (Dal5p) subfamily of the major facilitator superfamily; mRNA expression is elevated by sulfur limitation; YIL166C is a non-essential gene +S000030233 CDS YIL166C 9 32566 30938 C 1994-12-10 1994-12-10 +S000001427 ORF Uncharacterized YIL165C chromosome 9 9 34077 33718 C 1994-12-10 1994-12-10 Putative protein of unknown function; mutant exhibits mitophagy defects; in closely related species and other S. cerevisiae strain backgrounds YIL165C and adjacent ORF, YIL164C, likely constitute a single ORF encoding a nitrilase gene +S000030045 CDS YIL165C 9 34077 33718 C 1994-12-10 1994-12-10 +S000001426 ORF Verified YIL164C NIT1 chromosome 9 L000004211 9 34686 34087 C 1994-12-10 1994-12-10 Nitrilase; member of the nitrilase branch of the nitrilase superfamily; in closely related species and other S. cerevisiae strain backgrounds YIL164C and adjacent ORF, YIL165C, likely constitute a single ORF encoding a nitrilase gene +S000029934 CDS YIL164C 9 34686 34087 C 1994-12-10 1994-12-10 +S000001425 ORF Uncharacterized YIL163C chromosome 9 9 37252 36899 C 1994-12-10 1994-12-10 Protein of unknown function; mRNA identified as translated by ribosome profiling data +S000037273 CDS YIL163C 9 37252 36899 C 1994-12-10 1994-12-10 +S000001424 ORF Verified YIL162W SUC2 beta-fructofuranosidase SUC2 chromosome 9 L000002144 9 37385 38983 W -153 1994-12-10 1994-12-10 Invertase; sucrose hydrolyzing enzyme; a secreted, glycosylated form is regulated by glucose repression, and an intracellular, nonglycosylated enzyme is produced constitutively +S000037231 CDS YIL162W 9 37385 38983 W 1994-12-10 1994-12-10 +S000001423 ORF Uncharacterized YIL161W chromosome 9 9 39433 40140 W 1994-12-10 1994-12-10 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm; mRNA is enriched in Scp160p-associated mRNPs; YIL161W is a non-essential gene +S000037133 CDS YIL161W 9 39433 40140 W 1994-12-10 1994-12-10 +S000001422 ORF Verified YIL160C POT1 acetyl-CoA C-acyltransferase|POX3|FOX3 chromosome 9 L000001466 9 41444 40191 C 1994-12-10 1994-12-10 3-ketoacyl-CoA thiolase with broad chain length specificity; cleaves 3-ketoacyl-CoA into acyl-CoA and acetyl-CoA during beta-oxidation of fatty acids +S000037007 CDS YIL160C 9 41444 40191 C 1994-12-10 1994-12-10 +S000001421 ORF Verified YIL159W BNR1 formin BNR1 chromosome 9 L000004058 9 41825 45952 W 1994-12-10 1994-12-10 Formin; nucleates the formation of linear actin filaments; involved in processes such as budding and mitotic spindle orientation which require the formation of polarized actin cables; activity is regulated by Hof1p and by the Bud14p-Kel1p-Kel2p complex; dephosphorylated and delocalized from the division site in a Glc7p/Ref2p-dependent manner; functionally redundant with BNI1 +S000035282 CDS YIL159W 9 41825 45952 W 1994-12-10 1994-12-10 +S000001420 ORF Verified YIL158W AIM20 chromosome 9 9 46201 46815 W 1994-12-10 1994-12-10 Protein of unknown function; overexpression causes cell cycle delay or arrest; green fluorescent protein (GFP)-fusion protein localizes to vacuole; null mutant displays elevated frequency of mitochondrial genome loss; relocalizes from nucleus to cytoplasm upon DNA replication stress; AIM20 has a paralog, SKG1, that arose from the whole genome duplication +S000035094 CDS YIL158W 9 46201 46815 W 1994-12-10 1994-12-10 +S000028797 ORF Dubious YIL156W-A chromosome 9 9 47292 47693 W 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF COA1/YIL157C +S000033563 CDS YIL156W-A 9 47292 47693 W 2003-07-29 2003-07-29 +S000001419 ORF Verified YIL157C COA1 FMP35 chromosome 9 9 47542 46949 C 1994-12-10 1994-12-10 Mitochondrial inner membrane protein; required for assembly of the cytochrome c oxidase complex (complex IV); interacts with complex IV assembly factor Shy1p during the early stages of assembly +S000034088 CDS YIL157C 9 47542 46949 C 1994-12-10 1994-12-10 +S000028511 ORF Uncharacterized YIL156W-B chromosome 9 9 47690 47973 W 2003-07-29 2003-07-29 Putative protein of unknown function; originally identified based on homology to Ashbya gossypii and other related yeasts; SWAT-GFP and mCherry fusion proteins localize to the vacuole, while SWAT-GFP fusion also localizes to the endoplasmic reticulum +S000030265 CDS YIL156W-B 9 47690 47698 W 2003-07-29 2003-07-29 +S000030266 CDS YIL156W-B 9 47761 47973 W 2003-07-29 2003-07-29 +S000030267 intron YIL156W-B 9 47699 47760 W 2003-07-29 2003-07-29 +S000001418 ORF Verified YIL156W UBP7 ubiquitin-specific protease UBP7 chromosome 9 L000003169 9 48091 51306 W 1994-12-10 1994-12-10 Ubiquitin-specific protease that cleaves ubiquitin-protein fusions; UBP7 has a paralog, UBP11, that arose from the whole genome duplication +S000034053 CDS YIL156W 9 48091 51306 W 1994-12-10 1994-12-10 +S000001417 ORF Verified YIL155C GUT2 glycerol-3-phosphate dehydrogenase chromosome 9 L000000747 9 53708 51759 C 1994-12-10 1994-12-10 Mitochondrial glycerol-3-phosphate dehydrogenase; expression is repressed by both glucose and cAMP and derepressed by non-fermentable carbon sources in a Snf1p, Rsf1p, Hap2/3/4/5 complex dependent manner +S000033832 CDS YIL155C 9 53708 51759 C 1994-12-10 1994-12-10 +S000001416 ORF Verified YIL154C IMP2' IMP2 chromosome 9 L000000865 9 55021 53981 C 1994-12-10 1994-12-10 Transcriptional activator involved in maintenance of ion homeostasis; also involved in protection against DNA damage caused by bleomycin and other oxidants; contains a C-terminal leucine-rich repeat +S000033080 CDS YIL154C 9 55021 53981 C 1994-12-10 1994-12-10 +S000001415 ORF Verified YIL153W RRD1 peptidylprolyl isomerase RRD1|YPA1 chromosome 9 L000004483 9 55198 56379 W 1994-12-10 1994-12-10 Peptidyl-prolyl cis/trans-isomerase; activator of the phosphotyrosyl phosphatase activity of PP2A; involved in G1 phase progression, microtubule dynamics, bud morphogenesis and DNA repair; required for rapid reduction of Sgs1p levels in response to rapamycin; subunit of the Tap42p-Sit4p-Rrd1p complex; protein increases in abundance and relative distribution to the nucleus increases upon DNA replication stress +S000033043 CDS YIL153W 9 55198 56379 W 1994-12-10 1994-12-10 +S000001414 ORF Uncharacterized YIL152W chromosome 9 9 56545 57252 W 1994-12-10 1994-12-10 Putative protein of unknown function +S000032954 CDS YIL152W 9 56545 57252 W 1994-12-10 1994-12-10 +S000001413 ORF Uncharacterized YIL151C ESL1 chromosome 9 9 60694 57338 C 1994-12-10 1994-12-10 hEST1A/B (SMG5/6)-like protein; contributes to environment-sensing adaptive gene expression responses; Esl1p and Esl2p contain a 14-3-3-like domain and a putative PilT N-terminus ribonuclease domain; ESL1 has a paralog, ESL2, that arose from the whole genome duplication +S000032789 CDS YIL151C 9 60694 57338 C 1994-12-10 1994-12-10 +S000001412 ORF Verified YIL150C MCM10 DNA43 chromosome 9 L000000512 9 62728 61013 C 1994-12-10 1994-12-10 Essential chromatin-associated protein; involved in initiation of DNA replication; required for association of MCM2-7 complex with replication origins; required to stabilize catalytic subunit of DNA polymerase-alpha; self-associates through its N-terminal domain +S000031878 CDS YIL150C 9 62728 61013 C 1994-12-10 1994-12-10 +S000001411 ORF Verified YIL149C MLP2 chromosome 9 S000007510 9 68067 63028 C 1994-12-10 1994-12-10 Myosin-like protein associated with the nuclear envelope; nuclear basket protein that connects the nuclear pore complex with the nuclear interior; involved in the Tel1p pathway that controls telomere length; MLP2 has a paralog, MLP1, that arose from the whole genome duplication +S000031703 CDS YIL149C 9 68067 63028 C 1994-12-10 1994-12-10 +S000001410 ORF Verified YIL148W RPL40A eL40|ubiquitin-ribosomal 60S subunit protein L40A fusion protein|L40e|L40A|UB11|UBI1|CEP52A chromosome 9 L000002411|L000000313 9 68708 69528 W 1994-12-10 1994-12-10 Ubiquitin-ribosomal 60S subunit protein L40A fusion protein; cleaved to yield ubiquitin and ribosomal protein L40A; ubiquitin may facilitate assembly of the ribosomal protein into ribosomes; homologous to mammalian ribosomal protein L40, no bacterial homolog; RPL40A has a paralog, RPL40B, that arose from the whole genome duplication; relative distribution to the nucleus increases upon DNA replication stress +S000031651 CDS YIL148W 9 68708 68715 W 1994-12-10 1994-12-10 +S000031652 CDS YIL148W 9 69150 69528 W 1994-12-10 1994-12-10 +S000031653 intron YIL148W 9 68716 69149 W 1994-12-10 1994-12-10 +S000001409 ORF Verified YIL147C SLN1 YPD2 chromosome 9 L000001916 9 73453 69791 C 1994-12-10 1994-12-10 Transmembrane histidine phosphotransfer kinase and osmosensor; regulates MAP kinase cascade; transmembrane protein with an intracellular kinase domain that signals to Ypd1p and Ssk1p, thereby forming a phosphorelay system similar to bacterial two-component regulators +S000031443 CDS YIL147C 9 73453 69791 C 1994-12-10 1994-12-10 +S000178111 ARS ARS907 chromosome 9 9 73820 73991 2014-11-18 2014-11-18 Autonomously replicating sequence +S000001408 ORF Verified YIL146C ATG32 mitophagy protein ATG32|ECM37 chromosome 9 L000003904 9 75773 74184 C 1994-12-10 1994-12-10 Mitochondrial outer membrane protein required to initiate mitophagy; recruits the autophagy adaptor protein Atg11p and the ubiquitin-like protein Atg8p to the mitochondrial surface to initiate mitophagy, the selective vacuolar degradation of mitochondria in response to starvation; can promote pexophagy when placed ectopically in the peroxisomal membrane; regulates mitophagy and ethanol production during alcoholic fermentation +S000030520 CDS YIL146C 9 75773 74184 C 1994-12-10 1994-12-10 +S000001407 ORF Verified YIL145C PAN6 pantoate--beta-alanine ligase PAN6 chromosome 9 9 77283 76354 C 2003-09-22 2003-09-22|1994-12-10 Pantothenate synthase; also known as pantoate-beta-alanine ligase, required for pantothenic acid biosynthesis, deletion causes pantothenic acid auxotrophy, homologous to E. coli panC +S000030395 CDS YIL145C 9 77283 76354 C 2003-09-22 2003-09-22|1994-12-10 +S000001406 ORF Verified YIL144W NDC80 kinetochore-associated Ndc80 complex subunit NDC80|TID3|HEC1 chromosome 9 L000004311 9 78074 80149 W 1994-12-10 1994-12-10 Component of the kinetochore-associated Ndc80 complex; conserved coiled-coil protein involved in chromosome segregation, spindle checkpoint activity, and kinetochore assembly and clustering; evolutionarily conserved; complex members include Ndc80p, Nuf2p, Scp24p, and Spc25p; modified by sumoylation +S000030319 CDS YIL144W 9 78074 80149 W 1994-12-10 1994-12-10 +S000001405 ORF Verified YIL143C SSL2 TFIIH/NER complex ATPase/helicase subunit SSL2|RAD25|LOM3 chromosome 9 L000002086 9 83041 80510 C 1994-12-10 1994-12-10 Component of RNA polymerase transcription factor TFIIH holoenzyme; acts as dsDNA-dependent translocase in context of TFIIH, unwinds DNA strands during initiation and promotes transcription start site (TSS) scanning; has DNA-dependent ATPase/helicase activity; interacts functionally with TFIIB, has roles in TSS selection and gene looping to juxtapose initiation and termination regions; involved in DNA repair; relocalizes to cytosol under hypoxia; homolog of human ERCC3 +S000037507 CDS YIL143C 9 83041 80510 C 1994-12-10 1994-12-10 +S000001404 ORF Verified YIL142W CCT2 chaperonin-containing T-complex subunit CCT2|TCP2|BIN3 chromosome 9 L000002269 9 83302 84885 W 1994-12-10 1994-12-10 Subunit beta of the cytosolic chaperonin Cct ring complex; related to Tcp1p, required for the assembly of actin and tubulins in vivo +S000037439 CDS YIL142W 9 83302 84885 W 1994-12-10 1994-12-10 +S000028796 ORF Dubious YIL142C-A chromosome 9 9 83540 83208 C 2003-07-29 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF CCT2/YIL142W +S000033561 CDS YIL142C-A 9 83540 83208 C 2003-07-29 2003-07-29 +S000001403 ORF Dubious YIL141W chromosome 9 9 85053 85442 W 1994-12-10 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000037327 CDS YIL141W 9 85053 85442 W 1994-12-10 1994-12-10 +S000001402 ORF Verified YIL140W AXL2 SRO4|BUD10 chromosome 9 L000003104 9 85366 87837 W 1994-12-10 1994-12-10 Integral plasma membrane protein; required for axial budding in haploid cells; localizes to the incipient bud site and bud neck; glycosylated by Pmt4p; potential Cdc28p substrate +S000037249 CDS YIL140W 9 85366 87837 W 1994-12-10 1994-12-10 +S000001401 ORF Verified YIL139C REV7 chromosome 9 L000001618 9 88716 87979 C -101 1994-12-10 1994-12-10 Accessory subunit of DNA polymerase zeta; involved in translesion synthesis during post-replication repair; required for mutagenesis induced by DNA damage; involved in double-strand break repair; forms a complex with Rev3p, Pol31p and Pol32p +S000035566 CDS YIL139C 9 88716 87979 C 1994-12-10 1994-12-10 +S000001400 ORF Verified YIL138C TPM2 tropomyosin TPM2 chromosome 9 L000002329 9 89715 89230 C 1994-12-10 1994-12-10 Minor isoform of tropomyosin; binds to and stabilizes actin cables and filaments, which direct polarized cell growth and the distribution of several organelles; appears to have distinct and also overlapping functions with Tpm1p; TPM2 has a paralog, TPM1, that arose from the whole genome duplication +S000035475 CDS YIL138C 9 89715 89230 C 1994-12-10 1994-12-10 +S000001399 ORF Verified YIL137C TMA108 TAE3|RBF108 chromosome 9 9 92788 89948 C 1994-12-10 1994-12-10 Ribosome-associated, nascent chain binding factor; binds N-terminal region of nascent peptides during translation; recognizes target proteins via its putative metallopeptidase peptide-binding pocket +S000035340 CDS YIL137C 9 92788 89948 C 1994-12-10 1994-12-10 +S000001398 ORF Verified YIL136W OM45 chromosome 9 L000001301 9 93619 94800 W 1994-12-10 1994-12-10 Mitochondrial outer membrane protein of unknown function; major constituent of the outer membrane, extending into the intermembrane space; interacts with porin (Por1p) and with Om14p; imported via the presequence pathway involving the TOM and TIM23 complexes, then assembled in the outer membrane by Mim1p; protein abundance increases in response to DNA replication stress +S000034390 CDS YIL136W 9 93619 94800 W 1994-12-10 1994-12-10 +S000001397 ORF Verified YIL135C VHS2 chromosome 9 9 96375 95065 C 1994-12-10 1994-12-10 Regulator of septin dynamics; involved in the regulation of septin dynamics at bud neck after mitotic entry, likely by stabilizing septin structure; regulated at post-translational level by cell cycle dependent phosphorylation; likely phosphorylated by Cdc28p and dephosphorylated by Cdc14p before cytokinesis; high-copy suppressor of synthetic lethality of sis2 sit4 double mutant; VHS2 has a paralog, MLF3, that arose from the whole genome duplication +S000034198 CDS YIL135C 9 96375 95065 C 1994-12-10 1994-12-10 +S000028556 ORF Uncharacterized YIL134C-A chromosome 9 9 96725 96522 C 2003-07-29 2003-07-29 Putative protein of unknown function; identified by fungal homology and RT-PCR +S000031242 CDS YIL134C-A 9 96725 96522 C 2003-07-29 2003-07-29 +S000006459 snoRNA_gene snR68 SNR68 chromosome 9 L000004537 9 97111 97246 W 1994-12-10 1994-12-10 C/D box small nucleolar RNA (snoRNA); guides 2'-O-methylation of large subunit (LSU) rRNA at position A2640 +S000030855 noncoding_exon snR68 9 97111 97246 W 1994-12-10 1994-12-10 +S000001396 ORF Verified YIL134W FLX1 flavin adenine dinucleotide transporter FLX1 chromosome 9 L000002664 9 97395 98330 W 1994-12-10 1994-12-10 Mitochondrial flavin adenine dinucleotide transporter; FAD is a synthesis product of riboflavin; human homolog SLC25A32 is implicated in multiple acyl-CoA dehydrogenase deficiency (MADD) or glutaric aciduria type II (GAII), and can complement yeast null mutant +S000034150 CDS YIL134W 9 97395 98330 W 1994-12-10 1994-12-10 +S000001395 ORF Verified YIL133C RPL16A uL13|ribosomal 60S subunit protein L16A|L13|rp22|YL15|L21A|L16A|RPL13 chromosome 9 L000001709 9 99416 98527 C 1994-12-10 1994-12-10 Ribosomal 60S subunit protein L16A; N-terminally acetylated, binds 5.8 S rRNA; transcriptionally regulated by Rap1p; homologous to mammalian ribosomal protein L13A and bacterial L13; RPL16A has a paralog, RPL16B, that arose from the whole genome duplication; protein abundance increases in response to DNA replication stress +S000033253 CDS YIL133C 9 99095 98527 C 1994-12-10 1994-12-10 +S000033252 CDS YIL133C 9 99416 99386 C 1994-12-10 1994-12-10 +S000033254 intron YIL133C 9 99385 99096 C 1994-12-10 1994-12-10 +S000001394 ORF Verified YIL132C CSM2 chromosome 9 9 100501 99860 C 1994-12-10 1994-12-10 Component of Shu complex (aka PCSS complex); Shu complex also includes Psy3, Shu1, Shu2, and promotes error-free DNA repair,; Shu complex mediates inhibition of Srs2p function; promotes formation of Rad51p filaments; Psy3p and Csm2p contain similar DNA-binding regions which work together to form a single DNA binding site; required for accurate chromosome segregation during meiosis +S000033192 CDS YIL132C 9 100501 99860 C 1994-12-10 1994-12-10 +S000001393 ORF Verified YIL131C FKH1 forkhead family transcription factor FKH1 chromosome 9 L000002607 9 102235 100781 C 1994-12-10 1994-12-10 Forkhead family transcription factor; rate-limiting replication origin activator; evolutionarily conserved lifespan regulator; binds multiple chromosomal elements with distinct specificities, cell cycle dynamics; regulates transcription elongation, chromatin silencing at mating loci, expression of G2/M phase genes; facilitates clustering, activation of early-firing replication origins; binds HML recombination enhancer, regulates donor preference during mating-type switching +S000033138 CDS YIL131C 9 102235 100781 C 1994-12-10 1994-12-10 +S000001392 ORF Verified YIL130W ASG1 chromosome 9 9 102782 105676 W 1994-12-10 1994-12-10 Zinc cluster protein proposed to be a transcriptional regulator; regulator involved in the stress response; null mutants have a respiratory deficiency, calcofluor white sensitivity and slightly increased cycloheximide resistance +S000032296 CDS YIL130W 9 102782 105676 W 1994-12-10 1994-12-10 +S000118394 ARS ARS909 ARSIX-106 chromosome 9 9 105870 106053 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000001391 ORF Verified YIL129C TAO3 PAG1 chromosome 9 9 113237 106107 C 1994-12-10 1994-12-10 Component of the RAM signaling network; is involved in regulation of Ace2p activity and cellular morphogenesis, interacts with protein kinase Cbk1p and also with Kic1p +S000032290 CDS YIL129C 9 113237 106107 C 1994-12-10 1994-12-10 +S000130158 ARS ARS910 chromosome 9 9 113237 113806 2009-05-07 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001390 ORF Verified YIL128W MET18 MMS19 chromosome 9 L000003468 9 113806 116904 W 1994-12-10 1994-12-10 Component of cytosolic iron-sulfur protein assembly (CIA) machinery; acts at a late step of Fe-S cluster assembly; forms the CIA targeting complex with Cia1p and Cia2p that directs Fe-S cluster incorporation into a subset of proteins involved in methionine biosynthesis, DNA replication and repair, transcription, and telomere maintenance; ortholog of human MMS19 +S000032232 CDS YIL128W 9 113806 116904 W 1994-12-10 1994-12-10 +S000001389 ORF Uncharacterized YIL127C RRT14 chromosome 9 9 117644 117024 C 1994-12-10 1994-12-10 Putative protein of unknown function; identified in a screen for mutants with decreased levels of rDNA transcription; green fluorescent protein (GFP)-fusion protein localizes to the nucleolus; predicted to be involved in ribosome biogenesis +S000031158 CDS YIL127C 9 117644 117024 C 1994-12-10 1994-12-10 +S000001388 ORF Verified YIL126W STH1 RSC chromatin remodeling complex ATPase subunit STH1|NPS1 chromosome 9 L000002128 9 117992 122071 W -91 1994-12-10 1994-12-10 ATPase component of the RSC chromatin remodeling complex; required for expression of early meiotic genes; promotes base excision repair in chromatin; essential helicase-related protein homologous to Snf2p +S000031113 CDS YIL126W 9 117992 122071 W 1994-12-10 1994-12-10 +S000001387 ORF Verified YIL125W KGD1 alpha-ketoglutarate dehydrogenase KGD1|OGD1 chromosome 9 L000000897 9 122689 125733 W -91 1994-12-10 1994-12-10 Subunit of the mitochondrial alpha-ketoglutarate dehydrogenase complex; catalyzes a key step in the tricarboxylic acid (TCA) cycle, the oxidative decarboxylation of alpha-ketoglutarate to form succinyl-CoA +S000031016 CDS YIL125W 9 122689 125733 W 1994-12-10 1994-12-10 +S000001386 ORF Verified YIL124W AYR1 GBG1|acylglycerone-phosphate reductase chromosome 9 S000007473 9 126204 127097 W 1994-12-10 1994-12-10 Bifunctional triacylglycerol lipase and 1-acyl DHAP reductase; NADPH-dependent 1-acyl dihydroxyacetone phosphate reductase involved in phosphatidic acid biosynthesis; lipid droplet triacylglycerol lipase involved in the mobilization of non-polar lipids; found in lipid particles, the endoplasmic reticulum and the mitochondrial outer membrane; required for spore germination; role in cell wall biosynthesis; capable of metabolizing steroid hormones; oleic acid inducible +S000030012 CDS YIL124W 9 126204 127097 W 1994-12-10 1994-12-10 +S000001385 ORF Verified YIL123W SIM1 putative glucosidase SIM1 chromosome 9 L000003937 9 128151 129581 W 2011-02-03 1994-12-10|2011-02-03 Protein of the SUN family (Sim1p, Uth1p, Nca3p, Sun4p); may participate in DNA replication; promoter contains SCB regulation box at -300 bp indicating that expression may be cell cycle-regulated; SIM1 has a paralog, SUN4, that arose from the whole genome duplication +S000029900 CDS YIL123W 9 128151 129581 W 2011-02-03 1994-12-10|2011-02-03 +S000122103 five_prime_UTR_intron YIL123W 9 127662 128148 W 2007-04-04 2007-04-04 +S000001384 ORF Verified YIL122W POG1 chromosome 9 9 130610 131665 W 2011-02-03 1994-12-10 Nuclear chromatin-associated protein of unknown function; may have a role in cell cycle regulation; overexpression promotes recovery from pheromone induced arrest and suppresses the stress sensitivity caused by a mutation in the E3 ubiquitin ligase Rsp5p; binds upstream of BAR1 and cell cycle-related genes; phsosphoylated form may be ubiquitinated by Dma2p; potential Cdc28p substrate; SBF regulated +S000037860 CDS YIL122W 9 130610 131665 W 2011-02-03 1994-12-10 +S000001383 ORF Verified YIL121W QDR2 cation transporter chromosome 9 9 132244 133872 W 2011-02-03 1994-12-10 Plasma membrane transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; exports copper; has broad substrate specificity and can transport many mono- and divalent cations; transports a variety of drugs and is required for resistance to quinidine, barban, cisplatin, and bleomycin; contributes to potassium homeostasis; expression is regulated by copper +S000037111 CDS YIL121W 9 132244 133872 W 2011-02-03 1994-12-10 +S000001382 ORF Verified YIL120W QDR1 multidrug transporter chromosome 9 9 134417 136108 W 2011-02-03 1994-12-10 Multidrug transporter of the major facilitator superfamily; member of the 12-spanner drug:H(+) antiporter DHA1 family; involved in spore wall assembly; sequence similarity to DTR1 and QDR3, and the triple mutant dtr1 qdr1 qdr3 exhibits reduced dityrosine fluorescence relative to the single mutants; required for resistance to quinidine, ketoconazole, fluconazole, and barban; QDR1 has a paralog, AQR1, that arose from the whole genome duplication +S000037040 CDS YIL120W 9 134417 136108 W 2011-02-03 1994-12-10 +S000118395 ARS ARS911 ARSIX-136 chromosome 9 9 136098 136338 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178112 ARS_consensus_sequence ARS911 9 136288 136272 C 2014-11-18 2014-11-18 +S000001381 ORF Verified YIL119C RPI1 chromosome 9 L000001697 9 137877 136654 C 2011-02-03 1994-12-10 Transcription factor, allelic differences between S288C and Sigma1278b; mediates fermentation stress tolerance by modulating cell wall integrity; overexpression suppresses heat shock sensitivity of wild-type RAS2 overexpression and also suppresses cell lysis defect of mpk1 mutation; allele from S288c can confer fMAPK pathway independent transcription of FLO11; S288C and Sigma1278b alleles differ in number of tandem repeats within ORF +S000036217 CDS YIL119C 9 137877 136654 C 2011-02-03 1994-12-10 +S000001380 ORF Verified YIL118W RHO3 Rho family GTPase RHO3 chromosome 9 L000001632 9 139752 140447 W 2011-02-03 1994-12-10 Non-essential small GTPase of the Rho/Rac family of Ras-like proteins; involved in the establishment of cell polarity; GTPase activity positively regulated by the GTPase activating protein (GAP) Rgd1p +S000036201 CDS YIL118W 9 139752 140447 W 2011-02-03 1994-12-10 +S000001379 ORF Verified YIL117C PRM5 pheromone-regulated protein PRM5 chromosome 9 9 141569 140613 C 2011-02-03 1994-12-10 Pheromone-regulated protein, predicted to have 1 transmembrane segment; induced during cell integrity signaling; PRM5 has a paralog, YNL058C, that arose from the whole genome duplication +S000035189 CDS YIL117C 9 141569 140613 C 2011-02-03 1994-12-10 +S000001378 ORF Verified YIL116W HIS5 histidinol-phosphate transaminase chromosome 9 L000000782 9 142928 144085 W -89 2011-02-03 1994-12-10 Histidinol-phosphate aminotransferase; catalyzes the seventh step in histidine biosynthesis; responsive to general control of amino acid biosynthesis; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts +S000035124 CDS YIL116W 9 142928 144085 W 2011-02-03 1994-12-10 +S000028795 ORF Dubious YIL115W-A chromosome 9 9 144268 144639 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps the verified gene NUP159/YIL115C +S000033557 CDS YIL115W-A 9 144268 144639 W 2011-02-03 2003-07-29 +S000001377 ORF Verified YIL115C NUP159 FG-nucleoporin NUP159|RAT7|NUP158 chromosome 9 L000002782 9 148709 144327 C 2011-02-03 1994-12-10 FG-nucleoporin component of central core of the nuclear pore complex; also part of the nuclear pore complex (NPC) cytoplasmic filaments; contributes directly to nucleocytoplasmic transport; regulates ADP release from the ATP-dependent RNA helicase Dbp5p; forms a stable association with Nup82p, Gle2p and two other FG-nucleoporins (Nsp1p and Nup116p) +S000034872 CDS YIL115C 9 148709 144327 C 2011-02-03 1994-12-10 +S000001376 ORF Verified YIL114C POR2 putative porin POR2|YVDAC2 chromosome 9 L000003425 9 149988 149143 C 2011-02-03 1994-12-10 Putative mitochondrial porin (voltage-dependent anion channel); not required for mitochondrial membrane permeability or mitochondrial osmotic stability; POR2 has a paralog, POR1, that arose from the whole genome duplication +S000033971 CDS YIL114C 9 149988 149143 C 2011-02-03 1994-12-10 +S000001375 ORF Verified YIL113W SDP1 mitogen-activated protein kinase tyrosine protein phosphatase SDP1 chromosome 9 L000004339 9 150559 151188 W 2011-02-03 1994-12-10 Stress-inducible dual-specificity MAP kinase phosphatase; negatively regulates Slt2p MAP kinase by direct dephosphorylation, diffuse localization under normal conditions shifts to punctate localization after heat shock; SDP1 has a paralog, MSG5, that arose from the whole genome duplication +S000033917 CDS YIL113W 9 150559 151188 W 2011-02-03 1994-12-10 +S000001374 ORF Verified YIL112W HOS4 chromosome 9 9 151595 154846 W 2011-02-03 1994-12-10 Subunit of the Set3 complex; complex is a meiotic-specific repressor of sporulation specific genes that contains deacetylase activity; potential Cdc28p substrate +S000033813 CDS YIL112W 9 151595 154846 W 2011-02-03 1994-12-10 +S000001373 ORF Verified YIL111W COX5B cytochrome c oxidase subunit Vb chromosome 9 L000000389 9 155222 155765 W 2011-02-03 1994-12-10 Subunit Vb of cytochrome c oxidase; cytochrome c oxidase is the terminal member of the mitochondrial inner membrane electron transport chain; Cox5Bp is predominantly expressed during anaerobic growth while its isoform Va (Cox5Ap) is expressed during aerobic growth; COX5B has a paralog, COX5A, that arose from the whole genome duplication +S000033706 CDS YIL111W 9 155222 155222 W 2011-02-03 1994-12-10 +S000033707 CDS YIL111W 9 155311 155765 W 2011-02-03 1994-12-10 +S000033708 intron YIL111W 9 155223 155310 W 2011-02-03 1994-12-10 +S000001372 ORF Verified YIL110W HPM1 MNI1 chromosome 9 9 156045 157178 W 2011-02-03 1994-12-10 AdoMet-dependent methyltransferase; involved in a novel 3-methylhistidine modification of ribosomal protein Rpl3p; seven beta-strand MTase family member; null mutant exhibits a weak vacuolar protein sorting defect and caspofungin resistance +S000033038 CDS YIL110W 9 156045 157178 W 2011-02-03 1994-12-10 +S000001371 ORF Verified YIL109C SEC24 COPII subunit SEC24|ANU1 chromosome 9 L000004360 9 160165 157385 C 2011-02-03 1994-12-10 Component of the Sec23p-Sec24p heterodimer of the COPII vesicle coat; required for cargo selection during vesicle formation in ER to Golgi transport; homologous to Sfb3p; SEC24 has a paralog, SFB2, that arose from the whole genome duplication +S000034140 CDS YIL109C 9 160165 157385 C 2011-02-03 1994-12-10 +S000001370 ORF Verified YIL108W putative metalloendopeptidase chromosome 9 9 160887 162977 W 2011-02-03 1994-12-10 Putative metalloendopeptidase; forms cytoplasmic foci upon DNA replication stress +S000034098 CDS YIL108W 9 160887 162977 W 2011-02-03 1994-12-10 +S000001369 ORF Verified YIL107C PFK26 PFK-2|PFK2 chromosome 9 L000001406 9 165761 163278 C 2011-02-03 1994-12-10 6-phosphofructo-2-kinase; inhibited by phosphoenolpyruvate and sn-glycerol 3-phosphate; has negligible fructose-2,6-bisphosphatase activity; transcriptional regulation involves protein kinase A +S000032029 CDS YIL107C 9 165761 163278 C 2011-02-03 1994-12-10 +S000001368 ORF Verified YIL106W MOB1 chromosome 9 L000003356 9 166415 167444 W 2011-02-03 1999-11-17|1994-12-10 Component of the mitotic exit network; associates with and is required for the activation and Cdc15p-dependent phosphorylation of the Dbf2p kinase; required for cytokinesis and cell separation; component of the CCR4 transcriptional complex; relocalizes from cytoplasm to the nuclear periphery upon DNA replication stress +S000031985 CDS YIL106W 9 166415 166434 W 2011-02-03 1999-11-17|1994-12-10 +S000031986 CDS YIL106W 9 166520 167444 W 2011-02-03 1999-11-17 +S000031987 intron YIL106W 9 166435 166519 W 2011-02-03 1999-11-17 +S000028657 ORF Uncharacterized YIL105W-A chromosome 9 9 167664 167804 W 2011-02-03 2003-07-29 Protein of unknown function; completely overlaps the verified gene SLM1; identified by gene-trapping, microarray-based expression analysis, and genome-wide homology searching; mRNA identified as translated by ribosome profiling data +S000032461 CDS YIL105W-A 9 167664 167804 W 2011-02-03 2003-07-29 +S000001367 ORF Verified YIL105C SLM1 phosphatidylinositol 4,5-bisphosphate-binding protein|LIT2 chromosome 9 9 169641 167581 C 2011-02-03 1994-12-10 Phosphoinositide PI4,5P(2) binding protein, forms a complex with Slm2p; acts downstream of Mss4p in a pathway regulating actin cytoskeleton organization in response to stress; TORC2 complex substrate and effector; protein abundance increases in response to DNA replication stress; SLM1 has a paralog, SLM2, that arose from the whole genome duplication +S000030899 CDS YIL105C 9 169641 167581 C 2011-02-03 1994-12-10 +S000001366 ORF Verified YIL104C SHQ1 Hsp90 cochaperone SHQ1 chromosome 9 9 171505 169982 C 2011-02-03 1994-12-10 Chaperone protein; required for the assembly of box H/ACA snoRNPs and thus for pre-rRNA processing; functions as an RNA mimic; forms a complex with Naf1p and interacts with H/ACA snoRNP components Nhp2p and Cbf5p; homology with known Hsp90p cochaperones; relocalizes to the cytosol in response to hypoxia +S000030805 CDS YIL104C 9 171505 169982 C 2011-02-03 1994-12-10 +S000001365 ORF Verified YIL103W DPH1 KIF48 chromosome 9 9 171751 173028 W 2011-02-03 1994-12-10 Protein required for synthesis of diphthamide; required along with Dph2p, Kti11p, Jjj3p, and Dph5p; diphthamide is a modified histidine residue of translation elongation factor 2 (Eft1p or Eft2p); may act in a complex with Dph2p and Kti11p +S000030777 CDS YIL103W 9 171751 173028 W 2011-02-03 1994-12-10 +S000113587 ORF Uncharacterized YIL102C-A chromosome 9 9 173592 173365 C 2011-02-03 2005-11-21 Putative protein of unknown function; identified based on comparisons of the genome sequences of six Saccharomyces species; SWAT-GFP, seamless-GFP and mCherry fusion proteins localize to the endoplasmic reticulum +S000113588 CDS YIL102C-A 9 173592 173365 C 2011-02-03 2005-11-21 +S000001364 ORF Uncharacterized YIL102C chromosome 9 9 174887 174582 C 2011-02-03 1994-12-10 Putative protein of unknown function +S000030579 CDS YIL102C 9 174887 174582 C 2011-02-03 1994-12-10 +S000006741 tRNA_gene tT(AGU)I1 chromosome 9 L000003866 9 175031 175103 W 2011-02-03 1994-12-10 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000036345 noncoding_exon tT(AGU)I1 9 175031 175103 W 2011-02-03 1994-12-10 +S000118396 ARS ARS912 ARSIX-175 chromosome 9 9 175038 175358 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178113 ARS_consensus_sequence ARS912 9 175170 175186 W 2014-11-18 2014-11-18 +S000001363 ORF Verified YIL101C XBP1 chromosome 9 L000004246 9 177250 175307 C 2011-02-03 1994-12-10 Transcriptional repressor; binds promoter sequences of cyclin genes, CYS3, and SMF2; not expressed during log phase of growth, but induced by stress or starvation during mitosis, and late in meiosis; represses 15% of all yeast genes as cells transition to quiescence; important for maintaining G1 arrest and for longevity of quiescent cells; member of Swi4p/Mbp1p family; phosphorylated by Cdc28p; relative distribution to nucleus increases upon DNA replication stress +S000037752 CDS YIL101C 9 177250 175307 C 2011-02-03 1994-12-10 +S000001362 ORF Dubious YIL100W chromosome 9 9 177373 177726 W 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps the dubious ORF YIL100C-A +S000037716 CDS YIL100W 9 177373 177726 W 2011-02-03 1994-12-10 +S000028794 ORF Dubious YIL100C-A chromosome 9 9 177681 177343 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033555 CDS YIL100C-A 9 177681 177343 C 2011-02-03 2003-07-29 +S000001361 ORF Verified YIL099W SGA1 glucan 1,4-alpha-glucosidase chromosome 9 L000001875 9 178004 179653 W 2011-02-03 1994-12-10 Intracellular sporulation-specific glucoamylase; involved in glycogen degradation; induced during starvation of a/a diploids late in sporulation, but dispensable for sporulation +S000032666 CDS YIL099W 9 178004 179653 W 2011-02-03 1994-12-10 +S000001360 ORF Verified YIL098C FMC1 chromosome 9 L000004436 9 180239 179772 C 2011-02-03 1994-12-10 Mitochondrial matrix protein; required for assembly or stability at high temperature of the F1 sector of mitochondrial F1F0 ATP synthase; null mutant temperature sensitive growth on glycerol is suppressed by multicopy expression of Odc1p +S000032508 CDS YIL098C 9 180239 179772 C 2011-02-03 1994-12-10 +S000001359 ORF Verified YIL097W FYV10 glucose-induced degradation complex subunit FYV10|GID9 chromosome 9 9 180427 181977 W 2011-02-03 1994-12-10 Subunit of GID complex; involved in proteasome-dependent catabolite inactivation of gluconeogenic enzymes FBPase, PEPCK, and c-MDH; forms dimer with Rmd5p that is then recruited to GID Complex by Gid8p; contains a degenerate RING finger motif needed for GID complex ubiquitin ligase activity in vivo, as well as CTLH and CRA domains; plays role in anti-apoptosis; required for survival upon exposure to K1 killer toxin +S000032474 CDS YIL097W 9 180427 181977 W 2011-02-03 1994-12-10 +S000001358 ORF Verified YIL096C BMT5 25S rRNA (uracil2634-N3)-methyltransferase chromosome 9 9 183127 182117 C 2011-02-03 1994-12-10 Methyltransferase required for m3U2634 methylation of the 25S rRNA; S-adenosylmethionine-dependent; associates with precursors of the 60S ribosomal subunit; predicted to be involved in ribosome biogenesis +S000031394 CDS YIL096C 9 183127 182117 C 2011-02-03 1994-12-10 +S000006605 tRNA_gene tI(AAU)I1 chromosome 9 L000003875 9 183513 183440 C 2011-02-03 1994-12-10 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000030348 noncoding_exon tI(AAU)I1 9 183513 183440 C 2011-02-03 1994-12-10 +S000001357 ORF Verified YIL095W PRK1 serine/threonine protein kinase PRK1|PAK1 chromosome 9 L000002879 9 183937 186369 W 2011-02-03 1994-12-10 Protein serine/threonine kinase; regulates the organization and function of the actin cytoskeleton and reduces endocytic ability of cell through the phosphorylation of the Pan1p-Sla1p-End3p protein complex; PRK1 has a paralog, ARK1, that arose from the whole genome duplication +S000031347 CDS YIL095W 9 183937 186369 W 2011-02-03 1994-12-10 +S000001356 ORF Verified YIL094C LYS12 homoisocitrate dehydrogenase|LYS11|LYS10 chromosome 9 L000000970 9 187632 186517 C 2011-02-03 1994-12-10 Homo-isocitrate dehydrogenase; an NAD-linked mitochondrial enzyme required for the fourth step in the biosynthesis of lysine, in which homo-isocitrate is oxidatively decarboxylated to alpha-ketoadipate +S000031160 CDS YIL094C 9 187632 186517 C 2011-02-03 1994-12-10 +S000001355 ORF Verified YIL093C RSM25 mitochondrial 37S ribosomal protein RSM25 chromosome 9 9 188784 187990 C 2011-02-03 1994-12-10 Mitochondrial ribosomal protein of the small subunit +S000030231 CDS YIL093C 9 188784 187990 C 2011-02-03 1994-12-10 +S000001354 ORF Uncharacterized YIL092W chromosome 9 9 189066 190967 W 2011-02-03 1994-12-10 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the cytoplasm and to the nucleus +S000030095 CDS YIL092W 9 189066 190967 W 2011-02-03 1994-12-10 +S000001353 ORF Verified YIL091C UTP25 rRNA-binding ribosome biosynthesis protein UTP25 chromosome 9 9 193195 191030 C 2011-02-03 1994-12-10 Nucleolar protein; required for 35S pre-RNA processing and 40S ribosomal subunit biogenesis +S000029923 CDS YIL091C 9 193195 191030 C 2011-02-03 1994-12-10 +S000001352 ORF Verified YIL090W ICE2 chromosome 9 9 193595 195070 W 2011-02-03 1994-12-10 Integral ER membrane protein with type-III transmembrane domains; required for maintenance of ER zinc homeostasis; necessary for efficient targeting of Trm1p tRNA methyltransferase to inner nuclear membrane; mutations cause defects in cortical ER morphology in both the mother and daughter cells +S000029886 CDS YIL090W 9 193595 195070 W 2011-02-03 1994-12-10 +S000001351 ORF Verified YIL089W chromosome 9 9 195599 196216 W 2011-02-03 1994-12-10 Protein of unknown function found in the ER and vacuole lumen; overexpression of YIL089W affects endocytic protein trafficking +S000036415 CDS YIL089W 9 195599 196216 W 2011-02-03 1994-12-10 +S000007015 long_terminal_repeat YILCtau1 chromosome 9 9 197023 196653 C 2011-02-03 1994-12-10 Ty4 LTR +S000007011 long_terminal_repeat YILCdelta1 chromosome 9 9 197488 197140 C 2011-02-03 1994-12-10 Ty1 LTR +S000006547 tRNA_gene tE(CUC)I chromosome 9 L000003867 9 197592 197663 W 2011-02-03 1994-12-10 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis +S000031939 noncoding_exon tE(CUC)I 9 197592 197663 W 2011-02-03 1994-12-10 +S000001350 ORF Verified YIL088C AVT7 chromosome 9 9 199403 197931 C 2011-02-03 1994-12-10 Putative transporter; member of a family of seven S. cerevisiae genes (AVT1-7) related to vesicular GABA-glycine transporters +S000036264 CDS YIL088C 9 199403 197931 C 2011-02-03 1994-12-10 +S000001349 ORF Verified YIL087C AIM19 LRC2 chromosome 9 9 200119 199646 C 2011-02-03 1994-12-10 Protein of unknown function; mitochondrial protein that physically interacts with Tim23p; null mutant displays reduced respiratory growth +S000035319 CDS YIL087C 9 200119 199646 C 2011-02-03 1994-12-10 +S000001348 ORF Dubious YIL086C chromosome 9 9 200461 200153 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000035155 CDS YIL086C 9 200461 200153 C 2011-02-03 1994-12-10 +S000001347 ORF Verified YIL085C KTR7 putative mannosyltransferase chromosome 9 L000004100 9 202043 200490 C 2011-02-03 1994-12-10 Putative mannosyltransferase involved in protein glycosylation; member of the KRE2/MNT1 mannosyltransferase family; KTR7 has a paralog, KTR5, that arose from the whole genome duplication +S000035010 CDS YIL085C 9 202043 200490 C 2011-02-03 1994-12-10 +S000001346 ORF Verified YIL084C SDS3 chromosome 9 L000003384 9 203259 202276 C 2011-02-03 1994-12-10 Component of the Rpd3L histone deacetylase complex; required for its structural integrity and catalytic activity, involved in transcriptional silencing and required for sporulation; relocalizes to the cytosol in response to hypoxia; cells defective in SDS3 display pleiotropic phenotypes +S000034086 CDS YIL084C 9 203259 202276 C 2011-02-03 1994-12-10 +S000001345 ORF Verified YIL083C CAB2 phosphopantothenate--cysteine ligase CAB2 chromosome 9 9 204653 203556 C 2011-02-03 1994-12-10|2011-02-03 Subunit of the CoA-Synthesizing Protein Complex (CoA-SPC); subunits of this complex are: Cab2p, Cab3p, Cab4p, Cab5p, Sis2p and Vhs3p; probable phosphopantothenoylcysteine synthetase (PPCS), which catalyzes the second step of coenzyme A biosynthesis from pantothenate; null mutant lethality is complemented by human homolog PPCS and by E. coli coaBC (encoding a bifunctional enzyme with PPCS activity) +S000033946 CDS YIL083C 9 204653 203556 C 2011-02-03 1994-12-10|2011-02-03 +S000007017 long_terminal_repeat YILWsigma1 chromosome 9 9 205220 205559 W 2011-02-03 1994-12-10 Ty3 LTR +S000007020 LTR_retrotransposon YILWTy3-1 Ty3 chromosome 9 9 205220 210647 W 2011-02-03 1994-12-10 Ty3 element, LTR retrotransposon of the Gypsy (Metaviridae) group; contains co-transcribed genes TYA Gag and TYB Pol, encoding proteins involved in structure and function of virus-like particles, flanked by two direct repeats; transposition is induced upon exposure to mating pheromone +S000001344 ORF Dubious YIL082W chromosome 9 9 205635 206507 W 2011-02-03 1994-12-10 Retrotransposon TYA Gag gene co-transcribed with TYB Pol; translated as TYA or TYA-TYB polyprotein; Gag is a nucleocapsid protein that is the structural constituent of virus-like particles (VLPs); similar to retroviral Gag +S000033890 CDS YIL082W 9 205635 206507 W 2011-02-03 1994-12-10 +S000003537 transposable_element_gene YIL082W-A gag-pol fusion protein chromosome 9 9 205635 210132 W 2011-02-03 1994-12-10|1999-07-17 Retrotransposon TYA Gag and TYB Pol genes; transcribed/translated as one unit; polyprotein is processed to make a nucleocapsid-like protein (Gag), reverse transcriptase (RT), protease (PR), and integrase (IN); similar to retroviral genes +S000030100 CDS YIL082W-A 9 205635 206485 W 2011-02-03 1999-07-17|1994-12-10 +S000030101 CDS YIL082W-A 9 206487 210132 W 2011-02-03 1999-07-17|1994-12-10 +S000030102 plus_1_translational_frameshift YIL082W-A 9 206486 206486 W 2011-02-03 1999-07-17|1994-12-10 +S000007018 long_terminal_repeat YILWsigma2 chromosome 9 9 210308 210647 W 2011-02-03 1994-12-10 Ty3 LTR +S000006606 tRNA_gene tI(AAU)I2 chromosome 9 L000003868 9 210665 210738 W 2011-02-03 1994-12-10 Isoleucine tRNA (tRNA-Ile), predicted by tRNAscan-SE analysis +S000030349 noncoding_exon tI(AAU)I2 9 210665 210738 W 2011-02-03 1994-12-10 +S000001341 ORF Verified YIL079C AIR1 TRAMP complex RNA-binding subunit chromosome 9 S000028413 9 212005 210923 C 2011-02-03 1994-12-10 Zinc knuckle protein; involved in nuclear RNA processing and degradation as a component of the TRAMP complex; stimulates the poly(A) polymerase activity of Pap2p in vitro; AIR1 has a paralog, AIR2, that arose from the whole genome duplication; although Air1p and Air2p are homologous TRAMP subunits, they have nonredundant roles in regulation of substrate specificity of the exosome +S000032850 CDS YIL079C 9 212005 210923 C 2011-02-03 1994-12-10 +S000001340 ORF Verified YIL078W THS1 threonine--tRNA ligase THS1 chromosome 9 L000002301 9 212499 214703 W 2011-02-03 1994-12-10 Threonyl-tRNA synthetase; essential cytoplasmic protein; human homolog TARS can complement yeast null mutant +S000032807 CDS YIL078W 9 212499 214703 W 2011-02-03 1994-12-10 +S000007644 ARS ARS913 ARS901 ARSIX-215|ARS249 chromosome 9 9 214624 214754 2014-11-18 2001-03-06|2014-11-18|2006-09-08 Autonomously Replicating Sequence +S000178114 ARS_consensus_sequence ARS913 9 214732 214748 W 2014-11-18 2014-11-18 +S000001339 ORF Uncharacterized YIL077C chromosome 9 9 215953 214991 C 2011-02-03 1994-12-10 Putative protein of unknown function; the authentic, non-tagged protein is detected in highly purified mitochondria in high-throughput studies; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) +S000032673 CDS YIL077C 9 215953 214991 C 2011-02-03 1994-12-10 +S000001338 ORF Verified YIL076W SEC28 coatomer subunit epsilon|ANU2 chromosome 9 L000004402 9 216658 217548 W 2011-02-03 1994-12-10|2005-11-22 Epsilon-COP subunit of the coatomer; regulates retrograde Golgi-to-ER protein traffic; stabilizes Cop1p, the alpha-COP and the coatomer complex; non-essential for cell growth; protein abundance increases in response to DNA replication stress +S000032630 CDS YIL076W 9 216658 217548 W 2011-02-03 1994-12-10|2005-11-22 +S000001337 ORF Verified YIL075C RPN2 proteasome regulatory particle base subunit RPN2|SEN3 chromosome 9 L000001864 9 220700 217863 C 2011-02-03 1994-12-10 Subunit of the 26S proteasome; substrate of the N-acetyltransferase Nat1p; protein abundance increases in response to DNA replication stress +S000031543 CDS YIL075C 9 220700 217863 C 2011-02-03 1994-12-10 +S000001336 ORF Verified YIL074C SER33 phosphoglycerate dehydrogenase SER33 chromosome 9 S000007458 9 222490 221081 C 2011-02-03 1994-12-10 3-phosphoglycerate dehydrogenase and alpha-ketoglutarate reductase; 3PG dehydrogenase that catalyzes the first step in serine and glycine biosynthesis; also functions as an alpha-ketoglutarate reductase, converting alpha-ketoglutarate to D-2-hydroxyglutarate (D-2HG); localizes to the cytoplasm; SER33 has a paralog, SER3, that arose from the whole genome duplication +S000031439 CDS YIL074C 9 222490 221081 C 2011-02-03 1994-12-10 +S000001335 ORF Verified YIL073C SPO22 ZIP4 chromosome 9 9 225954 222937 C 2011-02-03 2003-09-27|1994-12-10 Meiosis-specific protein essential for chromosome synapsis; involved in completion of nuclear divisions during meiosis; induced early in meiosis +S000030517 CDS YIL073C 9 225809 222937 C 2011-02-03 2003-09-27 +S000030516 CDS YIL073C 9 225954 225900 C 2011-02-03 2003-09-27|1994-12-10 +S000030518 intron YIL073C 9 225899 225810 C 2011-02-03 2003-09-27 +S000001334 ORF Verified YIL072W HOP1 chromosome 9 L000000802 9 226602 228419 W -59 2011-02-03 1994-12-10 Meiosis-specific protein required for chromosome synapsis; displays Red1p dependent localization to the unsynapsed axial-lateral elements of the synaptonemal complex; required for chiasma formation; in vitro, displays the ability to promote intra- and intermolecular synapsis between double-stranded DNA molecules and to fold DNA into rigid protein-DNA filaments +S000030472 CDS YIL072W 9 226602 228419 W 2011-02-03 1994-12-10 +S000028793 ORF Dubious YIL071W-A chromosome 9 9 228550 229026 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF PCI8/YIL071C +S000033552 CDS YIL071W-A 9 228550 229026 W 2011-02-03 2003-07-29 +S000001333 ORF Verified YIL071C PCI8 YIL071W|CSN11|YIH1 chromosome 9 S000007580 9 229994 228660 C 2011-02-03 1994-12-10 Possible shared subunit of Cop9 signalosome (CSN) and eIF3; binds eIF3b subunit Prt1p, has possible dual functions in transcriptional and translational control, contains a PCI (Proteasome-COP9 signalosome (CSN)-eIF3) domain +S000030209 CDS YIL071C 9 229994 228660 C 2011-02-03 1994-12-10 +S000001332 ORF Verified YIL070C MAM33 chromosome 9 9 231072 230272 C 2011-02-03 1994-12-10 Specific translational activator for the mitochondrial COX1 mRNA; acidic protein of the mitochondrial matrix; related to the human complement receptor gC1q-R +S000037502 CDS YIL070C 9 231072 230272 C 2011-02-03 1994-12-10 +S000001331 ORF Verified YIL069C RPS24B eS24|ribosomal 40S subunit protein S24B|S24e|S24B|RPS24EB chromosome 9 L000002711 9 232369 231553 C 2011-02-03 1994-12-10 Protein component of the small (40S) ribosomal subunit; homologous to mammalian ribosomal protein S24, no bacterial homolog; RPS24B has a paralog, RPS24A, that arose from the whole genome duplication +S000036651 CDS YIL069C 9 231957 231553 C 2011-02-03 1994-12-10 +S000036650 CDS YIL069C 9 232369 232367 C 2011-02-03 1994-12-10 +S000036652 intron YIL069C 9 232366 231958 C 2011-02-03 1994-12-10 +S000028792 ORF Dubious YIL068W-A chromosome 9 9 233013 233396 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SEC6/YIL068C +S000033551 CDS YIL068W-A 9 233013 233396 W 2011-02-03 2003-07-29 +S000001330 ORF Verified YIL068C SEC6 SNARE-binding exocyst subunit SEC6 chromosome 9 L000001832 9 235474 233057 C 2011-02-03 1994-12-10 Essential 88kDa subunit of the exocyst complex; the exocyst mediates polarized targeting and tethering of post-Golgi secretory vesicles to active sites of exocytosis at the plasma membrane prior to SNARE-mediated fusion; anchors the assembled complex to sites of secretion; interacts with SM-like protein and SNARE regulator Sec1p and may recruit it to sites of secretion; binds to SNARE complexes binteracting with Sec9p +S000036567 CDS YIL068C 9 235474 233057 C 2011-02-03 1994-12-10 +S000028791 ORF Dubious YIL066W-A chromosome 9 9 237366 237809 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF YIL067C +S000033550 CDS YIL066W-A 9 237366 237809 W 2011-02-03 2003-07-29 +S000001329 ORF Uncharacterized YIL067C chromosome 9 9 237760 235724 C 2011-02-03 1994-12-10 Uncharacterized protein of unknown function +S000035626 CDS YIL067C 9 237760 235724 C 2011-02-03 1994-12-10 +S000001328 ORF Verified YIL066C RNR3 ribonucleotide-diphosphate reductase subunit RNR3|RIR3|DIN1 chromosome 9 L000001644|L000001657 9 240708 238099 C 2011-02-03 1994-12-10 Minor isoform of large subunit of ribonucleotide-diphosphate reductase; the RNR complex catalyzes rate-limiting step in dNTP synthesis, regulated by DNA replication and DNA damage checkpoint pathways via localization of small subunits; RNR3 has a paralog, RNR1, that arose from the whole genome duplication +S000035554 CDS YIL066C 9 240708 238099 C 2011-02-03 1994-12-10 +S000001327 ORF Verified YIL065C FIS1 MDV2 chromosome 9 9 241775 241308 C 2011-02-03 1994-12-10 Protein involved in mitochondrial fission and peroxisome abundance; may have a distinct role in tethering protein aggregates to mitochondria in order to retain them in the mother cell; required for localization of Dnm1p and Mdv1p during mitochondrial division; mediates ethanol-induced apoptosis and ethanol-induced mitochondrial fragmentation +S000035474 CDS YIL065C 9 241775 241308 C 2011-02-03 1994-12-10 +S000001326 ORF Verified YIL064W EFM4 SEE1 chromosome 9 9 241943 242716 W 2011-02-03 1994-12-10 Lysine methyltransferase; involved in the dimethylation of eEF1A (Tef1p/Tef2p) at lysine 316; sequence similarity to S-adenosylmethionine-dependent methyltransferases of the seven beta-strand family; role in vesicular transport +S000035414 CDS YIL064W 9 241943 242716 W 2011-02-03 1994-12-10 +S000001325 ORF Verified YIL063C YRB2 chromosome 9 L000002886 9 243744 242761 C 2011-02-03 1994-12-10 Protein of unknown function; involved in nuclear processes of the Ran-GTPase cycle; involved in nuclear protein export; contains Ran Binding Domain and FxFG repeats; interacts with Srm1p, GTP-Gsp1p, Rna1p and Crm1p; relocalizes to the cytosol in response to hypoxia; not essential for viability +S000034323 CDS YIL063C 9 243744 242761 C 2011-02-03 1994-12-10 +S000001324 ORF Verified YIL062C ARC15 chromosome 9 L000004032 9 244462 243998 C 2011-02-03 1994-12-10 Subunit of the ARP2/3 complex; ARP2/3 is required for the motility and integrity of cortical actin patches; has mRNA binding activity +S000034193 CDS YIL062C 9 244462 243998 C 2011-02-03 1994-12-10 +S000001323 ORF Verified YIL061C SNP1 U1 snRNP complex subunit SNP1|U1-70K chromosome 9 L000001954 9 245559 244657 C 2011-02-03 1994-12-10 Component of U1 snRNP required for mRNA splicing via spliceosome; substrate of the arginine methyltransferase Hmt1p; may interact with poly(A) polymerase to regulate polyadenylation; homolog of human U1 70K protein; protein abundance increases in response to DNA replication stress +S000033301 CDS YIL061C 9 245559 244657 C 2011-02-03 1994-12-10 +S000119034 ARS ARS923 ARSIX-246|ARS913.5 chromosome 9 9 245756 245925 2014-11-18 2014-11-18|2006-10-03 Autonomously Replicating Sequence +S000178115 ARS_consensus_sequence ARS923 9 245880 245864 C 2014-11-18 2014-11-18 +S000007012 long_terminal_repeat YILWdelta2 YILCdelta2 chromosome 9 9 246220 246552 W 2011-02-03 1994-12-10|2007-04-03 Ty2 LTR +S000001322 ORF Verified YIL060W chromosome 9 9 246392 246826 W 2011-02-03 1994-12-10 Mitochondrial protein of unknown function; required for respiratory growth; mutant accumulates less glycogen than does wild type; null mutation results in a decrease in plasma membrane electron transport; YIL060W is not an essential gene +S000033276 CDS YIL060W 9 246392 246826 W 2011-02-03 1994-12-10 +S000001320 ORF Dubious YIL058W chromosome 9 9 246914 247198 W 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034459 CDS YIL058W 9 246914 247198 W 2011-02-03 1994-12-10 +S000001321 ORF Dubious YIL059C chromosome 9 9 246915 246550 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps the uncharacterized ORF YIL060W +S000034503 CDS YIL059C 9 246915 246550 C 2011-02-03 1994-12-10 +S000118397 ARS ARS914 ARSIX-248 chromosome 9 9 247705 247760 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178116 ARS_consensus_sequence ARS914 9 247752 247736 C 2014-11-18 2014-11-18 +S000001319 ORF Verified YIL057C RGI2 chromosome 9 9 248396 247902 C 2011-02-03 1994-12-10 Protein of unknown function; involved in energy metabolism under respiratory conditions; expression induced under carbon limitation and repressed under high glucose; RGI2 has a paralog, RGI1, that arose from the whole genome duplication +S000032397 CDS YIL057C 9 248396 247902 C 2011-02-03 1994-12-10 +S000130159 ARS ARS915 chromosome 9 9 248396 248850 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000006735 tRNA_gene tS(UGA)I SUP17 chromosome 9 L000002191|L000003869 9 248850 248931 W -53 2011-02-03 1994-12-10 Serine tRNA (tRNA-Ser), predicted by tRNAscan-SE analysis; can mutate to suppress ochre nonsense mutations +S000034050 noncoding_exon tS(UGA)I 9 248850 248931 W 2011-02-03 1994-12-10 +S000001318 ORF Verified YIL056W VHR1 chromosome 9 9 249991 251913 W 2011-02-03 1994-12-10 Transcriptional activator; required for the vitamin H-responsive element (VHRE) mediated induction of VHT1 (Vitamin H transporter) and BIO5 (biotin biosynthesis intermediate transporter) in response to low biotin concentrations; VHR1 has a paralog, VHR2, that arose from the whole genome duplication +S000032356 CDS YIL056W 9 249991 251913 W 2011-02-03 1994-12-10 +S000001317 ORF Uncharacterized YIL055C chromosome 9 9 253925 252042 C 2011-02-03 1994-12-10 Putative protein of unknown function +S000031292 CDS YIL055C 9 253925 252042 C 2011-02-03 1994-12-10 +S000001316 ORF Uncharacterized YIL054W chromosome 9 9 254543 254860 W 2011-02-03 1994-12-10 Protein of unknown function; expressed at both mRNA and protein levels +S000031254 CDS YIL054W 9 254543 254860 W 2011-02-03 1994-12-10 +S000001315 ORF Verified YIL053W GPP1 RHR2|glycerol-1-phosphatase RHR2 chromosome 9 L000003988 9 255115 255867 W 2011-02-03 1994-12-10|2006-01-24 Constitutively expressed DL-glycerol-3-phosphate phosphatase; also known as glycerol-1-phosphatase; involved in glycerol biosynthesis, induced in response to both anaerobic and osmotic stress; GPP1 has a paralog, GPP2, that arose from the whole genome duplication +S000031111 CDS YIL053W 9 255115 255867 W 2011-02-03 1994-12-10|2006-01-24 +S000001314 ORF Verified YIL052C RPL34B eL34|ribosomal 60S subunit protein L34B|L34e|L34B chromosome 9 L000004466 9 257063 256226 C 2011-02-03 1994-12-10 Ribosomal 60S subunit protein L34B; homologous to mammalian ribosomal protein L34, no bacterial homolog; RPL34B has a paralog, RPL34A, that arose from the whole genome duplication +S000030947 CDS YIL052C 9 256554 256226 C 2011-02-03 1994-12-10 +S000030946 CDS YIL052C 9 257063 257027 C 2011-02-03 1994-12-10 +S000030948 intron YIL052C 9 257026 256555 C 2011-02-03 1994-12-10 +S000001313 ORF Verified YIL051C MMF1 isoleucine biosynthesis protein MMF1|IBM1 chromosome 9 L000004449 9 258280 257843 C 2011-02-03 1994-12-10 Mitochondrial protein required for transamination of isoleucine; but not of valine or leucine; may regulate specificity of branched-chain transaminases Bat1p and Bat2p; induction of expression in response to stress is mediated by a Hog1p-regulated antisense RNA and gene looping; interacts genetically with mitochondrial ribosomal protein genes; MMF1 has a paralog, HMF1, that arose from the whole genome duplication +S000029935 CDS YIL051C 9 258280 257843 C 2011-02-03 1994-12-10 +S000001312 ORF Verified YIL050W PCL7 chromosome 9 L000004039 9 258913 259770 W 2011-02-03 1994-12-10 Pho85p cyclin of the Pho80p subfamily; forms a functional kinase complex with Pho85p which phosphorylates Mmr1p and is regulated by Pho81p; involved in glycogen metabolism, expression is cell-cycle regulated; PCL7 has a paralog, PCL6, that arose from the whole genome duplication +S000029899 CDS YIL050W 9 258913 259770 W 2011-02-03 1994-12-10 +S000001311 ORF Verified YIL049W DFG10 putative polyprenol reductase chromosome 9 L000004073 9 260158 260919 W 2011-02-03 1994-12-10 Probable polyprenol reductase; catalyzes conversion of polyprenol to dolichol, the precursor for N-glycosylation; involved in filamentous growth; mutations in human homolog SRD5A3 confer CDG (Congenital Disorders of Glycosylation); human SRD5A3 can complement yeast null mutant +S000030228 CDS YIL049W 9 260158 260919 W 2011-02-03 1994-12-10 +S000001310 ORF Verified YIL048W NEO1 putative aminophospholipid-translocating P4-type ATPase NEO1 chromosome 9 L000004112 9 261437 264892 W 2011-02-03 1994-12-10 Phospholipid translocase (flippase), role in phospholipid asymmetry of plasma membrane; involved in endocytosis, vacuolar biogenesis and Golgi to ER vesicle-mediated transport; localizes to endosomes and the Golgi apparatus +S000030109 CDS YIL048W 9 261437 264892 W 2011-02-03 1994-12-10 +S000028790 ORF Dubious YIL047C-A chromosome 9 9 265467 265099 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SYG1/YIL047C +S000033549 CDS YIL047C-A 9 265467 265099 C 2011-02-03 2003-07-29 +S000001309 ORF Verified YIL047C SYG1 chromosome 9 L000002256 9 267823 265115 C 2011-02-03 1994-12-10 Plasma membrane protein of unknown function; truncation and overexpression suppresses lethality of G-alpha protein deficiency +S000036323 CDS YIL047C 9 267823 265115 C 2011-02-03 1994-12-10 +S000028836 ORF Uncharacterized YIL046W-A chromosome 9 9 268309 268473 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034486 CDS YIL046W-A 9 268309 268473 W 2011-02-03 2003-07-29 +S000001308 ORF Verified YIL046W MET30 ubiquitin-binding SDF ubiquitin ligase complex subunit MET30|ZRG11 chromosome 9 L000001093 9 268651 270573 W 2011-02-03 1994-12-10 F-box protein containing five copies of the WD40 motif; controls cell cycle function, sulfur metabolism, and methionine biosynthesis as part of the ubiquitin ligase complex; interacts with and regulates Met4p, localizes within the nucleus; dissociation of Met30p from SCF complex in response to cadmium stress is regulated by Cdc48p +S000036284 CDS YIL046W 9 268651 270573 W 2011-02-03 1994-12-10 +S000001307 ORF Verified YIL045W PIG2 putative protein phosphatase regulator PIG2 chromosome 9 L000001437 9 271161 272777 W 2011-02-03 1994-12-10 Putative type-1 protein phosphatase targeting subunit; tethers Glc7p type-1 protein phosphatase to Gsy2p glycogen synthase; PIG2 has a paralog, GIP2, that arose from the whole genome duplication +S000036173 CDS YIL045W 9 271161 272777 W 2011-02-03 1994-12-10 +S000001306 ORF Verified YIL044C AGE2 SAT2 chromosome 9 S000007503 9 273846 272950 C 2011-02-03 1994-12-10 ADP-ribosylation factor (ARF) GTPase activating protein (GAP) effector; involved in Trans-Golgi-Network (TGN) transport; contains C2C2H2 cysteine/histidine motif +S000035184 CDS YIL044C 9 273846 272950 C 2011-02-03 1994-12-10 +S000001305 ORF Verified YIL043C CBR1 CBR5 chromosome 9 L000000229 9 274926 274072 C 2011-02-03 1994-12-10|2006-01-23 Cytochrome b reductase; not essential for viability; also detected in mitochondria; mutation in conserved NADH binding domain of the human ortholog results in type I methemoglobinemia +S000035022 CDS YIL043C 9 274926 274072 C 2011-02-03 1994-12-10|2006-01-23 +S000001304 ORF Verified YIL042C PKP1 protein kinase PKP1 chromosome 9 9 276292 275108 C 2011-02-03 1994-12-10 Mitochondrial protein kinase; involved in negative regulation of pyruvate dehydrogenase complex activity by phosphorylating the ser-133 residue of the Pda1p subunit; acts in concert with kinase Pkp2p and phosphatases Ptc5p and Ptc6p +S000034870 CDS YIL042C 9 276292 275108 C 2011-02-03 1994-12-10 +S000001303 ORF Verified YIL041W GVP36 chromosome 9 9 276525 277505 W 2011-02-03 1994-12-10 BAR domain protein that localizes to early and late Golgi vesicles; required for adaptation to varying nutrient concentrations, fluid-phase endocytosis, polarization of the actin cytoskeleton, and vacuole biogenesis +S000034047 CDS YIL041W 9 276525 277505 W 2011-02-03 1994-12-10 +S000001302 ORF Verified YIL040W APQ12 chromosome 9 9 277723 278139 W 2011-02-03 1994-12-10 Nuclear envelope/ER integral membrane protein; interacts and functions with Brr6p and Brl1p in lipid homeostasis; mutants are defective in nuclear pore complex biogenesis, nuclear envelope morphology, mRNA export from the nucleus and are sensitive to sterol biosynthesis inhibitors and membrane fluidizing agents; exhibits synthetic lethal genetic interactions with genes involved in lipid metabolism +S000033887 CDS YIL040W 9 277723 278139 W 2011-02-03 1994-12-10 +S000001301 ORF Verified YIL039W TED1 chromosome 9 9 278426 279847 W 2011-02-03 1994-12-10 GPI-glycan remodelase; conserved phosphoesterase domain-containing protein; acts together with Emp24p/Erv25p in cargo exit from the ER; functional ortholog of mammalian GPI-glycan remodelase PGAP5; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO) +S000035327 CDS YIL039W 9 278426 279847 W 2011-02-03 1994-12-10 +S000001300 ORF Verified YIL038C NOT3 CCR4-NOT core subunit NOT3 chromosome 9 L000001265 9 282652 280142 C 2011-02-03 1994-12-10 Component of the CCR4-NOT core complex, involved in mRNA decapping; involved in transcription initiation and elongation and in mRNA degradation; conserved lysine in human homolog of Not3p and Not5p is mutated in cancers +S000034315 CDS YIL038C 9 282652 280142 C 2011-02-03 1994-12-10 +S000001299 ORF Verified YIL037C PRM2 pheromone-regulated protein PRM2 chromosome 9 9 284999 283029 C 2011-02-03 1994-12-10 Pheromone-regulated protein; predicted to have 4 transmembrane segments and a coiled coil domain; regulated by Ste12p; required for efficient nuclear fusion +S000034252 CDS YIL037C 9 284999 283029 C 2011-02-03 1994-12-10 +S000001298 ORF Verified YIL036W CST6 SHF1|ACA2 chromosome 9 L000002995 9 285666 287429 W 2011-02-03 1994-12-10 Basic leucine zipper (bZIP) transcription factor from ATF/CREB family involved in stress-responsive regulatory network; mediates transcriptional activation of NCE103 in response to low CO2 levels; proposed to be a regulator of oleate responsive genes; involved in utilization of non-optimal carbon sources and chromosome stability; relocalizes to the cytosol in response to hypoxia; CST6 has a paralog, ACA1, that arose from the whole genome duplication +S000034215 CDS YIL036W 9 285666 287429 W 2011-02-03 1994-12-10 +S000001297 ORF Verified YIL035C CKA1 casein kinase 2 catalytic subunit CKA1 chromosome 9 L000000343 9 288908 287790 C -29 2011-02-03 1994-12-10 Alpha catalytic subunit of casein kinase 2 (CK2); a Ser/Thr protein kinase with roles in cell growth and proliferation; CK2, comprised of CKA1, CKA2, CKB1 and CKB2, has many substrates including transcription factors and all RNA polymerases; regulates Fkh1p-mediated donor preference during mating-type switching +S000032136 CDS YIL035C 9 288908 287790 C 2011-02-03 1994-12-10 +S000001296 ORF Verified YIL034C CAP2 F-actin-capping protein subunit beta chromosome 9 L000000215 9 290089 289226 C -28 2011-02-03 1994-12-10 Beta subunit of the capping protein heterodimer (Cap1p and Cap2p); capping protein (CP) binds to the barbed ends of actin filaments preventing further polymerization; localized predominantly to cortical actin patches; protein increases in abundance and relocalizes from bud neck to plasma membrane upon DNA replication stress +S000032026 CDS YIL034C 9 290089 289226 C 2011-02-03 1994-12-10 +S000001295 ORF Verified YIL033C BCY1 cAMP-dependent protein kinase regulatory subunit BCY1|SRA1 chromosome 9 L000002044 9 291669 290419 C -28 2011-02-03 1994-12-10 Regulatory subunit of the cyclic AMP-dependent protein kinase (PKA); PKA is a component of a signaling pathway that controls a variety of cellular processes, including metabolism, cell cycle, stress response, stationary phase, and sporulation +S000031897 CDS YIL033C 9 291669 290419 C 2011-02-03 1994-12-10 +S000001294 ORF Dubious YIL032C chromosome 9 9 292317 291961 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030897 CDS YIL032C 9 292317 291961 C 2011-02-03 1994-12-10 +S000001293 ORF Verified YIL031W ULP2 SUMO protease ULP2|SMT4 chromosome 9 L000001939 9 292633 295737 W 2011-02-03 1994-12-10 Peptidase that deconjugates Smt3/SUMO-1 peptides from proteins; plays a role in chromosome cohesion at centromeric regions and recovery from checkpoint arrest induced by DNA damage or DNA replication defects; potential Cdc28p substrate; human homolog PML implicated in promyelocytic leukemia can partially complement yeast null mutant +S000030862 CDS YIL031W 9 292633 295737 W 2011-02-03 1994-12-10 +S000028789 ORF Dubious YIL030W-A chromosome 9 9 295565 295903 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps ORF ULP2/YIL031W +S000033536 CDS YIL030W-A 9 295565 295903 W 2011-02-03 2003-07-29 +S000028788 ORF Dubious YIL029W-A chromosome 9 9 299735 300106 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF SSM4/YIL030C +S000033533 CDS YIL029W-A 9 299735 300106 W 2011-02-03 2003-07-29 +S000001292 ORF Verified YIL030C SSM4 E3 ubiquitin-protein ligase SSM4|KIS3|DOA10 chromosome 9 L000002087 9 300009 296050 C 2011-02-03 1994-12-10 Membrane-embedded ubiquitin-protein ligase; ER and inner nuclear membrane localized RING-CH domain E3 ligase involved in ER-associated protein degradation (ERAD); targets misfolded cytosolic/nucleoplasmic domains of soluble and membrane embedded proteins (ERAD-C) and a transmembrane domain containing substrate (ERAD-M), Sbh2p; C-terminal element (CTE), conserved in human ortholog MARCH10/TEB4, determines substrate selectivity +S000030668 CDS YIL030C 9 300009 296050 C 2011-02-03 1994-12-10 +S000006624 tRNA_gene tK(CUU)I chromosome 9 L000003874 9 300300 300228 C 2011-02-03 1994-12-10|2011-02-03 Lysine tRNA (tRNA-Lys), predicted by tRNAscan-SE analysis; a small portion is imported into mitochondria via interaction with mt lysyl-tRNA synthetase Msk1p and is necessary to decode AAG codons at high temperature, when base modification of mt-encoded tRNA-Lys is reduced +S000036023 noncoding_exon tK(CUU)I 9 300300 300228 C 2011-02-03 1994-12-10|2011-02-03 +S000007013 long_terminal_repeat YILCdelta3 chromosome 9 9 300727 300409 C 2011-02-03 1994-12-10 Ty1 LTR +S000001291 ORF Uncharacterized YIL029C chromosome 9 9 301257 300829 C 2011-02-03 1994-12-10 Putative protein of unknown function; deletion confers sensitivity to 4-(N-(S-glutathionylacetyl)amino) phenylarsenoxide (GSAO); YIL029C has a paralog, YPR071W, that arose from a single-locus duplication +S000031121 CDS YIL029C 9 301257 300829 C 2011-02-03 1994-12-10 +S000001290 ORF Dubious YIL028W chromosome 9 9 302100 302498 W 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000031076 CDS YIL028W 9 302100 302498 W 2011-02-03 1994-12-10 +S000001289 ORF Verified YIL027C EMC5 KRE27 chromosome 9 9 304104 303679 C 2011-02-03 1994-12-10 Member of conserved ER transmembrane complex; required for efficient folding of proteins in the ER; null mutant displays induction of the unfolded protein response, and also shows K1 killer toxin resistance; homologous to worm B0334.15/EMC-5, fly CG15168, human MMGT +S000030935 CDS YIL027C 9 304104 303679 C 2011-02-03 1994-12-10 +S000001288 ORF Verified YIL026C IRR1 SCC3 chromosome 9 L000003590 9 307929 304477 C 2011-02-03 1994-12-10 Subunit of the cohesin complex; which is required for sister chromatid cohesion during mitosis and meiosis and interacts with centromeres and chromosome arms; relocalizes to the cytosol in response to hypoxia; essential for viability +S000029925 CDS YIL026C 9 307929 304477 C 2011-02-03 1994-12-10 +S000001287 ORF Dubious YIL025C chromosome 9 9 308575 308201 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000029834 CDS YIL025C 9 308575 308201 C 2011-02-03 1994-12-10 +S000001286 ORF Uncharacterized YIL024C chromosome 9 9 309171 308602 C 2011-02-03 1994-12-10 Putative protein of unknown function; non-essential gene; expression directly regulated by the metabolic and meiotic transcriptional regulator Ume6p +S000037819 CDS YIL024C 9 309171 308602 C 2011-02-03 1994-12-10 +S000001285 ORF Verified YIL023C YKE4 Zn(2+) transporter YKE4 chromosome 9 9 310426 309386 C 2011-02-03 1994-12-10 Zinc transporter; localizes to the ER; null mutant is sensitive to calcofluor white, leads to zinc accumulation in cytosol; ortholog of the mouse KE4 and member of the ZIP (ZRT, IRT-like Protein) family +S000035957 CDS YIL023C 9 310426 309386 C 2011-02-03 1994-12-10 +S000001284 ORF Verified YIL022W TIM44 protein translocase subunit TIM44|MPI1|MIM44|ISP45 chromosome 9 L000001138 9 311165 312460 W 2011-02-03 1994-12-10 Essential component of the TIM23 complex; tethers the import motor and regulatory factors (PAM complex) to the translocation channel (Tim23p-Tim17p core complex); TIM23 complex is short for the translocase of the inner mitochondrial membrane +S000035916 CDS YIL022W 9 311165 312460 W 2011-02-03 1994-12-10 +S000001283 ORF Verified YIL021W RPB3 DNA-directed RNA polymerase II core subunit RPB3|B44 chromosome 9 L000001677|L000001589 9 312905 313861 W -17 2011-02-03 1994-12-10 RNA polymerase II third largest subunit B44; part of central core; similar to prokaryotic alpha subunit +S000035800 CDS YIL021W 9 312905 313861 W 2011-02-03 1994-12-10 +S000028656 ORF Dubious YIL021C-A chromosome 9 9 313468 313199 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps verified gene RPB3/YIL021W; identified by gene-trapping, expression analysis, and genome-wide homology searching +S000032459 CDS YIL021C-A 9 313468 313199 C 2011-02-03 2003-07-29 +S000130160 ARS ARS918 chromosome 9 9 313861 314035 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000028787 ORF Dubious YIL020C-A chromosome 9 9 314051 313713 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; completely overlaps origin of replication ARS918, partially overlaps ORF RPB3/YIL021W +S000033532 CDS YIL020C-A 9 314051 313713 C 2011-02-03 2003-07-29 +S000001282 ORF Verified YIL020C HIS6 1-(5-phosphoribosyl)-5- ((5-phosphoribosylamino)methylideneamino)imidazole-4-carboxamide isomerase HIS6 chromosome 9 L000000783 9 314820 314035 C -17 2011-02-03 1994-12-10 Enzyme that catalyzes the fourth step in the histidine pathway; Phosphoribosylformimino-5-aminoimidazole carboxamide ribotide isomerase; mutations cause histidine auxotrophy and sensitivity to Cu, Co, and Ni salts +S000034720 CDS YIL020C 9 314820 314035 C 2011-02-03 1994-12-10 +S000001281 ORF Verified YIL019W FAF1 chromosome 9 9 315093 316133 W 2011-02-03 1994-12-10 Protein required for pre-rRNA processing; also required for 40S ribosomal subunit assembly +S000036117 CDS YIL019W 9 315093 316133 W 2011-02-03 1994-12-10 +S000001280 ORF Verified YIL018W RPL2B uL2|ribosomal 60S subunit protein L2B|L2|rp8|YL6|L5B|L2B|LOT2|RPL5A chromosome 9 L000001707 9 316768 317932 W 2011-02-03 1994-12-10 Ribosomal 60S subunit protein L2B; homologous to mammalian ribosomal protein L2 and bacterial L2; RPL2B has a paralog, RPL2A, that arose from the whole genome duplication; expression is upregulated at low temperatures +S000036024 CDS YIL018W 9 316768 316771 W 2011-02-03 1994-12-10 +S000036025 CDS YIL018W 9 317172 317932 W 2011-02-03 1994-12-10 +S000036026 intron YIL018W 9 316772 317171 W 2011-02-03 1994-12-10 +S000001279 ORF Verified YIL017C VID28 glucose-induced degradation complex subunit VID28|YIL017W|GID5 chromosome 9 9 320965 318200 C 2011-02-03 1994-12-10 GID Complex subunit, serves as adaptor for regulatory subunit Vid24p; protein involved in proteasome-dependent catabolite degradation of fructose-1,6-bisphosphatase (FBPase); localized to the nucleus and the cytoplasm +S000035053 CDS YIL017C 9 320965 318200 C 2011-02-03 1994-12-10 +S000001278 ORF Verified YIL016W SNL1 chromosome 9 L000004403 9 321454 321933 W 2011-02-03 1994-12-10 Ribosome-associated protein; proposed to act in protein synthesis and nuclear pore complex biogenesis and maintenance as well as protein folding; has similarity to the mammalian BAG-1 protein +S000035003 CDS YIL016W 9 321454 321933 W 2011-02-03 1994-12-10 +S000001277 ORF Verified YIL015W BAR1 aspartyl protease BAR1|SST1 chromosome 9 L000000160 9 322342 324105 W -12 2011-02-03 1994-12-10 Aspartyl protease; secreted into the periplasmic space of mating type a cell; helps cells find mating partners; cleaves and inactivates alpha factor allowing cells to recover from alpha-factor-induced cell cycle arrest +S000034859 CDS YIL015W 9 322342 324105 W 2011-02-03 1994-12-10 +S000006534 tRNA_gene tD(GUC)I1 chromosome 9 L000003873 9 324374 324303 C 2011-02-03 1994-12-10 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030656 noncoding_exon tD(GUC)I1 9 324374 324303 C 2011-02-03 1994-12-10 +S000007019 long_terminal_repeat YILWsigma3 chromosome 9 9 324391 324734 W 2011-02-03 1994-12-10 Ty3 LTR +S000007016 long_terminal_repeat YILWdelta4 chromosome 9 9 324831 325164 W 2011-02-03 1994-12-10 Ty1 LTR +S000003536 ORF Uncharacterized YIL014C-A YIL015C-A chromosome 9 9 325526 325212 C 2011-02-03 1994-12-10 Putative protein of unknown function +S000035773 CDS YIL014C-A 9 325526 325212 C 2011-02-03 1994-12-10 +S000006742 tRNA_gene tT(AGU)I2 chromosome 9 L000003870 9 325748 325820 W 2011-02-03 1994-12-10 Threonine tRNA (tRNA-Thr), predicted by tRNAscan-SE analysis +S000036347 noncoding_exon tT(AGU)I2 9 325748 325820 W 2011-02-03 1994-12-10 +S000001276 ORF Verified YIL014W MNT3 alpha-1,3-mannosyltransferase MNT3 chromosome 9 9 326103 327995 W 2011-02-03 1994-12-10 Alpha-1,3-mannosyltransferase; adds the fourth and fifth alpha-1,3-linked mannose residues to O-linked glycans during protein O-glycosylation +S000033990 CDS YIL014W 9 326103 327995 W 2011-02-03 1994-12-10 +S000001275 ORF Verified YIL013C PDR11 ATP-binding cassette multidrug transporter PDR11 chromosome 9 L000003163 9 332442 328207 C 2011-02-03 1994-12-10 ATP-binding cassette (ABC) transporter; multidrug transporter involved in multiple drug resistance; mediates sterol uptake when sterol biosynthesis is compromised; regulated by Pdr1p; required for anaerobic growth; PDR11 has a paralog, AUS1, that arose from the whole genome duplication +S000033824 CDS YIL013C 9 332442 328207 C 2011-02-03 1994-12-10 +S000001274 ORF Dubious YIL012W chromosome 9 9 333011 333352 W 2011-02-03 1994-12-10|2011-02-03 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033748 CDS YIL012W 9 333011 333352 W 2011-02-03 1994-12-10|2011-02-03 +S000001273 ORF Verified YIL011W TIR3 YIB1 chromosome 9 9 333727 334536 W 2011-02-03 1994-12-10 Cell wall mannoprotein; member of Srp1p/Tip1p family of serine-alanine-rich proteins; expressed under anaerobic conditions and required for anaerobic growth; TIR3 has a paralog, TIR2, that arose from the whole genome duplication +S000033633 CDS YIL011W 9 333727 334536 W 2011-02-03 1994-12-10 +S000001272 ORF Verified YIL010W DOT5 thioredoxin peroxidase DOT5 chromosome 9 L000004392 9 334882 335529 W 2011-02-03 1994-12-10 Nuclear thiol peroxidase; functions as an alkyl-hydroperoxide reductase during post-diauxic growth +S000030341 CDS YIL010W 9 334882 335529 W 2011-02-03 1994-12-10 +S000006432 ORF Verified YIL009C-A EST3 telomerase subunit EST3 chromosome 9 L000004271 9 336212 335666 C 2011-02-03 1997-10-20 Component of the telomerase holoenzyme; involved in telomere replication; synthesis of the full-length protein results from a programmed +1 ribosomal frameshift +S000031928 CDS YIL009C-A 9 335935 335666 C 2011-02-03 1997-10-20 +S000031927 CDS YIL009C-A 9 336212 335937 C 2011-02-03 1997-10-20 +S000031929 plus_1_translational_frameshift YIL009C-A 9 335936 335936 C 2011-02-03 1997-10-20 +S000006535 tRNA_gene tD(GUC)I2 chromosome 9 L000003872 9 336420 336349 C 2011-02-03 1994-12-10 Aspartate tRNA (tRNA-Asp), predicted by tRNAscan-SE analysis +S000030659 noncoding_exon tD(GUC)I2 9 336420 336349 C 2011-02-03 1994-12-10 +S000007014 long_terminal_repeat YILCdelta5 chromosome 9 9 336897 336708 C 2011-02-03 1994-12-10 Ty1 LTR +S000001271 ORF Verified YIL009W FAA3 long-chain fatty acid-CoA ligase FAA3 chromosome 9 L000000596 9 339344 341428 W 2011-02-03 1994-12-10 Long chain fatty acyl-CoA synthetase; activates imported fatty acids with a preference for C16:0-C18:0 chain lengths; green fluorescent protein (GFP)-fusion protein localizes to the cell periphery +S000030759 CDS YIL009W 9 339344 341428 W 2011-02-03 1994-12-10 +S000118398 ARS ARS919 ARSIX-342 chromosome 9 9 341976 342045 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000001270 ORF Verified YIL008W URM1 ubiquitin-related modifier URM1 chromosome 9 S000007535 9 342536 342835 W 2011-02-03 1994-12-10 Ubiquitin-like protein involved in thiolation of cytoplasmic tRNAs; receives sulfur from the E1-like enzyme Uba4p and transfers it to tRNA; also functions as a protein tag with roles in nutrient sensing and oxidative stress response +S000030686 CDS YIL008W 9 342536 342835 W 2011-02-03 1994-12-10 +S000001269 ORF Verified YIL007C NAS2 chromosome 9 9 343656 342994 C 2011-02-03 1994-12-10 Evolutionarily conserved 19S regulatory particle assembly-chaperone; involved in assembly of the base subcomplex of the 19S proteasomal regulatory particle (RP); non-essential gene; interacts with Rpn4p; protein abundance increases in response to DNA replication stress; ortholog of human p27 +S000030556 CDS YIL007C 9 343656 342994 C 2011-02-03 1994-12-10 +S000001268 ORF Verified YIL006W YIA6 NAD+ transporter|NDT1 chromosome 9 9 344062 345183 W 2011-02-03 1994-12-10 Mitochondrial NAD+ transporter; involved in the transport of NAD+ into the mitochondria (see also YEA6); member of the mitochondrial carrier subfamily; disputed role as a pyruvate transporter; has putative mouse and human orthologs; YIA6 has a paralog, YEA6, that arose from the whole genome duplication +S000030529 CDS YIL006W 9 344062 345183 W 2011-02-03 1994-12-10 +S000001267 ORF Verified YIL005W EPS1 protein disulfide isomerase EPS1 chromosome 9 9 345692 347797 W 2011-02-03 1994-12-10 ER protein with chaperone and co-chaperone activity; involved in retention of resident ER proteins; has a role in recognizing proteins targeted for ER-associated degradation (ERAD), member of the protein disulfide isomerase family +S000030455 CDS YIL005W 9 345692 347797 W 2011-02-03 1994-12-10 +S000001266 ORF Verified YIL004C BET1 SLY12 chromosome 9 L000000171 9 348505 347946 C 2011-02-03 1994-12-10 Type II membrane protein required for vesicular transport; required for vesicular transport between the endoplasmic reticulum and Golgi complex; v-SNARE with similarity to synaptobrevins +S000037580 CDS YIL004C 9 348363 347946 C 2011-02-03 1994-12-10 +S000037579 CDS YIL004C 9 348505 348495 C 2011-02-03 1994-12-10 +S000037581 intron YIL004C 9 348494 348364 C 2011-02-03 1994-12-10 +S000001265 ORF Verified YIL003W CFD1 iron-sulfur cluster assembly protein CFD1|DRE3 chromosome 9 9 349122 350003 W 2011-02-03 1994-12-10 Highly conserved iron-sulfur cluster binding protein; localized in the cytoplasm; forms a complex with Nbp35p that is involved in iron-sulfur protein assembly in the cytosol +S000037556 CDS YIL003W 9 349122 350003 W 2011-02-03 1994-12-10 +S000028835 ORF Uncharacterized YIL002W-A chromosome 9 9 350301 350510 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034485 CDS YIL002W-A 9 350301 350510 W 2011-02-03 2003-07-29 +S000001264 ORF Verified YIL002C INP51 phosphoinositide 5-phosphatase INP51|SJL1 chromosome 9 L000003319 9 353431 350591 C 2011-02-03 1994-12-10 Phosphatidylinositol 4,5-bisphosphate 5-phosphatase; synaptojanin-like protein with an N-terminal Sac1 domain, plays a role in phosphatidylinositol 4,5-bisphosphate homeostasis and in endocytosis; null mutation confers cold-tolerant growth +S000032035 CDS YIL002C 9 353431 350591 C 2011-02-03 1994-12-10 +S000001263 ORF Uncharacterized YIL001W chromosome 9 9 353940 355481 W 2011-02-03 1994-12-10 Putative protein of unknown function; contains a BTB/POZ domain which generally function in protein interactions; deletion slightly improved competitive fitness in rich media; GFP-tagged protein is localized to the cytoplasm +S000031993 CDS YIL001W 9 353940 355481 W 2011-02-03 1994-12-10 +S000006470 centromere CEN9 CEN9 chromosome 9 L000000302 9 355629 355745 W 0 2011-02-03 1994-12-10|2006-05-09 Chromosome IX centromere +S000077275 centromere_DNA_Element_I CEN9 9 355629 355638 W 2011-02-03 2004-10-05 +S000077276 centromere_DNA_Element_II CEN9 9 355639 355720 W 2011-02-03 2004-10-05 +S000077277 centromere_DNA_Element_III CEN9 9 355721 355745 W 2011-02-03 2004-10-05 +S000001440 ORF Verified YIR001C SGN1 RBP29|RBP1 chromosome 9 9 356895 356143 C 2011-02-03 1994-12-10 Cytoplasmic RNA-binding protein; contains an RNA recognition motif (RRM); may have a role in mRNA translation, as suggested by genetic interactions with genes encoding proteins involved in translational initiation +S000032594 CDS YIR001C 9 356895 356143 C 2011-02-03 1994-12-10 +S000118399 ARS ARS920 ARSIX-357 chromosome 9 9 357160 357396 2011-02-03 2006-08-30 Autonomously Replicating Sequence +S000178117 ARS_consensus_sequence ARS920 9 357222 357238 W 2014-11-18 2014-11-18 +S000001441 ORF Verified YIR002C MPH1 3'-5' DNA helicase chromosome 9 9 360396 357415 C 2011-02-03 1994-12-10 3'-5' DNA helicase involved in error-free bypass of DNA lesions; binds flap DNA, stimulates activity of Rad27p and Dna2p; prevents crossovers between ectopic sequences by removing substrates for Mus81-Mms4 or Rad1-Rad10 cleavage; homolog of human FANCM Fanconi anemia protein that is involved in stabilizing and remodeling blocked replication forks; member of SF2 DExD/H superfamily of helicases; nonsense or missense mutations in FANCM can make people more likely to get cancer +S000032716 CDS YIR002C 9 360396 357415 C 2011-02-03 1994-12-10 +S000001442 ORF Verified YIR003W AIM21 chromosome 9 9 360885 362924 W 2011-02-03 1994-12-10 Protein of unknown function; involved in mitochondrial migration along actin filament; may interact with ribosomes; GFP-fusion protein colocalizes with Sac1p to the actin cytoskeleton +S000032876 CDS YIR003W 9 360885 362924 W 2011-02-03 1994-12-10 +S000130161 ARS ARS921 chromosome 9 9 362924 363221 2011-02-03 2009-05-07 Putative replication origin; identified in multiple array studies, not yet confirmed by plasmid-based assay +S000001443 ORF Verified YIR004W DJP1 PAS22|ICS1 chromosome 9 L000003966 9 363221 364519 W 2011-02-03 1994-12-10 Cytosolic J-domain-containing protein; required for peroxisomal protein import and involved in peroxisome assembly; facilitates import of Mim1p and Mim2p into the mitochondrial outer membrane; homologous to E. coli DnaJ +S000033586 CDS YIR004W 9 363221 364519 W 2011-02-03 1994-12-10 +S000001444 ORF Verified YIR005W IST3 U2 snRNP complex subunit IST3|SNU17 chromosome 9 9 364889 365335 W 2011-02-03 1994-12-10 Component of the U2 snRNP; required for the first catalytic step of splicing and for spliceosomal assembly; interacts with Rds3p and is required for Mer1p-activated splicing; diploid mutants have a specific defect in MATa1 pre-mRNA splicing which leads to haploid gene expression in diploids +S000033658 CDS YIR005W 9 364889 365335 W 2011-02-03 1994-12-10 +S000001445 ORF Verified YIR006C PAN1 DIM2|MIP3|MDP3 chromosome 9 L000001335 9 369908 365466 C 2011-02-03 1994-12-10 Part of actin cytoskeleton-regulatory complex Pan1p-Sla1p-End3p; associates with actin patches on cell cortex; promotes protein-protein interactions essential for endocytosis; binds to and activates Arp2/3 complex in vitro; phosphorylation of Thr-1225 is regulated by MAPK Hog1p in response to osmotic stress; previously thought to be a subunit of poly(A) ribonuclease +S000033724 CDS YIR006C 9 369908 365466 C 2011-02-03 1994-12-10 +S000006556 tRNA_gene tE(UUC)I chromosome 9 L000003871 9 370417 370488 W 2011-02-03 1994-12-10 Glutamate tRNA (tRNA-Glu), predicted by tRNAscan-SE analysis; thiolation of uridine at wobble position (34) requires Ncs6p +S000035987 noncoding_exon tE(UUC)I 9 370417 370488 W 2011-02-03 1994-12-10 +S000001446 ORF Verified YIR007W EGH1 hydrolase chromosome 9 9 370704 372998 W 2011-02-03 1994-12-10 Steryl-beta-glucosidase with broad specificity for aglycones; has a role in ergosteryl-beta-glucoside catabolism; required for normal vacuolar morphology; has similarity to the C. neoformans ergosteryl-beta-glucosidase EGCrP2; localizes to the cytosol +S000034669 CDS YIR007W 9 370704 372998 W 2011-02-03 1994-12-10 +S000001447 ORF Verified YIR008C PRI1 DNA primase subunit PRI1 chromosome 9 L000001489 9 374306 373077 C 2011-02-03 1994-12-10 Subunit of DNA primase; DNA primase is required for DNA synthesis and double-strand break repair +S000034753 CDS YIR008C 9 374306 373077 C 2011-02-03 1994-12-10 +S000001448 ORF Verified YIR009W MSL1 U2 snRNP complex subunit MSL1|YIB9|YIB9w chromosome 9 L000004502 9 374525 374860 W 2011-02-03 1994-12-10 U2B component of U2 snRNP; involved in splicing, binds the U2 snRNA stem-loop IV in vitro but requires association of Lea1p for in vivo binding; does not contain the conserved C-terminal RNA binding domain found in other family members +S000034977 CDS YIR009W 9 374525 374860 W 2011-02-03 1994-12-10 +S000001449 ORF Verified YIR010W DSN1 MIND complex subunit DSN1 chromosome 9 L000004645 9 375431 377161 W 2011-02-03 1994-12-10 Essential component of the MIND kinetochore complex; joins kinetochore subunits contacting DNA to those contacting microtubules; Dsn1p phosphorylation promotes interaction between outer and inner kinetochore proteins; kinetochore receptor for monopolin, via interaction with subunit Csm1p; essential for meiotic but not mitotic chromosome segregation; MIND complex consists of Mtw1p, Nnf1p, Nsl1p and Dsn1p; modified by sumoylation; phosphorylated by monopolin subunit Hrr25p +S000035994 CDS YIR010W 9 375431 377161 W 2011-02-03 1994-12-10 +S000001450 ORF Verified YIR011C STS1 SSM5|DBF8 chromosome 9 L000000489 9 378246 377287 C 2011-02-03 1994-12-10 Protein required for localizing proteasomes to the nucleus; involved in cotranslational protein degradation; mediates interaction between nuclear import factor Srp1p and the proteasome; Sts1p and Srp1p couple proteasomes to nascent polypeptides emerging from the ribosome for cotranslational degradation; involved in ubiquitin-mediated protein degradation +S000036807 CDS YIR011C 9 378246 377287 C 2011-02-03 1994-12-10 +S000001451 ORF Verified YIR012W SQT1 chromosome 9 L000003431 9 378486 379781 W 2011-02-03 1994-12-10 Specific chaperone for ribosomal protein Rpl10p; binds nascent Rpl10p during translation; contains multiple WD repeats; interacts with Qsr1p in a two-hybrid assay; protein abundance increases in response to DNA replication stress +S000036906 CDS YIR012W 9 378486 379781 W 2011-02-03 1994-12-10 +S000001452 ORF Verified YIR013C GAT4 chromosome 9 S000007452 9 380384 380019 C 2011-02-03 1994-12-10 Protein containing GATA family zinc finger motifs; involved in spore wall assembly; sequence similarity to GAT3, and the double mutant gat3 gat4 exhibits reduced dityrosine fluorescence relative to the single mutants +S000036935 CDS YIR013C 9 380384 380019 C 2011-02-03 1994-12-10 +S000001453 ORF Uncharacterized YIR014W chromosome 9 9 381086 381814 W 2011-02-03 2003-09-22|1994-12-10 Putative protein of unknown function; green fluorescent protein (GFP)-fusion protein localizes to the vacuole; expression directly regulated by the metabolic and meiotic transcriptional regulator Ume6p; YIR014W is a non-essential gene +S000037725 CDS YIR014W 9 381086 381814 W 2011-02-03 2003-09-22|1994-12-10 +S000001454 ORF Verified YIR015W RPR2 ribonuclease P protein subunit RPR2 chromosome 9 L000004310 9 381948 382382 W 2011-02-03 1994-12-10 Subunit of nuclear RNase P; nuclear RNase P cleaves tRNA precursors to generate mature 5' ends and facilitates turnover of nuclear RNAs; not shared between RNase MRP and RNase P, in contrast to all other RNase P protein subunits; protein abundance increases in response to DNA replication stress +S000037806 CDS YIR015W 9 381948 382382 W 2011-02-03 1994-12-10 +S000001455 ORF Uncharacterized YIR016W chromosome 9 9 382628 383425 W 2011-02-03 1994-12-10 Putative protein of unknown function; expression directly regulated by the metabolic and meiotic transcriptional regulator Ume6p; overexpression causes a cell cycle delay or arrest; non-essential gene; YIR016W has a paralog, YOL036W, that arose from the whole genome duplication +S000037904 CDS YIR016W 9 382628 383425 W 2011-02-03 1994-12-10 +S000028799 ORF Dubious YIR017W-A chromosome 9 9 383566 384165 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000033566 CDS YIR017W-A 9 383566 384165 W 2011-02-03 2003-07-29 +S000001456 ORF Verified YIR017C MET28 chromosome 9 L000001092 9 384119 383556 C 2011-02-03 1994-12-10 bZIP transcriptional activator in the Cbf1p-Met4p-Met28p complex; participates in the regulation of sulfur metabolism +S000030791 CDS YIR017C 9 384119 383556 C 2011-02-03 1994-12-10 +S000001457 ORF Verified YIR018W YAP5 chromosome 9 L000004343 9 384609 385346 W 2011-02-03 1994-12-10 Basic leucine zipper (bZIP) iron-sensing transcription factor; involved in diauxic shift; YAP5 has a paralog, YAP7, that arose from the whole genome duplication +S000030914 CDS YIR018W 9 384609 385346 W 2011-02-03 1994-12-10 +S000028837 ORF Uncharacterized YIR018C-A chromosome 9 9 385701 385564 C 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034488 CDS YIR018C-A 9 385701 385564 C 2011-02-03 2003-07-29 +S000001458 ORF Verified YIR019C FLO11 MUC1|STA4 chromosome 9 L000002104 9 393675 389572 C 2011-02-03 1994-12-10 GPI-anchored cell surface glycoprotein (flocculin); required for pseudohyphal and invasive growth, flocculation, and biofilm formation; major determinant of colony morphology; transcription regulated by the MAPK pathway (Ste12p and Tec1p) and the cAMP pathway (Flo8p); required for formation of fibrous interconnections between cells of a wild strain; role in co-flocculation with other yeast species; cleaved and shed from cells, contributing to their surface properties +S000030936 CDS YIR019C 9 393675 389572 C 2011-02-03 1994-12-10 +S000001459 ORF Uncharacterized YIR020C chromosome 9 9 394557 394255 C 2011-02-03 1994-12-10 Protein of unknown function; mRNA identified as translated by ribosome profiling data; SWAT-GFP fusion protein localizes to the endoplasmic reticulum +S000032045 CDS YIR020C 9 394557 394255 C 2011-02-03 1994-12-10 +S000007241 ORF Dubious YIR020W-A YIR020W-B chromosome 9 9 394917 395159 W 2011-02-03 1999-07-17 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000034820 CDS YIR020W-A 9 394917 395159 W 2011-02-03 1999-07-17 +S000132614 ncRNA_gene PWR1 PWR1 chromosome 9 9 395999 396939 W 2011-02-03 2010-01-05 Intergenic regulatory ncRNA; one of two long ncRNAs that play key roles in regulating transcription of the nearby protein-coding ORF FLO11; PWR1 promotes FLO11 transcription by interfering with ncRNA ICR1, which is transcribed across the FLO11 promoter +S000132615 noncoding_exon PWR1 9 395999 396939 W 2011-02-03 2010-01-05 +S000132612 ncRNA_gene ICR1 ICR1 chromosome 9 9 397082 393884 C 2011-02-03 2010-01-05 Long intergenic regulatory ncRNA; has a key role in regulating transcription of the nearby protein-coding ORF FLO11; initiated far upstream from FLO11 and transcribed across much of the large promoter of FLO11, repressing FLO11 transcription in cis +S000132613 noncoding_exon ICR1 9 397082 393884 C 2011-02-03 2010-01-05 +S000001460 ORF Verified YIR021W MRS1 PET157 chromosome 9 9 397294 398385 W 2011-02-03 1994-12-10 Splicing protein; required for splicing of two mitochondrial group I introns (BI3 in COB and AI5beta in COX1); forms a splicing complex, containing four subunits of Mrs1p and two subunits of the BI3-encoded maturase, that binds to the BI3 RNA; MRS1 has a paralog, CCE1, that arose from the whole genome duplication +S000032999 CDS YIR021W 9 397294 398385 W 2011-02-03 1994-12-10 +S000028800 ORF Dubious YIR020C-B chromosome 9 9 397949 397215 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; partially overlaps verified ORF MRS1 +S000033580 CDS YIR020C-B 9 397949 397215 C 2011-02-03 2003-07-29 +S000028838 ORF Uncharacterized YIR021W-A chromosome 9 9 398514 398726 W 2011-02-03 2003-07-29 Putative protein of unknown function; identified by expression profiling and mass spectrometry +S000034490 CDS YIR021W-A 9 398514 398726 W 2011-02-03 2003-07-29 +S000001461 ORF Verified YIR022W SEC11 signal peptidase complex catalytic subunit SEC11 chromosome 9 L000001836 9 398733 399236 W 22 2011-02-03 1994-12-10 18kDa catalytic subunit of the Signal Peptidase Complex (SPC); the Signal Peptidase Complex cleaves the signal sequence of proteins targeted to the endoplasmic reticulum; other members are Spc1p, Spc2p, Spc3p, and Sec11p +S000033111 CDS YIR022W 9 398733 399236 W 2011-02-03 1994-12-10 +S000001462 ORF Verified YIR023W DAL81 DURL|UGA35 chromosome 9 L000000481 9 399777 402689 W 22 2011-02-03 1994-12-10 Positive regulator of genes in multiple nitrogen degradation pathways; contains DNA binding domain but does not appear to bind the dodecanucleotide sequence present in the promoter region of many genes involved in allantoin catabolism +S000033187 CDS YIR023W 9 399777 402689 W 2011-02-03 1994-12-10 +S000028801 ORF Dubious YIR023C-A chromosome 9 9 402706 402383 C 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; almost completely overlaps ORF DAL81/YIR023W +S000033581 CDS YIR023C-A 9 402706 402383 C 2011-02-03 2003-07-29 +S000001463 ORF Verified YIR024C INA22 GIF1 chromosome 9 L000004438 9 403491 402841 C 2011-02-03 1994-12-10 F1F0 ATP synthase peripheral stalk assembly factor; subunit of the matrix-exposed inner mitochondrial membrane localized INA complex (Ina22p-Ina17p) involved in assembly of the F1F0 peripheral stalk; co-purifies with Aim43p, ATP synthase subunits, and cytochrome bc1 complex assembly factors; interacts with Arh1p, a mitochondrial oxidoreductase; deletion mutant has a respiratory growth defect +S000033910 CDS YIR024C 9 403491 402841 C 2011-02-03 1994-12-10 +S000001464 ORF Verified YIR025W MND2 chromosome 9 9 403659 404765 W 2011-02-03 1994-12-10 Subunit of the Anaphase-Promoting Complex/Cyclosome (APC/C); necessary for maintaining sister chromatid cohesion in prophase I of meiosis by inhibiting premature ubiquitination and subsequent degradation of substrates by the APC(Ama1) ubiquitin ligase +S000034094 CDS YIR025W 9 403659 404765 W 2011-02-03 1994-12-10 +S000001465 ORF Verified YIR026C YVH1 tyrosine protein phosphatase YVH1 chromosome 9 L000002567 9 405967 404873 C 31 2011-02-03 1994-12-10 Dual specificity protein phosphatase; regulates growth, sporulation, and glycogen accumulation in a cAMP-dependent protein kinase cascade dependent manner; mutants are defective in 60S ribosome assembly; positively regulates pre-autophagosomal structure (PAS) formation upon nitrogen starvation or rapamycin treatment +S000034138 CDS YIR026C 9 405967 404873 C 2011-02-03 1994-12-10 +S000001466 ORF Verified YIR027C DAL1 allantoinase chromosome 9 L000000474 9 407642 406260 C 32.1 2011-02-03 1994-12-10 Allantoinase; converts allantoin to allantoate in the first step of allantoin degradation; expression sensitive to nitrogen catabolite repression +S000034253 CDS YIR027C 9 407642 406260 C 2011-02-03 1994-12-10 +S000001467 ORF Verified YIR028W DAL4 allantoin permease chromosome 9 L000000477 9 408468 410375 W 34 2011-02-03 1994-12-10 Allantoin permease; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation +S000035258 CDS YIR028W 9 408468 410375 W 2011-02-03 1994-12-10 +S000001468 ORF Verified YIR029W DAL2 allantoicase|ALC1 chromosome 9 L000000475 9 410807 411838 W 36.1 2011-02-03 1994-12-10 Allantoicase; converts allantoate to urea and ureidoglycolate in the second step of allantoin degradation; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation +S000035347 CDS YIR029W 9 410807 411838 W 2011-02-03 1994-12-10 +S000118400 ARS ARS922 ARSIX-412 chromosome 9 9 411935 412011 2014-11-18 2014-11-18|2006-08-30 Autonomously Replicating Sequence +S000178118 ARS_consensus_sequence ARS922 9 412001 411985 C 2014-11-18 2014-11-18 +S000001469 ORF Verified YIR030C DCG1 chromosome 9 L000000497 9 412770 412036 C 36.4 2011-02-03 1994-12-10 Protein of unknown function; expression is sensitive to nitrogen catabolite repression and regulated by Dal80p; contains transmembrane domain +S000036237 CDS YIR030C 9 412770 412036 C 2011-02-03 1994-12-10 +S000028802 ORF Dubious YIR030W-A chromosome 9 9 412899 413282 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF DAL7/YIR031C +S000033582 CDS YIR030W-A 9 412899 413282 W 2011-02-03 2003-07-29 +S000001470 ORF Verified YIR031C DAL7 malate synthase DAL7|MSL2|MLS2 chromosome 9 L000000479 9 414679 413015 C 36.9 2011-02-03 1994-12-10 Malate synthase; can accept butyryl-CoA as acyl-CoA donor in addition to traditional substrate acetyl-CoA; recycles glyoxylate generated during allantoin degradation; SWAT-GFP and mCherry fusion proteins localize to the cytosol; expression sensitive to nitrogen catabolite repression and induced by allophanate, an intermediate in allantoin degradation +S000031686 CDS YIR031C 9 414679 413015 C 2011-02-03 1994-12-10 +S000001471 ORF Verified YIR032C DAL3 ureidoglycolate hydrolase chromosome 9 L000000476 9 415617 415030 C 37 2011-02-03 1994-12-10 Ureidoglycolate lyase; converts ureidoglycolate to glyoxylate and urea in the third step of allantoin degradation; expression is sensitive to nitrogen catabolite repression; this enzyme is sometimes referred to "ureidoglycolate hydrolase" but should not be confused with the Arabidopsis thaliana ureidoglycolate hydrolase enzyme which converts ureidoglycolate to glyoxylate, ammonia and carbon dioxide +S000031829 CDS YIR032C 9 415617 415030 C 2011-02-03 1994-12-10 +S000001472 ORF Verified YIR033W MGA2 chromosome 9 L000004181 9 416124 419465 W 2011-02-03 1994-12-10 ER membrane protein involved in regulation of OLE1 transcription; inactive ER form dimerizes and one subunit is then activated by ubiquitin/proteasome-dependent processing followed by nuclear targeting; MGA2 has a paralog, SPT23, that arose from the whole genome duplication +S000032031 CDS YIR033W 9 416124 419465 W 2011-02-03 1994-12-10 +S000001473 ORF Verified YIR034C LYS1 saccharopine dehydrogenase (NAD+, L-lysine-forming) chromosome 9 L000000964 9 420736 419615 C 40 2011-02-03 1994-12-10 Saccharopine dehydrogenase (NAD+, L-lysine-forming); catalyzes the conversion of saccharopine to L-lysine, which is the final step in the lysine biosynthesis pathway; also has mRNA binding activity +S000037430 CDS YIR034C 9 420736 419615 C 2011-02-03 1994-12-10 +S000001474 ORF Uncharacterized YIR035C sepiapterin reductase family protein chromosome 9 9 421790 421026 C 2011-02-03 1994-12-10 Putative cytoplasmic short-chain dehydrogenase/reductase +S000037528 CDS YIR035C 9 421790 421026 C 2011-02-03 1994-12-10 +S000028803 ORF Dubious YIR036W-A chromosome 9 9 422635 423036 W 2011-02-03 2003-07-29 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data; overlaps ORF IRC24/YIR036C +S000033584 CDS YIR036W-A 9 422635 423036 W 2011-02-03 2003-07-29 +S000001475 ORF Verified YIR036C IRC24 sepiapterin reductase family protein IRC24 chromosome 9 9 422865 422074 C 2011-02-03 1994-12-10 Putative benzil reductase;(GFP)-fusion protein localizes to the cytoplasm and is induced by the DNA-damaging agent MMS; sequence similarity with short-chain dehydrogenase/reductases; null mutant has increased spontaneous Rad52p foci +S000037606 CDS YIR036C 9 422865 422074 C 2011-02-03 1994-12-10 +S000001476 ORF Verified YIR037W HYR1 peroxiredoxin HYR1|ORP1|GPX3 chromosome 9 L000002612 9 423128 423619 W 2011-02-03 1994-12-10 Thiol peroxidase; functions as a hydroperoxide receptor to sense intracellular hydroperoxide levels and transduce a redox signal to the Yap1p transcription factor; HYR1 has a paralog, GPX1, that arose from the whole genome duplication +S000030468 CDS YIR037W 9 423128 423619 W 2011-02-03 1994-12-10 +S000001477 ORF Verified YIR038C GTT1 bifunctional glutathione transferase/peroxidase chromosome 9 L000004612 9 424513 423809 C 2011-02-03 1994-12-10 ER associated glutathione S-transferase capable of homodimerization; expression induced during the diauxic shift and throughout stationary phase; functional overlap with Gtt2p, Grx1p, and Grx2p +S000030525 CDS YIR038C 9 424513 423809 C 2011-02-03 1994-12-10 +S000007021 long_terminal_repeat YIRCdelta6 chromosome 9 9 426425 426201 C 2011-02-03 1994-12-10 Ty1 LTR +S000001478 ORF Verified YIR039C YPS6 aspartyl protease chromosome 9 L000004386 9 432111 430498 C 2011-02-03 1994-12-10 Putative GPI-anchored aspartic protease; member of the yapsin family of proteases involved in cell wall growth and maintenance +S000030600 CDS YIR039C 9 432111 430498 C 2011-02-03 1994-12-10 +S000001479 ORF Dubious YIR040C chromosome 9 9 433721 433389 C 2011-02-03 1994-12-10 Dubious open reading frame; unlikely to encode a functional protein, based on available experimental and comparative sequence data +S000030026 CDS YIR040C 9 433721 433389 C 2011-02-03 1994-12-10 +S000001480 ORF Verified YIR041W PAU15 seripauperin PAU15 chromosome 9 9 433929 434303 W 2011-02-03 1994-12-10 Protein of unknown function; member of the seripauperin multigene family encoded mainly in subtelomeric regions; SWAT-GFP and mCherry fusion proteins localize to the vacuole +S000030194 CDS YIR041W 9 433929 434303 W 2011-02-03 1994-12-10 +S000001481 ORF Uncharacterized YIR042C chromosome 9 9 435983 435273 C 2011-02-03 1994-12-10 Putative protein of unknown function; YIR042C is a non-essential gene +S000030300 CDS YIR042C 9 435983 435273 C 2011-02-03 1994-12-10 +S000001482 blocked_reading_frame YIR043C YIR044C chromosome 9 9 438179 437043 C 2014-11-18 1994-12-10|2014-11-18 Blocked reading frame; may encode a non-functional member of the conserved, often subtelomerically-encoded Cos protein family +S000030384 CDS YIR043C 9 438179 437043 C 2014-11-18 1994-12-10|2014-11-18 +S000028970 telomere TEL09R chromosome 9 9 439068 439888 W 43 2011-02-03 2003-09-09 Telomeric region on the right arm of Chromosome IX; composed of an X element core sequence, X element combinatorial repeats, and a short terminal stretch of telomeric repeats +S000028971 telomeric_repeat TEL09R 9 439816 439888 W 2011-02-03 2003-09-09 Terminal telomeric repeats on the right arm of Chromosome IX +S000028972 X_element TEL09R 9 439068 439533 W 2011-02-03 2003-09-09 Telomeric X element Core sequence on the right arm of Chromosome IX; contains an ARS consensus sequence and an Abf1p binding site consensus sequence +S000028973 X_element_combinatorial_repeat TEL09R 9 439534 439815 W 2011-02-03 2003-09-09 Telomeric X element combinatorial repeat on the right arm of Chr IX; contains repeats of the D, C, B and A types, as well as Tbf1p binding sites; formerly called SubTelomeric Repeats +S000178596 not physically mapped OTO1 Protein whose overexpression inhibits growth; encoded by a previously unannotated ORF located between YGR227W and YGR228W in the "C" direction; overexpression of PRM1 or UBP7 suppresses the growth inhibition caused by OTO1 overexpression; "orphan" ORF not conserved in any other known species +S000182414 not physically mapped SMT1 +S000029044 not physically mapped ASL1 S000029006 +S000155235 not physically mapped PDR19 +S000155237 not physically mapped PDR20 +S000155238 not physically mapped PDR21 +S000183332 not physically mapped HTC1 +S000183742 not physically mapped YPL2 +S000183740 not physically mapped YPL1 +S000151128 not physically mapped AIP5 +S000029237 not in systematic sequence of S288C KHR1 KHR1 KHR L000000899 Killer toxin; encoded on the left arm of chromosome IX in some strains, including YJM789 +S000029522 not in systematic sequence of S288C STA1 STA1 MAL5|DEX2 chromosome 9 L000003928 9 Glucoamylase (glucan 1,4-alpha-glucosidase) +S000029524 not in systematic sequence of S288C STA2 STA2 L000002105 Glucoamylase (glucan 1,4-alpha-glucosidase); allows yeast to degrade starch +S000029525 not in systematic sequence of S288C STA3 STA3 L000002106 Starch hydrolysis +S000029679 not in systematic sequence of S288C STRP STRP L000002135 Transmembrane protein with a highly basic C-terminal region +S000029531 not in systematic sequence of S288C SUC1 SUC1 chromosome 7 L000002143 7 228 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) +S000029532 not in systematic sequence of S288C SUC3 SUC3 chromosome 2 L000002145 2 146 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) +S000029533 not in systematic sequence of S288C SUC4 SUC4 SUC6 chromosome 13 L000002146 13 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) +S000029534 not in systematic sequence of S288C SUC5 SUC5 chromosome 4 L000002147 4 -152 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) +S000029535 not in systematic sequence of S288C SUC7 SUC7 chromosome 8 L000002148 8 Invertase; sucrose hydrolyzing enzyme; seven related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in strain S288C; unlike other forms of invertase, Suc7p is unable to hydrolyze raffinose +S000029417 not in systematic sequence of S288C RF2 RF2 chromosome 17 S000007533 17 Maturase-like coding sequence downstream of COX3/Q0275; present in some S. cerevisiae strains and other Saccharomyces species; compound ORF with homology to other group I open reading frames; in S288C is interrupted by two GC clusters, both of which ultimately result in a -1 frameshlft +S000029677 not in systematic sequence of S288C RTM1 RTM1 L000001785 Member of the lipid-translocating exporter (LTE) family; present in multiple copies associated with SUC telomeric loci, amplified in yeasts used for industrial biomass or ethanol production with molasses as substrate +S000029656 not in systematic sequence of S288C MAL2 MAL2 chromosome 3 L000001001 3 95 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL23 trans-acting MAL-activator, MAL21 maltose permease, and MAL22 maltase; on the right arm of Chromosome III, but not in strain S288C +S000029681 not in systematic sequence of S288C MAL21 MAL21 MALT L000001011 Maltose permease; part of the complex locus MAL2 +S000029682 not in systematic sequence of S288C MAL22 MAL22 MALS L000001012 Maltase (alpha-D-glucosidase); encoded within the complex locus MAL2 +S000029685 not in systematic sequence of S288C MAL4 MAL4 chromosome 11 L000001006 11 85 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL43 trans-acting MAL-activator, MAL41 maltose permease, and MAL42 maltase; on right arm of Chromosome XI, but not in strain S288C +S000029686 not in systematic sequence of S288C MAL41 MAL41 MALT L000001018 Maltose permease; part of the complex locus MAL4 +S000029687 not in systematic sequence of S288C MAL42 MAL42 MALS L000001019 Maltase (alpha-D-glucosidase); encoded within the complex locus MAL4 +S000029688 not in systematic sequence of S288C MAL43 MAL43 MALR L000001020 MAL-activator protein; encoded within the complex locus MAL4 +S000029689 not in systematic sequence of S288C MAL6 MAL6 L000001007 Multigene complex, polymeric locus for maltose fermentation; encodes the MAL63 trans-acting MAL-activator, MAL61 maltose permease, and MAL62 maltase; on the left arm of Chromosome VIII, but not in strain S288C +S000029690 not in systematic sequence of S288C MAL62 MAL62 MALS L000001022 Maltase (alpha-D-glucosidase); encoded within the complex locus MAL6 +S000029659 not in systematic sequence of S288C MAL63 MAL63 MALR L000001023 MAL-activator protein; transcription factor; part of the complex locus MAL6, plays a positive role in the regulation of maltose fermentation +S000029660 not in systematic sequence of S288C MATA1 MATA1 A1 L000002970 Expressed copy (at MATa) of a1; homeobox-domain protein that, along with alpha2, represses transcription of haploid-specific genes in diploid cells; MATa1 pre-mRNA splicing requires Bud13p and Ist3p; a1 sequence is not present in SGD because the sequenced S288C strain is MATalpha, not MATa +S000029661 not in systematic sequence of S288C MATA2 MATA2 A2 L000002971 Protein of unknown function; identical to the C-terminal 119 amino acid residues of the MATalpha2 protein; a2 sequence is not present in SGD because the sequenced S288C strain is MATalpha, not MATa +S000029662 not in systematic sequence of S288C MEL1 MEL1 chromosome 2 L000001063 2 -77 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose; regulated by several GAL genes +S000029692 not in systematic sequence of S288C MEL10 MEL10 chromosome 12 L000001072 12 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029663 not in systematic sequence of S288C MEL2 MEL2 L000001064 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029693 not in systematic sequence of S288C MEL3 MEL3 chromosome 16 L000001065 16 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029694 not in systematic sequence of S288C MEL4 MEL4 chromosome 11 L000001066 11 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029664 not in systematic sequence of S288C MEL5 MEL5 chromosome 4 L000001067 4 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029665 not in systematic sequence of S288C MEL6 MEL6 chromosome 13 L000001068 13 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029695 not in systematic sequence of S288C MEL7 MEL7 chromosome 6 L000001069 6 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029696 not in systematic sequence of S288C MEL8 MEL8 chromosome 15 L000001070 15 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029697 not in systematic sequence of S288C MEL9 MEL9 L000001071 Secreted alpha-galactosidase; required for catabolic conversion of melibiose to glucose and galactose +S000029666 not in systematic sequence of S288C MPR1 MPR1 S000007536 L-azetidine-2-carboxylic acid acetyltransferase; reduces intracellular ROS and contributes to L-proline analog resistance and tolerance to ethanol and freezing; member of N-acetyltransferase superfamily; not found in S288C, only present in strains with Sigma1278b background; located on left arm of chromosome XIV approximately 15 kb from telomere +S000029328 not in systematic sequence of S288C NTS1-1 NTS1-1 NTS1 L000001282 Nontranscribed region of the rDNA repeat between the 3'ETS and RDN5; required for rDNA repeat expansion; contains RNA polymerase I termination site +S000080162 not in systematic sequence of S288C KHS1 KHS1 Thermolabile killer toxin encoded on the right arm of Chromosome V +S000029703 not in systematic sequence of S288C AWA1 AWA1 Putative GPI-anchored protein; localized to the cell wall; involved in foam formation in sake mash by conferring hydrophobicity to the cell surface +S000029723 not in systematic sequence of S288C YAR069W-A BIO6 Putative 7-keto-8-aminopelargonic acid (KAPA) synthetase; in sake strains and S. cerevisiae strains YJM627 and A364a; involved in the biotin biosynthesis pathway; homologs present in S. bayanus, S. paradoxus, S. mikatae and S. kudriavzevii +S000029698 not in systematic sequence of S288C ENS2 ENS2 Endo.SceI|RF3 L000001619|L000000562 Mitochondrially-encoded 50 kD subunit of Endo.SceI; a dimeric multi-site-specific endonuclease that introduces double-stranded breaks at a number of well-defined sites on the mitochondrial DNA, inducing homologous recombination +S000134352 not in systematic sequence of S288C SUC8 SUC8 chromosome 10 10 Invertase; sucrose hydrolyzing enzyme; seven closely related but non-identical invertase genes have been described in yeast (SUC1-5, 7, 8) but only SUC2 is in the reference strain (S288C) +S000130715 not in systematic sequence of S288C ENA6 ENA6 chromosome 4 4 Plasma membrane sodium-pumping ATPase; the ENA6 gene is found in the PMR2 locus in the CEN.PK113-7D strain of S. cerevisiae, where other common lab strains have a varying number of the ENA genes (ENA1-ENA5) at the same locus +S000124112 not in systematic sequence of S288C TAT3 TAT3 Permease identified in lager brewing yeast strain Weihenstephan Nr.34; also in RM11-1a, but not S288C; subject to nitrogen catabolite repression and post-translational control, cellular localization dependent on nitrogen source quality +S000124955 not in systematic sequence of S288C MATA MATA MAT Mating type locus; note that the systematic sequence in SGD contains MATalpha sequences +S000125018 not in systematic sequence of S288C YAR070W-A BIO1 Putative pimeloyl-CoA synthetase involved in biotin biosynthesis; highly degraded pseudogenic paralog of YJR154W; functional copies present in S. cerevisiae strains YJM627 and A364a; functional pimeloyl-CoA synthetase (PCAS) genes are homologs of the bioW gene in Bacillus sp. and the bioC-bioH complex of E. coli +S000125021 not in systematic sequence of S288C YHR214W-F BIO8 Putative 7-keto-8-aminopelargonic acid (KAPA) synthetase; highly degraded pseudogenic copy of BIO6/YAR069W-A; functional copy present in S. cerevisiae strains YJM627 and A364a; involved in the biotin biosynthesis pathway +S000125022 not in systematic sequence of S288C YHR214W-G BIO7 Putative pimeloyl-CoA synthetase involved in biotin biosynthesis; in S. cerevisiae strains YJM627 and A364a; highly degraded pseudogenic copy of BIO1/YAR070W-A, which is a paralog of YJR154W +S000029657 not in systematic sequence of S288C MAL23 MAL23 MALR L000001013 MAL-activator protein; encoded within the complex locus MAL2; required for maltose and isomaltose utilization +S000029684 not in systematic sequence of S288C MAL34 MAL34 L000001017 ORF with sequence and positional similarity to the MAL64 gene; the MAL64 gene is thought to be a nonfunctional copy of MAL63; encoded within the complex locus MAL3 in some strains of S. cerevisiae, but not in S288C +S000029691 not in systematic sequence of S288C MAL64 MAL64 L000001024 MAL64 is a nonfunctional homolog of the MAL63 trans-activator; encoded within the complex locus MAL6 +S000029658 not in systematic sequence of S288C MAL61 MAL61 MALT L000001021 High-affinity maltose transporter; narrow substrate specificity, transporting maltose and turanose but not other alpha-glucosides; other names include alpha-glucoside transporter and maltose permease +S000145155 not in systematic sequence of S288C FPG1 FPG1 Putative cell wall mannoprotein involved in foam formation; contains a signal peptide and a putative GPI anchor; protein precursor homologous to Awa1p and Hpf1p +S000133140 not in systematic sequence of S288C XDH1 XDH1 chromosome 15 15 Xylitol dehydrogenase; involved in utilization of xylose as a carbon source; not present in S288C, but located in a 65kb insertion on the right arm of chromosome XV in many wine strains such as EC1118 and AWRI1631 +S000149345 not in systematic sequence of S288C IMI1 IMI1 Protein involved in maintaining mitochondrial integrity and glutathione homeostasis; localized to the cytoplasm; in W303 strain IMI1 is encoded by one continuous open reading frame comprising of YDL037C, the intergenic region and YDL039C, while in the reference sequence of S288C, YDL037C encodes Bsc1p and YDL039C encodes Prm7p. +S000150108 not in systematic sequence of S288C MPR2 MPR2 L-azetidine-2-carboxylic acid acetyltransferase; reduces intracellular ROS, contributes to L-proline analog resistance and tolerance to ethanol and freezing; member of N-acetyltransferase superfamily; not found in S288C, present in strains with Sigma1278b background; located on left arm of Chr X ~ 15 kb from telomere; identical to MPR1 except for one base at position 254, leading to Gly at position 85 in MPR1 and Glu in MPR2; present also in Japanese industrial baker's yeast diff --git a/data/Species.csv b/data/Species.csv index 1db2d8e..97c68fa 100644 --- a/data/Species.csv +++ b/data/Species.csv @@ -1,1015 +1,1015 @@ -"","Name","Classification","Taxon ID","Assembly","Accession","Variation database","Regulation database","Whole genome alignments","Other alignments","In peptide compara","In pan-taxonomic compara" -"","Absidia glauca","Mucoromycotina","4829","AG_v1","GCA_900079185.1","-","-","-","-","-","-" -"","Absidia repens str. NRRL 1336","Mucoromycotina","90262","Absrep1","GCA_002105175.1","-","-","-","-","","-" -"","Acaromyces ingoldii str. MCA 4198 (GCA_003144295)","","215250","Acain1","GCA_003144295.1","-","-","-","-","","-" -"","Acidomyces richmondensis (GCA_001572075)","Acidomyces","245562","ASM157207v1","GCA_001572075.1","-","-","-","-","-","-" -"","Acidomyces richmondensis BFW (GCA_001592465)","Acidomyces","766039","Acidomyces_richmondensis_BFW_v1.0","GCA_001592465.1","-","-","-","-","","-" -"","Acremonium chrysogenum ATCC 11550 (GCA_000769265)","Hypocreales","857340","ASM76926v1","GCA_000769265.1","-","-","-","-","","-" -"","Agaricus bisporus var. burnettii JB137-S8 (GCA_000300555)","Agaricales","597362","Agabi_varbur_1","GCA_000300555.1","-","-","-","-","","-" -"","Allomyces macrogynus ATCC 38327 (GCA_000151295)","Blastocladiales","578462","A_macrogynus_V3","GCA_000151295.1","-","-","-","-","","-" -"","Alternaria alternata str. SRC1lrK2f (GCA_001642055)","Pleosporales","5599","Altal1","GCA_001642055.1","-","-","-","-","","-" -"","Amanita muscaria Koide BX008 (GCA_000827485)","Agaricales","946122","Amanita_muscaria_Koide_BX008_v1.0","GCA_000827485.1","-","-","-","-","","-" -"","Amanita thiersii Skay4041 (GCA_002554575)","Agaricales","703135","Amanita_thiersii_v1.0","GCA_002554575.1","-","-","-","-","","-" -"","Amorphotheca resinae ATCC 22711 (GCA_003019875)","Myxotrichaceae","857342","Amore1","GCA_003019875.1","-","-","-","-","","-" -"","Amphiamblys sp. WSBS2006 (GCA_001875675)","Microsporidia","1866961","ASM187567v1","GCA_001875675.1","-","-","-","-","","-" -"","Anaeromyces robustus str. S4 (GCA_002104895)","","1754192","Anaeromyces_sp._S4_v1.0","GCA_002104895.1","-","-","-","-","","-" -"","Anncaliia algerae PRA109 (GCA_000385855)","Tubulinosematidae","1240240","Annc_alge_PRA109_V4","GCA_000385855.2","-","-","-","-","-","-" -"","Anncaliia algerae PRA339 (GCA_000385875)","Tubulinosematidae","1288291","Annc_alge_insect_USDA_JJB_V2","GCA_000385875.2","-","-","-","-","","-" -"","Anthracocystis flocculosa PF-1 (GCA_000417875)","Ustilaginales","1277687","Pflocc_1.0","GCA_000417875.1","-","-","-","-","","-" -"","Armillaria gallica str. Ar21-2 (GCA_002307695)","Agaricales","47427","Armga1","GCA_002307695.1","-","-","-","-","","-" -"","Armillaria ostoyae (GCA_900157425)","Agaricales","47428","version_2","GCA_900157425.1","-","-","-","-","","-" -"","Armillaria solidipes str. 28-4 (GCA_002307675)","Agaricales","1076256","Armost1","GCA_002307675.1","-","-","-","-","","-" -"","Arthrobotrys oligospora ATCC 24927 (GCA_000225545)","Orbiliales","756982","AOL24927_1.0","GCA_000225545.1","-","-","-","-","","-" -"","Ascochyta rabiei str. ArDII (GCA_001630375)","Pleosporales","5454","AscRab1.0","GCA_001630375.1","-","-","-","-","","-" -"","Ascoidea rubescens DSM 1968 (GCA_001661345)","Saccharomycetales","1344418","Ascru1","GCA_001661345.1","-","-","-","-","","-" -"","Ascosphaera apis ARSEF 7405 (GCA_001636715)","Onygenales","392613","AAP_1.0","GCA_001636715.1","-","-","-","-","","-" -"","Ashbya gossypii","Saccharomycetales","284811","ASM9102v1","GCA_000091025.3","-","","","","","-" -"","Aspergillus aculeatinus CBS 121060 (GCA_003184765)","Eurotiales","1448322","Aspacu1","GCA_003184765.1","-","-","-","-","-","-" -"","Aspergillus aculeatus ATCC 16872 (GCA_001890905)","Eurotiales","690307","Aspac1","GCA_001890905.1","-","-","-","-","-","-" -"","Aspergillus arachidicola str. CBS 117610 (GCA_002749805)","Eurotiales","656916","ASM274980v1","GCA_002749805.1","-","-","-","-","-","-" -"","Aspergillus bombycis str. NRRL26010 (GCA_001792695)","Eurotiales","109264","ASM179269v1","GCA_001792695.1","-","-","-","-","-","-" -"","Aspergillus brasiliensis CBS 101740 (GCA_001889945)","Eurotiales","767769","Aspbr1","GCA_001889945.1","-","-","-","-","-","-" -"","Aspergillus brunneoviolaceus CBS 621.78 (GCA_003184695)","Eurotiales","1450534","Aspbru1","GCA_003184695.1","-","-","-","-","-","-" -"","Aspergillus calidoustus str. SF006504 (GCA_001511075)","Eurotiales","454130","Acal_Allpaths_LG","GCA_001511075.1","-","-","-","-","-","-" -"","Aspergillus campestris IBT 28561 (GCA_002847485)","Eurotiales","1392248","Aspcam1","GCA_002847485.1","-","-","-","-","-","-" -"","Aspergillus candidus str. CBS 102.13 (GCA_002847045)","Eurotiales","41067","Aspcand1","GCA_002847045.1","-","-","-","-","-","-" -"","Aspergillus carbonarius ITEM 5010 (GCA_001990825)","Eurotiales","602072","Aspca3","GCA_001990825.1","-","-","-","-","-","-" -"","Aspergillus clavatus NRRL 1","Eurotiales","344612","ASM271v1","GCA_000002715.1","-","-","-","-","","-" -"","Aspergillus cristatus str. GZAAS20.1005 (GCA_001717485)","Eurotiales","573508","ASM171748v1","GCA_001717485.1","-","-","-","-","-","-" -"","Aspergillus ellipticus CBS 707.79 (GCA_003184645)","Eurotiales","1448320","Aspell1","GCA_003184645.1","-","-","-","-","-","-" -"","Aspergillus eucalypticola CBS 122712 (GCA_003184535)","Eurotiales","1448314","Aspeuc1","GCA_003184535.1","-","-","-","-","-","-" -"","Aspergillus fischeri NRRL 181","Eurotiales","331117","ASM14964v1","GCA_000149645.2","-","-","-","-","","-" -"","Aspergillus flavus AF70 (GCA_000952835)","Eurotiales","1392242","ASM95283v1","GCA_000952835.1","-","-","-","-","-","-" -"","Aspergillus flavus NRRL3357","Eurotiales","332952","JCVI-afl1-v2.0","GCA_000006275.2","-","-","-","-","","-" -"","Aspergillus fumigatus (GCA_002234985)","Eurotiales","746128","ASM223498v1","GCA_002234985.1","-","-","-","-","","-" -"","Aspergillus fumigatus A1163","Eurotiales","451804","ASM15014v1","GCA_000150145.1","-","-","-","-","-","-" -"","Aspergillus fumigatus Af293","Eurotiales","330879","ASM265v1","GCA_000002655.1","-","-","-","-","-","-" -"","Aspergillus fumigatus Z5 (GCA_001029325)","Eurotiales","1437362","ASM102932v1","GCA_001029325.1","-","-","-","-","-","-" -"","Aspergillus fumigatus var. RP-2014 (GCA_000731615)","Eurotiales","1476192","AspFumNiv1.0","GCA_000731615.1","-","-","-","-","-","-" -"","Aspergillus glaucus CBS 516.65 (GCA_001890805)","Eurotiales","1160497","Aspgl1","GCA_001890805.1","-","-","-","-","-","-" -"","Aspergillus heteromorphus CBS 117.55 (GCA_003184545)","Eurotiales","1448321","Asphet1","GCA_003184545.1","-","-","-","-","-","-" -"","Aspergillus indologenus CBS 114.80 (GCA_003184685)","Eurotiales","1450541","Aspind1","GCA_003184685.1","-","-","-","-","-","-" -"","Aspergillus japonicus CBS 114.51 (GCA_003184785)","Eurotiales","1448312","Aspjap1","GCA_003184785.1","-","-","-","-","-","-" -"","Aspergillus lacticoffeatus CBS 101883 (GCA_003184595)","Eurotiales","1450533","Asplac1","GCA_003184595.1","-","-","-","-","-","-" -"","Aspergillus lentulus (GCA_001445615)","Eurotiales","293939","Alt_assembly01","GCA_001445615.1","-","-","-","-","-","-" -"","Aspergillus luchuensis CBS 106.47 (GCA_001890685)","Eurotiales","1137211","Aspfo1","GCA_001890685.1","-","-","-","-","-","-" -"","Aspergillus luchuensis str. RIB 2604 (GCA_001602395)","Eurotiales","1069201","AspL_2604","GCA_001602395.1","-","-","-","-","-","-" -"","Aspergillus neoniger CBS 115656 (GCA_003184625)","Eurotiales","1448310","Aspneo1","GCA_003184625.1","-","-","-","-","-","-" -"","Aspergillus nidulans","Eurotiales","227321","ASM1142v1","GCA_000011425.1","-","-","-","-","","" -"","Aspergillus nidulans FGSC A4 (GCA_000149205)","Eurotiales","227321","ASM14920v2","GCA_000149205.2","-","-","-","-","-","-" -"","Aspergillus niger","Eurotiales","5061","ASM285v2","GCA_000002855.2","-","-","-","","","-" -"","Aspergillus niger (GCA_001515345)","Eurotiales","5061","ASM151534v1","GCA_001515345.1","-","-","-","-","-","-" -"","Aspergillus niger (GCA_900248155)","Eurotiales","5061","Aniger_ATCC_64974_N402","GCA_900248155.1","-","-","-","-","-","-" -"","Aspergillus niger ATCC 1015 (GCA_000230395)","Eurotiales","380704","ASPNI_v3.0","GCA_000230395.2","-","-","-","-","-","-" -"","Aspergillus nomius NRRL 13137 (GCA_001204775)","Eurotiales","1509407","ASM120477v1","GCA_001204775.1","-","-","-","-","-","-" -"","Aspergillus novofumigatus IBT 16806 (GCA_002847465)","Eurotiales","1392255","Aspnov1","GCA_002847465.1","-","-","-","-","-","-" -"","Aspergillus ochraceoroseus IBT 24754 (GCA_002846915)","Eurotiales","1392256","Aspergillus_ochraceoroseus_IBT_24754_v1.1","GCA_002846915.2","-","-","-","-","-","-" -"","Aspergillus ochraceoroseus str. SRRC1432 (GCA_000986665)","Eurotiales","138278","ASM98666v1","GCA_000986665.1","-","-","-","-","-","-" -"","Aspergillus oryzae 100-8 (GCA_000691885)","Eurotiales","1197718","Aspergillus_oryzae_100-8","GCA_000691885.1","-","-","-","-","-","-" -"","Aspergillus oryzae 3.042 (GCA_000269785)","Eurotiales","1160506","AspOry3042","GCA_000269785.2","-","-","-","-","-","-" -"","Aspergillus oryzae RIB40","Eurotiales","510516","ASM18445v3","GCA_000184455.3","-","-","-","-","","-" -"","Aspergillus oryzae str. BCC7051 (GCA_002007945)","Eurotiales","5062","ASM200794v1","GCA_002007945.1","-","-","-","-","-","-" -"","Aspergillus parasiticus SU-1 (GCA_000956085)","Eurotiales","1403190","ASM95608v1","GCA_000956085.1","-","-","-","-","-","-" -"","Aspergillus piperis CBS 112811 (GCA_003184755)","Eurotiales","1448313","Asppip1","GCA_003184755.1","-","-","-","-","-","-" -"","Aspergillus rambellii str. SRRC1468 (GCA_000986645)","Eurotiales","308745","ASM98664v1","GCA_000986645.1","-","-","-","-","-","-" -"","Aspergillus ruber CBS 135680 (GCA_000600275)","Eurotiales","1388766","Eurhe1","GCA_000600275.1","-","-","-","-","-","-" -"","Aspergillus saccharolyticus JOP 1030-1 (GCA_003184585)","Eurotiales","1450539","Aspsac1","GCA_003184585.1","-","-","-","-","-","-" -"","Aspergillus sclerotiicarbonarius CBS 121057 (GCA_003184635)","Eurotiales","1448318","Aspscle1","GCA_003184635.1","-","-","-","-","-","-" -"","Aspergillus sclerotioniger CBS 115572 (GCA_003184525)","Eurotiales","1450535","Aspscl1","GCA_003184525.1","-","-","-","-","-","-" -"","Aspergillus steynii IBT 23096 (GCA_002849105)","Eurotiales","1392250","Aspste1","GCA_002849105.1","-","-","-","-","-","-" -"","Aspergillus sydowii CBS 593.65 (GCA_001890705)","Eurotiales","1036612","Aspsy1","GCA_001890705.1","-","-","-","-","-","-" -"","Aspergillus taichungensis str. IBT 19404 (GCA_002850765)","Eurotiales","482145","Asptaic1","GCA_002850765.1","-","-","-","-","-","-" -"","Aspergillus terreus NIH2624","Eurotiales","341663","ASM14961v1","GCA_000149615.1","-","-","-","-","","-" -"","Aspergillus thermomutatus (GCA_002237265)","Eurotiales","41047","ASM223726v1","GCA_002237265.1","-","-","-","-","-","-" -"","Aspergillus tubingensis CBS 134.48 (GCA_001890745)","Eurotiales","767770","Asptu1","GCA_001890745.1","-","-","-","-","-","-" -"","Aspergillus turcosus (GCA_002234965)","Eurotiales","1245748","ASM223496v1","GCA_002234965.1","-","-","-","-","-","-" -"","Aspergillus turcosus (GCA_002234975)","Eurotiales","1245748","ASM223497v1","GCA_002234975.1","-","-","-","-","-","-" -"","Aspergillus udagawae str. IFM 46973 (GCA_001078395)","Eurotiales","91492","Aud_assembly01","GCA_001078395.1","-","-","-","-","-","-" -"","Aspergillus ustus str. 3.3904 (GCA_000812125)","Eurotiales","40382","Austus1.0","GCA_000812125.1","-","-","-","-","-","-" -"","Aspergillus uvarum CBS 121591 (GCA_003184745)","Eurotiales","1448315","Aspuva1","GCA_003184745.1","-","-","-","-","-","-" -"","Aspergillus vadensis CBS 113365 (GCA_003184925)","Eurotiales","1448311","Aspvad1","GCA_003184925.1","-","-","-","-","-","-" -"","Aspergillus versicolor CBS 583.65 (GCA_001890125)","Eurotiales","1036611","Aspve1","GCA_001890125.1","-","-","-","-","-","-" -"","Aspergillus violaceofuscus CBS 115571 (GCA_003184705)","Eurotiales","1450538","Aspvio1","GCA_003184705.1","-","-","-","-","-","-" -"","Aspergillus wentii DTO 134E9 (GCA_001890725)","Eurotiales","1073089","Aspwe1","GCA_001890725.1","-","-","-","-","-","-" -"","Aureobasidium melanogenum CBS 110374 (GCA_000721775)","Dothideales","1043003","Aureobasidium_pullulans_var._melanogenum_CBS_110374_v1.0","GCA_000721775.1","-","-","-","-","","-" -"","Aureobasidium namibiae CBS 147.97 (GCA_000721765)","Dothideales","1043004","Aureobasidium_pullulans_var._namibiae_CBS_147.97_v1.0","GCA_000721765.1","-","-","-","-","","-" -"","Aureobasidium pullulans (GCA_001678115)","Dothideales","5580","ASM167811v1","GCA_001678115.1","-","-","-","-","-","-" -"","Aureobasidium pullulans EXF-150 (GCA_000721785)","Dothideales","1043002","Aureobasidium_pullulans_var._pullulans_EXF-150_assembly_version_1.0","GCA_000721785.1","-","-","-","-","","-" -"","Aureobasidium subglaciale EXF-2481 (GCA_000721755)","Dothideales","1043005","Aureobasidium_pullulans_var._subglaciale_EXF-2481_v1.0","GCA_000721755.1","-","-","-","-","","-" -"","Babjeviella inositovora NRRL Y-12698 (GCA_001661335)","Saccharomycetales","984486","Babin1","GCA_001661335.1","-","-","-","-","","-" -"","Basidiobolus meristosporus CBS 931.73 (GCA_002104905)","","1314790","Basme2finSC","GCA_002104905.1","-","-","-","-","","-" -"","Batrachochytrium dendrobatidis JAM81 (GCA_000203795)","Rhizophydiales","684364","v1.0","GCA_000203795.1","-","-","-","-","-","-" -"","Batrachochytrium dendrobatidis JEL423 (GCA_000149865)","Rhizophydiales","403673","BD_JEL423","GCA_000149865.1","-","-","-","-","","-" -"","Batrachochytrium salamandrivorans str. BS (GCA_002006685)","Rhizophydiales","1357716","Batr_sala_BS_V1","GCA_002006685.1","-","-","-","-","","-" -"","Baudoinia panamericana UAMH 10762 (GCA_000338955)","Capnodiales","717646","Bauco1","GCA_000338955.1","-","-","-","-","","-" -"","Beauveria bassiana","Hypocreales","176275","ASM168263v1","GCA_001682635.1","-","-","-","","","-" -"","Beauveria bassiana ARSEF 2860 (GCA_000280675)","Hypocreales","655819","ASM28067v1","GCA_000280675.1","-","-","-","-","-","-" -"","Beauveria bassiana D1-5 (GCA_000770705)","Hypocreales","1245745","BBA1.0","GCA_000770705.1","-","-","-","-","-","-" -"","Beauveria bassiana str. JEF-007 (GCA_002871155)","Hypocreales","176275","ASM287115v1","GCA_002871155.1","-","-","-","-","-","-" -"","Bifiguratus adelaidae str. AZ0501","Mucoromycotina","1938954","ASM226119v1","GCA_002261195.1","-","-","-","-","","-" -"","Bipolaris maydis ATCC 48331 (GCA_000354255)","Pleosporales","665024","CocheC4_1","GCA_000354255.1","-","-","-","-","-","-" -"","Bipolaris maydis C5 (GCA_000338975)","Pleosporales","701091","CocheC5_3","GCA_000338975.1","-","-","-","-","","-" -"","Bipolaris oryzae ATCC 44560 (GCA_000523455)","Pleosporales","930090","Cochliobolus_miyabeanus_v1.0","GCA_000523455.1","-","-","-","-","","-" -"","Bipolaris sorokiniana ND90Pr (GCA_000338995)","Pleosporales","665912","Cocsa1","GCA_000338995.1","-","-","-","-","","-" -"","Bipolaris victoriae FI3 (GCA_000527765)","Pleosporales","930091","Cochliobolus_victoriae_v1.0","GCA_000527765.1","-","-","-","-","","-" -"","Bipolaris zeicola 26-R-13 (GCA_000523435)","Pleosporales","930089","Cochliobolus_carbonum_v1.0","GCA_000523435.1","-","-","-","-","","-" -"","Blastomyces dermatitidis ATCC 18188 (GCA_000151595)","Onygenales","653446","BD_ATCC18188_V1","GCA_000151595.1","-","-","-","-","-","-" -"","Blastomyces dermatitidis ATCC 26199 (GCA_000166155)","Onygenales","447095","BD_ATCC26199_V2","GCA_000166155.1","-","-","-","-","-","-" -"","Blastomyces dermatitidis ER-3 (GCA_000003525)","Onygenales","559297","BD_ER3_V1","GCA_000003525.2","-","-","-","-","","-" -"","Blastomyces gilchristii SLH14081 (GCA_000003855)","Onygenales","559298","BD_SLH14081_V1","GCA_000003855.2","-","-","-","-","","-" -"","Blastomyces percursus str. EI222 (GCA_001883805)","Onygenales","1658174","Blas_perc_EI222_V1","GCA_001883805.1","-","-","-","-","","-" -"","Blumeria graminis","Erysiphales","546991","EF2","GCA_000151065.2","-","-","-","","","-" -"","Blumeria graminis f. sp. tritici 96224 (GCA_000418435)","Erysiphales","1268274","Bgt_454_newbler_assembly","GCA_000418435.1","-","-","-","-","-","-" -"","Botryobasidium botryosum FD-172 SS1 (GCA_000697705)","Cantharellales","930990","Botbo1","GCA_000697705.1","-","-","-","-","","-" -"","Botrytis cinerea B05.10","Sclerotiniaceae","332648","ASM83294v1","GCA_000143535.4","-","-","-","","","-" -"","Botrytis cinerea BcDW1 (GCA_000349525)","Sclerotiniaceae","1290391","BcDW1","GCA_000349525.1","-","-","-","-","-","-" -"","Botrytis cinerea T4 (GCA_000227075)","Sclerotiniaceae","999810","BotFuc_Mar2011","GCA_000227075.1","-","-","-","-","-","-" -"","Brettanomyces bruxellensis AWRI1499 (GCA_000259595)","Saccharomycetales","1124627","AWRI1499_v1.0","GCA_000259595.1","-","-","-","-","","-" -"","Byssochlamys spectabilis No. 5 str. Paecilomyces variotii No. 5 (NBRC109023) (GCA_000497085)","Eurotiales","1356009","PVAR5_assembly01","GCA_000497085.1","-","-","-","-","","-" -"","Cadophora sp. DSE1049 (GCA_003073865)","Helotiales","1485229","Cadsp1","GCA_003073865.1","-","-","-","-","","-" -"","Calocera cornea HHB12733 (GCA_001632435)","Dacrymycetales","1353952","Calco1","GCA_001632435.1","-","-","-","-","","-" -"","Calocera viscosa TUFC12733 (GCA_001630345)","Dacrymycetales","1330018","Calvi1","GCA_001630345.1","-","-","-","-","","-" -"","Candida albicans 12C (GCA_000773845)","Saccharomycetales","1094981","Cand_albi_12C_V2","GCA_000773845.1","-","-","-","-","-","-" -"","Candida albicans 19F (GCA_000775445)","Saccharomycetales","1094987","Cand_albi_19F_V2","GCA_000775445.1","-","-","-","-","-","-" -"","Candida albicans Ca6 (GCA_000784695)","Saccharomycetales","1165368","Cand_albi_Ca6_V2","GCA_000784695.1","-","-","-","-","-","-" -"","Candida albicans GC75 (GCA_000773735)","Saccharomycetales","1094988","Cand_albi_GC75_V1","GCA_000773735.1","-","-","-","-","-","-" -"","Candida albicans L26 (GCA_000775455)","Saccharomycetales","1094982","Cand_albi_L26_V2","GCA_000775455.1","-","-","-","-","-","-" -"","Candida albicans P34048 (GCA_000775465)","Saccharomycetales","1094991","Cand_albi_P34048_V1","GCA_000775465.1","-","-","-","-","-","-" -"","Candida albicans P37005 (GCA_000773745)","Saccharomycetales","1094985","Cand_albi_P37005_V2","GCA_000773745.1","-","-","-","-","-","-" -"","Candida albicans P37037 (GCA_000773825)","Saccharomycetales","1094992","Cand_albi_P37037_V1","GCA_000773825.1","-","-","-","-","-","-" -"","Candida albicans P37039 (GCA_000784515)","Saccharomycetales","1094993","Cand_albi_P37039_V1","GCA_000784515.1","-","-","-","-","-","-" -"","Candida albicans P57055 (GCA_000775505)","Saccharomycetales","1094996","Cand_albi_P57055_V1","GCA_000775505.1","-","-","-","-","-","-" -"","Candida albicans P57072 (GCA_000773805)","Saccharomycetales","1094990","Cand_albi_P57072_V1","GCA_000773805.1","-","-","-","-","-","-" -"","Candida albicans P60002 (GCA_000784525)","Saccharomycetales","1094986","Cand_albi_P60002_V1","GCA_000784525.1","-","-","-","-","-","-" -"","Candida albicans P75010 (GCA_000784575)","Saccharomycetales","1094994","Cand_albi_P75010_V1","GCA_000784575.1","-","-","-","-","-","-" -"","Candida albicans P75016 (GCA_000784595)","Saccharomycetales","1094995","Cand_albi_P75016_V1","GCA_000784595.1","-","-","-","-","-","-" -"","Candida albicans P75063 (GCA_000775525)","Saccharomycetales","1094997","Cand_albi_P75063_V1","GCA_000775525.1","-","-","-","-","-","-" -"","Candida albicans P76055 (GCA_000784505)","Saccharomycetales","1094998","Cand_albi_P76055_V1","GCA_000784505.1","-","-","-","-","-","-" -"","Candida albicans P76067 (GCA_000784495)","Saccharomycetales","1094999","Cand_albi_P76067_V1","GCA_000784495.1","-","-","-","-","-","-" -"","Candida albicans P78042 (GCA_000784615)","Saccharomycetales","1095000","Cand_albi_P78042_V1","GCA_000784615.1","-","-","-","-","-","-" -"","Candida albicans P78048 (GCA_000773725)","Saccharomycetales","1094989","Cand_albi_P78048_V1","GCA_000773725.1","-","-","-","-","-","-" -"","Candida albicans P87 (GCA_000774085)","Saccharomycetales","1094984","Cand_albi_P87_V2","GCA_000774085.1","-","-","-","-","-","-" -"","Candida albicans P94015 (GCA_000773755)","Saccharomycetales","1094983","Cand_albi_P94015_V1","GCA_000773755.1","-","-","-","-","-","-" -"","Candida albicans SC5314 (GCA_000784635)","Saccharomycetales","237561","Cand_albi_SC5314_V4","GCA_000784635.1","-","-","-","-","","-" -"","Candida albicans SC5314 (GCA_000784655)","Saccharomycetales","237561","Cand_albi_SC5314_V3","GCA_000784655.1","-","-","-","-","-","-" -"","Candida albicans WO-1 (GCA_000149445)","Saccharomycetales","294748","ASM14944v2","GCA_000149445.2","-","-","-","-","-","-" -"","Candida dubliniensis CD36 (GCA_000026945)","Saccharomycetales","573826","ASM2694v1","GCA_000026945.1","-","-","-","-","-","-" -"","Candida maltosa Xu316 (GCA_000344705)","Saccharomycetales","1245528","Cmaltosa_v01","GCA_000344705.1","-","-","-","-","-","-" -"","Candida orthopsilosis Co 90-125 (GCA_000315875)","Saccharomycetales","1136231","ASM31587v1","GCA_000315875.1","-","-","-","-","-","-" -"","Candida parapsilosis str. CDC317 (GCA_000182765)","Saccharomycetales","5480","ASM18276v2","GCA_000182765.2","-","-","-","-","","-" -"","Candida tropicalis MYA-3404 (GCA_000006335)","Saccharomycetales","294747","ASM633v3","GCA_000006335.3","-","-","-","-","","-" -"","Capronia coronata CBS 617.96 (GCA_000585585)","Chaetothyriomycetidae","1182541","Capr_coro_CBS_617_96_V1","GCA_000585585.1","-","-","-","-","","-" -"","Capronia epimyces CBS 606.96 (GCA_000585565)","Chaetothyriomycetidae","1182542","Capr_epim_CBS_606_96_V1","GCA_000585565.1","-","-","-","-","","-" -"","Catenaria anguillulae PL171 (GCA_002102555)","Blastocladiales","765915","Catan2","GCA_002102555.1","-","-","-","-","","-" -"","Ceraceosorus bombacis (GCA_900000165)","","401625","Ceraceosorus_bombacis","GCA_900000165.1","-","-","-","-","-","-" -"","Ceraceosorus guamensis str. MCA 4658 (GCA_003144195)","","1522189","Cersp1","GCA_003144195.1","-","-","-","-","","-" -"","Ceratocystis platani str. CFO (GCA_000978885)","Microascales","88771","ASM97888v1","GCA_000978885.1","-","-","-","-","","-" -"","Cercospora berteroae (GCA_002933655)","Capnodiales","357750","Cbert_1","GCA_002933655.1","-","-","-","-","","-" -"","Cercospora beticola (GCA_002742065)","Capnodiales","122368","CB0940_V2","GCA_002742065.1","-","-","-","-","","-" -"","Cercospora zeina str. CMW25467 (GCA_002844615)","Capnodiales","348901","ASM284461v1","GCA_002844615.1","-","-","-","-","","-" -"","Chaetomium globosum CBS 148.51 (GCA_000143365)","Sordariales","306901","ASM14336v1","GCA_000143365.1","-","-","-","-","","-" -"","Chaetomium thermophilum var. thermophilum DSM 1495 (GCA_000221225)","Sordariales","759272","CTHT_3.0","GCA_000221225.1","-","-","-","-","","-" -"","Choanephora cucurbitarum str. KUS-F28377 (GCA_001683725)","Mucoromycotina","101091","ASM168372v1","GCA_001683725.1","-","-","-","-","","-" -"","Cladophialophora bantiana CBS 173.52 (GCA_000835475)","Chaetothyriomycetidae","1442370","Clad_bant_CBS_173_52_V1","GCA_000835475.1","-","-","-","-","","-" -"","Cladophialophora carrionii CBS 160.54 (GCA_000365165)","Chaetothyriomycetidae","1279043","Clad_carr_CBS_160_54_V1","GCA_000365165.2","-","-","-","-","-","-" -"","Cladophialophora carrionii str. KSF (GCA_001700775)","Chaetothyriomycetidae","86049","ASM170077v1","GCA_001700775.1","-","-","-","-","","-" -"","Cladophialophora immunda str. CBS 83496 (GCA_000835495)","Chaetothyriomycetidae","569365","Clad_immu_CBS83496_V1","GCA_000835495.1","-","-","-","-","","-" -"","Cladophialophora psammophila CBS 110553 (GCA_000585535)","Chaetothyriomycetidae","1182543","Clad_psam_CBS_110553_V1","GCA_000585535.1","-","-","-","-","","-" -"","Cladophialophora yegresii CBS 114405 (GCA_000585515)","Chaetothyriomycetidae","1182544","Clad_yegr_CBS_114405_V1","GCA_000585515.1","-","-","-","-","","-" -"","Claviceps purpurea 20.1 (GCA_000347355)","Hypocreales","1111077","ASM34735v1","GCA_000347355.1","-","-","-","-","","-" -"","Clavispora lusitaniae ATCC 42720 (GCA_000003835)","Saccharomycetales","306902","ASM383v1","GCA_000003835.1","-","-","-","-","","-" -"","Clavispora lusitaniae str. CBS 6936 (GCA_001673695)","Saccharomycetales","36911","ASM167369v2","GCA_001673695.2","-","-","-","-","-","-" -"","Clohesyomyces aquaticus str. CBS 115471 (GCA_002105025)","Pleosporales","1231657","Cloaq1","GCA_002105025.1","-","-","-","-","","-" -"","Coccidioides immitis H538.4 (GCA_000149815)","Onygenales","396776","ASM14981v1","GCA_000149815.1","-","-","-","-","","-" -"","Coccidioides immitis RMSCC 2394 (GCA_000149895)","Onygenales","404692","ASM14989v1","GCA_000149895.1","-","-","-","-","-","-" -"","Coccidioides immitis RMSCC 3703 (GCA_000150085)","Onygenales","454286","ASM15008v1","GCA_000150085.1","-","-","-","-","-","-" -"","Coccidioides immitis RS (GCA_000149335)","Onygenales","246410","ASM14933v2","GCA_000149335.2","-","-","-","-","-","-" -"","Coccidioides posadasii C735 delta SOWgp (GCA_000151335)","Onygenales","222929","JCVI-cpa1-1.0","GCA_000151335.1","-","-","-","-","-","-" -"","Coccidioides posadasii RMSCC 3488 (GCA_000150055)","Onygenales","454284","ASM15005v1","GCA_000150055.1","-","-","-","-","-","-" -"","Coccidioides posadasii str. Silveira (GCA_000170175)","Onygenales","443226","CPS2","GCA_000170175.2","-","-","-","-","","-" -"","Colletotrichum chlorophyti str. NTL11 (GCA_001937105)","Glomerellales","708187","ASM193710v1","GCA_001937105.1","-","-","-","-","-","-" -"","Colletotrichum fioriniae PJ7 (GCA_000582985)","Glomerellales","1445577","CFIO01","GCA_000582985.1","-","-","-","-","-","-" -"","Colletotrichum gloeosporioides","Glomerellales","1213859","GCA_000319635.1","GCA_000319635.1","-","-","-","","","-" -"","Colletotrichum gloeosporioides Cg-14 (GCA_000446055)","Glomerellales","1237896","Colletotrichum_gloeosporioides1","GCA_000446055.1","-","-","-","-","-","-" -"","Colletotrichum graminicola","Glomerellales","645133","C_graminicola_M1_001_V1","GCA_000149035.1","-","-","-","","","-" -"","Colletotrichum higginsianum","Glomerellales","80884","GCA_000313795.2","GCA_000313795.2","-","-","-","","","-" -"","Colletotrichum higginsianum IMI 349063 (GCA_001672515)","Glomerellales","759273","ASM167251v1","GCA_001672515.1","-","-","-","-","-","-" -"","Colletotrichum incanum str. MAFF 238704 (GCA_001625285)","Glomerellales","1573173","Ci238704v1","GCA_001625285.1","-","-","-","-","-","-" -"","Colletotrichum incanum str. MAFF238712 (GCA_001855235)","Glomerellales","1573173","ASM185523v1","GCA_001855235.1","-","-","-","-","-","-" -"","Colletotrichum nymphaeae SA-01 (GCA_001563115)","Glomerellales","1460502","CNYM01","GCA_001563115.1","-","-","-","-","-","-" -"","Colletotrichum orbiculare","Glomerellales","1213857","GCA_000350065.1","GCA_000350065.1","-","-","-","","","-" -"","Colletotrichum orchidophilum str. IMI 309357 (GCA_001831195)","Glomerellales","1209926","CORC01","GCA_001831195.1","-","-","-","-","-","-" -"","Colletotrichum salicis str. CBS 607.94 (GCA_001563125)","Glomerellales","1209931","CSAL01","GCA_001563125.1","-","-","-","-","-","-" -"","Colletotrichum simmondsii str. CBS122122 (GCA_001563135)","Glomerellales","703756","CSIM01","GCA_001563135.1","-","-","-","-","-","-" -"","Colletotrichum sublineola str. TX430BB (GCA_000696135)","Glomerellales","1173701","ASM69613v1","GCA_000696135.1","-","-","-","-","-","-" -"","Colletotrichum tofieldiae str. 0861 (GCA_001625265)","Glomerellales","708197","Ct0861v1","GCA_001625265.1","-","-","-","-","-","-" -"","Conidiobolus coronatus NRRL 28638 (GCA_001566745)","","796925","Conidiobolus_coronatus_NRRL28638","GCA_001566745.1","-","-","-","-","","-" -"","Coniella lustricola str. B22-T-1 (GCA_003019895)","Sordariomycetidae","2025994","Coniella_lustricola_v1.0","GCA_003019895.1","-","-","-","-","","-" -"","Coniochaeta ligniaria NRRL 30616 (GCA_001879275)","Sordariomycetidae","1408157","Conlig_v1.0","GCA_001879275.1","-","-","-","-","","-" -"","Coniophora puteana RWD-64-598 SS2 (GCA_000271625)","Boletales","741705","Conpu1","GCA_000271625.1","-","-","-","-","","-" -"","Coniosporium apollinis CBS 100218 str. CBS 352.97 (GCA_000281105)","","1168221","Coni_apol_CBS100218__V1","GCA_000281105.1","-","-","-","-","","-" -"","Coprinopsis cinerea okayama7#130 (GCA_000182895)","Agaricales","240176","CC3","GCA_000182895.1","-","-","-","-","","-" -"","Cordyceps brongniartii RCEF 3172 (GCA_001636735)","Hypocreales","1081107","BBO_1.0","GCA_001636735.1","-","-","-","-","","-" -"","Cordyceps confragosa RCEF 1005 (GCA_001636795)","Hypocreales","1081108","LEL_1.0","GCA_001636795.1","-","-","-","-","","-" -"","Cordyceps confragosa str. UM487 (GCA_001653215)","Hypocreales","1105325","ASM165321v1","GCA_001653215.1","-","-","-","-","-","-" -"","Cordyceps fumosorosea ARSEF 2679 (GCA_001636725)","Hypocreales","1081104","ISF_1.0","GCA_001636725.1","-","-","-","-","","-" -"","Cordyceps militaris CM01 (GCA_000225605)","Hypocreales","983644","CmilitarisCM01_v01","GCA_000225605.1","-","-","-","-","","-" -"","Cordyceps sp. RAO-2017 (GCA_002591385)","Hypocreales","2004951","Hirsu2","GCA_002591385.1","-","-","-","-","","-" -"","Corynespora cassiicola Philippines (GCA_003016335)","Pleosporales","1448308","Corynespora_cassiicola_v1.0","GCA_003016335.1","-","-","-","-","","-" -"","Cryptococcus amylolentus CBS 6039 (GCA_001720205)","Tremellales","1295533","Cryp_amyl_CBS6039_V3","GCA_001720205.1","-","-","-","-","","-" -"","Cryptococcus amylolentus CBS 6273 (GCA_001720235)","Tremellales","1296118","Cryp_amyl_CBS6273_V2","GCA_001720235.1","-","-","-","-","-","-" -"","Cryptococcus depauperatus CBS 7841 (GCA_001720195)","Tremellales","1295531","Filo_depa_CBS7841_V1","GCA_001720195.1","-","-","-","-","","-" -"","Cryptococcus depauperatus CBS 7855 (GCA_001720245)","Tremellales","1295532","Filo_depa_CBS7855_V2","GCA_001720245.1","-","-","-","-","-","-" -"","Cryptococcus gattii CA1280 (GCA_000836335)","Tremellales","1296109","Cryp_gatt_CA1280_V1","GCA_000836335.1","-","-","-","-","-","-" -"","Cryptococcus gattii CA1873 (GCA_000855695)","Tremellales","1296111","Cryp_gatt_CA1873_V1","GCA_000855695.1","-","-","-","-","-","-" -"","Cryptococcus gattii E566 (GCA_000875815)","Tremellales","1296102","Cryp_gatt_E566_V1","GCA_000875815.1","-","-","-","-","-","-" -"","Cryptococcus gattii EJB2 (GCA_000835745)","Tremellales","1296103","Cryp_gatt_EJB2_V1","GCA_000835745.1","-","-","-","-","-","-" -"","Cryptococcus gattii NT-10 (GCA_000935105)","Tremellales","1296108","Cryp_gatt_NT-10_V1","GCA_000935105.1","-","-","-","-","-","-" -"","Cryptococcus gattii Ru294 (GCA_000836355)","Tremellales","1296112","Cryp_gatt_Ru294_V1","GCA_000836355.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII 2001/935-1 (GCA_000835815)","Tremellales","1334442","Cryp_gatt_2001_935-1_V1","GCA_000835815.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII 99/473 (GCA_000836455)","Tremellales","1296104","Cryp_gatt_99_473_V1","GCA_000836455.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII CA1014 (GCA_000875795)","Tremellales","1296107","Cryp_gatt_CA1014_V1","GCA_000875795.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII CBS 10090 (GCA_000835765)","Tremellales","1296101","Cryp_gatt_CBS10090_V1","GCA_000835765.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII LA55 (GCA_000836315)","Tremellales","1296106","Cryp_gatt_LA55_V1","GCA_000836315.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII MMRL2647 (GCA_000875855)","Tremellales","1296117","Cryp_gatt_MMRL2647_V2","GCA_000875855.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGII R265 (GCA_000149475)","Tremellales","294750","CNB2","GCA_000149475.3","-","-","-","-","-","-" -"","Cryptococcus gattii VGII Ram5 (GCA_000836375)","Tremellales","1296110","Cryp_gatt_Ram5_V1","GCA_000836375.1","-","-","-","-","-","-" -"","Cryptococcus gattii VGIV IND107 (GCA_000835755)","Tremellales","1296105","Cryp_gatt_IND107_V2","GCA_000835755.1","-","-","-","-","-","-" -"","Cryptococcus gattii WM276 (GCA_000185945)","Tremellales","367775","ASM18594v1","GCA_000185945.1","-","-","-","-","","-" -"","Cryptococcus neoformans var. grubii 125.91 (GCA_002215885)","Tremellales","1230079","Cryp_neof_125_91_V1","GCA_002215885.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii A1-35-8 (GCA_002221985)","Tremellales","1230081","Cryp_neof_grubii_A1-35-8_V1","GCA_002221985.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii A2-102-5 (GCA_002222375)","Tremellales","1230057","Cryp_neof_A2_102_5_V1","GCA_002222375.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii A5-35-17 (GCA_002222215)","Tremellales","1230080","Cryp_neof_grubii_A5-35-17_V1","GCA_002222215.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii AD1-7a (GCA_002220445)","Tremellales","1230056","Cryp_neof_AD1_7a_V1","GCA_002220445.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii AD1-83a (GCA_002215765)","Tremellales","1230065","Cryp_neof_AD1_83a_V1","GCA_002215765.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii AD2-60a (GCA_002215775)","Tremellales","1230059","Cryp_neof_AD2_60a_V1","GCA_002215775.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Br795 (GCA_002222225)","Tremellales","1230061","Cryp_neof_Br795_V1","GCA_002222225.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Bt1 (GCA_002215705)","Tremellales","1230073","Cryp_neof_Bt1_V1","GCA_002215705.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Bt120 (GCA_002222465)","Tremellales","1230070","Cryp_neof_Bt120_V1","GCA_002222465.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Bt15 (GCA_002222335)","Tremellales","1230071","Cryp_neof_Bt15_V1","GCA_002222335.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Bt63 (GCA_002234625)","Tremellales","1230075","Cryp_neof_Bt63_V1","GCA_002234625.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Bt85 (GCA_002215835)","Tremellales","1230076","Cryp_neof_Bt85_V1","GCA_002215835.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii C23 (GCA_002215825)","Tremellales","1230055","Cryp_neof_C23_V1","GCA_002215825.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii CHC193 (GCA_002222295)","Tremellales","1230064","Cryp_neof_CHC193_V1","GCA_002222295.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii D17-1 (GCA_002222255)","Tremellales","1230058","Cryp_neof_D17_1_V1","GCA_002222255.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Gb118 (GCA_002224005)","Tremellales","1230060","Cryp_neof_Gb118_V1","GCA_002224005.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii H99 (GCA_000149245)","Tremellales","235443","CNA3","GCA_000149245.3","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii MW-RSA1955 (GCA_002222455)","Tremellales","1230066","Cryp_neof_MW_RSA1955_V1","GCA_002222455.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii MW-RSA36 (GCA_002222395)","Tremellales","1230062","Cryp_neof_MW_RSA36_V1","GCA_002222395.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii MW-RSA852 (GCA_002220035)","Tremellales","1230069","Cryp_neof_MW_RSA852_V1","GCA_002220035.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Th84 (GCA_002222315)","Tremellales","1230067","Cryp_neof_Th84_V1","GCA_002222315.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Tu259-1 (GCA_002222325)","Tremellales","1230072","Cryp_neof_Tu259_1_V1","GCA_002222325.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Tu401-1 (GCA_002222475)","Tremellales","1230077","Cryp_neof_Tu401_1_V1","GCA_002222475.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii Ze90-1 (GCA_002222385)","Tremellales","1230078","Cryp_neof_Ze90_1_V1","GCA_002222385.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii c45 (GCA_002215855)","Tremellales","1230068","Cryp_neof_C45_V1","GCA_002215855.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii c8 (GCA_002222405)","Tremellales","1230063","Cryp_neof_C8_V1","GCA_002222405.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CCTP51 (GCA_002217545)","Tremellales","178876","Cryp_neof_grubii_cng10_V1","GCA_002217545.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CM20 (GCA_002222115)","Tremellales","178876","Cryp_neof_grubii_cng5_V1","GCA_002222115.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CM24 (GCA_002222145)","Tremellales","178876","Cryp_neof_grubii_cng6_V1","GCA_002222145.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CM36 (GCA_002222245)","Tremellales","178876","Cryp_neof_grubii_cng2_V1","GCA_002222245.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CM50 (GCA_002222135)","Tremellales","178876","Cryp_neof_grubii_cng1_V1","GCA_002222135.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CM52 (GCA_002222165)","Tremellales","178876","Cryp_neof_grubii_cng3_V1","GCA_002222165.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. CM64 (GCA_002222025)","Tremellales","178876","Cryp_neof_grubii_cng4_V1","GCA_002222025.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. KN99 (GCA_002216725)","Tremellales","178876","ASM221672v1","GCA_002216725.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. RCT21 (GCA_002222155)","Tremellales","178876","Cryp_neof_grubii_cng11_V1","GCA_002222155.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. RCT54 (GCA_002222015)","Tremellales","178876","Cryp_neof_grubii_cng8_V1","GCA_002222015.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. RCT6 (GCA_002222095)","Tremellales","178876","Cryp_neof_grubii_cng7_V1","GCA_002222095.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. V2 (GCA_002215755)","Tremellales","178876","Cneo_seroA_V2","GCA_002215755.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. grubii str. WM-1408 (GCA_002220045)","Tremellales","178876","Cneo_seroA_WM1408","GCA_002220045.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. neoformans B-3501A (GCA_000149385)","Tremellales","283643","ASM14938v1","GCA_000149385.1","-","-","-","-","-","-" -"","Cryptococcus neoformans var. neoformans JEC21","Tremellales","214684","ASM9104v1","GCA_000091045.1","-","-","-","-","","-" -"","Cutaneotrichosporon oleaginosum str. IBC0246 (GCA_001027345)","","879819","Triol1","GCA_001027345.1","-","-","-","-","","-" -"","Cyberlindnera fabianii str. 65 (GCA_001983305)","Saccharomycetales","36022","ASM198330v1","GCA_001983305.1","-","-","-","-","-","-" -"","Cyberlindnera fabianii str. YJS4271 (GCA_003205855)","Saccharomycetales","36022","ASM320585v1","GCA_003205855.1","-","-","-","-","","-" -"","Cyberlindnera jadinii NRRL Y-1542 (GCA_001661405)","Saccharomycetales","983966","Cybja1","GCA_001661405.1","-","-","-","-","-","-" -"","Cyberlindnera jadinii str. CBS1600 (GCA_001245095)","Saccharomycetales","4903","cj1","GCA_001245095.1","-","-","-","-","","-" -"","Cylindrobasidium torrendii FP15055 ss-10 (GCA_000934385)","Agaricales","1314674","Cylto1","GCA_000934385.1","-","-","-","-","","-" -"","Cyphellophora europaea CBS 101466 (GCA_000365145)","Chaetothyriomycetidae","1220924","Phia_euro_CBS_101466_V1","GCA_000365145.2","-","-","-","-","","-" -"","Dacryopinax primogenitus str. DJM-731 SS1 (GCA_000292625)","Dacrymycetales","1858805","Dacryopinax_sp._DJM_731_SSP1_v1.0","GCA_000292625.1","-","-","-","-","","-" -"","Dactylellina haptotyla CBS 200.50 (GCA_000441935)","Orbiliales","1284197","MHA_v2","GCA_000441935.1","-","-","-","-","","-" -"","Daedalea quercina L-15889 (GCA_001632345)","Polyporales","1314783","Daequ1","GCA_001632345.1","-","-","-","-","","-" -"","Daldinia sp. EC12 (GCA_002120325)","Xylariales","1001832","DalEC12_v.1.0","GCA_002120325.1","-","-","-","-","","-" -"","Debaryomyces fabryi str. CBS 789 (GCA_001447935)","Saccharomycetales","58627","debFab1.0","GCA_001447935.1","-","-","-","-","","-" -"","Debaryomyces hansenii CBS767 (GCA_000006445)","Saccharomycetales","284592","ASM644v2","GCA_000006445.2","-","-","-","-","","-" -"","Diaporthe ampelina (GCA_001006365)","Sordariomycetidae","1214573","UCDDA912v1.0","GCA_001006365.1","-","-","-","-","","-" -"","Diaporthe helianthi str. 7/96 (GCA_001702395)","Sordariomycetidae","158607","DHEL01v2","GCA_001702395.2","-","-","-","-","","-" -"","Dichomitus squalens LYAD-421 SS1 (GCA_000275845)","Polyporales","732165","Dichomitus_squalens_v1.0","GCA_000275845.1","-","-","-","-","","-" -"","Diplocarpon rosae (GCA_002317995)","Helotiales","946125","ASM231799v1","GCA_002317995.1","-","-","-","-","","-" -"","Diplodia corticola str. CBS 112549 (GCA_001883845)","Botryosphaeriales","236234","ASM188384v1","GCA_001883845.1","-","-","-","-","","-" -"","Diplodia seriata (GCA_001006355)","Botryosphaeriales","420778","UCDDS831v0.1","GCA_001006355.1","-","-","-","-","","-" -"","Diplodia seriata str. F98.1 (GCA_001975905)","Botryosphaeriales","420778","Dipser_v1","GCA_001975905.1","-","-","-","-","-","-" -"","Dothistroma septosporum","Capnodiales","675120","GCA_000340195.1","GCA_000340195.1","-","-","-","","","-" -"","Drechmeria coniospora str. ARSEF 6962 (GCA_001625195)","Hypocreales","98403","ASM162519v1","GCA_001625195.1","-","-","-","-","","-" -"","Drechslerella stenobrocha 248 (GCA_000525045)","Orbiliales","1043628","DREv1","GCA_000525045.1","-","-","-","-","","-" -"","Edhazardia aedis USNM 41457 (GCA_000230595)","Microsporidia","1003232","Edha_aedis_V4b","GCA_000230595.3","-","-","-","-","","-" -"","Elaphomyces granulatus str. OSC145934 (GCA_002240705)","Eurotiales","519963","PX439","GCA_002240705.1","-","-","-","-","","-" -"","Elsinoe australis str. NL1 (GCA_003013795)","","40998","ASM301379v1","GCA_003013795.1","-","-","-","-","","-" -"","Emergomyces pasteuriana Ep9510 str. UAMH 9510 (GCA_001883825)","Onygenales","1447872","Emmo_past_UAMH9510_V1","GCA_001883825.1","-","-","-","-","","-" -"","Emmonsia crescens UAMH 3008 (GCA_001008285)","Onygenales","1247875","ASM100828v1","GCA_001008285.1","-","-","-","-","","-" -"","Emmonsia crescens str. UAMH4076 (GCA_002572855)","Onygenales","73230","Emmon_cres_4076_V1","GCA_002572855.1","-","-","-","-","-","-" -"","Emmonsia parva UAMH 139 (GCA_001014755)","Onygenales","2060906","ASM101475v1","GCA_001014755.1","-","-","-","-","","-" -"","Emmonsia parva str. UAMH130 (GCA_002572885)","Onygenales","2060905","Emmon_parv_130","GCA_002572885.1","-","-","-","-","-","-" -"","Emmonsia sp. CAC-2015a str. CBS 136260 (GCA_001660665)","Onygenales","1658172","Emmo_afri_EA111","GCA_001660665.1","-","-","-","-","","-" -"","Encephalitozoon cuniculi EcunIII-L (GCA_001078035)","Unikaryonidae","1355160","ECIIIL","GCA_001078035.1","-","-","-","-","-","-" -"","Encephalitozoon hellem ATCC 50504 (GCA_000277815)","Unikaryonidae","907965","ASM27781v3","GCA_000277815.3","-","-","-","-","-","-" -"","Encephalitozoon intestinalis ATCC 50506 (GCA_000146465)","Unikaryonidae","876142","ASM14646v1","GCA_000146465.1","-","-","-","-","-","-" -"","Encephalitozoon romaleae SJ-2008 (GCA_000280035)","Unikaryonidae","1178016","ASM28003v2","GCA_000280035.2","-","-","-","-","-","-" -"","Endocarpon pusillum Z07020 (GCA_000464535)","Verrucariales","1263415","EPUS","GCA_000464535.1","-","-","-","-","","-" -"","Enterocytozoon bieneusi H348 (GCA_000209485)","Microsporidia","481877","ASM20948v1","GCA_000209485.1","-","-","-","-","","-" -"","Enterocytozoon hepatopenaei str. TH1 (GCA_002081675)","Microsporidia","646526","ASM208167v1","GCA_002081675.1","-","-","-","-","","-" -"","Enterospora canceri str. GB1 (GCA_002087915)","Microsporidia","1081671","ASM208791v1","GCA_002087915.1","-","-","-","-","","-" -"","Epicoccum nigrum str. ICMP 19927 (GCA_002116315)","Pleosporales","105696","ASM211631v1","GCA_002116315.1","-","-","-","-","","-" -"","Eremothecium cymbalariae DBVPG#7215 (GCA_000235365)","Saccharomycetales","931890","ASM23536v1","GCA_000235365.1","-","-","-","-","","-" -"","Eremothecium gossypii FDAG1 (GCA_000968835)","Saccharomycetales","1034331","ASM96883v1","GCA_000968835.1","-","-","-","-","","-" -"","Erysiphe necator (GCA_000798715)","Erysiphales","52586","ASM79871v1","GCA_000798715.1","-","-","-","-","","-" -"","Erysiphe pulchra (GCA_002918395)","Erysiphales","225359","ASM291839v1","GCA_002918395.1","-","-","-","-","","-" -"","Escovopsis weberi (GCA_001278495)","Hypocreales","150374","ASM127849v1","GCA_001278495.1","-","-","-","-","","-" -"","Eutypa lata UCREL1 (GCA_000349385)","Xylariales","1287681","UCREL1V03","GCA_000349385.1","-","-","-","-","","-" -"","Exidia glandulosa HHB12029 (GCA_001632375)","","1314781","Exigl1","GCA_001632375.1","-","-","-","-","","-" -"","Exophiala aquamarina CBS 119918 (GCA_000709125)","Chaetothyriomycetidae","1182545","Exop_aqua_CBS_119918_V1","GCA_000709125.1","-","-","-","-","","-" -"","Exophiala dermatitidis NIH/UT8656 (GCA_000230625)","Chaetothyriomycetidae","858893","Exop_derm_V1","GCA_000230625.1","-","-","-","-","","-" -"","Exophiala mesophila str. CBS 40295 (GCA_000836275)","Chaetothyriomycetidae","212818","Exop_meso_CBS40295_V1","GCA_000836275.1","-","-","-","-","","-" -"","Exophiala oligosperma str. CBS 72588 (GCA_000835515)","Chaetothyriomycetidae","215243","Exop_olig_CBS72588_V1","GCA_000835515.1","-","-","-","-","","-" -"","Exophiala sideris str. CBS 121828 (GCA_000835395)","Chaetothyriomycetidae","1016849","Exop_side_CBS121828_V1","GCA_000835395.1","-","-","-","-","","-" -"","Exophiala spinifera str. CBS 89968 (GCA_000836115)","Chaetothyriomycetidae","91928","Exop_spin_CBS89968_V1","GCA_000836115.1","-","-","-","-","","-" -"","Exophiala xenobiotica str. CBS 118157 (GCA_000835505)","Chaetothyriomycetidae","348802","Exop_xeno_CBS118157_V1","GCA_000835505.1","-","-","-","-","","-" -"","Exserohilum turcica Et28A (GCA_000359705)","Pleosporales","671987","Setospaeria_trucica_Et28A_v1.0","GCA_000359705.1","-","-","-","-","","-" -"","Fibroporia radiculosa str. TFFH 294 (GCA_000313525)","Polyporales","599839","ASM31352v1","GCA_000313525.1","-","-","-","-","","-" -"","Fibularhizoctonia sp. CBS 109695 (GCA_001630335)","Atheliales","436010","Fibsp1","GCA_001630335.1","-","-","-","-","","-" -"","Fistulina hepatica ATCC 64428 (GCA_000934395)","Agaricales","1128425","Fishe1","GCA_000934395.1","-","-","-","-","","-" -"","Fomitiporia mediterranea MF3/22 (GCA_000271605)","Hymenochaetales","694068","Fomme1","GCA_000271605.1","-","-","-","-","","-" -"","Fomitopsis pinicola FP-58527 SS1 (GCA_000344655)","Polyporales","743788","Fompi3","GCA_000344655.2","-","-","-","-","","-" -"","Fonsecaea erecta (GCA_001651985)","Chaetothyriomycetidae","1367422","ASM165198v1","GCA_001651985.1","-","-","-","-","","-" -"","Fonsecaea monophora (GCA_001642475)","Chaetothyriomycetidae","254056","ASM164247v1","GCA_001642475.1","-","-","-","-","","-" -"","Fonsecaea multimorphosa (GCA_001646985)","Chaetothyriomycetidae","979981","ASM164698v1","GCA_001646985.1","-","-","-","-","-","-" -"","Fonsecaea multimorphosa CBS 102226 (GCA_000836435)","Chaetothyriomycetidae","1442371","Fons_mult_CBS_102226_V1","GCA_000836435.1","-","-","-","-","","-" -"","Fonsecaea nubica (GCA_001646965)","Chaetothyriomycetidae","856822","ASM164696v1","GCA_001646965.1","-","-","-","-","","-" -"","Fonsecaea pedrosoi CBS 271.37 (GCA_000835455)","Chaetothyriomycetidae","1442368","Fons_pedr_CBS_271_37_V1","GCA_000835455.1","-","-","-","-","","-" -"","Fusarium culmorum UK99","Hypocreales","1318462","EF1","GCA_900074845.1","-","-","-","","","-" -"","Fusarium fujikuroi","Hypocreales","5127","EF1","GCA_000315255.1","-","-","-","","","-" -"","Fusarium fujikuroi (GCA_001023035)","Hypocreales","5127","ASM102303v1","GCA_001023035.1","-","-","-","-","-","-" -"","Fusarium fujikuroi (GCA_001023045)","Hypocreales","5127","ASM102304v1","GCA_001023045.1","-","-","-","-","-","-" -"","Fusarium fujikuroi (GCA_001023065)","Hypocreales","5127","ASM102306v1","GCA_001023065.1","-","-","-","-","-","-" -"","Fusarium fujikuroi (GCA_900096505)","Hypocreales","5127","version_1","GCA_900096505.1","-","-","-","-","-","-" -"","Fusarium fujikuroi (GCA_900096685)","Hypocreales","5127","version_1","GCA_900096685.1","-","-","-","-","-","-" -"","Fusarium fujikuroi (GCA_900096705)","Hypocreales","5127","version_1","GCA_900096705.1","-","-","-","-","-","-" -"","Fusarium graminearum PH-1 (GCA_000240135)","Hypocreales","229533","ASM24013v3","GCA_000240135.3","-","-","-","-","-","-" -"","Fusarium graminearum str. CS3005 (GCA_000599445)","Hypocreales","5518","CS3005v1","GCA_000599445.1","-","-","-","-","","-" -"","Fusarium graminearum str. PH-1","Hypocreales","5518","RR1","GCA_900044135.1","","-","-","","-","-" -"","Fusarium langsethiae str. Fl201059 (GCA_001292635)","Hypocreales","179993","ASM129263v1","GCA_001292635.1","-","-","-","-","-","-" -"","Fusarium mangiferae (GCA_900044065)","Hypocreales","192010","Genome_assembly_version_1","GCA_900044065.1","-","-","-","-","-","-" -"","Fusarium nygamai (GCA_002894225)","Hypocreales","42673","CS10214v1","GCA_002894225.1","-","-","-","-","-","-" -"","Fusarium oxysporum","Hypocreales","426428","FO2","GCA_000222805.1","","-","","","","-" -"","Fusarium oxysporum (GCA_900096695)","Hypocreales","5507","version_1","GCA_900096695.1","-","-","-","-","-","-" -"","Fusarium oxysporum FOSC 3-a (GCA_000271745)","Hypocreales","909455","FO_FOSC_3_a_V1","GCA_000271745.2","-","-","-","-","-","-" -"","Fusarium oxysporum Fo47 (GCA_000271705)","Hypocreales","660027","FO_Fo47_V1","GCA_000271705.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. conglutinans race 2 54008 str. 54008 (PHW808) (GCA_000260215)","Hypocreales","1089457","FO_PHW808_V1","GCA_000260215.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. cubense race 1 (GCA_000350345)","Hypocreales","1229664","Foc1_1.0","GCA_000350345.1","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. cubense race 4 (GCA_000350365)","Hypocreales","1229665","Foc4_1.0","GCA_000350365.1","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. cubense tropical race 4 54006 str. 54006 (II5) (GCA_000260195)","Hypocreales","1089451","FO_II5_V1","GCA_000260195.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. lycopersici 4287 (GCA_000149955)","Hypocreales","426428","ASM14995v2","GCA_000149955.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. lycopersici MN25 (GCA_000259975)","Hypocreales","1080343","FO_MN25_V1","GCA_000259975.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. melonis 26406 str. 26406 (melonis) (GCA_000260495)","Hypocreales","1089452","FO_melonis_V1","GCA_000260495.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. pisi HDV247 (GCA_000260075)","Hypocreales","1080344","FO_HDV247_V1","GCA_000260075.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. radicis-cucumerinum (GCA_001702695)","Hypocreales","327505","ASM170269v2","GCA_001702695.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. radicis-lycopersici 26381 str. 26381 (CL57) (GCA_000260155)","Hypocreales","1089448","FO_CL57_V1","GCA_000260155.3","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. raphani 54005 (GCA_000260235)","Hypocreales","1089458","FO_PHW815_V1","GCA_000260235.2","-","-","-","-","-","-" -"","Fusarium oxysporum f. sp. vasinfectum 25433 str. 25433 (Cotton) (GCA_000260175)","Hypocreales","1089449","FO_Cotton_V1","GCA_000260175.2","-","-","-","-","-","-" -"","Fusarium poae (GCA_001675295)","Hypocreales","36050","FPOA1.0","GCA_001675295.1","-","-","-","-","-","-" -"","Fusarium proliferatum (GCA_900029915)","Hypocreales","948311","F._proliferatum_NRRL62905_version_1","GCA_900029915.1","-","-","-","-","-","-" -"","Fusarium proliferatum ET1 (GCA_900067095)","Hypocreales","1227346","F._proliferatum_ET1_version_1","GCA_900067095.1","-","-","-","-","-","-" -"","Fusarium pseudograminearum","Hypocreales","1028729","GCA_000303195.1","GCA_000303195.1","-","-","-","","","-" -"","Fusarium solani","Hypocreales","660122","v2.0","GCA_000151355.1","-","-","","","","-" -"","Fusarium venenatum (GCA_900007375)","Hypocreales","56646","ASM90000737v1","GCA_900007375.1","-","-","-","-","-","-" -"","Fusarium verticillioides","Hypocreales","334819","ASM14955v1","GCA_000149555.1","-","-","","","","-" -"","Gaeumannomyces tritici R3-111a-1","Magnaporthales","644352","Gae_graminis_V2","GCA_000145635.1","-","-","-","-","","-" -"","Galerina marginata CBS 339.88 (GCA_000697645)","Agaricales","685588","Galma1","GCA_000697645.1","-","-","-","-","","-" -"","Ganoderma sinense ZZ0214-1 (GCA_002760635)","Polyporales","1077348","GanSi1.6","GCA_002760635.1","-","-","-","-","","-" -"","Gelatoporia subvermispora B (GCA_000320605)","Polyporales","914234","Ceriporiopsis_subvermispora_B_v1.0","GCA_000320605.2","-","-","-","-","","-" -"","Glarea lozoyensis ATCC 20868 str. 1224 (GCA_000409485)","Helotiales","1116229","GLAREA","GCA_000409485.1","-","-","-","-","","-" -"","Gloeophyllum trabeum ATCC 11539 (GCA_000344685)","Gloeophyllales","670483","Glotr1_1","GCA_000344685.1","-","-","-","-","","-" -"","Gonapodya prolifera JEL478 (GCA_001574975)","","1344416","Ganpr1","GCA_001574975.1","-","-","-","-","","-" -"","Grifola frondosa str. 9006-11 (GCA_001683735)","Agaricales","5627","ASM168373v1","GCA_001683735.1","-","-","-","-","","-" -"","Grosmannia clavigera kw1407 (GCA_000143105)","Ophiostomatales","655863","Sanger-454-IlluminaPA_2.0","GCA_000143105.2","-","-","-","-","","-" -"","Gymnopus luxurians FD-317 M1 (GCA_000827265)","Agaricales","944289","Gymlu1","GCA_000827265.1","-","-","-","-","","-" -"","Hanseniaspora guilliermondii (GCA_900119595)","Saccharomycetales","56406","version_1","GCA_900119595.1","-","-","-","-","","-" -"","Hanseniaspora opuntiae (GCA_001749795)","Saccharomycetales","211096","ASM174979v1","GCA_001749795.1","-","-","-","-","","-" -"","Hanseniaspora osmophila (GCA_001747045)","Saccharomycetales","56408","ASM174704v1","GCA_001747045.1","-","-","-","-","","-" -"","Hanseniaspora uvarum (GCA_001747055)","Saccharomycetales","29833","ASM174705v1","GCA_001747055.1","-","-","-","-","-","-" -"","Hanseniaspora uvarum DSM 2768 (GCA_000968475)","Saccharomycetales","1246595","Huva2.0","GCA_000968475.1","-","-","-","-","","-" -"","Hanseniaspora valbyensis NRRL Y-1626 (GCA_001664025)","Saccharomycetales","766949","Hanva1_1","GCA_001664025.1","-","-","-","-","","-" -"","Hebeloma cylindrosporum h7 (GCA_000827355)","Agaricales","686832","Hebeloma_cylindrosporum_h7_v2.0","GCA_000827355.1","-","-","-","-","","-" -"","Helicocarpus griseus UAMH5409 (GCA_002573585)","Onygenales","1447875","Heli_gris_5409_V1","GCA_002573585.1","-","-","-","-","","-" -"","Hepatospora eriocheir str. GB1 (GCA_002087885)","Microsporidia","1081669","ASM208788v1","GCA_002087885.1","-","-","-","-","-","-" -"","Hepatospora eriocheir str. canceri (GCA_002087875)","Microsporidia","1081669","ASM208787v1","GCA_002087875.1","-","-","-","-","","-" -"","Hesseltinella vesiculosa str. NRRL 3301","Mucoromycotina","101127","Hesve2","GCA_002104935.1","-","-","-","-","","-" -"","Heterobasidion irregulare TC 32-1 (GCA_000320585)","Russulales","747525","Heterobasidion_irregulare_v2.0","GCA_000320585.2","-","-","-","-","","-" -"","Hirsutella minnesotensis 3608 (GCA_000956045)","Hypocreales","1043627","ASM95604v1","GCA_000956045.1","-","-","-","-","","-" -"","Histoplasma capsulatum G186AR (GCA_000150115)","Onygenales","447093","ASM15011v1","GCA_000150115.1","-","-","-","-","-","-" -"","Histoplasma capsulatum H143 (GCA_000151035)","Onygenales","544712","ASM15103v1","GCA_000151035.1","-","-","-","-","-","-" -"","Histoplasma capsulatum H88 (GCA_000151005)","Onygenales","544711","ASM15100v2","GCA_000151005.2","-","-","-","-","-","-" -"","Histoplasma capsulatum NAm1 (GCA_000149585)","Onygenales","339724","ASM14958v1","GCA_000149585.1","-","-","-","-","","-" -"","Hortaea werneckii EXF-2000 (GCA_002127715)","Dothideales","1157616","HwerPB1","GCA_002127715.1","-","-","-","-","","-" -"","Hydnomerulius pinastri MD-312 (GCA_000827185)","Boletales","994086","Hydpi2","GCA_000827185.1","-","-","-","-","","-" -"","Hypholoma sublateritium FD-334 SS-4 (GCA_000827495)","Agaricales","945553","Hypsu1","GCA_000827495.1","-","-","-","-","","-" -"","Hyphopichia burtonii NRRL Y-1933 (GCA_001661395)","Saccharomycetales","984485","Hypbu1","GCA_001661395.1","-","-","-","-","","-" -"","Hypoxylon sp. CI-4A (GCA_002120315)","Xylariales","1001833","HypCI4A_v1.0","GCA_002120315.1","-","-","-","-","","-" -"","Hypoxylon sp. CO27-5 (GCA_002120305)","Xylariales","1001938","HypCO275_v1.0","GCA_002120305.1","-","-","-","-","-","-" -"","Hypoxylon sp. EC38 (GCA_002120335)","Xylariales","1001937","HypEC38_v3.0","GCA_002120335.1","-","-","-","-","-","-" -"","Hypsizygus marmoreus str. 51987-8 (GCA_001605315)","Agaricales","39966","ASM160531v1","GCA_001605315.1","-","-","-","-","","-" -"","Jaapia argillacea MUCL 33604 (GCA_000697665)","Jaapiales","933084","Jaaar1","GCA_000697665.1","-","-","-","-","","-" -"","Jaminaea rosea str. MCA 5214 (GCA_003144245)","","1569628","Jamsp1","GCA_003144245.1","-","-","-","-","","-" -"","Kalmanozyma brasiliensis GHG001 (GCA_000497045)","Ustilaginales","1365824","PSEUBRA1","GCA_000497045.1","-","-","-","-","","-" -"","Kazachstania africana CBS 2517 (GCA_000304475)","Saccharomycetales","1071382","Ka_CBS2517","GCA_000304475.1","-","-","-","-","","-" -"","Kazachstania naganishii CBS 8797 (GCA_000348985)","Saccharomycetales","1071383","ASM34898v1","GCA_000348985.1","-","-","-","-","","-" -"","Kluyveromyces dobzhanskii CBS 2104 str. CBS2104 (GCA_000820885)","Saccharomycetales","1427455","KLDO_01","GCA_000820885.1","-","-","-","-","","-" -"","Kluyveromyces lactis str. NRRL Y-1140 (GCA_000002515)","Saccharomycetales","28985","ASM251v1","GCA_000002515.1","-","-","-","-","","-" -"","Kluyveromyces marxianus DMKU3-1042 (GCA_001417885)","Saccharomycetales","1003335","Kmar_1.0","GCA_001417885.1","-","-","-","-","","-" -"","Kluyveromyces marxianus str. NBRC 1777 (GCA_001417835)","Saccharomycetales","4911","KM1777_03","GCA_001417835.1","-","-","-","-","-","-" -"","Kockovaella imperatae str. NRRL Y-17943 (GCA_002102565)","Tremellales","4999","Kocim1","GCA_002102565.1","-","-","-","-","","-" -"","Komagataella pastoris","Saccharomycetales","644223","GCA_000027005.1","GCA_000027005.1","-","-","-","","","-" -"","Komagataella pastoris (GCA_001708105)","Saccharomycetales","4922","ASM170810v1","GCA_001708105.1","-","-","-","-","-","-" -"","Komagataella phaffii CBS 7435 (GCA_000223565)","Saccharomycetales","981350","PicPas_Mar2011","GCA_000223565.1","-","-","-","-","-","-" -"","Komagataella phaffii CBS 7435 (GCA_900235035)","Saccharomycetales","981350","ASM90023503v1","GCA_900235035.1","-","-","-","-","-","-" -"","Komagataella phaffii GS115 (GCA_001746955)","Saccharomycetales","644223","ASM174695v1","GCA_001746955.1","-","-","-","-","","-" -"","Komagataella phaffii str. WT (GCA_001708085)","Saccharomycetales","460519","ASM170808v1","GCA_001708085.1","-","-","-","-","-","-" -"","Kuraishia capsulata CBS 1993 (GCA_000576695)","Saccharomycetales","1382522","AUH_PRJEB4427_v1","GCA_000576695.1","-","-","-","-","","-" -"","Kwoniella bestiolae CBS 10118 (GCA_000512585)","Tremellales","1296100","Cryp_best_CBS10118_V1","GCA_000512585.2","-","-","-","-","","-" -"","Kwoniella dejecticola CBS 10117 (GCA_000512565)","Tremellales","1296121","Cryp_deje_CBS10117_V1","GCA_000512565.2","-","-","-","-","","-" -"","Kwoniella heveanensis BCC8398 (GCA_000507405)","Tremellales","1296120","Cryp_heve_BCC8398_V1","GCA_000507405.3","-","-","-","-","-","-" -"","Kwoniella heveanensis CBS 569 (GCA_000507425)","Tremellales","1296119","Cryp_heve_CBS569_V2","GCA_000507425.3","-","-","-","-","-","-" -"","Kwoniella mangroviensis CBS 10435 (GCA_000507885)","Tremellales","1331196","Kwon_mang_CBS10435_V2","GCA_000507885.2","-","-","-","-","-","-" -"","Kwoniella mangroviensis CBS 8507 (GCA_000507465)","Tremellales","1296122","Kwon_mang_CBS8507_V2","GCA_000507465.3","-","-","-","-","-","-" -"","Kwoniella mangroviensis CBS 8886 (GCA_000507485)","Tremellales","1296123","Kwon_mang_CBS8886_V1","GCA_000507485.3","-","-","-","-","-","-" -"","Kwoniella pini CBS 10737 (GCA_000512605)","Tremellales","1296096","Cryp_pinu_CBS10737_V1","GCA_000512605.2","-","-","-","-","","-" -"","Laccaria amethystina LaAM-08-1 (GCA_000827195)","Agaricales","1095629","Laccaria_amethystina_LaAM-08-1_v1.0","GCA_000827195.1","-","-","-","-","","-" -"","Laccaria bicolor S238N-H82 (GCA_000143565)","Agaricales","486041","V1.0","GCA_000143565.1","-","-","-","-","","-" -"","Lachancea dasiensis CBS 10888 (GCA_900074725)","Saccharomycetales","1266660","LADA0","GCA_900074725.1","-","-","-","-","","-" -"","Lachancea fermentati (GCA_900074765)","Saccharomycetales","4955","LAFE0","GCA_900074765.1","-","-","-","-","-","-" -"","Lachancea lanzarotensis str. CBS 12615 (GCA_000938715)","Saccharomycetales","1245769","LALA0","GCA_000938715.1","-","-","-","-","","-" -"","Lachancea meyersii CBS 8951 (GCA_900074715)","Saccharomycetales","1266667","LAME0","GCA_900074715.1","-","-","-","-","-","-" -"","Lachancea mirantina (GCA_900074745)","Saccharomycetales","1230905","LAMI0","GCA_900074745.1","-","-","-","-","-","-" -"","Lachancea nothofagi CBS 11611 (GCA_900074755)","Saccharomycetales","1266666","LANO0","GCA_900074755.1","-","-","-","-","-","-" -"","Lachancea quebecensis (GCA_002900925)","Saccharomycetales","1654605","ASM290092v1","GCA_002900925.1","-","-","-","-","-","-" -"","Lachancea sp. CBS 6924 (GCA_900074735)","Saccharomycetales","433476","LAFA0","GCA_900074735.1","-","-","-","-","-","-" -"","Lachancea thermotolerans CBS 6340 (GCA_000142805)","Saccharomycetales","559295","ASM14280v1","GCA_000142805.1","-","-","-","-","-","-" -"","Laetiporus sulphureus 93-53 (GCA_001632365)","Polyporales","1314785","Laesu1","GCA_001632365.1","-","-","-","-","","-" -"","Lentinula edodes str. G408PP-4 (GCA_002003045)","Agaricales","5353","Lened_assembly01","GCA_002003045.1","-","-","-","-","","-" -"","Leptosphaeria maculans","Pleosporales","985895","ASM23037v1","GCA_000230375.1","-","-","-","","","-" -"","Leucoagaricus sp. SymC.cos (GCA_001563735)","Agaricales","1714833","ASM156373v1","GCA_001563735.1","-","-","-","-","","-" -"","Leucosporidium creatinivorum str. 62-1032 (GCA_002105055)","","106004","Leucr1","GCA_002105055.1","-","-","-","-","","-" -"","Lichtheimia corymbifera JMRC:FSU:9682 (GCA_000723665)","Mucoromycotina","1263082","454Minimus","GCA_000723665.1","-","-","-","-","","-" -"","Lichtheimia ramosa str. JMRC:FSU:6197 (GCA_000945115)","Mucoromycotina","688394","Lramosa_hybrid_454_Illumina","GCA_000945115.1","-","-","-","-","","-" -"","Lipomyces starkeyi NRRL Y-11557 (GCA_001661325)","Saccharomycetales","675824","Lipst1_1","GCA_001661325.1","-","-","-","-","","-" -"","Lobosporangium transversale str. NRRL 3116","Mortierellomycotina","64571","Lobtra1","GCA_002105155.1","-","-","-","-","","-" -"","Lodderomyces elongisporus NRRL YB-4239 (GCA_000149685)","Saccharomycetales","379508","ASM14968v1","GCA_000149685.1","-","-","-","-","","-" -"","Lomentospora prolificans str. JHH-5317 (GCA_002276285)","Microascales","41688","Lprolificans_pilon","GCA_002276285.1","-","-","-","-","","-" -"","Macrophomina phaseolina MS6 (GCA_000302655)","Botryosphaeriales","1126212","MphMS6_1.0","GCA_000302655.1","-","-","-","-","","-" -"","Madurella mycetomatis str. mm55 (GCA_001275765)","Sordariales","100816","ASM127576v2","GCA_001275765.2","-","-","-","-","","-" -"","Magnaporthe oryzae","Magnaporthales","242507","MG8","GCA_000002495.2","-","-","","","","-" -"","Magnaporthe poae","Magnaporthales","644358","Mag_poae_ATCC_64411_V1","GCA_000193285.1","-","-","","","","-" -"","Malassezia globosa CBS 7966 (GCA_000181695)","Malasseziales","425265","ASM18169v1","GCA_000181695.1","-","-","-","-","","-" -"","Malassezia pachydermatis (GCA_001278385)","Malasseziales","77020","MalaPachy","GCA_001278385.1","-","-","-","-","","-" -"","Malassezia sympodialis ATCC 42132 (GCA_000349305)","Malasseziales","1230383","ASM34930v2","GCA_000349305.2","-","-","-","-","","-" -"","Malassezia sympodialis ATCC 42132 (GCA_900149145)","Malasseziales","1230383","Msy_ATCC_42132_Feb2016","GCA_900149145.1","-","-","-","-","-","-" -"","Malassezia vespertilionis str. NWHC:44797-103 (GCA_002818225)","Malasseziales","2020962","ASM281822v1","GCA_002818225.1","-","-","-","-","","-" -"","Marssonina brunnea f. sp. 'multigermtubi' MB_m1 (GCA_000298775)","Helotiales","1072389","ASM29877v1","GCA_000298775.1","-","-","-","-","","-" -"","Meira miltonrushii str. MCA 3882 (GCA_003144205)","","1280837","Meimi1","GCA_003144205.1","-","-","-","-","","-" -"","Melampsora larici-populina","Pucciniales","747676","GCA_000204055.1","GCA_000204055.1","-","-","-","","","-" -"","Meliniomyces bicolor E (GCA_002865645)","Helotiales","1095630","Melbi2","GCA_002865645.1","-","-","-","-","","-" -"","Meliniomyces variabilis F (GCA_002865655)","Helotiales","1149755","Melva1","GCA_002865655.1","-","-","-","-","","-" -"","Metarhizium acridum CQMa 102 (GCA_000187405)","Hypocreales","655827","MetAcr_May2010","GCA_000187405.1","-","-","-","-","","-" -"","Metarhizium album ARSEF 1941 (GCA_000804445)","Hypocreales","1081103","MAM_1.0_for_version_1_of_the_Metarhizium_album_genome","GCA_000804445.1","-","-","-","-","","-" -"","Metarhizium anisopliae ARSEF 549 (GCA_000814975)","Hypocreales","1276135","MAN_1.0","GCA_000814975.1","-","-","-","-","-","-" -"","Metarhizium anisopliae BRIP 53284 (GCA_000426985)","Hypocreales","1291519","ASM42698v1","GCA_000426985.1","-","-","-","-","-","-" -"","Metarhizium anisopliae BRIP 53293 (GCA_000426965)","Hypocreales","1291518","ASM42696v1","GCA_000426965.1","-","-","-","-","-","-" -"","Metarhizium anisopliae str. E6 (GCA_000739145)","Hypocreales","5530","Metarhizium_anisopliae","GCA_000739145.1","-","-","-","-","-","-" -"","Metarhizium brunneum ARSEF 3297 (GCA_000814965)","Hypocreales","1276141","MBR_1.0","GCA_000814965.1","-","-","-","-","-","-" -"","Metarhizium guizhouense ARSEF 977 (GCA_000814955)","Hypocreales","1276136","MGU_1.0","GCA_000814955.1","-","-","-","-","-","-" -"","Metarhizium majus ARSEF 297 (GCA_000814945)","Hypocreales","1276143","MAJ_1.0","GCA_000814945.1","-","-","-","-","","-" -"","Metarhizium rileyi RCEF 4871 (GCA_001636745)","Hypocreales","1081105","NOR_1.0","GCA_001636745.1","-","-","-","-","","-" -"","Metarhizium robertsii (GCA_000591435)","Hypocreales","568076","MR2010_11_27","GCA_000591435.1","-","-","-","-","-","-" -"","Metarhizium robertsii ARSEF 23 (GCA_000187425)","Hypocreales","655844","MAA_2.0","GCA_000187425.2","-","-","-","-","","-" -"","Metschnikowia bicuspidata var. bicuspidata NRRL YB-4993 (GCA_001664035)","Saccharomycetales","869754","Metbi1","GCA_001664035.1","-","-","-","-","","-" -"","Meyerozyma guilliermondii ATCC 6260 (GCA_000149425)","Saccharomycetales","294746","ASM14942v1","GCA_000149425.1","-","-","-","-","","-" -"","Microbotryum intermedium (GCA_900096595)","Microbotryales","269621","Microbotrium_Intermedium_Assembly","GCA_900096595.1","-","-","-","-","","-" -"","Microbotryum violaceum","Microbotryales","683840","GCA_000166175.1","GCA_000166175.1","-","-","-","","","-" -"","Microdochium bolleyi str. J235TASD1 (GCA_001566295)","Xylariales","196109","Microdochium_bolleyi_v1.0","GCA_001566295.1","-","-","-","-","","-" -"","Microsporum canis CBS 113480 (GCA_000151145)","Onygenales","554155","ASM15114v1","GCA_000151145.1","-","-","-","-","","-" -"","Millerozyma farinosa CBS 7064 (GCA_000315895)","Saccharomycetales","559304","ASM31589v1","GCA_000315895.1","-","-","-","-","","-" -"","Mitosporidium daphniae str. UGP3 (GCA_000760515)","Microsporidia","1485682","UGP1.0","GCA_000760515.1","-","-","-","-","","-" -"","Mixia osmundae IAM 14324 (GCA_000241205)","Mixiales","764103","Mosmundae_2.0","GCA_000241205.2","-","-","-","-","","-" -"","Mixia osmundae IAM 14324 (GCA_000708205)","Mixiales","764103","Mixia_osmundae_v1.0","GCA_000708205.1","-","-","-","-","-","-" -"","Moelleriella libera RCEF 2490 (GCA_001636675)","Hypocreales","1081109","AAL_1.0","GCA_001636675.1","-","-","-","-","","-" -"","Moesziomyces antarcticus T-34 (GCA_000334475)","Ustilaginales","1151754","Pant_1.0","GCA_000334475.1","-","-","-","-","","-" -"","Moesziomyces antarcticus str. JCM 10317 (GCA_000747765)","Ustilaginales","84753","ASM74776v1","GCA_000747765.1","-","-","-","-","-","-" -"","Moesziomyces aphidis DSM 70725 (GCA_000517465)","Ustilaginales","1391700","PseuAph1.0","GCA_000517465.1","-","-","-","-","","-" -"","Moniliophthora perniciosa FA553 (GCA_000183025)","Agaricales","554373","ASM18302v1","GCA_000183025.1","-","-","-","-","","-" -"","Moniliophthora roreri MCA 2997 (GCA_000488995)","Agaricales","1381753","M_roreri_MCA_2997_v1","GCA_000488995.1","-","-","-","-","","-" -"","Moniliophthora roreri str. MCA 2952 (GCA_001466705)","Agaricales","221103","ASM146670v1","GCA_001466705.1","-","-","-","-","-","-" -"","Mortierella elongata AG-77","Mortierellomycotina","1314771","Mortierella_elongata_AG-77_v2.0","GCA_001651415.1","-","-","-","-","","-" -"","Mortierella verticillata NRRL 6337 (GCA_000739165)","Mortierellomycotina","1069443","Mort_vert_NRRL_6337_V1","GCA_000739165.1","-","-","-","-","","-" -"","Mucor ambiguus str. NBRC 6742 (GCA_000950595)","Mucoromycotina","91626","ASM95059v1","GCA_000950595.1","-","-","-","-","","-" -"","Mucor circinelloides f. circinelloides 1006PhL (GCA_000401635)","Mucoromycotina","1220926","Muco_sp_1006Ph_V1","GCA_000401635.1","-","-","-","-","","-" -"","Mucor circinelloides f. lusitanicus CBS 277.49","Mucoromycotina","747725","Mucci2","GCA_001638945.1","-","-","-","-","-","-" -"","Mycosphaerella eumusae str. CBS 114824 (GCA_001578235)","Capnodiales","321146","ASM157823v1","GCA_001578235.1","-","-","-","-","","-" -"","Nadsonia fulvescens var. elongata DSM 6958 (GCA_001661315)","Saccharomycetales","857566","Nadfu1","GCA_001661315.1","-","-","-","-","","-" -"","Naematelia encephala str. 68-887.2 (GCA_002105065)","Tremellales","71784","Treen1","GCA_002105065.1","-","-","-","-","","-" -"","Nannizzia gypsea CBS 118893 (GCA_000150975)","Onygenales","535722","MS_CBS118893","GCA_000150975.2","-","-","-","-","","-" -"","Naumovozyma castellii CBS 4309 (GCA_000237345)","Saccharomycetales","1064592","ASM23734v1","GCA_000237345.1","-","-","-","-","","-" -"","Naumovozyma dairenensis CBS 421 (GCA_000227115)","Saccharomycetales","1071378","ASM22711v2","GCA_000227115.2","-","-","-","-","","-" -"","Nematocida displodere str. JUm2807 (GCA_001642395)","Microsporidia","1805483","ASM164239v1","GCA_001642395.1","-","-","-","-","","-" -"","Nematocida parisii ERTm1 (GCA_000250985)","Microsporidia","881290","Nema_parisii_ERTm1_V3","GCA_000250985.1","-","-","-","-","-","-" -"","Nematocida parisii ERTm3 (GCA_000190615)","Microsporidia","935791","Nema_parisii_ERTm3_V1","GCA_000190615.1","-","-","-","-","","-" -"","Nematocida sp. 1 ERTm2 (GCA_000250695)","Microsporidia","944018","Nema_parisii_ERTm2_V1","GCA_000250695.1","-","-","-","-","","-" -"","Nematocida sp. 1 ERTm6 (GCA_000738915)","Microsporidia","1138374","Nema_sp_1_ERTm6_V2","GCA_000738915.1","-","-","-","-","-","-" -"","Nematocida sp. ERTm5 (GCA_001642415)","Microsporidia","1805481","ASM164241v1","GCA_001642415.1","-","-","-","-","-","-" -"","Neocallimastix californiae str. G1 (GCA_002104975)","","1754190","Neocallimastix_sp._G1_v1.0","GCA_002104975.1","-","-","-","-","","-" -"","Neofusicoccum parvum UCRNP2 (GCA_000385595)","Botryosphaeriales","1287680","UCRNP2V3","GCA_000385595.1","-","-","-","-","","-" -"","Neolecta irregularis DAH-3 (GCA_001929475)","Taphrinomycotina","1198029","NeoIirr1.0","GCA_001929475.1","-","-","-","-","","-" -"","Neolentinus lepideus HHB14362 ss-1 (GCA_001632425)","Gloeophyllales","1314782","Neole1","GCA_001632425.1","-","-","-","-","","-" -"","Neonectria ditissima str. R09/05 (GCA_001306435)","Hypocreales","78410","R0905_v2.0","GCA_001306435.1","-","-","-","-","","-" -"","Neurospora crassa","Sordariales","367110","NC12","GCA_000182925.2","-","-","-","","","" -"","Neurospora crassa str. 73 (GCA_000786625)","Sordariales","5141","Neucr_trp3_1","GCA_000786625.1","-","-","-","-","-","-" -"","Neurospora tetrasperma FGSC 2508 (GCA_000213175)","Sordariales","510951","v2.0","GCA_000213175.1","-","-","-","-","-","-" -"","Neurospora tetrasperma FGSC 2509 str. FGSC 2509 mat a (GCA_000213195)","Sordariales","510952","v1.0","GCA_000213195.1","-","-","-","-","","-" -"","Nosema apis BRL 01 (GCA_000447185)","Nosematidae","1037528","NapisBRLv01","GCA_000447185.1","-","-","-","-","","-" -"","Nosema bombycis CQ1 (GCA_000383075)","Nosematidae","578461","NosBomCQ1_v1.0","GCA_000383075.1","-","-","-","-","","-" -"","Nosema ceranae (GCA_000988165)","Nosematidae","40302","ASM98816v1","GCA_000988165.1","-","-","-","-","-","-" -"","Nosema ceranae BRL01 (GCA_000182985)","Nosematidae","578460","ASM18298v1","GCA_000182985.1","-","-","-","-","","-" -"","Ogataea parapolymorpha DL-1 (GCA_000187245)","Saccharomycetales","871575","Hansenula_2","GCA_000187245.3","-","-","-","-","","-" -"","Ogataea polymorpha str. NCYC 495 leu1.1 (GCA_001664045)","Saccharomycetales","460523","Hanpo2","GCA_001664045.1","-","-","-","-","","-" -"","Oidiodendron maius Zn (GCA_000827325)","Myxotrichaceae","913774","Oidiodendron_maius_Zn_v1.0","GCA_000827325.1","-","-","-","-","","-" -"","Ophiocordyceps australis (GCA_002591405)","Hypocreales","1399860","OphauG2","GCA_002591405.1","-","-","-","-","","-" -"","Ophiocordyceps australis (GCA_002591415)","Hypocreales","1399860","OphauB2","GCA_002591415.1","-","-","-","-","-","-" -"","Ophiocordyceps camponoti-rufipedis (GCA_002591395)","Hypocreales","2004952","Ophun1","GCA_002591395.1","-","-","-","-","","-" -"","Ophiocordyceps sinensis CO18 (GCA_000448365)","Hypocreales","911162","ASM44836v1","GCA_000448365.1","-","-","-","-","-","-" -"","Ophiocordyceps unilateralis str. SC16a (GCA_001272575)","Hypocreales","268505","ASM127257v2","GCA_001272575.2","-","-","-","-","-","-" -"","Ophiostoma piceae UAMH 11346 str. UAMH-11346 (GCA_000410735)","Ophiostomatales","1262450","Opiceae_UAMHv01","GCA_000410735.1","-","-","-","-","","-" -"","Ordospora colligata OC4 (GCA_000803265)","Ordosporidae","1354746","ASM80326v1","GCA_000803265.1","-","-","-","-","","-" -"","Pachysolen tannophilus NRRL Y-2460 (GCA_001661245)","Saccharomycetales","669874","Pacta1_2","GCA_001661245.1","-","-","-","-","","-" -"","Paracoccidioides brasiliensis Pb03 (GCA_000150475)","Onygenales","482561","Paracocci_br_Pb03_V2","GCA_000150475.2","-","-","-","-","-","-" -"","Paracoccidioides brasiliensis Pb18 (GCA_000150735)","Onygenales","502780","Paracocci_br_Pb18_V2","GCA_000150735.2","-","-","-","-","","-" -"","Paracoccidioides brasiliensis str. CNH (GCA_001713695)","Onygenales","121759","Paracocci_br_PbCNH","GCA_001713695.1","-","-","-","-","-","-" -"","Paracoccidioides brasiliensis str. Pb300 (GCA_001713645)","Onygenales","121759","ASM171364v1","GCA_001713645.1","-","-","-","-","-","-" -"","Paracoccidioides lutzii Pb01 (GCA_000150705)","Onygenales","502779","Paracocci_br_Pb01_V2","GCA_000150705.2","-","-","-","-","","-" -"","Paramicrosporidium saccamoebae str. KSL3 (GCA_002794465)","Cryptomycota","1246581","KSL3_v6","GCA_002794465.1","-","-","-","-","","-" -"","Paraphaeosphaeria sporulosa str. AP3s5-JAC2a (GCA_001642045)","Pleosporales","1460663","Parsp1","GCA_001642045.1","-","-","-","-","","-" -"","Paxillus involutus ATCC 200175 (GCA_000827475)","Boletales","664439","Paxillus_involutus_ATCC_200175_v1.0","GCA_000827475.1","-","-","-","-","","-" -"","Paxillus rubicundulus Ve08.2h10 (GCA_000827395)","Boletales","930991","Paxillus_rubicundulus_Ve08.2h10_v1.0","GCA_000827395.1","-","-","-","-","","-" -"","Penicilliopsis zonata CBS 506.65 (GCA_001890105)","Eurotiales","1073090","Aspzo1","GCA_001890105.1","-","-","-","-","","-" -"","Penicillium antarcticum (GCA_002072345)","Eurotiales","416450","ASM207234v1","GCA_002072345.1","-","-","-","-","","-" -"","Penicillium arizonense (GCA_001773325)","Eurotiales","1835702","ASM177332v1","GCA_001773325.1","-","-","-","-","-","-" -"","Penicillium brasilianum str. LaBioMMi 136 (GCA_002016555)","Eurotiales","104259","ASM201655v1","GCA_002016555.1","-","-","-","-","-","-" -"","Penicillium brasilianum str. MG11 (GCA_001048715)","Eurotiales","104259","Pbras_Allpaths-LG","GCA_001048715.1","-","-","-","-","","-" -"","Penicillium camemberti FM 013 (GCA_000513335)","Eurotiales","1429867","PCAMFM013_20131106","GCA_000513335.1","-","-","-","-","","-" -"","Penicillium chrysogenum str. P2niaD18 (GCA_000710275)","Eurotiales","5076","ASM71027v1","GCA_000710275.1","-","-","-","-","-","-" -"","Penicillium coprophilum (GCA_002072405)","Eurotiales","36646","ASM207240v1","GCA_002072405.1","-","-","-","-","-","-" -"","Penicillium decumbens (GCA_002072245)","Eurotiales","69771","ASM207224v1","GCA_002072245.1","-","-","-","-","-","-" -"","Penicillium digitatum PHI26 (GCA_000315665)","Eurotiales","1170229","PdigPHI26_v1","GCA_000315665.1","-","-","-","-","-","-" -"","Penicillium digitatum Pd1 (GCA_000315645)","Eurotiales","1170230","PdigPd1_v1","GCA_000315645.2","-","-","-","-","-","-" -"","Penicillium expansum str. CMP-1 (GCA_000769755)","Eurotiales","27334","PEX1","GCA_000769755.1","-","-","-","-","-","-" -"","Penicillium expansum str. MD-8 (GCA_000769745)","Eurotiales","27334","ASM76974v1","GCA_000769745.1","-","-","-","-","-","-" -"","Penicillium expansum str. d1 (GCA_000769735)","Eurotiales","27334","ASM76973v1","GCA_000769735.1","-","-","-","-","-","-" -"","Penicillium flavigenum (GCA_002072365)","Eurotiales","254877","ASM207236v1","GCA_002072365.1","-","-","-","-","-","-" -"","Penicillium freii (GCA_001513925)","Eurotiales","48697","ASM151392v1","GCA_001513925.1","-","-","-","-","-","-" -"","Penicillium griseofulvum str. PG3 (GCA_001561935)","Eurotiales","5078","ASM156193v1","GCA_001561935.1","-","-","-","-","-","-" -"","Penicillium italicum str. PHI-1 (GCA_000769765)","Eurotiales","40296","ASM76976v1","GCA_000769765.1","-","-","-","-","-","-" -"","Penicillium nalgiovense (GCA_002072425)","Eurotiales","60175","ASM207242v1","GCA_002072425.1","-","-","-","-","-","-" -"","Penicillium nordicum (GCA_001278595)","Eurotiales","229535","ASM127859v1","GCA_001278595.1","-","-","-","-","-","-" -"","Penicillium occitanis str. CL100 (GCA_002382855)","Eurotiales","290292","ASM238285v1","GCA_002382855.1","-","-","-","-","-","-" -"","Penicillium occitanis str. CT1 (GCA_002382835)","Eurotiales","290292","ASM238283v1","GCA_002382835.1","-","-","-","-","-","-" -"","Penicillium oxalicum 114-2 (GCA_000346795)","Eurotiales","933388","pde_v1.0","GCA_000346795.1","-","-","-","-","-","-" -"","Penicillium polonicum (GCA_002072265)","Eurotiales","60169","ASM207226v1","GCA_002072265.1","-","-","-","-","-","-" -"","Penicillium roqueforti FM164 (GCA_000513255)","Eurotiales","1365484","PROQFM164_20130607","GCA_000513255.1","-","-","-","-","-","-" -"","Penicillium rubens Wisconsin 54-1255 (GCA_000226395)","Eurotiales","500485","PenChr_Nov2007","GCA_000226395.1","-","-","-","-","-","-" -"","Penicillium solitum (GCA_002072235)","Eurotiales","60172","ASM207223v1","GCA_002072235.1","-","-","-","-","-","-" -"","Penicillium steckii (GCA_002072375)","Eurotiales","303698","ASM207237v1","GCA_002072375.1","-","-","-","-","-","-" -"","Penicillium subrubescens str. CBS 132785 (GCA_001908125)","Eurotiales","1316194","ASM190812v1","GCA_001908125.1","-","-","-","-","-","-" -"","Penicillium vulpinum (GCA_002072255)","Eurotiales","29845","ASM207225v1","GCA_002072255.1","-","-","-","-","-","-" -"","Peniophora sp. CONT (GCA_001632445)","Russulales","1314672","Ricme1","GCA_001632445.1","-","-","-","-","","-" -"","Periconia macrospinosa str. DSE2036 (GCA_003073855)","Pleosporales","97972","Perma1","GCA_003073855.1","-","-","-","-","","-" -"","Pestalotiopsis fici W106-1 (GCA_000516985)","Xylariales","1229662","PFICI","GCA_000516985.1","-","-","-","-","","-" -"","Pezoloma ericae str. UAMH 7357 (GCA_002865625)","Helotiales","1745343","Rhier1","GCA_002865625.1","-","-","-","-","","-" -"","Phaeoacremonium minimum UCRPA7 (GCA_000392275)","Sordariomycetidae","1286976","UCRPA7V03","GCA_000392275.1","-","-","-","-","","-" -"","Phaeomoniella chlamydospora (GCA_001006345)","Chaetothyriomycetidae","158046","UCRPA7V1.0","GCA_001006345.1","-","-","-","-","","-" -"","Phaeosphaeria nodorum","Pleosporales","321614","ASM14691v1","GCA_000146915.1","-","-","-","","","-" -"","Phanerochaete carnosa HHB-10118-sp (GCA_000300595)","Polyporales","650164","Phanerochaete_carnosa_HHB-10118-Sp_v1.0","GCA_000300595.1","-","-","-","-","","-" -"","Phellinus noxius (GCA_002287475)","Hymenochaetales","2282107","ASM228747v1","GCA_002287475.1","-","-","-","-","","-" -"","Phialocephala scopiformis str. CBS 120377 (GCA_001500285)","Helotiales","149040","Phisc1","GCA_001500285.1","-","-","-","-","","-" -"","Phialocephala subalpina (GCA_900073065)","Helotiales","576137","PAC_version_1","GCA_900073065.1","-","-","-","-","","-" -"","Phialophora americana str. CBS 27337 (GCA_000835435)","Chaetothyriomycetidae","5601","Capr_semi_CBS27337_V1","GCA_000835435.1","-","-","-","-","","-" -"","Phialophora attae str. CBS 131958 (GCA_001299255)","Chaetothyriomycetidae","1664694","ASM129925v1","GCA_001299255.1","-","-","-","-","","-" -"","Phlebia centrifuga str. FBCC195 (GCA_001913855)","Polyporales","98765","ASM191385v2","GCA_001913855.2","-","-","-","-","","-" -"","Phlebiopsis gigantea 11061_1 CR5-6 (GCA_000832265)","Polyporales","745531","Phlgi1","GCA_000832265.1","-","-","-","-","","-" -"","Pichia kudriavzevii str. 129 (GCA_001983325)","Saccharomycetales","4909","ASM198332v1","GCA_001983325.1","-","-","-","-","-","-" -"","Pichia kudriavzevii str. CBS573 (GCA_003054445)","Saccharomycetales","4909","ASM305444v1","GCA_003054445.1","-","-","-","-","-","-" -"","Pichia kudriavzevii str. Ckrusei653 (GCA_002166775)","Saccharomycetales","4909","Cand_krus_Ckrusei653_V21","GCA_002166775.1","-","-","-","-","-","-" -"","Pichia kudriavzevii str. SD108 (GCA_000764455)","Saccharomycetales","4909","ASM76445v1","GCA_000764455.1","-","-","-","-","","-" -"","Pichia membranifaciens NRRL Y-2026 (GCA_001661235)","Saccharomycetales","763406","Picme2","GCA_001661235.1","-","-","-","-","","-" -"","Pichia membranifaciens str. KS47-1 (GCA_001950575)","Saccharomycetales","4926","P_membrenifaciens-1.0","GCA_001950575.1","-","-","-","-","-","-" -"","Piloderma croceum F 1598 (GCA_000827315)","Atheliales","765440","Piloderma_croceum_F_1598_v1.0","GCA_000827315.1","-","-","-","-","","-" -"","Piromyces finnis (GCA_002104945)","","1754191","Piromyces_sp._finnis_v3.0","GCA_002104945.1","-","-","-","-","","-" -"","Piromyces sp. E2 (GCA_002157105)","","73868","PirspE2_v1.0","GCA_002157105.1","-","-","-","-","","-" -"","Pisolithus microcarpus 441 (GCA_000827275)","Boletales","765257","Pisolithus_microcarpus_441_v1.0","GCA_000827275.1","-","-","-","-","","-" -"","Pisolithus tinctorius Marx 270 (GCA_000827335)","Boletales","870435","Pisolithus_tinctorius_Marx_270_v1.0","GCA_000827335.1","-","-","-","-","","-" -"","Pleurotus ostreatus PC15 (GCA_000697685)","Agaricales","1137138","PleosPC15_2","GCA_000697685.1","-","-","-","-","","-" -"","Plicaturopsis crispa FD-325 SS-3 (GCA_000827205)","","944288","Plicr1","GCA_000827205.1","-","-","-","-","","-" -"","Pneumocystis carinii B80 (GCA_001477545)","Taphrinomycotina","1408658","Pneu_cari_B80_V3","GCA_001477545.1","-","-","-","-","","-" -"","Pneumocystis jirovecii RU7 (GCA_001477535)","Taphrinomycotina","1408657","Pneu_jiro_RU7_V2","GCA_001477535.1","-","-","-","-","","-" -"","Pneumocystis murina B123 (GCA_000349005)","Taphrinomycotina","1069680","Pneumo_murina_B123_V4","GCA_000349005.2","-","-","-","-","","-" -"","Pochonia chlamydosporia 170 (GCA_001653235)","Hypocreales","1380566","ASM165323v2","GCA_001653235.2","-","-","-","-","","-" -"","Podospora anserina S mat+ (GCA_000226545)","Sordariales","515849","ASM22654v1","GCA_000226545.1","-","-","-","-","-","-" -"","Polytolypa hystricis UAMH7299 (GCA_002573605)","Onygenales","1447883","Poly_hyst_7299_V1","GCA_002573605.1","-","-","-","-","","-" -"","Postia placenta MAD-698-R-SB12 (GCA_002117355)","Polyporales","670580","PosplRSB12_1","GCA_002117355.1","-","-","-","-","-","-" -"","Postia placenta Mad-698-R (GCA_000006255)","Polyporales","561896","Postia_placenta_V1.0","GCA_000006255.1","-","-","-","-","","-" -"","Protomyces lactucaedebilis str. 12-1054 (GCA_002105105)","Taphrinomycotina","56484","Prola1","GCA_002105105.1","-","-","-","-","","-" -"","Pseudocercospora fijiensis CIRAD86 (GCA_000340215)","Capnodiales","383855","Mycfi2","GCA_000340215.1","-","-","-","-","","-" -"","Pseudocercospora musae str. CBS 116634 (GCA_001578225)","Capnodiales","113226","ASM157822v1","GCA_001578225.1","-","-","-","-","","-" -"","Pseudogymnoascus destructans (GCA_001641265)","Pseudeurotiaceae","655981","ASM164126v1","GCA_001641265.1","-","-","-","-","-","-" -"","Pseudogymnoascus destructans 20631-21 (GCA_000184105)","Pseudeurotiaceae","658429","Geom_destructans_V1","GCA_000184105.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. 03VT05 (GCA_001662645)","Pseudeurotiaceae","1622148","ASM166264v1","GCA_001662645.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. 05NY08 (GCA_001662605)","Pseudeurotiaceae","1622149","ASM166260v1","GCA_001662605.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. 23342-1-I1 (GCA_001662575)","Pseudeurotiaceae","1524831","ASM166257v1","GCA_001662575.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. 24MN13 (GCA_001662595)","Pseudeurotiaceae","1622150","ASM166259v1","GCA_001662595.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-103 (GCA_000750895)","Pseudeurotiaceae","1420912","DG30","GCA_000750895.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-3557 (GCA_000750665)","Pseudeurotiaceae","1437433","DG3","GCA_000750665.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-3775 (GCA_000750715)","Pseudeurotiaceae","1420901","DG4","GCA_000750715.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-3808 (GCA_000750675)","Pseudeurotiaceae","1391699","DG1","GCA_000750675.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4246 (GCA_000750735)","Pseudeurotiaceae","1420902","DG5","GCA_000750735.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4281 (FW-2241) (GCA_000750745)","Pseudeurotiaceae","1420906","DG6","GCA_000750745.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4513 (FW-928) (GCA_000750755)","Pseudeurotiaceae","1420907","DG7","GCA_000750755.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4514 (FW-929) (GCA_000750795)","Pseudeurotiaceae","1420908","DG8","GCA_000750795.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4515 (FW-2607) (GCA_000750805)","Pseudeurotiaceae","1420909","DG10","GCA_000750805.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4516 (FW-969) (GCA_000750815)","Pseudeurotiaceae","1420910","DG11","GCA_000750815.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4517 (FW-2822) (GCA_000750875)","Pseudeurotiaceae","1420911","DG13","GCA_000750875.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4518 (FW-2643) (GCA_000750925)","Pseudeurotiaceae","1420913","DG36","GCA_000750925.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4519 (FW-2642) (GCA_000750935)","Pseudeurotiaceae","1420914","DG38","GCA_000750935.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. VKM F-4520 (FW-2644) (GCA_000750995)","Pseudeurotiaceae","1420915","DG39","GCA_000750995.1","-","-","-","-","-","-" -"","Pseudogymnoascus sp. WSF 3629 (GCA_001662585)","Pseudeurotiaceae","1622147","ASM166258v1","GCA_001662585.1","-","-","-","-","-","-" -"","Pseudogymnoascus verrucosus (GCA_001662655)","Pseudeurotiaceae","342668","ASM166265v1","GCA_001662655.1","-","-","-","-","-","-" -"","Pseudoloma neurophilia str. MK1 (GCA_001432165)","Microsporidia","146866","ASM143216v1","GCA_001432165.1","-","-","-","-","","-" -"","Pseudomassariella vexata str. CBS 129021 (GCA_002105095)","Xylariales","1141098","Pseve2","GCA_002105095.1","-","-","-","-","","-" -"","Pseudomicrostroma glucosiphilum str. MCA 4718 (GCA_003144135)","","1684307","Rhodsp1","GCA_003144135.1","-","-","-","-","","-" -"","Pseudozyma hubeiensis SY62 (GCA_000403515)","Ustilaginales","1305764","ASM40351v1","GCA_000403515.1","-","-","-","-","","-" -"","Puccinia coronata var. avenae f. sp. avenae (GCA_002873275)","Pucciniales","200324","ASM287327v1","GCA_002873275.1","-","-","-","-","","-" -"","Puccinia graminis","Pucciniales","418459","ASM14992v1","GCA_000149925.1","","-","","","","" -"","Puccinia graminis Ug99","Pucciniales","1040990","v1","-","","-","-","","","-" -"","Puccinia sorghi str. RO10H11247 (GCA_001263375)","Pucciniales","27349","ASM126337v1","GCA_001263375.1","-","-","-","-","","-" -"","Puccinia striiformis (GCA_002920065)","Pucciniales","27350","ASM292006v1","GCA_002920065.1","-","-","-","-","","-" -"","Puccinia striiformis f. sp. tritici PST-130 str. Race 130","Pucciniales","875184","PST-130_1.0","GCA_000223505.1","-","-","-","","-","-" -"","Puccinia striiformis f. sp. tritici PST-78 (GCA_001191645)","Pucciniales","1165861","P_striiformis_V1","GCA_001191645.1","-","-","-","-","-","-" -"","Puccinia triticina","Pucciniales","630390","ASM15152v1","GCA_000151525.1","-","-","","","","-" -"","Punctularia strigosozonata HHB-11173 SS5 (GCA_000264995)","Corticiales","741275","Punctularia_strigosozonata_v1.0","GCA_000264995.1","-","-","-","-","","-" -"","Purpureocillium lilacinum (GCA_001653205)","Hypocreales","33203","ASM165320v1","GCA_001653205.1","-","-","-","-","","-" -"","Purpureocillium lilacinum (GCA_001653265)","Hypocreales","33203","ASM165326v1","GCA_001653265.1","-","-","-","-","-","-" -"","Purpureocillium lilacinum str. 36-1 (GCA_003144605)","Hypocreales","33203","ASM314460v1","GCA_003144605.1","-","-","-","-","-","-" -"","Pyrenochaeta sp. DS3sAY3a (GCA_001644535)","Pleosporales","765867","Pyrsp1","GCA_001644535.1","-","-","-","-","","-" -"","Pyrenophora teres","Pleosporales","861557","GCA_000166005.1","GCA_000166005.1","-","-","-","","","-" -"","Pyrenophora tritici-repentis (GCA_003171545)","Pleosporales","45151","PtrARCrossB10","GCA_003171545.1","-","-","-","-","-","-" -"","Pyrenophora tritici-repentis (GCA_003231325)","Pleosporales","45151","Ptr134","GCA_003231325.1","-","-","-","-","-","-" -"","Pyrenophora tritici-repentis (GCA_003231365)","Pleosporales","45151","Ptr239","GCA_003231365.1","-","-","-","-","-","-" -"","Pyrenophora tritici-repentis (GCA_003231425)","Pleosporales","45151","Ptr86-124","GCA_003231425.1","-","-","-","-","-","-" -"","Pyrenophora tritici-repentis Pt-1C-BFP","Pleosporales","426418","ASM14998v1","GCA_000149985.1","-","-","-","-","","-" -"","Rachicladosporium antarcticum (GCA_002077065)","Capnodiales","1507870","ASM207706v1","GCA_002077065.1","-","-","-","-","","-" -"","Rachicladosporium sp. CCFEE 5018 (GCA_002077045)","Capnodiales","1974281","ASM207704v2","GCA_002077045.2","-","-","-","-","","-" -"","Ramularia collo-cygni (GCA_900074925)","Capnodiales","112498","version_1","GCA_900074925.1","-","-","-","-","","-" -"","Rasamsonia emersonii CBS 393.64 (GCA_000968595)","Eurotiales","1408163","ASM96859v1","GCA_000968595.1","-","-","-","-","","-" -"","Rhinocladiella mackenziei CBS 650.93 (GCA_000835555)","Chaetothyriomycetidae","1442369","Rhin_mack_CBS_650_93_V1","GCA_000835555.1","-","-","-","-","","-" -"","Rhizoclosmatium globosum str. JEL800 (GCA_002104985)","Chytridiomycetes","329046","Rhihy1","GCA_002104985.1","-","-","-","-","","-" -"","Rhizoctonia solani (GCA_001286725)","Cantharellales","456999","AG22IIIB","GCA_001286725.1","-","-","-","-","-","-" -"","Rhizoctonia solani 123E (GCA_000715385)","Cantharellales","1423351","Rhizoctonia_solani_123E_v1","GCA_000715385.1","-","-","-","-","-","-" -"","Rhizoctonia solani AG-1 IA str. AG1 IA (GCA_000334115)","Cantharellales","983506","Rhisol_AG1IA_1.0","GCA_000334115.1","-","-","-","-","","-" -"","Rhizoctonia solani AG-1 IB (GCA_000350255)","Cantharellales","1108050","ASM35025v1","GCA_000350255.1","-","-","-","-","-","-" -"","Rhizoctonia solani AG-3 Rhs1AP (GCA_000524645)","Cantharellales","1086054","Rhizoctonia_solani_AG-3","GCA_000524645.1","-","-","-","-","-","-" -"","Rhizoctonia solani AG-8 WAC10335 (GCA_000695385)","Cantharellales","1287689","RSAG8-1.V1","GCA_000695385.1","-","-","-","-","-","-" -"","Rhizophagus clarus str. HR1","Glomerales","94130","RclarusHR1_1.0","GCA_003203555.1","-","-","-","-","","-" -"","Rhizophagus irregularis DAOM 181602=DAOM 197198","Glomerales","747089","Rir_HGAP_ii_V2","GCA_002897155.1","-","-","-","-","-","-" -"","Rhizophagus irregularis DAOM 181602=DAOM 197198 (GCA_000439145)","Glomerales","747089","ASM43914v3","GCA_000439145.3","-","-","-","-","-","-" -"","Rhizophagus irregularis DAOM 197198w str. DAOM197198w (GCA_000597685)","Glomerales","1432141","Rir","GCA_000597685.1","-","-","-","-","-","-" -"","Rhizophagus irregularis str. A1","Glomerales","588596","ASM159312v1","GCA_001593125.1","-","-","-","-","-","-" -"","Rhizophagus irregularis str. A4","Glomerales","588596","ASM159314v1","GCA_001593145.1","-","-","-","-","-","-" -"","Rhizophagus irregularis str. A5","Glomerales","588596","ASM159320v1","GCA_001593205.1","-","-","-","-","-","-" -"","Rhizophagus irregularis str. C2","Glomerales","588596","ASM159315v1","GCA_001593155.1","-","-","-","-","-","-" -"","Rhizopogon vesiculosus str. AM-OR11-056 (GCA_001882365)","Boletales","180088","Rves_AM-OR11-056_1.0","GCA_001882365.1","-","-","-","-","","-" -"","Rhizopogon vinicolor AM-OR11-026 (GCA_001658105)","Boletales","1314800","Rhivi1","GCA_001658105.1","-","-","-","-","-","-" -"","Rhizopus delemar RA 99-880 (GCA_000149305)","Mucoromycotina","246409","RO3","GCA_000149305.1","-","-","-","-","","-" -"","Rhizopus microsporus ATCC 52813","Mucoromycotina","1340429","Rhimi1_1","GCA_002708625.1","-","-","-","-","-","-" -"","Rhizopus microsporus str. ATCC 11559","Mucoromycotina","58291","Rhimi_ATCC11559_1","GCA_002083735.1","-","-","-","-","-","-" -"","Rhizopus microsporus str. ATCC62417 (GCA_900000135)","Mucoromycotina","58291","RMATCC62417_Allpaths-LG","GCA_900000135.1","-","-","-","-","-","-" -"","Rhizopus microsporus str. CBS-344.29 (GCA_000825725)","Mucoromycotina","58291","Rmicro_CBS_344.29_Allpaths-LG","GCA_000825725.1","-","-","-","-","","-" -"","Rhizopus microsporus var. microsporus str. ATCC 52814","Mucoromycotina","86635","Rhimi_ATCC52814_1","GCA_002083745.1","-","-","-","-","-","-" -"","Rhodotorula graminis WP1 (GCA_001329695)","Sporidiobolales","578459","Rhoba1_1","GCA_001329695.1","-","-","-","-","","-" -"","Rhodotorula sp. JG-1b (GCA_001541205)","Sporidiobolales","1305733","Rhosp1","GCA_001541205.1","-","-","-","-","-","-" -"","Rhodotorula taiwanensis str. MD1149 (GCA_002922495)","Sporidiobolales","741276","ASM292249v1","GCA_002922495.1","-","-","-","-","-","-" -"","Rhodotorula toruloides (GCA_001255795)","Sporidiobolales","5286","IFO0880_HGAP3_v1","GCA_001255795.1","-","-","-","-","-","-" -"","Rhodotorula toruloides ATCC 204091 (GCA_000222205)","Sporidiobolales","1001064","R.glutinis2","GCA_000222205.2","-","-","-","-","","-" -"","Rhodotorula toruloides NP11 (GCA_000320785)","Sporidiobolales","1130832","RHOziaDV1.0","GCA_000320785.2","-","-","-","-","-","-" -"","Rhynchosporium agropyri (GCA_900074905)","Helotiales","914238","version_1","GCA_900074905.1","-","-","-","-","","-" -"","Rhynchosporium commune (GCA_900074885)","Helotiales","914237","version_1","GCA_900074885.1","-","-","-","-","","-" -"","Rhynchosporium secalis (GCA_900074895)","Helotiales","38038","version_1","GCA_900074895.1","-","-","-","-","","-" -"","Rosellinia necatrix str. W97 (GCA_001445595)","Xylariales","77044","Rnecatrix_2.0","GCA_001445595.3","-","-","-","-","","-" -"","Rozella allomycis CSF55 (GCA_000442015)","Cryptomycota","988480","Rozella_k41_t100","GCA_000442015.1","-","-","-","-","","-" -"","Rutstroemia sp. NJR-2017a BBW (GCA_002946425)","Helotiales","2070414","ASM294642v1","GCA_002946425.1","-","-","-","-","","-" -"","Rutstroemia sp. NJR-2017a BVV2 (GCA_002946415)","Helotiales","2070413","ASM294641v1","GCA_002946415.1","-","-","-","-","","-" -"","Rutstroemia sp. NJR-2017a WRK4 (GCA_002946385)","Helotiales","2070412","ASM294638v1","GCA_002946385.1","-","-","-","-","","-" -"","Saccharomyces arboricola H-6 (GCA_000292725)","Saccharomycetales","1160507","SacArb1.0","GCA_000292725.1","-","-","-","-","","-" -"","Saccharomyces cerevisiae","Saccharomycetales","559292","R64-1-1","GCA_000146045.2","","","","","","" -"","Saccharomyces cerevisiae (GCA_001634645)","Saccharomycetales","4932","GLBRCY22-3","GCA_001634645.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae (GCA_002804325)","Saccharomycetales","4932","ASM280432v1","GCA_002804325.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae CEN.PK113-7D (GCA_000269885)","Saccharomycetales","889517","ASM26988v1","GCA_000269885.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae EC1118 (GCA_000218975)","Saccharomycetales","643680","ASM21897v1","GCA_000218975.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae FostersB (GCA_000190255)","Saccharomycetales","764102","ScFostersB_v01","GCA_000190255.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae FostersO (GCA_000326005)","Saccharomycetales","764101","ScFostersO_v01","GCA_000326005.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae Kyokai no. 7 str. kyokai no. 7 (GCA_000260735)","Saccharomycetales","721032","K7_1.0","GCA_000260735.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae Lalvin QA23 (GCA_000325965)","Saccharomycetales","764098","ScQA23_v01","GCA_000325965.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae P283 (GCA_000568295)","Saccharomycetales","1177187","P283","GCA_000568295.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae P301 (GCA_000568055)","Saccharomycetales","1182968","p301","GCA_000568055.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae R103 (GCA_000568365)","Saccharomycetales","1182967","R103","GCA_000568365.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae RM11-1a (GCA_000149365)","Saccharomycetales","285006","ASM14936v1","GCA_000149365.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae VL3 (GCA_000190235)","Saccharomycetales","764100","ScVL3_v01","GCA_000190235.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae Vin13 (GCA_000190215)","Saccharomycetales","764099","ScVIN13_v01","GCA_000190215.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1078 (GCA_000975645)","Saccharomycetales","1296266","Sc_YJM1078_v1","GCA_000975645.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1083 (GCA_000975675)","Saccharomycetales","1292971","Sc_YJM1083_v1","GCA_000975675.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1129 (GCA_000975705)","Saccharomycetales","1293430","Sc_YJM1129_v1","GCA_000975705.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1133 (GCA_000976695)","Saccharomycetales","1294333","Sc_YJM1133_v1","GCA_000976695.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1190 (GCA_000976725)","Saccharomycetales","1294334","Sc_YJM1190_v1","GCA_000976725.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1199 (GCA_000976755)","Saccharomycetales","1294335","Sc_YJM1199_v1","GCA_000976755.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1202 (GCA_000976785)","Saccharomycetales","1294336","Sc_YJM1202_v1","GCA_000976785.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1208 (GCA_000976815)","Saccharomycetales","1294337","Sc_YJM1208_v1","GCA_000976815.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1242 (GCA_000976845)","Saccharomycetales","1294338","Sc_YJM1242_v1","GCA_000976845.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1244 (GCA_000976875)","Saccharomycetales","1294339","Sc_YJM1244_v1","GCA_000976875.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1248 (GCA_000976905)","Saccharomycetales","1294340","Sc_YJM1248_v1","GCA_000976905.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1250 (GCA_000976935)","Saccharomycetales","1294341","Sc_YJM1250_v1","GCA_000976935.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1252 (GCA_000976965)","Saccharomycetales","1294342","Sc_YJM1252_v1","GCA_000976965.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1273 (GCA_000976995)","Saccharomycetales","1294343","Sc_YJM1273_v1","GCA_000976995.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1304 (GCA_000977025)","Saccharomycetales","1294344","Sc_YJM1304_v1","GCA_000977025.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1307 (GCA_000977055)","Saccharomycetales","1294345","Sc_YJM1307_v1","GCA_000977055.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1311 (GCA_000977085)","Saccharomycetales","1294346","Sc_YJM1311_v1","GCA_000977085.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1326 (GCA_000977115)","Saccharomycetales","1294347","Sc_YJM1326_v1","GCA_000977115.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1332 (GCA_000977145)","Saccharomycetales","1294348","Sc_YJM1332_v1","GCA_000977145.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1336 (GCA_000977175)","Saccharomycetales","1294349","Sc_YJM1336_v1","GCA_000977175.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1338 (GCA_000977205)","","1294350","Sc_YJM1338_v1","GCA_000977205.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1341 (GCA_000977235)","Saccharomycetales","1294351","Sc_YJM1341_v1","GCA_000977235.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1342 (GCA_000977265)","Saccharomycetales","1294352","Sc_YJM1342_v1","GCA_000977265.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1355 (GCA_000977295)","Saccharomycetales","1294353","Sc_YJM1355_v1","GCA_000977295.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1356 (GCA_000977325)","Saccharomycetales","1294354","Sc_YJM1356_v1","GCA_000977325.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1381 (GCA_000977355)","Saccharomycetales","1294355","Sc_YJM1381_v1","GCA_000977355.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1383 (GCA_000977385)","Saccharomycetales","1294356","Sc_YJM1383_v1","GCA_000977385.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1385 (GCA_000977415)","Saccharomycetales","1294357","Sc_YJM1385_v1","GCA_000977415.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1386 (GCA_000977445)","Saccharomycetales","1294358","Sc_YJM1386_v1","GCA_000977445.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1387 (GCA_000977475)","Saccharomycetales","1294359","Sc_YJM1387_v1","GCA_000977475.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1388 (GCA_000977505)","Saccharomycetales","1294360","Sc_YJM1388_v1","GCA_000977505.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1389 (GCA_000977535)","Saccharomycetales","1294361","Sc_YJM1389_v1","GCA_000977535.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1399 (GCA_000977565)","Saccharomycetales","1294362","Sc_YJM1399_v1","GCA_000977565.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1400 (GCA_000977595)","Saccharomycetales","1294363","Sc_YJM1400_v1","GCA_000977595.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1401 (GCA_000977625)","Saccharomycetales","1294364","Sc_YJM1401_v1","GCA_000977625.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1402 (GCA_000977655)","Saccharomycetales","1294365","Sc_YJM1402_v1","GCA_000977655.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1415 (GCA_000977685)","Saccharomycetales","1294366","Sc_YJM1415_v1","GCA_000977685.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1417 (GCA_000977715)","Saccharomycetales","1294367","Sc_YJM1417_v1","GCA_000977715.4","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1418 (GCA_000977745)","Saccharomycetales","1294368","Sc_YJM1418_v1","GCA_000977745.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1419 (GCA_000977775)","Saccharomycetales","1294369","Sc_YJM1419_v1","GCA_000977775.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1433 (GCA_000977805)","Saccharomycetales","1294370","Sc_YJM1433_v1","GCA_000977805.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1434 (GCA_000977835)","Saccharomycetales","1294371","Sc_YJM1434_v1","GCA_000977835.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1439 (GCA_000977865)","Saccharomycetales","1294372","Sc_YJM1439_v1","GCA_000977865.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1443 (GCA_000977895)","Saccharomycetales","1294373","Sc_YJM1443_v1","GCA_000977895.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1444 (GCA_000977925)","Saccharomycetales","1294374","Sc_YJM1444_v1","GCA_000977925.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1447 (GCA_000977955)","Saccharomycetales","1294375","Sc_YJM1447_v1","GCA_000977955.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1450 (GCA_000977985)","Saccharomycetales","1294376","Sc_YJM1450_v1","GCA_000977985.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1460 (GCA_000978015)","Saccharomycetales","1294377","Sc_YJM1460_v1","GCA_000978015.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1463 (GCA_000978045)","Saccharomycetales","1294378","Sc_YJM1463_v1","GCA_000978045.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1477 (GCA_000978075)","Saccharomycetales","1294379","Sc_YJM1477_v1","GCA_000978075.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1478 (GCA_000978105)","Saccharomycetales","1294380","Sc_YJM1478_v1","GCA_000978105.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1479 (GCA_000978135)","Saccharomycetales","1294381","Sc_YJM1479_v1","GCA_000978135.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1526 (GCA_000978165)","Saccharomycetales","1294382","Sc_YJM1526_v1","GCA_000978165.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1527 (GCA_000978195)","Saccharomycetales","1294383","Sc_YJM1527_v1","GCA_000978195.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1549 (GCA_000978225)","Saccharomycetales","1294384","Sc_YJM1549_v1","GCA_000978225.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1573 (GCA_000978255)","Saccharomycetales","1294385","Sc_YJM1573_v1","GCA_000978255.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1574 (GCA_000978285)","Saccharomycetales","1294386","Sc_YJM1574_v1","GCA_000978285.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1592 (GCA_000978315)","Saccharomycetales","1294387","Sc_YJM1592_v1","GCA_000978315.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM1615 (GCA_000978345)","Saccharomycetales","1294388","Sc_YJM1615_v1","GCA_000978345.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM189 (GCA_000975735)","Saccharomycetales","1294303","Sc_YJM189_v1","GCA_000975735.4","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM193 (GCA_000975765)","Saccharomycetales","1294304","Sc_YJM193_v1","GCA_000975765.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM195 (GCA_000975585)","Saccharomycetales","1294305","Sc_YJM195_v1","GCA_000975585.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM244 (GCA_000975615)","Saccharomycetales","1294306","Sc_YJM244_v1","GCA_000975615.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM248 (GCA_000975795)","Saccharomycetales","1294307","Sc_YJM248_v1","GCA_000975795.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM270 (GCA_000975825)","Saccharomycetales","1294308","Sc_YJM270_v1","GCA_000975825.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM271 (GCA_000975855)","Saccharomycetales","1294309","Sc_YJM271_v1","GCA_000975855.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM320 (GCA_000975885)","Saccharomycetales","947042","Sc_YJM320_v1","GCA_000975885.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM326 (GCA_000975915)","Saccharomycetales","468558","Sc_YJM326_v1","GCA_000975915.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM428 (GCA_000975945)","Saccharomycetales","947044","Sc_YJM428_v1","GCA_000975945.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM450 (GCA_000975975)","Saccharomycetales","1294310","Sc_YJM450_v1","GCA_000975975.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM451 (GCA_000976005)","Saccharomycetales","502869","Sc_YJM451_v1","GCA_000976005.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM453 (GCA_000976035)","Saccharomycetales","1294311","Sc_YJM453_v1","GCA_000976035.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM456 (GCA_000976065)","Saccharomycetales","1294312","Sc_YJM456_v1","GCA_000976065.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM470 (GCA_000976095)","Saccharomycetales","1294313","Sc_YJM470_v1","GCA_000976095.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM541 (GCA_000976125)","Saccharomycetales","1294314","Sc_YJM541_v1","GCA_000976125.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM554 (GCA_000976155)","Saccharomycetales","1294315","Sc_YJM554_v1","GCA_000976155.4","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM555 (GCA_000976185)","Saccharomycetales","1294316","Sc_YJM555_v1","GCA_000976185.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM627 (GCA_000976215)","Saccharomycetales","1294317","Sc_YJM627_v1","GCA_000976215.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM681 (GCA_000976245)","Saccharomycetales","1294318","Sc_YJM681_v1","GCA_000976245.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM682 (GCA_000976275)","Saccharomycetales","1294319","Sc_YJM682_v1","GCA_000976275.4","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM683 (GCA_000976305)","Saccharomycetales","1294320","Sc_YJM683_v1","GCA_000976305.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM689 (GCA_000976335)","Saccharomycetales","1294321","Sc_YJM689_v1","GCA_000976335.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM693 (GCA_000976365)","Saccharomycetales","1294322","Sc_YJM693_v1","GCA_000976365.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM789 (GCA_000181435)","Saccharomycetales","307796","ASM18143v1","GCA_000181435.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM969 (GCA_000976395)","Saccharomycetales","1294323","Sc_YJM969_v1","GCA_000976395.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM972 (GCA_000976425)","Saccharomycetales","1294324","Sc_YJM972_v1","GCA_000976425.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM975 (GCA_000976455)","Saccharomycetales","1294325","Sc_YJM975_v1","GCA_000976455.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM978 (GCA_000976485)","Saccharomycetales","1294326","Sc_YJM978_v1","GCA_000976485.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM981 (GCA_000976515)","Saccharomycetales","1294327","Sc_YJM981_v1","GCA_000976515.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM984 (GCA_000976545)","Saccharomycetales","1294328","Sc_YJM984_v1","GCA_000976545.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM987 (GCA_000976575)","Saccharomycetales","1294329","Sc_YJM987_v1","GCA_000976575.4","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM990 (GCA_000976605)","Saccharomycetales","1294330","Sc_YJM990_v1","GCA_000976605.3","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM993 (GCA_000662435)","Saccharomycetales","1294331","Sc_YJM993_v1","GCA_000662435.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae YJM996 (GCA_000976665)","Saccharomycetales","1294332","Sc_YJM996_v1","GCA_000976665.2","-","-","-","-","-","-" -"","Saccharomyces cerevisiae str. 131 (GCA_001983315)","Saccharomycetales","4932","ASM198331v1","GCA_001983315.1","-","-","-","-","-","-" -"","Saccharomyces cerevisiae x Saccharomyces kudriavzevii VIN7 (GCA_000326105)","Saccharomycetales","1095631","ASM32610v1","GCA_000326105.1","-","-","-","-","-","-" -"","Saccharomyces eubayanus str. FM1318 (GCA_001298625)","Saccharomycetales","1080349","SEUB3.0","GCA_001298625.1","-","-","-","-","","-" -"","Saccharomyces kudriavzevii IFO 1802 (GCA_000167075)","Saccharomycetales","226230","Saccharomyces_kudriavzevii_strain_IFO1802_v1.0","GCA_000167075.2","-","-","-","-","","-" -"","Saccharomyces sp. 'boulardii' str. biocodex (GCA_001298375)","Saccharomycetales","252598","ASM129837v2","GCA_001298375.2","-","-","-","-","","-" -"","Saccharomyces sp. 'boulardii' str. unique28 (GCA_001413975)","Saccharomycetales","252598","ASM141397v1","GCA_001413975.1","-","-","-","-","-","-" -"","Saccharomycetaceae sp. 'Ashbya aceri' (GCA_000412225)","Saccharomycetales","566037","ASM41222v2","GCA_000412225.2","-","-","-","-","","-" -"","Saitoella complicata NRRL Y-17804 (GCA_000227095)","Taphrinomycotina","698492","Scomplicata_3.0","GCA_000227095.3","-","-","-","-","","-" -"","Saitoella complicata NRRL Y-17804 (GCA_001661265)","Taphrinomycotina","698492","Saico1","GCA_001661265.1","-","-","-","-","-","-" -"","Scedosporium apiospermum str. IHEM 14462 (GCA_000732125)","Microascales","563466","ScApio1.0","GCA_000732125.1","-","-","-","-","","-" -"","Scheffersomyces stipitis CBS 6054 (GCA_000209165)","Saccharomycetales","322104","ASM20916v1","GCA_000209165.1","-","-","-","-","","-" -"","Schizophyllum commune H4-8 (GCA_000143185)","Agaricales","578458","v1.0","GCA_000143185.1","-","-","-","-","","-" -"","Schizopora paradoxa str. KUC8140 (GCA_001020605)","Hymenochaetales","27342","Schpa1","GCA_001020605.1","-","-","-","-","","-" -"","Schizosaccharomyces cryophilus","Schizosaccharomycetales","653667","GCA_000004155.2","GCA_000004155.2","-","-","","","","-" -"","Schizosaccharomyces japonicus","Schizosaccharomycetales","402676","GCA_000149845.2","GCA_000149845.2","-","-","","","","-" -"","Schizosaccharomyces octosporus","Schizosaccharomycetales","483514","GCA_000150505.2","GCA_000150505.2","-","-","","","","-" -"","Schizosaccharomyces pombe","Schizosaccharomycetales","284812","ASM294v2","GCA_000002945.2","","-","","","","" -"","Scleroderma citrinum Foug A (GCA_000827425)","Boletales","1036808","Scleroderma_citrinum_Foug_A_v1.0","GCA_000827425.1","-","-","-","-","","-" -"","Sclerotinia borealis F-4128 (GCA_000503235)","Sclerotiniaceae","1432307","SBOR_1","GCA_000503235.1","-","-","-","-","","-" -"","Sclerotinia sclerotiorum","Sclerotiniaceae","665079","ASM14694v1","GCA_000146945.1","-","-","-","","","-" -"","Sclerotinia sclerotiorum 1980 UF-70 (GCA_001857865)","Sclerotiniaceae","665079","ASM185786v1","GCA_001857865.1","-","-","-","-","-","-" -"","Serendipita indica DSM 11827 (GCA_000313545)","Sebacinales","1109443","ASM31354v1","GCA_000313545.1","-","-","-","-","","-" -"","Serendipita vermifera MAFF 305830 (GCA_000827415)","Sebacinales","933852","Sebacina_vermifera_MAFF_305830_v1.0","GCA_000827415.1","-","-","-","-","","-" -"","Serpula lacrymans var. lacrymans S7.3 (GCA_000218725)","Boletales","936435","v1.0","GCA_000218725.1","-","-","-","-","","-" -"","Serpula lacrymans var. lacrymans S7.9 (GCA_000218685)","Boletales","578457","v1.0","GCA_000218685.1","-","-","-","-","-","-" -"","Sistotremastrum niveocremeum HHB9708 (GCA_001630475)","","1314777","Sisni1","GCA_001630475.1","-","-","-","-","","-" -"","Sistotremastrum suecicum HHB10207 ss-3 (GCA_001632355)","","1314776","Sissu1","GCA_001632355.1","-","-","-","-","","-" -"","Sordaria macrospora k-hell (GCA_000182805)","Sordariales","771870","ASM18280v2","GCA_000182805.2","-","-","-","-","","-" -"","Spathaspora passalidarum NRRL Y-27907 (GCA_000223485)","Saccharomycetales","619300","Spathaspora_passalidarum_v2.0","GCA_000223485.1","-","-","-","-","","-" -"","Sphaerobolus stellatus SS14 (GCA_000827215)","Geastrales","990650","Sphst1","GCA_000827215.1","-","-","-","-","","-" -"","Sphaerulina musiva SO2202 (GCA_000320565)","Capnodiales","692275","Septoria_musiva_SO2202_v1.0","GCA_000320565.2","-","-","-","-","","-" -"","Spizellomyces punctatus DAOM BR117 (GCA_000182565)","Chytridiomycetes","645134","S_punctatus_V1","GCA_000182565.2","-","-","-","-","","-" -"","Sporisorium reilianum","Ustilaginales","999809","GCA_000230245.1","GCA_000230245.1","-","-","-","","","-" -"","Sporisorium reilianum f. sp. reilianum (GCA_900162835)","Ustilaginales","72559","version_2","GCA_900162835.1","-","-","-","-","-","-" -"","Sporothrix brasiliensis 5110 (GCA_000820605)","Ophiostomatales","1398154","S_brasiliensis_5110_v1","GCA_000820605.1","-","-","-","-","","-" -"","Sporothrix insectorum RCEF 264 (GCA_001636815)","Ophiostomatales","1081102","SPI_1.0","GCA_001636815.1","-","-","-","-","","-" -"","Sporothrix schenckii 1099-18 (GCA_000961545)","Ophiostomatales","1397361","S_schenckii_v1","GCA_000961545.1","-","-","-","-","-","-" -"","Sporothrix schenckii ATCC 58251 (GCA_000474925)","Ophiostomatales","1391915","Spor_sche_ATCC58251_V1","GCA_000474925.1","-","-","-","-","","-" -"","Spraguea lophii 42_110 (GCA_000430065)","Spraguidae","1358809","Sprlop1.0","GCA_000430065.1","-","-","-","-","","-" -"","Stachybotrys chartarum IBT 40288 (GCA_000732765)","Hypocreales","1283842","S40288v1","GCA_000732765.1","-","-","-","-","","-" -"","Stachybotrys chartarum IBT 40293 (GCA_000732565)","Hypocreales","1280524","S40293v1","GCA_000732565.1","-","-","-","-","-","-" -"","Stachybotrys chartarum IBT 7711 (GCA_000730325)","Hypocreales","1280523","S7711v1","GCA_000730325.1","-","-","-","-","-","-" -"","Stachybotrys chlorohalonata IBT 40285 (GCA_000732775)","Hypocreales","1283841","S40285v1","GCA_000732775.1","-","-","-","-","","-" -"","Stagonospora sp. SRC1lsM3a (GCA_001644525)","Pleosporales","765868","Stasp1","GCA_001644525.1","-","-","-","-","","-" -"","Stemphylium lycopersici str. CIDEFI 216 (GCA_001191545)","Pleosporales","183478","ASM119154v1","GCA_001191545.1","-","-","-","-","","-" -"","Stereum hirsutum FP-91666 SS1 (GCA_000264905)","Russulales","721885","Stehi1","GCA_000264905.1","-","-","-","-","","-" -"","Sugiyamaella lignohabitans str. CBS 10342 (GCA_001640025)","Saccharomycetales","796027","ASM164002v2","GCA_001640025.2","-","-","-","-","","-" -"","Suhomyces tanzawaensis NRRL Y-17324 (GCA_001661415)","Saccharomycetales","984487","Canta1","GCA_001661415.1","-","-","-","-","","-" -"","Suillus luteus UH-Slu-Lm8-n1 (GCA_000827255)","Boletales","930992","Suilu1","GCA_000827255.1","-","-","-","-","","-" -"","Syncephalastrum racemosum str. NRRL 2496","Mucoromycotina","13706","Synrac1","GCA_002105135.1","-","-","-","-","","-" -"","Talaromyces atroroseus str. IBT 11181 (GCA_001907595)","Eurotiales","1441469","ASM190759v1","GCA_001907595.1","-","-","-","-","","-" -"","Talaromyces cellulolyticus str. Y-94 (GCA_000829775)","Eurotiales","1472165","TcelY94_1.0","GCA_000829775.1","-","-","-","-","","-" -"","Talaromyces islandicus (GCA_000985935)","Eurotiales","28573","PIS","GCA_000985935.1","-","-","-","-","","-" -"","Talaromyces marneffei ATCC 18224 (GCA_000001985)","Eurotiales","441960","JCVI-PMFA1-2.0","GCA_000001985.1","-","-","-","-","","-" -"","Talaromyces marneffei PM1 (GCA_000750115)","Eurotiales","1077442","ASM75011v1","GCA_000750115.1","-","-","-","-","-","-" -"","Talaromyces stipitatus ATCC 10500 (GCA_000003125)","Eurotiales","441959","JCVI-TSTA1-3.0","GCA_000003125.1","-","-","-","-","","-" -"","Termitomyces sp. J132 (GCA_001263195)","Agaricales","1306850","TerJ1321.0","GCA_001263195.1","-","-","-","-","","-" -"","Testicularia cyperi str. MCA 3645 (GCA_003144125)","Ustilaginales","1882483","Tescy1","GCA_003144125.1","-","-","-","-","","-" -"","Tetrapisispora blattae CBS 6284 (GCA_000315915)","Saccharomycetales","1071380","ASM31591v1","GCA_000315915.1","-","-","-","-","","-" -"","Tetrapisispora phaffii CBS 4417 (GCA_000236905)","Saccharomycetales","1071381","ASM23690v1","GCA_000236905.1","-","-","-","-","","-" -"","Thermothelomyces thermophila ATCC 42464 (GCA_000226095)","Sordariales","573729","ASM22609v1","GCA_000226095.1","-","-","-","-","","-" -"","Thielavia terrestris NRRL 8126 (GCA_000226115)","Sordariales","578455","ASM22611v1","GCA_000226115.1","-","-","-","-","","-" -"","Thielaviopsis punctulata (GCA_000968615)","Microascales","72032","ASM96861v1","GCA_000968615.1","-","-","-","-","","-" -"","Tilletia caries str. DAOM 238032 (GCA_001645005)","","13290","ASM164500v1","GCA_001645005.1","-","-","-","-","","-" -"","Tilletia controversa str. DAOM 236426 (GCA_001645045)","","13291","ASM164504v1","GCA_001645045.1","-","-","-","-","","-" -"","Tilletia indica str. DAOM 236416 (GCA_001645015)","","43049","ASM164501v1","GCA_001645015.1","-","-","-","-","","-" -"","Tilletia walkeri str. DAOM 236422 (GCA_001645055)","","117179","ASM164505v1","GCA_001645055.1","-","-","-","-","","-" -"","Tilletiaria anomala UBC 951 (GCA_000711695)","Georgefischeriales","1037660","Tilletiaria_anomala_UBC_951_v1.0","GCA_000711695.1","-","-","-","-","","-" -"","Tilletiopsis washingtonensis str. MCA 4186 (GCA_003144115)","","58919","Tilwa1","GCA_003144115.1","-","-","-","-","","-" -"","Tolypocladium capitatum str. CBS 113982 (GCA_002901185)","Hypocreales","45235","ASM290118v1","GCA_002901185.1","-","-","-","-","","-" -"","Tolypocladium ophioglossoides CBS 100239 (GCA_001189435)","Hypocreales","1163406","Tophv1.0","GCA_001189435.1","-","-","-","-","","-" -"","Tolypocladium paradoxum str. NRBC 100945 (GCA_002916505)","Hypocreales","94208","ASM291650v1","GCA_002916505.1","-","-","-","-","","-" -"","Torrubiella hemipterigena str. BCC 1449 (GCA_000825705)","Hypocreales","1531966","Allpaths-LG","GCA_000825705.1","-","-","-","-","","-" -"","Tortispora caseinolytica NRRL Y-17796 (GCA_001661475)","Saccharomycetales","767744","Canca1","GCA_001661475.1","-","-","-","-","","-" -"","Torulaspora delbrueckii str. CBS 1146 (GCA_000243375)","Saccharomycetales","4950","ASM24337v1","GCA_000243375.1","-","-","-","-","","-" -"","Trachipleistophora hominis (GCA_000316135)","Pleistophoridae","72359","ASM31613v1","GCA_000316135.1","-","-","-","-","","-" -"","Trametes cinnabarina str. BRFM137 (GCA_000765035)","Polyporales","5643","BN946","GCA_000765035.1","-","-","-","-","","-" -"","Trametes coccinea BRFM310 (GCA_002092935)","Polyporales","1353009","Pycco1","GCA_002092935.1","-","-","-","-","","-" -"","Trametes pubescens str. FBCC735 (GCA_001895945)","Polyporales","154538","ASM189594v1","GCA_001895945.1","-","-","-","-","","-" -"","Trametes versicolor FP-101664 SS1 (GCA_000271585)","Polyporales","717944","Trametes_versicolor_v1.0","GCA_000271585.1","-","-","-","-","","-" -"","Tremella mesenterica DSM 1558 (GCA_000271645)","Tremellales","578456","Treme1","GCA_000271645.1","-","-","-","-","","-" -"","Trichoderma asperellum CBS 433.97 (GCA_003025105)","Hypocreales","1042311","Trias_v._1.0","GCA_003025105.1","-","-","-","-","","-" -"","Trichoderma atroviride IMI 206040 (GCA_000171015)","Hypocreales","452589","TRIAT_v2.0","GCA_000171015.2","-","-","-","-","","-" -"","Trichoderma citrinoviride str. TUCIM 6016 (GCA_003025115)","Hypocreales","58853","Trici_v4.0","GCA_003025115.1","-","-","-","-","","-" -"","Trichoderma gamsii str. T6085 (GCA_001481775)","Hypocreales","398673","TGAM01v2","GCA_001481775.2","-","-","-","-","","-" -"","Trichoderma guizhouense str. NJAU 4742 (GCA_002022785)","Hypocreales","1491466","ASM202278v1","GCA_002022785.1","-","-","-","-","","-" -"","Trichoderma harzianum CBS 226.95 (GCA_003025095)","Hypocreales","983964","Allpaths-LG_v._01_03_12","GCA_003025095.1","-","-","-","-","-","-" -"","Trichoderma harzianum str. T6776 (GCA_000988865)","Hypocreales","5544","ASM98886v1","GCA_000988865.1","-","-","-","-","","-" -"","Trichoderma harzianum str. TR274 (GCA_002838845)","Hypocreales","5544","ASM283884v1","GCA_002838845.1","-","-","-","-","-","-" -"","Trichoderma harzianum str. Tr1 (GCA_002894145)","Hypocreales","5544","Tr1","GCA_002894145.1","-","-","-","-","-","-" -"","Trichoderma longibrachiatum ATCC 18648 (GCA_003025155)","Hypocreales","983965","Trilo3","GCA_003025155.1","-","-","-","-","","-" -"","Trichoderma parareesei (GCA_001050175)","Hypocreales","858221","Tpara_v1.0","GCA_001050175.1","-","-","-","-","","-" -"","Trichoderma reesei","Hypocreales","431241","GCA_000167675.2","GCA_000167675.2","-","-","-","","","-" -"","Trichoderma reesei RUT C-30 (GCA_000513815)","Hypocreales","1344414","TrireRUTC30_1","GCA_000513815.1","-","-","-","-","-","-" -"","Trichoderma virens","Hypocreales","413071","ASM17099v1","GCA_000170995.2","-","-","","","","-" -"","Trichophyton benhamiae CBS 112371 (GCA_000151125)","Onygenales","663331","ASM15112v2","GCA_000151125.2","-","-","-","-","","-" -"","Trichophyton equinum CBS 127.97 (GCA_000151175)","Onygenales","559882","ASM15117v1","GCA_000151175.1","-","-","-","-","","-" -"","Trichophyton interdigitale H6 (GCA_000616785)","Onygenales","1215336","Tric_rubr_H6_V2","GCA_000616785.1","-","-","-","-","-","-" -"","Trichophyton interdigitale MR816 (GCA_000622975)","Onygenales","1215338","Tric_inte_MR816_V1","GCA_000622975.1","-","-","-","-","","-" -"","Trichophyton mentagrophytes str. TIMM 2789 (GCA_003118255)","Onygenales","523103","ABySS_70bp_45k_152cov_v1","GCA_003118255.1","-","-","-","-","","-" -"","Trichophyton rubrum CBS 100081 (GCA_000616805)","Onygenales","1215328","Tric_fish_CBS_100081_V1","GCA_000616805.1","-","-","-","-","-","-" -"","Trichophyton rubrum CBS 118892 (GCA_000151425)","Onygenales","559305","ASM15142v1","GCA_000151425.1","-","-","-","-","","-" -"","Trichophyton rubrum CBS 202.88 (GCA_000616985)","Onygenales","1215334","Tric_raub_CBS_202_88_V2","GCA_000616985.1","-","-","-","-","-","-" -"","Trichophyton rubrum CBS 288.86 (GCA_000616825)","Onygenales","1215330","Tric_fish_CBS_288_86_V1","GCA_000616825.1","-","-","-","-","-","-" -"","Trichophyton rubrum CBS 289.86 (GCA_000616845)","Onygenales","1215329","Tric_kane_CBS_289_86_V1","GCA_000616845.1","-","-","-","-","-","-" -"","Trichophyton rubrum CBS 735.88 (GCA_000616965)","Onygenales","1215332","Tric_megn_CBS_735_88_V1","GCA_000616965.1","-","-","-","-","-","-" -"","Trichophyton rubrum D6 (GCA_000622995)","Onygenales","1215335","Tric_rubr_D6_V1","GCA_000622995.1","-","-","-","-","-","-" -"","Trichophyton rubrum MR1448 (GCA_000616905)","Onygenales","1215339","Tric_rubr_M1448_V1","GCA_000616905.1","-","-","-","-","-","-" -"","Trichophyton rubrum MR1459 (GCA_000616945)","Onygenales","1215341","Tric_rubr_MR1459_V1","GCA_000616945.1","-","-","-","-","-","-" -"","Trichophyton rubrum MR850 (GCA_000616765)","Onygenales","1215337","Tric_rubr_MR-850_V1","GCA_000616765.1","-","-","-","-","-","-" -"","Trichophyton rubrum str. CMCC(F)T1i (GCA_001651445)","Onygenales","5551","CMCC_F_T1i","GCA_001651445.1","-","-","-","-","-","-" -"","Trichophyton soudanense CBS 452.61 (GCA_000616865)","Onygenales","1215331","Tric_soud_CBS_452_61_V1","GCA_000616865.1","-","-","-","-","","-" -"","Trichophyton tonsurans CBS 112818 (GCA_000151455)","Onygenales","647933","ASM15145v1","GCA_000151455.1","-","-","-","-","","-" -"","Trichophyton verrucosum HKI 0517 (GCA_000151505)","Onygenales","663202","ASM15150v1","GCA_000151505.1","-","-","-","-","","-" -"","Trichophyton violaceum str. CMCC(F)T3l (GCA_001651435)","Onygenales","34388","CMCC_F_T3l","GCA_001651435.1","-","-","-","-","","-" -"","Trichosporon asahii var. asahii CBS 2479 (GCA_000293215)","","1186058","Trichosporon_asahii_1","GCA_000293215.1","-","-","-","-","-","-" -"","Trichosporon asahii var. asahii CBS 8904 (GCA_000299215)","","1220162","ASM29921v2","GCA_000299215.2","-","-","-","-","","-" -"","Tsuchiyaea wingfieldii CBS 7118 (GCA_001720155)","Tremellales","1295528","Tsuc_wing_CBS7118_V1","GCA_001720155.1","-","-","-","-","","-" -"","Tuber borchii str. Tbo3840 (GCA_003070745)","Pezizales","42251","Tubbor1","GCA_003070745.1","-","-","-","-","","-" -"","Tuber magnatum (GCA_003182015)","Pezizales","42249","ASM318201v1","GCA_003182015.1","-","-","-","-","","-" -"","Tuber melanosporum","Pezizales","656061","ASM15164v1","GCA_000151645.1","-","-","-","","","-" -"","Tulasnella calospora MUT 4182 (GCA_000827465)","Cantharellales","1051891","Tulasnella_calospora_AL13_4D_v1.0","GCA_000827465.1","-","-","-","-","","-" -"","Umbilicaria pustulata (GCA_900169345)","","136370","Lasallia_pustulata_v1","GCA_900169345.1","-","-","-","-","-","-" -"","Uncinocarpus reesii 1704 str. UAMH 1704 (GCA_000003515)","Onygenales","336963","ASM351v2","GCA_000003515.2","-","-","-","-","","-" -"","Ustilaginoidea virens (GCA_000965225)","Hypocreales","1159556","ASM96522v2","GCA_000965225.2","-","-","-","-","-","-" -"","Ustilaginoidea virens str. UV-8b (GCA_000687475)","Hypocreales","1159556","Assembly_for_version_1_of_the_Villosiclava_virens_genome","GCA_000687475.1","-","-","-","-","","-" -"","Ustilaginomycotina sp. SA 807 (GCA_003144235)","","1673888","Ustsp1","GCA_003144235.1","-","-","-","-","","-" -"","Ustilago bromivora str. UB2112 (GCA_900080155)","Ustilaginales","307758","UBRO_v3","GCA_900080155.1","-","-","-","-","-","-" -"","Ustilago hordei str. Uh4857-4 (GCA_000286035)","Ustilaginales","120017","ASM28603v1","GCA_000286035.1","-","-","-","-","","-" -"","Ustilago maydis","Ustilaginales","237631","Umaydis521_2.0","GCA_000328475.2","-","-","-","","","" -"","Valsa mali str. 03-8 (GCA_000818155)","Sordariomycetidae","105487","ASM81815v1","GCA_000818155.1","-","-","-","-","-","-" -"","Valsa mali var. pyri str. SXYL134 (GCA_000813385)","Sordariomycetidae","694573","ASM81338v1","GCA_000813385.1","-","-","-","-","","-" -"","Vanderwaltozyma polyspora DSM 70294 (GCA_000150035)","Saccharomycetales","436907","ASM15003v1","GCA_000150035.1","-","-","-","-","","-" -"","Vavraia culicis subsp. floridensis (GCA_000192795)","Pleistophoridae","948595","Vavr_culi_floridensis_V1","GCA_000192795.1","-","-","-","-","","-" -"","Verruconis gallopava str. CBS 43764 (GCA_000836295)","Venturiales","253628","O_gall_CBS43764","GCA_000836295.1","-","-","-","-","-","-" -"","Verticillium alfalfae VaMs.102 (GCA_000150825)","Glomerellales","526221","ASM15082v1","GCA_000150825.1","-","-","-","-","-","-" -"","Verticillium dahliae","Glomerellales","498257","ASM15067v2","GCA_000150675.2","-","-","-","","","-" -"","Verticillium dahliae (GCA_002892995)","Glomerellales","27337","ASM289299v1","GCA_002892995.1","-","-","-","-","-","-" -"","Verticillium dahliae (GCA_002893025)","Glomerellales","27337","ASM289302v1","GCA_002893025.1","-","-","-","-","-","-" -"","Verticillium dahliae (GCA_002893035)","Glomerellales","27337","ASM289303v1","GCA_002893035.1","-","-","-","-","-","-" -"","Verticillium dahliae (GCA_002893045)","Glomerellales","27337","ASM289304v1","GCA_002893045.1","-","-","-","-","-","-" -"","Verticillium dahliae JR2","Glomerellales","1202531","VDAG_JR2v.4.0","GCA_000400815.2","","-","-","","-","-" -"","Verticillium dahliae str. 12008 (GCA_002892985)","Glomerellales","27337","ASM289298v1","GCA_002892985.1","-","-","-","-","-","-" -"","Verticillium longisporum (GCA_001268145)","Glomerellales","100787","vl1.denovo.v1","GCA_001268145.1","-","-","-","-","-","-" -"","Verticillium longisporum (GCA_001268165)","Glomerellales","100787","vl2.denovo.v1","GCA_001268165.1","-","-","-","-","","-" -"","Vittaforma corneae ATCC 50505 (GCA_000231115)","Nosematidae","993615","Vitt_corn_V1","GCA_000231115.1","-","-","-","-","","-" -"","Wallemia ichthyophaga EXF-994 (GCA_000400465)","Wallemiales","1299270","Wallemia_ichthyophaga_version_1.0","GCA_000400465.1","-","-","-","-","","-" -"","Wallemia mellicola CBS 633.66 (GCA_000263375)","Wallemiales","671144","Wallemia_sebi_v1.0","GCA_000263375.1","-","-","-","-","","-" -"","Wickerhamiella sorbophila str. DS02 (GCA_002251995)","Saccharomycetales","45607","ASM225199v2","GCA_002251995.2","-","-","-","-","","-" -"","Wickerhamomyces anomalus NRRL Y-366-8 (GCA_001661255)","Saccharomycetales","683960","Wican1","GCA_001661255.1","-","-","-","-","","-" -"","Wickerhamomyces ciferrii str. NRRL Y-1031 (GCA_000313485)","Saccharomycetales","1041607","ASM31348v1","GCA_000313485.1","-","-","-","-","","-" -"","Wolfiporia cocos MD-104 SS10 (GCA_000344635)","Polyporales","742152","Wolco1","GCA_000344635.1","-","-","-","-","","-" -"","Xanthophyllomyces dendrorhous (GCA_001007165)","Cystofilobasidiales","5421","Xden1","GCA_001007165.2","-","-","-","-","-","-" -"","Xylona heveae TC161 (GCA_001619985)","","1328760","Xylona_heveae_TC161_v1.0","GCA_001619985.1","-","-","-","-","","-" -"","Yarrowia lipolytica","Saccharomycetales","284591","GCA_000002525.1","GCA_000002525.1","-","-","-","","-","-" -"","Yarrowia lipolytica (GCA_900087985)","Saccharomycetales","4952","YALIA101","GCA_900087985.1","-","-","-","-","","-" -"","Yarrowia lipolytica str. CLIB89 (W29) (GCA_001761485)","Saccharomycetales","4952","ASM176148v1","GCA_001761485.1","-","-","-","-","-","-" -"","Zygosaccharomyces bailii (GCA_900162805)","Saccharomycetales","4954","version_1","GCA_900162805.1","-","-","-","-","-","-" -"","Zygosaccharomyces bailii CLIB 213 (GCA_000442885)","Saccharomycetales","1333698","ZYBA0","GCA_000442885.1","-","-","-","-","","-" -"","Zygosaccharomyces bailii ISA1307 (GCA_000530735)","Saccharomycetales","1355161","Z_bailii_ISA1307_version_3","GCA_000530735.1","-","-","-","-","-","-" -"","Zygosaccharomyces parabailii str. ATCC 60483 (GCA_001984395)","Saccharomycetales","1365886","ASM198439v2","GCA_001984395.2","-","-","-","-","","-" -"","Zygosaccharomyces rouxii str. CBS 732 (GCA_000026365)","Saccharomycetales","4956","ASM2636v1","GCA_000026365.1","-","-","-","-","","-" -"","Zygosaccharomyces rouxii str. NBRC110957 (GCA_001972345)","Saccharomycetales","4956","ZYGR_assembly01","GCA_001972345.1","-","-","-","-","-","-" -"","Zymoseptoria brevis str. Zb18110 (GCA_000966595)","Capnodiales","1047168","ASM96659v1","GCA_000966595.1","-","-","-","-","","-" -"","Zymoseptoria tritici","Capnodiales","336722","MG2","GCA_000219625.1","","-","-","","","" -"","Zymoseptoria tritici ST99CH_1A5 (GCA_900099495)","Capnodiales","1276529","ZT1A5_complete_assembly","GCA_900099495.1","-","-","-","-","-","-" -"","Zymoseptoria tritici ST99CH_1E4 (GCA_900184115)","Capnodiales","1276532","ST99CH_1E4","GCA_900184115.1","-","-","-","-","-","-" -"","Zymoseptoria tritici ST99CH_3D1 (GCA_900184105)","Capnodiales","1276537","ST99CH_3D1","GCA_900184105.1","-","-","-","-","-","-" -"","Zymoseptoria tritici ST99CH_3D7 (GCA_900091695)","Capnodiales","1276538","Zt_ST99CH_3D7","GCA_900091695.1","-","-","-","-","-","-" -"","[Candida] arabinofermentans NRRL YB-2248 (GCA_001661425)","Saccharomycetales","983967","Canar1","GCA_001661425.1","-","-","-","-","-","-" -"","[Candida] auris (GCA_002759435)","Saccharomycetales","498019","Cand_auris_B8441_V2","GCA_002759435.2","-","-","-","-","-","-" -"","[Candida] auris (GCA_002775015)","Saccharomycetales","498019","Cand_auris_B11221_V1","GCA_002775015.1","-","-","-","-","-","-" -"","[Candida] auris (GCA_003013715)","Saccharomycetales","498019","Cand_auris_B11220","GCA_003013715.1","-","-","-","-","-","-" -"","[Candida] auris (GCA_003014415)","Saccharomycetales","498019","Cand_auris_B11243","GCA_003014415.1","-","-","-","-","-","-" -"","[Candida] auris str. 6684 (GCA_001189475)","Saccharomycetales","498019","ASM118947v1","GCA_001189475.1","-","-","-","-","","-" -"","[Candida] duobushaemulonis str. B09383 (GCA_002926085)","Saccharomycetales","1231522","CanDuoHae_v1.0","GCA_002926085.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_001466525)","Saccharomycetales","5478","ASM146652v1","GCA_001466525.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_001466535)","Saccharomycetales","5478","ASM146653v1","GCA_001466535.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_001466565)","Saccharomycetales","5478","ASM146656v1","GCA_001466565.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_001466575)","Saccharomycetales","5478","ASM146657v1","GCA_001466575.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_001466635)","Saccharomycetales","5478","ASM146663v1","GCA_001466635.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_001466685)","Saccharomycetales","5478","ASM146668v1","GCA_001466685.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_002219185)","Saccharomycetales","5478","ASM221918v1","GCA_002219185.1","-","-","-","-","-","-" -"","[Candida] glabrata (GCA_002219195)","Saccharomycetales","5478","ASM221919v1","GCA_002219195.1","-","-","-","-","-","-" -"","[Candida] glabrata str. CBS138 (GCA_000002545)","Saccharomycetales","5478","ASM254v2","GCA_000002545.2","-","-","-","-","","-" -"","[Candida] haemulonis str. B11899 (GCA_002926055)","Saccharomycetales","45357","CanHae_1.0","GCA_002926055.1","-","-","-","-","-","-" -"","[Candida] intermedia (GCA_900106115)","Saccharomycetales","45354","CBS_141442_assembly","GCA_900106115.1","-","-","-","-","-","-" -"","[Candida] intermedia (GCA_900106125)","Saccharomycetales","45354","PYCC_4715_assembly","GCA_900106125.1","-","-","-","-","-","-" -"","[Candida] pseudohaemulonis str. B12108 (GCA_003013735)","Saccharomycetales","418784","Cand_pseudohaemulonii_B12108","GCA_003013735.1","-","-","-","-","-","-" -"","[Candida] tenuis ATCC 10573 (GCA_000223465)","Saccharomycetales","590646","Candida_tenuis_v1.0","GCA_000223465.1","-","-","-","-","-","-" +"","Name","Classification","Taxon ID","Assembly","Accession","Variation database","Regulation database","Whole genome alignments","Other alignments","In peptide compara","In pan-taxonomic compara" +"","Absidia glauca","Mucoromycotina","4829","AG_v1","GCA_900079185.1","-","-","-","-","-","-" +"","Absidia repens str. NRRL 1336","Mucoromycotina","90262","Absrep1","GCA_002105175.1","-","-","-","-","","-" +"","Acaromyces ingoldii str. MCA 4198 (GCA_003144295)","","215250","Acain1","GCA_003144295.1","-","-","-","-","","-" +"","Acidomyces richmondensis (GCA_001572075)","Acidomyces","245562","ASM157207v1","GCA_001572075.1","-","-","-","-","-","-" +"","Acidomyces richmondensis BFW (GCA_001592465)","Acidomyces","766039","Acidomyces_richmondensis_BFW_v1.0","GCA_001592465.1","-","-","-","-","","-" +"","Acremonium chrysogenum ATCC 11550 (GCA_000769265)","Hypocreales","857340","ASM76926v1","GCA_000769265.1","-","-","-","-","","-" +"","Agaricus bisporus var. burnettii JB137-S8 (GCA_000300555)","Agaricales","597362","Agabi_varbur_1","GCA_000300555.1","-","-","-","-","","-" +"","Allomyces macrogynus ATCC 38327 (GCA_000151295)","Blastocladiales","578462","A_macrogynus_V3","GCA_000151295.1","-","-","-","-","","-" +"","Alternaria alternata str. SRC1lrK2f (GCA_001642055)","Pleosporales","5599","Altal1","GCA_001642055.1","-","-","-","-","","-" +"","Amanita muscaria Koide BX008 (GCA_000827485)","Agaricales","946122","Amanita_muscaria_Koide_BX008_v1.0","GCA_000827485.1","-","-","-","-","","-" +"","Amanita thiersii Skay4041 (GCA_002554575)","Agaricales","703135","Amanita_thiersii_v1.0","GCA_002554575.1","-","-","-","-","","-" +"","Amorphotheca resinae ATCC 22711 (GCA_003019875)","Myxotrichaceae","857342","Amore1","GCA_003019875.1","-","-","-","-","","-" +"","Amphiamblys sp. WSBS2006 (GCA_001875675)","Microsporidia","1866961","ASM187567v1","GCA_001875675.1","-","-","-","-","","-" +"","Anaeromyces robustus str. S4 (GCA_002104895)","","1754192","Anaeromyces_sp._S4_v1.0","GCA_002104895.1","-","-","-","-","","-" +"","Anncaliia algerae PRA109 (GCA_000385855)","Tubulinosematidae","1240240","Annc_alge_PRA109_V4","GCA_000385855.2","-","-","-","-","-","-" +"","Anncaliia algerae PRA339 (GCA_000385875)","Tubulinosematidae","1288291","Annc_alge_insect_USDA_JJB_V2","GCA_000385875.2","-","-","-","-","","-" +"","Anthracocystis flocculosa PF-1 (GCA_000417875)","Ustilaginales","1277687","Pflocc_1.0","GCA_000417875.1","-","-","-","-","","-" +"","Armillaria gallica str. Ar21-2 (GCA_002307695)","Agaricales","47427","Armga1","GCA_002307695.1","-","-","-","-","","-" +"","Armillaria ostoyae (GCA_900157425)","Agaricales","47428","version_2","GCA_900157425.1","-","-","-","-","","-" +"","Armillaria solidipes str. 28-4 (GCA_002307675)","Agaricales","1076256","Armost1","GCA_002307675.1","-","-","-","-","","-" +"","Arthrobotrys oligospora ATCC 24927 (GCA_000225545)","Orbiliales","756982","AOL24927_1.0","GCA_000225545.1","-","-","-","-","","-" +"","Ascochyta rabiei str. ArDII (GCA_001630375)","Pleosporales","5454","AscRab1.0","GCA_001630375.1","-","-","-","-","","-" +"","Ascoidea rubescens DSM 1968 (GCA_001661345)","Saccharomycetales","1344418","Ascru1","GCA_001661345.1","-","-","-","-","","-" +"","Ascosphaera apis ARSEF 7405 (GCA_001636715)","Onygenales","392613","AAP_1.0","GCA_001636715.1","-","-","-","-","","-" +"","Ashbya gossypii","Saccharomycetales","284811","ASM9102v1","GCA_000091025.3","-","","","","","-" +"","Aspergillus aculeatinus CBS 121060 (GCA_003184765)","Eurotiales","1448322","Aspacu1","GCA_003184765.1","-","-","-","-","-","-" +"","Aspergillus aculeatus ATCC 16872 (GCA_001890905)","Eurotiales","690307","Aspac1","GCA_001890905.1","-","-","-","-","-","-" +"","Aspergillus arachidicola str. CBS 117610 (GCA_002749805)","Eurotiales","656916","ASM274980v1","GCA_002749805.1","-","-","-","-","-","-" +"","Aspergillus bombycis str. NRRL26010 (GCA_001792695)","Eurotiales","109264","ASM179269v1","GCA_001792695.1","-","-","-","-","-","-" +"","Aspergillus brasiliensis CBS 101740 (GCA_001889945)","Eurotiales","767769","Aspbr1","GCA_001889945.1","-","-","-","-","-","-" +"","Aspergillus brunneoviolaceus CBS 621.78 (GCA_003184695)","Eurotiales","1450534","Aspbru1","GCA_003184695.1","-","-","-","-","-","-" +"","Aspergillus calidoustus str. SF006504 (GCA_001511075)","Eurotiales","454130","Acal_Allpaths_LG","GCA_001511075.1","-","-","-","-","-","-" +"","Aspergillus campestris IBT 28561 (GCA_002847485)","Eurotiales","1392248","Aspcam1","GCA_002847485.1","-","-","-","-","-","-" +"","Aspergillus candidus str. CBS 102.13 (GCA_002847045)","Eurotiales","41067","Aspcand1","GCA_002847045.1","-","-","-","-","-","-" +"","Aspergillus carbonarius ITEM 5010 (GCA_001990825)","Eurotiales","602072","Aspca3","GCA_001990825.1","-","-","-","-","-","-" +"","Aspergillus clavatus NRRL 1","Eurotiales","344612","ASM271v1","GCA_000002715.1","-","-","-","-","","-" +"","Aspergillus cristatus str. GZAAS20.1005 (GCA_001717485)","Eurotiales","573508","ASM171748v1","GCA_001717485.1","-","-","-","-","-","-" +"","Aspergillus ellipticus CBS 707.79 (GCA_003184645)","Eurotiales","1448320","Aspell1","GCA_003184645.1","-","-","-","-","-","-" +"","Aspergillus eucalypticola CBS 122712 (GCA_003184535)","Eurotiales","1448314","Aspeuc1","GCA_003184535.1","-","-","-","-","-","-" +"","Aspergillus fischeri NRRL 181","Eurotiales","331117","ASM14964v1","GCA_000149645.2","-","-","-","-","","-" +"","Aspergillus flavus AF70 (GCA_000952835)","Eurotiales","1392242","ASM95283v1","GCA_000952835.1","-","-","-","-","-","-" +"","Aspergillus flavus NRRL3357","Eurotiales","332952","JCVI-afl1-v2.0","GCA_000006275.2","-","-","-","-","","-" +"","Aspergillus fumigatus (GCA_002234985)","Eurotiales","746128","ASM223498v1","GCA_002234985.1","-","-","-","-","","-" +"","Aspergillus fumigatus A1163","Eurotiales","451804","ASM15014v1","GCA_000150145.1","-","-","-","-","-","-" +"","Aspergillus fumigatus Af293","Eurotiales","330879","ASM265v1","GCA_000002655.1","-","-","-","-","-","-" +"","Aspergillus fumigatus Z5 (GCA_001029325)","Eurotiales","1437362","ASM102932v1","GCA_001029325.1","-","-","-","-","-","-" +"","Aspergillus fumigatus var. RP-2014 (GCA_000731615)","Eurotiales","1476192","AspFumNiv1.0","GCA_000731615.1","-","-","-","-","-","-" +"","Aspergillus glaucus CBS 516.65 (GCA_001890805)","Eurotiales","1160497","Aspgl1","GCA_001890805.1","-","-","-","-","-","-" +"","Aspergillus heteromorphus CBS 117.55 (GCA_003184545)","Eurotiales","1448321","Asphet1","GCA_003184545.1","-","-","-","-","-","-" +"","Aspergillus indologenus CBS 114.80 (GCA_003184685)","Eurotiales","1450541","Aspind1","GCA_003184685.1","-","-","-","-","-","-" +"","Aspergillus japonicus CBS 114.51 (GCA_003184785)","Eurotiales","1448312","Aspjap1","GCA_003184785.1","-","-","-","-","-","-" +"","Aspergillus lacticoffeatus CBS 101883 (GCA_003184595)","Eurotiales","1450533","Asplac1","GCA_003184595.1","-","-","-","-","-","-" +"","Aspergillus lentulus (GCA_001445615)","Eurotiales","293939","Alt_assembly01","GCA_001445615.1","-","-","-","-","-","-" +"","Aspergillus luchuensis CBS 106.47 (GCA_001890685)","Eurotiales","1137211","Aspfo1","GCA_001890685.1","-","-","-","-","-","-" +"","Aspergillus luchuensis str. RIB 2604 (GCA_001602395)","Eurotiales","1069201","AspL_2604","GCA_001602395.1","-","-","-","-","-","-" +"","Aspergillus neoniger CBS 115656 (GCA_003184625)","Eurotiales","1448310","Aspneo1","GCA_003184625.1","-","-","-","-","-","-" +"","Aspergillus nidulans","Eurotiales","227321","ASM1142v1","GCA_000011425.1","-","-","-","-","","" +"","Aspergillus nidulans FGSC A4 (GCA_000149205)","Eurotiales","227321","ASM14920v2","GCA_000149205.2","-","-","-","-","-","-" +"","Aspergillus niger","Eurotiales","5061","ASM285v2","GCA_000002855.2","-","-","-","","","-" +"","Aspergillus niger (GCA_001515345)","Eurotiales","5061","ASM151534v1","GCA_001515345.1","-","-","-","-","-","-" +"","Aspergillus niger (GCA_900248155)","Eurotiales","5061","Aniger_ATCC_64974_N402","GCA_900248155.1","-","-","-","-","-","-" +"","Aspergillus niger ATCC 1015 (GCA_000230395)","Eurotiales","380704","ASPNI_v3.0","GCA_000230395.2","-","-","-","-","-","-" +"","Aspergillus nomius NRRL 13137 (GCA_001204775)","Eurotiales","1509407","ASM120477v1","GCA_001204775.1","-","-","-","-","-","-" +"","Aspergillus novofumigatus IBT 16806 (GCA_002847465)","Eurotiales","1392255","Aspnov1","GCA_002847465.1","-","-","-","-","-","-" +"","Aspergillus ochraceoroseus IBT 24754 (GCA_002846915)","Eurotiales","1392256","Aspergillus_ochraceoroseus_IBT_24754_v1.1","GCA_002846915.2","-","-","-","-","-","-" +"","Aspergillus ochraceoroseus str. SRRC1432 (GCA_000986665)","Eurotiales","138278","ASM98666v1","GCA_000986665.1","-","-","-","-","-","-" +"","Aspergillus oryzae 100-8 (GCA_000691885)","Eurotiales","1197718","Aspergillus_oryzae_100-8","GCA_000691885.1","-","-","-","-","-","-" +"","Aspergillus oryzae 3.042 (GCA_000269785)","Eurotiales","1160506","AspOry3042","GCA_000269785.2","-","-","-","-","-","-" +"","Aspergillus oryzae RIB40","Eurotiales","510516","ASM18445v3","GCA_000184455.3","-","-","-","-","","-" +"","Aspergillus oryzae str. BCC7051 (GCA_002007945)","Eurotiales","5062","ASM200794v1","GCA_002007945.1","-","-","-","-","-","-" +"","Aspergillus parasiticus SU-1 (GCA_000956085)","Eurotiales","1403190","ASM95608v1","GCA_000956085.1","-","-","-","-","-","-" +"","Aspergillus piperis CBS 112811 (GCA_003184755)","Eurotiales","1448313","Asppip1","GCA_003184755.1","-","-","-","-","-","-" +"","Aspergillus rambellii str. SRRC1468 (GCA_000986645)","Eurotiales","308745","ASM98664v1","GCA_000986645.1","-","-","-","-","-","-" +"","Aspergillus ruber CBS 135680 (GCA_000600275)","Eurotiales","1388766","Eurhe1","GCA_000600275.1","-","-","-","-","-","-" +"","Aspergillus saccharolyticus JOP 1030-1 (GCA_003184585)","Eurotiales","1450539","Aspsac1","GCA_003184585.1","-","-","-","-","-","-" +"","Aspergillus sclerotiicarbonarius CBS 121057 (GCA_003184635)","Eurotiales","1448318","Aspscle1","GCA_003184635.1","-","-","-","-","-","-" +"","Aspergillus sclerotioniger CBS 115572 (GCA_003184525)","Eurotiales","1450535","Aspscl1","GCA_003184525.1","-","-","-","-","-","-" +"","Aspergillus steynii IBT 23096 (GCA_002849105)","Eurotiales","1392250","Aspste1","GCA_002849105.1","-","-","-","-","-","-" +"","Aspergillus sydowii CBS 593.65 (GCA_001890705)","Eurotiales","1036612","Aspsy1","GCA_001890705.1","-","-","-","-","-","-" +"","Aspergillus taichungensis str. IBT 19404 (GCA_002850765)","Eurotiales","482145","Asptaic1","GCA_002850765.1","-","-","-","-","-","-" +"","Aspergillus terreus NIH2624","Eurotiales","341663","ASM14961v1","GCA_000149615.1","-","-","-","-","","-" +"","Aspergillus thermomutatus (GCA_002237265)","Eurotiales","41047","ASM223726v1","GCA_002237265.1","-","-","-","-","-","-" +"","Aspergillus tubingensis CBS 134.48 (GCA_001890745)","Eurotiales","767770","Asptu1","GCA_001890745.1","-","-","-","-","-","-" +"","Aspergillus turcosus (GCA_002234965)","Eurotiales","1245748","ASM223496v1","GCA_002234965.1","-","-","-","-","-","-" +"","Aspergillus turcosus (GCA_002234975)","Eurotiales","1245748","ASM223497v1","GCA_002234975.1","-","-","-","-","-","-" +"","Aspergillus udagawae str. IFM 46973 (GCA_001078395)","Eurotiales","91492","Aud_assembly01","GCA_001078395.1","-","-","-","-","-","-" +"","Aspergillus ustus str. 3.3904 (GCA_000812125)","Eurotiales","40382","Austus1.0","GCA_000812125.1","-","-","-","-","-","-" +"","Aspergillus uvarum CBS 121591 (GCA_003184745)","Eurotiales","1448315","Aspuva1","GCA_003184745.1","-","-","-","-","-","-" +"","Aspergillus vadensis CBS 113365 (GCA_003184925)","Eurotiales","1448311","Aspvad1","GCA_003184925.1","-","-","-","-","-","-" +"","Aspergillus versicolor CBS 583.65 (GCA_001890125)","Eurotiales","1036611","Aspve1","GCA_001890125.1","-","-","-","-","-","-" +"","Aspergillus violaceofuscus CBS 115571 (GCA_003184705)","Eurotiales","1450538","Aspvio1","GCA_003184705.1","-","-","-","-","-","-" +"","Aspergillus wentii DTO 134E9 (GCA_001890725)","Eurotiales","1073089","Aspwe1","GCA_001890725.1","-","-","-","-","-","-" +"","Aureobasidium melanogenum CBS 110374 (GCA_000721775)","Dothideales","1043003","Aureobasidium_pullulans_var._melanogenum_CBS_110374_v1.0","GCA_000721775.1","-","-","-","-","","-" +"","Aureobasidium namibiae CBS 147.97 (GCA_000721765)","Dothideales","1043004","Aureobasidium_pullulans_var._namibiae_CBS_147.97_v1.0","GCA_000721765.1","-","-","-","-","","-" +"","Aureobasidium pullulans (GCA_001678115)","Dothideales","5580","ASM167811v1","GCA_001678115.1","-","-","-","-","-","-" +"","Aureobasidium pullulans EXF-150 (GCA_000721785)","Dothideales","1043002","Aureobasidium_pullulans_var._pullulans_EXF-150_assembly_version_1.0","GCA_000721785.1","-","-","-","-","","-" +"","Aureobasidium subglaciale EXF-2481 (GCA_000721755)","Dothideales","1043005","Aureobasidium_pullulans_var._subglaciale_EXF-2481_v1.0","GCA_000721755.1","-","-","-","-","","-" +"","Babjeviella inositovora NRRL Y-12698 (GCA_001661335)","Saccharomycetales","984486","Babin1","GCA_001661335.1","-","-","-","-","","-" +"","Basidiobolus meristosporus CBS 931.73 (GCA_002104905)","","1314790","Basme2finSC","GCA_002104905.1","-","-","-","-","","-" +"","Batrachochytrium dendrobatidis JAM81 (GCA_000203795)","Rhizophydiales","684364","v1.0","GCA_000203795.1","-","-","-","-","-","-" +"","Batrachochytrium dendrobatidis JEL423 (GCA_000149865)","Rhizophydiales","403673","BD_JEL423","GCA_000149865.1","-","-","-","-","","-" +"","Batrachochytrium salamandrivorans str. BS (GCA_002006685)","Rhizophydiales","1357716","Batr_sala_BS_V1","GCA_002006685.1","-","-","-","-","","-" +"","Baudoinia panamericana UAMH 10762 (GCA_000338955)","Capnodiales","717646","Bauco1","GCA_000338955.1","-","-","-","-","","-" +"","Beauveria bassiana","Hypocreales","176275","ASM168263v1","GCA_001682635.1","-","-","-","","","-" +"","Beauveria bassiana ARSEF 2860 (GCA_000280675)","Hypocreales","655819","ASM28067v1","GCA_000280675.1","-","-","-","-","-","-" +"","Beauveria bassiana D1-5 (GCA_000770705)","Hypocreales","1245745","BBA1.0","GCA_000770705.1","-","-","-","-","-","-" +"","Beauveria bassiana str. JEF-007 (GCA_002871155)","Hypocreales","176275","ASM287115v1","GCA_002871155.1","-","-","-","-","-","-" +"","Bifiguratus adelaidae str. AZ0501","Mucoromycotina","1938954","ASM226119v1","GCA_002261195.1","-","-","-","-","","-" +"","Bipolaris maydis ATCC 48331 (GCA_000354255)","Pleosporales","665024","CocheC4_1","GCA_000354255.1","-","-","-","-","-","-" +"","Bipolaris maydis C5 (GCA_000338975)","Pleosporales","701091","CocheC5_3","GCA_000338975.1","-","-","-","-","","-" +"","Bipolaris oryzae ATCC 44560 (GCA_000523455)","Pleosporales","930090","Cochliobolus_miyabeanus_v1.0","GCA_000523455.1","-","-","-","-","","-" +"","Bipolaris sorokiniana ND90Pr (GCA_000338995)","Pleosporales","665912","Cocsa1","GCA_000338995.1","-","-","-","-","","-" +"","Bipolaris victoriae FI3 (GCA_000527765)","Pleosporales","930091","Cochliobolus_victoriae_v1.0","GCA_000527765.1","-","-","-","-","","-" +"","Bipolaris zeicola 26-R-13 (GCA_000523435)","Pleosporales","930089","Cochliobolus_carbonum_v1.0","GCA_000523435.1","-","-","-","-","","-" +"","Blastomyces dermatitidis ATCC 18188 (GCA_000151595)","Onygenales","653446","BD_ATCC18188_V1","GCA_000151595.1","-","-","-","-","-","-" +"","Blastomyces dermatitidis ATCC 26199 (GCA_000166155)","Onygenales","447095","BD_ATCC26199_V2","GCA_000166155.1","-","-","-","-","-","-" +"","Blastomyces dermatitidis ER-3 (GCA_000003525)","Onygenales","559297","BD_ER3_V1","GCA_000003525.2","-","-","-","-","","-" +"","Blastomyces gilchristii SLH14081 (GCA_000003855)","Onygenales","559298","BD_SLH14081_V1","GCA_000003855.2","-","-","-","-","","-" +"","Blastomyces percursus str. EI222 (GCA_001883805)","Onygenales","1658174","Blas_perc_EI222_V1","GCA_001883805.1","-","-","-","-","","-" +"","Blumeria graminis","Erysiphales","546991","EF2","GCA_000151065.2","-","-","-","","","-" +"","Blumeria graminis f. sp. tritici 96224 (GCA_000418435)","Erysiphales","1268274","Bgt_454_newbler_assembly","GCA_000418435.1","-","-","-","-","-","-" +"","Botryobasidium botryosum FD-172 SS1 (GCA_000697705)","Cantharellales","930990","Botbo1","GCA_000697705.1","-","-","-","-","","-" +"","Botrytis cinerea B05.10","Sclerotiniaceae","332648","ASM83294v1","GCA_000143535.4","-","-","-","","","-" +"","Botrytis cinerea BcDW1 (GCA_000349525)","Sclerotiniaceae","1290391","BcDW1","GCA_000349525.1","-","-","-","-","-","-" +"","Botrytis cinerea T4 (GCA_000227075)","Sclerotiniaceae","999810","BotFuc_Mar2011","GCA_000227075.1","-","-","-","-","-","-" +"","Brettanomyces bruxellensis AWRI1499 (GCA_000259595)","Saccharomycetales","1124627","AWRI1499_v1.0","GCA_000259595.1","-","-","-","-","","-" +"","Byssochlamys spectabilis No. 5 str. Paecilomyces variotii No. 5 (NBRC109023) (GCA_000497085)","Eurotiales","1356009","PVAR5_assembly01","GCA_000497085.1","-","-","-","-","","-" +"","Cadophora sp. DSE1049 (GCA_003073865)","Helotiales","1485229","Cadsp1","GCA_003073865.1","-","-","-","-","","-" +"","Calocera cornea HHB12733 (GCA_001632435)","Dacrymycetales","1353952","Calco1","GCA_001632435.1","-","-","-","-","","-" +"","Calocera viscosa TUFC12733 (GCA_001630345)","Dacrymycetales","1330018","Calvi1","GCA_001630345.1","-","-","-","-","","-" +"","Candida albicans 12C (GCA_000773845)","Saccharomycetales","1094981","Cand_albi_12C_V2","GCA_000773845.1","-","-","-","-","-","-" +"","Candida albicans 19F (GCA_000775445)","Saccharomycetales","1094987","Cand_albi_19F_V2","GCA_000775445.1","-","-","-","-","-","-" +"","Candida albicans Ca6 (GCA_000784695)","Saccharomycetales","1165368","Cand_albi_Ca6_V2","GCA_000784695.1","-","-","-","-","-","-" +"","Candida albicans GC75 (GCA_000773735)","Saccharomycetales","1094988","Cand_albi_GC75_V1","GCA_000773735.1","-","-","-","-","-","-" +"","Candida albicans L26 (GCA_000775455)","Saccharomycetales","1094982","Cand_albi_L26_V2","GCA_000775455.1","-","-","-","-","-","-" +"","Candida albicans P34048 (GCA_000775465)","Saccharomycetales","1094991","Cand_albi_P34048_V1","GCA_000775465.1","-","-","-","-","-","-" +"","Candida albicans P37005 (GCA_000773745)","Saccharomycetales","1094985","Cand_albi_P37005_V2","GCA_000773745.1","-","-","-","-","-","-" +"","Candida albicans P37037 (GCA_000773825)","Saccharomycetales","1094992","Cand_albi_P37037_V1","GCA_000773825.1","-","-","-","-","-","-" +"","Candida albicans P37039 (GCA_000784515)","Saccharomycetales","1094993","Cand_albi_P37039_V1","GCA_000784515.1","-","-","-","-","-","-" +"","Candida albicans P57055 (GCA_000775505)","Saccharomycetales","1094996","Cand_albi_P57055_V1","GCA_000775505.1","-","-","-","-","-","-" +"","Candida albicans P57072 (GCA_000773805)","Saccharomycetales","1094990","Cand_albi_P57072_V1","GCA_000773805.1","-","-","-","-","-","-" +"","Candida albicans P60002 (GCA_000784525)","Saccharomycetales","1094986","Cand_albi_P60002_V1","GCA_000784525.1","-","-","-","-","-","-" +"","Candida albicans P75010 (GCA_000784575)","Saccharomycetales","1094994","Cand_albi_P75010_V1","GCA_000784575.1","-","-","-","-","-","-" +"","Candida albicans P75016 (GCA_000784595)","Saccharomycetales","1094995","Cand_albi_P75016_V1","GCA_000784595.1","-","-","-","-","-","-" +"","Candida albicans P75063 (GCA_000775525)","Saccharomycetales","1094997","Cand_albi_P75063_V1","GCA_000775525.1","-","-","-","-","-","-" +"","Candida albicans P76055 (GCA_000784505)","Saccharomycetales","1094998","Cand_albi_P76055_V1","GCA_000784505.1","-","-","-","-","-","-" +"","Candida albicans P76067 (GCA_000784495)","Saccharomycetales","1094999","Cand_albi_P76067_V1","GCA_000784495.1","-","-","-","-","-","-" +"","Candida albicans P78042 (GCA_000784615)","Saccharomycetales","1095000","Cand_albi_P78042_V1","GCA_000784615.1","-","-","-","-","-","-" +"","Candida albicans P78048 (GCA_000773725)","Saccharomycetales","1094989","Cand_albi_P78048_V1","GCA_000773725.1","-","-","-","-","-","-" +"","Candida albicans P87 (GCA_000774085)","Saccharomycetales","1094984","Cand_albi_P87_V2","GCA_000774085.1","-","-","-","-","-","-" +"","Candida albicans P94015 (GCA_000773755)","Saccharomycetales","1094983","Cand_albi_P94015_V1","GCA_000773755.1","-","-","-","-","-","-" +"","Candida albicans SC5314 (GCA_000784635)","Saccharomycetales","237561","Cand_albi_SC5314_V4","GCA_000784635.1","-","-","-","-","","-" +"","Candida albicans SC5314 (GCA_000784655)","Saccharomycetales","237561","Cand_albi_SC5314_V3","GCA_000784655.1","-","-","-","-","-","-" +"","Candida albicans WO-1 (GCA_000149445)","Saccharomycetales","294748","ASM14944v2","GCA_000149445.2","-","-","-","-","-","-" +"","Candida dubliniensis CD36 (GCA_000026945)","Saccharomycetales","573826","ASM2694v1","GCA_000026945.1","-","-","-","-","-","-" +"","Candida maltosa Xu316 (GCA_000344705)","Saccharomycetales","1245528","Cmaltosa_v01","GCA_000344705.1","-","-","-","-","-","-" +"","Candida orthopsilosis Co 90-125 (GCA_000315875)","Saccharomycetales","1136231","ASM31587v1","GCA_000315875.1","-","-","-","-","-","-" +"","Candida parapsilosis str. CDC317 (GCA_000182765)","Saccharomycetales","5480","ASM18276v2","GCA_000182765.2","-","-","-","-","","-" +"","Candida tropicalis MYA-3404 (GCA_000006335)","Saccharomycetales","294747","ASM633v3","GCA_000006335.3","-","-","-","-","","-" +"","Capronia coronata CBS 617.96 (GCA_000585585)","Chaetothyriomycetidae","1182541","Capr_coro_CBS_617_96_V1","GCA_000585585.1","-","-","-","-","","-" +"","Capronia epimyces CBS 606.96 (GCA_000585565)","Chaetothyriomycetidae","1182542","Capr_epim_CBS_606_96_V1","GCA_000585565.1","-","-","-","-","","-" +"","Catenaria anguillulae PL171 (GCA_002102555)","Blastocladiales","765915","Catan2","GCA_002102555.1","-","-","-","-","","-" +"","Ceraceosorus bombacis (GCA_900000165)","","401625","Ceraceosorus_bombacis","GCA_900000165.1","-","-","-","-","-","-" +"","Ceraceosorus guamensis str. MCA 4658 (GCA_003144195)","","1522189","Cersp1","GCA_003144195.1","-","-","-","-","","-" +"","Ceratocystis platani str. CFO (GCA_000978885)","Microascales","88771","ASM97888v1","GCA_000978885.1","-","-","-","-","","-" +"","Cercospora berteroae (GCA_002933655)","Capnodiales","357750","Cbert_1","GCA_002933655.1","-","-","-","-","","-" +"","Cercospora beticola (GCA_002742065)","Capnodiales","122368","CB0940_V2","GCA_002742065.1","-","-","-","-","","-" +"","Cercospora zeina str. CMW25467 (GCA_002844615)","Capnodiales","348901","ASM284461v1","GCA_002844615.1","-","-","-","-","","-" +"","Chaetomium globosum CBS 148.51 (GCA_000143365)","Sordariales","306901","ASM14336v1","GCA_000143365.1","-","-","-","-","","-" +"","Chaetomium thermophilum var. thermophilum DSM 1495 (GCA_000221225)","Sordariales","759272","CTHT_3.0","GCA_000221225.1","-","-","-","-","","-" +"","Choanephora cucurbitarum str. KUS-F28377 (GCA_001683725)","Mucoromycotina","101091","ASM168372v1","GCA_001683725.1","-","-","-","-","","-" +"","Cladophialophora bantiana CBS 173.52 (GCA_000835475)","Chaetothyriomycetidae","1442370","Clad_bant_CBS_173_52_V1","GCA_000835475.1","-","-","-","-","","-" +"","Cladophialophora carrionii CBS 160.54 (GCA_000365165)","Chaetothyriomycetidae","1279043","Clad_carr_CBS_160_54_V1","GCA_000365165.2","-","-","-","-","-","-" +"","Cladophialophora carrionii str. KSF (GCA_001700775)","Chaetothyriomycetidae","86049","ASM170077v1","GCA_001700775.1","-","-","-","-","","-" +"","Cladophialophora immunda str. CBS 83496 (GCA_000835495)","Chaetothyriomycetidae","569365","Clad_immu_CBS83496_V1","GCA_000835495.1","-","-","-","-","","-" +"","Cladophialophora psammophila CBS 110553 (GCA_000585535)","Chaetothyriomycetidae","1182543","Clad_psam_CBS_110553_V1","GCA_000585535.1","-","-","-","-","","-" +"","Cladophialophora yegresii CBS 114405 (GCA_000585515)","Chaetothyriomycetidae","1182544","Clad_yegr_CBS_114405_V1","GCA_000585515.1","-","-","-","-","","-" +"","Claviceps purpurea 20.1 (GCA_000347355)","Hypocreales","1111077","ASM34735v1","GCA_000347355.1","-","-","-","-","","-" +"","Clavispora lusitaniae ATCC 42720 (GCA_000003835)","Saccharomycetales","306902","ASM383v1","GCA_000003835.1","-","-","-","-","","-" +"","Clavispora lusitaniae str. CBS 6936 (GCA_001673695)","Saccharomycetales","36911","ASM167369v2","GCA_001673695.2","-","-","-","-","-","-" +"","Clohesyomyces aquaticus str. CBS 115471 (GCA_002105025)","Pleosporales","1231657","Cloaq1","GCA_002105025.1","-","-","-","-","","-" +"","Coccidioides immitis H538.4 (GCA_000149815)","Onygenales","396776","ASM14981v1","GCA_000149815.1","-","-","-","-","","-" +"","Coccidioides immitis RMSCC 2394 (GCA_000149895)","Onygenales","404692","ASM14989v1","GCA_000149895.1","-","-","-","-","-","-" +"","Coccidioides immitis RMSCC 3703 (GCA_000150085)","Onygenales","454286","ASM15008v1","GCA_000150085.1","-","-","-","-","-","-" +"","Coccidioides immitis RS (GCA_000149335)","Onygenales","246410","ASM14933v2","GCA_000149335.2","-","-","-","-","-","-" +"","Coccidioides posadasii C735 delta SOWgp (GCA_000151335)","Onygenales","222929","JCVI-cpa1-1.0","GCA_000151335.1","-","-","-","-","-","-" +"","Coccidioides posadasii RMSCC 3488 (GCA_000150055)","Onygenales","454284","ASM15005v1","GCA_000150055.1","-","-","-","-","-","-" +"","Coccidioides posadasii str. Silveira (GCA_000170175)","Onygenales","443226","CPS2","GCA_000170175.2","-","-","-","-","","-" +"","Colletotrichum chlorophyti str. NTL11 (GCA_001937105)","Glomerellales","708187","ASM193710v1","GCA_001937105.1","-","-","-","-","-","-" +"","Colletotrichum fioriniae PJ7 (GCA_000582985)","Glomerellales","1445577","CFIO01","GCA_000582985.1","-","-","-","-","-","-" +"","Colletotrichum gloeosporioides","Glomerellales","1213859","GCA_000319635.1","GCA_000319635.1","-","-","-","","","-" +"","Colletotrichum gloeosporioides Cg-14 (GCA_000446055)","Glomerellales","1237896","Colletotrichum_gloeosporioides1","GCA_000446055.1","-","-","-","-","-","-" +"","Colletotrichum graminicola","Glomerellales","645133","C_graminicola_M1_001_V1","GCA_000149035.1","-","-","-","","","-" +"","Colletotrichum higginsianum","Glomerellales","80884","GCA_000313795.2","GCA_000313795.2","-","-","-","","","-" +"","Colletotrichum higginsianum IMI 349063 (GCA_001672515)","Glomerellales","759273","ASM167251v1","GCA_001672515.1","-","-","-","-","-","-" +"","Colletotrichum incanum str. MAFF 238704 (GCA_001625285)","Glomerellales","1573173","Ci238704v1","GCA_001625285.1","-","-","-","-","-","-" +"","Colletotrichum incanum str. MAFF238712 (GCA_001855235)","Glomerellales","1573173","ASM185523v1","GCA_001855235.1","-","-","-","-","-","-" +"","Colletotrichum nymphaeae SA-01 (GCA_001563115)","Glomerellales","1460502","CNYM01","GCA_001563115.1","-","-","-","-","-","-" +"","Colletotrichum orbiculare","Glomerellales","1213857","GCA_000350065.1","GCA_000350065.1","-","-","-","","","-" +"","Colletotrichum orchidophilum str. IMI 309357 (GCA_001831195)","Glomerellales","1209926","CORC01","GCA_001831195.1","-","-","-","-","-","-" +"","Colletotrichum salicis str. CBS 607.94 (GCA_001563125)","Glomerellales","1209931","CSAL01","GCA_001563125.1","-","-","-","-","-","-" +"","Colletotrichum simmondsii str. CBS122122 (GCA_001563135)","Glomerellales","703756","CSIM01","GCA_001563135.1","-","-","-","-","-","-" +"","Colletotrichum sublineola str. TX430BB (GCA_000696135)","Glomerellales","1173701","ASM69613v1","GCA_000696135.1","-","-","-","-","-","-" +"","Colletotrichum tofieldiae str. 0861 (GCA_001625265)","Glomerellales","708197","Ct0861v1","GCA_001625265.1","-","-","-","-","-","-" +"","Conidiobolus coronatus NRRL 28638 (GCA_001566745)","","796925","Conidiobolus_coronatus_NRRL28638","GCA_001566745.1","-","-","-","-","","-" +"","Coniella lustricola str. B22-T-1 (GCA_003019895)","Sordariomycetidae","2025994","Coniella_lustricola_v1.0","GCA_003019895.1","-","-","-","-","","-" +"","Coniochaeta ligniaria NRRL 30616 (GCA_001879275)","Sordariomycetidae","1408157","Conlig_v1.0","GCA_001879275.1","-","-","-","-","","-" +"","Coniophora puteana RWD-64-598 SS2 (GCA_000271625)","Boletales","741705","Conpu1","GCA_000271625.1","-","-","-","-","","-" +"","Coniosporium apollinis CBS 100218 str. CBS 352.97 (GCA_000281105)","","1168221","Coni_apol_CBS100218__V1","GCA_000281105.1","-","-","-","-","","-" +"","Coprinopsis cinerea okayama7#130 (GCA_000182895)","Agaricales","240176","CC3","GCA_000182895.1","-","-","-","-","","-" +"","Cordyceps brongniartii RCEF 3172 (GCA_001636735)","Hypocreales","1081107","BBO_1.0","GCA_001636735.1","-","-","-","-","","-" +"","Cordyceps confragosa RCEF 1005 (GCA_001636795)","Hypocreales","1081108","LEL_1.0","GCA_001636795.1","-","-","-","-","","-" +"","Cordyceps confragosa str. UM487 (GCA_001653215)","Hypocreales","1105325","ASM165321v1","GCA_001653215.1","-","-","-","-","-","-" +"","Cordyceps fumosorosea ARSEF 2679 (GCA_001636725)","Hypocreales","1081104","ISF_1.0","GCA_001636725.1","-","-","-","-","","-" +"","Cordyceps militaris CM01 (GCA_000225605)","Hypocreales","983644","CmilitarisCM01_v01","GCA_000225605.1","-","-","-","-","","-" +"","Cordyceps sp. RAO-2017 (GCA_002591385)","Hypocreales","2004951","Hirsu2","GCA_002591385.1","-","-","-","-","","-" +"","Corynespora cassiicola Philippines (GCA_003016335)","Pleosporales","1448308","Corynespora_cassiicola_v1.0","GCA_003016335.1","-","-","-","-","","-" +"","Cryptococcus amylolentus CBS 6039 (GCA_001720205)","Tremellales","1295533","Cryp_amyl_CBS6039_V3","GCA_001720205.1","-","-","-","-","","-" +"","Cryptococcus amylolentus CBS 6273 (GCA_001720235)","Tremellales","1296118","Cryp_amyl_CBS6273_V2","GCA_001720235.1","-","-","-","-","-","-" +"","Cryptococcus depauperatus CBS 7841 (GCA_001720195)","Tremellales","1295531","Filo_depa_CBS7841_V1","GCA_001720195.1","-","-","-","-","","-" +"","Cryptococcus depauperatus CBS 7855 (GCA_001720245)","Tremellales","1295532","Filo_depa_CBS7855_V2","GCA_001720245.1","-","-","-","-","-","-" +"","Cryptococcus gattii CA1280 (GCA_000836335)","Tremellales","1296109","Cryp_gatt_CA1280_V1","GCA_000836335.1","-","-","-","-","-","-" +"","Cryptococcus gattii CA1873 (GCA_000855695)","Tremellales","1296111","Cryp_gatt_CA1873_V1","GCA_000855695.1","-","-","-","-","-","-" +"","Cryptococcus gattii E566 (GCA_000875815)","Tremellales","1296102","Cryp_gatt_E566_V1","GCA_000875815.1","-","-","-","-","-","-" +"","Cryptococcus gattii EJB2 (GCA_000835745)","Tremellales","1296103","Cryp_gatt_EJB2_V1","GCA_000835745.1","-","-","-","-","-","-" +"","Cryptococcus gattii NT-10 (GCA_000935105)","Tremellales","1296108","Cryp_gatt_NT-10_V1","GCA_000935105.1","-","-","-","-","-","-" +"","Cryptococcus gattii Ru294 (GCA_000836355)","Tremellales","1296112","Cryp_gatt_Ru294_V1","GCA_000836355.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII 2001/935-1 (GCA_000835815)","Tremellales","1334442","Cryp_gatt_2001_935-1_V1","GCA_000835815.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII 99/473 (GCA_000836455)","Tremellales","1296104","Cryp_gatt_99_473_V1","GCA_000836455.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII CA1014 (GCA_000875795)","Tremellales","1296107","Cryp_gatt_CA1014_V1","GCA_000875795.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII CBS 10090 (GCA_000835765)","Tremellales","1296101","Cryp_gatt_CBS10090_V1","GCA_000835765.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII LA55 (GCA_000836315)","Tremellales","1296106","Cryp_gatt_LA55_V1","GCA_000836315.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII MMRL2647 (GCA_000875855)","Tremellales","1296117","Cryp_gatt_MMRL2647_V2","GCA_000875855.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGII R265 (GCA_000149475)","Tremellales","294750","CNB2","GCA_000149475.3","-","-","-","-","-","-" +"","Cryptococcus gattii VGII Ram5 (GCA_000836375)","Tremellales","1296110","Cryp_gatt_Ram5_V1","GCA_000836375.1","-","-","-","-","-","-" +"","Cryptococcus gattii VGIV IND107 (GCA_000835755)","Tremellales","1296105","Cryp_gatt_IND107_V2","GCA_000835755.1","-","-","-","-","-","-" +"","Cryptococcus gattii WM276 (GCA_000185945)","Tremellales","367775","ASM18594v1","GCA_000185945.1","-","-","-","-","","-" +"","Cryptococcus neoformans var. grubii 125.91 (GCA_002215885)","Tremellales","1230079","Cryp_neof_125_91_V1","GCA_002215885.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii A1-35-8 (GCA_002221985)","Tremellales","1230081","Cryp_neof_grubii_A1-35-8_V1","GCA_002221985.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii A2-102-5 (GCA_002222375)","Tremellales","1230057","Cryp_neof_A2_102_5_V1","GCA_002222375.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii A5-35-17 (GCA_002222215)","Tremellales","1230080","Cryp_neof_grubii_A5-35-17_V1","GCA_002222215.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii AD1-7a (GCA_002220445)","Tremellales","1230056","Cryp_neof_AD1_7a_V1","GCA_002220445.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii AD1-83a (GCA_002215765)","Tremellales","1230065","Cryp_neof_AD1_83a_V1","GCA_002215765.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii AD2-60a (GCA_002215775)","Tremellales","1230059","Cryp_neof_AD2_60a_V1","GCA_002215775.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Br795 (GCA_002222225)","Tremellales","1230061","Cryp_neof_Br795_V1","GCA_002222225.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Bt1 (GCA_002215705)","Tremellales","1230073","Cryp_neof_Bt1_V1","GCA_002215705.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Bt120 (GCA_002222465)","Tremellales","1230070","Cryp_neof_Bt120_V1","GCA_002222465.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Bt15 (GCA_002222335)","Tremellales","1230071","Cryp_neof_Bt15_V1","GCA_002222335.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Bt63 (GCA_002234625)","Tremellales","1230075","Cryp_neof_Bt63_V1","GCA_002234625.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Bt85 (GCA_002215835)","Tremellales","1230076","Cryp_neof_Bt85_V1","GCA_002215835.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii C23 (GCA_002215825)","Tremellales","1230055","Cryp_neof_C23_V1","GCA_002215825.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii CHC193 (GCA_002222295)","Tremellales","1230064","Cryp_neof_CHC193_V1","GCA_002222295.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii D17-1 (GCA_002222255)","Tremellales","1230058","Cryp_neof_D17_1_V1","GCA_002222255.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Gb118 (GCA_002224005)","Tremellales","1230060","Cryp_neof_Gb118_V1","GCA_002224005.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii H99 (GCA_000149245)","Tremellales","235443","CNA3","GCA_000149245.3","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii MW-RSA1955 (GCA_002222455)","Tremellales","1230066","Cryp_neof_MW_RSA1955_V1","GCA_002222455.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii MW-RSA36 (GCA_002222395)","Tremellales","1230062","Cryp_neof_MW_RSA36_V1","GCA_002222395.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii MW-RSA852 (GCA_002220035)","Tremellales","1230069","Cryp_neof_MW_RSA852_V1","GCA_002220035.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Th84 (GCA_002222315)","Tremellales","1230067","Cryp_neof_Th84_V1","GCA_002222315.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Tu259-1 (GCA_002222325)","Tremellales","1230072","Cryp_neof_Tu259_1_V1","GCA_002222325.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Tu401-1 (GCA_002222475)","Tremellales","1230077","Cryp_neof_Tu401_1_V1","GCA_002222475.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii Ze90-1 (GCA_002222385)","Tremellales","1230078","Cryp_neof_Ze90_1_V1","GCA_002222385.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii c45 (GCA_002215855)","Tremellales","1230068","Cryp_neof_C45_V1","GCA_002215855.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii c8 (GCA_002222405)","Tremellales","1230063","Cryp_neof_C8_V1","GCA_002222405.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CCTP51 (GCA_002217545)","Tremellales","178876","Cryp_neof_grubii_cng10_V1","GCA_002217545.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CM20 (GCA_002222115)","Tremellales","178876","Cryp_neof_grubii_cng5_V1","GCA_002222115.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CM24 (GCA_002222145)","Tremellales","178876","Cryp_neof_grubii_cng6_V1","GCA_002222145.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CM36 (GCA_002222245)","Tremellales","178876","Cryp_neof_grubii_cng2_V1","GCA_002222245.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CM50 (GCA_002222135)","Tremellales","178876","Cryp_neof_grubii_cng1_V1","GCA_002222135.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CM52 (GCA_002222165)","Tremellales","178876","Cryp_neof_grubii_cng3_V1","GCA_002222165.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. CM64 (GCA_002222025)","Tremellales","178876","Cryp_neof_grubii_cng4_V1","GCA_002222025.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. KN99 (GCA_002216725)","Tremellales","178876","ASM221672v1","GCA_002216725.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. RCT21 (GCA_002222155)","Tremellales","178876","Cryp_neof_grubii_cng11_V1","GCA_002222155.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. RCT54 (GCA_002222015)","Tremellales","178876","Cryp_neof_grubii_cng8_V1","GCA_002222015.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. RCT6 (GCA_002222095)","Tremellales","178876","Cryp_neof_grubii_cng7_V1","GCA_002222095.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. V2 (GCA_002215755)","Tremellales","178876","Cneo_seroA_V2","GCA_002215755.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. grubii str. WM-1408 (GCA_002220045)","Tremellales","178876","Cneo_seroA_WM1408","GCA_002220045.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. neoformans B-3501A (GCA_000149385)","Tremellales","283643","ASM14938v1","GCA_000149385.1","-","-","-","-","-","-" +"","Cryptococcus neoformans var. neoformans JEC21","Tremellales","214684","ASM9104v1","GCA_000091045.1","-","-","-","-","","-" +"","Cutaneotrichosporon oleaginosum str. IBC0246 (GCA_001027345)","","879819","Triol1","GCA_001027345.1","-","-","-","-","","-" +"","Cyberlindnera fabianii str. 65 (GCA_001983305)","Saccharomycetales","36022","ASM198330v1","GCA_001983305.1","-","-","-","-","-","-" +"","Cyberlindnera fabianii str. YJS4271 (GCA_003205855)","Saccharomycetales","36022","ASM320585v1","GCA_003205855.1","-","-","-","-","","-" +"","Cyberlindnera jadinii NRRL Y-1542 (GCA_001661405)","Saccharomycetales","983966","Cybja1","GCA_001661405.1","-","-","-","-","-","-" +"","Cyberlindnera jadinii str. CBS1600 (GCA_001245095)","Saccharomycetales","4903","cj1","GCA_001245095.1","-","-","-","-","","-" +"","Cylindrobasidium torrendii FP15055 ss-10 (GCA_000934385)","Agaricales","1314674","Cylto1","GCA_000934385.1","-","-","-","-","","-" +"","Cyphellophora europaea CBS 101466 (GCA_000365145)","Chaetothyriomycetidae","1220924","Phia_euro_CBS_101466_V1","GCA_000365145.2","-","-","-","-","","-" +"","Dacryopinax primogenitus str. DJM-731 SS1 (GCA_000292625)","Dacrymycetales","1858805","Dacryopinax_sp._DJM_731_SSP1_v1.0","GCA_000292625.1","-","-","-","-","","-" +"","Dactylellina haptotyla CBS 200.50 (GCA_000441935)","Orbiliales","1284197","MHA_v2","GCA_000441935.1","-","-","-","-","","-" +"","Daedalea quercina L-15889 (GCA_001632345)","Polyporales","1314783","Daequ1","GCA_001632345.1","-","-","-","-","","-" +"","Daldinia sp. EC12 (GCA_002120325)","Xylariales","1001832","DalEC12_v.1.0","GCA_002120325.1","-","-","-","-","","-" +"","Debaryomyces fabryi str. CBS 789 (GCA_001447935)","Saccharomycetales","58627","debFab1.0","GCA_001447935.1","-","-","-","-","","-" +"","Debaryomyces hansenii CBS767 (GCA_000006445)","Saccharomycetales","284592","ASM644v2","GCA_000006445.2","-","-","-","-","","-" +"","Diaporthe ampelina (GCA_001006365)","Sordariomycetidae","1214573","UCDDA912v1.0","GCA_001006365.1","-","-","-","-","","-" +"","Diaporthe helianthi str. 7/96 (GCA_001702395)","Sordariomycetidae","158607","DHEL01v2","GCA_001702395.2","-","-","-","-","","-" +"","Dichomitus squalens LYAD-421 SS1 (GCA_000275845)","Polyporales","732165","Dichomitus_squalens_v1.0","GCA_000275845.1","-","-","-","-","","-" +"","Diplocarpon rosae (GCA_002317995)","Helotiales","946125","ASM231799v1","GCA_002317995.1","-","-","-","-","","-" +"","Diplodia corticola str. CBS 112549 (GCA_001883845)","Botryosphaeriales","236234","ASM188384v1","GCA_001883845.1","-","-","-","-","","-" +"","Diplodia seriata (GCA_001006355)","Botryosphaeriales","420778","UCDDS831v0.1","GCA_001006355.1","-","-","-","-","","-" +"","Diplodia seriata str. F98.1 (GCA_001975905)","Botryosphaeriales","420778","Dipser_v1","GCA_001975905.1","-","-","-","-","-","-" +"","Dothistroma septosporum","Capnodiales","675120","GCA_000340195.1","GCA_000340195.1","-","-","-","","","-" +"","Drechmeria coniospora str. ARSEF 6962 (GCA_001625195)","Hypocreales","98403","ASM162519v1","GCA_001625195.1","-","-","-","-","","-" +"","Drechslerella stenobrocha 248 (GCA_000525045)","Orbiliales","1043628","DREv1","GCA_000525045.1","-","-","-","-","","-" +"","Edhazardia aedis USNM 41457 (GCA_000230595)","Microsporidia","1003232","Edha_aedis_V4b","GCA_000230595.3","-","-","-","-","","-" +"","Elaphomyces granulatus str. OSC145934 (GCA_002240705)","Eurotiales","519963","PX439","GCA_002240705.1","-","-","-","-","","-" +"","Elsinoe australis str. NL1 (GCA_003013795)","","40998","ASM301379v1","GCA_003013795.1","-","-","-","-","","-" +"","Emergomyces pasteuriana Ep9510 str. UAMH 9510 (GCA_001883825)","Onygenales","1447872","Emmo_past_UAMH9510_V1","GCA_001883825.1","-","-","-","-","","-" +"","Emmonsia crescens UAMH 3008 (GCA_001008285)","Onygenales","1247875","ASM100828v1","GCA_001008285.1","-","-","-","-","","-" +"","Emmonsia crescens str. UAMH4076 (GCA_002572855)","Onygenales","73230","Emmon_cres_4076_V1","GCA_002572855.1","-","-","-","-","-","-" +"","Emmonsia parva UAMH 139 (GCA_001014755)","Onygenales","2060906","ASM101475v1","GCA_001014755.1","-","-","-","-","","-" +"","Emmonsia parva str. UAMH130 (GCA_002572885)","Onygenales","2060905","Emmon_parv_130","GCA_002572885.1","-","-","-","-","-","-" +"","Emmonsia sp. CAC-2015a str. CBS 136260 (GCA_001660665)","Onygenales","1658172","Emmo_afri_EA111","GCA_001660665.1","-","-","-","-","","-" +"","Encephalitozoon cuniculi EcunIII-L (GCA_001078035)","Unikaryonidae","1355160","ECIIIL","GCA_001078035.1","-","-","-","-","-","-" +"","Encephalitozoon hellem ATCC 50504 (GCA_000277815)","Unikaryonidae","907965","ASM27781v3","GCA_000277815.3","-","-","-","-","-","-" +"","Encephalitozoon intestinalis ATCC 50506 (GCA_000146465)","Unikaryonidae","876142","ASM14646v1","GCA_000146465.1","-","-","-","-","-","-" +"","Encephalitozoon romaleae SJ-2008 (GCA_000280035)","Unikaryonidae","1178016","ASM28003v2","GCA_000280035.2","-","-","-","-","-","-" +"","Endocarpon pusillum Z07020 (GCA_000464535)","Verrucariales","1263415","EPUS","GCA_000464535.1","-","-","-","-","","-" +"","Enterocytozoon bieneusi H348 (GCA_000209485)","Microsporidia","481877","ASM20948v1","GCA_000209485.1","-","-","-","-","","-" +"","Enterocytozoon hepatopenaei str. TH1 (GCA_002081675)","Microsporidia","646526","ASM208167v1","GCA_002081675.1","-","-","-","-","","-" +"","Enterospora canceri str. GB1 (GCA_002087915)","Microsporidia","1081671","ASM208791v1","GCA_002087915.1","-","-","-","-","","-" +"","Epicoccum nigrum str. ICMP 19927 (GCA_002116315)","Pleosporales","105696","ASM211631v1","GCA_002116315.1","-","-","-","-","","-" +"","Eremothecium cymbalariae DBVPG#7215 (GCA_000235365)","Saccharomycetales","931890","ASM23536v1","GCA_000235365.1","-","-","-","-","","-" +"","Eremothecium gossypii FDAG1 (GCA_000968835)","Saccharomycetales","1034331","ASM96883v1","GCA_000968835.1","-","-","-","-","","-" +"","Erysiphe necator (GCA_000798715)","Erysiphales","52586","ASM79871v1","GCA_000798715.1","-","-","-","-","","-" +"","Erysiphe pulchra (GCA_002918395)","Erysiphales","225359","ASM291839v1","GCA_002918395.1","-","-","-","-","","-" +"","Escovopsis weberi (GCA_001278495)","Hypocreales","150374","ASM127849v1","GCA_001278495.1","-","-","-","-","","-" +"","Eutypa lata UCREL1 (GCA_000349385)","Xylariales","1287681","UCREL1V03","GCA_000349385.1","-","-","-","-","","-" +"","Exidia glandulosa HHB12029 (GCA_001632375)","","1314781","Exigl1","GCA_001632375.1","-","-","-","-","","-" +"","Exophiala aquamarina CBS 119918 (GCA_000709125)","Chaetothyriomycetidae","1182545","Exop_aqua_CBS_119918_V1","GCA_000709125.1","-","-","-","-","","-" +"","Exophiala dermatitidis NIH/UT8656 (GCA_000230625)","Chaetothyriomycetidae","858893","Exop_derm_V1","GCA_000230625.1","-","-","-","-","","-" +"","Exophiala mesophila str. CBS 40295 (GCA_000836275)","Chaetothyriomycetidae","212818","Exop_meso_CBS40295_V1","GCA_000836275.1","-","-","-","-","","-" +"","Exophiala oligosperma str. CBS 72588 (GCA_000835515)","Chaetothyriomycetidae","215243","Exop_olig_CBS72588_V1","GCA_000835515.1","-","-","-","-","","-" +"","Exophiala sideris str. CBS 121828 (GCA_000835395)","Chaetothyriomycetidae","1016849","Exop_side_CBS121828_V1","GCA_000835395.1","-","-","-","-","","-" +"","Exophiala spinifera str. CBS 89968 (GCA_000836115)","Chaetothyriomycetidae","91928","Exop_spin_CBS89968_V1","GCA_000836115.1","-","-","-","-","","-" +"","Exophiala xenobiotica str. CBS 118157 (GCA_000835505)","Chaetothyriomycetidae","348802","Exop_xeno_CBS118157_V1","GCA_000835505.1","-","-","-","-","","-" +"","Exserohilum turcica Et28A (GCA_000359705)","Pleosporales","671987","Setospaeria_trucica_Et28A_v1.0","GCA_000359705.1","-","-","-","-","","-" +"","Fibroporia radiculosa str. TFFH 294 (GCA_000313525)","Polyporales","599839","ASM31352v1","GCA_000313525.1","-","-","-","-","","-" +"","Fibularhizoctonia sp. CBS 109695 (GCA_001630335)","Atheliales","436010","Fibsp1","GCA_001630335.1","-","-","-","-","","-" +"","Fistulina hepatica ATCC 64428 (GCA_000934395)","Agaricales","1128425","Fishe1","GCA_000934395.1","-","-","-","-","","-" +"","Fomitiporia mediterranea MF3/22 (GCA_000271605)","Hymenochaetales","694068","Fomme1","GCA_000271605.1","-","-","-","-","","-" +"","Fomitopsis pinicola FP-58527 SS1 (GCA_000344655)","Polyporales","743788","Fompi3","GCA_000344655.2","-","-","-","-","","-" +"","Fonsecaea erecta (GCA_001651985)","Chaetothyriomycetidae","1367422","ASM165198v1","GCA_001651985.1","-","-","-","-","","-" +"","Fonsecaea monophora (GCA_001642475)","Chaetothyriomycetidae","254056","ASM164247v1","GCA_001642475.1","-","-","-","-","","-" +"","Fonsecaea multimorphosa (GCA_001646985)","Chaetothyriomycetidae","979981","ASM164698v1","GCA_001646985.1","-","-","-","-","-","-" +"","Fonsecaea multimorphosa CBS 102226 (GCA_000836435)","Chaetothyriomycetidae","1442371","Fons_mult_CBS_102226_V1","GCA_000836435.1","-","-","-","-","","-" +"","Fonsecaea nubica (GCA_001646965)","Chaetothyriomycetidae","856822","ASM164696v1","GCA_001646965.1","-","-","-","-","","-" +"","Fonsecaea pedrosoi CBS 271.37 (GCA_000835455)","Chaetothyriomycetidae","1442368","Fons_pedr_CBS_271_37_V1","GCA_000835455.1","-","-","-","-","","-" +"","Fusarium culmorum UK99","Hypocreales","1318462","EF1","GCA_900074845.1","-","-","-","","","-" +"","Fusarium fujikuroi","Hypocreales","5127","EF1","GCA_000315255.1","-","-","-","","","-" +"","Fusarium fujikuroi (GCA_001023035)","Hypocreales","5127","ASM102303v1","GCA_001023035.1","-","-","-","-","-","-" +"","Fusarium fujikuroi (GCA_001023045)","Hypocreales","5127","ASM102304v1","GCA_001023045.1","-","-","-","-","-","-" +"","Fusarium fujikuroi (GCA_001023065)","Hypocreales","5127","ASM102306v1","GCA_001023065.1","-","-","-","-","-","-" +"","Fusarium fujikuroi (GCA_900096505)","Hypocreales","5127","version_1","GCA_900096505.1","-","-","-","-","-","-" +"","Fusarium fujikuroi (GCA_900096685)","Hypocreales","5127","version_1","GCA_900096685.1","-","-","-","-","-","-" +"","Fusarium fujikuroi (GCA_900096705)","Hypocreales","5127","version_1","GCA_900096705.1","-","-","-","-","-","-" +"","Fusarium graminearum PH-1 (GCA_000240135)","Hypocreales","229533","ASM24013v3","GCA_000240135.3","-","-","-","-","-","-" +"","Fusarium graminearum str. CS3005 (GCA_000599445)","Hypocreales","5518","CS3005v1","GCA_000599445.1","-","-","-","-","","-" +"","Fusarium graminearum str. PH-1","Hypocreales","5518","RR1","GCA_900044135.1","","-","-","","-","-" +"","Fusarium langsethiae str. Fl201059 (GCA_001292635)","Hypocreales","179993","ASM129263v1","GCA_001292635.1","-","-","-","-","-","-" +"","Fusarium mangiferae (GCA_900044065)","Hypocreales","192010","Genome_assembly_version_1","GCA_900044065.1","-","-","-","-","-","-" +"","Fusarium nygamai (GCA_002894225)","Hypocreales","42673","CS10214v1","GCA_002894225.1","-","-","-","-","-","-" +"","Fusarium oxysporum","Hypocreales","426428","FO2","GCA_000222805.1","","-","","","","-" +"","Fusarium oxysporum (GCA_900096695)","Hypocreales","5507","version_1","GCA_900096695.1","-","-","-","-","-","-" +"","Fusarium oxysporum FOSC 3-a (GCA_000271745)","Hypocreales","909455","FO_FOSC_3_a_V1","GCA_000271745.2","-","-","-","-","-","-" +"","Fusarium oxysporum Fo47 (GCA_000271705)","Hypocreales","660027","FO_Fo47_V1","GCA_000271705.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. conglutinans race 2 54008 str. 54008 (PHW808) (GCA_000260215)","Hypocreales","1089457","FO_PHW808_V1","GCA_000260215.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. cubense race 1 (GCA_000350345)","Hypocreales","1229664","Foc1_1.0","GCA_000350345.1","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. cubense race 4 (GCA_000350365)","Hypocreales","1229665","Foc4_1.0","GCA_000350365.1","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. cubense tropical race 4 54006 str. 54006 (II5) (GCA_000260195)","Hypocreales","1089451","FO_II5_V1","GCA_000260195.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. lycopersici 4287 (GCA_000149955)","Hypocreales","426428","ASM14995v2","GCA_000149955.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. lycopersici MN25 (GCA_000259975)","Hypocreales","1080343","FO_MN25_V1","GCA_000259975.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. melonis 26406 str. 26406 (melonis) (GCA_000260495)","Hypocreales","1089452","FO_melonis_V1","GCA_000260495.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. pisi HDV247 (GCA_000260075)","Hypocreales","1080344","FO_HDV247_V1","GCA_000260075.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. radicis-cucumerinum (GCA_001702695)","Hypocreales","327505","ASM170269v2","GCA_001702695.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. radicis-lycopersici 26381 str. 26381 (CL57) (GCA_000260155)","Hypocreales","1089448","FO_CL57_V1","GCA_000260155.3","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. raphani 54005 (GCA_000260235)","Hypocreales","1089458","FO_PHW815_V1","GCA_000260235.2","-","-","-","-","-","-" +"","Fusarium oxysporum f. sp. vasinfectum 25433 str. 25433 (Cotton) (GCA_000260175)","Hypocreales","1089449","FO_Cotton_V1","GCA_000260175.2","-","-","-","-","-","-" +"","Fusarium poae (GCA_001675295)","Hypocreales","36050","FPOA1.0","GCA_001675295.1","-","-","-","-","-","-" +"","Fusarium proliferatum (GCA_900029915)","Hypocreales","948311","F._proliferatum_NRRL62905_version_1","GCA_900029915.1","-","-","-","-","-","-" +"","Fusarium proliferatum ET1 (GCA_900067095)","Hypocreales","1227346","F._proliferatum_ET1_version_1","GCA_900067095.1","-","-","-","-","-","-" +"","Fusarium pseudograminearum","Hypocreales","1028729","GCA_000303195.1","GCA_000303195.1","-","-","-","","","-" +"","Fusarium solani","Hypocreales","660122","v2.0","GCA_000151355.1","-","-","","","","-" +"","Fusarium venenatum (GCA_900007375)","Hypocreales","56646","ASM90000737v1","GCA_900007375.1","-","-","-","-","-","-" +"","Fusarium verticillioides","Hypocreales","334819","ASM14955v1","GCA_000149555.1","-","-","","","","-" +"","Gaeumannomyces tritici R3-111a-1","Magnaporthales","644352","Gae_graminis_V2","GCA_000145635.1","-","-","-","-","","-" +"","Galerina marginata CBS 339.88 (GCA_000697645)","Agaricales","685588","Galma1","GCA_000697645.1","-","-","-","-","","-" +"","Ganoderma sinense ZZ0214-1 (GCA_002760635)","Polyporales","1077348","GanSi1.6","GCA_002760635.1","-","-","-","-","","-" +"","Gelatoporia subvermispora B (GCA_000320605)","Polyporales","914234","Ceriporiopsis_subvermispora_B_v1.0","GCA_000320605.2","-","-","-","-","","-" +"","Glarea lozoyensis ATCC 20868 str. 1224 (GCA_000409485)","Helotiales","1116229","GLAREA","GCA_000409485.1","-","-","-","-","","-" +"","Gloeophyllum trabeum ATCC 11539 (GCA_000344685)","Gloeophyllales","670483","Glotr1_1","GCA_000344685.1","-","-","-","-","","-" +"","Gonapodya prolifera JEL478 (GCA_001574975)","","1344416","Ganpr1","GCA_001574975.1","-","-","-","-","","-" +"","Grifola frondosa str. 9006-11 (GCA_001683735)","Agaricales","5627","ASM168373v1","GCA_001683735.1","-","-","-","-","","-" +"","Grosmannia clavigera kw1407 (GCA_000143105)","Ophiostomatales","655863","Sanger-454-IlluminaPA_2.0","GCA_000143105.2","-","-","-","-","","-" +"","Gymnopus luxurians FD-317 M1 (GCA_000827265)","Agaricales","944289","Gymlu1","GCA_000827265.1","-","-","-","-","","-" +"","Hanseniaspora guilliermondii (GCA_900119595)","Saccharomycetales","56406","version_1","GCA_900119595.1","-","-","-","-","","-" +"","Hanseniaspora opuntiae (GCA_001749795)","Saccharomycetales","211096","ASM174979v1","GCA_001749795.1","-","-","-","-","","-" +"","Hanseniaspora osmophila (GCA_001747045)","Saccharomycetales","56408","ASM174704v1","GCA_001747045.1","-","-","-","-","","-" +"","Hanseniaspora uvarum (GCA_001747055)","Saccharomycetales","29833","ASM174705v1","GCA_001747055.1","-","-","-","-","-","-" +"","Hanseniaspora uvarum DSM 2768 (GCA_000968475)","Saccharomycetales","1246595","Huva2.0","GCA_000968475.1","-","-","-","-","","-" +"","Hanseniaspora valbyensis NRRL Y-1626 (GCA_001664025)","Saccharomycetales","766949","Hanva1_1","GCA_001664025.1","-","-","-","-","","-" +"","Hebeloma cylindrosporum h7 (GCA_000827355)","Agaricales","686832","Hebeloma_cylindrosporum_h7_v2.0","GCA_000827355.1","-","-","-","-","","-" +"","Helicocarpus griseus UAMH5409 (GCA_002573585)","Onygenales","1447875","Heli_gris_5409_V1","GCA_002573585.1","-","-","-","-","","-" +"","Hepatospora eriocheir str. GB1 (GCA_002087885)","Microsporidia","1081669","ASM208788v1","GCA_002087885.1","-","-","-","-","-","-" +"","Hepatospora eriocheir str. canceri (GCA_002087875)","Microsporidia","1081669","ASM208787v1","GCA_002087875.1","-","-","-","-","","-" +"","Hesseltinella vesiculosa str. NRRL 3301","Mucoromycotina","101127","Hesve2","GCA_002104935.1","-","-","-","-","","-" +"","Heterobasidion irregulare TC 32-1 (GCA_000320585)","Russulales","747525","Heterobasidion_irregulare_v2.0","GCA_000320585.2","-","-","-","-","","-" +"","Hirsutella minnesotensis 3608 (GCA_000956045)","Hypocreales","1043627","ASM95604v1","GCA_000956045.1","-","-","-","-","","-" +"","Histoplasma capsulatum G186AR (GCA_000150115)","Onygenales","447093","ASM15011v1","GCA_000150115.1","-","-","-","-","-","-" +"","Histoplasma capsulatum H143 (GCA_000151035)","Onygenales","544712","ASM15103v1","GCA_000151035.1","-","-","-","-","-","-" +"","Histoplasma capsulatum H88 (GCA_000151005)","Onygenales","544711","ASM15100v2","GCA_000151005.2","-","-","-","-","-","-" +"","Histoplasma capsulatum NAm1 (GCA_000149585)","Onygenales","339724","ASM14958v1","GCA_000149585.1","-","-","-","-","","-" +"","Hortaea werneckii EXF-2000 (GCA_002127715)","Dothideales","1157616","HwerPB1","GCA_002127715.1","-","-","-","-","","-" +"","Hydnomerulius pinastri MD-312 (GCA_000827185)","Boletales","994086","Hydpi2","GCA_000827185.1","-","-","-","-","","-" +"","Hypholoma sublateritium FD-334 SS-4 (GCA_000827495)","Agaricales","945553","Hypsu1","GCA_000827495.1","-","-","-","-","","-" +"","Hyphopichia burtonii NRRL Y-1933 (GCA_001661395)","Saccharomycetales","984485","Hypbu1","GCA_001661395.1","-","-","-","-","","-" +"","Hypoxylon sp. CI-4A (GCA_002120315)","Xylariales","1001833","HypCI4A_v1.0","GCA_002120315.1","-","-","-","-","","-" +"","Hypoxylon sp. CO27-5 (GCA_002120305)","Xylariales","1001938","HypCO275_v1.0","GCA_002120305.1","-","-","-","-","-","-" +"","Hypoxylon sp. EC38 (GCA_002120335)","Xylariales","1001937","HypEC38_v3.0","GCA_002120335.1","-","-","-","-","-","-" +"","Hypsizygus marmoreus str. 51987-8 (GCA_001605315)","Agaricales","39966","ASM160531v1","GCA_001605315.1","-","-","-","-","","-" +"","Jaapia argillacea MUCL 33604 (GCA_000697665)","Jaapiales","933084","Jaaar1","GCA_000697665.1","-","-","-","-","","-" +"","Jaminaea rosea str. MCA 5214 (GCA_003144245)","","1569628","Jamsp1","GCA_003144245.1","-","-","-","-","","-" +"","Kalmanozyma brasiliensis GHG001 (GCA_000497045)","Ustilaginales","1365824","PSEUBRA1","GCA_000497045.1","-","-","-","-","","-" +"","Kazachstania africana CBS 2517 (GCA_000304475)","Saccharomycetales","1071382","Ka_CBS2517","GCA_000304475.1","-","-","-","-","","-" +"","Kazachstania naganishii CBS 8797 (GCA_000348985)","Saccharomycetales","1071383","ASM34898v1","GCA_000348985.1","-","-","-","-","","-" +"","Kluyveromyces dobzhanskii CBS 2104 str. CBS2104 (GCA_000820885)","Saccharomycetales","1427455","KLDO_01","GCA_000820885.1","-","-","-","-","","-" +"","Kluyveromyces lactis str. NRRL Y-1140 (GCA_000002515)","Saccharomycetales","28985","ASM251v1","GCA_000002515.1","-","-","-","-","","-" +"","Kluyveromyces marxianus DMKU3-1042 (GCA_001417885)","Saccharomycetales","1003335","Kmar_1.0","GCA_001417885.1","-","-","-","-","","-" +"","Kluyveromyces marxianus str. NBRC 1777 (GCA_001417835)","Saccharomycetales","4911","KM1777_03","GCA_001417835.1","-","-","-","-","-","-" +"","Kockovaella imperatae str. NRRL Y-17943 (GCA_002102565)","Tremellales","4999","Kocim1","GCA_002102565.1","-","-","-","-","","-" +"","Komagataella pastoris","Saccharomycetales","644223","GCA_000027005.1","GCA_000027005.1","-","-","-","","","-" +"","Komagataella pastoris (GCA_001708105)","Saccharomycetales","4922","ASM170810v1","GCA_001708105.1","-","-","-","-","-","-" +"","Komagataella phaffii CBS 7435 (GCA_000223565)","Saccharomycetales","981350","PicPas_Mar2011","GCA_000223565.1","-","-","-","-","-","-" +"","Komagataella phaffii CBS 7435 (GCA_900235035)","Saccharomycetales","981350","ASM90023503v1","GCA_900235035.1","-","-","-","-","-","-" +"","Komagataella phaffii GS115 (GCA_001746955)","Saccharomycetales","644223","ASM174695v1","GCA_001746955.1","-","-","-","-","","-" +"","Komagataella phaffii str. WT (GCA_001708085)","Saccharomycetales","460519","ASM170808v1","GCA_001708085.1","-","-","-","-","-","-" +"","Kuraishia capsulata CBS 1993 (GCA_000576695)","Saccharomycetales","1382522","AUH_PRJEB4427_v1","GCA_000576695.1","-","-","-","-","","-" +"","Kwoniella bestiolae CBS 10118 (GCA_000512585)","Tremellales","1296100","Cryp_best_CBS10118_V1","GCA_000512585.2","-","-","-","-","","-" +"","Kwoniella dejecticola CBS 10117 (GCA_000512565)","Tremellales","1296121","Cryp_deje_CBS10117_V1","GCA_000512565.2","-","-","-","-","","-" +"","Kwoniella heveanensis BCC8398 (GCA_000507405)","Tremellales","1296120","Cryp_heve_BCC8398_V1","GCA_000507405.3","-","-","-","-","-","-" +"","Kwoniella heveanensis CBS 569 (GCA_000507425)","Tremellales","1296119","Cryp_heve_CBS569_V2","GCA_000507425.3","-","-","-","-","-","-" +"","Kwoniella mangroviensis CBS 10435 (GCA_000507885)","Tremellales","1331196","Kwon_mang_CBS10435_V2","GCA_000507885.2","-","-","-","-","-","-" +"","Kwoniella mangroviensis CBS 8507 (GCA_000507465)","Tremellales","1296122","Kwon_mang_CBS8507_V2","GCA_000507465.3","-","-","-","-","-","-" +"","Kwoniella mangroviensis CBS 8886 (GCA_000507485)","Tremellales","1296123","Kwon_mang_CBS8886_V1","GCA_000507485.3","-","-","-","-","-","-" +"","Kwoniella pini CBS 10737 (GCA_000512605)","Tremellales","1296096","Cryp_pinu_CBS10737_V1","GCA_000512605.2","-","-","-","-","","-" +"","Laccaria amethystina LaAM-08-1 (GCA_000827195)","Agaricales","1095629","Laccaria_amethystina_LaAM-08-1_v1.0","GCA_000827195.1","-","-","-","-","","-" +"","Laccaria bicolor S238N-H82 (GCA_000143565)","Agaricales","486041","V1.0","GCA_000143565.1","-","-","-","-","","-" +"","Lachancea dasiensis CBS 10888 (GCA_900074725)","Saccharomycetales","1266660","LADA0","GCA_900074725.1","-","-","-","-","","-" +"","Lachancea fermentati (GCA_900074765)","Saccharomycetales","4955","LAFE0","GCA_900074765.1","-","-","-","-","-","-" +"","Lachancea lanzarotensis str. CBS 12615 (GCA_000938715)","Saccharomycetales","1245769","LALA0","GCA_000938715.1","-","-","-","-","","-" +"","Lachancea meyersii CBS 8951 (GCA_900074715)","Saccharomycetales","1266667","LAME0","GCA_900074715.1","-","-","-","-","-","-" +"","Lachancea mirantina (GCA_900074745)","Saccharomycetales","1230905","LAMI0","GCA_900074745.1","-","-","-","-","-","-" +"","Lachancea nothofagi CBS 11611 (GCA_900074755)","Saccharomycetales","1266666","LANO0","GCA_900074755.1","-","-","-","-","-","-" +"","Lachancea quebecensis (GCA_002900925)","Saccharomycetales","1654605","ASM290092v1","GCA_002900925.1","-","-","-","-","-","-" +"","Lachancea sp. CBS 6924 (GCA_900074735)","Saccharomycetales","433476","LAFA0","GCA_900074735.1","-","-","-","-","-","-" +"","Lachancea thermotolerans CBS 6340 (GCA_000142805)","Saccharomycetales","559295","ASM14280v1","GCA_000142805.1","-","-","-","-","-","-" +"","Laetiporus sulphureus 93-53 (GCA_001632365)","Polyporales","1314785","Laesu1","GCA_001632365.1","-","-","-","-","","-" +"","Lentinula edodes str. G408PP-4 (GCA_002003045)","Agaricales","5353","Lened_assembly01","GCA_002003045.1","-","-","-","-","","-" +"","Leptosphaeria maculans","Pleosporales","985895","ASM23037v1","GCA_000230375.1","-","-","-","","","-" +"","Leucoagaricus sp. SymC.cos (GCA_001563735)","Agaricales","1714833","ASM156373v1","GCA_001563735.1","-","-","-","-","","-" +"","Leucosporidium creatinivorum str. 62-1032 (GCA_002105055)","","106004","Leucr1","GCA_002105055.1","-","-","-","-","","-" +"","Lichtheimia corymbifera JMRC:FSU:9682 (GCA_000723665)","Mucoromycotina","1263082","454Minimus","GCA_000723665.1","-","-","-","-","","-" +"","Lichtheimia ramosa str. JMRC:FSU:6197 (GCA_000945115)","Mucoromycotina","688394","Lramosa_hybrid_454_Illumina","GCA_000945115.1","-","-","-","-","","-" +"","Lipomyces starkeyi NRRL Y-11557 (GCA_001661325)","Saccharomycetales","675824","Lipst1_1","GCA_001661325.1","-","-","-","-","","-" +"","Lobosporangium transversale str. NRRL 3116","Mortierellomycotina","64571","Lobtra1","GCA_002105155.1","-","-","-","-","","-" +"","Lodderomyces elongisporus NRRL YB-4239 (GCA_000149685)","Saccharomycetales","379508","ASM14968v1","GCA_000149685.1","-","-","-","-","","-" +"","Lomentospora prolificans str. JHH-5317 (GCA_002276285)","Microascales","41688","Lprolificans_pilon","GCA_002276285.1","-","-","-","-","","-" +"","Macrophomina phaseolina MS6 (GCA_000302655)","Botryosphaeriales","1126212","MphMS6_1.0","GCA_000302655.1","-","-","-","-","","-" +"","Madurella mycetomatis str. mm55 (GCA_001275765)","Sordariales","100816","ASM127576v2","GCA_001275765.2","-","-","-","-","","-" +"","Magnaporthe oryzae","Magnaporthales","242507","MG8","GCA_000002495.2","-","-","","","","-" +"","Magnaporthe poae","Magnaporthales","644358","Mag_poae_ATCC_64411_V1","GCA_000193285.1","-","-","","","","-" +"","Malassezia globosa CBS 7966 (GCA_000181695)","Malasseziales","425265","ASM18169v1","GCA_000181695.1","-","-","-","-","","-" +"","Malassezia pachydermatis (GCA_001278385)","Malasseziales","77020","MalaPachy","GCA_001278385.1","-","-","-","-","","-" +"","Malassezia sympodialis ATCC 42132 (GCA_000349305)","Malasseziales","1230383","ASM34930v2","GCA_000349305.2","-","-","-","-","","-" +"","Malassezia sympodialis ATCC 42132 (GCA_900149145)","Malasseziales","1230383","Msy_ATCC_42132_Feb2016","GCA_900149145.1","-","-","-","-","-","-" +"","Malassezia vespertilionis str. NWHC:44797-103 (GCA_002818225)","Malasseziales","2020962","ASM281822v1","GCA_002818225.1","-","-","-","-","","-" +"","Marssonina brunnea f. sp. 'multigermtubi' MB_m1 (GCA_000298775)","Helotiales","1072389","ASM29877v1","GCA_000298775.1","-","-","-","-","","-" +"","Meira miltonrushii str. MCA 3882 (GCA_003144205)","","1280837","Meimi1","GCA_003144205.1","-","-","-","-","","-" +"","Melampsora larici-populina","Pucciniales","747676","GCA_000204055.1","GCA_000204055.1","-","-","-","","","-" +"","Meliniomyces bicolor E (GCA_002865645)","Helotiales","1095630","Melbi2","GCA_002865645.1","-","-","-","-","","-" +"","Meliniomyces variabilis F (GCA_002865655)","Helotiales","1149755","Melva1","GCA_002865655.1","-","-","-","-","","-" +"","Metarhizium acridum CQMa 102 (GCA_000187405)","Hypocreales","655827","MetAcr_May2010","GCA_000187405.1","-","-","-","-","","-" +"","Metarhizium album ARSEF 1941 (GCA_000804445)","Hypocreales","1081103","MAM_1.0_for_version_1_of_the_Metarhizium_album_genome","GCA_000804445.1","-","-","-","-","","-" +"","Metarhizium anisopliae ARSEF 549 (GCA_000814975)","Hypocreales","1276135","MAN_1.0","GCA_000814975.1","-","-","-","-","-","-" +"","Metarhizium anisopliae BRIP 53284 (GCA_000426985)","Hypocreales","1291519","ASM42698v1","GCA_000426985.1","-","-","-","-","-","-" +"","Metarhizium anisopliae BRIP 53293 (GCA_000426965)","Hypocreales","1291518","ASM42696v1","GCA_000426965.1","-","-","-","-","-","-" +"","Metarhizium anisopliae str. E6 (GCA_000739145)","Hypocreales","5530","Metarhizium_anisopliae","GCA_000739145.1","-","-","-","-","-","-" +"","Metarhizium brunneum ARSEF 3297 (GCA_000814965)","Hypocreales","1276141","MBR_1.0","GCA_000814965.1","-","-","-","-","-","-" +"","Metarhizium guizhouense ARSEF 977 (GCA_000814955)","Hypocreales","1276136","MGU_1.0","GCA_000814955.1","-","-","-","-","-","-" +"","Metarhizium majus ARSEF 297 (GCA_000814945)","Hypocreales","1276143","MAJ_1.0","GCA_000814945.1","-","-","-","-","","-" +"","Metarhizium rileyi RCEF 4871 (GCA_001636745)","Hypocreales","1081105","NOR_1.0","GCA_001636745.1","-","-","-","-","","-" +"","Metarhizium robertsii (GCA_000591435)","Hypocreales","568076","MR2010_11_27","GCA_000591435.1","-","-","-","-","-","-" +"","Metarhizium robertsii ARSEF 23 (GCA_000187425)","Hypocreales","655844","MAA_2.0","GCA_000187425.2","-","-","-","-","","-" +"","Metschnikowia bicuspidata var. bicuspidata NRRL YB-4993 (GCA_001664035)","Saccharomycetales","869754","Metbi1","GCA_001664035.1","-","-","-","-","","-" +"","Meyerozyma guilliermondii ATCC 6260 (GCA_000149425)","Saccharomycetales","294746","ASM14942v1","GCA_000149425.1","-","-","-","-","","-" +"","Microbotryum intermedium (GCA_900096595)","Microbotryales","269621","Microbotrium_Intermedium_Assembly","GCA_900096595.1","-","-","-","-","","-" +"","Microbotryum violaceum","Microbotryales","683840","GCA_000166175.1","GCA_000166175.1","-","-","-","","","-" +"","Microdochium bolleyi str. J235TASD1 (GCA_001566295)","Xylariales","196109","Microdochium_bolleyi_v1.0","GCA_001566295.1","-","-","-","-","","-" +"","Microsporum canis CBS 113480 (GCA_000151145)","Onygenales","554155","ASM15114v1","GCA_000151145.1","-","-","-","-","","-" +"","Millerozyma farinosa CBS 7064 (GCA_000315895)","Saccharomycetales","559304","ASM31589v1","GCA_000315895.1","-","-","-","-","","-" +"","Mitosporidium daphniae str. UGP3 (GCA_000760515)","Microsporidia","1485682","UGP1.0","GCA_000760515.1","-","-","-","-","","-" +"","Mixia osmundae IAM 14324 (GCA_000241205)","Mixiales","764103","Mosmundae_2.0","GCA_000241205.2","-","-","-","-","","-" +"","Mixia osmundae IAM 14324 (GCA_000708205)","Mixiales","764103","Mixia_osmundae_v1.0","GCA_000708205.1","-","-","-","-","-","-" +"","Moelleriella libera RCEF 2490 (GCA_001636675)","Hypocreales","1081109","AAL_1.0","GCA_001636675.1","-","-","-","-","","-" +"","Moesziomyces antarcticus T-34 (GCA_000334475)","Ustilaginales","1151754","Pant_1.0","GCA_000334475.1","-","-","-","-","","-" +"","Moesziomyces antarcticus str. JCM 10317 (GCA_000747765)","Ustilaginales","84753","ASM74776v1","GCA_000747765.1","-","-","-","-","-","-" +"","Moesziomyces aphidis DSM 70725 (GCA_000517465)","Ustilaginales","1391700","PseuAph1.0","GCA_000517465.1","-","-","-","-","","-" +"","Moniliophthora perniciosa FA553 (GCA_000183025)","Agaricales","554373","ASM18302v1","GCA_000183025.1","-","-","-","-","","-" +"","Moniliophthora roreri MCA 2997 (GCA_000488995)","Agaricales","1381753","M_roreri_MCA_2997_v1","GCA_000488995.1","-","-","-","-","","-" +"","Moniliophthora roreri str. MCA 2952 (GCA_001466705)","Agaricales","221103","ASM146670v1","GCA_001466705.1","-","-","-","-","-","-" +"","Mortierella elongata AG-77","Mortierellomycotina","1314771","Mortierella_elongata_AG-77_v2.0","GCA_001651415.1","-","-","-","-","","-" +"","Mortierella verticillata NRRL 6337 (GCA_000739165)","Mortierellomycotina","1069443","Mort_vert_NRRL_6337_V1","GCA_000739165.1","-","-","-","-","","-" +"","Mucor ambiguus str. NBRC 6742 (GCA_000950595)","Mucoromycotina","91626","ASM95059v1","GCA_000950595.1","-","-","-","-","","-" +"","Mucor circinelloides f. circinelloides 1006PhL (GCA_000401635)","Mucoromycotina","1220926","Muco_sp_1006Ph_V1","GCA_000401635.1","-","-","-","-","","-" +"","Mucor circinelloides f. lusitanicus CBS 277.49","Mucoromycotina","747725","Mucci2","GCA_001638945.1","-","-","-","-","-","-" +"","Mycosphaerella eumusae str. CBS 114824 (GCA_001578235)","Capnodiales","321146","ASM157823v1","GCA_001578235.1","-","-","-","-","","-" +"","Nadsonia fulvescens var. elongata DSM 6958 (GCA_001661315)","Saccharomycetales","857566","Nadfu1","GCA_001661315.1","-","-","-","-","","-" +"","Naematelia encephala str. 68-887.2 (GCA_002105065)","Tremellales","71784","Treen1","GCA_002105065.1","-","-","-","-","","-" +"","Nannizzia gypsea CBS 118893 (GCA_000150975)","Onygenales","535722","MS_CBS118893","GCA_000150975.2","-","-","-","-","","-" +"","Naumovozyma castellii CBS 4309 (GCA_000237345)","Saccharomycetales","1064592","ASM23734v1","GCA_000237345.1","-","-","-","-","","-" +"","Naumovozyma dairenensis CBS 421 (GCA_000227115)","Saccharomycetales","1071378","ASM22711v2","GCA_000227115.2","-","-","-","-","","-" +"","Nematocida displodere str. JUm2807 (GCA_001642395)","Microsporidia","1805483","ASM164239v1","GCA_001642395.1","-","-","-","-","","-" +"","Nematocida parisii ERTm1 (GCA_000250985)","Microsporidia","881290","Nema_parisii_ERTm1_V3","GCA_000250985.1","-","-","-","-","-","-" +"","Nematocida parisii ERTm3 (GCA_000190615)","Microsporidia","935791","Nema_parisii_ERTm3_V1","GCA_000190615.1","-","-","-","-","","-" +"","Nematocida sp. 1 ERTm2 (GCA_000250695)","Microsporidia","944018","Nema_parisii_ERTm2_V1","GCA_000250695.1","-","-","-","-","","-" +"","Nematocida sp. 1 ERTm6 (GCA_000738915)","Microsporidia","1138374","Nema_sp_1_ERTm6_V2","GCA_000738915.1","-","-","-","-","-","-" +"","Nematocida sp. ERTm5 (GCA_001642415)","Microsporidia","1805481","ASM164241v1","GCA_001642415.1","-","-","-","-","-","-" +"","Neocallimastix californiae str. G1 (GCA_002104975)","","1754190","Neocallimastix_sp._G1_v1.0","GCA_002104975.1","-","-","-","-","","-" +"","Neofusicoccum parvum UCRNP2 (GCA_000385595)","Botryosphaeriales","1287680","UCRNP2V3","GCA_000385595.1","-","-","-","-","","-" +"","Neolecta irregularis DAH-3 (GCA_001929475)","Taphrinomycotina","1198029","NeoIirr1.0","GCA_001929475.1","-","-","-","-","","-" +"","Neolentinus lepideus HHB14362 ss-1 (GCA_001632425)","Gloeophyllales","1314782","Neole1","GCA_001632425.1","-","-","-","-","","-" +"","Neonectria ditissima str. R09/05 (GCA_001306435)","Hypocreales","78410","R0905_v2.0","GCA_001306435.1","-","-","-","-","","-" +"","Neurospora crassa","Sordariales","367110","NC12","GCA_000182925.2","-","-","-","","","" +"","Neurospora crassa str. 73 (GCA_000786625)","Sordariales","5141","Neucr_trp3_1","GCA_000786625.1","-","-","-","-","-","-" +"","Neurospora tetrasperma FGSC 2508 (GCA_000213175)","Sordariales","510951","v2.0","GCA_000213175.1","-","-","-","-","-","-" +"","Neurospora tetrasperma FGSC 2509 str. FGSC 2509 mat a (GCA_000213195)","Sordariales","510952","v1.0","GCA_000213195.1","-","-","-","-","","-" +"","Nosema apis BRL 01 (GCA_000447185)","Nosematidae","1037528","NapisBRLv01","GCA_000447185.1","-","-","-","-","","-" +"","Nosema bombycis CQ1 (GCA_000383075)","Nosematidae","578461","NosBomCQ1_v1.0","GCA_000383075.1","-","-","-","-","","-" +"","Nosema ceranae (GCA_000988165)","Nosematidae","40302","ASM98816v1","GCA_000988165.1","-","-","-","-","-","-" +"","Nosema ceranae BRL01 (GCA_000182985)","Nosematidae","578460","ASM18298v1","GCA_000182985.1","-","-","-","-","","-" +"","Ogataea parapolymorpha DL-1 (GCA_000187245)","Saccharomycetales","871575","Hansenula_2","GCA_000187245.3","-","-","-","-","","-" +"","Ogataea polymorpha str. NCYC 495 leu1.1 (GCA_001664045)","Saccharomycetales","460523","Hanpo2","GCA_001664045.1","-","-","-","-","","-" +"","Oidiodendron maius Zn (GCA_000827325)","Myxotrichaceae","913774","Oidiodendron_maius_Zn_v1.0","GCA_000827325.1","-","-","-","-","","-" +"","Ophiocordyceps australis (GCA_002591405)","Hypocreales","1399860","OphauG2","GCA_002591405.1","-","-","-","-","","-" +"","Ophiocordyceps australis (GCA_002591415)","Hypocreales","1399860","OphauB2","GCA_002591415.1","-","-","-","-","-","-" +"","Ophiocordyceps camponoti-rufipedis (GCA_002591395)","Hypocreales","2004952","Ophun1","GCA_002591395.1","-","-","-","-","","-" +"","Ophiocordyceps sinensis CO18 (GCA_000448365)","Hypocreales","911162","ASM44836v1","GCA_000448365.1","-","-","-","-","-","-" +"","Ophiocordyceps unilateralis str. SC16a (GCA_001272575)","Hypocreales","268505","ASM127257v2","GCA_001272575.2","-","-","-","-","-","-" +"","Ophiostoma piceae UAMH 11346 str. UAMH-11346 (GCA_000410735)","Ophiostomatales","1262450","Opiceae_UAMHv01","GCA_000410735.1","-","-","-","-","","-" +"","Ordospora colligata OC4 (GCA_000803265)","Ordosporidae","1354746","ASM80326v1","GCA_000803265.1","-","-","-","-","","-" +"","Pachysolen tannophilus NRRL Y-2460 (GCA_001661245)","Saccharomycetales","669874","Pacta1_2","GCA_001661245.1","-","-","-","-","","-" +"","Paracoccidioides brasiliensis Pb03 (GCA_000150475)","Onygenales","482561","Paracocci_br_Pb03_V2","GCA_000150475.2","-","-","-","-","-","-" +"","Paracoccidioides brasiliensis Pb18 (GCA_000150735)","Onygenales","502780","Paracocci_br_Pb18_V2","GCA_000150735.2","-","-","-","-","","-" +"","Paracoccidioides brasiliensis str. CNH (GCA_001713695)","Onygenales","121759","Paracocci_br_PbCNH","GCA_001713695.1","-","-","-","-","-","-" +"","Paracoccidioides brasiliensis str. Pb300 (GCA_001713645)","Onygenales","121759","ASM171364v1","GCA_001713645.1","-","-","-","-","-","-" +"","Paracoccidioides lutzii Pb01 (GCA_000150705)","Onygenales","502779","Paracocci_br_Pb01_V2","GCA_000150705.2","-","-","-","-","","-" +"","Paramicrosporidium saccamoebae str. KSL3 (GCA_002794465)","Cryptomycota","1246581","KSL3_v6","GCA_002794465.1","-","-","-","-","","-" +"","Paraphaeosphaeria sporulosa str. AP3s5-JAC2a (GCA_001642045)","Pleosporales","1460663","Parsp1","GCA_001642045.1","-","-","-","-","","-" +"","Paxillus involutus ATCC 200175 (GCA_000827475)","Boletales","664439","Paxillus_involutus_ATCC_200175_v1.0","GCA_000827475.1","-","-","-","-","","-" +"","Paxillus rubicundulus Ve08.2h10 (GCA_000827395)","Boletales","930991","Paxillus_rubicundulus_Ve08.2h10_v1.0","GCA_000827395.1","-","-","-","-","","-" +"","Penicilliopsis zonata CBS 506.65 (GCA_001890105)","Eurotiales","1073090","Aspzo1","GCA_001890105.1","-","-","-","-","","-" +"","Penicillium antarcticum (GCA_002072345)","Eurotiales","416450","ASM207234v1","GCA_002072345.1","-","-","-","-","","-" +"","Penicillium arizonense (GCA_001773325)","Eurotiales","1835702","ASM177332v1","GCA_001773325.1","-","-","-","-","-","-" +"","Penicillium brasilianum str. LaBioMMi 136 (GCA_002016555)","Eurotiales","104259","ASM201655v1","GCA_002016555.1","-","-","-","-","-","-" +"","Penicillium brasilianum str. MG11 (GCA_001048715)","Eurotiales","104259","Pbras_Allpaths-LG","GCA_001048715.1","-","-","-","-","","-" +"","Penicillium camemberti FM 013 (GCA_000513335)","Eurotiales","1429867","PCAMFM013_20131106","GCA_000513335.1","-","-","-","-","","-" +"","Penicillium chrysogenum str. P2niaD18 (GCA_000710275)","Eurotiales","5076","ASM71027v1","GCA_000710275.1","-","-","-","-","-","-" +"","Penicillium coprophilum (GCA_002072405)","Eurotiales","36646","ASM207240v1","GCA_002072405.1","-","-","-","-","-","-" +"","Penicillium decumbens (GCA_002072245)","Eurotiales","69771","ASM207224v1","GCA_002072245.1","-","-","-","-","-","-" +"","Penicillium digitatum PHI26 (GCA_000315665)","Eurotiales","1170229","PdigPHI26_v1","GCA_000315665.1","-","-","-","-","-","-" +"","Penicillium digitatum Pd1 (GCA_000315645)","Eurotiales","1170230","PdigPd1_v1","GCA_000315645.2","-","-","-","-","-","-" +"","Penicillium expansum str. CMP-1 (GCA_000769755)","Eurotiales","27334","PEX1","GCA_000769755.1","-","-","-","-","-","-" +"","Penicillium expansum str. MD-8 (GCA_000769745)","Eurotiales","27334","ASM76974v1","GCA_000769745.1","-","-","-","-","-","-" +"","Penicillium expansum str. d1 (GCA_000769735)","Eurotiales","27334","ASM76973v1","GCA_000769735.1","-","-","-","-","-","-" +"","Penicillium flavigenum (GCA_002072365)","Eurotiales","254877","ASM207236v1","GCA_002072365.1","-","-","-","-","-","-" +"","Penicillium freii (GCA_001513925)","Eurotiales","48697","ASM151392v1","GCA_001513925.1","-","-","-","-","-","-" +"","Penicillium griseofulvum str. PG3 (GCA_001561935)","Eurotiales","5078","ASM156193v1","GCA_001561935.1","-","-","-","-","-","-" +"","Penicillium italicum str. PHI-1 (GCA_000769765)","Eurotiales","40296","ASM76976v1","GCA_000769765.1","-","-","-","-","-","-" +"","Penicillium nalgiovense (GCA_002072425)","Eurotiales","60175","ASM207242v1","GCA_002072425.1","-","-","-","-","-","-" +"","Penicillium nordicum (GCA_001278595)","Eurotiales","229535","ASM127859v1","GCA_001278595.1","-","-","-","-","-","-" +"","Penicillium occitanis str. CL100 (GCA_002382855)","Eurotiales","290292","ASM238285v1","GCA_002382855.1","-","-","-","-","-","-" +"","Penicillium occitanis str. CT1 (GCA_002382835)","Eurotiales","290292","ASM238283v1","GCA_002382835.1","-","-","-","-","-","-" +"","Penicillium oxalicum 114-2 (GCA_000346795)","Eurotiales","933388","pde_v1.0","GCA_000346795.1","-","-","-","-","-","-" +"","Penicillium polonicum (GCA_002072265)","Eurotiales","60169","ASM207226v1","GCA_002072265.1","-","-","-","-","-","-" +"","Penicillium roqueforti FM164 (GCA_000513255)","Eurotiales","1365484","PROQFM164_20130607","GCA_000513255.1","-","-","-","-","-","-" +"","Penicillium rubens Wisconsin 54-1255 (GCA_000226395)","Eurotiales","500485","PenChr_Nov2007","GCA_000226395.1","-","-","-","-","-","-" +"","Penicillium solitum (GCA_002072235)","Eurotiales","60172","ASM207223v1","GCA_002072235.1","-","-","-","-","-","-" +"","Penicillium steckii (GCA_002072375)","Eurotiales","303698","ASM207237v1","GCA_002072375.1","-","-","-","-","-","-" +"","Penicillium subrubescens str. CBS 132785 (GCA_001908125)","Eurotiales","1316194","ASM190812v1","GCA_001908125.1","-","-","-","-","-","-" +"","Penicillium vulpinum (GCA_002072255)","Eurotiales","29845","ASM207225v1","GCA_002072255.1","-","-","-","-","-","-" +"","Peniophora sp. CONT (GCA_001632445)","Russulales","1314672","Ricme1","GCA_001632445.1","-","-","-","-","","-" +"","Periconia macrospinosa str. DSE2036 (GCA_003073855)","Pleosporales","97972","Perma1","GCA_003073855.1","-","-","-","-","","-" +"","Pestalotiopsis fici W106-1 (GCA_000516985)","Xylariales","1229662","PFICI","GCA_000516985.1","-","-","-","-","","-" +"","Pezoloma ericae str. UAMH 7357 (GCA_002865625)","Helotiales","1745343","Rhier1","GCA_002865625.1","-","-","-","-","","-" +"","Phaeoacremonium minimum UCRPA7 (GCA_000392275)","Sordariomycetidae","1286976","UCRPA7V03","GCA_000392275.1","-","-","-","-","","-" +"","Phaeomoniella chlamydospora (GCA_001006345)","Chaetothyriomycetidae","158046","UCRPA7V1.0","GCA_001006345.1","-","-","-","-","","-" +"","Phaeosphaeria nodorum","Pleosporales","321614","ASM14691v1","GCA_000146915.1","-","-","-","","","-" +"","Phanerochaete carnosa HHB-10118-sp (GCA_000300595)","Polyporales","650164","Phanerochaete_carnosa_HHB-10118-Sp_v1.0","GCA_000300595.1","-","-","-","-","","-" +"","Phellinus noxius (GCA_002287475)","Hymenochaetales","2282107","ASM228747v1","GCA_002287475.1","-","-","-","-","","-" +"","Phialocephala scopiformis str. CBS 120377 (GCA_001500285)","Helotiales","149040","Phisc1","GCA_001500285.1","-","-","-","-","","-" +"","Phialocephala subalpina (GCA_900073065)","Helotiales","576137","PAC_version_1","GCA_900073065.1","-","-","-","-","","-" +"","Phialophora americana str. CBS 27337 (GCA_000835435)","Chaetothyriomycetidae","5601","Capr_semi_CBS27337_V1","GCA_000835435.1","-","-","-","-","","-" +"","Phialophora attae str. CBS 131958 (GCA_001299255)","Chaetothyriomycetidae","1664694","ASM129925v1","GCA_001299255.1","-","-","-","-","","-" +"","Phlebia centrifuga str. FBCC195 (GCA_001913855)","Polyporales","98765","ASM191385v2","GCA_001913855.2","-","-","-","-","","-" +"","Phlebiopsis gigantea 11061_1 CR5-6 (GCA_000832265)","Polyporales","745531","Phlgi1","GCA_000832265.1","-","-","-","-","","-" +"","Pichia kudriavzevii str. 129 (GCA_001983325)","Saccharomycetales","4909","ASM198332v1","GCA_001983325.1","-","-","-","-","-","-" +"","Pichia kudriavzevii str. CBS573 (GCA_003054445)","Saccharomycetales","4909","ASM305444v1","GCA_003054445.1","-","-","-","-","-","-" +"","Pichia kudriavzevii str. Ckrusei653 (GCA_002166775)","Saccharomycetales","4909","Cand_krus_Ckrusei653_V21","GCA_002166775.1","-","-","-","-","-","-" +"","Pichia kudriavzevii str. SD108 (GCA_000764455)","Saccharomycetales","4909","ASM76445v1","GCA_000764455.1","-","-","-","-","","-" +"","Pichia membranifaciens NRRL Y-2026 (GCA_001661235)","Saccharomycetales","763406","Picme2","GCA_001661235.1","-","-","-","-","","-" +"","Pichia membranifaciens str. KS47-1 (GCA_001950575)","Saccharomycetales","4926","P_membrenifaciens-1.0","GCA_001950575.1","-","-","-","-","-","-" +"","Piloderma croceum F 1598 (GCA_000827315)","Atheliales","765440","Piloderma_croceum_F_1598_v1.0","GCA_000827315.1","-","-","-","-","","-" +"","Piromyces finnis (GCA_002104945)","","1754191","Piromyces_sp._finnis_v3.0","GCA_002104945.1","-","-","-","-","","-" +"","Piromyces sp. E2 (GCA_002157105)","","73868","PirspE2_v1.0","GCA_002157105.1","-","-","-","-","","-" +"","Pisolithus microcarpus 441 (GCA_000827275)","Boletales","765257","Pisolithus_microcarpus_441_v1.0","GCA_000827275.1","-","-","-","-","","-" +"","Pisolithus tinctorius Marx 270 (GCA_000827335)","Boletales","870435","Pisolithus_tinctorius_Marx_270_v1.0","GCA_000827335.1","-","-","-","-","","-" +"","Pleurotus ostreatus PC15 (GCA_000697685)","Agaricales","1137138","PleosPC15_2","GCA_000697685.1","-","-","-","-","","-" +"","Plicaturopsis crispa FD-325 SS-3 (GCA_000827205)","","944288","Plicr1","GCA_000827205.1","-","-","-","-","","-" +"","Pneumocystis carinii B80 (GCA_001477545)","Taphrinomycotina","1408658","Pneu_cari_B80_V3","GCA_001477545.1","-","-","-","-","","-" +"","Pneumocystis jirovecii RU7 (GCA_001477535)","Taphrinomycotina","1408657","Pneu_jiro_RU7_V2","GCA_001477535.1","-","-","-","-","","-" +"","Pneumocystis murina B123 (GCA_000349005)","Taphrinomycotina","1069680","Pneumo_murina_B123_V4","GCA_000349005.2","-","-","-","-","","-" +"","Pochonia chlamydosporia 170 (GCA_001653235)","Hypocreales","1380566","ASM165323v2","GCA_001653235.2","-","-","-","-","","-" +"","Podospora anserina S mat+ (GCA_000226545)","Sordariales","515849","ASM22654v1","GCA_000226545.1","-","-","-","-","-","-" +"","Polytolypa hystricis UAMH7299 (GCA_002573605)","Onygenales","1447883","Poly_hyst_7299_V1","GCA_002573605.1","-","-","-","-","","-" +"","Postia placenta MAD-698-R-SB12 (GCA_002117355)","Polyporales","670580","PosplRSB12_1","GCA_002117355.1","-","-","-","-","-","-" +"","Postia placenta Mad-698-R (GCA_000006255)","Polyporales","561896","Postia_placenta_V1.0","GCA_000006255.1","-","-","-","-","","-" +"","Protomyces lactucaedebilis str. 12-1054 (GCA_002105105)","Taphrinomycotina","56484","Prola1","GCA_002105105.1","-","-","-","-","","-" +"","Pseudocercospora fijiensis CIRAD86 (GCA_000340215)","Capnodiales","383855","Mycfi2","GCA_000340215.1","-","-","-","-","","-" +"","Pseudocercospora musae str. CBS 116634 (GCA_001578225)","Capnodiales","113226","ASM157822v1","GCA_001578225.1","-","-","-","-","","-" +"","Pseudogymnoascus destructans (GCA_001641265)","Pseudeurotiaceae","655981","ASM164126v1","GCA_001641265.1","-","-","-","-","-","-" +"","Pseudogymnoascus destructans 20631-21 (GCA_000184105)","Pseudeurotiaceae","658429","Geom_destructans_V1","GCA_000184105.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. 03VT05 (GCA_001662645)","Pseudeurotiaceae","1622148","ASM166264v1","GCA_001662645.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. 05NY08 (GCA_001662605)","Pseudeurotiaceae","1622149","ASM166260v1","GCA_001662605.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. 23342-1-I1 (GCA_001662575)","Pseudeurotiaceae","1524831","ASM166257v1","GCA_001662575.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. 24MN13 (GCA_001662595)","Pseudeurotiaceae","1622150","ASM166259v1","GCA_001662595.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-103 (GCA_000750895)","Pseudeurotiaceae","1420912","DG30","GCA_000750895.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-3557 (GCA_000750665)","Pseudeurotiaceae","1437433","DG3","GCA_000750665.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-3775 (GCA_000750715)","Pseudeurotiaceae","1420901","DG4","GCA_000750715.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-3808 (GCA_000750675)","Pseudeurotiaceae","1391699","DG1","GCA_000750675.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4246 (GCA_000750735)","Pseudeurotiaceae","1420902","DG5","GCA_000750735.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4281 (FW-2241) (GCA_000750745)","Pseudeurotiaceae","1420906","DG6","GCA_000750745.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4513 (FW-928) (GCA_000750755)","Pseudeurotiaceae","1420907","DG7","GCA_000750755.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4514 (FW-929) (GCA_000750795)","Pseudeurotiaceae","1420908","DG8","GCA_000750795.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4515 (FW-2607) (GCA_000750805)","Pseudeurotiaceae","1420909","DG10","GCA_000750805.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4516 (FW-969) (GCA_000750815)","Pseudeurotiaceae","1420910","DG11","GCA_000750815.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4517 (FW-2822) (GCA_000750875)","Pseudeurotiaceae","1420911","DG13","GCA_000750875.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4518 (FW-2643) (GCA_000750925)","Pseudeurotiaceae","1420913","DG36","GCA_000750925.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4519 (FW-2642) (GCA_000750935)","Pseudeurotiaceae","1420914","DG38","GCA_000750935.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. VKM F-4520 (FW-2644) (GCA_000750995)","Pseudeurotiaceae","1420915","DG39","GCA_000750995.1","-","-","-","-","-","-" +"","Pseudogymnoascus sp. WSF 3629 (GCA_001662585)","Pseudeurotiaceae","1622147","ASM166258v1","GCA_001662585.1","-","-","-","-","-","-" +"","Pseudogymnoascus verrucosus (GCA_001662655)","Pseudeurotiaceae","342668","ASM166265v1","GCA_001662655.1","-","-","-","-","-","-" +"","Pseudoloma neurophilia str. MK1 (GCA_001432165)","Microsporidia","146866","ASM143216v1","GCA_001432165.1","-","-","-","-","","-" +"","Pseudomassariella vexata str. CBS 129021 (GCA_002105095)","Xylariales","1141098","Pseve2","GCA_002105095.1","-","-","-","-","","-" +"","Pseudomicrostroma glucosiphilum str. MCA 4718 (GCA_003144135)","","1684307","Rhodsp1","GCA_003144135.1","-","-","-","-","","-" +"","Pseudozyma hubeiensis SY62 (GCA_000403515)","Ustilaginales","1305764","ASM40351v1","GCA_000403515.1","-","-","-","-","","-" +"","Puccinia coronata var. avenae f. sp. avenae (GCA_002873275)","Pucciniales","200324","ASM287327v1","GCA_002873275.1","-","-","-","-","","-" +"","Puccinia graminis","Pucciniales","418459","ASM14992v1","GCA_000149925.1","","-","","","","" +"","Puccinia graminis Ug99","Pucciniales","1040990","v1","-","","-","-","","","-" +"","Puccinia sorghi str. RO10H11247 (GCA_001263375)","Pucciniales","27349","ASM126337v1","GCA_001263375.1","-","-","-","-","","-" +"","Puccinia striiformis (GCA_002920065)","Pucciniales","27350","ASM292006v1","GCA_002920065.1","-","-","-","-","","-" +"","Puccinia striiformis f. sp. tritici PST-130 str. Race 130","Pucciniales","875184","PST-130_1.0","GCA_000223505.1","-","-","-","","-","-" +"","Puccinia striiformis f. sp. tritici PST-78 (GCA_001191645)","Pucciniales","1165861","P_striiformis_V1","GCA_001191645.1","-","-","-","-","-","-" +"","Puccinia triticina","Pucciniales","630390","ASM15152v1","GCA_000151525.1","-","-","","","","-" +"","Punctularia strigosozonata HHB-11173 SS5 (GCA_000264995)","Corticiales","741275","Punctularia_strigosozonata_v1.0","GCA_000264995.1","-","-","-","-","","-" +"","Purpureocillium lilacinum (GCA_001653205)","Hypocreales","33203","ASM165320v1","GCA_001653205.1","-","-","-","-","","-" +"","Purpureocillium lilacinum (GCA_001653265)","Hypocreales","33203","ASM165326v1","GCA_001653265.1","-","-","-","-","-","-" +"","Purpureocillium lilacinum str. 36-1 (GCA_003144605)","Hypocreales","33203","ASM314460v1","GCA_003144605.1","-","-","-","-","-","-" +"","Pyrenochaeta sp. DS3sAY3a (GCA_001644535)","Pleosporales","765867","Pyrsp1","GCA_001644535.1","-","-","-","-","","-" +"","Pyrenophora teres","Pleosporales","861557","GCA_000166005.1","GCA_000166005.1","-","-","-","","","-" +"","Pyrenophora tritici-repentis (GCA_003171545)","Pleosporales","45151","PtrARCrossB10","GCA_003171545.1","-","-","-","-","-","-" +"","Pyrenophora tritici-repentis (GCA_003231325)","Pleosporales","45151","Ptr134","GCA_003231325.1","-","-","-","-","-","-" +"","Pyrenophora tritici-repentis (GCA_003231365)","Pleosporales","45151","Ptr239","GCA_003231365.1","-","-","-","-","-","-" +"","Pyrenophora tritici-repentis (GCA_003231425)","Pleosporales","45151","Ptr86-124","GCA_003231425.1","-","-","-","-","-","-" +"","Pyrenophora tritici-repentis Pt-1C-BFP","Pleosporales","426418","ASM14998v1","GCA_000149985.1","-","-","-","-","","-" +"","Rachicladosporium antarcticum (GCA_002077065)","Capnodiales","1507870","ASM207706v1","GCA_002077065.1","-","-","-","-","","-" +"","Rachicladosporium sp. CCFEE 5018 (GCA_002077045)","Capnodiales","1974281","ASM207704v2","GCA_002077045.2","-","-","-","-","","-" +"","Ramularia collo-cygni (GCA_900074925)","Capnodiales","112498","version_1","GCA_900074925.1","-","-","-","-","","-" +"","Rasamsonia emersonii CBS 393.64 (GCA_000968595)","Eurotiales","1408163","ASM96859v1","GCA_000968595.1","-","-","-","-","","-" +"","Rhinocladiella mackenziei CBS 650.93 (GCA_000835555)","Chaetothyriomycetidae","1442369","Rhin_mack_CBS_650_93_V1","GCA_000835555.1","-","-","-","-","","-" +"","Rhizoclosmatium globosum str. JEL800 (GCA_002104985)","Chytridiomycetes","329046","Rhihy1","GCA_002104985.1","-","-","-","-","","-" +"","Rhizoctonia solani (GCA_001286725)","Cantharellales","456999","AG22IIIB","GCA_001286725.1","-","-","-","-","-","-" +"","Rhizoctonia solani 123E (GCA_000715385)","Cantharellales","1423351","Rhizoctonia_solani_123E_v1","GCA_000715385.1","-","-","-","-","-","-" +"","Rhizoctonia solani AG-1 IA str. AG1 IA (GCA_000334115)","Cantharellales","983506","Rhisol_AG1IA_1.0","GCA_000334115.1","-","-","-","-","","-" +"","Rhizoctonia solani AG-1 IB (GCA_000350255)","Cantharellales","1108050","ASM35025v1","GCA_000350255.1","-","-","-","-","-","-" +"","Rhizoctonia solani AG-3 Rhs1AP (GCA_000524645)","Cantharellales","1086054","Rhizoctonia_solani_AG-3","GCA_000524645.1","-","-","-","-","-","-" +"","Rhizoctonia solani AG-8 WAC10335 (GCA_000695385)","Cantharellales","1287689","RSAG8-1.V1","GCA_000695385.1","-","-","-","-","-","-" +"","Rhizophagus clarus str. HR1","Glomerales","94130","RclarusHR1_1.0","GCA_003203555.1","-","-","-","-","","-" +"","Rhizophagus irregularis DAOM 181602=DAOM 197198","Glomerales","747089","Rir_HGAP_ii_V2","GCA_002897155.1","-","-","-","-","-","-" +"","Rhizophagus irregularis DAOM 181602=DAOM 197198 (GCA_000439145)","Glomerales","747089","ASM43914v3","GCA_000439145.3","-","-","-","-","-","-" +"","Rhizophagus irregularis DAOM 197198w str. DAOM197198w (GCA_000597685)","Glomerales","1432141","Rir","GCA_000597685.1","-","-","-","-","-","-" +"","Rhizophagus irregularis str. A1","Glomerales","588596","ASM159312v1","GCA_001593125.1","-","-","-","-","-","-" +"","Rhizophagus irregularis str. A4","Glomerales","588596","ASM159314v1","GCA_001593145.1","-","-","-","-","-","-" +"","Rhizophagus irregularis str. A5","Glomerales","588596","ASM159320v1","GCA_001593205.1","-","-","-","-","-","-" +"","Rhizophagus irregularis str. C2","Glomerales","588596","ASM159315v1","GCA_001593155.1","-","-","-","-","-","-" +"","Rhizopogon vesiculosus str. AM-OR11-056 (GCA_001882365)","Boletales","180088","Rves_AM-OR11-056_1.0","GCA_001882365.1","-","-","-","-","","-" +"","Rhizopogon vinicolor AM-OR11-026 (GCA_001658105)","Boletales","1314800","Rhivi1","GCA_001658105.1","-","-","-","-","-","-" +"","Rhizopus delemar RA 99-880 (GCA_000149305)","Mucoromycotina","246409","RO3","GCA_000149305.1","-","-","-","-","","-" +"","Rhizopus microsporus ATCC 52813","Mucoromycotina","1340429","Rhimi1_1","GCA_002708625.1","-","-","-","-","-","-" +"","Rhizopus microsporus str. ATCC 11559","Mucoromycotina","58291","Rhimi_ATCC11559_1","GCA_002083735.1","-","-","-","-","-","-" +"","Rhizopus microsporus str. ATCC62417 (GCA_900000135)","Mucoromycotina","58291","RMATCC62417_Allpaths-LG","GCA_900000135.1","-","-","-","-","-","-" +"","Rhizopus microsporus str. CBS-344.29 (GCA_000825725)","Mucoromycotina","58291","Rmicro_CBS_344.29_Allpaths-LG","GCA_000825725.1","-","-","-","-","","-" +"","Rhizopus microsporus var. microsporus str. ATCC 52814","Mucoromycotina","86635","Rhimi_ATCC52814_1","GCA_002083745.1","-","-","-","-","-","-" +"","Rhodotorula graminis WP1 (GCA_001329695)","Sporidiobolales","578459","Rhoba1_1","GCA_001329695.1","-","-","-","-","","-" +"","Rhodotorula sp. JG-1b (GCA_001541205)","Sporidiobolales","1305733","Rhosp1","GCA_001541205.1","-","-","-","-","-","-" +"","Rhodotorula taiwanensis str. MD1149 (GCA_002922495)","Sporidiobolales","741276","ASM292249v1","GCA_002922495.1","-","-","-","-","-","-" +"","Rhodotorula toruloides (GCA_001255795)","Sporidiobolales","5286","IFO0880_HGAP3_v1","GCA_001255795.1","-","-","-","-","-","-" +"","Rhodotorula toruloides ATCC 204091 (GCA_000222205)","Sporidiobolales","1001064","R.glutinis2","GCA_000222205.2","-","-","-","-","","-" +"","Rhodotorula toruloides NP11 (GCA_000320785)","Sporidiobolales","1130832","RHOziaDV1.0","GCA_000320785.2","-","-","-","-","-","-" +"","Rhynchosporium agropyri (GCA_900074905)","Helotiales","914238","version_1","GCA_900074905.1","-","-","-","-","","-" +"","Rhynchosporium commune (GCA_900074885)","Helotiales","914237","version_1","GCA_900074885.1","-","-","-","-","","-" +"","Rhynchosporium secalis (GCA_900074895)","Helotiales","38038","version_1","GCA_900074895.1","-","-","-","-","","-" +"","Rosellinia necatrix str. W97 (GCA_001445595)","Xylariales","77044","Rnecatrix_2.0","GCA_001445595.3","-","-","-","-","","-" +"","Rozella allomycis CSF55 (GCA_000442015)","Cryptomycota","988480","Rozella_k41_t100","GCA_000442015.1","-","-","-","-","","-" +"","Rutstroemia sp. NJR-2017a BBW (GCA_002946425)","Helotiales","2070414","ASM294642v1","GCA_002946425.1","-","-","-","-","","-" +"","Rutstroemia sp. NJR-2017a BVV2 (GCA_002946415)","Helotiales","2070413","ASM294641v1","GCA_002946415.1","-","-","-","-","","-" +"","Rutstroemia sp. NJR-2017a WRK4 (GCA_002946385)","Helotiales","2070412","ASM294638v1","GCA_002946385.1","-","-","-","-","","-" +"","Saccharomyces arboricola H-6 (GCA_000292725)","Saccharomycetales","1160507","SacArb1.0","GCA_000292725.1","-","-","-","-","","-" +"","Saccharomyces cerevisiae","Saccharomycetales","559292","R64-1-1","GCA_000146045.2","","","","","","" +"","Saccharomyces cerevisiae (GCA_001634645)","Saccharomycetales","4932","GLBRCY22-3","GCA_001634645.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae (GCA_002804325)","Saccharomycetales","4932","ASM280432v1","GCA_002804325.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae CEN.PK113-7D (GCA_000269885)","Saccharomycetales","889517","ASM26988v1","GCA_000269885.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae EC1118 (GCA_000218975)","Saccharomycetales","643680","ASM21897v1","GCA_000218975.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae FostersB (GCA_000190255)","Saccharomycetales","764102","ScFostersB_v01","GCA_000190255.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae FostersO (GCA_000326005)","Saccharomycetales","764101","ScFostersO_v01","GCA_000326005.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae Kyokai no. 7 str. kyokai no. 7 (GCA_000260735)","Saccharomycetales","721032","K7_1.0","GCA_000260735.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae Lalvin QA23 (GCA_000325965)","Saccharomycetales","764098","ScQA23_v01","GCA_000325965.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae P283 (GCA_000568295)","Saccharomycetales","1177187","P283","GCA_000568295.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae P301 (GCA_000568055)","Saccharomycetales","1182968","p301","GCA_000568055.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae R103 (GCA_000568365)","Saccharomycetales","1182967","R103","GCA_000568365.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae RM11-1a (GCA_000149365)","Saccharomycetales","285006","ASM14936v1","GCA_000149365.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae VL3 (GCA_000190235)","Saccharomycetales","764100","ScVL3_v01","GCA_000190235.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae Vin13 (GCA_000190215)","Saccharomycetales","764099","ScVIN13_v01","GCA_000190215.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1078 (GCA_000975645)","Saccharomycetales","1296266","Sc_YJM1078_v1","GCA_000975645.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1083 (GCA_000975675)","Saccharomycetales","1292971","Sc_YJM1083_v1","GCA_000975675.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1129 (GCA_000975705)","Saccharomycetales","1293430","Sc_YJM1129_v1","GCA_000975705.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1133 (GCA_000976695)","Saccharomycetales","1294333","Sc_YJM1133_v1","GCA_000976695.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1190 (GCA_000976725)","Saccharomycetales","1294334","Sc_YJM1190_v1","GCA_000976725.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1199 (GCA_000976755)","Saccharomycetales","1294335","Sc_YJM1199_v1","GCA_000976755.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1202 (GCA_000976785)","Saccharomycetales","1294336","Sc_YJM1202_v1","GCA_000976785.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1208 (GCA_000976815)","Saccharomycetales","1294337","Sc_YJM1208_v1","GCA_000976815.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1242 (GCA_000976845)","Saccharomycetales","1294338","Sc_YJM1242_v1","GCA_000976845.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1244 (GCA_000976875)","Saccharomycetales","1294339","Sc_YJM1244_v1","GCA_000976875.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1248 (GCA_000976905)","Saccharomycetales","1294340","Sc_YJM1248_v1","GCA_000976905.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1250 (GCA_000976935)","Saccharomycetales","1294341","Sc_YJM1250_v1","GCA_000976935.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1252 (GCA_000976965)","Saccharomycetales","1294342","Sc_YJM1252_v1","GCA_000976965.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1273 (GCA_000976995)","Saccharomycetales","1294343","Sc_YJM1273_v1","GCA_000976995.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1304 (GCA_000977025)","Saccharomycetales","1294344","Sc_YJM1304_v1","GCA_000977025.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1307 (GCA_000977055)","Saccharomycetales","1294345","Sc_YJM1307_v1","GCA_000977055.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1311 (GCA_000977085)","Saccharomycetales","1294346","Sc_YJM1311_v1","GCA_000977085.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1326 (GCA_000977115)","Saccharomycetales","1294347","Sc_YJM1326_v1","GCA_000977115.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1332 (GCA_000977145)","Saccharomycetales","1294348","Sc_YJM1332_v1","GCA_000977145.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1336 (GCA_000977175)","Saccharomycetales","1294349","Sc_YJM1336_v1","GCA_000977175.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1338 (GCA_000977205)","","1294350","Sc_YJM1338_v1","GCA_000977205.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1341 (GCA_000977235)","Saccharomycetales","1294351","Sc_YJM1341_v1","GCA_000977235.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1342 (GCA_000977265)","Saccharomycetales","1294352","Sc_YJM1342_v1","GCA_000977265.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1355 (GCA_000977295)","Saccharomycetales","1294353","Sc_YJM1355_v1","GCA_000977295.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1356 (GCA_000977325)","Saccharomycetales","1294354","Sc_YJM1356_v1","GCA_000977325.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1381 (GCA_000977355)","Saccharomycetales","1294355","Sc_YJM1381_v1","GCA_000977355.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1383 (GCA_000977385)","Saccharomycetales","1294356","Sc_YJM1383_v1","GCA_000977385.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1385 (GCA_000977415)","Saccharomycetales","1294357","Sc_YJM1385_v1","GCA_000977415.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1386 (GCA_000977445)","Saccharomycetales","1294358","Sc_YJM1386_v1","GCA_000977445.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1387 (GCA_000977475)","Saccharomycetales","1294359","Sc_YJM1387_v1","GCA_000977475.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1388 (GCA_000977505)","Saccharomycetales","1294360","Sc_YJM1388_v1","GCA_000977505.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1389 (GCA_000977535)","Saccharomycetales","1294361","Sc_YJM1389_v1","GCA_000977535.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1399 (GCA_000977565)","Saccharomycetales","1294362","Sc_YJM1399_v1","GCA_000977565.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1400 (GCA_000977595)","Saccharomycetales","1294363","Sc_YJM1400_v1","GCA_000977595.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1401 (GCA_000977625)","Saccharomycetales","1294364","Sc_YJM1401_v1","GCA_000977625.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1402 (GCA_000977655)","Saccharomycetales","1294365","Sc_YJM1402_v1","GCA_000977655.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1415 (GCA_000977685)","Saccharomycetales","1294366","Sc_YJM1415_v1","GCA_000977685.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1417 (GCA_000977715)","Saccharomycetales","1294367","Sc_YJM1417_v1","GCA_000977715.4","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1418 (GCA_000977745)","Saccharomycetales","1294368","Sc_YJM1418_v1","GCA_000977745.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1419 (GCA_000977775)","Saccharomycetales","1294369","Sc_YJM1419_v1","GCA_000977775.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1433 (GCA_000977805)","Saccharomycetales","1294370","Sc_YJM1433_v1","GCA_000977805.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1434 (GCA_000977835)","Saccharomycetales","1294371","Sc_YJM1434_v1","GCA_000977835.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1439 (GCA_000977865)","Saccharomycetales","1294372","Sc_YJM1439_v1","GCA_000977865.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1443 (GCA_000977895)","Saccharomycetales","1294373","Sc_YJM1443_v1","GCA_000977895.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1444 (GCA_000977925)","Saccharomycetales","1294374","Sc_YJM1444_v1","GCA_000977925.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1447 (GCA_000977955)","Saccharomycetales","1294375","Sc_YJM1447_v1","GCA_000977955.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1450 (GCA_000977985)","Saccharomycetales","1294376","Sc_YJM1450_v1","GCA_000977985.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1460 (GCA_000978015)","Saccharomycetales","1294377","Sc_YJM1460_v1","GCA_000978015.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1463 (GCA_000978045)","Saccharomycetales","1294378","Sc_YJM1463_v1","GCA_000978045.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1477 (GCA_000978075)","Saccharomycetales","1294379","Sc_YJM1477_v1","GCA_000978075.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1478 (GCA_000978105)","Saccharomycetales","1294380","Sc_YJM1478_v1","GCA_000978105.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1479 (GCA_000978135)","Saccharomycetales","1294381","Sc_YJM1479_v1","GCA_000978135.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1526 (GCA_000978165)","Saccharomycetales","1294382","Sc_YJM1526_v1","GCA_000978165.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1527 (GCA_000978195)","Saccharomycetales","1294383","Sc_YJM1527_v1","GCA_000978195.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1549 (GCA_000978225)","Saccharomycetales","1294384","Sc_YJM1549_v1","GCA_000978225.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1573 (GCA_000978255)","Saccharomycetales","1294385","Sc_YJM1573_v1","GCA_000978255.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1574 (GCA_000978285)","Saccharomycetales","1294386","Sc_YJM1574_v1","GCA_000978285.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1592 (GCA_000978315)","Saccharomycetales","1294387","Sc_YJM1592_v1","GCA_000978315.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM1615 (GCA_000978345)","Saccharomycetales","1294388","Sc_YJM1615_v1","GCA_000978345.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM189 (GCA_000975735)","Saccharomycetales","1294303","Sc_YJM189_v1","GCA_000975735.4","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM193 (GCA_000975765)","Saccharomycetales","1294304","Sc_YJM193_v1","GCA_000975765.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM195 (GCA_000975585)","Saccharomycetales","1294305","Sc_YJM195_v1","GCA_000975585.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM244 (GCA_000975615)","Saccharomycetales","1294306","Sc_YJM244_v1","GCA_000975615.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM248 (GCA_000975795)","Saccharomycetales","1294307","Sc_YJM248_v1","GCA_000975795.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM270 (GCA_000975825)","Saccharomycetales","1294308","Sc_YJM270_v1","GCA_000975825.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM271 (GCA_000975855)","Saccharomycetales","1294309","Sc_YJM271_v1","GCA_000975855.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM320 (GCA_000975885)","Saccharomycetales","947042","Sc_YJM320_v1","GCA_000975885.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM326 (GCA_000975915)","Saccharomycetales","468558","Sc_YJM326_v1","GCA_000975915.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM428 (GCA_000975945)","Saccharomycetales","947044","Sc_YJM428_v1","GCA_000975945.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM450 (GCA_000975975)","Saccharomycetales","1294310","Sc_YJM450_v1","GCA_000975975.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM451 (GCA_000976005)","Saccharomycetales","502869","Sc_YJM451_v1","GCA_000976005.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM453 (GCA_000976035)","Saccharomycetales","1294311","Sc_YJM453_v1","GCA_000976035.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM456 (GCA_000976065)","Saccharomycetales","1294312","Sc_YJM456_v1","GCA_000976065.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM470 (GCA_000976095)","Saccharomycetales","1294313","Sc_YJM470_v1","GCA_000976095.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM541 (GCA_000976125)","Saccharomycetales","1294314","Sc_YJM541_v1","GCA_000976125.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM554 (GCA_000976155)","Saccharomycetales","1294315","Sc_YJM554_v1","GCA_000976155.4","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM555 (GCA_000976185)","Saccharomycetales","1294316","Sc_YJM555_v1","GCA_000976185.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM627 (GCA_000976215)","Saccharomycetales","1294317","Sc_YJM627_v1","GCA_000976215.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM681 (GCA_000976245)","Saccharomycetales","1294318","Sc_YJM681_v1","GCA_000976245.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM682 (GCA_000976275)","Saccharomycetales","1294319","Sc_YJM682_v1","GCA_000976275.4","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM683 (GCA_000976305)","Saccharomycetales","1294320","Sc_YJM683_v1","GCA_000976305.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM689 (GCA_000976335)","Saccharomycetales","1294321","Sc_YJM689_v1","GCA_000976335.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM693 (GCA_000976365)","Saccharomycetales","1294322","Sc_YJM693_v1","GCA_000976365.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM789 (GCA_000181435)","Saccharomycetales","307796","ASM18143v1","GCA_000181435.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM969 (GCA_000976395)","Saccharomycetales","1294323","Sc_YJM969_v1","GCA_000976395.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM972 (GCA_000976425)","Saccharomycetales","1294324","Sc_YJM972_v1","GCA_000976425.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM975 (GCA_000976455)","Saccharomycetales","1294325","Sc_YJM975_v1","GCA_000976455.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM978 (GCA_000976485)","Saccharomycetales","1294326","Sc_YJM978_v1","GCA_000976485.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM981 (GCA_000976515)","Saccharomycetales","1294327","Sc_YJM981_v1","GCA_000976515.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM984 (GCA_000976545)","Saccharomycetales","1294328","Sc_YJM984_v1","GCA_000976545.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM987 (GCA_000976575)","Saccharomycetales","1294329","Sc_YJM987_v1","GCA_000976575.4","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM990 (GCA_000976605)","Saccharomycetales","1294330","Sc_YJM990_v1","GCA_000976605.3","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM993 (GCA_000662435)","Saccharomycetales","1294331","Sc_YJM993_v1","GCA_000662435.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae YJM996 (GCA_000976665)","Saccharomycetales","1294332","Sc_YJM996_v1","GCA_000976665.2","-","-","-","-","-","-" +"","Saccharomyces cerevisiae str. 131 (GCA_001983315)","Saccharomycetales","4932","ASM198331v1","GCA_001983315.1","-","-","-","-","-","-" +"","Saccharomyces cerevisiae x Saccharomyces kudriavzevii VIN7 (GCA_000326105)","Saccharomycetales","1095631","ASM32610v1","GCA_000326105.1","-","-","-","-","-","-" +"","Saccharomyces eubayanus str. FM1318 (GCA_001298625)","Saccharomycetales","1080349","SEUB3.0","GCA_001298625.1","-","-","-","-","","-" +"","Saccharomyces kudriavzevii IFO 1802 (GCA_000167075)","Saccharomycetales","226230","Saccharomyces_kudriavzevii_strain_IFO1802_v1.0","GCA_000167075.2","-","-","-","-","","-" +"","Saccharomyces sp. 'boulardii' str. biocodex (GCA_001298375)","Saccharomycetales","252598","ASM129837v2","GCA_001298375.2","-","-","-","-","","-" +"","Saccharomyces sp. 'boulardii' str. unique28 (GCA_001413975)","Saccharomycetales","252598","ASM141397v1","GCA_001413975.1","-","-","-","-","-","-" +"","Saccharomycetaceae sp. 'Ashbya aceri' (GCA_000412225)","Saccharomycetales","566037","ASM41222v2","GCA_000412225.2","-","-","-","-","","-" +"","Saitoella complicata NRRL Y-17804 (GCA_000227095)","Taphrinomycotina","698492","Scomplicata_3.0","GCA_000227095.3","-","-","-","-","","-" +"","Saitoella complicata NRRL Y-17804 (GCA_001661265)","Taphrinomycotina","698492","Saico1","GCA_001661265.1","-","-","-","-","-","-" +"","Scedosporium apiospermum str. IHEM 14462 (GCA_000732125)","Microascales","563466","ScApio1.0","GCA_000732125.1","-","-","-","-","","-" +"","Scheffersomyces stipitis CBS 6054 (GCA_000209165)","Saccharomycetales","322104","ASM20916v1","GCA_000209165.1","-","-","-","-","","-" +"","Schizophyllum commune H4-8 (GCA_000143185)","Agaricales","578458","v1.0","GCA_000143185.1","-","-","-","-","","-" +"","Schizopora paradoxa str. KUC8140 (GCA_001020605)","Hymenochaetales","27342","Schpa1","GCA_001020605.1","-","-","-","-","","-" +"","Schizosaccharomyces cryophilus","Schizosaccharomycetales","653667","GCA_000004155.2","GCA_000004155.2","-","-","","","","-" +"","Schizosaccharomyces japonicus","Schizosaccharomycetales","402676","GCA_000149845.2","GCA_000149845.2","-","-","","","","-" +"","Schizosaccharomyces octosporus","Schizosaccharomycetales","483514","GCA_000150505.2","GCA_000150505.2","-","-","","","","-" +"","Schizosaccharomyces pombe","Schizosaccharomycetales","284812","ASM294v2","GCA_000002945.2","","-","","","","" +"","Scleroderma citrinum Foug A (GCA_000827425)","Boletales","1036808","Scleroderma_citrinum_Foug_A_v1.0","GCA_000827425.1","-","-","-","-","","-" +"","Sclerotinia borealis F-4128 (GCA_000503235)","Sclerotiniaceae","1432307","SBOR_1","GCA_000503235.1","-","-","-","-","","-" +"","Sclerotinia sclerotiorum","Sclerotiniaceae","665079","ASM14694v1","GCA_000146945.1","-","-","-","","","-" +"","Sclerotinia sclerotiorum 1980 UF-70 (GCA_001857865)","Sclerotiniaceae","665079","ASM185786v1","GCA_001857865.1","-","-","-","-","-","-" +"","Serendipita indica DSM 11827 (GCA_000313545)","Sebacinales","1109443","ASM31354v1","GCA_000313545.1","-","-","-","-","","-" +"","Serendipita vermifera MAFF 305830 (GCA_000827415)","Sebacinales","933852","Sebacina_vermifera_MAFF_305830_v1.0","GCA_000827415.1","-","-","-","-","","-" +"","Serpula lacrymans var. lacrymans S7.3 (GCA_000218725)","Boletales","936435","v1.0","GCA_000218725.1","-","-","-","-","","-" +"","Serpula lacrymans var. lacrymans S7.9 (GCA_000218685)","Boletales","578457","v1.0","GCA_000218685.1","-","-","-","-","-","-" +"","Sistotremastrum niveocremeum HHB9708 (GCA_001630475)","","1314777","Sisni1","GCA_001630475.1","-","-","-","-","","-" +"","Sistotremastrum suecicum HHB10207 ss-3 (GCA_001632355)","","1314776","Sissu1","GCA_001632355.1","-","-","-","-","","-" +"","Sordaria macrospora k-hell (GCA_000182805)","Sordariales","771870","ASM18280v2","GCA_000182805.2","-","-","-","-","","-" +"","Spathaspora passalidarum NRRL Y-27907 (GCA_000223485)","Saccharomycetales","619300","Spathaspora_passalidarum_v2.0","GCA_000223485.1","-","-","-","-","","-" +"","Sphaerobolus stellatus SS14 (GCA_000827215)","Geastrales","990650","Sphst1","GCA_000827215.1","-","-","-","-","","-" +"","Sphaerulina musiva SO2202 (GCA_000320565)","Capnodiales","692275","Septoria_musiva_SO2202_v1.0","GCA_000320565.2","-","-","-","-","","-" +"","Spizellomyces punctatus DAOM BR117 (GCA_000182565)","Chytridiomycetes","645134","S_punctatus_V1","GCA_000182565.2","-","-","-","-","","-" +"","Sporisorium reilianum","Ustilaginales","999809","GCA_000230245.1","GCA_000230245.1","-","-","-","","","-" +"","Sporisorium reilianum f. sp. reilianum (GCA_900162835)","Ustilaginales","72559","version_2","GCA_900162835.1","-","-","-","-","-","-" +"","Sporothrix brasiliensis 5110 (GCA_000820605)","Ophiostomatales","1398154","S_brasiliensis_5110_v1","GCA_000820605.1","-","-","-","-","","-" +"","Sporothrix insectorum RCEF 264 (GCA_001636815)","Ophiostomatales","1081102","SPI_1.0","GCA_001636815.1","-","-","-","-","","-" +"","Sporothrix schenckii 1099-18 (GCA_000961545)","Ophiostomatales","1397361","S_schenckii_v1","GCA_000961545.1","-","-","-","-","-","-" +"","Sporothrix schenckii ATCC 58251 (GCA_000474925)","Ophiostomatales","1391915","Spor_sche_ATCC58251_V1","GCA_000474925.1","-","-","-","-","","-" +"","Spraguea lophii 42_110 (GCA_000430065)","Spraguidae","1358809","Sprlop1.0","GCA_000430065.1","-","-","-","-","","-" +"","Stachybotrys chartarum IBT 40288 (GCA_000732765)","Hypocreales","1283842","S40288v1","GCA_000732765.1","-","-","-","-","","-" +"","Stachybotrys chartarum IBT 40293 (GCA_000732565)","Hypocreales","1280524","S40293v1","GCA_000732565.1","-","-","-","-","-","-" +"","Stachybotrys chartarum IBT 7711 (GCA_000730325)","Hypocreales","1280523","S7711v1","GCA_000730325.1","-","-","-","-","-","-" +"","Stachybotrys chlorohalonata IBT 40285 (GCA_000732775)","Hypocreales","1283841","S40285v1","GCA_000732775.1","-","-","-","-","","-" +"","Stagonospora sp. SRC1lsM3a (GCA_001644525)","Pleosporales","765868","Stasp1","GCA_001644525.1","-","-","-","-","","-" +"","Stemphylium lycopersici str. CIDEFI 216 (GCA_001191545)","Pleosporales","183478","ASM119154v1","GCA_001191545.1","-","-","-","-","","-" +"","Stereum hirsutum FP-91666 SS1 (GCA_000264905)","Russulales","721885","Stehi1","GCA_000264905.1","-","-","-","-","","-" +"","Sugiyamaella lignohabitans str. CBS 10342 (GCA_001640025)","Saccharomycetales","796027","ASM164002v2","GCA_001640025.2","-","-","-","-","","-" +"","Suhomyces tanzawaensis NRRL Y-17324 (GCA_001661415)","Saccharomycetales","984487","Canta1","GCA_001661415.1","-","-","-","-","","-" +"","Suillus luteus UH-Slu-Lm8-n1 (GCA_000827255)","Boletales","930992","Suilu1","GCA_000827255.1","-","-","-","-","","-" +"","Syncephalastrum racemosum str. NRRL 2496","Mucoromycotina","13706","Synrac1","GCA_002105135.1","-","-","-","-","","-" +"","Talaromyces atroroseus str. IBT 11181 (GCA_001907595)","Eurotiales","1441469","ASM190759v1","GCA_001907595.1","-","-","-","-","","-" +"","Talaromyces cellulolyticus str. Y-94 (GCA_000829775)","Eurotiales","1472165","TcelY94_1.0","GCA_000829775.1","-","-","-","-","","-" +"","Talaromyces islandicus (GCA_000985935)","Eurotiales","28573","PIS","GCA_000985935.1","-","-","-","-","","-" +"","Talaromyces marneffei ATCC 18224 (GCA_000001985)","Eurotiales","441960","JCVI-PMFA1-2.0","GCA_000001985.1","-","-","-","-","","-" +"","Talaromyces marneffei PM1 (GCA_000750115)","Eurotiales","1077442","ASM75011v1","GCA_000750115.1","-","-","-","-","-","-" +"","Talaromyces stipitatus ATCC 10500 (GCA_000003125)","Eurotiales","441959","JCVI-TSTA1-3.0","GCA_000003125.1","-","-","-","-","","-" +"","Termitomyces sp. J132 (GCA_001263195)","Agaricales","1306850","TerJ1321.0","GCA_001263195.1","-","-","-","-","","-" +"","Testicularia cyperi str. MCA 3645 (GCA_003144125)","Ustilaginales","1882483","Tescy1","GCA_003144125.1","-","-","-","-","","-" +"","Tetrapisispora blattae CBS 6284 (GCA_000315915)","Saccharomycetales","1071380","ASM31591v1","GCA_000315915.1","-","-","-","-","","-" +"","Tetrapisispora phaffii CBS 4417 (GCA_000236905)","Saccharomycetales","1071381","ASM23690v1","GCA_000236905.1","-","-","-","-","","-" +"","Thermothelomyces thermophila ATCC 42464 (GCA_000226095)","Sordariales","573729","ASM22609v1","GCA_000226095.1","-","-","-","-","","-" +"","Thielavia terrestris NRRL 8126 (GCA_000226115)","Sordariales","578455","ASM22611v1","GCA_000226115.1","-","-","-","-","","-" +"","Thielaviopsis punctulata (GCA_000968615)","Microascales","72032","ASM96861v1","GCA_000968615.1","-","-","-","-","","-" +"","Tilletia caries str. DAOM 238032 (GCA_001645005)","","13290","ASM164500v1","GCA_001645005.1","-","-","-","-","","-" +"","Tilletia controversa str. DAOM 236426 (GCA_001645045)","","13291","ASM164504v1","GCA_001645045.1","-","-","-","-","","-" +"","Tilletia indica str. DAOM 236416 (GCA_001645015)","","43049","ASM164501v1","GCA_001645015.1","-","-","-","-","","-" +"","Tilletia walkeri str. DAOM 236422 (GCA_001645055)","","117179","ASM164505v1","GCA_001645055.1","-","-","-","-","","-" +"","Tilletiaria anomala UBC 951 (GCA_000711695)","Georgefischeriales","1037660","Tilletiaria_anomala_UBC_951_v1.0","GCA_000711695.1","-","-","-","-","","-" +"","Tilletiopsis washingtonensis str. MCA 4186 (GCA_003144115)","","58919","Tilwa1","GCA_003144115.1","-","-","-","-","","-" +"","Tolypocladium capitatum str. CBS 113982 (GCA_002901185)","Hypocreales","45235","ASM290118v1","GCA_002901185.1","-","-","-","-","","-" +"","Tolypocladium ophioglossoides CBS 100239 (GCA_001189435)","Hypocreales","1163406","Tophv1.0","GCA_001189435.1","-","-","-","-","","-" +"","Tolypocladium paradoxum str. NRBC 100945 (GCA_002916505)","Hypocreales","94208","ASM291650v1","GCA_002916505.1","-","-","-","-","","-" +"","Torrubiella hemipterigena str. BCC 1449 (GCA_000825705)","Hypocreales","1531966","Allpaths-LG","GCA_000825705.1","-","-","-","-","","-" +"","Tortispora caseinolytica NRRL Y-17796 (GCA_001661475)","Saccharomycetales","767744","Canca1","GCA_001661475.1","-","-","-","-","","-" +"","Torulaspora delbrueckii str. CBS 1146 (GCA_000243375)","Saccharomycetales","4950","ASM24337v1","GCA_000243375.1","-","-","-","-","","-" +"","Trachipleistophora hominis (GCA_000316135)","Pleistophoridae","72359","ASM31613v1","GCA_000316135.1","-","-","-","-","","-" +"","Trametes cinnabarina str. BRFM137 (GCA_000765035)","Polyporales","5643","BN946","GCA_000765035.1","-","-","-","-","","-" +"","Trametes coccinea BRFM310 (GCA_002092935)","Polyporales","1353009","Pycco1","GCA_002092935.1","-","-","-","-","","-" +"","Trametes pubescens str. FBCC735 (GCA_001895945)","Polyporales","154538","ASM189594v1","GCA_001895945.1","-","-","-","-","","-" +"","Trametes versicolor FP-101664 SS1 (GCA_000271585)","Polyporales","717944","Trametes_versicolor_v1.0","GCA_000271585.1","-","-","-","-","","-" +"","Tremella mesenterica DSM 1558 (GCA_000271645)","Tremellales","578456","Treme1","GCA_000271645.1","-","-","-","-","","-" +"","Trichoderma asperellum CBS 433.97 (GCA_003025105)","Hypocreales","1042311","Trias_v._1.0","GCA_003025105.1","-","-","-","-","","-" +"","Trichoderma atroviride IMI 206040 (GCA_000171015)","Hypocreales","452589","TRIAT_v2.0","GCA_000171015.2","-","-","-","-","","-" +"","Trichoderma citrinoviride str. TUCIM 6016 (GCA_003025115)","Hypocreales","58853","Trici_v4.0","GCA_003025115.1","-","-","-","-","","-" +"","Trichoderma gamsii str. T6085 (GCA_001481775)","Hypocreales","398673","TGAM01v2","GCA_001481775.2","-","-","-","-","","-" +"","Trichoderma guizhouense str. NJAU 4742 (GCA_002022785)","Hypocreales","1491466","ASM202278v1","GCA_002022785.1","-","-","-","-","","-" +"","Trichoderma harzianum CBS 226.95 (GCA_003025095)","Hypocreales","983964","Allpaths-LG_v._01_03_12","GCA_003025095.1","-","-","-","-","-","-" +"","Trichoderma harzianum str. T6776 (GCA_000988865)","Hypocreales","5544","ASM98886v1","GCA_000988865.1","-","-","-","-","","-" +"","Trichoderma harzianum str. TR274 (GCA_002838845)","Hypocreales","5544","ASM283884v1","GCA_002838845.1","-","-","-","-","-","-" +"","Trichoderma harzianum str. Tr1 (GCA_002894145)","Hypocreales","5544","Tr1","GCA_002894145.1","-","-","-","-","-","-" +"","Trichoderma longibrachiatum ATCC 18648 (GCA_003025155)","Hypocreales","983965","Trilo3","GCA_003025155.1","-","-","-","-","","-" +"","Trichoderma parareesei (GCA_001050175)","Hypocreales","858221","Tpara_v1.0","GCA_001050175.1","-","-","-","-","","-" +"","Trichoderma reesei","Hypocreales","431241","GCA_000167675.2","GCA_000167675.2","-","-","-","","","-" +"","Trichoderma reesei RUT C-30 (GCA_000513815)","Hypocreales","1344414","TrireRUTC30_1","GCA_000513815.1","-","-","-","-","-","-" +"","Trichoderma virens","Hypocreales","413071","ASM17099v1","GCA_000170995.2","-","-","","","","-" +"","Trichophyton benhamiae CBS 112371 (GCA_000151125)","Onygenales","663331","ASM15112v2","GCA_000151125.2","-","-","-","-","","-" +"","Trichophyton equinum CBS 127.97 (GCA_000151175)","Onygenales","559882","ASM15117v1","GCA_000151175.1","-","-","-","-","","-" +"","Trichophyton interdigitale H6 (GCA_000616785)","Onygenales","1215336","Tric_rubr_H6_V2","GCA_000616785.1","-","-","-","-","-","-" +"","Trichophyton interdigitale MR816 (GCA_000622975)","Onygenales","1215338","Tric_inte_MR816_V1","GCA_000622975.1","-","-","-","-","","-" +"","Trichophyton mentagrophytes str. TIMM 2789 (GCA_003118255)","Onygenales","523103","ABySS_70bp_45k_152cov_v1","GCA_003118255.1","-","-","-","-","","-" +"","Trichophyton rubrum CBS 100081 (GCA_000616805)","Onygenales","1215328","Tric_fish_CBS_100081_V1","GCA_000616805.1","-","-","-","-","-","-" +"","Trichophyton rubrum CBS 118892 (GCA_000151425)","Onygenales","559305","ASM15142v1","GCA_000151425.1","-","-","-","-","","-" +"","Trichophyton rubrum CBS 202.88 (GCA_000616985)","Onygenales","1215334","Tric_raub_CBS_202_88_V2","GCA_000616985.1","-","-","-","-","-","-" +"","Trichophyton rubrum CBS 288.86 (GCA_000616825)","Onygenales","1215330","Tric_fish_CBS_288_86_V1","GCA_000616825.1","-","-","-","-","-","-" +"","Trichophyton rubrum CBS 289.86 (GCA_000616845)","Onygenales","1215329","Tric_kane_CBS_289_86_V1","GCA_000616845.1","-","-","-","-","-","-" +"","Trichophyton rubrum CBS 735.88 (GCA_000616965)","Onygenales","1215332","Tric_megn_CBS_735_88_V1","GCA_000616965.1","-","-","-","-","-","-" +"","Trichophyton rubrum D6 (GCA_000622995)","Onygenales","1215335","Tric_rubr_D6_V1","GCA_000622995.1","-","-","-","-","-","-" +"","Trichophyton rubrum MR1448 (GCA_000616905)","Onygenales","1215339","Tric_rubr_M1448_V1","GCA_000616905.1","-","-","-","-","-","-" +"","Trichophyton rubrum MR1459 (GCA_000616945)","Onygenales","1215341","Tric_rubr_MR1459_V1","GCA_000616945.1","-","-","-","-","-","-" +"","Trichophyton rubrum MR850 (GCA_000616765)","Onygenales","1215337","Tric_rubr_MR-850_V1","GCA_000616765.1","-","-","-","-","-","-" +"","Trichophyton rubrum str. CMCC(F)T1i (GCA_001651445)","Onygenales","5551","CMCC_F_T1i","GCA_001651445.1","-","-","-","-","-","-" +"","Trichophyton soudanense CBS 452.61 (GCA_000616865)","Onygenales","1215331","Tric_soud_CBS_452_61_V1","GCA_000616865.1","-","-","-","-","","-" +"","Trichophyton tonsurans CBS 112818 (GCA_000151455)","Onygenales","647933","ASM15145v1","GCA_000151455.1","-","-","-","-","","-" +"","Trichophyton verrucosum HKI 0517 (GCA_000151505)","Onygenales","663202","ASM15150v1","GCA_000151505.1","-","-","-","-","","-" +"","Trichophyton violaceum str. CMCC(F)T3l (GCA_001651435)","Onygenales","34388","CMCC_F_T3l","GCA_001651435.1","-","-","-","-","","-" +"","Trichosporon asahii var. asahii CBS 2479 (GCA_000293215)","","1186058","Trichosporon_asahii_1","GCA_000293215.1","-","-","-","-","-","-" +"","Trichosporon asahii var. asahii CBS 8904 (GCA_000299215)","","1220162","ASM29921v2","GCA_000299215.2","-","-","-","-","","-" +"","Tsuchiyaea wingfieldii CBS 7118 (GCA_001720155)","Tremellales","1295528","Tsuc_wing_CBS7118_V1","GCA_001720155.1","-","-","-","-","","-" +"","Tuber borchii str. Tbo3840 (GCA_003070745)","Pezizales","42251","Tubbor1","GCA_003070745.1","-","-","-","-","","-" +"","Tuber magnatum (GCA_003182015)","Pezizales","42249","ASM318201v1","GCA_003182015.1","-","-","-","-","","-" +"","Tuber melanosporum","Pezizales","656061","ASM15164v1","GCA_000151645.1","-","-","-","","","-" +"","Tulasnella calospora MUT 4182 (GCA_000827465)","Cantharellales","1051891","Tulasnella_calospora_AL13_4D_v1.0","GCA_000827465.1","-","-","-","-","","-" +"","Umbilicaria pustulata (GCA_900169345)","","136370","Lasallia_pustulata_v1","GCA_900169345.1","-","-","-","-","-","-" +"","Uncinocarpus reesii 1704 str. UAMH 1704 (GCA_000003515)","Onygenales","336963","ASM351v2","GCA_000003515.2","-","-","-","-","","-" +"","Ustilaginoidea virens (GCA_000965225)","Hypocreales","1159556","ASM96522v2","GCA_000965225.2","-","-","-","-","-","-" +"","Ustilaginoidea virens str. UV-8b (GCA_000687475)","Hypocreales","1159556","Assembly_for_version_1_of_the_Villosiclava_virens_genome","GCA_000687475.1","-","-","-","-","","-" +"","Ustilaginomycotina sp. SA 807 (GCA_003144235)","","1673888","Ustsp1","GCA_003144235.1","-","-","-","-","","-" +"","Ustilago bromivora str. UB2112 (GCA_900080155)","Ustilaginales","307758","UBRO_v3","GCA_900080155.1","-","-","-","-","-","-" +"","Ustilago hordei str. Uh4857-4 (GCA_000286035)","Ustilaginales","120017","ASM28603v1","GCA_000286035.1","-","-","-","-","","-" +"","Ustilago maydis","Ustilaginales","237631","Umaydis521_2.0","GCA_000328475.2","-","-","-","","","" +"","Valsa mali str. 03-8 (GCA_000818155)","Sordariomycetidae","105487","ASM81815v1","GCA_000818155.1","-","-","-","-","-","-" +"","Valsa mali var. pyri str. SXYL134 (GCA_000813385)","Sordariomycetidae","694573","ASM81338v1","GCA_000813385.1","-","-","-","-","","-" +"","Vanderwaltozyma polyspora DSM 70294 (GCA_000150035)","Saccharomycetales","436907","ASM15003v1","GCA_000150035.1","-","-","-","-","","-" +"","Vavraia culicis subsp. floridensis (GCA_000192795)","Pleistophoridae","948595","Vavr_culi_floridensis_V1","GCA_000192795.1","-","-","-","-","","-" +"","Verruconis gallopava str. CBS 43764 (GCA_000836295)","Venturiales","253628","O_gall_CBS43764","GCA_000836295.1","-","-","-","-","-","-" +"","Verticillium alfalfae VaMs.102 (GCA_000150825)","Glomerellales","526221","ASM15082v1","GCA_000150825.1","-","-","-","-","-","-" +"","Verticillium dahliae","Glomerellales","498257","ASM15067v2","GCA_000150675.2","-","-","-","","","-" +"","Verticillium dahliae (GCA_002892995)","Glomerellales","27337","ASM289299v1","GCA_002892995.1","-","-","-","-","-","-" +"","Verticillium dahliae (GCA_002893025)","Glomerellales","27337","ASM289302v1","GCA_002893025.1","-","-","-","-","-","-" +"","Verticillium dahliae (GCA_002893035)","Glomerellales","27337","ASM289303v1","GCA_002893035.1","-","-","-","-","-","-" +"","Verticillium dahliae (GCA_002893045)","Glomerellales","27337","ASM289304v1","GCA_002893045.1","-","-","-","-","-","-" +"","Verticillium dahliae JR2","Glomerellales","1202531","VDAG_JR2v.4.0","GCA_000400815.2","","-","-","","-","-" +"","Verticillium dahliae str. 12008 (GCA_002892985)","Glomerellales","27337","ASM289298v1","GCA_002892985.1","-","-","-","-","-","-" +"","Verticillium longisporum (GCA_001268145)","Glomerellales","100787","vl1.denovo.v1","GCA_001268145.1","-","-","-","-","-","-" +"","Verticillium longisporum (GCA_001268165)","Glomerellales","100787","vl2.denovo.v1","GCA_001268165.1","-","-","-","-","","-" +"","Vittaforma corneae ATCC 50505 (GCA_000231115)","Nosematidae","993615","Vitt_corn_V1","GCA_000231115.1","-","-","-","-","","-" +"","Wallemia ichthyophaga EXF-994 (GCA_000400465)","Wallemiales","1299270","Wallemia_ichthyophaga_version_1.0","GCA_000400465.1","-","-","-","-","","-" +"","Wallemia mellicola CBS 633.66 (GCA_000263375)","Wallemiales","671144","Wallemia_sebi_v1.0","GCA_000263375.1","-","-","-","-","","-" +"","Wickerhamiella sorbophila str. DS02 (GCA_002251995)","Saccharomycetales","45607","ASM225199v2","GCA_002251995.2","-","-","-","-","","-" +"","Wickerhamomyces anomalus NRRL Y-366-8 (GCA_001661255)","Saccharomycetales","683960","Wican1","GCA_001661255.1","-","-","-","-","","-" +"","Wickerhamomyces ciferrii str. NRRL Y-1031 (GCA_000313485)","Saccharomycetales","1041607","ASM31348v1","GCA_000313485.1","-","-","-","-","","-" +"","Wolfiporia cocos MD-104 SS10 (GCA_000344635)","Polyporales","742152","Wolco1","GCA_000344635.1","-","-","-","-","","-" +"","Xanthophyllomyces dendrorhous (GCA_001007165)","Cystofilobasidiales","5421","Xden1","GCA_001007165.2","-","-","-","-","-","-" +"","Xylona heveae TC161 (GCA_001619985)","","1328760","Xylona_heveae_TC161_v1.0","GCA_001619985.1","-","-","-","-","","-" +"","Yarrowia lipolytica","Saccharomycetales","284591","GCA_000002525.1","GCA_000002525.1","-","-","-","","-","-" +"","Yarrowia lipolytica (GCA_900087985)","Saccharomycetales","4952","YALIA101","GCA_900087985.1","-","-","-","-","","-" +"","Yarrowia lipolytica str. CLIB89 (W29) (GCA_001761485)","Saccharomycetales","4952","ASM176148v1","GCA_001761485.1","-","-","-","-","-","-" +"","Zygosaccharomyces bailii (GCA_900162805)","Saccharomycetales","4954","version_1","GCA_900162805.1","-","-","-","-","-","-" +"","Zygosaccharomyces bailii CLIB 213 (GCA_000442885)","Saccharomycetales","1333698","ZYBA0","GCA_000442885.1","-","-","-","-","","-" +"","Zygosaccharomyces bailii ISA1307 (GCA_000530735)","Saccharomycetales","1355161","Z_bailii_ISA1307_version_3","GCA_000530735.1","-","-","-","-","-","-" +"","Zygosaccharomyces parabailii str. ATCC 60483 (GCA_001984395)","Saccharomycetales","1365886","ASM198439v2","GCA_001984395.2","-","-","-","-","","-" +"","Zygosaccharomyces rouxii str. CBS 732 (GCA_000026365)","Saccharomycetales","4956","ASM2636v1","GCA_000026365.1","-","-","-","-","","-" +"","Zygosaccharomyces rouxii str. NBRC110957 (GCA_001972345)","Saccharomycetales","4956","ZYGR_assembly01","GCA_001972345.1","-","-","-","-","-","-" +"","Zymoseptoria brevis str. Zb18110 (GCA_000966595)","Capnodiales","1047168","ASM96659v1","GCA_000966595.1","-","-","-","-","","-" +"","Zymoseptoria tritici","Capnodiales","336722","MG2","GCA_000219625.1","","-","-","","","" +"","Zymoseptoria tritici ST99CH_1A5 (GCA_900099495)","Capnodiales","1276529","ZT1A5_complete_assembly","GCA_900099495.1","-","-","-","-","-","-" +"","Zymoseptoria tritici ST99CH_1E4 (GCA_900184115)","Capnodiales","1276532","ST99CH_1E4","GCA_900184115.1","-","-","-","-","-","-" +"","Zymoseptoria tritici ST99CH_3D1 (GCA_900184105)","Capnodiales","1276537","ST99CH_3D1","GCA_900184105.1","-","-","-","-","-","-" +"","Zymoseptoria tritici ST99CH_3D7 (GCA_900091695)","Capnodiales","1276538","Zt_ST99CH_3D7","GCA_900091695.1","-","-","-","-","-","-" +"","[Candida] arabinofermentans NRRL YB-2248 (GCA_001661425)","Saccharomycetales","983967","Canar1","GCA_001661425.1","-","-","-","-","-","-" +"","[Candida] auris (GCA_002759435)","Saccharomycetales","498019","Cand_auris_B8441_V2","GCA_002759435.2","-","-","-","-","-","-" +"","[Candida] auris (GCA_002775015)","Saccharomycetales","498019","Cand_auris_B11221_V1","GCA_002775015.1","-","-","-","-","-","-" +"","[Candida] auris (GCA_003013715)","Saccharomycetales","498019","Cand_auris_B11220","GCA_003013715.1","-","-","-","-","-","-" +"","[Candida] auris (GCA_003014415)","Saccharomycetales","498019","Cand_auris_B11243","GCA_003014415.1","-","-","-","-","-","-" +"","[Candida] auris str. 6684 (GCA_001189475)","Saccharomycetales","498019","ASM118947v1","GCA_001189475.1","-","-","-","-","","-" +"","[Candida] duobushaemulonis str. B09383 (GCA_002926085)","Saccharomycetales","1231522","CanDuoHae_v1.0","GCA_002926085.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_001466525)","Saccharomycetales","5478","ASM146652v1","GCA_001466525.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_001466535)","Saccharomycetales","5478","ASM146653v1","GCA_001466535.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_001466565)","Saccharomycetales","5478","ASM146656v1","GCA_001466565.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_001466575)","Saccharomycetales","5478","ASM146657v1","GCA_001466575.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_001466635)","Saccharomycetales","5478","ASM146663v1","GCA_001466635.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_001466685)","Saccharomycetales","5478","ASM146668v1","GCA_001466685.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_002219185)","Saccharomycetales","5478","ASM221918v1","GCA_002219185.1","-","-","-","-","-","-" +"","[Candida] glabrata (GCA_002219195)","Saccharomycetales","5478","ASM221919v1","GCA_002219195.1","-","-","-","-","-","-" +"","[Candida] glabrata str. CBS138 (GCA_000002545)","Saccharomycetales","5478","ASM254v2","GCA_000002545.2","-","-","-","-","","-" +"","[Candida] haemulonis str. B11899 (GCA_002926055)","Saccharomycetales","45357","CanHae_1.0","GCA_002926055.1","-","-","-","-","-","-" +"","[Candida] intermedia (GCA_900106115)","Saccharomycetales","45354","CBS_141442_assembly","GCA_900106115.1","-","-","-","-","-","-" +"","[Candida] intermedia (GCA_900106125)","Saccharomycetales","45354","PYCC_4715_assembly","GCA_900106125.1","-","-","-","-","-","-" +"","[Candida] pseudohaemulonis str. B12108 (GCA_003013735)","Saccharomycetales","418784","Cand_pseudohaemulonii_B12108","GCA_003013735.1","-","-","-","-","-","-" +"","[Candida] tenuis ATCC 10573 (GCA_000223465)","Saccharomycetales","590646","Candida_tenuis_v1.0","GCA_000223465.1","-","-","-","-","-","-" diff --git a/data/intogen-KRAS-distribution-data.tsv b/data/intogen-KRAS-distribution-data.tsv index c2ee938..64640cc 100644 --- a/data/intogen-KRAS-distribution-data.tsv +++ b/data/intogen-KRAS-distribution-data.tsv @@ -1,179 +1,179 @@ -MUTS_PAM STRAND MOST_SEVERE START MUTS_PAM_SAMPLES REF MUTS_CS ALT AA_CHANGE CHR MUTS_CS_SAMPLES PROTEIN_POS GENE TRANSCRIPT -93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000311936 -93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000557334 -93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000256078 -93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000556131 -86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000311936 -86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000557334 -86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000556131 -86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000256078 -72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000556131 -72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000256078 -72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000557334 -72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000311936 -63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000557334 -63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000556131 -63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000256078 -63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000311936 -36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000311936 -36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000256078 -36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000556131 -36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000557334 -24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000256078 -24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000311936 -24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000557334 -24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000556131 -23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000556131 -23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000311936 -23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000557334 -23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000256078 -16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000556131 -16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000311936 -16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000557334 -16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000256078 -13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000311936 -13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000556131 -13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000557334 -13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000256078 -11 + missense_variant 25380275 11 T 11 G Q/H 12 11 61 ENSG00000133703 ENST00000311936 -11 + missense_variant 25380275 11 T 11 G Q/H 12 11 61 ENSG00000133703 ENST00000256078 -10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000557334 -10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000311936 -10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000556131 -10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000256078 -9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000557334 -9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000556131 -9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000311936 -9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000256078 -7 + missense_variant 25380276 7 T 7 A Q/L 12 7 61 ENSG00000133703 ENST00000256078 -7 + missense_variant 25378562 7 C 7 T A/T 12 7 146 ENSG00000133703 ENST00000256078 -7 + missense_variant 25378562 7 C 7 T A/T 12 7 146 ENSG00000133703 ENST00000311936 -7 + missense_variant 25380276 7 T 7 A Q/L 12 7 61 ENSG00000133703 ENST00000311936 -5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000311936 -5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000256078 -5 + missense_variant 25380276 5 T 5 C Q/R 12 5 61 ENSG00000133703 ENST00000311936 -5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000557334 -5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000556131 -5 + missense_variant 25380276 5 T 5 C Q/R 12 5 61 ENSG00000133703 ENST00000256078 -4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000256078 -4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000557334 -4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000311936 -4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000556131 -3 + missense_variant 25380277 3 G 3 T Q/K 12 3 61 ENSG00000133703 ENST00000256078 -3 + missense_variant 25380275 3 T 3 A Q/H 12 3 61 ENSG00000133703 ENST00000256078 -3 + missense_variant 25378647 3 T 3 G K/N 12 3 117 ENSG00000133703 ENST00000256078 -3 + missense_variant 25380275 3 T 3 A Q/H 12 3 61 ENSG00000133703 ENST00000311936 -3 + missense_variant 25378647 3 T 3 G K/N 12 3 117 ENSG00000133703 ENST00000311936 -3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000256078 -3 - missense_variant 25380275 3 A 3 C Q/H 12 3 61 ENSG00000133703 ENST00000256078 -3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000256078 -3 + missense_variant 25380277 3 G 3 T Q/K 12 3 61 ENSG00000133703 ENST00000311936 -3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000311936 -3 - missense_variant 25380275 3 A 3 C Q/H 12 3 61 ENSG00000133703 ENST00000311936 -3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000311936 -3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000556131 -3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000557334 -3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000557334 -3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000556131 -2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000556131 -2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000311936 -2 - missense_variant 25380276 2 A 2 G Q/R 12 2 61 ENSG00000133703 ENST00000311936 -2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000557334 -2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000556131 -2 - missense_variant 25378562 2 G 2 A A/T 12 2 146 ENSG00000133703 ENST00000311936 -2 - missense_variant 25378562 2 G 2 A A/T 12 2 146 ENSG00000133703 ENST00000256078 -2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000256078 -2 - missense_variant 25380276 2 A 2 G Q/R 12 2 61 ENSG00000133703 ENST00000256078 -2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000311936 -2 + missense_variant 25378561 2 G 2 A A/V 12 2 146 ENSG00000133703 ENST00000311936 -2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000256078 -2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000557334 -2 + missense_variant 25378561 2 G 2 A A/V 12 2 146 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000557334 -1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000557334 -1 - missense_variant 25362743 1 A 1 T S/C 12 1 72 ENSG00000133703 ENST00000557334 -1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000557334 -1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000557334 -1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000557334 -0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000557334 -1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000557334 -0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000557334 -0 + synonymous_variant 25380278 0 A 1 G - 12 1 60 ENSG00000133703 ENST00000311936 -1 - missense_variant 25378647 1 A 1 T K/N 12 1 117 ENSG00000133703 ENST00000256078 -1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000256078 -1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000256078 -1 + missense_variant 25362743 1 A 1 G C/R 12 1 185 ENSG00000133703 ENST00000311936 -0 + inframe_deletion 25362744 0 CTTTGT 1 - - 12 1 183-184 ENSG00000133703 ENST00000311936 -1 + missense_variant 25378557 1 C 1 G K/N 12 1 147 ENSG00000133703 ENST00000311936 -1 + missense_variant 25378562 1 C 1 G A/P 12 1 146 ENSG00000133703 ENST00000311936 -1 + missense_variant 25378562 1 C 1 T A/T 12 1 146.0 ENSG00000133703 ENST00000311936 -1 + missense_variant 25378594 1 C 1 G R/T 12 1 135 ENSG00000133703 ENST00000311936 -1 + missense_variant 25378645 1 C 1 G C/S 12 1 118 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380240 1 C 1 A R/M 12 1 73.0 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380254 1 C 1 A R/S 12 1 68 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380271 1 C 1 T E/K 12 1 63.0 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380274 1 C 1 T E/K 12 1 62 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380275 1 T 1 G Q/H 12 1 61.0 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380282 1 G 1 C A/G 12 1 59 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380271 1 C 1 T E/K 12 1 63.0 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380274 1 C 1 T E/K 12 1 62 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380275 1 T 1 G Q/H 12 1 61.0 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380277 1 GA 1 TT GQ/GK 12 1 60-61 ENSG00000133703 ENST00000256078 -0 + synonymous_variant 25380278 0 A 1 G - 12 1 60 ENSG00000133703 ENST00000256078 -0 + synonymous_variant 25380278 0 A 1 T - 12 1 60 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380282 1 G 1 T A/E 12 1 59 ENSG00000133703 ENST00000256078 -0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000256078 -0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000256078 -0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000256078 -1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380277 1 GA 1 TT GQ/GK 12 1 60-61 ENSG00000133703 ENST00000311936 -0 + synonymous_variant 25380278 0 A 1 T - 12 1 60 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380240 1 C 1 A R/M 12 1 73.0 ENSG00000133703 ENST00000256078 -1 + missense_variant 25380282 1 G 1 C A/G 12 1 59 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000556131 -0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000556131 -0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000556131 -1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000556131 -1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000556131 -1 + missense_variant 25362743 1 A 1 G C/R 12 1 72 ENSG00000133703 ENST00000557334 -0 + inframe_deletion 25362744 0 CTTTGT 1 - - 12 1 70-71 ENSG00000133703 ENST00000557334 -1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000557334 -1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000557334 -0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000557334 -1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000557334 -0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000556131 -1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380282 1 G 1 T A/E 12 1 59 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000311936 -0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000311936 -0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000311936 -0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000311936 -1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000311936 -1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000311936 -1 - missense_variant 25362743 1 A 1 T S/C 12 1 185 ENSG00000133703 ENST00000311936 -1 - missense_variant 25378647 1 A 1 T K/N 12 1 117 ENSG00000133703 ENST00000311936 -1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000311936 -1 + missense_variant 25380254 1 C 1 A R/S 12 1 68 ENSG00000133703 ENST00000256078 -1 + missense_variant 25378645 1 C 1 G C/S 12 1 118 ENSG00000133703 ENST00000256078 -1 + missense_variant 25378594 1 C 1 G R/T 12 1 135 ENSG00000133703 ENST00000256078 -1 + missense_variant 25368454 1 C 1 T R/Q 12 1 164 ENSG00000133703 ENST00000256078 -1 + missense_variant 25368473 1 T 1 C T/A 12 1 158 ENSG00000133703 ENST00000256078 -1 + missense_variant 25378557 1 C 1 G K/N 12 1 147 ENSG00000133703 ENST00000256078 -1 + missense_variant 25378562 1 C 1 G A/P 12 1 146 ENSG00000133703 ENST00000256078 -1 + missense_variant 25378562 1 C 1 T A/T 12 1 146.0 ENSG00000133703 ENST00000256078 +MUTS_PAM STRAND MOST_SEVERE START MUTS_PAM_SAMPLES REF MUTS_CS ALT AA_CHANGE CHR MUTS_CS_SAMPLES PROTEIN_POS GENE TRANSCRIPT +93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000311936 +93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000557334 +93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000256078 +93 + missense_variant 25398284 93 C 93 T G/D 12 93 12 ENSG00000133703 ENST00000556131 +86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000311936 +86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000557334 +86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000556131 +86 + missense_variant 25398284 86 C 86 A G/V 12 86 12 ENSG00000133703 ENST00000256078 +72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000556131 +72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000256078 +72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000557334 +72 + missense_variant 25398285 72 C 72 A G/C 12 72 12 ENSG00000133703 ENST00000311936 +63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000557334 +63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000556131 +63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000256078 +63 - missense_variant 25398284 63 G 63 A G/D 12 63 12 ENSG00000133703 ENST00000311936 +36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000311936 +36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000256078 +36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000556131 +36 - missense_variant 25398284 36 G 36 T G/V 12 36 12 ENSG00000133703 ENST00000557334 +24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000256078 +24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000311936 +24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000557334 +24 + missense_variant 25398281 24 C 24 T G/D 12 24 13 ENSG00000133703 ENST00000556131 +23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000556131 +23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000311936 +23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000557334 +23 + missense_variant 25398284 23 C 23 G G/A 12 23 12 ENSG00000133703 ENST00000256078 +16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000556131 +16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000311936 +16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000557334 +16 - missense_variant 25398285 16 G 16 C G/R 12 16 12 ENSG00000133703 ENST00000256078 +13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000311936 +13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000556131 +13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000557334 +13 + missense_variant 25398285 13 C 13 G G/R 12 13 12 ENSG00000133703 ENST00000256078 +11 + missense_variant 25380275 11 T 11 G Q/H 12 11 61 ENSG00000133703 ENST00000311936 +11 + missense_variant 25380275 11 T 11 G Q/H 12 11 61 ENSG00000133703 ENST00000256078 +10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000557334 +10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000311936 +10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000556131 +10 + missense_variant 25398282 10 C 10 A G/C 12 10 13 ENSG00000133703 ENST00000256078 +9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000557334 +9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000556131 +9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000311936 +9 + missense_variant 25398285 9 C 9 T G/S 12 9 12 ENSG00000133703 ENST00000256078 +7 + missense_variant 25380276 7 T 7 A Q/L 12 7 61 ENSG00000133703 ENST00000256078 +7 + missense_variant 25378562 7 C 7 T A/T 12 7 146 ENSG00000133703 ENST00000256078 +7 + missense_variant 25378562 7 C 7 T A/T 12 7 146 ENSG00000133703 ENST00000311936 +7 + missense_variant 25380276 7 T 7 A Q/L 12 7 61 ENSG00000133703 ENST00000311936 +5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000311936 +5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000256078 +5 + missense_variant 25380276 5 T 5 C Q/R 12 5 61 ENSG00000133703 ENST00000311936 +5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000557334 +5 + missense_variant 25398284 5 CC 5 AA G/F 12 5 12 ENSG00000133703 ENST00000556131 +5 + missense_variant 25380276 5 T 5 C Q/R 12 5 61 ENSG00000133703 ENST00000256078 +4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000256078 +4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000557334 +4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000311936 +4 + missense_variant 25398284 4 C 4 A G/V 12 4 12.0 ENSG00000133703 ENST00000556131 +3 + missense_variant 25380277 3 G 3 T Q/K 12 3 61 ENSG00000133703 ENST00000256078 +3 + missense_variant 25380275 3 T 3 A Q/H 12 3 61 ENSG00000133703 ENST00000256078 +3 + missense_variant 25378647 3 T 3 G K/N 12 3 117 ENSG00000133703 ENST00000256078 +3 + missense_variant 25380275 3 T 3 A Q/H 12 3 61 ENSG00000133703 ENST00000311936 +3 + missense_variant 25378647 3 T 3 G K/N 12 3 117 ENSG00000133703 ENST00000311936 +3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000256078 +3 - missense_variant 25380275 3 A 3 C Q/H 12 3 61 ENSG00000133703 ENST00000256078 +3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000256078 +3 + missense_variant 25380277 3 G 3 T Q/K 12 3 61 ENSG00000133703 ENST00000311936 +3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000311936 +3 - missense_variant 25380275 3 A 3 C Q/H 12 3 61 ENSG00000133703 ENST00000311936 +3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000311936 +3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000556131 +3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000557334 +3 + missense_variant 25398284 3 C 3 T G/D 12 3 12.0 ENSG00000133703 ENST00000557334 +3 - missense_variant 25398281 3 G 3 A G/D 12 3 13 ENSG00000133703 ENST00000556131 +2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000556131 +2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000311936 +2 - missense_variant 25380276 2 A 2 G Q/R 12 2 61 ENSG00000133703 ENST00000311936 +2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000557334 +2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000556131 +2 - missense_variant 25378562 2 G 2 A A/T 12 2 146 ENSG00000133703 ENST00000311936 +2 - missense_variant 25378562 2 G 2 A A/T 12 2 146 ENSG00000133703 ENST00000256078 +2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000256078 +2 - missense_variant 25380276 2 A 2 G Q/R 12 2 61 ENSG00000133703 ENST00000256078 +2 + missense_variant 25398255 2 G 2 T Q/K 12 2 22 ENSG00000133703 ENST00000311936 +2 + missense_variant 25378561 2 G 2 A A/V 12 2 146 ENSG00000133703 ENST00000311936 +2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000256078 +2 - missense_variant 25398285 2 G 2 A G/S 12 2 12 ENSG00000133703 ENST00000557334 +2 + missense_variant 25378561 2 G 2 A A/V 12 2 146 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000557334 +1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000557334 +1 - missense_variant 25362743 1 A 1 T S/C 12 1 72 ENSG00000133703 ENST00000557334 +1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000557334 +1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000557334 +1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000557334 +0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000557334 +1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000557334 +0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000557334 +0 + synonymous_variant 25380278 0 A 1 G - 12 1 60 ENSG00000133703 ENST00000311936 +1 - missense_variant 25378647 1 A 1 T K/N 12 1 117 ENSG00000133703 ENST00000256078 +1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000256078 +1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000256078 +1 + missense_variant 25362743 1 A 1 G C/R 12 1 185 ENSG00000133703 ENST00000311936 +0 + inframe_deletion 25362744 0 CTTTGT 1 - - 12 1 183-184 ENSG00000133703 ENST00000311936 +1 + missense_variant 25378557 1 C 1 G K/N 12 1 147 ENSG00000133703 ENST00000311936 +1 + missense_variant 25378562 1 C 1 G A/P 12 1 146 ENSG00000133703 ENST00000311936 +1 + missense_variant 25378562 1 C 1 T A/T 12 1 146.0 ENSG00000133703 ENST00000311936 +1 + missense_variant 25378594 1 C 1 G R/T 12 1 135 ENSG00000133703 ENST00000311936 +1 + missense_variant 25378645 1 C 1 G C/S 12 1 118 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380240 1 C 1 A R/M 12 1 73.0 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380254 1 C 1 A R/S 12 1 68 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380271 1 C 1 T E/K 12 1 63.0 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380274 1 C 1 T E/K 12 1 62 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380275 1 T 1 G Q/H 12 1 61.0 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380282 1 G 1 C A/G 12 1 59 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380271 1 C 1 T E/K 12 1 63.0 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380274 1 C 1 T E/K 12 1 62 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380275 1 T 1 G Q/H 12 1 61.0 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380277 1 GA 1 TT GQ/GK 12 1 60-61 ENSG00000133703 ENST00000256078 +0 + synonymous_variant 25380278 0 A 1 G - 12 1 60 ENSG00000133703 ENST00000256078 +0 + synonymous_variant 25380278 0 A 1 T - 12 1 60 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380282 1 G 1 T A/E 12 1 59 ENSG00000133703 ENST00000256078 +0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000256078 +0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000256078 +0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000256078 +1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380277 1 GA 1 TT GQ/GK 12 1 60-61 ENSG00000133703 ENST00000311936 +0 + synonymous_variant 25380278 0 A 1 T - 12 1 60 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380240 1 C 1 A R/M 12 1 73.0 ENSG00000133703 ENST00000256078 +1 + missense_variant 25380282 1 G 1 C A/G 12 1 59 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000556131 +0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000556131 +0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000556131 +1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000556131 +1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000556131 +1 + missense_variant 25362743 1 A 1 G C/R 12 1 72 ENSG00000133703 ENST00000557334 +0 + inframe_deletion 25362744 0 CTTTGT 1 - - 12 1 70-71 ENSG00000133703 ENST00000557334 +1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000557334 +1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000557334 +0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000557334 +1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000557334 +0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000556131 +1 + missense_variant 25398281 1 C 1 A G/V 12 1 13 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380282 1 G 1 T A/E 12 1 59 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398211 1 T 1 C I/M 12 1 36 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398213 1 T 1 A I/L 12 1 36 ENSG00000133703 ENST00000311936 +0 + synonymous_variant 25398250 0 T 1 C - 12 1 23 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398260 1 G 1 C T/R 12 1 20 ENSG00000133703 ENST00000311936 +0 + synonymous_variant 25398280 0 G 1 A - 12 1 13 ENSG00000133703 ENST00000311936 +0 + synonymous_variant 25398283 0 A 1 C - 12 1 12 ENSG00000133703 ENST00000311936 +1 - missense_variant 25398284 1 G 1 C G/A 12 1 12 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398285 1 C 1 A G/C 12 1 12.0 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398285 1 C 1 G G/R 12 1 12.0 ENSG00000133703 ENST00000311936 +1 + missense_variant 25398306 1 T 1 C K/E 12 1 5 ENSG00000133703 ENST00000311936 +1 - missense_variant 25362743 1 A 1 T S/C 12 1 185 ENSG00000133703 ENST00000311936 +1 - missense_variant 25378647 1 A 1 T K/N 12 1 117 ENSG00000133703 ENST00000311936 +1 - missense_variant 25398282 1 G 1 T G/C 12 1 13 ENSG00000133703 ENST00000311936 +1 + missense_variant 25380254 1 C 1 A R/S 12 1 68 ENSG00000133703 ENST00000256078 +1 + missense_variant 25378645 1 C 1 G C/S 12 1 118 ENSG00000133703 ENST00000256078 +1 + missense_variant 25378594 1 C 1 G R/T 12 1 135 ENSG00000133703 ENST00000256078 +1 + missense_variant 25368454 1 C 1 T R/Q 12 1 164 ENSG00000133703 ENST00000256078 +1 + missense_variant 25368473 1 T 1 C T/A 12 1 158 ENSG00000133703 ENST00000256078 +1 + missense_variant 25378557 1 C 1 G K/N 12 1 147 ENSG00000133703 ENST00000256078 +1 + missense_variant 25378562 1 C 1 G A/P 12 1 146 ENSG00000133703 ENST00000256078 +1 + missense_variant 25378562 1 C 1 T A/T 12 1 146.0 ENSG00000133703 ENST00000256078 diff --git a/data/intogen-OR1A1-distribution-data.tsv b/data/intogen-OR1A1-distribution-data.tsv index 714de60..3693ce2 100644 --- a/data/intogen-OR1A1-distribution-data.tsv +++ b/data/intogen-OR1A1-distribution-data.tsv @@ -1,49 +1,49 @@ -MUTS_PAM STRAND MOST_SEVERE START MUTS_PAM_SAMPLES REF MUTS_CS ALT AA_CHANGE CHR MUTS_CS_SAMPLES PROTEIN_POS GENE TRANSCRIPT -2 + missense_variant 3119330 2 G 2 A R/Q 17 2 139 ENSG00000172146 ENST00000304094 -2 + missense_variant 3119138 2 C 2 T S/L 17 2 75 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119772 0 C 2 T - 17 2 286 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119791 1 C 1 T R/W 17 1 293 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119799 1 G 1 A M/I 17 1 295 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119805 0 T 1 C - 17 1 297 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119823 0 C 1 T - 17 1 303 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119786 1 G 1 A R/K 17 1 291 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119744 1 C 1 G T/R 17 1 277 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119691 0 C 1 T - 17 1 259 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119589 0 C 1 T - 17 1 225 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119408 1 G 1 A S/N 17 1 165 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119431 1 G 1 A E/K 17 1 173 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119462 1 C 1 T P/L 17 1 183 ENSG00000172146 ENST00000304094 -1 + stop_gained 3119514 1 C 1 G - 17 1 200 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119530 1 T 1 G F/V 17 1 206 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119581 1 A 1 G T/A 17 1 223 ENSG00000172146 ENST00000304094 -1 + stop_gained 3119590 1 C 1 T - 17 1 226 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119679 1 G 1 T M/I 17 1 255 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119592 0 G 1 A - 17 1 226 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119596 1 C 1 T P/S 17 1 228 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119610 0 C 1 T - 17 1 232 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119627 1 C 1 T S/F 17 1 238 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119640 0 C 1 A - 17 1 242 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119672 1 C 1 T T/I 17 1 253 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119395 1 C 1 A L/M 17 1 161 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119403 0 A 1 G - 17 1 163 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119386 1 C 1 T P/S 17 1 158 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119289 0 C 1 A - 17 1 125 ENSG00000172146 ENST00000304094 -1 + stop_gained 3118972 1 C 1 T - 17 1 20 ENSG00000172146 ENST00000304094 -1 + missense_variant 3118978 1 G 1 A E/K 17 1 22 ENSG00000172146 ENST00000304094 -1 + missense_variant 3118986 1 A 1 C E/D 17 1 24 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119002 1 C 1 T L/F 17 1 30 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119029 0 T 1 C - 17 1 39 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119074 1 C 1 T R/C 17 1 54 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119075 1 G 1 A R/H 17 1 54 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119076 0 C 1 T - 17 1 54 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119115 0 C 1 T - 17 1 67 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119139 0 G 1 A - 17 1 75 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3119187 0 C 1 T - 17 1 91 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119210 1 C 1 T T/M 17 1 99 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119217 1 G 1 A M/I 17 1 101 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119264 1 C 1 T A/V 17 1 117 ENSG00000172146 ENST00000304094 -1 + missense_variant 3119269 1 G 1 A A/T 17 1 119 ENSG00000172146 ENST00000304094 -1 + missense_variant 3118961 1 G 1 A G/E 17 1 16 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3118956 0 C 1 A - 17 1 14 ENSG00000172146 ENST00000304094 -0 + synonymous_variant 3118944 0 G 1 A - 17 1 10 ENSG00000172146 ENST00000304094 -1 + missense_variant 3118928 1 A 1 C N/T 17 1 5 ENSG00000172146 ENST00000304094 +MUTS_PAM STRAND MOST_SEVERE START MUTS_PAM_SAMPLES REF MUTS_CS ALT AA_CHANGE CHR MUTS_CS_SAMPLES PROTEIN_POS GENE TRANSCRIPT +2 + missense_variant 3119330 2 G 2 A R/Q 17 2 139 ENSG00000172146 ENST00000304094 +2 + missense_variant 3119138 2 C 2 T S/L 17 2 75 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119772 0 C 2 T - 17 2 286 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119791 1 C 1 T R/W 17 1 293 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119799 1 G 1 A M/I 17 1 295 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119805 0 T 1 C - 17 1 297 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119823 0 C 1 T - 17 1 303 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119786 1 G 1 A R/K 17 1 291 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119744 1 C 1 G T/R 17 1 277 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119691 0 C 1 T - 17 1 259 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119589 0 C 1 T - 17 1 225 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119408 1 G 1 A S/N 17 1 165 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119431 1 G 1 A E/K 17 1 173 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119462 1 C 1 T P/L 17 1 183 ENSG00000172146 ENST00000304094 +1 + stop_gained 3119514 1 C 1 G - 17 1 200 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119530 1 T 1 G F/V 17 1 206 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119581 1 A 1 G T/A 17 1 223 ENSG00000172146 ENST00000304094 +1 + stop_gained 3119590 1 C 1 T - 17 1 226 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119679 1 G 1 T M/I 17 1 255 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119592 0 G 1 A - 17 1 226 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119596 1 C 1 T P/S 17 1 228 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119610 0 C 1 T - 17 1 232 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119627 1 C 1 T S/F 17 1 238 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119640 0 C 1 A - 17 1 242 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119672 1 C 1 T T/I 17 1 253 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119395 1 C 1 A L/M 17 1 161 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119403 0 A 1 G - 17 1 163 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119386 1 C 1 T P/S 17 1 158 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119289 0 C 1 A - 17 1 125 ENSG00000172146 ENST00000304094 +1 + stop_gained 3118972 1 C 1 T - 17 1 20 ENSG00000172146 ENST00000304094 +1 + missense_variant 3118978 1 G 1 A E/K 17 1 22 ENSG00000172146 ENST00000304094 +1 + missense_variant 3118986 1 A 1 C E/D 17 1 24 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119002 1 C 1 T L/F 17 1 30 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119029 0 T 1 C - 17 1 39 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119074 1 C 1 T R/C 17 1 54 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119075 1 G 1 A R/H 17 1 54 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119076 0 C 1 T - 17 1 54 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119115 0 C 1 T - 17 1 67 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119139 0 G 1 A - 17 1 75 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3119187 0 C 1 T - 17 1 91 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119210 1 C 1 T T/M 17 1 99 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119217 1 G 1 A M/I 17 1 101 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119264 1 C 1 T A/V 17 1 117 ENSG00000172146 ENST00000304094 +1 + missense_variant 3119269 1 G 1 A A/T 17 1 119 ENSG00000172146 ENST00000304094 +1 + missense_variant 3118961 1 G 1 A G/E 17 1 16 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3118956 0 C 1 A - 17 1 14 ENSG00000172146 ENST00000304094 +0 + synonymous_variant 3118944 0 G 1 A - 17 1 10 ENSG00000172146 ENST00000304094 +1 + missense_variant 3118928 1 A 1 C N/T 17 1 5 ENSG00000172146 ENST00000304094 diff --git a/data/intogen-PTPN11-distribution-data.tsv b/data/intogen-PTPN11-distribution-data.tsv index 879116c..5222b89 100644 --- a/data/intogen-PTPN11-distribution-data.tsv +++ b/data/intogen-PTPN11-distribution-data.tsv @@ -1,113 +1,113 @@ -MUTS_PAM STRAND MOST_SEVERE START MUTS_PAM_SAMPLES REF MUTS_CS ALT AA_CHANGE CHR MUTS_CS_SAMPLES PROTEIN_POS GENE TRANSCRIPT -5 + missense_variant 112926888 5 G 5 T G/V 12 5 503 ENSG00000179295 ENST00000351677 -4 + missense_variant 112926270 4 C 4 T T/M 12 4 468 ENSG00000179295 ENST00000351677 -3 + missense_variant 112888198 3 G 3 A A/T 12 3 72 ENSG00000179295 ENST00000392597 -3 + missense_variant 112888198 3 G 3 A A/T 12 3 72 ENSG00000179295 ENST00000351677 -2 + missense_variant 112926910 2 G 2 C Q/H 12 2 510 ENSG00000179295 ENST00000351677 -2 + missense_variant 112926909 2 A 2 T Q/L 12 2 510 ENSG00000179295 ENST00000351677 -2 + missense_variant 112926900 2 C 2 A T/K 12 2 507 ENSG00000179295 ENST00000351677 -2 + missense_variant 112891006 2 C 2 T H/Y 12 2 114 ENSG00000179295 ENST00000392597 -2 + missense_variant 112888210 2 G 2 A E/K 12 2 76 ENSG00000179295 ENST00000392597 -2 + missense_variant 112888199 2 C 2 T A/V 12 2 72 ENSG00000179295 ENST00000392597 -2 + missense_variant 112888199 2 C 2 A A/D 12 2 72 ENSG00000179295 ENST00000392597 -2 + missense_variant 112891006 2 C 2 T H/Y 12 2 114 ENSG00000179295 ENST00000351677 -2 + missense_variant 112888210 2 G 2 A E/K 12 2 76 ENSG00000179295 ENST00000351677 -2 + missense_variant 112888199 2 C 2 T A/V 12 2 72 ENSG00000179295 ENST00000351677 -2 + missense_variant 112888199 2 C 2 A A/D 12 2 72 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112893822 0 T 1 C - 12 1 82 ENSG00000179295 ENST00000530818 -1 + missense_variant 112910837 1 C 1 G I/M 12 1 282 ENSG00000179295 ENST00000392597 -1 + missense_variant 112910844 1 T 1 G F/V 12 1 285.0 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112915507 0 A 1 G - 12 1 302 ENSG00000179295 ENST00000392597 -1 + missense_variant 112915523 1 A 1 G N/D 12 1 308 ENSG00000179295 ENST00000392597 -1 + missense_variant 112915743 1 A 1 G N/S 12 1 339 ENSG00000179295 ENST00000392597 -1 + missense_variant 112919908 1 T 1 G Y/D 12 1 375 ENSG00000179295 ENST00000392597 -1 + frameshift_variant 112920002 1 - 1 T - 12 1 406 ENSG00000179295 ENST00000392597 -1 + missense_variant 112924286 1 C 1 T T/M 12 1 411 ENSG00000179295 ENST00000392597 -1 + stop_gained 112924308 1 C 1 A - 12 1 418 ENSG00000179295 ENST00000392597 -1 + missense_variant 112924331 1 A 1 T H/L 12 1 426 ENSG00000179295 ENST00000392597 -1 + missense_variant 112924336 1 G 1 A V/M 12 1 428 ENSG00000179295 ENST00000392597 -1 + missense_variant 112892383 1 G 1 C V/L 12 1 26 ENSG00000179295 ENST00000530818 -0 + synonymous_variant 112892409 0 T 1 C - 12 1 34 ENSG00000179295 ENST00000530818 -1 + stop_gained 112893784 1 G 1 T - 12 1 70 ENSG00000179295 ENST00000530818 -0 + synonymous_variant 112893798 0 A 1 G - 12 1 74 ENSG00000179295 ENST00000530818 -1 + missense_variant 112910775 1 C 1 T L/F 12 1 262 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112893822 0 T 1 C - 12 1 237 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112893802 0 C 1 A - 12 1 231 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888211 1 A 1 C E/A 12 1 76 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888165 1 G 1 T D/Y 12 1 61 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888189 1 G 1 A E/K 12 1 69.0 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888189 1 G 1 A E/K 12 1 69 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888195 1 T 1 C F/L 12 1 71 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888197 1 T 1 A F/L 12 1 71 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888211 1 A 1 C E/A 12 1 76.0 ENSG00000179295 ENST00000392597 -1 + missense_variant 112891015 1 C 1 T L/F 12 1 117 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112893798 0 A 1 G - 12 1 229 ENSG00000179295 ENST00000392597 -1 + missense_variant 112891073 1 T 1 A L/H 12 1 136 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112891116 0 T 1 C - 12 1 150 ENSG00000179295 ENST00000392597 -1 + missense_variant 112891129 1 G 1 T D/Y 12 1 155 ENSG00000179295 ENST00000392597 -1 + missense_variant 112892383 1 G 1 C V/L 12 1 181 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112892409 0 T 1 C - 12 1 189 ENSG00000179295 ENST00000392597 -1 + stop_gained 112893784 1 G 1 T - 12 1 225 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112893802 0 C 1 A - 12 1 76 ENSG00000179295 ENST00000530818 -1 + missense_variant 112888163 1 G 1 T G/V 12 1 60 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888165 1 G 1 A D/N 12 1 61 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888162 1 G 1 C G/R 12 1 60 ENSG00000179295 ENST00000392597 -0 + synonymous_variant 112893822 0 T 1 C - 12 1 237 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888165 1 G 1 T D/Y 12 1 61 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888189 1 G 1 A E/K 12 1 69.0 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888189 1 G 1 A E/K 12 1 69 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888195 1 T 1 C F/L 12 1 71 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888197 1 T 1 A F/L 12 1 71 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888211 1 A 1 C E/A 12 1 76.0 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888211 1 A 1 C E/A 12 1 76 ENSG00000179295 ENST00000351677 -1 + missense_variant 112891015 1 C 1 T L/F 12 1 117 ENSG00000179295 ENST00000351677 -1 + missense_variant 112891073 1 T 1 A L/H 12 1 136 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112891116 0 T 1 C - 12 1 150 ENSG00000179295 ENST00000351677 -1 + missense_variant 112891129 1 G 1 T D/Y 12 1 155 ENSG00000179295 ENST00000351677 -1 + missense_variant 112892383 1 G 1 C V/L 12 1 181 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112892409 0 T 1 C - 12 1 189 ENSG00000179295 ENST00000351677 -1 + stop_gained 112893784 1 G 1 T - 12 1 225 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112893798 0 A 1 G - 12 1 229 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888165 1 G 1 A D/N 12 1 61 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888163 1 G 1 T G/V 12 1 60 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888162 1 G 1 C G/R 12 1 60 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112888161 0 T 1 C - 12 1 59 ENSG00000179295 ENST00000351677 -1 + missense_variant 112884103 1 G 1 A G/D 12 1 13 ENSG00000179295 ENST00000351677 -1 + missense_variant 112888139 1 C 1 G T/S 12 1 52 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112893802 0 C 1 A - 12 1 231 ENSG00000179295 ENST00000351677 -1 + missense_variant 112910775 1 C 1 T L/F 12 1 262 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112888161 0 T 1 C - 12 1 59 ENSG00000179295 ENST00000392597 -1 + missense_variant 112910837 1 C 1 G I/M 12 1 282 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926887 1 G 1 C G/R 12 1 503 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926908 1 C 1 G Q/E 12 1 510.0 ENSG00000179295 ENST00000351677 -1 + missense_variant 112939963 1 G 1 C G/R 12 1 539 ENSG00000179295 ENST00000351677 -1 + missense_variant 112939970 1 A 1 T E/V 12 1 541 ENSG00000179295 ENST00000351677 -1 + missense_variant 112939981 1 A 1 C I/L 12 1 545 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112939993 0 C 1 T - 12 1 549 ENSG00000179295 ENST00000351677 -1 + missense_variant 112939999 1 G 1 A D/N 12 1 551 ENSG00000179295 ENST00000351677 -1 + missense_variant 112940012 1 G 1 A G/E 12 1 555 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112940025 0 T 1 C - 12 1 559 ENSG00000179295 ENST00000351677 -1 + missense_variant 112940027 1 T 1 C L/P 12 1 560 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112940031 0 G 1 A - 12 1 561 ENSG00000179295 ENST00000351677 -1 + missense_variant 112940036 1 G 1 T C/F 12 1 563 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112940052 0 C 1 T - 12 1 568 ENSG00000179295 ENST00000351677 -1 + missense_variant 112884103 1 G 1 A G/D 12 1 13 ENSG00000179295 ENST00000392597 -1 + missense_variant 112888139 1 C 1 G T/S 12 1 52 ENSG00000179295 ENST00000392597 -1 + missense_variant 112926885 1 C 1 T S/L 12 1 502 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926884 1 T 1 C S/P 12 1 502 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112926862 0 C 1 T - 12 1 494 ENSG00000179295 ENST00000351677 -1 + missense_variant 112924286 1 C 1 T T/M 12 1 411 ENSG00000179295 ENST00000351677 -1 + missense_variant 112910844 1 T 1 G F/V 12 1 285.0 ENSG00000179295 ENST00000351677 -0 + synonymous_variant 112915507 0 A 1 G - 12 1 302 ENSG00000179295 ENST00000351677 -1 + missense_variant 112915523 1 A 1 G N/D 12 1 308 ENSG00000179295 ENST00000351677 -1 + missense_variant 112915743 1 A 1 G N/S 12 1 339 ENSG00000179295 ENST00000351677 -1 + missense_variant 112919908 1 T 1 G Y/D 12 1 375 ENSG00000179295 ENST00000351677 -1 + frameshift_variant 112920002 1 - 1 T - 12 1 406 ENSG00000179295 ENST00000351677 -1 + stop_gained 112924308 1 C 1 A - 12 1 418 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926852 1 C 1 T P/L 12 1 491 ENSG00000179295 ENST00000351677 -1 + missense_variant 112924331 1 A 1 T H/L 12 1 426 ENSG00000179295 ENST00000351677 -1 + missense_variant 112924336 1 G 1 A V/M 12 1 428 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926248 1 G 1 A A/T 12 1 461 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926249 1 C 1 G A/G 12 1 461 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926291 1 TT 1 CA L/P 12 1 475 ENSG00000179295 ENST00000351677 -1 + missense_variant 112926839 1 G 1 T D/Y 12 1 487 ENSG00000179295 ENST00000351677 +MUTS_PAM STRAND MOST_SEVERE START MUTS_PAM_SAMPLES REF MUTS_CS ALT AA_CHANGE CHR MUTS_CS_SAMPLES PROTEIN_POS GENE TRANSCRIPT +5 + missense_variant 112926888 5 G 5 T G/V 12 5 503 ENSG00000179295 ENST00000351677 +4 + missense_variant 112926270 4 C 4 T T/M 12 4 468 ENSG00000179295 ENST00000351677 +3 + missense_variant 112888198 3 G 3 A A/T 12 3 72 ENSG00000179295 ENST00000392597 +3 + missense_variant 112888198 3 G 3 A A/T 12 3 72 ENSG00000179295 ENST00000351677 +2 + missense_variant 112926910 2 G 2 C Q/H 12 2 510 ENSG00000179295 ENST00000351677 +2 + missense_variant 112926909 2 A 2 T Q/L 12 2 510 ENSG00000179295 ENST00000351677 +2 + missense_variant 112926900 2 C 2 A T/K 12 2 507 ENSG00000179295 ENST00000351677 +2 + missense_variant 112891006 2 C 2 T H/Y 12 2 114 ENSG00000179295 ENST00000392597 +2 + missense_variant 112888210 2 G 2 A E/K 12 2 76 ENSG00000179295 ENST00000392597 +2 + missense_variant 112888199 2 C 2 T A/V 12 2 72 ENSG00000179295 ENST00000392597 +2 + missense_variant 112888199 2 C 2 A A/D 12 2 72 ENSG00000179295 ENST00000392597 +2 + missense_variant 112891006 2 C 2 T H/Y 12 2 114 ENSG00000179295 ENST00000351677 +2 + missense_variant 112888210 2 G 2 A E/K 12 2 76 ENSG00000179295 ENST00000351677 +2 + missense_variant 112888199 2 C 2 T A/V 12 2 72 ENSG00000179295 ENST00000351677 +2 + missense_variant 112888199 2 C 2 A A/D 12 2 72 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112893822 0 T 1 C - 12 1 82 ENSG00000179295 ENST00000530818 +1 + missense_variant 112910837 1 C 1 G I/M 12 1 282 ENSG00000179295 ENST00000392597 +1 + missense_variant 112910844 1 T 1 G F/V 12 1 285.0 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112915507 0 A 1 G - 12 1 302 ENSG00000179295 ENST00000392597 +1 + missense_variant 112915523 1 A 1 G N/D 12 1 308 ENSG00000179295 ENST00000392597 +1 + missense_variant 112915743 1 A 1 G N/S 12 1 339 ENSG00000179295 ENST00000392597 +1 + missense_variant 112919908 1 T 1 G Y/D 12 1 375 ENSG00000179295 ENST00000392597 +1 + frameshift_variant 112920002 1 - 1 T - 12 1 406 ENSG00000179295 ENST00000392597 +1 + missense_variant 112924286 1 C 1 T T/M 12 1 411 ENSG00000179295 ENST00000392597 +1 + stop_gained 112924308 1 C 1 A - 12 1 418 ENSG00000179295 ENST00000392597 +1 + missense_variant 112924331 1 A 1 T H/L 12 1 426 ENSG00000179295 ENST00000392597 +1 + missense_variant 112924336 1 G 1 A V/M 12 1 428 ENSG00000179295 ENST00000392597 +1 + missense_variant 112892383 1 G 1 C V/L 12 1 26 ENSG00000179295 ENST00000530818 +0 + synonymous_variant 112892409 0 T 1 C - 12 1 34 ENSG00000179295 ENST00000530818 +1 + stop_gained 112893784 1 G 1 T - 12 1 70 ENSG00000179295 ENST00000530818 +0 + synonymous_variant 112893798 0 A 1 G - 12 1 74 ENSG00000179295 ENST00000530818 +1 + missense_variant 112910775 1 C 1 T L/F 12 1 262 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112893822 0 T 1 C - 12 1 237 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112893802 0 C 1 A - 12 1 231 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888211 1 A 1 C E/A 12 1 76 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888165 1 G 1 T D/Y 12 1 61 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888189 1 G 1 A E/K 12 1 69.0 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888189 1 G 1 A E/K 12 1 69 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888195 1 T 1 C F/L 12 1 71 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888197 1 T 1 A F/L 12 1 71 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888211 1 A 1 C E/A 12 1 76.0 ENSG00000179295 ENST00000392597 +1 + missense_variant 112891015 1 C 1 T L/F 12 1 117 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112893798 0 A 1 G - 12 1 229 ENSG00000179295 ENST00000392597 +1 + missense_variant 112891073 1 T 1 A L/H 12 1 136 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112891116 0 T 1 C - 12 1 150 ENSG00000179295 ENST00000392597 +1 + missense_variant 112891129 1 G 1 T D/Y 12 1 155 ENSG00000179295 ENST00000392597 +1 + missense_variant 112892383 1 G 1 C V/L 12 1 181 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112892409 0 T 1 C - 12 1 189 ENSG00000179295 ENST00000392597 +1 + stop_gained 112893784 1 G 1 T - 12 1 225 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112893802 0 C 1 A - 12 1 76 ENSG00000179295 ENST00000530818 +1 + missense_variant 112888163 1 G 1 T G/V 12 1 60 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888165 1 G 1 A D/N 12 1 61 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888162 1 G 1 C G/R 12 1 60 ENSG00000179295 ENST00000392597 +0 + synonymous_variant 112893822 0 T 1 C - 12 1 237 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888165 1 G 1 T D/Y 12 1 61 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888189 1 G 1 A E/K 12 1 69.0 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888189 1 G 1 A E/K 12 1 69 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888195 1 T 1 C F/L 12 1 71 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888197 1 T 1 A F/L 12 1 71 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888211 1 A 1 C E/A 12 1 76.0 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888211 1 A 1 C E/A 12 1 76 ENSG00000179295 ENST00000351677 +1 + missense_variant 112891015 1 C 1 T L/F 12 1 117 ENSG00000179295 ENST00000351677 +1 + missense_variant 112891073 1 T 1 A L/H 12 1 136 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112891116 0 T 1 C - 12 1 150 ENSG00000179295 ENST00000351677 +1 + missense_variant 112891129 1 G 1 T D/Y 12 1 155 ENSG00000179295 ENST00000351677 +1 + missense_variant 112892383 1 G 1 C V/L 12 1 181 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112892409 0 T 1 C - 12 1 189 ENSG00000179295 ENST00000351677 +1 + stop_gained 112893784 1 G 1 T - 12 1 225 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112893798 0 A 1 G - 12 1 229 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888165 1 G 1 A D/N 12 1 61 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888163 1 G 1 T G/V 12 1 60 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888162 1 G 1 C G/R 12 1 60 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112888161 0 T 1 C - 12 1 59 ENSG00000179295 ENST00000351677 +1 + missense_variant 112884103 1 G 1 A G/D 12 1 13 ENSG00000179295 ENST00000351677 +1 + missense_variant 112888139 1 C 1 G T/S 12 1 52 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112893802 0 C 1 A - 12 1 231 ENSG00000179295 ENST00000351677 +1 + missense_variant 112910775 1 C 1 T L/F 12 1 262 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112888161 0 T 1 C - 12 1 59 ENSG00000179295 ENST00000392597 +1 + missense_variant 112910837 1 C 1 G I/M 12 1 282 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926887 1 G 1 C G/R 12 1 503 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926908 1 C 1 G Q/E 12 1 510.0 ENSG00000179295 ENST00000351677 +1 + missense_variant 112939963 1 G 1 C G/R 12 1 539 ENSG00000179295 ENST00000351677 +1 + missense_variant 112939970 1 A 1 T E/V 12 1 541 ENSG00000179295 ENST00000351677 +1 + missense_variant 112939981 1 A 1 C I/L 12 1 545 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112939993 0 C 1 T - 12 1 549 ENSG00000179295 ENST00000351677 +1 + missense_variant 112939999 1 G 1 A D/N 12 1 551 ENSG00000179295 ENST00000351677 +1 + missense_variant 112940012 1 G 1 A G/E 12 1 555 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112940025 0 T 1 C - 12 1 559 ENSG00000179295 ENST00000351677 +1 + missense_variant 112940027 1 T 1 C L/P 12 1 560 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112940031 0 G 1 A - 12 1 561 ENSG00000179295 ENST00000351677 +1 + missense_variant 112940036 1 G 1 T C/F 12 1 563 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112940052 0 C 1 T - 12 1 568 ENSG00000179295 ENST00000351677 +1 + missense_variant 112884103 1 G 1 A G/D 12 1 13 ENSG00000179295 ENST00000392597 +1 + missense_variant 112888139 1 C 1 G T/S 12 1 52 ENSG00000179295 ENST00000392597 +1 + missense_variant 112926885 1 C 1 T S/L 12 1 502 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926884 1 T 1 C S/P 12 1 502 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112926862 0 C 1 T - 12 1 494 ENSG00000179295 ENST00000351677 +1 + missense_variant 112924286 1 C 1 T T/M 12 1 411 ENSG00000179295 ENST00000351677 +1 + missense_variant 112910844 1 T 1 G F/V 12 1 285.0 ENSG00000179295 ENST00000351677 +0 + synonymous_variant 112915507 0 A 1 G - 12 1 302 ENSG00000179295 ENST00000351677 +1 + missense_variant 112915523 1 A 1 G N/D 12 1 308 ENSG00000179295 ENST00000351677 +1 + missense_variant 112915743 1 A 1 G N/S 12 1 339 ENSG00000179295 ENST00000351677 +1 + missense_variant 112919908 1 T 1 G Y/D 12 1 375 ENSG00000179295 ENST00000351677 +1 + frameshift_variant 112920002 1 - 1 T - 12 1 406 ENSG00000179295 ENST00000351677 +1 + stop_gained 112924308 1 C 1 A - 12 1 418 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926852 1 C 1 T P/L 12 1 491 ENSG00000179295 ENST00000351677 +1 + missense_variant 112924331 1 A 1 T H/L 12 1 426 ENSG00000179295 ENST00000351677 +1 + missense_variant 112924336 1 G 1 A V/M 12 1 428 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926248 1 G 1 A A/T 12 1 461 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926249 1 C 1 G A/G 12 1 461 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926291 1 TT 1 CA L/P 12 1 475 ENSG00000179295 ENST00000351677 +1 + missense_variant 112926839 1 G 1 T D/Y 12 1 487 ENSG00000179295 ENST00000351677 diff --git a/data/refAPSES.mfa b/data/refAPSES.mfa index 9e62ba3..435e365 100644 --- a/data/refAPSES.mfa +++ b/data/refAPSES.mfa @@ -1,39 +1,39 @@ ->MBP1_ASPNI AN3154 XP_660758 Q5B8H6 --VYSATYSSVPVYEFKIGTDSVMRRRSDDWINATHILKVAGFDKPARTRI -LEREVQKGVHEKVQGGYGKYQGTWIPLQEGRQLAERNNILDKLLPIFDY - ->MBP1_BIPOR COCMIDRAFT_338 XP_007682304 W6ZM86 -KIYSATYSNVPVYECNVNGHHVMRRRADDWINATHILKVADYDKPARTRI -LEREVQKGVHEKVQGGYGKYQGTWIPLEEGRGLAERNGVLDKMRAIFDY - ->MBP1_COPCI - XP_001837394 A8NYC6 -QIFKATYSGIPVYEMMCKGVAVMRRRSDSWLNATQILKVAGFDKPQRTRV -LEREVQKGEHEKVQGGYGKYQGTWIPLERGMQLAKQYNCEHLLRPIIEF - ->MBP1_CRYNE - XP_569090 Q5KMQ9 -DYVPTSVSPPPAPKHSVA--PPSKARRDKEKETGRTKATPSRTGPTSAAA -LQAQAQLN-RAKMHDSTPDADASFRSFEERVSLTEDDSSSDTPSPVASV - ->MBP1_NEUCR Swi4 XP_955821 Q7RW59 --IYSATYSGIPVWEYQFGVDHVMRRRHDDWVNATHILKAAGFDKPARTRI -LEREVQKDTHEKIQGGYGRYQGTWIPLEQAEALARRNNIYERLKPIFEF - ->MBP1_PUCGR PGTG_08863 XP_003327086 E3KED4 --IYKATYSGVPVLEMPCEGIAVMRRRSDSWLNATQILKVAGFDKPQRTRV -LEREIQKGTHEKIQGGYGKYQGTWVPLDRGIDLAKQYGVDHLLSALFNF - ->MBP1_SACCE Mbp1 NP_010227 P39678 -QIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRI -LEKEVLKETHEKVQGGFGKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDF - ->MBP1_SCHPO Res2 NP_593032 P41412 --VHVAVYSGVEVYECFIKGVSVMRRRRDSWLNATQILKVADFDKPQRTRV -LERQVQIGAHEKVQGGYGKYQGTWVPFQRGVDLATKYKVDGIMSPILS- - ->MBP1_USTMA UMAG_11222 XP_011392621 A0A0D1DP35 --IFKATYSGVPVYECIINNVAVMRRRSDDWLNATQILKVVGLDKPQRTRV -LEREIQKGIHEKVQGGYGKYQGTWIPLDVAIELAERYNIQGLLQPITSY - ->MBP1_WALME - XP_006957051 I4YGC0 --IYKACYSGVPVYEFNCKNVAVMKRRSDSWMNATQILKVANFDKPQRTRI -LEREVQKGTHEKVQGGYGKYQGTWIPMERSVELARQYRIELLLDPIINY +>MBP1_ASPNI AN3154 XP_660758 Q5B8H6 +-VYSATYSSVPVYEFKIGTDSVMRRRSDDWINATHILKVAGFDKPARTRI +LEREVQKGVHEKVQGGYGKYQGTWIPLQEGRQLAERNNILDKLLPIFDY + +>MBP1_BIPOR COCMIDRAFT_338 XP_007682304 W6ZM86 +KIYSATYSNVPVYECNVNGHHVMRRRADDWINATHILKVADYDKPARTRI +LEREVQKGVHEKVQGGYGKYQGTWIPLEEGRGLAERNGVLDKMRAIFDY + +>MBP1_COPCI - XP_001837394 A8NYC6 +QIFKATYSGIPVYEMMCKGVAVMRRRSDSWLNATQILKVAGFDKPQRTRV +LEREVQKGEHEKVQGGYGKYQGTWIPLERGMQLAKQYNCEHLLRPIIEF + +>MBP1_CRYNE - XP_569090 Q5KMQ9 +DYVPTSVSPPPAPKHSVA--PPSKARRDKEKETGRTKATPSRTGPTSAAA +LQAQAQLN-RAKMHDSTPDADASFRSFEERVSLTEDDSSSDTPSPVASV + +>MBP1_NEUCR Swi4 XP_955821 Q7RW59 +-IYSATYSGIPVWEYQFGVDHVMRRRHDDWVNATHILKAAGFDKPARTRI +LEREVQKDTHEKIQGGYGRYQGTWIPLEQAEALARRNNIYERLKPIFEF + +>MBP1_PUCGR PGTG_08863 XP_003327086 E3KED4 +-IYKATYSGVPVLEMPCEGIAVMRRRSDSWLNATQILKVAGFDKPQRTRV +LEREIQKGTHEKIQGGYGKYQGTWVPLDRGIDLAKQYGVDHLLSALFNF + +>MBP1_SACCE Mbp1 NP_010227 P39678 +QIYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHILKAANFAKAKRTRI +LEKEVLKETHEKVQGGFGKYQGTWVPLNIAKQLAEKFSVYDQLKPLFDF + +>MBP1_SCHPO Res2 NP_593032 P41412 +-VHVAVYSGVEVYECFIKGVSVMRRRRDSWLNATQILKVADFDKPQRTRV +LERQVQIGAHEKVQGGYGKYQGTWVPFQRGVDLATKYKVDGIMSPILS- + +>MBP1_USTMA UMAG_11222 XP_011392621 A0A0D1DP35 +-IFKATYSGVPVYECIINNVAVMRRRSDDWLNATQILKVVGLDKPQRTRV +LEREIQKGIHEKVQGGYGKYQGTWIPLDVAIELAERYNIQGLLQPITSY + +>MBP1_WALME - XP_006957051 I4YGC0 +-IYKACYSGVPVYEFNCKNVAVMKRRSDSWMNATQILKVANFDKPQRTRI +LEREVQKGTHEKVQGGYGKYQGTWIPMERSVELARQYRIELLLDPIINY diff --git a/data/refAPSES_PSI-BLAST.json b/data/refAPSES_PSI-BLAST.json index 6230627..fdb7251 100644 --- a/data/refAPSES_PSI-BLAST.json +++ b/data/refAPSES_PSI-BLAST.json @@ -1,490 +1,490 @@ -[ - { "name" : "68476_WALME", - "RefSeqID" : "XP_006957790", - "UniProtID" : "I4YDD8", - "taxonomyID" : "671144", - "sequence" : [ - "MKEEKEKTPPNNITGPPTPAQNILHSTPAAFGTAGTVGQGAGGFGSQLYQSPYVDSQQSVIGSPVTPAPLPKKATLKTPQ", - "PRIYSAVYSGVGVYEAMIRGIAVMRRRADGYMNATQILKVAGVDKGRRTKILEREILAGLHEKIQGGYGKYQGTWIPFER", - "GRELALQYGCDHLLAPIFDFNPSVMQPSAGRSAKSPSKKRQNSIVLSPTQERHQSSIIALNTARASGIYVGGADDPNDDG", - "LSKKEKSPVKKSKYDEVPVNVSKRPYVPPPGTNAHILTRTQQSLTALFQQPTTNSDFIPEAVAILDTTSGALHPDLAIDE", - "LGHTALHWAASLGRISNVQQLIKKGADMKRGNIEGETPLERSVLVNDNYDKKTFAYLLQELGSSIRVVDRTGRSILHHIA", - "LIAAVNGRSMSAKYYMENVLEYIARYENGEFKSLVDLQDEHGDTALNISARVGNRNLVKMLVDAGANKTVVNKLGLKASD", - "FGVEHETLNSVTGDEMLSNLQPPPPLNVDSSASVLENIHNLLNGITQQYTDETSGKNALLFEIQAELKQHSHELADVRKE", - "IQYWQNKATQMAEVDQKIKNINEAIENEKVQTWSLLGEANADKMEGIETSSSSNTSEIKIPTGDNEESLKQLRKLSKWLE", - "GTQKLTEERVASIDGLSASKEVKYKSIVSVCTGVPVNEVEGMLAQLLEAMESDANADLNKVQEFLAREC"] - }, - { "name" : "00846_COPCI", - "RefSeqID" : "XP_001831299", - "UniProtID" : "A8N8X1", - "taxonomyID" : "240176", - "sequence" : [ - "MQASTRPPGSNQPPVKIYNAVYSSVQVYECMVRGIAVMRRRNDSYVNATQILKVAGVDKGRRTKILEKEILPGKHEIVQG", - "GYGKYQGTWIPLERGRDIAAQYGVAPLLSPLFDFQPSTNSLGALPVSTPGGTASPRPLSASSSYSSMGVAGQYIPSSIPS", - "NLPPAPIMPGSALRLLNQGRAQGLFTPSTTSATLRPAGYHSPGPYGTSYAPSPQPQSSQTPPPGSGLKRNRSEAEVEGYH", - "SQPHDVQMADAPPPNTASQPNEDNPSPAKRLRTDGSITTEPASSQGQWQQQQPLPYASQQRSGPGLSQLSGHNGHGSSRP", - "PSSLSAPNGNRPAHTNPEDQTRKTRFSSKPSMPRGMDPHMPFKDARRSALIALICHRDDPTSVIDLLREISADHLNPPSF", - "DVDTVLDDQGHTALHLAASMARTQTVDMLIQTGADMHRGNHLGETPLIRACLATPNSDQQSFATLVNYLHDSIWTLDTSK", - "KSVVHHIVSLAGVKGRAVVARYYLDQIFYWIAQHEGGDFRSLVDLQDEHGDTAINIAARVGNRSLVRTLLDVGANRVLAN", - "KLGLRPGDFGVETEELSSGLRAEDLISSLRTGPPAPVQKSQDVIADMTSMIQSLSTEFQAEIKSKQDSLDVTQAHLRAAT", - "RELSEQRKQIQTWQARCGDLDQINQRVRNVEKAIAEEDMFDWTGRTELDGKDGKEKGGPAFAYRGSKSTMVGVGGSVDVS", - "FSVESEPPLPTTDTAASLVKLRRLKMWHQRMEELVKGRLKGLQGASAEKEYQCKKIVALCTGIPLDKVEEMLDNLVIAVE", - "SEAQVVDIGRVSGFMQKVRDGII"] - }, - { "name" : "8533_BIPOR", - "RefSeqID" : "XP_007691662", - "UniProtID" : "W6ZE71", - "taxonomyID" : "930090", - "sequence" : [ - "MSTSHSFPAASPSHQQSALYANSPHGHALMAAPAALNRSFSDMSAFHHHAMDKPQIYTAVYSGVSVYEMEVNRVAVMRRR", - "SDGWLNATQILKVAGVDKGKRTKVLEKEILTGEHEKVQGGYGKYQGTWINYRRGREFCRQYGVEDVLRPLLDYDITLDGS", - "HAPGHAIETPTKEQAMAANRKRFYTQSIDGRTTTQNLTGTFFSNISSTATSALAAMNKVARLNSPAPRPSSSSQRRTSAT", - "RPSQSQPPLASQDSFRTSSQQSITSEPSFAGHNGQTDSAYATAVDESQEPPRKRIRASHDDSYSQPTAADMSIHPLSSPT", - "EPSESFDQHHPAQPITLADGDVPTALPPLPYPDTKQDEEKQAMLTDLFADQTRSDFTNHPAILHLSGPDLDMPIDNSSNT", - "ALHWAATLARVSLIRLLVSKGANMFRGNASGQTALMSAVSVNNSLDHSCFPETLEILAPLIELRDSQGRTILHHIAVTCA", - "IKGRAASSKYYLEALLEYLVRSNIGGGQPPPFHDTSNHSKPIGLMRFMQEMVNARDKAGNTALNLAARIGNRNIISQLME", - "VQADPTIPNHKGTRPMDFGVGTDLGDGQGIITATSPTKAKAPLSKAEETSREIQPLMSGILQSASLQFTQEARLKQDAID", - "QTNELITQLSSQQKQEQQKLQTLRARLRQRQDRAKRISNLKRWLEPQRHMLSVNDGAIDLHDKKRIGYADTQGAGLLIKE", - "DDLPYELRQAGDHLDRRASDGPIYLSTSVPLDPSTLSQVSHQPQCQNFLLQQLPAASVLRQRIETYTATNTALLKRSRML", - "KEKDGQLEMMYRKVVSLCTKVEENRIEECLEGLVAALDSEEGEGVEVGRVREFLRKVEGVD"] - }, - { "name" : "PGTG_02039", - "RefSeqID" : "XP_003320997", - "UniProtID" : "E3JX03", - "taxonomyID" : "418459", - "sequence" : [ - "MAAHKTTNDIPVSSSHHINPESGTGTSSTQAFPIPNIKNNPHVYMAVYSSVPVYEMMVRGIGVMRRRSDSYMNATQILKV", - "AGLDKSKRTRILEREIIQGEHEKIQGGYGRYQGTWVPFTRAQELATQLNVAQLLAPLFDYRPEPNSEVNIRSTNTKPSSS", - "ASRANSHKTTLARQTSRQSLNEKRERSGDTTPLPHDPPEAGPSKRSRLNTPSRQSNGSANTPSSLIDHSHSAMDPDFIIP", - "HSQSQPTAASQCTTSTFAPIHGATVEYPAGPSHLRKSNSSSRSHLEVALKAERNIHTLMALFSNPPDGDELESETHHENP", - "NSVAEVNEVLEDPELEIDTPIDEHCHTALHWASSLARLGLVRAFLRSGADVNRGNDVGETPLMRSTLVTNNFERESFNQL", - "LELLHPSLWTLDNQDRTVLHHICLTASIKGRGESSRYYLECICEWIVNKHGAQFDSQLFDAVDLNGDTALNIAARVGNKH", - "LVRMLLDVGADMTIGNNLGLKPIDFGVGAGETSASYTDDMISAPLRRNPTASAPARSSRDIITSITSSVNSLSEDFENEI", - "RSKTDRLESVRAQLMVATRQLTTQRRQLESLKHDLDERALLELRLKKLRMAIAEEDGFDWTGRSDLDGRPAQAGKLFEQN", - "GIASTLAGLSASQIQLELEPDPFIPPENNQDSLVYLRRLEKWYVRVLSLLRERIGRMKGSNLEQEAKYLKVIGSFIGNTC", - "TNDLSSSGSSMTGRPANQTTSTTQEVPSRATQNVNPADIHDLESMDGHRRKVSTTDAVNKSHEFGRTRSELLKASMIDNK", - "LLKQLMAAIESDGPELDLNRVAGFMQRVQSGSL"] - }, - { "name" : "MBPA_ASPNI", - "RefSeqID" : "XP_664319", - "UniProtID" : "Q5AYB5", - "taxonomyID" : "227321", - "sequence" : [ - "MTTSNHHQQRPSLSMSYSQGSIGSANGMSFSQSQMSSLNASQSVASTPRATPPPKSSQQSAMSFNYSNGLPNGARASFSG", - "FEDMNGYGTMIYHEEFKPQIYRAVYSNVSVYEMEVNGVAVMKRRSDGWLNATQILKVAGVVKARRTKTLEKEIAAGEHEK", - "VQGGYGKYQGTWVNYQRGVELCREYHVEELLRPLLEYDMNPNGTAASGQDSLDTPTKEQAMAAQRKRLYSGMENRSMSQP", - "QQGTFFQNISRTAATAVNAMSKARFESPAARGGDSRRLSVIRKPSQQMGSQDAQPPFGSQQSFYSAASDSGFASNIPTNG", - "RYAPQDAMSFEQEEPMEPPRKRIRSSQAFSLPIDGTSMSMSEPTPTEPNDSFYQDMEPLHHIDEGRHGLDPLPPATTPER", - "FQKMKLIMTLFLDKTTKDFSTHPALIQLSGEDLEVPLDEYRNNALHWAAMLARMPLVYALVKKGVNIARLNGAGETALQK", - "AVGTRNNLDYRSFPRLLQVLAPTIDMVDRSGRTILHHIAVMAATGHGGHVSAKHYLEALLEFIVRHGGTSLNQQSNGTAS", - "QPGMPLSNEVITLGRFISEIVNLRDDQGDTALNLAGRARSVLVPQLLEVGADPHIPNHTGLRPADYGVGVDMVDGSSQPA", - "GSRSDTFLAQLAKTRKEILEATTAQVTAIVQETLGTFDKELAASLTSKQEKFDHWHAKIRESAKARQIEQKQLDELKRRS", - "IDRTETSRRLKNLEKSSTDLLEAHKEILTNLGDTSKPVSLGDADQESGFEIAEFEALFPETFDPASGFSEAQIAYLRKLP", - "SAEILEQRVSCYRAFNKETLDEIDALRSKNVVLGQNYRRMVMACTGWSAEQVDEAAEGLTQCVKELNDNPVPEDEAIEIL", - "MRDRGQDW"] - }, - { "name" : "05520_CRYNE", - "RefSeqID" : "XP_570545", - "UniProtID" : "Q5KHS0", - "taxonomyID" : "214684", - "sequence" : [ - "MEPPSNPIQPPVTPSHHSLLSAISPALSEQTPAPIHTLPPHLRPSIPQPHIAPPRPSSVQPTMEEQQRMHHIQQHQQQQH", - "FQQQQNDENVFGSVMGAPGHVPGHEAPMSTQPKVYASVYSGVPVFEAMIRGISVMRRASDSWVNATQILKVAGVHKSART", - "KILEKEVLNGIHEKIQGGYGKYQGTWVPLDRGRDLAEQYGVGSYLSSVFDFVPSASVIAALPVIRTGTPDRSGQQTPSGL", - "PGHPNQRVISPFANHGQTTPHMPPPQFIHQGNEQMMNLPPHPSSLAYPTQPKPYFSMPLQHTVGPQYDERHEGMTMTPTM", - "SMDGLAPPADIARMGFPYNPSDIYIDQYGQPHATYQASPYGKESGHPSKRQRSDAEGSYIESGAAVQQHVEQDEEADDGL", - "DNDSTASDDARDPPPLPSSMLLPHKPIRPKATPANGRIKSRLVQIFNVEGQVNLRSVFGLAPDQLPNFDIDMVIDDQGHS", - "ALHWACALARLSIVQQLIELGADIHRGNYAGETPLIRAVLTSNHAEAGSFTDLLHLLSPSIRTLDHAYRTVLHHIALVAG", - "VKGRVPAARTYMASVLEWVAREQQANNTHSITNPPNPADRNELAPINLRTLVDVQDVHGDTALNVAARVGNKGLVGLLLD", - "AGADKTRANKLGLRPENFGLEIEALKISNGEAVMANLKSEVSKPERKSRDVQKNIATIFESISSTFSSEMLAKQTKLNAT", - "EASVRHATRALADKRQHLHRAQEKLATMQLFEQRSENVRRIMDAIAAGTLLTPAEFTGRTQTMHEKSTGQLPPLAFRHVP", - "GLALDASSQSQLNGAPPSTPLSVEDQEDIALPERDDPECLVKLRRMALWEDRIAEVLEDKIRAMEGEGVDRAVKYRKLVS", - "VCAKVPVDKVDSMLDGLVAAVESEGQGLDFSRASNFVNRIKATKS"] - }, - { "name" : "RES1_SCHPO", - "RefSeqID" : "NP_595496", - "UniProtID" : "P33520", - "taxonomyID" : "284812", - "sequence" : [ - "MYNDQIHKITYSGVEVFEYTINGFPLMKRCHDNWLNATQILKIAELDKPRRTRILEKFAQKGLHEKIQGGCGKYQGTWVP", - "SERAVELAHEYNVFDLIQPLIEYSGSAFMPMSTFTPQSNRKPTEAYRRNSPVKKSFSRPSHSLLYPYTSSNNMTSTSRMS", - "GIHDALSLQSDFTRSPDMPSDSFTGSLHDIKASPFSSNNYAQSLLDYFLLPNTTQPPDFVYDRPSDWDVNAGIDEDGHTA", - "LHWAAAMGNLEMMHALLQAGANVVAVNYLQQTSLMRCVMFTMNYDLQTFEVVSELLQSAICMNDSFGQTVFHHIALLASS", - "KSKMEAARYYMDILLQNLTATQSVDVAAQIINLQDDHGDTALLICARNGAKKCARLLLSFYASSSIPNNQGQYPTDFLSS", - "KDMSFPENDDSPLNSKIEDNLIDNLKYPQSLDDHLSSKKPISYFSNKLTHQTLPNVFTQLSELSKCHEASLAEKQLTYNL", - "AMEALEQTVRETETCQRLWNERTNNDENYLVNQREDLIHQCKKFLHTLKTARYYLETVQLHQLKKYVTYFSQIWSTDELA", - "DISETKNLVGHDTKTNRSSLSSKHEVDLFTAENEAAREKLVEQLCSLQAQRKQKINEILNLLSMGMYNTINTDQSGS"] - }, - { "name" : "CDC10_SCHPO", - "RefSeqID" : "NP_596132", - "UniProtID" : "P01129", - "taxonomyID" : "284812", - "sequence" : [ - "MASANFIRQFELGNDSFSYQKRPEDEPSQPLSNRNINKLNDSSTLKDSSSRIFINSQVLRDGRPVELYAVECSGMKYMEL", - "SCGDNVALRRCPDSYFNISQILRLAGTSSSENAKELDDIIESGDYENVDSKHPQIDGVWVPYDRAISIAKRYGVYEILQP", - "LISFNLDLFPKFSKQQQIESSSISKNLNTSSFNTRSPLRNHNFSNPSKSSKNGVHTINNMQSSPSPSSSFLLPLTQIDSQ", - "NVKRSNNYLSTSPPILEQRLKRHRIDVSDEDLHPSSQLNDNEASSLFPDTPRLNHSLSFVSLVSSLPPLDQNIMQDYHTS", - "KDILTSIFLDVNFADSSALEAKLSDSLDLDVPIDELGHAALHWAAAVAKMPLLQALIHKGANPLRGNLTGETALMRSVLV", - "TNHLNQNSFGDLLDLLYASLPCTDRAGRTVVHHICLTAGIKGRGSASRYYLETLLNWAKKHASGNNGYMLKDFINYLNHQ", - "DKNGDTALNIAARIGNKNIVEVLMQAGASAYIPNRAGLSVANFGIFVENALKQPEDSKQTKVSLMSENLSSKEKTAVPPR", - "QKSRDIIASVTDVISSLDKDFQDEMAAKQSMIDSAYTQLRESTKKLSDLREQLHVSETQRTLFLELRQRCKNLMTSIEEQ", - "KSELSNLYESFDPNGIHDSLSLDADAPFTVNENNNKNLSIAELKFQVAAYERNEARLNELANKLWQRNSNIKSKCRRVVS", - "LCTGVDESRVDSLLESLLQAVESDGQQGEVDMGRVAGFLRVVKEHQA"] - }, - { "name" : "05338_USTMA", - "RefSeqID" : "XP_011392041", - "UniProtID" : "A0A0D1BWD8", - "taxonomyID" : "237631", - "sequence" : [ - "MPLNYFANQDQTASDTYAHEASSFPAPSSILTDTSKPLQPVQEVAASSLVDGVSFTSPHASIIHASKQSPRAASSLSFTT", - "SALQRAGLLPANPNMSTTATSGTSAASESLQRVITQGTASAAAINGASTPAHSGPLTPAHLKNLTPAQANAALQNPVGNI", - "PTVYLATYSNVPVYEITVRGIAVMRRRGDGWLNATQILKIAGIEKTRRTKILEKSILTGEHEKIQGGYGKFQGTWIPLQR", - "AQQVAAEYNVSHLLQPILEFDPATADQIPKLYQRKKPAASARNSSASAINDARGSTPSKIYSPAPASLGGPSQQPRFLSL", - "RPPKETHEQEISSAIFMPPGTAGLLSNGTFVDDRAASALAYPGPPAIPPGSTPAEQAALRSYNVYGYTPQGVPLPSSAAA", - "DGNGTEAAATAASTGAGKREASETDQDGASAAKRSRLTSPQQQRRDDGLLLGPSPVKDLNALGPAGGSLRAASAPRGHRI", - "TVGPPDAAGRDGAVPRYADRALPPKPYDEGEKRMRDRLVSLFSDDGVLPGVSEATGAGASQSAADEDDDAYVAKLDSLLA", - "DLREKASLGGLGASGTDGPKATVDLITDDHGHTALHWASALCRVKLVRTLVARPPWQGGANIHAGNHAGETALHRSVLVT", - "NSYDASSFPTLLNLLSSSLNTRDFKKRTVLHHISLVAALKGRAASARYYLACVLEHISAEKNSKYKGLIDAQDEDGETAL", - "GIVARLGNASMVRMLLDVGARKDLANALGIRPSDWGIESSADGASLTPSQNDGTNTVASLPPLTAADLASQNPSDIISAL", - "TRPAQVPVMKSSDVRDQLSSTLDDLQSSFERELKEKQDAVSTVQSHLQAATRDLAARRKTVSAAQAKLAEKDEARQRVQN", - "LRRAIVAQLGLEEADADLSLEQLVEEAANAASAAPADKSADKMDIDGAEDVKPVRASNLETLIDDILSFDTIQSDLKAVG", - "TSAVTQEVVEQDELVRLRWLVSFYQSSCDELSSTISELEDSSAKKESQCQQVVAICANIPQDKVESMLDELLTAMESDGP", - "DVDLARVANFMQKVGKTRENGDQPGVGAQLSSSTSLSTAVSSGGTAASSVVPAVERDGEDAKPDA"] - }, - { "name" : "SWI4_SACCE", - "RefSeqID" : "NP_011036", - "UniProtID" : "P25302", - "taxonomyID" : "559292", - "sequence" : [ - "MPFDVLISNQKDNTNHQNITPISKSVLLAPHSNHPVIEIATYSETDVYECYIRGFETKIVMRRTKDDWINITQVFKIAQF", - "SKTKRTKILEKESNDMQHEKVQGGYGRFQGTWIPLDSAKFLVNKYEIIDPVVNSILTFQFDPNNPPPKRSKNSILRKTSP", - "GTKITSPSSYNKTPRKKNSSSSTSATTTAANKKGKKNASINQPNPSPLQNLVFQTPQQFQVNSSMNIMNNNDNHTTMNFN", - "NDTRHNLINNISNNSNQSTIIQQQKSIHENSFNNNYSATQKPLQFFPIPTNLQNKNVALNNPNNNDSNSYSHNIDNVINS", - "SNNNNNGNNNNLIIVPDGPMQSQQQQQHHHEYLTNNFNHSMMDSITNGNSKKRRKKLNQSNEQQFYNQQEKIQRHFKLMK", - "QPLLWQSFQNPNDHHNEYCDSNGSNNNNNTVASNGSSIEVFSSNENDNSMNMSSRSMTPFSAGNTSSQNKLENKMTDQEY", - "KQTILTILSSERSSDVDQALLATLYPAPKNFNINFEIDDQGHTPLHWATAMANIPLIKMLITLNANALQCNKLGFNCITK", - "SIFYNNCYKENAFDEIISILKICLITPDVNGRLPFHYLIELSVNKSKNPMIIKSYMDSIILSLGQQDYNLLKICLNYQDN", - "IGNTPLHLSALNLNFEVYNRLVYLGASTDILNLDNESPASIMNKFNTPAGGSNSRNNNTKADRKLARNLPQKNYYQQQQQ", - "QQQPQNNVKIPKIIKTQHPDKEDSTADVNIAKTDSEVNESQYLHSNQPNSTNMNTIMEDLSNINSFVTSSVIKDIKSTPS", - "KILENSPILYRRRSQSISDEKEKAKDNENQVEKKKDPLNSVKTAMPSLESPSSLLPIQMSPLGKYSKPLSQQINKLNTKV", - "SSLQRIMGEEIKNLDNEVVETESSISNNKKRLITIAHQIEDAFDSVSNKTPINSISDLQSRIKETSSKLNSEKQNFIQSL", - "EKSQALKLATIVQDEESKVDMNTNSSSHPEKQEDEEPIPKSTSETSSPKNTKADAKFSNTVQESYDVNETLRLATELTIL", - "QFKRRMTTLKISEAKSKINSSVKLDKYRNLIGITIENIDSKLDDIEKDLRANA"] - }, - { "name" : "SWI6_NEUCR", - "RefSeqID" : "XP_962967", - "UniProtID" : "Q7SBG9", - "taxonomyID" : "367110", - "sequence" : [ - "MQPPQLGGASQQSQPSSQQSFSMSQSSQSVYRQYTDPPNRLHNDHAVPTIYSATYSGVGVYEMEVNNVAVMRRQKDGWVN", - "ATQILKVANIDKGRRTKILEKEIQIGEHEKVQGGYGKYQGTWIPFERGLEVCRQYGVEELLSKLLTHNRGQEGETGNVDT", - "PTKEQAMAAQRKRMYNASSQENRGIGSTGTFFKNISSTASTAVAAISKARFDSPAPRNRSGPSRAPSFNRQSSMQDVADF", - "PNSQQSLVSTEYATQTQNADSGFGSQTTQPLAGDGLEQPPRKRQRVLTPARSFGGQTPGHQPLDPFNAGNIANGDSGSPT", - "EPSNSFNYDQVTANDGDASYALGPLRPLPYENNADAEAKRGMLMGLFMDANGPEEAIQAALCNVSPQELDSPIDTQSHTA", - "LHWAATLSRMPLLRALIHAGANPWRVNACGETALMRACTVTNSMENNTFPELLDLLGCTLDVTDDKGRTVLHHIAVTSAV", - "KGRHYASRYYLESLLEWVVRQGSAPSSQENGIGDRKGRRMGIARFMSEIVNAQDNSGDTALNVAARVGNRSIISQLLEVG", - "ADPTIPNRANLKPLDFGIGIADAETNDDPAQEKTGATTGSGHKSRETSDEVVRSITHLIGESASIFQNELKKKQESIDTL", - "HSQLRVTSSQVGDARRTLESLQEKLKAQQLAKQKIVNFNRACEEEEQILIELEQRHGRLDVASANAWEMELESALEIVKT", - "QSPKGLDPDSRPSLPSAAVLRARIKALRARSSKTRQAVAALQAQSKEKELKYRRLVSLCTRRPEIEVEALLDTLTRAVES", - "EKPELEIARVRRFLGGVEGVVH"] - }, - { "name" : "15042_USTMA", - "RefSeqID" : "XP_011388143", - "UniProtID" : "A0A0D1CVS5", - "taxonomyID" : "237631", - "sequence" : [ - "MSTASPLHHGHGNGSYANSPAPTGVTGRDAGVAAAAVADSAVRSGSVPASASGSAPGSASGSMYGEAHTQHHTGHHHYSA", - "HHTHSHGALTSPVNGGHSSSWSPYGYPAAPVYGGSPSPYGHNAYSQYASGYGYANGTAHHVATAPTTPSATSTAYHTGVN", - "GMMMHHGQHAGYGYSSHHLGSHTPTHTHTHSSAYFMNGDGAHSHLNSSAHLTSPSYTTAPQYSTQLPLAGRHRVTTTLWE", - "DEGTLCFQVDARGVCVARRHDNNMINGTKLLNVCGMSRGKRDGILKNEKERIVVKVGAMHLKGVWISFARAKQLAEQNGI", - "ADALYPLFEPNIQSFLYHPDNYPRTAAVIAAAQERQAQRQRAPGGQPSPGANGTSQAPPLMRANTTPSNGDTSTFSSGLS", - "SLGSWTGSHDQGHASAPTTAQPSPSSMHNGATQMHMSLSNHGTASPTYAQSQQQQQQQQQQQQQQQQQQQQQQQQAYPMT", - "AAQQLARPSVGDRRQSAPISLNNSVGHAENPYGATNLGGAANGGLVNGARKVSGLKRSWNDADDLNGSAAASPTERDMQR", - "SGSGGSNGLKLDGDDLHSPDSSDDRLAKKTRGMPQRGGGATTAMPSMSTNMLMGVGNGSGIHHE"] - }, - { "name" : "04778_USTMA", - "RefSeqID" : "XP_011391646", - "UniProtID" : "A0A0D1DQM4", - "taxonomyID" : "237631", - "sequence" : [ - "MNQAPLSATGVNFYISGPRPARLFPTPIHEFRKGKYATAGGESGFMTVFEYDVRGHTMMIDVDTSFVRFTSITQALGKNK", - "VNFGRLVKTCPALDPHITKLKGGYLSIQGTWLPFDLAKELSRRIAWEIRDHLVPLFGYDFPSTCLRPDSEGFGQLAIGMS", - "QKRARKRHNNGGPHQTSCYGPSLPISIELWQHSTDPLRDLGESSVVGGQAIEHVSAKNSAVQPCYGSSQPATFHYSKGYG", - "LESRPWYGQDYLESNSLESMWNSAQAGGGSVGLQVPISTCGATASPCLAAIGANGGSPILSSPPSSNASSSSNQSYTAAG", - "YGLMVPPTVPSHSVNSEAGANQAEGPTPIDGSRSYASLTAHGYATGYGDANASLSTWNDATHASTFTLHVHAHVHFQPPD", - "PESAQLFTIHDFGSDPFYAEQVERG"] - }, - { "name" : "STUA_ASPNI", - "RefSeqID" : "XP_663440", - "UniProtID" : "P36011", - "taxonomyID" : "227321", - "sequence" : [ - "MASMNQPQPYMDVHSHLSSGQTYASHPATAGALTHYQYPQQPPVLQPTSTYGPASSYSQYPYPNSVASSQSVPPPTTSIS", - "SQVPAQLLPLPVTNHPVPTHGYGNNSGTPMQGYVYDPTGQMAPPGAKPRVTATLWEDEGSLCYQVEAKGVCVARREDNGM", - "INGTKLLNVAGMTRGRRDGILKSEKVRNVVKIGPMHLKGVWIPFDRALEFANKEKITDLLYPLFVQHISNLLYHPANQNQ", - "RNMTVPDSRRLEGPQPVVRTPQAQQPPSLHHHSLQTPVPSHMSQPGGRPSLDRAHTFPTPPARMNSSVPNTQPLSIDTSL", - "SNARSMPTTPATTPPGNNLQGMQSYQPQSGYDSKPYYSAAPSTHPQYAPQQPLPQQSMAQYGHSMPTSSYRDMAPPSSQR", - "GSVTEIESDVKTERYGQGTVAKTEPEQEQEYAQPDSGYNTGRGSYYTTNPSVGGLAHDHSQLTPDMTGSPQQNGSGRMTP", - "RTSNTAPQWAPGYTTPPRPAAASSLYNIVSDTRGTSGANGSTSDNYSVASNSGYSTGMNGSMGSNKRMRDDDDDRIVPPD", - "SRGEFDTKRRKTLTETPVGGPVGGVPLGLQPMKAGGSLISARR"] - }, - { "name" : "STUA_NEUCR", - "RefSeqID" : "XP_960837", - "UniProtID" : "Q1K6U0", - "taxonomyID" : "367110", - "sequence" : [ - "MNPNTPADVYYGQMSQGSSMPVTTVPSHSHYASQQPPPLLQPGSTYAHQYGTPQYGYANALSSPASIPPSLPPSMNSMAG", - "QSVLPLPGSGSMNPAVYASGGFDTTGQVAPPGMKPRVTATLWEDEGSLCFQVEARGICVARREDNAMINGTKLLNVAGMT", - "RGRRDGILKSEKVRHVVKIGPMHLKGVWIPFERALDFANKEKITELLYPLFVHNIGALLYHPTNQSRTSQVMAAAEQRRK", - "DSHGQLRGPPGLPSLQQHHHHHSMLPGPPSLPSHPSMGRPALDRAHTFPTPPTSASSVMGPMGNSDGYQWSQQSMSGTQG", - "NSSLSLDTSLGSNARSMPSTPATTPPGSTIQSMQNYPPVSQSYESSRQMYQGQSAQQAQYQSQQHYSSQPQHQERPVYSQ", - "SSYIKNDMGPPSGRPTGQSNDASDSKPPTGMIHQGQGQSDPGTHAGSEEDDDANNEAEYTHDSGGYDANRGSYNYNTQAV", - "NSLPHDHGLAPEIGGSPHQAGSGRATPRTAAAPSSYYSAQGYHTPPRGQPSSSLYNVMSNERTGSNGTQGNEMYAGQADM", - "PSSLPNGYSAQPSVMNGSSGGLKRGRDDDDDGGRPTTSAPNLGPGMDMKRRKTMMDGGSLPSPTYTATIAQAAPSAIAAH", - "RRR"] - }, - { "name" : "PHD1_SACCE", - "RefSeqID" : "NP_012881", - "UniProtID" : "P36093", - "taxonomyID" : "559292", - "sequence" : [ - "MYHVPEMRLHYPLVNTQSNAAITPTRSYDNTLPSFNELSHQSTINLPFVQRETPNAYANVAQLATSPTQAKSGYYCRYYA", - "VPFPTYPQQPQSPYQQAVLPYATIPNSNFQPSSFPVMAVMPPEVQFDGSFLNTLHPHTELPPIIQNTNDTSVARPNNLKS", - "IAAASPTVTATTRTPGVSSTSVLKPRVITTMWEDENTICYQVEANGISVVRRADNNMINGTKLLNVTKMTRGRRDGILRS", - "EKVREVVKIGSMHLKGVWIPFERAYILAQREQILDHLYPLFVKDIESIVDARKPSNKASLTPKSSPAPIKQEPSDNKHEI", - "ATEIKPKSIDALSNGASTQGAGELPHLKINHIDTEAQTSRAKNELS"] - }, - { "name" : "08099_COPCI", - "RefSeqID" : "XP_001836714", - "UniProtID" : "A8NVH3", - "taxonomyID" : "240176", - "sequence" : [ - "MSTGMLQETLQTTSASTSGTRFRPYASPNHQVTKGRYITSNDPRGYIPVYEYPLNGQWIMMDIDDGYILWTGIWKALGNS", - "KADIVKMIDSQPDLAPLIRRVRGGYLKIQGTWMPYEVALKLSRRVAWPIRHDLVPLFGPTFPSTCLSPDQPGYGQVVASS", - "NVRRRARRNTQATAQPPREAHSNWTVMTPGPMVGLSFPHSQFSRPPLPPLAPTPARSPSDYAPSSHYGNQLDPQDARRYS", - "HSPYSPLASPPERKSSISSKALSLEIPPVRPSSSKAREDISLPPLKQPDGADPEMSPYALPPISALEDLRGVDTQDSAAV", - "LRRLRLDDDYPSSSRSSTSQDSIWGRRHSLSAHSPHPRSSDNSRFQPYLSSRSYQDSTLKRSRSPAESYADRRRASDFSQ", - "EDSTSAYSPISPATPNSSILSHSSFSDLKKLASSTDTRYNFPRISGRDWAPLKGDTDHIRSSYRSGPSPLELDSDSESSA", - "PHRPW"] - }, - { "name" : "68479_WALME", - "RefSeqID" : "XP_006957792", - "UniProtID" : "I4YDE0", - "taxonomyID" : "671144", - "sequence" : [ - "MTNKVQELWWEENKTRVWQVEVDNGNYVARRQDNDQINGTKLLNITKITRGKRDGILKNEKSRQVVKTGTITLKGVWIPF", - "ERAIILARQFNIEQQLYPLFETNLGDYVENSIGSHQIKRKSLNNLMDSLTTNRELVSKRRSTVSTYNPATSAYVSPYGFS", - "PQHCYQTEFEDMNQHSGEIQSGRPRNTSSASDWMTNWSTSSSSPVIPATPNTFSPVMNTFQSLALHSPPIPIPNYYYDSS", - "SSYFPSYHQKQQQQQVQMQMQMHTTASIGGDRQSNEYIQR"] - }, - { "name" : "11943_PUCGR", - "RefSeqID" : "XP_003330006", - "UniProtID" : "E3KMR2", - "taxonomyID" : "418459", - "sequence" : [ - "MAAAPTSSFLTSMSAQPPRTVQALVNEEVRAPPPVRLYPSQHRVSMTRYATSTDPRGYIPVFEYPLNGQYIMIDCETGMV", - "HFTGIWKALGHTKADVVKLVESDPTIAPYLRKVRGGYLKIQGTWLPFDTAQTLARRVAWQVRYDLVPLFGPDFPDTCLGP", - "GEPGFGQLLLSAPKPRGRRGAKKAAAAPTVAHERTASPQDNRSQSRPGPYPSQESFGNRCSGRVEAVGAMNGYSPMLSQA", - "RYSPYTRAPVHRITQLEPLPSLIQPNQSCPHPTADSMYSSHYHQSPRQSMMTSHGAGPYGQQHLTGSTASGMQSTAPLPS", - "MRPHQAHQSENNFFETYRGPDSFEALSNKWLAPEVANPSLNDSGLLHGEGGCLPPLQYSNNPVLRNGPSGSPTNQYNFPN", - "QIDSAHSSHHIDSNQTQHVHRHAGFPYESQHQSNFRHDLSTEEAAHHPASPSQQPPPSVTYDKAHNSEPQAGSQAANVTA", - "GCYAASGSNSTGNPAGSPGSHSSHVPKSPTPSSASTSTHMQNSHNPNSHRSPSNTLTNMSNNGGFNSNTQGEEAIQFSVL", - "TSPAHLETSGPSENSIPPAQSSDSDWNPAQNTTGLSPSQAPRQ"] - }, - { "name" : "03082_PUCGR", - "RefSeqID" : "XP_003321545", - "UniProtID" : "E3JYK1", - "taxonomyID" : "418459", - "sequence" : [ - "MILISPTRTLPSPRPIDTDPILNYRHIQPAAAAAAVGPWLGQNQHHHHHHDTLAKSPNITTAPATHSPSELSASPAPSAV", - "STGSSLLDPQSVPHIKIPHSSSPPAIMLPQPSSDDDSSTAEEEQPSAQSSNATLNTPTPHTNAPHQLDSHASSVGLYDLP", - "PTSSSAPTTSSSSSPFPSNVPSHQQPSPYSSSPHPNQEHHPHHPHHGNQFYQQSPPALHSPLQSAHHPQQSFDARPHSSL", - "FAHQHYHSRPQSAPHSTSQFSLDPHVLAAAAANVEVKKWDEENTYYYQVAHKGVTVGRLKGSGLVNGTKLLNLAGISRGK", - "RDGILKNEKIRKVVKHGTMHLKGVWIAFDRAVFLAEQHSIADKIFPLLVVNLEHYVPIEPPLMAGGTKLGPGSLFHHHHP", - "RHPRLLPQPIKFPPSTISLAPASANSFSSTGGWPSGPSSALPSIGYNEPFSAPPIPRSAATADTSPSIYEQAQFQYLNSA", - "QANNPDLLERRHTLPNNSFHGYNSVPSFGSSQPPPPVSYSFHYNSTHVPGYPPRSSTAESATPNQFEYQSKNHNGNGNGD", - "AAGSYPATLYHSQPAARPVSSTTAQPSPALNSAPLLLGDLSPGSSTQIVDHGAGDFRLSTGTSNGQVKQEGDDESCNEKR", - "LIMEWNPSC"] - }, - { "name" : "SOK2_SACCE", - "RefSeqID" : "NP_013729", - "UniProtID" : "P53438", - "taxonomyID" : "559292", - "sequence" : [ - "MPIGNPINTNDIKSNRMRQESNMSAVSNSESTIGQSTQQQQQQQQYLGQSVQPLMPVSYQYVVPEQWPYPQYYQQPQSQS", - "QQQLQSQPQMYQVQESFQSSGSDSNASNPPSTSVGVPSNATATALPNGSAITTKKSNNSTNISNNVPYYYYFPQMQAQQS", - "MAYSYPQAYYYYPANGDGTTNGATPSVTSNQVQNPNLEKTYSTFEQQQQHQQQQQLQAQTYPAQPPKIGNAFSKFSKSGP", - "PSDSSSGSMSPNSNRTSRNSNSISSLAQQPPMSNYPQPSTYQYPGFHKTSSIPNSHSPIPPRSLTTPTQGPTSQNGPLSY", - "NLPQVGLLPPQQQQQVSPLYDGNSITPPVKPSTDQETYLTANRHGVSDQQYDSMAKTMNSFQTTTIRHPMPLIATTNATG", - "SNTSGTSASIIRPRVTTTMWEDEKTLCYQVEANGISVVRRADNDMVNGTKLLNVTKMTRGRRDGILKAEKIRHVVKIGSM", - "HLKGVWIPFERALAIAQREKIADYLYPLFIRDIQSVLKQNNPSNDSSSSSSSTGIKSISPRTYYQPINNYQNPNGPSNIS", - "AAQLTYSSMNLNNKIIPNNSIPAVSTIAAGEKPLKKCTMPNSNQLEGHTITNLQTLSATMPMKQQLMGNIASPLSYPRNA", - "TMNSASTLGITPADSKPLTPSPTTTNTNQSSESNVGSIHTGITLPRVESESASHSKWSKEADSGNTVPDNQTLKEPRSSQ", - "LPISALTSTDTDKIKTSTSDEATQPNEPSEAEPVKESESSKSQVDGAGDVSNEEIAADDTKKQEK"] - }, - { "name" : "14426_COPCI", - "RefSeqID" : "XP_002911429", - "UniProtID" : "D6RMB0", - "taxonomyID" : "240176", - "sequence" : [ - "MTARPPLPLRHANPSLRDGNATIPPVKYQILSCQGKDILVGRLKIDTTDGGHAFILRRFDTQAISLTTMFRAAFPTASEA", - "EEKDEINYVKANFDLFGNNGSSKEPHITRLAGTWVNRDTAGQLAHDYNMVDLINTMVEAEPDPNGQYRRSNKSAQNNNPP", - "TNAPEPTPATNVHATRSPAKQSPKPPSKTLPTPSPGSGDAQPPAPKRRREGSPATFTSGIPVASSPAVPKTPGPRRSTRT", - "KSPAPSRVPQPLTATKPRSRASVAPPSPKKRPVDLPKSSPIKAEEDTAVEDNVAGNELYAQDISEQKKLIADLKAAASSK", - "KPADTVKEDDDQQMEEEGQGPSKLKRIRQDEEKPLQFEFKEPEREERQIATNRRVGRFDMQPERKSLAWGIAAFAFGMTA", - "ITYLPNFL"] - }, - { "name" : "BQT4_SCHPO", - "RefSeqID" : "NP_596166", - "UniProtID" : "O60158", - "taxonomyID" : "284812", - "sequence" : [ - "MTENEKSRSLPAERNPLYKDDTLDHTPLIPKCRAQVIEFPDGPATFVRLKCTNPESKVPHFLMRMAKDSSISATSMFRSA", - "FPKATQEEEDLEMRWIRDNLNPIEDKRVAGLWVPPADALALAKDYSMTPFINALLEASSTPSTYATPSRPTAQKSETSEG", - "EPESSTSATTTSVARRTRQRLAEHLENSKKTILQHDNKEEDKEIHSEENETKDEIKSEKKEPEIKKQEGGSSTEKVGQPS", - "SSDDKAKGSTSKDQPSEEEEKTSDIQDRKIKTPIKPSLLGKIRSSVNKGMTDVASQVNRGMTDVASQVNKGVNGVASQVN", - "KGMNGVANQVNKGVTGVASQVRKPVGKLEKKFENLEKSIGDTLKSSIRSSPKSKKRSREDFEENEDYNAMVPVKRSRITK", - "LESEVYYEKRKVRALGGIAIGLGVGAILPFLF"] - }, - { "name" : "PGTG_05590", - "RefSeqID" : "XP_003323688", - "UniProtID" : "E3K4V4", - "taxonomyID" : "418459", - "sequence" : [ - "MPKSSSCCEPEQKQSIPTNANPISAGGAGLDIRLAGMRSAHATLRGCSFSPYMVTQHPPLRDSVNRNKQQPTNNSTNPYT", - "KKASRMSQTNLYKSNNPPNLPQDEFNQTLVNYQGKLRSIRIQDININGHTITIARIKIPSPEKLSSHLIKRFDTNAISAS", - "SFFRSAFPHSTEEEEAIQMRYLHQIYDTHTAGAVEFGSARKLTGVWVPIENAAELAEVYGLTRFAEPLLAFPNPKENPRS", - "PTGTKIGGEDESSTTQTPKASQQSKLTGQISVTRSSKRSRAGPLSFGNTSPSSFSLNSFNKPPTETNKSGTHDDSKSTND", - "ENDEKPASPTDRVAGRGARNSPSKKPTTVDENHEHTEHEDHQLIGTDELAQRAKQEALKLVSELKNSQPCTQSSLESPTN", - "TLETELTRTTSPAKSNKVTRKRSSDEVSFEGEEQGEDEDEERTADETATHRSFLPKLLWRKSAAQAHPNSKKHKRTQLGG", - "GGSSSSSSKSFVPLLTNSATPSVDDSSSTHNPNKRNLAIAGIVIAGAAA"] - }, - { "name" : "06560_NEUCR", - "RefSeqID" : "XP_962267", - "UniProtID" : "Q7S9H5", - "taxonomyID" : "367110", - "sequence" : [ - "MAQVARHLPARRNPLMLEDVPSHTDLASRRRLGQTQLTPRMVTAVPGAEVDPSSLLAFDYAHLRAPLPKGIVSGIFKSSP", - "PSYFLMRRSQDGYISATGMFKATFPYASQEEEEAERKYIKSIPTTSSEETAGNVWIPPEQALILAEEYQITPWIRALLDP", - "SDIAVTATDSSAPKQIAPPPKFFGAQPPLVAPTPPTTRSTRSRPSSRRSSSPAKSTTTSKRGTTPRNTKRTVTTEASATT", - "VTTTATATAVPSAETPATSFADSQAPTLINGEIPTSTPINTVPVTKIQTTEAELKVESIEKEPVVVLEPIEEEPKIKVRV", - "DEDVKLDKDGEEVKHTKVELEVPLMAGEPPSKEEARKMIEEAKAMVEAAVKADAEAAAALVEASKAGAEDEKAEDEAKAE", - "TEATKEEEADSKGKRKAEKISVDEDEKAADEAEQPRQAKRVKTEAELRKDRIRKRAYLGLTATFAVGALGALLPIITPYV", - "ANVL"] - }, - { "name" : "81480_BIPOR", - "RefSeqID" : "XP_007682909", - "UniProtID" : "W6ZKJ4", - "taxonomyID" : "930090", - "sequence" : [ - "MVVDRVLPERKNPLLEPTDSTSIEILIERRRLGQTNLGVKAGVSGIANATKPENMGTFDYAHLRVPLPKDLTGSGIFSRN", - "RMSAFPESYFLMRRSSDGYISATGMFKAAFPWASLQEEDLERKYQKTFPSAGDEEVAGSVWIAPEEALALSEEYSMRHWI", - "EALLDPAPIEKGGKDKSNAAIQMPPRFDVANAQPATLPTFGFRQTRARSARSVSPSKAMTPGRKYATPRKGRSTRSAMKP", - "DATHADDMFRPIEAVTPSTALQNSIARRIAPAETIASSIEGEVKEVEQEVKAALDAEKKPEPELEVQEGTVHIEVKQTVE", - "TNGDTEKTSTSVTVDVPHDHAALPEPEDPTAMIEEAKRMVAEAQKLEGGSPSVTRSSKRGIEEVLDEEDLADERLNKLAK", - "KAYTTEQKMTKEKVTRRALVGLGVMAAIGTAFQYFV"] - }, - { "name" : "01622_ASPNI", - "RefSeqID" : "XP_657766", - "UniProtID" : "Q5BH18", - "taxonomyID" : "227321", - "sequence" : [ - "MVRSLPKKNNPFVTPDAAPPYEELLMRRRLGKTNLAVKPTQVGTSNATKPENLGPFEYAHLRAPLPKDLKGSEIFPSHSP", - "QQHPETYFLMRRSKDGYVSATGMFKIAFPWAKLEEERSEREYLKTRPETSEDEIAGNVWISPVLALELAAEYKMYDWVRA", - "LLDPTEIIQSPSSAKKQITPPPKFELPPIQAPEALVPSSRTRSRRSASPSKKAGTPRKPRQTKAQKEAAVAATNEANATL", - "QSALDDTVSNADGEINGDVLPSVEDKREPETSPVKGKKAAAKAKKQAVSEEDQEDKVKIEIKSDAAEGSDVQAAQTTISV", - "EMPISLPEAPSAEDTQEMIAKAKEMVKEAVKLQQEPAESSATAKKRGAEEAELGEEEEDEETKTLRTKRAKVLEEKLKRE", - "RVRNRALMGVTAAFALAKPALVLLEA"] - }, - { "name" : "05405_ASPNI", - "RefSeqID" : "XP_663009", - "UniProtID" : "Q5B225", - "taxonomyID" : "227321", - "sequence" : [ - "MASIQFLLNPLPSLPSSDRCPLPTPSPTISSSTAMLRSPRQKKQKMAKDAPIFQRGKPRGEVRYPPYEDRDGKFSCQHQD", - "FRIHPLGNIADYPRHIPYNSDKKSFQERTGRESFEVFQYTFQLPGEEKQWTVMWDYNIGLVRTTHLFKCNDYSKTTPAKM", - "LNQNPGLRDICHSITGGALAAQGYWMPYEAAKAIAATFCWKIRFALTPLFGDNFPDLCIHPDDRARFGRMVIDPGIVRIA", - "TEKANLYRMLELRCSTTNSLRADYVLRPSSAPDIDRTDPNLERDRVALGRHILPKSHRHHHHRSKTSPSTNTSLVGYGSS", - "PEVEYYSCGTEPYCVSPESPIRSSFTPVNTPRSTDIYPSSSSTNFLRSPHELLASLSSSASIARARIERASKISGARVIP", - "SSVPSNVTSITTKGRDNTGHSALMEESDIDADAETDSGHEHDLDFELSSSDESSTSSTVSSSTSSASLGFAANSRNRPYR", - "DDDEPHRDTDEEMVDYRAPKRIATAGARDRRWGRGRRVIHQEHSDIETSRRARKHAQRSSNARLVCEMTAAHALISLLHD", - "ATGSDVDVDTHNRLECGRSPDGGVKNNLKGSYFGIRLNHNPSTESGQKRRRASA"] - }, - { "name" : "105954_BIPOR", - "RefSeqID" : "XP_007691967", - "UniProtID" : "W6Z1H5", - "taxonomyID" : "930090", - "sequence" : [ - "MNIQDLLNPSCGDRHDHRRSESATPPSRPVAILPALRRQKIPKDAPIFSEGNRTVGIVNFAPHEAGNDEELLAQHCRFQI", - "YPLGEISRKGVRHIPYNSDKKDFLEKTGRDAFEMFQYTYKLPGEDKPYVVVWDYNVGLVRMTPFFKSCKYSKTIPAKTLR", - "ENPGLKDISYSITGGALVCQGYWIPYQAARAIAATFCYDIRWALTPVFGNDFPSICLTPDDPSFAKFVIDPAIVRYCTEE", - "TTKFRELGSAYEVHRPVAPTQVEAPTSRSDQPLSTSIVRQRRARPIDIESGYGTDTERNDRCLFSPEVSPRTRFTPINRP", - "RSPYSPRTAESSFVSSPVSIRAPPGLHTPTSTPYEHSGEVFRAKRSHSKVAFCEHPADEAVIRPPTAATVDSAHGCEMCV", - "GDDNHSHLDMDAAEMLLSLRTADSAMPPSKRTRRGS"] - }, - { "name" : "69819_WALME", - "RefSeqID" : "XP_006959479", - "UniProtID" : "I4Y911", - "taxonomyID" : "671144", - "sequence" : [ - "MTSPGLPKDFNELLDKSEIPSPKWQQITRDDRPITIARLKLPHPREKHTFILRRYDCNGISFGSLFKAAYPYATDEEEKI", - "ESGFVKKNYDVTLVPTEEYQERKLAKLAGFWIPIAIAEELGQRYAMAEYVDALAKADTPDLTDFKKRSSNRQTSEDIKSS", - "PAKAQASLESPAKSASKIPTPTKNPAPRRSARHQSRSPSPSPLTHNLTPGKKKAKKAPKEAVIEESVEETIVVDKKESPL", - "KKALNDDQVLADIERAKDLVDDIKQSKNLSQSSPVKVVKEEVLETIQPSVSTESLEGEGKRKRELEDETGNEIKVVSFGQ", - "NPPANPEEIQQRPVVQRRGVAAAVGAFALGVGFAASNILPRFLF"] - }, - { "name" : "02840_CRYNE", - "RefSeqID" : "XP_568872", - "UniProtID" : "Q5KM59", - "taxonomyID" : "214684", - "sequence" : [ - "MSHPAADAPPPYPGTTDDAQYDLTPLPHTANRPRLPEDKRNPHLNNLPEDTKIVKFQTIVRENKEIVVGRIKVPTENANG", - "THHAFILRRYDTNAISLTTMYKVAFPSATEEEEKREMDWVKSSFDTRGTNGGRDSEVVRLAGQWVSRNLAIHIAPAYNLV", - "QLVAALSRAVPDPNVAYRKSQRSQAAADELARTKAKQSQAPSSVPAISNVPVRKPQAAIPSMATEISSPASKRQRKDSVT", - "EASGSATQTITEAQPSADTSETDDTRHITIEATTTITSPSGANVDMDAEIEQAKQLVKDLRQEIQLRNEAGDSLEDQGVA", - "VADDVRGVKRGKHEDEAVVISGGAGGKDRVVRTNKRIPQTAGGDVGQRFGWGAFVFSIGLGASLTLFSQYASSLL"] - }, - { "name" : "11055_USTMA", - "RefSeqID" : "XP_011390537", - "UniProtID" : "A0A0D1DZM8", - "taxonomyID" : "237631", - "sequence" : [ - "MPAAASARKSTPTRKSTPRRARSSSVTSNASTGVPASPSASPRKTKKQKEAAAAAAAAVAAAAATAEQVNDDESDLLRPK", - "LPTKRNPRLKEVDEAVVKLQIIKREGHNIIIGRVKLPTVNGQDHAFLLKRFDTNAMAASSMFRLAFPFADGTAEAAEMRF", - "LDTKYDTNRANGGYIVEEVKVPETPKKRGRTRKTAENSKKESTPDTESVSADKQIRVLPEGSTGVRLQGTWIPAEDAIEV", - "AEDYGIAKYALALIHATAEHAEDGGAPILTSEPVAEVKTPRKRQRVSAAAATASDTPDSPQLVQRVTRLENADGSISKVR", - "VESTLEAPSSNGVPVALSQAEIEEQIAQAKALAAGIQQSITAGSGSASTRGQKRRAVNDRPTAEIDPLADDEDYSESGRV", - "VRAFRRGTRVARRRPIATTAGAVAAAGAVGAGALAWVSGGNPEVAIQTLQASMQSIGLQNLQNLGLQNLQQIGTQLGAHL", - "ASILPW"] - }, - { "name" : "XBP1_NEUCR", - "RefSeqID" : "XP_962373", - "UniProtID" : "Q7S9W7", - "taxonomyID" : "367110", - "sequence" : [ - "MLNQNPGLKDIAYSITGGAIKAQGYWMPYACAKAVCATFCYQIAGALIPLFGPDFPSECISPGEPRYGIMIIKPELISDT", - "MRKAQELYRRYGNWGGGCTSSSPARRPLRTASSGSQERHHHHPYPNQEHLDHQQQQQRTVCSRRCPAEENSCVDARPQLR", - "GISAPMPPAGEWTPPLLRSSAGRPRPVMPTSTHSSISYPERAPHRSAWTAVNHQPPNNSLDRYSLKRPLPSNEPDESVSH", - "SNWPSRSQAPNPWLTAIPRSPRKTSSSPWASQPGSASRSRAGSIDSMASQHPQGLPSPSLILSSPSSSMVSLSSSNSPSP", - "RPQLPPISQLCSLPVPSGRRRLPNGRPSRVGGDATSSHSRQDHSTCGAYQFSAGYQRALTPPSSTSAPMHWRSQRRPSLQ", - "DQHEHEHIEDTQPRRIAVEANMECGDDNESHLHLPLPLPRTSSSASIVADKNANDTTSDNSSSRNFNSASIGSGRDDGQT", - "SLAARKTAALTLLHLRQQEEEKEAAAAAAAAAAAAYSSTKRPESPSSSLSSPVSPPPTSGQPSPTLSAVVTATNLRRGTT", - "TATATAVIDTTEPLAPPPSPSSNYLGSPISTSIASSSSSFSPSTSCNGTRENSVVANEMTRYAGQEADAGGPRHCNGDAD", - "DEGDYEHEQQYRRKRRRLLLVGRAKSF"] - }, - { "name" : "XBP1_SACCE", - "RefSeqID" : "NP_012165", - "UniProtID" : "P40489", - "taxonomyID" : "559292", - "sequence" : [ - "MKYPAFSINSDTVHLTDNPLDDYQRLYLVSVLDRDSPPASFSAGLNIRKVNYKSSIAAQFTHPNFIISARDAGNGEEAAA", - "QNVLNCFEYQFPNLQTIQSLVHEQTLLSQLASSATPHSALHLHDKNILMGKIILPSRSNKTPVSASPTKQEKKALSTASR", - "ENATSSLTKNQQFKLTKMDHNLINDKLINPNNCVIWSHDSGYVFMTGIWRLYQDVMKGLINLPRGDSVSTSQQQFFCKAE", - "FEKILSFCFYNHSSFTSEESSSVLLSSSTSSPPKRRTSTGSTFLDANASSSSTSSTQANNYIDFHWNNIKPELRDLICQS", - "YKDFLINELGPDQIDLPNLNPANFTKRIRGGYIKIQGTWLPMEISRLLCLRFCFPIRYFLVPIFGPDFPKDCESWYLAHQ", - "NVTFASSTTGAGAATAATAAANTSTNFTSTAVARPRQKPRPRPRQRSTSMSHSKAQKLVIEDALPSFDSFVENLGLSSND", - "KNFIKKNSKRQKSSTYTSQTSSPIGPRDPTVQILSNLASFYNTHGHRYSYPGNIYIPQQRYSLPPPNQLSSPQRQLNYTY", - "DHIHPVPSQYQSPRHYNVPSSPIAPAPPTFPQPYGDDHYHFLKYASEVYKQQNQRPAHNTNTNMDTSFSPRANNSLNNFK", - "FKTNSKQ"] - } -] +[ + { "name" : "68476_WALME", + "RefSeqID" : "XP_006957790", + "UniProtID" : "I4YDD8", + "taxonomyID" : "671144", + "sequence" : [ + "MKEEKEKTPPNNITGPPTPAQNILHSTPAAFGTAGTVGQGAGGFGSQLYQSPYVDSQQSVIGSPVTPAPLPKKATLKTPQ", + "PRIYSAVYSGVGVYEAMIRGIAVMRRRADGYMNATQILKVAGVDKGRRTKILEREILAGLHEKIQGGYGKYQGTWIPFER", + "GRELALQYGCDHLLAPIFDFNPSVMQPSAGRSAKSPSKKRQNSIVLSPTQERHQSSIIALNTARASGIYVGGADDPNDDG", + "LSKKEKSPVKKSKYDEVPVNVSKRPYVPPPGTNAHILTRTQQSLTALFQQPTTNSDFIPEAVAILDTTSGALHPDLAIDE", + "LGHTALHWAASLGRISNVQQLIKKGADMKRGNIEGETPLERSVLVNDNYDKKTFAYLLQELGSSIRVVDRTGRSILHHIA", + "LIAAVNGRSMSAKYYMENVLEYIARYENGEFKSLVDLQDEHGDTALNISARVGNRNLVKMLVDAGANKTVVNKLGLKASD", + "FGVEHETLNSVTGDEMLSNLQPPPPLNVDSSASVLENIHNLLNGITQQYTDETSGKNALLFEIQAELKQHSHELADVRKE", + "IQYWQNKATQMAEVDQKIKNINEAIENEKVQTWSLLGEANADKMEGIETSSSSNTSEIKIPTGDNEESLKQLRKLSKWLE", + "GTQKLTEERVASIDGLSASKEVKYKSIVSVCTGVPVNEVEGMLAQLLEAMESDANADLNKVQEFLAREC"] + }, + { "name" : "00846_COPCI", + "RefSeqID" : "XP_001831299", + "UniProtID" : "A8N8X1", + "taxonomyID" : "240176", + "sequence" : [ + "MQASTRPPGSNQPPVKIYNAVYSSVQVYECMVRGIAVMRRRNDSYVNATQILKVAGVDKGRRTKILEKEILPGKHEIVQG", + "GYGKYQGTWIPLERGRDIAAQYGVAPLLSPLFDFQPSTNSLGALPVSTPGGTASPRPLSASSSYSSMGVAGQYIPSSIPS", + "NLPPAPIMPGSALRLLNQGRAQGLFTPSTTSATLRPAGYHSPGPYGTSYAPSPQPQSSQTPPPGSGLKRNRSEAEVEGYH", + "SQPHDVQMADAPPPNTASQPNEDNPSPAKRLRTDGSITTEPASSQGQWQQQQPLPYASQQRSGPGLSQLSGHNGHGSSRP", + "PSSLSAPNGNRPAHTNPEDQTRKTRFSSKPSMPRGMDPHMPFKDARRSALIALICHRDDPTSVIDLLREISADHLNPPSF", + "DVDTVLDDQGHTALHLAASMARTQTVDMLIQTGADMHRGNHLGETPLIRACLATPNSDQQSFATLVNYLHDSIWTLDTSK", + "KSVVHHIVSLAGVKGRAVVARYYLDQIFYWIAQHEGGDFRSLVDLQDEHGDTAINIAARVGNRSLVRTLLDVGANRVLAN", + "KLGLRPGDFGVETEELSSGLRAEDLISSLRTGPPAPVQKSQDVIADMTSMIQSLSTEFQAEIKSKQDSLDVTQAHLRAAT", + "RELSEQRKQIQTWQARCGDLDQINQRVRNVEKAIAEEDMFDWTGRTELDGKDGKEKGGPAFAYRGSKSTMVGVGGSVDVS", + "FSVESEPPLPTTDTAASLVKLRRLKMWHQRMEELVKGRLKGLQGASAEKEYQCKKIVALCTGIPLDKVEEMLDNLVIAVE", + "SEAQVVDIGRVSGFMQKVRDGII"] + }, + { "name" : "8533_BIPOR", + "RefSeqID" : "XP_007691662", + "UniProtID" : "W6ZE71", + "taxonomyID" : "930090", + "sequence" : [ + "MSTSHSFPAASPSHQQSALYANSPHGHALMAAPAALNRSFSDMSAFHHHAMDKPQIYTAVYSGVSVYEMEVNRVAVMRRR", + "SDGWLNATQILKVAGVDKGKRTKVLEKEILTGEHEKVQGGYGKYQGTWINYRRGREFCRQYGVEDVLRPLLDYDITLDGS", + "HAPGHAIETPTKEQAMAANRKRFYTQSIDGRTTTQNLTGTFFSNISSTATSALAAMNKVARLNSPAPRPSSSSQRRTSAT", + "RPSQSQPPLASQDSFRTSSQQSITSEPSFAGHNGQTDSAYATAVDESQEPPRKRIRASHDDSYSQPTAADMSIHPLSSPT", + "EPSESFDQHHPAQPITLADGDVPTALPPLPYPDTKQDEEKQAMLTDLFADQTRSDFTNHPAILHLSGPDLDMPIDNSSNT", + "ALHWAATLARVSLIRLLVSKGANMFRGNASGQTALMSAVSVNNSLDHSCFPETLEILAPLIELRDSQGRTILHHIAVTCA", + "IKGRAASSKYYLEALLEYLVRSNIGGGQPPPFHDTSNHSKPIGLMRFMQEMVNARDKAGNTALNLAARIGNRNIISQLME", + "VQADPTIPNHKGTRPMDFGVGTDLGDGQGIITATSPTKAKAPLSKAEETSREIQPLMSGILQSASLQFTQEARLKQDAID", + "QTNELITQLSSQQKQEQQKLQTLRARLRQRQDRAKRISNLKRWLEPQRHMLSVNDGAIDLHDKKRIGYADTQGAGLLIKE", + "DDLPYELRQAGDHLDRRASDGPIYLSTSVPLDPSTLSQVSHQPQCQNFLLQQLPAASVLRQRIETYTATNTALLKRSRML", + "KEKDGQLEMMYRKVVSLCTKVEENRIEECLEGLVAALDSEEGEGVEVGRVREFLRKVEGVD"] + }, + { "name" : "PGTG_02039", + "RefSeqID" : "XP_003320997", + "UniProtID" : "E3JX03", + "taxonomyID" : "418459", + "sequence" : [ + "MAAHKTTNDIPVSSSHHINPESGTGTSSTQAFPIPNIKNNPHVYMAVYSSVPVYEMMVRGIGVMRRRSDSYMNATQILKV", + "AGLDKSKRTRILEREIIQGEHEKIQGGYGRYQGTWVPFTRAQELATQLNVAQLLAPLFDYRPEPNSEVNIRSTNTKPSSS", + "ASRANSHKTTLARQTSRQSLNEKRERSGDTTPLPHDPPEAGPSKRSRLNTPSRQSNGSANTPSSLIDHSHSAMDPDFIIP", + "HSQSQPTAASQCTTSTFAPIHGATVEYPAGPSHLRKSNSSSRSHLEVALKAERNIHTLMALFSNPPDGDELESETHHENP", + "NSVAEVNEVLEDPELEIDTPIDEHCHTALHWASSLARLGLVRAFLRSGADVNRGNDVGETPLMRSTLVTNNFERESFNQL", + "LELLHPSLWTLDNQDRTVLHHICLTASIKGRGESSRYYLECICEWIVNKHGAQFDSQLFDAVDLNGDTALNIAARVGNKH", + "LVRMLLDVGADMTIGNNLGLKPIDFGVGAGETSASYTDDMISAPLRRNPTASAPARSSRDIITSITSSVNSLSEDFENEI", + "RSKTDRLESVRAQLMVATRQLTTQRRQLESLKHDLDERALLELRLKKLRMAIAEEDGFDWTGRSDLDGRPAQAGKLFEQN", + "GIASTLAGLSASQIQLELEPDPFIPPENNQDSLVYLRRLEKWYVRVLSLLRERIGRMKGSNLEQEAKYLKVIGSFIGNTC", + "TNDLSSSGSSMTGRPANQTTSTTQEVPSRATQNVNPADIHDLESMDGHRRKVSTTDAVNKSHEFGRTRSELLKASMIDNK", + "LLKQLMAAIESDGPELDLNRVAGFMQRVQSGSL"] + }, + { "name" : "MBPA_ASPNI", + "RefSeqID" : "XP_664319", + "UniProtID" : "Q5AYB5", + "taxonomyID" : "227321", + "sequence" : [ + "MTTSNHHQQRPSLSMSYSQGSIGSANGMSFSQSQMSSLNASQSVASTPRATPPPKSSQQSAMSFNYSNGLPNGARASFSG", + "FEDMNGYGTMIYHEEFKPQIYRAVYSNVSVYEMEVNGVAVMKRRSDGWLNATQILKVAGVVKARRTKTLEKEIAAGEHEK", + "VQGGYGKYQGTWVNYQRGVELCREYHVEELLRPLLEYDMNPNGTAASGQDSLDTPTKEQAMAAQRKRLYSGMENRSMSQP", + "QQGTFFQNISRTAATAVNAMSKARFESPAARGGDSRRLSVIRKPSQQMGSQDAQPPFGSQQSFYSAASDSGFASNIPTNG", + "RYAPQDAMSFEQEEPMEPPRKRIRSSQAFSLPIDGTSMSMSEPTPTEPNDSFYQDMEPLHHIDEGRHGLDPLPPATTPER", + "FQKMKLIMTLFLDKTTKDFSTHPALIQLSGEDLEVPLDEYRNNALHWAAMLARMPLVYALVKKGVNIARLNGAGETALQK", + "AVGTRNNLDYRSFPRLLQVLAPTIDMVDRSGRTILHHIAVMAATGHGGHVSAKHYLEALLEFIVRHGGTSLNQQSNGTAS", + "QPGMPLSNEVITLGRFISEIVNLRDDQGDTALNLAGRARSVLVPQLLEVGADPHIPNHTGLRPADYGVGVDMVDGSSQPA", + "GSRSDTFLAQLAKTRKEILEATTAQVTAIVQETLGTFDKELAASLTSKQEKFDHWHAKIRESAKARQIEQKQLDELKRRS", + "IDRTETSRRLKNLEKSSTDLLEAHKEILTNLGDTSKPVSLGDADQESGFEIAEFEALFPETFDPASGFSEAQIAYLRKLP", + "SAEILEQRVSCYRAFNKETLDEIDALRSKNVVLGQNYRRMVMACTGWSAEQVDEAAEGLTQCVKELNDNPVPEDEAIEIL", + "MRDRGQDW"] + }, + { "name" : "05520_CRYNE", + "RefSeqID" : "XP_570545", + "UniProtID" : "Q5KHS0", + "taxonomyID" : "214684", + "sequence" : [ + "MEPPSNPIQPPVTPSHHSLLSAISPALSEQTPAPIHTLPPHLRPSIPQPHIAPPRPSSVQPTMEEQQRMHHIQQHQQQQH", + "FQQQQNDENVFGSVMGAPGHVPGHEAPMSTQPKVYASVYSGVPVFEAMIRGISVMRRASDSWVNATQILKVAGVHKSART", + "KILEKEVLNGIHEKIQGGYGKYQGTWVPLDRGRDLAEQYGVGSYLSSVFDFVPSASVIAALPVIRTGTPDRSGQQTPSGL", + "PGHPNQRVISPFANHGQTTPHMPPPQFIHQGNEQMMNLPPHPSSLAYPTQPKPYFSMPLQHTVGPQYDERHEGMTMTPTM", + "SMDGLAPPADIARMGFPYNPSDIYIDQYGQPHATYQASPYGKESGHPSKRQRSDAEGSYIESGAAVQQHVEQDEEADDGL", + "DNDSTASDDARDPPPLPSSMLLPHKPIRPKATPANGRIKSRLVQIFNVEGQVNLRSVFGLAPDQLPNFDIDMVIDDQGHS", + "ALHWACALARLSIVQQLIELGADIHRGNYAGETPLIRAVLTSNHAEAGSFTDLLHLLSPSIRTLDHAYRTVLHHIALVAG", + "VKGRVPAARTYMASVLEWVAREQQANNTHSITNPPNPADRNELAPINLRTLVDVQDVHGDTALNVAARVGNKGLVGLLLD", + "AGADKTRANKLGLRPENFGLEIEALKISNGEAVMANLKSEVSKPERKSRDVQKNIATIFESISSTFSSEMLAKQTKLNAT", + "EASVRHATRALADKRQHLHRAQEKLATMQLFEQRSENVRRIMDAIAAGTLLTPAEFTGRTQTMHEKSTGQLPPLAFRHVP", + "GLALDASSQSQLNGAPPSTPLSVEDQEDIALPERDDPECLVKLRRMALWEDRIAEVLEDKIRAMEGEGVDRAVKYRKLVS", + "VCAKVPVDKVDSMLDGLVAAVESEGQGLDFSRASNFVNRIKATKS"] + }, + { "name" : "RES1_SCHPO", + "RefSeqID" : "NP_595496", + "UniProtID" : "P33520", + "taxonomyID" : "284812", + "sequence" : [ + "MYNDQIHKITYSGVEVFEYTINGFPLMKRCHDNWLNATQILKIAELDKPRRTRILEKFAQKGLHEKIQGGCGKYQGTWVP", + "SERAVELAHEYNVFDLIQPLIEYSGSAFMPMSTFTPQSNRKPTEAYRRNSPVKKSFSRPSHSLLYPYTSSNNMTSTSRMS", + "GIHDALSLQSDFTRSPDMPSDSFTGSLHDIKASPFSSNNYAQSLLDYFLLPNTTQPPDFVYDRPSDWDVNAGIDEDGHTA", + "LHWAAAMGNLEMMHALLQAGANVVAVNYLQQTSLMRCVMFTMNYDLQTFEVVSELLQSAICMNDSFGQTVFHHIALLASS", + "KSKMEAARYYMDILLQNLTATQSVDVAAQIINLQDDHGDTALLICARNGAKKCARLLLSFYASSSIPNNQGQYPTDFLSS", + "KDMSFPENDDSPLNSKIEDNLIDNLKYPQSLDDHLSSKKPISYFSNKLTHQTLPNVFTQLSELSKCHEASLAEKQLTYNL", + "AMEALEQTVRETETCQRLWNERTNNDENYLVNQREDLIHQCKKFLHTLKTARYYLETVQLHQLKKYVTYFSQIWSTDELA", + "DISETKNLVGHDTKTNRSSLSSKHEVDLFTAENEAAREKLVEQLCSLQAQRKQKINEILNLLSMGMYNTINTDQSGS"] + }, + { "name" : "CDC10_SCHPO", + "RefSeqID" : "NP_596132", + "UniProtID" : "P01129", + "taxonomyID" : "284812", + "sequence" : [ + "MASANFIRQFELGNDSFSYQKRPEDEPSQPLSNRNINKLNDSSTLKDSSSRIFINSQVLRDGRPVELYAVECSGMKYMEL", + "SCGDNVALRRCPDSYFNISQILRLAGTSSSENAKELDDIIESGDYENVDSKHPQIDGVWVPYDRAISIAKRYGVYEILQP", + "LISFNLDLFPKFSKQQQIESSSISKNLNTSSFNTRSPLRNHNFSNPSKSSKNGVHTINNMQSSPSPSSSFLLPLTQIDSQ", + "NVKRSNNYLSTSPPILEQRLKRHRIDVSDEDLHPSSQLNDNEASSLFPDTPRLNHSLSFVSLVSSLPPLDQNIMQDYHTS", + "KDILTSIFLDVNFADSSALEAKLSDSLDLDVPIDELGHAALHWAAAVAKMPLLQALIHKGANPLRGNLTGETALMRSVLV", + "TNHLNQNSFGDLLDLLYASLPCTDRAGRTVVHHICLTAGIKGRGSASRYYLETLLNWAKKHASGNNGYMLKDFINYLNHQ", + "DKNGDTALNIAARIGNKNIVEVLMQAGASAYIPNRAGLSVANFGIFVENALKQPEDSKQTKVSLMSENLSSKEKTAVPPR", + "QKSRDIIASVTDVISSLDKDFQDEMAAKQSMIDSAYTQLRESTKKLSDLREQLHVSETQRTLFLELRQRCKNLMTSIEEQ", + "KSELSNLYESFDPNGIHDSLSLDADAPFTVNENNNKNLSIAELKFQVAAYERNEARLNELANKLWQRNSNIKSKCRRVVS", + "LCTGVDESRVDSLLESLLQAVESDGQQGEVDMGRVAGFLRVVKEHQA"] + }, + { "name" : "05338_USTMA", + "RefSeqID" : "XP_011392041", + "UniProtID" : "A0A0D1BWD8", + "taxonomyID" : "237631", + "sequence" : [ + "MPLNYFANQDQTASDTYAHEASSFPAPSSILTDTSKPLQPVQEVAASSLVDGVSFTSPHASIIHASKQSPRAASSLSFTT", + "SALQRAGLLPANPNMSTTATSGTSAASESLQRVITQGTASAAAINGASTPAHSGPLTPAHLKNLTPAQANAALQNPVGNI", + "PTVYLATYSNVPVYEITVRGIAVMRRRGDGWLNATQILKIAGIEKTRRTKILEKSILTGEHEKIQGGYGKFQGTWIPLQR", + "AQQVAAEYNVSHLLQPILEFDPATADQIPKLYQRKKPAASARNSSASAINDARGSTPSKIYSPAPASLGGPSQQPRFLSL", + "RPPKETHEQEISSAIFMPPGTAGLLSNGTFVDDRAASALAYPGPPAIPPGSTPAEQAALRSYNVYGYTPQGVPLPSSAAA", + "DGNGTEAAATAASTGAGKREASETDQDGASAAKRSRLTSPQQQRRDDGLLLGPSPVKDLNALGPAGGSLRAASAPRGHRI", + "TVGPPDAAGRDGAVPRYADRALPPKPYDEGEKRMRDRLVSLFSDDGVLPGVSEATGAGASQSAADEDDDAYVAKLDSLLA", + "DLREKASLGGLGASGTDGPKATVDLITDDHGHTALHWASALCRVKLVRTLVARPPWQGGANIHAGNHAGETALHRSVLVT", + "NSYDASSFPTLLNLLSSSLNTRDFKKRTVLHHISLVAALKGRAASARYYLACVLEHISAEKNSKYKGLIDAQDEDGETAL", + "GIVARLGNASMVRMLLDVGARKDLANALGIRPSDWGIESSADGASLTPSQNDGTNTVASLPPLTAADLASQNPSDIISAL", + "TRPAQVPVMKSSDVRDQLSSTLDDLQSSFERELKEKQDAVSTVQSHLQAATRDLAARRKTVSAAQAKLAEKDEARQRVQN", + "LRRAIVAQLGLEEADADLSLEQLVEEAANAASAAPADKSADKMDIDGAEDVKPVRASNLETLIDDILSFDTIQSDLKAVG", + "TSAVTQEVVEQDELVRLRWLVSFYQSSCDELSSTISELEDSSAKKESQCQQVVAICANIPQDKVESMLDELLTAMESDGP", + "DVDLARVANFMQKVGKTRENGDQPGVGAQLSSSTSLSTAVSSGGTAASSVVPAVERDGEDAKPDA"] + }, + { "name" : "SWI4_SACCE", + "RefSeqID" : "NP_011036", + "UniProtID" : "P25302", + "taxonomyID" : "559292", + "sequence" : [ + "MPFDVLISNQKDNTNHQNITPISKSVLLAPHSNHPVIEIATYSETDVYECYIRGFETKIVMRRTKDDWINITQVFKIAQF", + "SKTKRTKILEKESNDMQHEKVQGGYGRFQGTWIPLDSAKFLVNKYEIIDPVVNSILTFQFDPNNPPPKRSKNSILRKTSP", + "GTKITSPSSYNKTPRKKNSSSSTSATTTAANKKGKKNASINQPNPSPLQNLVFQTPQQFQVNSSMNIMNNNDNHTTMNFN", + "NDTRHNLINNISNNSNQSTIIQQQKSIHENSFNNNYSATQKPLQFFPIPTNLQNKNVALNNPNNNDSNSYSHNIDNVINS", + "SNNNNNGNNNNLIIVPDGPMQSQQQQQHHHEYLTNNFNHSMMDSITNGNSKKRRKKLNQSNEQQFYNQQEKIQRHFKLMK", + "QPLLWQSFQNPNDHHNEYCDSNGSNNNNNTVASNGSSIEVFSSNENDNSMNMSSRSMTPFSAGNTSSQNKLENKMTDQEY", + "KQTILTILSSERSSDVDQALLATLYPAPKNFNINFEIDDQGHTPLHWATAMANIPLIKMLITLNANALQCNKLGFNCITK", + "SIFYNNCYKENAFDEIISILKICLITPDVNGRLPFHYLIELSVNKSKNPMIIKSYMDSIILSLGQQDYNLLKICLNYQDN", + "IGNTPLHLSALNLNFEVYNRLVYLGASTDILNLDNESPASIMNKFNTPAGGSNSRNNNTKADRKLARNLPQKNYYQQQQQ", + "QQQPQNNVKIPKIIKTQHPDKEDSTADVNIAKTDSEVNESQYLHSNQPNSTNMNTIMEDLSNINSFVTSSVIKDIKSTPS", + "KILENSPILYRRRSQSISDEKEKAKDNENQVEKKKDPLNSVKTAMPSLESPSSLLPIQMSPLGKYSKPLSQQINKLNTKV", + "SSLQRIMGEEIKNLDNEVVETESSISNNKKRLITIAHQIEDAFDSVSNKTPINSISDLQSRIKETSSKLNSEKQNFIQSL", + "EKSQALKLATIVQDEESKVDMNTNSSSHPEKQEDEEPIPKSTSETSSPKNTKADAKFSNTVQESYDVNETLRLATELTIL", + "QFKRRMTTLKISEAKSKINSSVKLDKYRNLIGITIENIDSKLDDIEKDLRANA"] + }, + { "name" : "SWI6_NEUCR", + "RefSeqID" : "XP_962967", + "UniProtID" : "Q7SBG9", + "taxonomyID" : "367110", + "sequence" : [ + "MQPPQLGGASQQSQPSSQQSFSMSQSSQSVYRQYTDPPNRLHNDHAVPTIYSATYSGVGVYEMEVNNVAVMRRQKDGWVN", + "ATQILKVANIDKGRRTKILEKEIQIGEHEKVQGGYGKYQGTWIPFERGLEVCRQYGVEELLSKLLTHNRGQEGETGNVDT", + "PTKEQAMAAQRKRMYNASSQENRGIGSTGTFFKNISSTASTAVAAISKARFDSPAPRNRSGPSRAPSFNRQSSMQDVADF", + "PNSQQSLVSTEYATQTQNADSGFGSQTTQPLAGDGLEQPPRKRQRVLTPARSFGGQTPGHQPLDPFNAGNIANGDSGSPT", + "EPSNSFNYDQVTANDGDASYALGPLRPLPYENNADAEAKRGMLMGLFMDANGPEEAIQAALCNVSPQELDSPIDTQSHTA", + "LHWAATLSRMPLLRALIHAGANPWRVNACGETALMRACTVTNSMENNTFPELLDLLGCTLDVTDDKGRTVLHHIAVTSAV", + "KGRHYASRYYLESLLEWVVRQGSAPSSQENGIGDRKGRRMGIARFMSEIVNAQDNSGDTALNVAARVGNRSIISQLLEVG", + "ADPTIPNRANLKPLDFGIGIADAETNDDPAQEKTGATTGSGHKSRETSDEVVRSITHLIGESASIFQNELKKKQESIDTL", + "HSQLRVTSSQVGDARRTLESLQEKLKAQQLAKQKIVNFNRACEEEEQILIELEQRHGRLDVASANAWEMELESALEIVKT", + "QSPKGLDPDSRPSLPSAAVLRARIKALRARSSKTRQAVAALQAQSKEKELKYRRLVSLCTRRPEIEVEALLDTLTRAVES", + "EKPELEIARVRRFLGGVEGVVH"] + }, + { "name" : "15042_USTMA", + "RefSeqID" : "XP_011388143", + "UniProtID" : "A0A0D1CVS5", + "taxonomyID" : "237631", + "sequence" : [ + "MSTASPLHHGHGNGSYANSPAPTGVTGRDAGVAAAAVADSAVRSGSVPASASGSAPGSASGSMYGEAHTQHHTGHHHYSA", + "HHTHSHGALTSPVNGGHSSSWSPYGYPAAPVYGGSPSPYGHNAYSQYASGYGYANGTAHHVATAPTTPSATSTAYHTGVN", + "GMMMHHGQHAGYGYSSHHLGSHTPTHTHTHSSAYFMNGDGAHSHLNSSAHLTSPSYTTAPQYSTQLPLAGRHRVTTTLWE", + "DEGTLCFQVDARGVCVARRHDNNMINGTKLLNVCGMSRGKRDGILKNEKERIVVKVGAMHLKGVWISFARAKQLAEQNGI", + "ADALYPLFEPNIQSFLYHPDNYPRTAAVIAAAQERQAQRQRAPGGQPSPGANGTSQAPPLMRANTTPSNGDTSTFSSGLS", + "SLGSWTGSHDQGHASAPTTAQPSPSSMHNGATQMHMSLSNHGTASPTYAQSQQQQQQQQQQQQQQQQQQQQQQQQAYPMT", + "AAQQLARPSVGDRRQSAPISLNNSVGHAENPYGATNLGGAANGGLVNGARKVSGLKRSWNDADDLNGSAAASPTERDMQR", + "SGSGGSNGLKLDGDDLHSPDSSDDRLAKKTRGMPQRGGGATTAMPSMSTNMLMGVGNGSGIHHE"] + }, + { "name" : "04778_USTMA", + "RefSeqID" : "XP_011391646", + "UniProtID" : "A0A0D1DQM4", + "taxonomyID" : "237631", + "sequence" : [ + "MNQAPLSATGVNFYISGPRPARLFPTPIHEFRKGKYATAGGESGFMTVFEYDVRGHTMMIDVDTSFVRFTSITQALGKNK", + "VNFGRLVKTCPALDPHITKLKGGYLSIQGTWLPFDLAKELSRRIAWEIRDHLVPLFGYDFPSTCLRPDSEGFGQLAIGMS", + "QKRARKRHNNGGPHQTSCYGPSLPISIELWQHSTDPLRDLGESSVVGGQAIEHVSAKNSAVQPCYGSSQPATFHYSKGYG", + "LESRPWYGQDYLESNSLESMWNSAQAGGGSVGLQVPISTCGATASPCLAAIGANGGSPILSSPPSSNASSSSNQSYTAAG", + "YGLMVPPTVPSHSVNSEAGANQAEGPTPIDGSRSYASLTAHGYATGYGDANASLSTWNDATHASTFTLHVHAHVHFQPPD", + "PESAQLFTIHDFGSDPFYAEQVERG"] + }, + { "name" : "STUA_ASPNI", + "RefSeqID" : "XP_663440", + "UniProtID" : "P36011", + "taxonomyID" : "227321", + "sequence" : [ + "MASMNQPQPYMDVHSHLSSGQTYASHPATAGALTHYQYPQQPPVLQPTSTYGPASSYSQYPYPNSVASSQSVPPPTTSIS", + "SQVPAQLLPLPVTNHPVPTHGYGNNSGTPMQGYVYDPTGQMAPPGAKPRVTATLWEDEGSLCYQVEAKGVCVARREDNGM", + "INGTKLLNVAGMTRGRRDGILKSEKVRNVVKIGPMHLKGVWIPFDRALEFANKEKITDLLYPLFVQHISNLLYHPANQNQ", + "RNMTVPDSRRLEGPQPVVRTPQAQQPPSLHHHSLQTPVPSHMSQPGGRPSLDRAHTFPTPPARMNSSVPNTQPLSIDTSL", + "SNARSMPTTPATTPPGNNLQGMQSYQPQSGYDSKPYYSAAPSTHPQYAPQQPLPQQSMAQYGHSMPTSSYRDMAPPSSQR", + "GSVTEIESDVKTERYGQGTVAKTEPEQEQEYAQPDSGYNTGRGSYYTTNPSVGGLAHDHSQLTPDMTGSPQQNGSGRMTP", + "RTSNTAPQWAPGYTTPPRPAAASSLYNIVSDTRGTSGANGSTSDNYSVASNSGYSTGMNGSMGSNKRMRDDDDDRIVPPD", + "SRGEFDTKRRKTLTETPVGGPVGGVPLGLQPMKAGGSLISARR"] + }, + { "name" : "STUA_NEUCR", + "RefSeqID" : "XP_960837", + "UniProtID" : "Q1K6U0", + "taxonomyID" : "367110", + "sequence" : [ + "MNPNTPADVYYGQMSQGSSMPVTTVPSHSHYASQQPPPLLQPGSTYAHQYGTPQYGYANALSSPASIPPSLPPSMNSMAG", + "QSVLPLPGSGSMNPAVYASGGFDTTGQVAPPGMKPRVTATLWEDEGSLCFQVEARGICVARREDNAMINGTKLLNVAGMT", + "RGRRDGILKSEKVRHVVKIGPMHLKGVWIPFERALDFANKEKITELLYPLFVHNIGALLYHPTNQSRTSQVMAAAEQRRK", + "DSHGQLRGPPGLPSLQQHHHHHSMLPGPPSLPSHPSMGRPALDRAHTFPTPPTSASSVMGPMGNSDGYQWSQQSMSGTQG", + "NSSLSLDTSLGSNARSMPSTPATTPPGSTIQSMQNYPPVSQSYESSRQMYQGQSAQQAQYQSQQHYSSQPQHQERPVYSQ", + "SSYIKNDMGPPSGRPTGQSNDASDSKPPTGMIHQGQGQSDPGTHAGSEEDDDANNEAEYTHDSGGYDANRGSYNYNTQAV", + "NSLPHDHGLAPEIGGSPHQAGSGRATPRTAAAPSSYYSAQGYHTPPRGQPSSSLYNVMSNERTGSNGTQGNEMYAGQADM", + "PSSLPNGYSAQPSVMNGSSGGLKRGRDDDDDGGRPTTSAPNLGPGMDMKRRKTMMDGGSLPSPTYTATIAQAAPSAIAAH", + "RRR"] + }, + { "name" : "PHD1_SACCE", + "RefSeqID" : "NP_012881", + "UniProtID" : "P36093", + "taxonomyID" : "559292", + "sequence" : [ + "MYHVPEMRLHYPLVNTQSNAAITPTRSYDNTLPSFNELSHQSTINLPFVQRETPNAYANVAQLATSPTQAKSGYYCRYYA", + "VPFPTYPQQPQSPYQQAVLPYATIPNSNFQPSSFPVMAVMPPEVQFDGSFLNTLHPHTELPPIIQNTNDTSVARPNNLKS", + "IAAASPTVTATTRTPGVSSTSVLKPRVITTMWEDENTICYQVEANGISVVRRADNNMINGTKLLNVTKMTRGRRDGILRS", + "EKVREVVKIGSMHLKGVWIPFERAYILAQREQILDHLYPLFVKDIESIVDARKPSNKASLTPKSSPAPIKQEPSDNKHEI", + "ATEIKPKSIDALSNGASTQGAGELPHLKINHIDTEAQTSRAKNELS"] + }, + { "name" : "08099_COPCI", + "RefSeqID" : "XP_001836714", + "UniProtID" : "A8NVH3", + "taxonomyID" : "240176", + "sequence" : [ + "MSTGMLQETLQTTSASTSGTRFRPYASPNHQVTKGRYITSNDPRGYIPVYEYPLNGQWIMMDIDDGYILWTGIWKALGNS", + "KADIVKMIDSQPDLAPLIRRVRGGYLKIQGTWMPYEVALKLSRRVAWPIRHDLVPLFGPTFPSTCLSPDQPGYGQVVASS", + "NVRRRARRNTQATAQPPREAHSNWTVMTPGPMVGLSFPHSQFSRPPLPPLAPTPARSPSDYAPSSHYGNQLDPQDARRYS", + "HSPYSPLASPPERKSSISSKALSLEIPPVRPSSSKAREDISLPPLKQPDGADPEMSPYALPPISALEDLRGVDTQDSAAV", + "LRRLRLDDDYPSSSRSSTSQDSIWGRRHSLSAHSPHPRSSDNSRFQPYLSSRSYQDSTLKRSRSPAESYADRRRASDFSQ", + "EDSTSAYSPISPATPNSSILSHSSFSDLKKLASSTDTRYNFPRISGRDWAPLKGDTDHIRSSYRSGPSPLELDSDSESSA", + "PHRPW"] + }, + { "name" : "68479_WALME", + "RefSeqID" : "XP_006957792", + "UniProtID" : "I4YDE0", + "taxonomyID" : "671144", + "sequence" : [ + "MTNKVQELWWEENKTRVWQVEVDNGNYVARRQDNDQINGTKLLNITKITRGKRDGILKNEKSRQVVKTGTITLKGVWIPF", + "ERAIILARQFNIEQQLYPLFETNLGDYVENSIGSHQIKRKSLNNLMDSLTTNRELVSKRRSTVSTYNPATSAYVSPYGFS", + "PQHCYQTEFEDMNQHSGEIQSGRPRNTSSASDWMTNWSTSSSSPVIPATPNTFSPVMNTFQSLALHSPPIPIPNYYYDSS", + "SSYFPSYHQKQQQQQVQMQMQMHTTASIGGDRQSNEYIQR"] + }, + { "name" : "11943_PUCGR", + "RefSeqID" : "XP_003330006", + "UniProtID" : "E3KMR2", + "taxonomyID" : "418459", + "sequence" : [ + "MAAAPTSSFLTSMSAQPPRTVQALVNEEVRAPPPVRLYPSQHRVSMTRYATSTDPRGYIPVFEYPLNGQYIMIDCETGMV", + "HFTGIWKALGHTKADVVKLVESDPTIAPYLRKVRGGYLKIQGTWLPFDTAQTLARRVAWQVRYDLVPLFGPDFPDTCLGP", + "GEPGFGQLLLSAPKPRGRRGAKKAAAAPTVAHERTASPQDNRSQSRPGPYPSQESFGNRCSGRVEAVGAMNGYSPMLSQA", + "RYSPYTRAPVHRITQLEPLPSLIQPNQSCPHPTADSMYSSHYHQSPRQSMMTSHGAGPYGQQHLTGSTASGMQSTAPLPS", + "MRPHQAHQSENNFFETYRGPDSFEALSNKWLAPEVANPSLNDSGLLHGEGGCLPPLQYSNNPVLRNGPSGSPTNQYNFPN", + "QIDSAHSSHHIDSNQTQHVHRHAGFPYESQHQSNFRHDLSTEEAAHHPASPSQQPPPSVTYDKAHNSEPQAGSQAANVTA", + "GCYAASGSNSTGNPAGSPGSHSSHVPKSPTPSSASTSTHMQNSHNPNSHRSPSNTLTNMSNNGGFNSNTQGEEAIQFSVL", + "TSPAHLETSGPSENSIPPAQSSDSDWNPAQNTTGLSPSQAPRQ"] + }, + { "name" : "03082_PUCGR", + "RefSeqID" : "XP_003321545", + "UniProtID" : "E3JYK1", + "taxonomyID" : "418459", + "sequence" : [ + "MILISPTRTLPSPRPIDTDPILNYRHIQPAAAAAAVGPWLGQNQHHHHHHDTLAKSPNITTAPATHSPSELSASPAPSAV", + "STGSSLLDPQSVPHIKIPHSSSPPAIMLPQPSSDDDSSTAEEEQPSAQSSNATLNTPTPHTNAPHQLDSHASSVGLYDLP", + "PTSSSAPTTSSSSSPFPSNVPSHQQPSPYSSSPHPNQEHHPHHPHHGNQFYQQSPPALHSPLQSAHHPQQSFDARPHSSL", + "FAHQHYHSRPQSAPHSTSQFSLDPHVLAAAAANVEVKKWDEENTYYYQVAHKGVTVGRLKGSGLVNGTKLLNLAGISRGK", + "RDGILKNEKIRKVVKHGTMHLKGVWIAFDRAVFLAEQHSIADKIFPLLVVNLEHYVPIEPPLMAGGTKLGPGSLFHHHHP", + "RHPRLLPQPIKFPPSTISLAPASANSFSSTGGWPSGPSSALPSIGYNEPFSAPPIPRSAATADTSPSIYEQAQFQYLNSA", + "QANNPDLLERRHTLPNNSFHGYNSVPSFGSSQPPPPVSYSFHYNSTHVPGYPPRSSTAESATPNQFEYQSKNHNGNGNGD", + "AAGSYPATLYHSQPAARPVSSTTAQPSPALNSAPLLLGDLSPGSSTQIVDHGAGDFRLSTGTSNGQVKQEGDDESCNEKR", + "LIMEWNPSC"] + }, + { "name" : "SOK2_SACCE", + "RefSeqID" : "NP_013729", + "UniProtID" : "P53438", + "taxonomyID" : "559292", + "sequence" : [ + "MPIGNPINTNDIKSNRMRQESNMSAVSNSESTIGQSTQQQQQQQQYLGQSVQPLMPVSYQYVVPEQWPYPQYYQQPQSQS", + "QQQLQSQPQMYQVQESFQSSGSDSNASNPPSTSVGVPSNATATALPNGSAITTKKSNNSTNISNNVPYYYYFPQMQAQQS", + "MAYSYPQAYYYYPANGDGTTNGATPSVTSNQVQNPNLEKTYSTFEQQQQHQQQQQLQAQTYPAQPPKIGNAFSKFSKSGP", + "PSDSSSGSMSPNSNRTSRNSNSISSLAQQPPMSNYPQPSTYQYPGFHKTSSIPNSHSPIPPRSLTTPTQGPTSQNGPLSY", + "NLPQVGLLPPQQQQQVSPLYDGNSITPPVKPSTDQETYLTANRHGVSDQQYDSMAKTMNSFQTTTIRHPMPLIATTNATG", + "SNTSGTSASIIRPRVTTTMWEDEKTLCYQVEANGISVVRRADNDMVNGTKLLNVTKMTRGRRDGILKAEKIRHVVKIGSM", + "HLKGVWIPFERALAIAQREKIADYLYPLFIRDIQSVLKQNNPSNDSSSSSSSTGIKSISPRTYYQPINNYQNPNGPSNIS", + "AAQLTYSSMNLNNKIIPNNSIPAVSTIAAGEKPLKKCTMPNSNQLEGHTITNLQTLSATMPMKQQLMGNIASPLSYPRNA", + "TMNSASTLGITPADSKPLTPSPTTTNTNQSSESNVGSIHTGITLPRVESESASHSKWSKEADSGNTVPDNQTLKEPRSSQ", + "LPISALTSTDTDKIKTSTSDEATQPNEPSEAEPVKESESSKSQVDGAGDVSNEEIAADDTKKQEK"] + }, + { "name" : "14426_COPCI", + "RefSeqID" : "XP_002911429", + "UniProtID" : "D6RMB0", + "taxonomyID" : "240176", + "sequence" : [ + "MTARPPLPLRHANPSLRDGNATIPPVKYQILSCQGKDILVGRLKIDTTDGGHAFILRRFDTQAISLTTMFRAAFPTASEA", + "EEKDEINYVKANFDLFGNNGSSKEPHITRLAGTWVNRDTAGQLAHDYNMVDLINTMVEAEPDPNGQYRRSNKSAQNNNPP", + "TNAPEPTPATNVHATRSPAKQSPKPPSKTLPTPSPGSGDAQPPAPKRRREGSPATFTSGIPVASSPAVPKTPGPRRSTRT", + "KSPAPSRVPQPLTATKPRSRASVAPPSPKKRPVDLPKSSPIKAEEDTAVEDNVAGNELYAQDISEQKKLIADLKAAASSK", + "KPADTVKEDDDQQMEEEGQGPSKLKRIRQDEEKPLQFEFKEPEREERQIATNRRVGRFDMQPERKSLAWGIAAFAFGMTA", + "ITYLPNFL"] + }, + { "name" : "BQT4_SCHPO", + "RefSeqID" : "NP_596166", + "UniProtID" : "O60158", + "taxonomyID" : "284812", + "sequence" : [ + "MTENEKSRSLPAERNPLYKDDTLDHTPLIPKCRAQVIEFPDGPATFVRLKCTNPESKVPHFLMRMAKDSSISATSMFRSA", + "FPKATQEEEDLEMRWIRDNLNPIEDKRVAGLWVPPADALALAKDYSMTPFINALLEASSTPSTYATPSRPTAQKSETSEG", + "EPESSTSATTTSVARRTRQRLAEHLENSKKTILQHDNKEEDKEIHSEENETKDEIKSEKKEPEIKKQEGGSSTEKVGQPS", + "SSDDKAKGSTSKDQPSEEEEKTSDIQDRKIKTPIKPSLLGKIRSSVNKGMTDVASQVNRGMTDVASQVNKGVNGVASQVN", + "KGMNGVANQVNKGVTGVASQVRKPVGKLEKKFENLEKSIGDTLKSSIRSSPKSKKRSREDFEENEDYNAMVPVKRSRITK", + "LESEVYYEKRKVRALGGIAIGLGVGAILPFLF"] + }, + { "name" : "PGTG_05590", + "RefSeqID" : "XP_003323688", + "UniProtID" : "E3K4V4", + "taxonomyID" : "418459", + "sequence" : [ + "MPKSSSCCEPEQKQSIPTNANPISAGGAGLDIRLAGMRSAHATLRGCSFSPYMVTQHPPLRDSVNRNKQQPTNNSTNPYT", + "KKASRMSQTNLYKSNNPPNLPQDEFNQTLVNYQGKLRSIRIQDININGHTITIARIKIPSPEKLSSHLIKRFDTNAISAS", + "SFFRSAFPHSTEEEEAIQMRYLHQIYDTHTAGAVEFGSARKLTGVWVPIENAAELAEVYGLTRFAEPLLAFPNPKENPRS", + "PTGTKIGGEDESSTTQTPKASQQSKLTGQISVTRSSKRSRAGPLSFGNTSPSSFSLNSFNKPPTETNKSGTHDDSKSTND", + "ENDEKPASPTDRVAGRGARNSPSKKPTTVDENHEHTEHEDHQLIGTDELAQRAKQEALKLVSELKNSQPCTQSSLESPTN", + "TLETELTRTTSPAKSNKVTRKRSSDEVSFEGEEQGEDEDEERTADETATHRSFLPKLLWRKSAAQAHPNSKKHKRTQLGG", + "GGSSSSSSKSFVPLLTNSATPSVDDSSSTHNPNKRNLAIAGIVIAGAAA"] + }, + { "name" : "06560_NEUCR", + "RefSeqID" : "XP_962267", + "UniProtID" : "Q7S9H5", + "taxonomyID" : "367110", + "sequence" : [ + "MAQVARHLPARRNPLMLEDVPSHTDLASRRRLGQTQLTPRMVTAVPGAEVDPSSLLAFDYAHLRAPLPKGIVSGIFKSSP", + "PSYFLMRRSQDGYISATGMFKATFPYASQEEEEAERKYIKSIPTTSSEETAGNVWIPPEQALILAEEYQITPWIRALLDP", + "SDIAVTATDSSAPKQIAPPPKFFGAQPPLVAPTPPTTRSTRSRPSSRRSSSPAKSTTTSKRGTTPRNTKRTVTTEASATT", + "VTTTATATAVPSAETPATSFADSQAPTLINGEIPTSTPINTVPVTKIQTTEAELKVESIEKEPVVVLEPIEEEPKIKVRV", + "DEDVKLDKDGEEVKHTKVELEVPLMAGEPPSKEEARKMIEEAKAMVEAAVKADAEAAAALVEASKAGAEDEKAEDEAKAE", + "TEATKEEEADSKGKRKAEKISVDEDEKAADEAEQPRQAKRVKTEAELRKDRIRKRAYLGLTATFAVGALGALLPIITPYV", + "ANVL"] + }, + { "name" : "81480_BIPOR", + "RefSeqID" : "XP_007682909", + "UniProtID" : "W6ZKJ4", + "taxonomyID" : "930090", + "sequence" : [ + "MVVDRVLPERKNPLLEPTDSTSIEILIERRRLGQTNLGVKAGVSGIANATKPENMGTFDYAHLRVPLPKDLTGSGIFSRN", + "RMSAFPESYFLMRRSSDGYISATGMFKAAFPWASLQEEDLERKYQKTFPSAGDEEVAGSVWIAPEEALALSEEYSMRHWI", + "EALLDPAPIEKGGKDKSNAAIQMPPRFDVANAQPATLPTFGFRQTRARSARSVSPSKAMTPGRKYATPRKGRSTRSAMKP", + "DATHADDMFRPIEAVTPSTALQNSIARRIAPAETIASSIEGEVKEVEQEVKAALDAEKKPEPELEVQEGTVHIEVKQTVE", + "TNGDTEKTSTSVTVDVPHDHAALPEPEDPTAMIEEAKRMVAEAQKLEGGSPSVTRSSKRGIEEVLDEEDLADERLNKLAK", + "KAYTTEQKMTKEKVTRRALVGLGVMAAIGTAFQYFV"] + }, + { "name" : "01622_ASPNI", + "RefSeqID" : "XP_657766", + "UniProtID" : "Q5BH18", + "taxonomyID" : "227321", + "sequence" : [ + "MVRSLPKKNNPFVTPDAAPPYEELLMRRRLGKTNLAVKPTQVGTSNATKPENLGPFEYAHLRAPLPKDLKGSEIFPSHSP", + "QQHPETYFLMRRSKDGYVSATGMFKIAFPWAKLEEERSEREYLKTRPETSEDEIAGNVWISPVLALELAAEYKMYDWVRA", + "LLDPTEIIQSPSSAKKQITPPPKFELPPIQAPEALVPSSRTRSRRSASPSKKAGTPRKPRQTKAQKEAAVAATNEANATL", + "QSALDDTVSNADGEINGDVLPSVEDKREPETSPVKGKKAAAKAKKQAVSEEDQEDKVKIEIKSDAAEGSDVQAAQTTISV", + "EMPISLPEAPSAEDTQEMIAKAKEMVKEAVKLQQEPAESSATAKKRGAEEAELGEEEEDEETKTLRTKRAKVLEEKLKRE", + "RVRNRALMGVTAAFALAKPALVLLEA"] + }, + { "name" : "05405_ASPNI", + "RefSeqID" : "XP_663009", + "UniProtID" : "Q5B225", + "taxonomyID" : "227321", + "sequence" : [ + "MASIQFLLNPLPSLPSSDRCPLPTPSPTISSSTAMLRSPRQKKQKMAKDAPIFQRGKPRGEVRYPPYEDRDGKFSCQHQD", + "FRIHPLGNIADYPRHIPYNSDKKSFQERTGRESFEVFQYTFQLPGEEKQWTVMWDYNIGLVRTTHLFKCNDYSKTTPAKM", + "LNQNPGLRDICHSITGGALAAQGYWMPYEAAKAIAATFCWKIRFALTPLFGDNFPDLCIHPDDRARFGRMVIDPGIVRIA", + "TEKANLYRMLELRCSTTNSLRADYVLRPSSAPDIDRTDPNLERDRVALGRHILPKSHRHHHHRSKTSPSTNTSLVGYGSS", + "PEVEYYSCGTEPYCVSPESPIRSSFTPVNTPRSTDIYPSSSSTNFLRSPHELLASLSSSASIARARIERASKISGARVIP", + "SSVPSNVTSITTKGRDNTGHSALMEESDIDADAETDSGHEHDLDFELSSSDESSTSSTVSSSTSSASLGFAANSRNRPYR", + "DDDEPHRDTDEEMVDYRAPKRIATAGARDRRWGRGRRVIHQEHSDIETSRRARKHAQRSSNARLVCEMTAAHALISLLHD", + "ATGSDVDVDTHNRLECGRSPDGGVKNNLKGSYFGIRLNHNPSTESGQKRRRASA"] + }, + { "name" : "105954_BIPOR", + "RefSeqID" : "XP_007691967", + "UniProtID" : "W6Z1H5", + "taxonomyID" : "930090", + "sequence" : [ + "MNIQDLLNPSCGDRHDHRRSESATPPSRPVAILPALRRQKIPKDAPIFSEGNRTVGIVNFAPHEAGNDEELLAQHCRFQI", + "YPLGEISRKGVRHIPYNSDKKDFLEKTGRDAFEMFQYTYKLPGEDKPYVVVWDYNVGLVRMTPFFKSCKYSKTIPAKTLR", + "ENPGLKDISYSITGGALVCQGYWIPYQAARAIAATFCYDIRWALTPVFGNDFPSICLTPDDPSFAKFVIDPAIVRYCTEE", + "TTKFRELGSAYEVHRPVAPTQVEAPTSRSDQPLSTSIVRQRRARPIDIESGYGTDTERNDRCLFSPEVSPRTRFTPINRP", + "RSPYSPRTAESSFVSSPVSIRAPPGLHTPTSTPYEHSGEVFRAKRSHSKVAFCEHPADEAVIRPPTAATVDSAHGCEMCV", + "GDDNHSHLDMDAAEMLLSLRTADSAMPPSKRTRRGS"] + }, + { "name" : "69819_WALME", + "RefSeqID" : "XP_006959479", + "UniProtID" : "I4Y911", + "taxonomyID" : "671144", + "sequence" : [ + "MTSPGLPKDFNELLDKSEIPSPKWQQITRDDRPITIARLKLPHPREKHTFILRRYDCNGISFGSLFKAAYPYATDEEEKI", + "ESGFVKKNYDVTLVPTEEYQERKLAKLAGFWIPIAIAEELGQRYAMAEYVDALAKADTPDLTDFKKRSSNRQTSEDIKSS", + "PAKAQASLESPAKSASKIPTPTKNPAPRRSARHQSRSPSPSPLTHNLTPGKKKAKKAPKEAVIEESVEETIVVDKKESPL", + "KKALNDDQVLADIERAKDLVDDIKQSKNLSQSSPVKVVKEEVLETIQPSVSTESLEGEGKRKRELEDETGNEIKVVSFGQ", + "NPPANPEEIQQRPVVQRRGVAAAVGAFALGVGFAASNILPRFLF"] + }, + { "name" : "02840_CRYNE", + "RefSeqID" : "XP_568872", + "UniProtID" : "Q5KM59", + "taxonomyID" : "214684", + "sequence" : [ + "MSHPAADAPPPYPGTTDDAQYDLTPLPHTANRPRLPEDKRNPHLNNLPEDTKIVKFQTIVRENKEIVVGRIKVPTENANG", + "THHAFILRRYDTNAISLTTMYKVAFPSATEEEEKREMDWVKSSFDTRGTNGGRDSEVVRLAGQWVSRNLAIHIAPAYNLV", + "QLVAALSRAVPDPNVAYRKSQRSQAAADELARTKAKQSQAPSSVPAISNVPVRKPQAAIPSMATEISSPASKRQRKDSVT", + "EASGSATQTITEAQPSADTSETDDTRHITIEATTTITSPSGANVDMDAEIEQAKQLVKDLRQEIQLRNEAGDSLEDQGVA", + "VADDVRGVKRGKHEDEAVVISGGAGGKDRVVRTNKRIPQTAGGDVGQRFGWGAFVFSIGLGASLTLFSQYASSLL"] + }, + { "name" : "11055_USTMA", + "RefSeqID" : "XP_011390537", + "UniProtID" : "A0A0D1DZM8", + "taxonomyID" : "237631", + "sequence" : [ + "MPAAASARKSTPTRKSTPRRARSSSVTSNASTGVPASPSASPRKTKKQKEAAAAAAAAVAAAAATAEQVNDDESDLLRPK", + "LPTKRNPRLKEVDEAVVKLQIIKREGHNIIIGRVKLPTVNGQDHAFLLKRFDTNAMAASSMFRLAFPFADGTAEAAEMRF", + "LDTKYDTNRANGGYIVEEVKVPETPKKRGRTRKTAENSKKESTPDTESVSADKQIRVLPEGSTGVRLQGTWIPAEDAIEV", + "AEDYGIAKYALALIHATAEHAEDGGAPILTSEPVAEVKTPRKRQRVSAAAATASDTPDSPQLVQRVTRLENADGSISKVR", + "VESTLEAPSSNGVPVALSQAEIEEQIAQAKALAAGIQQSITAGSGSASTRGQKRRAVNDRPTAEIDPLADDEDYSESGRV", + "VRAFRRGTRVARRRPIATTAGAVAAAGAVGAGALAWVSGGNPEVAIQTLQASMQSIGLQNLQNLGLQNLQQIGTQLGAHL", + "ASILPW"] + }, + { "name" : "XBP1_NEUCR", + "RefSeqID" : "XP_962373", + "UniProtID" : "Q7S9W7", + "taxonomyID" : "367110", + "sequence" : [ + "MLNQNPGLKDIAYSITGGAIKAQGYWMPYACAKAVCATFCYQIAGALIPLFGPDFPSECISPGEPRYGIMIIKPELISDT", + "MRKAQELYRRYGNWGGGCTSSSPARRPLRTASSGSQERHHHHPYPNQEHLDHQQQQQRTVCSRRCPAEENSCVDARPQLR", + "GISAPMPPAGEWTPPLLRSSAGRPRPVMPTSTHSSISYPERAPHRSAWTAVNHQPPNNSLDRYSLKRPLPSNEPDESVSH", + "SNWPSRSQAPNPWLTAIPRSPRKTSSSPWASQPGSASRSRAGSIDSMASQHPQGLPSPSLILSSPSSSMVSLSSSNSPSP", + "RPQLPPISQLCSLPVPSGRRRLPNGRPSRVGGDATSSHSRQDHSTCGAYQFSAGYQRALTPPSSTSAPMHWRSQRRPSLQ", + "DQHEHEHIEDTQPRRIAVEANMECGDDNESHLHLPLPLPRTSSSASIVADKNANDTTSDNSSSRNFNSASIGSGRDDGQT", + "SLAARKTAALTLLHLRQQEEEKEAAAAAAAAAAAAYSSTKRPESPSSSLSSPVSPPPTSGQPSPTLSAVVTATNLRRGTT", + "TATATAVIDTTEPLAPPPSPSSNYLGSPISTSIASSSSSFSPSTSCNGTRENSVVANEMTRYAGQEADAGGPRHCNGDAD", + "DEGDYEHEQQYRRKRRRLLLVGRAKSF"] + }, + { "name" : "XBP1_SACCE", + "RefSeqID" : "NP_012165", + "UniProtID" : "P40489", + "taxonomyID" : "559292", + "sequence" : [ + "MKYPAFSINSDTVHLTDNPLDDYQRLYLVSVLDRDSPPASFSAGLNIRKVNYKSSIAAQFTHPNFIISARDAGNGEEAAA", + "QNVLNCFEYQFPNLQTIQSLVHEQTLLSQLASSATPHSALHLHDKNILMGKIILPSRSNKTPVSASPTKQEKKALSTASR", + "ENATSSLTKNQQFKLTKMDHNLINDKLINPNNCVIWSHDSGYVFMTGIWRLYQDVMKGLINLPRGDSVSTSQQQFFCKAE", + "FEKILSFCFYNHSSFTSEESSSVLLSSSTSSPPKRRTSTGSTFLDANASSSSTSSTQANNYIDFHWNNIKPELRDLICQS", + "YKDFLINELGPDQIDLPNLNPANFTKRIRGGYIKIQGTWLPMEISRLLCLRFCFPIRYFLVPIFGPDFPKDCESWYLAHQ", + "NVTFASSTTGAGAATAATAAANTSTNFTSTAVARPRQKPRPRPRQRSTSMSHSKAQKLVIEDALPSFDSFVENLGLSSND", + "KNFIKKNSKRQKSSTYTSQTSSPIGPRDPTVQILSNLASFYNTHGHRYSYPGNIYIPQQRYSLPPPNQLSSPQRQLNYTY", + "DHIHPVPSQYQSPRHYNVPSSPIAPAPPTFPQPYGDDHYHFLKYASEVYKQQNQRPAHNTNTNMDTSFSPRANNSLNNFK", + "FKTNSKQ"] + } +] diff --git a/data/refAnnotations.json b/data/refAnnotations.json index eafc3fe..b551dd0 100644 --- a/data/refAnnotations.json +++ b/data/refAnnotations.json @@ -1,116 +1,116 @@ -[ - {"pName" : "MBP1_SACCE", "fName" : "APSES fold", "start" : "4", "end" : "102"}, - {"pName" : "MBP1_SACCE", "fName" : "KilA-N", "start" : "22", "end" : "105"}, - {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "108", "end" : "122"}, - {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "236", "end" : "241"}, - {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "279", "end" : "307"}, - {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "700", "end" : "717"}, - {"pName" : "MBP1_SACCE", "fName" : "Ankyrin fold", "start" : "394", "end" : "423"}, - {"pName" : "MBP1_SACCE", "fName" : "Ankyrin fold", "start" : "427", "end" : "463"}, - {"pName" : "MBP1_SACCE", "fName" : "Ankyrin fold", "start" : "512", "end" : "541"}, - {"pName" : "MBP1_SACCE", "fName" : "Swi6 fold", "start" : "381", "end" : "547"}, - {"pName" : "MBP1_SACCE", "fName" : "coiled coil", "start" : "633", "end" : "655"}, - - {"pName" : "MBP1_ASPNI", "fName" : "APSES fold", "start" : "9", "end" : "106"}, - {"pName" : "MBP1_ASPNI", "fName" : "KilA-N", "start" : "26", "end" : "109"}, - {"pName" : "MBP1_ASPNI", "fName" : "low complexity", "start" : "529", "end" : "534"}, - {"pName" : "MBP1_ASPNI", "fName" : "Ankyrin fold", "start" : "260", "end" : "289"}, - {"pName" : "MBP1_ASPNI", "fName" : "Ankyrin fold", "start" : "381", "end" : "413"}, - {"pName" : "MBP1_ASPNI", "fName" : "Swi6 fold", "start" : "193", "end" : "402"}, - {"pName" : "MBP1_ASPNI", "fName" : "coiled coil", "start" : "509", "end" : "572"}, - - {"pName" : "MBP1_BIPOR", "fName" : "APSES fold", "start" : "8", "end" : "106"}, - {"pName" : "MBP1_BIPOR", "fName" : "KilA-N", "start" : "26", "end" : "109"}, - {"pName" : "MBP1_BIPOR", "fName" : "low complexity", "start" : "134", "end" : "152"}, - {"pName" : "MBP1_BIPOR", "fName" : "low complexity", "start" : "267", "end" : "278"}, - {"pName" : "MBP1_BIPOR", "fName" : "low complexity", "start" : "670", "end" : "685"}, - {"pName" : "MBP1_BIPOR", "fName" : "Ankyrin fold", "start" : "266", "end" : "295"}, - {"pName" : "MBP1_BIPOR", "fName" : "Ankyrin fold", "start" : "387", "end" : "416"}, - {"pName" : "MBP1_BIPOR", "fName" : "Swi6 fold", "start" : "253", "end" : "421"}, - {"pName" : "MBP1_BIPOR", "fName" : "coiled coil", "start" : "659", "end" : "681"}, - {"pName" : "MBP1_BIPOR", "fName" : "coiled coil", "start" : "500", "end" : "590"}, - - {"pName" : "MBP1_NEUCR", "fName" : "APSES fold", "start" : "14", "end" : "114"}, - {"pName" : "MBP1_NEUCR", "fName" : "KilA-N", "start" : "34", "end" : "117"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "130", "end" : "141"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "253", "end" : "266"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "514", "end" : "525"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "554", "end" : "564"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "601", "end" : "618"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "620", "end" : "629"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "636", "end" : "652"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "658", "end" : "672"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "725", "end" : "735"}, - {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "752", "end" : "771"}, - {"pName" : "MBP1_NEUCR", "fName" : "Ankyrin fold", "start" : "268", "end" : "297"}, - {"pName" : "MBP1_NEUCR", "fName" : "Ankyrin fold", "start" : "390", "end" : "419"}, - {"pName" : "MBP1_NEUCR", "fName" : "Swi6 fold", "start" : "270", "end" : "426"}, - {"pName" : "MBP1_NEUCR", "fName" : "coiled coil", "start" : "500", "end" : "550"}, - - {"pName" : "MBP1_SCHPO", "fName" : "APSES fold", "start" : "8", "end" : "104"}, - {"pName" : "MBP1_SCHPO", "fName" : "KilA-N", "start" : "25", "end" : "113"}, - {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "111", "end" : "125"}, - {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "136", "end" : "145"}, - {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "176", "end" : "191"}, - {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "422", "end" : "447"}, - {"pName" : "MBP1_SCHPO", "fName" : "Ankyrin fold", "start" : "247", "end" : "276"}, - {"pName" : "MBP1_SCHPO", "fName" : "Ankyrin fold", "start" : "368", "end" : "397"}, - {"pName" : "MBP1_SCHPO", "fName" : "Swi6 fold", "start" : "234", "end" : "400"}, - {"pName" : "MBP1_SCHPO", "fName" : "coiled coil", "start" : "457", "end" : "538"}, - - {"pName" : "MBP1_COPCI", "fName" : "APSES fold", "start" : "5", "end" : "103"}, - {"pName" : "MBP1_COPCI", "fName" : "KilA-N", "start" : "23", "end" : "106"}, - {"pName" : "MBP1_COPCI", "fName" : "low complexity", "start" : "170", "end" : "191"}, - {"pName" : "MBP1_COPCI", "fName" : "low complexity", "start" : "435", "end" : "450"}, - {"pName" : "MBP1_COPCI", "fName" : "low complexity", "start" : "611", "end" : "626"}, - {"pName" : "MBP1_COPCI", "fName" : "Ankyrin fold", "start" : "270", "end" : "299"}, - {"pName" : "MBP1_COPCI", "fName" : "Ankyrin fold", "start" : "389", "end" : "418"}, - {"pName" : "MBP1_COPCI", "fName" : "Ankyrin fold", "start" : "474", "end" : "509"}, - {"pName" : "MBP1_COPCI", "fName" : "Swi6 fold", "start" : "257", "end" : "429"}, - {"pName" : "MBP1_COPCI", "fName" : "coiled coil", "start" : "500", "end" : "570"}, - {"pName" : "MBP1_COPCI", "fName" : "coiled coil", "start" : "651", "end" : "678"}, - - {"pName" : "MBP1_CRYNE", "fName" : "APSES fold", "start" : "16", "end" : "114"}, - {"pName" : "MBP1_CRYNE", "fName" : "KilA-N", "start" : "34", "end" : "117"}, - {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "66", "end" : "85"}, - {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "413", "end" : "423"}, - {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "633", "end" : "644"}, - {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "697", "end" : "709"}, - {"pName" : "MBP1_CRYNE", "fName" : "Ankyrin fold", "start" : "477", "end" : "506"}, - {"pName" : "MBP1_CRYNE", "fName" : "Ankyrin fold", "start" : "618", "end" : "647"}, - {"pName" : "MBP1_CRYNE", "fName" : "Swi6 fold", "start" : "452", "end" : "663"}, - - {"pName" : "MBP1_PUCGR", "fName" : "APSES fold", "start" : "90", "end" : "187"}, - {"pName" : "MBP1_PUCGR", "fName" : "KilA-N", "start" : "107", "end" : "190"}, - {"pName" : "MBP1_PUCGR", "fName" : "low complexity", "start" : "208", "end" : "227"}, - {"pName" : "MBP1_PUCGR", "fName" : "low complexity", "start" : "273", "end" : "291"}, - {"pName" : "MBP1_PUCGR", "fName" : "Ankyrin fold", "start" : "442", "end" : "271"}, - {"pName" : "MBP1_PUCGR", "fName" : "Ankyrin fold", "start" : "475", "end" : "509"}, - {"pName" : "MBP1_PUCGR", "fName" : "Ankyrin fold", "start" : "561", "end" : "590"}, - {"pName" : "MBP1_PUCGR", "fName" : "Swi6 fold", "start" : "429", "end" : "601"}, - {"pName" : "MBP1_PUCGR", "fName" : "coiled coil", "start" : "827", "end" : "863"}, - - {"pName" : "MBP1_USTMA", "fName" : "APSES fold", "start" : "7", "end" : "104"}, - {"pName" : "MBP1_USTMA", "fName" : "KilA-N", "start" : "24", "end" : "107"}, - {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "106", "end" : "116"}, - {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "161", "end" : "183"}, - {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "666", "end" : "681"}, - {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "688", "end" : "700"}, - {"pName" : "MBP1_USTMA", "fName" : "AT hook", "start" : "134", "end" : "146"}, - {"pName" : "MBP1_USTMA", "fName" : "Ankyrin fold", "start" : "245", "end" : "274"}, - {"pName" : "MBP1_USTMA", "fName" : "Ankyrin fold", "start" : "278", "end" : "314"}, - {"pName" : "MBP1_USTMA", "fName" : "Ankyrin fold", "start" : "364", "end" : "393"}, - {"pName" : "MBP1_USTMA", "fName" : "Swi6 fold", "start" : "232", "end" : "404"}, - {"pName" : "MBP1_USTMA", "fName" : "coiled coil", "start" : "590", "end" : "618"}, - - {"pName" : "MBP1_WALME", "fName" : "APSES fold", "start" : "6", "end" : "103"}, - {"pName" : "MBP1_WALME", "fName" : "KilA-N", "start" : "23", "end" : "106"}, - {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "149", "end" : "162"}, - {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "171", "end" : "188"}, - {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "618", "end" : "628"}, - {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "634", "end" : "660"}, - {"pName" : "MBP1_WALME", "fName" : "Ankyrin fold", "start" : "250", "end" : "279"}, - {"pName" : "MBP1_WALME", "fName" : "Ankyrin fold", "start" : "369", "end" : "398"}, - {"pName" : "MBP1_WALME", "fName" : "Swi6 fold", "start" : "237", "end" : "409"}, - {"pName" : "MBP1_WALME", "fName" : "coiled coil", "start" : "461", "end" : "585"} -] +[ + {"pName" : "MBP1_SACCE", "fName" : "APSES fold", "start" : "4", "end" : "102"}, + {"pName" : "MBP1_SACCE", "fName" : "KilA-N", "start" : "22", "end" : "105"}, + {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "108", "end" : "122"}, + {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "236", "end" : "241"}, + {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "279", "end" : "307"}, + {"pName" : "MBP1_SACCE", "fName" : "low complexity", "start" : "700", "end" : "717"}, + {"pName" : "MBP1_SACCE", "fName" : "Ankyrin fold", "start" : "394", "end" : "423"}, + {"pName" : "MBP1_SACCE", "fName" : "Ankyrin fold", "start" : "427", "end" : "463"}, + {"pName" : "MBP1_SACCE", "fName" : "Ankyrin fold", "start" : "512", "end" : "541"}, + {"pName" : "MBP1_SACCE", "fName" : "Swi6 fold", "start" : "381", "end" : "547"}, + {"pName" : "MBP1_SACCE", "fName" : "coiled coil", "start" : "633", "end" : "655"}, + + {"pName" : "MBP1_ASPNI", "fName" : "APSES fold", "start" : "9", "end" : "106"}, + {"pName" : "MBP1_ASPNI", "fName" : "KilA-N", "start" : "26", "end" : "109"}, + {"pName" : "MBP1_ASPNI", "fName" : "low complexity", "start" : "529", "end" : "534"}, + {"pName" : "MBP1_ASPNI", "fName" : "Ankyrin fold", "start" : "260", "end" : "289"}, + {"pName" : "MBP1_ASPNI", "fName" : "Ankyrin fold", "start" : "381", "end" : "413"}, + {"pName" : "MBP1_ASPNI", "fName" : "Swi6 fold", "start" : "193", "end" : "402"}, + {"pName" : "MBP1_ASPNI", "fName" : "coiled coil", "start" : "509", "end" : "572"}, + + {"pName" : "MBP1_BIPOR", "fName" : "APSES fold", "start" : "8", "end" : "106"}, + {"pName" : "MBP1_BIPOR", "fName" : "KilA-N", "start" : "26", "end" : "109"}, + {"pName" : "MBP1_BIPOR", "fName" : "low complexity", "start" : "134", "end" : "152"}, + {"pName" : "MBP1_BIPOR", "fName" : "low complexity", "start" : "267", "end" : "278"}, + {"pName" : "MBP1_BIPOR", "fName" : "low complexity", "start" : "670", "end" : "685"}, + {"pName" : "MBP1_BIPOR", "fName" : "Ankyrin fold", "start" : "266", "end" : "295"}, + {"pName" : "MBP1_BIPOR", "fName" : "Ankyrin fold", "start" : "387", "end" : "416"}, + {"pName" : "MBP1_BIPOR", "fName" : "Swi6 fold", "start" : "253", "end" : "421"}, + {"pName" : "MBP1_BIPOR", "fName" : "coiled coil", "start" : "659", "end" : "681"}, + {"pName" : "MBP1_BIPOR", "fName" : "coiled coil", "start" : "500", "end" : "590"}, + + {"pName" : "MBP1_NEUCR", "fName" : "APSES fold", "start" : "14", "end" : "114"}, + {"pName" : "MBP1_NEUCR", "fName" : "KilA-N", "start" : "34", "end" : "117"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "130", "end" : "141"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "253", "end" : "266"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "514", "end" : "525"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "554", "end" : "564"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "601", "end" : "618"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "620", "end" : "629"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "636", "end" : "652"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "658", "end" : "672"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "725", "end" : "735"}, + {"pName" : "MBP1_NEUCR", "fName" : "low complexity", "start" : "752", "end" : "771"}, + {"pName" : "MBP1_NEUCR", "fName" : "Ankyrin fold", "start" : "268", "end" : "297"}, + {"pName" : "MBP1_NEUCR", "fName" : "Ankyrin fold", "start" : "390", "end" : "419"}, + {"pName" : "MBP1_NEUCR", "fName" : "Swi6 fold", "start" : "270", "end" : "426"}, + {"pName" : "MBP1_NEUCR", "fName" : "coiled coil", "start" : "500", "end" : "550"}, + + {"pName" : "MBP1_SCHPO", "fName" : "APSES fold", "start" : "8", "end" : "104"}, + {"pName" : "MBP1_SCHPO", "fName" : "KilA-N", "start" : "25", "end" : "113"}, + {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "111", "end" : "125"}, + {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "136", "end" : "145"}, + {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "176", "end" : "191"}, + {"pName" : "MBP1_SCHPO", "fName" : "low complexity", "start" : "422", "end" : "447"}, + {"pName" : "MBP1_SCHPO", "fName" : "Ankyrin fold", "start" : "247", "end" : "276"}, + {"pName" : "MBP1_SCHPO", "fName" : "Ankyrin fold", "start" : "368", "end" : "397"}, + {"pName" : "MBP1_SCHPO", "fName" : "Swi6 fold", "start" : "234", "end" : "400"}, + {"pName" : "MBP1_SCHPO", "fName" : "coiled coil", "start" : "457", "end" : "538"}, + + {"pName" : "MBP1_COPCI", "fName" : "APSES fold", "start" : "5", "end" : "103"}, + {"pName" : "MBP1_COPCI", "fName" : "KilA-N", "start" : "23", "end" : "106"}, + {"pName" : "MBP1_COPCI", "fName" : "low complexity", "start" : "170", "end" : "191"}, + {"pName" : "MBP1_COPCI", "fName" : "low complexity", "start" : "435", "end" : "450"}, + {"pName" : "MBP1_COPCI", "fName" : "low complexity", "start" : "611", "end" : "626"}, + {"pName" : "MBP1_COPCI", "fName" : "Ankyrin fold", "start" : "270", "end" : "299"}, + {"pName" : "MBP1_COPCI", "fName" : "Ankyrin fold", "start" : "389", "end" : "418"}, + {"pName" : "MBP1_COPCI", "fName" : "Ankyrin fold", "start" : "474", "end" : "509"}, + {"pName" : "MBP1_COPCI", "fName" : "Swi6 fold", "start" : "257", "end" : "429"}, + {"pName" : "MBP1_COPCI", "fName" : "coiled coil", "start" : "500", "end" : "570"}, + {"pName" : "MBP1_COPCI", "fName" : "coiled coil", "start" : "651", "end" : "678"}, + + {"pName" : "MBP1_CRYNE", "fName" : "APSES fold", "start" : "16", "end" : "114"}, + {"pName" : "MBP1_CRYNE", "fName" : "KilA-N", "start" : "34", "end" : "117"}, + {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "66", "end" : "85"}, + {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "413", "end" : "423"}, + {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "633", "end" : "644"}, + {"pName" : "MBP1_CRYNE", "fName" : "low complexity", "start" : "697", "end" : "709"}, + {"pName" : "MBP1_CRYNE", "fName" : "Ankyrin fold", "start" : "477", "end" : "506"}, + {"pName" : "MBP1_CRYNE", "fName" : "Ankyrin fold", "start" : "618", "end" : "647"}, + {"pName" : "MBP1_CRYNE", "fName" : "Swi6 fold", "start" : "452", "end" : "663"}, + + {"pName" : "MBP1_PUCGR", "fName" : "APSES fold", "start" : "90", "end" : "187"}, + {"pName" : "MBP1_PUCGR", "fName" : "KilA-N", "start" : "107", "end" : "190"}, + {"pName" : "MBP1_PUCGR", "fName" : "low complexity", "start" : "208", "end" : "227"}, + {"pName" : "MBP1_PUCGR", "fName" : "low complexity", "start" : "273", "end" : "291"}, + {"pName" : "MBP1_PUCGR", "fName" : "Ankyrin fold", "start" : "442", "end" : "271"}, + {"pName" : "MBP1_PUCGR", "fName" : "Ankyrin fold", "start" : "475", "end" : "509"}, + {"pName" : "MBP1_PUCGR", "fName" : "Ankyrin fold", "start" : "561", "end" : "590"}, + {"pName" : "MBP1_PUCGR", "fName" : "Swi6 fold", "start" : "429", "end" : "601"}, + {"pName" : "MBP1_PUCGR", "fName" : "coiled coil", "start" : "827", "end" : "863"}, + + {"pName" : "MBP1_USTMA", "fName" : "APSES fold", "start" : "7", "end" : "104"}, + {"pName" : "MBP1_USTMA", "fName" : "KilA-N", "start" : "24", "end" : "107"}, + {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "106", "end" : "116"}, + {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "161", "end" : "183"}, + {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "666", "end" : "681"}, + {"pName" : "MBP1_USTMA", "fName" : "low complexity", "start" : "688", "end" : "700"}, + {"pName" : "MBP1_USTMA", "fName" : "AT hook", "start" : "134", "end" : "146"}, + {"pName" : "MBP1_USTMA", "fName" : "Ankyrin fold", "start" : "245", "end" : "274"}, + {"pName" : "MBP1_USTMA", "fName" : "Ankyrin fold", "start" : "278", "end" : "314"}, + {"pName" : "MBP1_USTMA", "fName" : "Ankyrin fold", "start" : "364", "end" : "393"}, + {"pName" : "MBP1_USTMA", "fName" : "Swi6 fold", "start" : "232", "end" : "404"}, + {"pName" : "MBP1_USTMA", "fName" : "coiled coil", "start" : "590", "end" : "618"}, + + {"pName" : "MBP1_WALME", "fName" : "APSES fold", "start" : "6", "end" : "103"}, + {"pName" : "MBP1_WALME", "fName" : "KilA-N", "start" : "23", "end" : "106"}, + {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "149", "end" : "162"}, + {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "171", "end" : "188"}, + {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "618", "end" : "628"}, + {"pName" : "MBP1_WALME", "fName" : "low complexity", "start" : "634", "end" : "660"}, + {"pName" : "MBP1_WALME", "fName" : "Ankyrin fold", "start" : "250", "end" : "279"}, + {"pName" : "MBP1_WALME", "fName" : "Ankyrin fold", "start" : "369", "end" : "398"}, + {"pName" : "MBP1_WALME", "fName" : "Swi6 fold", "start" : "237", "end" : "409"}, + {"pName" : "MBP1_WALME", "fName" : "coiled coil", "start" : "461", "end" : "585"} +] diff --git a/data/refFeatures.json b/data/refFeatures.json index 8df1da7..4d6d5c6 100644 --- a/data/refFeatures.json +++ b/data/refFeatures.json @@ -1,47 +1,47 @@ -[ - { "name" : "APSES fold", - "description " : "DNA binding domain by similarity to structure", - "sourceDB" : "PDB", - "accession" : "1BM8_A_1_99"}, - - { "name" : "KilA-N", - "description " : "DNA binding domain by Pfam annotation", - "sourceDB" : "Pfam", - "accession" : "PF04383"}, - - { "name" : "AT hook", - "description " : "DNA interaction motif by SMART annotation", - "sourceDB" : "SMART", - "accession" : null}, - - { "name" : "low complexity", - "description " : "SEG annotation by SMART", - "sourceDB" : "SMART", - "accession" : null}, - - { "name" : "Ankyrin fold", - "description " : "Ankyrin domain by SMART annotation", - "sourceDB" : "SMART", - "accession" : "SM00248"}, - - { "name" : "Swi6 fold", - "description " : "Swi6 fold by similarity to structure", - "sourceDB" : "PDB", - "accession" : "1SW6_B"}, - - { "name" : "coiled coil", - "description " : "Coiled coil by SMART annotation", - "sourceDB" : "SMART", - "accession" : null}, - - { "name" : "McInerny 2011", - "description " : "Yeast cell cycle review", - "sourceDB" : "PubMed", - "accession" : "21310294"} -] - - - - - - +[ + { "name" : "APSES fold", + "description " : "DNA binding domain by similarity to structure", + "sourceDB" : "PDB", + "accession" : "1BM8_A_1_99"}, + + { "name" : "KilA-N", + "description " : "DNA binding domain by Pfam annotation", + "sourceDB" : "Pfam", + "accession" : "PF04383"}, + + { "name" : "AT hook", + "description " : "DNA interaction motif by SMART annotation", + "sourceDB" : "SMART", + "accession" : null}, + + { "name" : "low complexity", + "description " : "SEG annotation by SMART", + "sourceDB" : "SMART", + "accession" : null}, + + { "name" : "Ankyrin fold", + "description " : "Ankyrin domain by SMART annotation", + "sourceDB" : "SMART", + "accession" : "SM00248"}, + + { "name" : "Swi6 fold", + "description " : "Swi6 fold by similarity to structure", + "sourceDB" : "PDB", + "accession" : "1SW6_B"}, + + { "name" : "coiled coil", + "description " : "Coiled coil by SMART annotation", + "sourceDB" : "SMART", + "accession" : null}, + + { "name" : "McInerny 2011", + "description " : "Yeast cell cycle review", + "sourceDB" : "PubMed", + "accession" : "21310294"} +] + + + + + + diff --git a/data/refMBP1Proteins.json b/data/refMBP1Proteins.json index 43832d2..cdeb769 100644 --- a/data/refMBP1Proteins.json +++ b/data/refMBP1Proteins.json @@ -1,155 +1,155 @@ -[ - { "name" : "MBP1_SCHPO", - "RefSeqID" : "NP_593032", - "UniProtID" : "P41412", - "taxonomyID" : 284812, - "sequence" : [ - "MAPRSSAVHVAVYSGVEVYECFIKGVSVMRRRRDSWLNATQILKVADFDKPQRTRVLERQVQIGAHEKVQ", - "GGYGKYQGTWVPFQRGVDLATKYKVDGIMSPILSLDIDEGKAIAPKKKQTKQKKPSVRGRRGRKPSSLSS", - "STLHSVNEKQPNSSISPTIESSMNKVNLPGAEEQVSATPLPASPNALLSPNDNTIKPVEELGMLEAPLDK", - "YEESLLDFFLHPEEGRIPSFLYSPPPDFQVNSVIDDDGHTSLHWACSMGHIEMIKLLLRANADIGVCNRL", - "SQTPLMRSVIFTNNYDCQTFGQVLELLQSTIYAVDTNGQSIFHHIVQSTSTPSKVAAAKYYLDCILEKLI", - "SIQPFENVVRLVNLQDSNGDTSLLIAARNGAMDCVNSLLSYNANPSIPNRQRRTASEYLLEADKKPHSLL", - "QSNSNASHSAFSFSGISPAIISPSCSSHAFVKAIPSISSKFSQLAEEYESQLREKEEDLIRANRLKQDTL", - "NEISRTYQELTFLQKNNPTYSQSMENLIREAQETYQQLSKRLLIWLEARQIFDLERSLKPHTSLSISFPS", - "DFLKKEDGLSLNNDFKKPACNNVTNSDEYEQLINKLTSLQASRKKDTLYIRKLYEELGIDDTVNSYRRLI", - "AMSCGINPEDLSLEILDAVEEALTREK"] - }, - { "name" : "MBP1_ASPNI", - "RefSeqID" : "XP_660758", - "UniProtID" : "Q5B8H6", - "taxonomyID" : 227321, - "sequence" : [ - "MAAVDFSNVYSATYSSVPVYEFKIGTDSVMRRRSDDWINATHILKVAGFDKPARTRILEREVQKGVHEKV", - "QGGYGKYQGTWIPLQEGRQLAERNNILDKLLPIFDYVAGDRSPPPAPKHTSAASKPRAPKINKRVVKEDV", - "FSAVNHHRSMGPPSFHHEHYDVNTGLDEDESIEQATLESSSMIADEDMISMSQNGPYSSRKRKRGINEVA", - "AMSLSEQEHILYGDQLLDYFMTVGDAPEATRIPPPQPPANFQVDRPIDDSGNTALHWACAMGDLEIVKDL", - "LRRGADMKALSIHEETPLVRAVLFTNNYEKRTFPALLDLLLDTISFRDWFGATLFHHIAQTTKSKGKWKS", - "SRYYCEVALEKLRTTFSPEEVDLLLSCQDSVGDTAVLVAARNGVFRLVDLLLSRCPRAGDLVNKRGETAS", - "SIMQRAHLAERDIPPPPSSITMGNDHIDGEVGAPTSLEPQSVTLHHESSPATAQLLSQIGAIMAEASRKL", - "TSSYGAAKPSQKDSDDVANPEALYEQLEQDRQKIRRQYDALAAKEAAEESSDAQLGRYEQMRDNYESLLE", - "QIQRARLKERLASTPVPTQTAVIGSSSPEQDRLLTTFQLSRALCSEQKIRRAAVKELAQQRADAGVSTKF", - "DVHRKLVALATGLKEEELDPMAAELAETLEFDRMNGKGVGPESPEADHKDSASLPFPGPVVSVDA"] - }, - { "name" : "MBP1_BIPOR", - "RefSeqID" : "XP_007682304", - "UniProtID" : "W6ZM86", - "taxonomyID" : 930090, - "sequence" : [ - "MPPAPDGKIYSATYSNVPVYECNVNGHHVMRRRADDWINATHILKVADYDKPARTRILEREVQKGVHEKV", - "QGGYGKYQGTWIPLEEGRGLAERNGVLDKMRAIFDYVPGDRSPPPAPKHATAASNRMKPPRQTAAAVAAA", - "AVAAAAAAAAVANHNALMSNSRSQASEDPYENSQRSQIYREDTPDNETVISESMLGDADLMDMSQYSADG", - "NRKRKRGMDQMSLLDQQHQIWADQLLDYFMLLDHEAAVSWPEPPPSINLDRPIDEKGHAAMHWAAAMGDV", - "GVVKELIHRGARLDCLSNNLETPLMRAVMFTNNFDKETMPSMVKIFQQTVHRTDWFGSTVFHHIAATTSS", - "SNKYVCARWYLDCIINKLSETWIPEEVTRLLNAADQNGDTAIMIAARNGARKCVRSLLGRNVAVDIPNKK", - "GETADDLIRELNQRRRMHGRTRQASSSPFAPAPEHRLNGHVPHFDGGPLMSVPVPSMAVRESVQYRSQTA", - "SHLMTKVAPTLLEKCEELATAYEAELQEKEAEFFDAERVVKRRQAELEAVRKQVAELQSMSKGLHIDLND", - "EEAERQQEDELRLLVEEAESLLEIEQKAELRRLCSSMPQQNSDSSPVDITEKMRLALLLHRAQLERRELV", - "REVVGNLSVAGMSEKQGTYKKLIAKALGEREEDVESMLPEILQELEEAETQERAEGLDGSPV"] - }, - { "name" : "MBP1_NEUCR", - "RefSeqID" : "XP_955821", - "UniProtID" : "Q7RW59", - "taxonomyID" : 367110, - "sequence" : [ - "MVKENVGGNPEPGIYSATYSGIPVWEYQFGVDLKEHVMRRRHDDWVNATHILKAAGFDKPARTRILEREV", - "QKDTHEKIQGGYGRYQGTWIPLEQAEALARRNNIYERLKPIFEFQPGNESPPPAPRHASKPKAPKVKPAV", - "PTWGSKSAKNANPPQPGTFLPPGRKGLPAQAPDYNDADTHMHDDDTPDNLTVASASYMAEDDRYDHSHFS", - "TGHRKRKRDELIEDMTEQQHAVYGDELLDYFLLSRNEQPAVRPDPPPNFKPDWPIDNERHTCLHWASAMG", - "DVDVMRQLKKFGASLDAQNVRGETPFMRAVNFTNCFEKQTFPQVMKELFSTIDCRDLSGCTVIHHAAVMK", - "IGRVNSQSCSRYYLDIILNRLQETHHPEFVQQLLDAQDNDGNTAVHLAAMRDARKCIRALLGRGASTDIP", - "NKQGIRAEELIKELNASISKSRSNLPQRSSSPFAPDTQRHDAFHEAISESMVTSRKNSQPNYSSDAANTV", - "QNRITPLVLQKLKDLTATYDSEFKEKDDAEKEARRILNKTQSELKALTASIDDYNSRLDTDDVAAKTAAE", - "MATARHKVLAFVTHQNRISVQEAVKQELAALDRANAVTNGTSTKSKSSSPSKKPKLSPIPDQKDKPPKDE", - "NETESEAEHPDPPAAQAHQQQPGPSSQDTEVEDQDREEEEDDYTHRLSLAAELRSILQEQRSAENDYVEA", - "RGMLGTGERIDKYKHLLMSCLPPDEQENLEENLEEMIKLMEQEDESVTDLPAGAVGGGGGGNAADGSGGG", - "GQPSNGRRESVLPALRGGNGDGEMSRRGSRTAAAAAAQVDGEREINGRAGAERTERIQEIAAV"] - }, - { "name" : "MBP1_COPCI", - "RefSeqID" : "XP_001837394", - "UniProtID" : "A8NYC6", - "taxonomyID" : 240176, - "sequence" : [ - "MPEAQIFKATYSGIPVYEMMCKGVAVMRRRSDSWLNATQILKVAGFDKPQRTRVLEREVQKGEHEKVQGG", - "YGKYQGTWIPLERGMQLAKQYNCEHLLRPIIEFTPAAKSPPLAPKHLVATAGNRPVRKPLTTDLSAAVIN", - "TRSTRKQVADGVGEESDHDTHSLRGSEDGSMTPSPSEASSSSRTPSPIHSPGTYHSNGLDGPSSGGRNRY", - "RQSNDRYDEDDDASRHNGMGDPRSYGDQILEYFISDTNQIPPILITPPPDFDPNMAIDDDGHTSLHWACA", - "MGRIRIVKLLLSAGADIFKVNKAGQTALMRSVMFANNYDVRKFPELYELLHRSTLNIDNSNRTVFHHVVD", - "VAMSKGKTHAARYYMETILTRLADYPKELADVINFQDEDGETALTMAARCRSKRLVKLLIDHGADPKINN", - "HDGKNAEDYILEDERFRSSPAPSSRVAAMSYRNAQVAYPPPGAPSTYSFAPANHDRPPLHYSAAAQKAST", - "RCVNDMASMLDSLAASFDQELRDKERDMAQAQALLTNIQAEILESQRTVLQLRQQAEGLSQAKQRLADLE", - "NALQDKMGRRYRLGFEKWIKDEETREKVIRDAANGDLVLTPATTSYTVDEDGDSDSGSNGDKNKGKRKAQ", - "VQQEEVSDLVELYSNIPTDPEELRKQCEALREEVSQSRKRRKAMFDELVTFQAEAGTSGRMSDYRRLIAA", - "GCGGLEPLEIDSVLGMLLETLEAEDPSSTSATWSGSKGQQTG"] - }, - { "name" : "MBP1_CRYNE", - "RefSeqID" : "XP_569090", - "UniProtID" : "Q5KMQ9", - "taxonomyID" : 214684, - "sequence" : [ - "MGKKVIASGGDNGPNTIYKATYSGVPVYEMVCRDVAVMRRRSDAYLNATQILKVAGFDKPQRTRVLEREV", - "QKGEHEKVQGGYGKYQGTWIPIERGLALAKQYGVEDILRPIIDYVPTSVSPPPAPKHSVAPPSKARRDKE", - "KETGRTKATPSRTGPTSAAALQAQAQLNRAKMHDSTPDADASFRSFEERVSLTPEDDSSSDTPSPVASVM", - "TDQDMEVDKMGMHMSMPNVTLSQNMEELGAGSRKRSAAMMMEDEDQFGQLRSIRGNSAVHTPHGTPRHLG", - "IGMPPEPIGPEQYTDIILNYFVSETSQIPSILVSPPHDFDPNAPIDDDGHTALHWACAMGRVRVVKLLLT", - "AGASIFAGNNAEQTPLMRSVMFSNNYDMRKFPELYELLHRSTLNIDKQNRTVFHHIANLALTKGKTHAAK", - "YYMETILARLADYPQELADVINFQDEEGETALTIAARARSRRLVKALLDHGANPKIKNRDSRSAEDYILE", - "DERFRSSPVPAPNGGIGKASTSAAAEKPLFAPQLYFSEAARLCGGQALTDITSHMQSLARSFDAELQGKE", - "RDILQAKALLTNIHTEVTENGRSITAITNQAAPLEEKRRELEALQASLKTRVKDALKKGYIGWLEGELVR", - "EQRWENGELEGNEEEKAAVQALRDVPTGGQEVVQAEEEKLRWEIEEKRKRRAMFVEKFVRAQTEAGTSEQ", - "IAKYRKLVSAGLGGVSTNEVDELMNQLLEGLEEENDNQVYNTTAGESGPSSWVQ"] - }, - { "name" : "MBP1_PUCGR", - "RefSeqID" : "XP_003327086", - "UniProtID" : "E3KED4", - "taxonomyID" : 418459, - "sequence" : [ - "MAYGGSIQPLRPPSRESATLHLHQPDLTVTSPPLSLTHCPPCVYSHFTHTPTSLIVIQVSLHSLLDQETY", - "HLLPSRSPPTVSVRMGTTTIYKATYSGVPVLEMPCEGIAVMRRRSDSWLNATQILKVAGFDKPQRTRVLE", - "REIQKGTHEKIQGGYGKYQGTWVPLDRGIDLAKQYGVDHLLSALFNFQPSSNESPPLAPKHVTALSTRVK", - "VSKVSAASAARAARAVVPSLPSTSGLGGRNTNNSWSNFDSDNEPGLPPAASSRESNGNWATQSKLARSSN", - "LARARANINNSHPEDLPVPAPDQLQASPLPSMQTADPENDNSLTPSELSLPSRTPSPIEDLPLTVNTASS", - "QSTRNKGKSRDLPDDEDLSRGQKRKYDTSLVEDTSYSDGADDQYINGNPSNAASAKYAKLILDYFVSESS", - "QIPNFLNDPPSDFDPNVVIDDDGHTALHWACAMGRIKIIKLLLTCGADIFRANNAGQTALMRAVMFTNNH", - "DLRTFPELFESFSGSVINIDRTDRTVFHYVIDIALTKGKVPAARYYLETILSQLSEYPKELIDILNFQDE", - "DGETALTLAARCRSKKLVKILLDHGANPKTANRDGKSAEDYILEDDKFRALSPTPCSSGPIRQLDQNSPG", - "GTSNRSDFVDLVDPVPIDSNLIPQRSPNASPPHYSETGQRVTKQLLPEVTSMIELLATTFDTELQDKERD", - "LDHAVGLLSNIEKEYLEGQRKILNYERMLSDFGEKKLALGDLEKELNDKLGKRYRFGWEKYVRDEEERAR", - "RITEQRSKYLQELSIEDRKLLDSSNLRFADPSKQEVLMKLQADERENSDLLNLIRTNSTDVESECDLLRE", - "SVQKLSEERERLFKEFINLSSENTGGENEEDDGANHTSANTSRLNNYRKLISLGCGGIGLDEVDEVIESL", - "NEGIDVNELNDNGFLTEQDEELGNHQNYHNIHTQGR"] - }, - { "name" : "MBP1_USTMA", - "RefSeqID" : "XP_011392621", - "UniProtID" : "A0A0D1DP35", - "taxonomyID" : 237631, - "sequence" : [ - "MSGDKTIFKATYSGVPVYECIINNVAVMRRRSDDWLNATQILKVVGLDKPQRTRVLEREIQKGIHEKVQG", - "GYGKYQGTWIPLDVAIELAERYNIQGLLQPITSYVPSAADSPPPAPKHTISTSNRSKKIIPADPGALGRS", - "RRATSIETESEVIGAAPNNVSEGSMSPSPSDISSSSRTPSPLPADRAHPLHANHALAGYNGRDANNHARY", - "ADIILDYFVTENTTVPSLLINPPPDFNPDMSIDDDEHTALHWACAMGRIRVVKLLLSAGADIFRVNSNQQ", - "TALMRATMFSNNYDLRKFPELFELLHRSILNIDRNDRTVFHHVVDLALSRGKPHAARYYMETMINRLADY", - "GDQLADILNFQDDEGETPLTMAARARSKRLVRLLLEHGADPKIRNKEGKNAEDYIIEDERFRSSPSRTGP", - "AGIELGADGLPVLPTSSLHTSEAGQRTAGRAVTLMSNLLHSLADSYDSEINTAEKKLTQAHGLLKQIQTE", - "IEDSAKVAEALHHEAQGVDEERKRVDSLQLALKHAINKRARDDLERRWSEGKQAIKRARLQAGLEPGALS", - "TSNATNAPATGDQKSKDDAKSLIEALPAGTNVKTAIAELRKQLSQVQANKTELVDKFVARAREQGTGRTM", - "AAYRRLIAAGCGGIAPDEVDAVVGVLCELLQESHTGARAGAGGERDDRARDVAMMLKGAGAAALAANAGA", - "P"] - }, - { "name" : "MBP1_WALME", - "RefSeqID" : "XP_006957051", - "UniProtID" : "I4YGC0", - "taxonomyID" : 671144, - "sequence" : [ - "MSAPPIYKACYSGVPVYEFNCKNVAVMKRRSDSWMNATQILKVANFDKPQRTRILEREVQKGTHEKVQGG", - "YGKYQGTWIPMERSVELARQYRIELLLDPIINYLPGPQSPPLAPKHATNVGSRARKSTAPAAQTLPSTSK", - "VFHPLSSTKHPAKLAAATNAKAEISDGEDASIPSSPSFKSNSSRTPSPIRINARKRKLEDEATIPSSAID", - "GSISYEDIILDYFISESTQIPALLIHPPSDFNPNMSIDDEGHTAMHWACAMGKVRVVKLLLSAGADIFRV", - "NHSEQTALMRSVMFSNNYDIRKFPQLYELLHRSTLNLDKHDRTVLHHIVDLALTKSKTHAARYYMECVLS", - "KLANYPDELADVINFQDDEGESALTLAARARSKRLVKLLLEHGADSKLPNKDGKTAEDYILEDERFRQSP", - "LLNSNHLRLHPPDTSIYAPPAHLFNSETSQNIANTSMSSVANLLESLAQSYDKEITQKERDYQQAQVILR", - "NIKTDIVEAKSNIEKMTIDSSEFEHLKHKLRELEMKLEEHSNDVYNKGWEEYSRNVDDPAIDAPSDNVQE", - "ECASLRNKIKDLQEKRISSMQELIKRQKEVGTGKKMSEYRKLISVGCGIPTTEIDAVLEMLLESLESENA", - "NKKAALASGISGALSSTSSAPSQATTSAPTGVATPGAPVPASSEKAGLLPPAPVMQ"] - } -] +[ + { "name" : "MBP1_SCHPO", + "RefSeqID" : "NP_593032", + "UniProtID" : "P41412", + "taxonomyID" : 284812, + "sequence" : [ + "MAPRSSAVHVAVYSGVEVYECFIKGVSVMRRRRDSWLNATQILKVADFDKPQRTRVLERQVQIGAHEKVQ", + "GGYGKYQGTWVPFQRGVDLATKYKVDGIMSPILSLDIDEGKAIAPKKKQTKQKKPSVRGRRGRKPSSLSS", + "STLHSVNEKQPNSSISPTIESSMNKVNLPGAEEQVSATPLPASPNALLSPNDNTIKPVEELGMLEAPLDK", + "YEESLLDFFLHPEEGRIPSFLYSPPPDFQVNSVIDDDGHTSLHWACSMGHIEMIKLLLRANADIGVCNRL", + "SQTPLMRSVIFTNNYDCQTFGQVLELLQSTIYAVDTNGQSIFHHIVQSTSTPSKVAAAKYYLDCILEKLI", + "SIQPFENVVRLVNLQDSNGDTSLLIAARNGAMDCVNSLLSYNANPSIPNRQRRTASEYLLEADKKPHSLL", + "QSNSNASHSAFSFSGISPAIISPSCSSHAFVKAIPSISSKFSQLAEEYESQLREKEEDLIRANRLKQDTL", + "NEISRTYQELTFLQKNNPTYSQSMENLIREAQETYQQLSKRLLIWLEARQIFDLERSLKPHTSLSISFPS", + "DFLKKEDGLSLNNDFKKPACNNVTNSDEYEQLINKLTSLQASRKKDTLYIRKLYEELGIDDTVNSYRRLI", + "AMSCGINPEDLSLEILDAVEEALTREK"] + }, + { "name" : "MBP1_ASPNI", + "RefSeqID" : "XP_660758", + "UniProtID" : "Q5B8H6", + "taxonomyID" : 227321, + "sequence" : [ + "MAAVDFSNVYSATYSSVPVYEFKIGTDSVMRRRSDDWINATHILKVAGFDKPARTRILEREVQKGVHEKV", + "QGGYGKYQGTWIPLQEGRQLAERNNILDKLLPIFDYVAGDRSPPPAPKHTSAASKPRAPKINKRVVKEDV", + "FSAVNHHRSMGPPSFHHEHYDVNTGLDEDESIEQATLESSSMIADEDMISMSQNGPYSSRKRKRGINEVA", + "AMSLSEQEHILYGDQLLDYFMTVGDAPEATRIPPPQPPANFQVDRPIDDSGNTALHWACAMGDLEIVKDL", + "LRRGADMKALSIHEETPLVRAVLFTNNYEKRTFPALLDLLLDTISFRDWFGATLFHHIAQTTKSKGKWKS", + "SRYYCEVALEKLRTTFSPEEVDLLLSCQDSVGDTAVLVAARNGVFRLVDLLLSRCPRAGDLVNKRGETAS", + "SIMQRAHLAERDIPPPPSSITMGNDHIDGEVGAPTSLEPQSVTLHHESSPATAQLLSQIGAIMAEASRKL", + "TSSYGAAKPSQKDSDDVANPEALYEQLEQDRQKIRRQYDALAAKEAAEESSDAQLGRYEQMRDNYESLLE", + "QIQRARLKERLASTPVPTQTAVIGSSSPEQDRLLTTFQLSRALCSEQKIRRAAVKELAQQRADAGVSTKF", + "DVHRKLVALATGLKEEELDPMAAELAETLEFDRMNGKGVGPESPEADHKDSASLPFPGPVVSVDA"] + }, + { "name" : "MBP1_BIPOR", + "RefSeqID" : "XP_007682304", + "UniProtID" : "W6ZM86", + "taxonomyID" : 930090, + "sequence" : [ + "MPPAPDGKIYSATYSNVPVYECNVNGHHVMRRRADDWINATHILKVADYDKPARTRILEREVQKGVHEKV", + "QGGYGKYQGTWIPLEEGRGLAERNGVLDKMRAIFDYVPGDRSPPPAPKHATAASNRMKPPRQTAAAVAAA", + "AVAAAAAAAAVANHNALMSNSRSQASEDPYENSQRSQIYREDTPDNETVISESMLGDADLMDMSQYSADG", + "NRKRKRGMDQMSLLDQQHQIWADQLLDYFMLLDHEAAVSWPEPPPSINLDRPIDEKGHAAMHWAAAMGDV", + "GVVKELIHRGARLDCLSNNLETPLMRAVMFTNNFDKETMPSMVKIFQQTVHRTDWFGSTVFHHIAATTSS", + "SNKYVCARWYLDCIINKLSETWIPEEVTRLLNAADQNGDTAIMIAARNGARKCVRSLLGRNVAVDIPNKK", + "GETADDLIRELNQRRRMHGRTRQASSSPFAPAPEHRLNGHVPHFDGGPLMSVPVPSMAVRESVQYRSQTA", + "SHLMTKVAPTLLEKCEELATAYEAELQEKEAEFFDAERVVKRRQAELEAVRKQVAELQSMSKGLHIDLND", + "EEAERQQEDELRLLVEEAESLLEIEQKAELRRLCSSMPQQNSDSSPVDITEKMRLALLLHRAQLERRELV", + "REVVGNLSVAGMSEKQGTYKKLIAKALGEREEDVESMLPEILQELEEAETQERAEGLDGSPV"] + }, + { "name" : "MBP1_NEUCR", + "RefSeqID" : "XP_955821", + "UniProtID" : "Q7RW59", + "taxonomyID" : 367110, + "sequence" : [ + "MVKENVGGNPEPGIYSATYSGIPVWEYQFGVDLKEHVMRRRHDDWVNATHILKAAGFDKPARTRILEREV", + "QKDTHEKIQGGYGRYQGTWIPLEQAEALARRNNIYERLKPIFEFQPGNESPPPAPRHASKPKAPKVKPAV", + "PTWGSKSAKNANPPQPGTFLPPGRKGLPAQAPDYNDADTHMHDDDTPDNLTVASASYMAEDDRYDHSHFS", + "TGHRKRKRDELIEDMTEQQHAVYGDELLDYFLLSRNEQPAVRPDPPPNFKPDWPIDNERHTCLHWASAMG", + "DVDVMRQLKKFGASLDAQNVRGETPFMRAVNFTNCFEKQTFPQVMKELFSTIDCRDLSGCTVIHHAAVMK", + "IGRVNSQSCSRYYLDIILNRLQETHHPEFVQQLLDAQDNDGNTAVHLAAMRDARKCIRALLGRGASTDIP", + "NKQGIRAEELIKELNASISKSRSNLPQRSSSPFAPDTQRHDAFHEAISESMVTSRKNSQPNYSSDAANTV", + "QNRITPLVLQKLKDLTATYDSEFKEKDDAEKEARRILNKTQSELKALTASIDDYNSRLDTDDVAAKTAAE", + "MATARHKVLAFVTHQNRISVQEAVKQELAALDRANAVTNGTSTKSKSSSPSKKPKLSPIPDQKDKPPKDE", + "NETESEAEHPDPPAAQAHQQQPGPSSQDTEVEDQDREEEEDDYTHRLSLAAELRSILQEQRSAENDYVEA", + "RGMLGTGERIDKYKHLLMSCLPPDEQENLEENLEEMIKLMEQEDESVTDLPAGAVGGGGGGNAADGSGGG", + "GQPSNGRRESVLPALRGGNGDGEMSRRGSRTAAAAAAQVDGEREINGRAGAERTERIQEIAAV"] + }, + { "name" : "MBP1_COPCI", + "RefSeqID" : "XP_001837394", + "UniProtID" : "A8NYC6", + "taxonomyID" : 240176, + "sequence" : [ + "MPEAQIFKATYSGIPVYEMMCKGVAVMRRRSDSWLNATQILKVAGFDKPQRTRVLEREVQKGEHEKVQGG", + "YGKYQGTWIPLERGMQLAKQYNCEHLLRPIIEFTPAAKSPPLAPKHLVATAGNRPVRKPLTTDLSAAVIN", + "TRSTRKQVADGVGEESDHDTHSLRGSEDGSMTPSPSEASSSSRTPSPIHSPGTYHSNGLDGPSSGGRNRY", + "RQSNDRYDEDDDASRHNGMGDPRSYGDQILEYFISDTNQIPPILITPPPDFDPNMAIDDDGHTSLHWACA", + "MGRIRIVKLLLSAGADIFKVNKAGQTALMRSVMFANNYDVRKFPELYELLHRSTLNIDNSNRTVFHHVVD", + "VAMSKGKTHAARYYMETILTRLADYPKELADVINFQDEDGETALTMAARCRSKRLVKLLIDHGADPKINN", + "HDGKNAEDYILEDERFRSSPAPSSRVAAMSYRNAQVAYPPPGAPSTYSFAPANHDRPPLHYSAAAQKAST", + "RCVNDMASMLDSLAASFDQELRDKERDMAQAQALLTNIQAEILESQRTVLQLRQQAEGLSQAKQRLADLE", + "NALQDKMGRRYRLGFEKWIKDEETREKVIRDAANGDLVLTPATTSYTVDEDGDSDSGSNGDKNKGKRKAQ", + "VQQEEVSDLVELYSNIPTDPEELRKQCEALREEVSQSRKRRKAMFDELVTFQAEAGTSGRMSDYRRLIAA", + "GCGGLEPLEIDSVLGMLLETLEAEDPSSTSATWSGSKGQQTG"] + }, + { "name" : "MBP1_CRYNE", + "RefSeqID" : "XP_569090", + "UniProtID" : "Q5KMQ9", + "taxonomyID" : 214684, + "sequence" : [ + "MGKKVIASGGDNGPNTIYKATYSGVPVYEMVCRDVAVMRRRSDAYLNATQILKVAGFDKPQRTRVLEREV", + "QKGEHEKVQGGYGKYQGTWIPIERGLALAKQYGVEDILRPIIDYVPTSVSPPPAPKHSVAPPSKARRDKE", + "KETGRTKATPSRTGPTSAAALQAQAQLNRAKMHDSTPDADASFRSFEERVSLTPEDDSSSDTPSPVASVM", + "TDQDMEVDKMGMHMSMPNVTLSQNMEELGAGSRKRSAAMMMEDEDQFGQLRSIRGNSAVHTPHGTPRHLG", + "IGMPPEPIGPEQYTDIILNYFVSETSQIPSILVSPPHDFDPNAPIDDDGHTALHWACAMGRVRVVKLLLT", + "AGASIFAGNNAEQTPLMRSVMFSNNYDMRKFPELYELLHRSTLNIDKQNRTVFHHIANLALTKGKTHAAK", + "YYMETILARLADYPQELADVINFQDEEGETALTIAARARSRRLVKALLDHGANPKIKNRDSRSAEDYILE", + "DERFRSSPVPAPNGGIGKASTSAAAEKPLFAPQLYFSEAARLCGGQALTDITSHMQSLARSFDAELQGKE", + "RDILQAKALLTNIHTEVTENGRSITAITNQAAPLEEKRRELEALQASLKTRVKDALKKGYIGWLEGELVR", + "EQRWENGELEGNEEEKAAVQALRDVPTGGQEVVQAEEEKLRWEIEEKRKRRAMFVEKFVRAQTEAGTSEQ", + "IAKYRKLVSAGLGGVSTNEVDELMNQLLEGLEEENDNQVYNTTAGESGPSSWVQ"] + }, + { "name" : "MBP1_PUCGR", + "RefSeqID" : "XP_003327086", + "UniProtID" : "E3KED4", + "taxonomyID" : 418459, + "sequence" : [ + "MAYGGSIQPLRPPSRESATLHLHQPDLTVTSPPLSLTHCPPCVYSHFTHTPTSLIVIQVSLHSLLDQETY", + "HLLPSRSPPTVSVRMGTTTIYKATYSGVPVLEMPCEGIAVMRRRSDSWLNATQILKVAGFDKPQRTRVLE", + "REIQKGTHEKIQGGYGKYQGTWVPLDRGIDLAKQYGVDHLLSALFNFQPSSNESPPLAPKHVTALSTRVK", + "VSKVSAASAARAARAVVPSLPSTSGLGGRNTNNSWSNFDSDNEPGLPPAASSRESNGNWATQSKLARSSN", + "LARARANINNSHPEDLPVPAPDQLQASPLPSMQTADPENDNSLTPSELSLPSRTPSPIEDLPLTVNTASS", + "QSTRNKGKSRDLPDDEDLSRGQKRKYDTSLVEDTSYSDGADDQYINGNPSNAASAKYAKLILDYFVSESS", + "QIPNFLNDPPSDFDPNVVIDDDGHTALHWACAMGRIKIIKLLLTCGADIFRANNAGQTALMRAVMFTNNH", + "DLRTFPELFESFSGSVINIDRTDRTVFHYVIDIALTKGKVPAARYYLETILSQLSEYPKELIDILNFQDE", + "DGETALTLAARCRSKKLVKILLDHGANPKTANRDGKSAEDYILEDDKFRALSPTPCSSGPIRQLDQNSPG", + "GTSNRSDFVDLVDPVPIDSNLIPQRSPNASPPHYSETGQRVTKQLLPEVTSMIELLATTFDTELQDKERD", + "LDHAVGLLSNIEKEYLEGQRKILNYERMLSDFGEKKLALGDLEKELNDKLGKRYRFGWEKYVRDEEERAR", + "RITEQRSKYLQELSIEDRKLLDSSNLRFADPSKQEVLMKLQADERENSDLLNLIRTNSTDVESECDLLRE", + "SVQKLSEERERLFKEFINLSSENTGGENEEDDGANHTSANTSRLNNYRKLISLGCGGIGLDEVDEVIESL", + "NEGIDVNELNDNGFLTEQDEELGNHQNYHNIHTQGR"] + }, + { "name" : "MBP1_USTMA", + "RefSeqID" : "XP_011392621", + "UniProtID" : "A0A0D1DP35", + "taxonomyID" : 237631, + "sequence" : [ + "MSGDKTIFKATYSGVPVYECIINNVAVMRRRSDDWLNATQILKVVGLDKPQRTRVLEREIQKGIHEKVQG", + "GYGKYQGTWIPLDVAIELAERYNIQGLLQPITSYVPSAADSPPPAPKHTISTSNRSKKIIPADPGALGRS", + "RRATSIETESEVIGAAPNNVSEGSMSPSPSDISSSSRTPSPLPADRAHPLHANHALAGYNGRDANNHARY", + "ADIILDYFVTENTTVPSLLINPPPDFNPDMSIDDDEHTALHWACAMGRIRVVKLLLSAGADIFRVNSNQQ", + "TALMRATMFSNNYDLRKFPELFELLHRSILNIDRNDRTVFHHVVDLALSRGKPHAARYYMETMINRLADY", + "GDQLADILNFQDDEGETPLTMAARARSKRLVRLLLEHGADPKIRNKEGKNAEDYIIEDERFRSSPSRTGP", + "AGIELGADGLPVLPTSSLHTSEAGQRTAGRAVTLMSNLLHSLADSYDSEINTAEKKLTQAHGLLKQIQTE", + "IEDSAKVAEALHHEAQGVDEERKRVDSLQLALKHAINKRARDDLERRWSEGKQAIKRARLQAGLEPGALS", + "TSNATNAPATGDQKSKDDAKSLIEALPAGTNVKTAIAELRKQLSQVQANKTELVDKFVARAREQGTGRTM", + "AAYRRLIAAGCGGIAPDEVDAVVGVLCELLQESHTGARAGAGGERDDRARDVAMMLKGAGAAALAANAGA", + "P"] + }, + { "name" : "MBP1_WALME", + "RefSeqID" : "XP_006957051", + "UniProtID" : "I4YGC0", + "taxonomyID" : 671144, + "sequence" : [ + "MSAPPIYKACYSGVPVYEFNCKNVAVMKRRSDSWMNATQILKVANFDKPQRTRILEREVQKGTHEKVQGG", + "YGKYQGTWIPMERSVELARQYRIELLLDPIINYLPGPQSPPLAPKHATNVGSRARKSTAPAAQTLPSTSK", + "VFHPLSSTKHPAKLAAATNAKAEISDGEDASIPSSPSFKSNSSRTPSPIRINARKRKLEDEATIPSSAID", + "GSISYEDIILDYFISESTQIPALLIHPPSDFNPNMSIDDEGHTAMHWACAMGKVRVVKLLLSAGADIFRV", + "NHSEQTALMRSVMFSNNYDIRKFPQLYELLHRSTLNLDKHDRTVLHHIVDLALTKSKTHAARYYMECVLS", + "KLANYPDELADVINFQDDEGESALTLAARARSKRLVKLLLEHGADSKLPNKDGKTAEDYILEDERFRQSP", + "LLNSNHLRLHPPDTSIYAPPAHLFNSETSQNIANTSMSSVANLLESLAQSYDKEITQKERDYQQAQVILR", + "NIKTDIVEAKSNIEKMTIDSSEFEHLKHKLRELEMKLEEHSNDVYNKGWEEYSRNVDDPAIDAPSDNVQE", + "ECASLRNKIKDLQEKRISSMQELIKRQKEVGTGKKMSEYRKLISVGCGIPTTEIDAVLEMLLESLESENA", + "NKKAALASGISGALSSTSSAPSQATTSAPTGVATPGAPVPASSEKAGLLPPAPVMQ"] + } +] diff --git a/data/refTaxonomy.json b/data/refTaxonomy.json index 8da18b2..cc8272e 100644 --- a/data/refTaxonomy.json +++ b/data/refTaxonomy.json @@ -1,22 +1,22 @@ -[ - { "ID" : 227321, - "species" : "Aspergillus nidulans FGSC A4"}, - { "ID" : 930090, - "species" : "Bipolaris oryzae ATCC 44560"}, - { "ID" : 240176, - "species" : "Coprinopsis cinerea okayama7#130"}, - { "ID" : 214684, - "species" : "Cryptococcus neoformans var. neoformans JEC21"}, - { "ID" : 367110, - "species" : "Neurospora crassa OR74A"}, - { "ID" : 418459, - "species" : "Puccinia graminis f. sp. tritici CRL 75-36-700-3"}, - { "ID" : 559292, - "species" : "Saccharomyces cerevisiae S288C"}, - { "ID" : 284812, - "species" : "Schizosaccharomyces pombe 972h-"}, - { "ID" : 237631, - "species" : "Ustilago maydis 521"}, - { "ID" : 671144, - "species" : "Wallemia mellicola CBS 633.66"} -] +[ + { "ID" : 227321, + "species" : "Aspergillus nidulans FGSC A4"}, + { "ID" : 930090, + "species" : "Bipolaris oryzae ATCC 44560"}, + { "ID" : 240176, + "species" : "Coprinopsis cinerea okayama7#130"}, + { "ID" : 214684, + "species" : "Cryptococcus neoformans var. neoformans JEC21"}, + { "ID" : 367110, + "species" : "Neurospora crassa OR74A"}, + { "ID" : 418459, + "species" : "Puccinia graminis f. sp. tritici CRL 75-36-700-3"}, + { "ID" : 559292, + "species" : "Saccharomyces cerevisiae S288C"}, + { "ID" : 284812, + "species" : "Schizosaccharomyces pombe 972h-"}, + { "ID" : 237631, + "species" : "Ustilago maydis 521"}, + { "ID" : 671144, + "species" : "Wallemia mellicola CBS 633.66"} +] diff --git a/data/referenceDomainAnnotations.txt b/data/referenceDomainAnnotations.txt index c8d58d6..be47276 100644 --- a/data/referenceDomainAnnotations.txt +++ b/data/referenceDomainAnnotations.txt @@ -1,115 +1,115 @@ -ID protein.ID feature.ID start end note -# MBP1_SACCE -NA ref_pro_4 ref_ftr_1 4 102 APSES fold -NA ref_pro_4 ref_ftr_2 22 105 KilA-N -NA ref_pro_4 ref_ftr_4 108 122 low complexity -NA ref_pro_4 ref_ftr_4 236 241 low complexity -NA ref_pro_4 ref_ftr_4 279 307 low complexity -NA ref_pro_4 ref_ftr_4 700 717 low complexity -NA ref_pro_4 ref_ftr_4 700 717 low complexity -NA ref_pro_4 ref_ftr_5 394 423 Ankyrin -NA ref_pro_4 ref_ftr_5 427 463 Ankyrin -NA ref_pro_4 ref_ftr_5 512 541 Ankyrin -NA ref_pro_4 ref_ftr_6 381 547 Swi6 fold -NA ref_pro_4 ref_ftr_7 633 655 coiled coil -# MBP1_ASPNI -NA ref_pro_1 ref_ftr_1 9 106 APSES fold -NA ref_pro_1 ref_ftr_2 26 109 KilA-N -NA ref_pro_1 ref_ftr_4 529 534 low complexity -NA ref_pro_1 ref_ftr_5 260 289 Ankyrin -NA ref_pro_1 ref_ftr_5 381 413 Ankyrin -NA ref_pro_1 ref_ftr_6 193 402 Swi6 fold -NA ref_pro_1 ref_ftr_7 509 572 coiled coil -# MBP1_BIPOR -NA ref_pro_2 ref_ftr_1 8 106 APSES fold -NA ref_pro_2 ref_ftr_2 26 109 KilA-N -NA ref_pro_2 ref_ftr_4 134 152 low complexity -NA ref_pro_2 ref_ftr_4 267 278 low complexity -NA ref_pro_2 ref_ftr_4 670 685 low complexity -NA ref_pro_2 ref_ftr_5 266 295 Ankyrin -NA ref_pro_2 ref_ftr_5 387 416 Ankyrin -NA ref_pro_2 ref_ftr_6 253 421 Swi6 fold -NA ref_pro_2 ref_ftr_7 659 681 coiled coil -NA ref_pro_2 ref_ftr_7 500 590 coiled coil -# MBP1_NEUCR -NA ref_pro_3 ref_ftr_1 14 114 APSES fold -NA ref_pro_3 ref_ftr_2 34 117 KilA-N -NA ref_pro_3 ref_ftr_4 130 141 low complexity -NA ref_pro_3 ref_ftr_4 253 266 low complexity -NA ref_pro_3 ref_ftr_4 514 525 low complexity -NA ref_pro_3 ref_ftr_4 554 564 low complexity -NA ref_pro_3 ref_ftr_4 601 618 low complexity -NA ref_pro_3 ref_ftr_4 620 629 low complexity -NA ref_pro_3 ref_ftr_4 636 652 low complexity -NA ref_pro_3 ref_ftr_4 658 672 low complexity -NA ref_pro_3 ref_ftr_4 725 735 low complexity -NA ref_pro_3 ref_ftr_4 752 771 low complexity -NA ref_pro_3 ref_ftr_5 268 297 Ankyrin -NA ref_pro_3 ref_ftr_5 390 419 Ankyrin -NA ref_pro_3 ref_ftr_6 270 426 Swi6 fold -NA ref_pro_3 ref_ftr_7 500 550 coiled coil -# MBP1_SCHPO -NA ref_pro_5 ref_ftr_1 8 104 APSES fold -NA ref_pro_5 ref_ftr_2 25 113 KilA-N -NA ref_pro_5 ref_ftr_4 111 125 low complexity -NA ref_pro_5 ref_ftr_4 136 145 low complexity -NA ref_pro_5 ref_ftr_4 176 191 low complexity -NA ref_pro_5 ref_ftr_4 422 447 low complexity -NA ref_pro_5 ref_ftr_5 247 276 Ankyrin -NA ref_pro_5 ref_ftr_5 368 397 Ankyrin -NA ref_pro_5 ref_ftr_6 234 400 Swi6 fold -NA ref_pro_5 ref_ftr_7 457 538 coiled coil -# MBP1_COPCI -NA ref_pro_6 ref_ftr_1 5 103 APSES fold -NA ref_pro_6 ref_ftr_2 23 106 KilA-N -NA ref_pro_6 ref_ftr_4 170 191 low complexity -NA ref_pro_6 ref_ftr_4 435 450 low complexity -NA ref_pro_6 ref_ftr_4 611 626 low complexity -NA ref_pro_6 ref_ftr_5 270 299 Ankyrin -NA ref_pro_6 ref_ftr_5 389 418 Ankyrin -NA ref_pro_6 ref_ftr_5 474 509 Ankyrin -NA ref_pro_6 ref_ftr_6 257 429 Swi6 fold -NA ref_pro_6 ref_ftr_7 500 570 coiled coil -NA ref_pro_6 ref_ftr_7 651 678 coiled coil -# MBP1_CRYNE -NA ref_pro_7 ref_ftr_1 113 211 APSES fold -NA ref_pro_7 ref_ftr_2 131 215 KilA-N -NA ref_pro_7 ref_ftr_4 66 85 low complexity -NA ref_pro_7 ref_ftr_4 413 423 low complexity -NA ref_pro_7 ref_ftr_4 633 644 low complexity -NA ref_pro_7 ref_ftr_4 697 709 low complexity -NA ref_pro_7 ref_ftr_5 477 506 Ankyrin -NA ref_pro_7 ref_ftr_5 618 647 Ankyrin -NA ref_pro_7 ref_ftr_6 452 663 Swi6 fold -# MBP1_PUCGR -NA ref_pro_8 ref_ftr_1 90 187 APSES fold -NA ref_pro_8 ref_ftr_2 107 190 KilA-N -NA ref_pro_8 ref_ftr_4 208 227 low complexity -NA ref_pro_8 ref_ftr_4 273 291 low complexity -NA ref_pro_8 ref_ftr_5 442 271 Ankyrin -NA ref_pro_8 ref_ftr_5 475 509 Ankyrin -NA ref_pro_8 ref_ftr_5 561 590 Ankyrin -NA ref_pro_8 ref_ftr_6 429 601 Swi6 fold -NA ref_pro_8 ref_ftr_7 827 863 coiled coil -# MBP1_USTMA -NA ref_pro_9 ref_ftr_1 7 104 APSES fold -NA ref_pro_9 ref_ftr_2 24 107 KilA-N -NA ref_pro_9 ref_ftr_4 106 116 low complexity -NA ref_pro_9 ref_ftr_4 161 183 low complexity -NA ref_pro_9 ref_ftr_4 657 672 low complexity -NA ref_pro_9 ref_ftr_4 776 796 low complexity -NA ref_pro_9 ref_ftr_5 245 274 Ankyrin -NA ref_pro_9 ref_ftr_5 355 384 Ankyrin -NA ref_pro_9 ref_ftr_6 232 395 Swi6 fold -NA ref_pro_9 ref_ftr_7 581 609 coiled coil -# MBP1_WALME -NA ref_pro_10 ref_ftr_1 6 103 APSES fold -NA ref_pro_10 ref_ftr_2 23 106 KilA-N -NA ref_pro_10 ref_ftr_4 149 162 low complexity -NA ref_pro_10 ref_ftr_4 171 188 low complexity -NA ref_pro_10 ref_ftr_4 618 628 low complexity -NA ref_pro_10 ref_ftr_4 634 660 low complexity -NA ref_pro_10 ref_ftr_5 250 279 Ankyrin -NA ref_pro_10 ref_ftr_5 369 398 Ankyrin -NA ref_pro_10 ref_ftr_6 237 409 Swi6 fold -NA ref_pro_10 ref_ftr_7 461 585 coiled coil +ID protein.ID feature.ID start end note +# MBP1_SACCE +NA ref_pro_4 ref_ftr_1 4 102 APSES fold +NA ref_pro_4 ref_ftr_2 22 105 KilA-N +NA ref_pro_4 ref_ftr_4 108 122 low complexity +NA ref_pro_4 ref_ftr_4 236 241 low complexity +NA ref_pro_4 ref_ftr_4 279 307 low complexity +NA ref_pro_4 ref_ftr_4 700 717 low complexity +NA ref_pro_4 ref_ftr_4 700 717 low complexity +NA ref_pro_4 ref_ftr_5 394 423 Ankyrin +NA ref_pro_4 ref_ftr_5 427 463 Ankyrin +NA ref_pro_4 ref_ftr_5 512 541 Ankyrin +NA ref_pro_4 ref_ftr_6 381 547 Swi6 fold +NA ref_pro_4 ref_ftr_7 633 655 coiled coil +# MBP1_ASPNI +NA ref_pro_1 ref_ftr_1 9 106 APSES fold +NA ref_pro_1 ref_ftr_2 26 109 KilA-N +NA ref_pro_1 ref_ftr_4 529 534 low complexity +NA ref_pro_1 ref_ftr_5 260 289 Ankyrin +NA ref_pro_1 ref_ftr_5 381 413 Ankyrin +NA ref_pro_1 ref_ftr_6 193 402 Swi6 fold +NA ref_pro_1 ref_ftr_7 509 572 coiled coil +# MBP1_BIPOR +NA ref_pro_2 ref_ftr_1 8 106 APSES fold +NA ref_pro_2 ref_ftr_2 26 109 KilA-N +NA ref_pro_2 ref_ftr_4 134 152 low complexity +NA ref_pro_2 ref_ftr_4 267 278 low complexity +NA ref_pro_2 ref_ftr_4 670 685 low complexity +NA ref_pro_2 ref_ftr_5 266 295 Ankyrin +NA ref_pro_2 ref_ftr_5 387 416 Ankyrin +NA ref_pro_2 ref_ftr_6 253 421 Swi6 fold +NA ref_pro_2 ref_ftr_7 659 681 coiled coil +NA ref_pro_2 ref_ftr_7 500 590 coiled coil +# MBP1_NEUCR +NA ref_pro_3 ref_ftr_1 14 114 APSES fold +NA ref_pro_3 ref_ftr_2 34 117 KilA-N +NA ref_pro_3 ref_ftr_4 130 141 low complexity +NA ref_pro_3 ref_ftr_4 253 266 low complexity +NA ref_pro_3 ref_ftr_4 514 525 low complexity +NA ref_pro_3 ref_ftr_4 554 564 low complexity +NA ref_pro_3 ref_ftr_4 601 618 low complexity +NA ref_pro_3 ref_ftr_4 620 629 low complexity +NA ref_pro_3 ref_ftr_4 636 652 low complexity +NA ref_pro_3 ref_ftr_4 658 672 low complexity +NA ref_pro_3 ref_ftr_4 725 735 low complexity +NA ref_pro_3 ref_ftr_4 752 771 low complexity +NA ref_pro_3 ref_ftr_5 268 297 Ankyrin +NA ref_pro_3 ref_ftr_5 390 419 Ankyrin +NA ref_pro_3 ref_ftr_6 270 426 Swi6 fold +NA ref_pro_3 ref_ftr_7 500 550 coiled coil +# MBP1_SCHPO +NA ref_pro_5 ref_ftr_1 8 104 APSES fold +NA ref_pro_5 ref_ftr_2 25 113 KilA-N +NA ref_pro_5 ref_ftr_4 111 125 low complexity +NA ref_pro_5 ref_ftr_4 136 145 low complexity +NA ref_pro_5 ref_ftr_4 176 191 low complexity +NA ref_pro_5 ref_ftr_4 422 447 low complexity +NA ref_pro_5 ref_ftr_5 247 276 Ankyrin +NA ref_pro_5 ref_ftr_5 368 397 Ankyrin +NA ref_pro_5 ref_ftr_6 234 400 Swi6 fold +NA ref_pro_5 ref_ftr_7 457 538 coiled coil +# MBP1_COPCI +NA ref_pro_6 ref_ftr_1 5 103 APSES fold +NA ref_pro_6 ref_ftr_2 23 106 KilA-N +NA ref_pro_6 ref_ftr_4 170 191 low complexity +NA ref_pro_6 ref_ftr_4 435 450 low complexity +NA ref_pro_6 ref_ftr_4 611 626 low complexity +NA ref_pro_6 ref_ftr_5 270 299 Ankyrin +NA ref_pro_6 ref_ftr_5 389 418 Ankyrin +NA ref_pro_6 ref_ftr_5 474 509 Ankyrin +NA ref_pro_6 ref_ftr_6 257 429 Swi6 fold +NA ref_pro_6 ref_ftr_7 500 570 coiled coil +NA ref_pro_6 ref_ftr_7 651 678 coiled coil +# MBP1_CRYNE +NA ref_pro_7 ref_ftr_1 113 211 APSES fold +NA ref_pro_7 ref_ftr_2 131 215 KilA-N +NA ref_pro_7 ref_ftr_4 66 85 low complexity +NA ref_pro_7 ref_ftr_4 413 423 low complexity +NA ref_pro_7 ref_ftr_4 633 644 low complexity +NA ref_pro_7 ref_ftr_4 697 709 low complexity +NA ref_pro_7 ref_ftr_5 477 506 Ankyrin +NA ref_pro_7 ref_ftr_5 618 647 Ankyrin +NA ref_pro_7 ref_ftr_6 452 663 Swi6 fold +# MBP1_PUCGR +NA ref_pro_8 ref_ftr_1 90 187 APSES fold +NA ref_pro_8 ref_ftr_2 107 190 KilA-N +NA ref_pro_8 ref_ftr_4 208 227 low complexity +NA ref_pro_8 ref_ftr_4 273 291 low complexity +NA ref_pro_8 ref_ftr_5 442 271 Ankyrin +NA ref_pro_8 ref_ftr_5 475 509 Ankyrin +NA ref_pro_8 ref_ftr_5 561 590 Ankyrin +NA ref_pro_8 ref_ftr_6 429 601 Swi6 fold +NA ref_pro_8 ref_ftr_7 827 863 coiled coil +# MBP1_USTMA +NA ref_pro_9 ref_ftr_1 7 104 APSES fold +NA ref_pro_9 ref_ftr_2 24 107 KilA-N +NA ref_pro_9 ref_ftr_4 106 116 low complexity +NA ref_pro_9 ref_ftr_4 161 183 low complexity +NA ref_pro_9 ref_ftr_4 657 672 low complexity +NA ref_pro_9 ref_ftr_4 776 796 low complexity +NA ref_pro_9 ref_ftr_5 245 274 Ankyrin +NA ref_pro_9 ref_ftr_5 355 384 Ankyrin +NA ref_pro_9 ref_ftr_6 232 395 Swi6 fold +NA ref_pro_9 ref_ftr_7 581 609 coiled coil +# MBP1_WALME +NA ref_pro_10 ref_ftr_1 6 103 APSES fold +NA ref_pro_10 ref_ftr_2 23 106 KilA-N +NA ref_pro_10 ref_ftr_4 149 162 low complexity +NA ref_pro_10 ref_ftr_4 171 188 low complexity +NA ref_pro_10 ref_ftr_4 618 628 low complexity +NA ref_pro_10 ref_ftr_4 634 660 low complexity +NA ref_pro_10 ref_ftr_5 250 279 Ankyrin +NA ref_pro_10 ref_ftr_5 369 398 Ankyrin +NA ref_pro_10 ref_ftr_6 237 409 Swi6 fold +NA ref_pro_10 ref_ftr_7 461 585 coiled coil diff --git a/functionTemplate.R b/functionTemplate.R index d5de8e0..28e252b 100644 --- a/functionTemplate.R +++ b/functionTemplate.R @@ -1,37 +1,37 @@ -# functionTemplate.R -# -# Purpose: (General) -# -# ToDo: -# Notes: -# -# ============================================================================== - -myFunction <- function(a, b=1) { - # Purpose: - # Describe ... - # Version: - # Date: - # Author: - # - # Parameters: - # a: ... - # b: ... - # Value: - # result: ... - # Example: - - # code ... - - return(result) -} - - -# ==== TESTS ================================================================= -# Enter your function tests here... - -if (FALSE) { - # test ... -} - -# [END] +# functionTemplate.R +# +# Purpose: (General) +# +# ToDo: +# Notes: +# +# ============================================================================== + +myFunction <- function(a, b=1) { + # Purpose: + # Describe ... + # Version: + # Date: + # Author: + # + # Parameters: + # a: ... + # b: ... + # Value: + # result: ... + # Example: + + # code ... + + return(result) +} + + +# ==== TESTS ================================================================= +# Enter your function tests here... + +if (FALSE) { + # test ... +} + +# [END] diff --git a/myScripts/.myProfile.R b/myScripts/.myProfile.R index 3e1cebb..b8d9736 100644 --- a/myScripts/.myProfile.R +++ b/myScripts/.myProfile.R @@ -1,21 +1,21 @@ -# .myProfile.R -# This contains information which the course framework needs from time to time -# to personalize assignments, validate submissions etc. Make sure that -# the information correctly matches our official records. -# myEmail char A string with your eMail address. Use your official -# UofT eMail address. -# myStudentNumber numeric Your UofT student number. Take care to have this -# correct. -# -# NOTE: -# After you have updated this script, move the file to your "myScripts" folder. -# Utility scripts will look for it on the path: "./myScripts/.myProfile.R" -# -# ============================================================================== -# options(stringsAsFactors = FALSE) - -myEMail <- "yh.deng@mail.utoronto.ca" # e.g. "u.franklin@utoronto.ca" -myStudentNumber <- 1005845285 # e.g. 1003141592 -MYSPE <- "Cutaneotrichosporon oleaginosum" - -# [END] +# .myProfile.R +# This contains information which the course framework needs from time to time +# to personalize assignments, validate submissions etc. Make sure that +# the information correctly matches our official records. +# myEmail char A string with your eMail address. Use your official +# UofT eMail address. +# myStudentNumber numeric Your UofT student number. Take care to have this +# correct. +# +# NOTE: +# After you have updated this script, move the file to your "myScripts" folder. +# Utility scripts will look for it on the path: "./myScripts/.myProfile.R" +# +# ============================================================================== +# options(stringsAsFactors = FALSE) + +myEMail <- "yh.deng@mail.utoronto.ca" # e.g. "u.franklin@utoronto.ca" +myStudentNumber <- 1005845285 # e.g. 1003141592 +MYSPE <- "Cutaneotrichosporon oleaginosum" + +# [END] diff --git a/myScripts/ABC-INT-Mutation_impact-code.R b/myScripts/ABC-INT-Mutation_impact-code.R index ff5f585..51d4bf0 100644 --- a/myScripts/ABC-INT-Mutation_impact-code.R +++ b/myScripts/ABC-INT-Mutation_impact-code.R @@ -1,54 +1,51 @@ -myFA <- readFASTA("data/RAB39B_HSa_coding.fa") -myFA <- rbind(myFA, readFASTA("data/PTPN5_HSa_coding.fa")) -myFA <- rbind(myFA, readFASTA("data/PTPN11_HSa_coding.fa")) -myFA <- rbind(myFA, readFASTA("data/KRAS_HSa_coding.fa")) -rownames(myFA)<-c("RAB39B", "PTPN5", "PTPN11", "KRAS") # Assign row names - -gen_mutations <- function(seq, N) { - stats <- c() - stats <- cbind(stats, c(0, 0, 0)) - rownames(stats) <- c("silent", "missense", "nonsense") - colnames(stats) <- c("occurrences") - # Actual function - for (i in 1:217) { - # select index for mutation - working_seq <- Biostrings::DNAString(seq) - aa_seq <- Biostrings::translate(working_seq, no.init.codon = TRUE) - mut_action <- sample(c("ins", "del", "sub"), 1, TRUE) - mut_seq <- Biostrings::DNAString(seq) - if (mut_action == "sub") { - mut_index <- sample(1:length(working_seq), 1, replace = TRUE) - possible_mutations <- Biostrings::DNA_BASES - possible_mutations <- possible_mutations[possible_mutations != as.character(unlist(working_seq[mut_index]))] - mut_change <- sample(possible_mutations, 1, replace = TRUE) - mut_seq <- Biostrings::replaceLetterAt(mut_seq, mut_index, mut_change) - } else if (mut_action == "ins") { - mut_index <- sample(1:length(working_seq) - 2, 1, replace = TRUE) - possible_mutations <- Biostrings::DNA_BASES - mut_seq <- Biostrings::DNAString(paste(substring(working_seq, 1, mut_index - 1), sample(possible_mutations, 1), substring(working_seq, mut_index), sep = "")) - } else { - mut_index <- sample(1:length(working_seq), 1, replace = TRUE) - mut_seq <- mut_seq[-mut_index] - } - mut_seq <- Biostrings::DNAString(substring(mut_seq, 1, length(mut_seq) - (length(mut_seq) %% 3))) - mut_aa <- Biostrings::translate(mut_seq, no.init.codon = TRUE) - - # Note: we need silent, nonsense, and missense - mut_aa_stop <- match("*", Biostrings::as.matrix(mut_aa)) - aa_seq_stop <- match("*", Biostrings::as.matrix(aa_seq)) - if (!is.na(mut_aa_stop) & (is.na(aa_seq_stop) | mut_aa_stop < aa_seq_stop)) { - stats["nonsense", "occurrences"] <- 1 + stats["nonsense", "occurrences"] - } else if (mut_aa == aa_seq) { - stats["silent", "occurrences"] <- 1 + stats["silent", "occurrences"] - } else { - stats["missense", "occurrences"] <- 1 + stats["missense", "occurrences"] - } - } - return(stats) -} -N_test <- 1200 -gen_mutations("ATGATGATGATGATGATG", N_test) -gen_mutations("CCCCCCCCCCCCCCCCCC", N_test) -gen_mutations("TATTACTATTACTATTAC", N_test) -gen_mutations("TGGTGGTGGTGGTGGTGGTGGTGG", N_test) -gen_mutations("TGTTGTTGTTGTTGTTGTTGTTGT", N_test) +gen_mutations <- function(seq, N) { + sealKey() # See: http://steipe.biochemistry.utoronto.ca/abc/index.php/BCH441_Code_submisson_instructions + stats <- c() + stats <- cbind(stats, c(0, 0, 0)) + rownames(stats) <- c("silent", "missense", "nonsense") + colnames(stats) <- c("occurrences") + # Actual function + for (i in 1:N) { + original_seq <- Biostrings::DNAString(seq) + aa_seq <- Biostrings::translate(original_seq, no.init.codon = TRUE) + + mut_seq <- Biostrings::DNAString(seq) + mut_index <- sample(1:length(original_seq), 1, replace = TRUE) + possible_mutations <- Biostrings::DNA_BASES + possible_mutations <- possible_mutations[possible_mutations != as.character(unlist(original_seq[mut_index]))] + mut_seq <- Biostrings::replaceLetterAt(mut_seq, mut_index, sample(possible_mutations, 1, replace = TRUE)) + mut_aa <- Biostrings::translate(mut_seq, no.init.codon = TRUE) + + + term_aa <- regexpr(pattern = "\\*", aa_seq) + term_mut_aa <- as.integer(regexpr(pattern = "\\*", mut_aa)) + if ((term_aa == -1 && term_mut_aa != -1) || (term_mut_aa != -1 && term_mut_aa < term_aa)) { + stats["nonsense", "occurrences"] <- 1 + stats["nonsense", "occurrences"] + } else if (mut_aa == aa_seq) { + stats["silent", "occurrences"] <- 1 + stats["silent", "occurrences"] + } else { + stats["missense", "occurrences"] <- 1 + stats["missense", "occurrences"] + } + } + sealKey() + return(stats) +} + +gen_mutations("ATGATGATGATGATGATG", 1000) +gen_mutations("CCCCCCCCCCCCCCCCCC", 500) +gen_mutations("TATTACTATTACTATTAC", 500) +gen_mutations("TGGTGGTGGTGGTGGTGGTGGTGG", 500) +gen_mutations("TGTTGTTGTTGTTGTTGTTGTTGT", 500) +gen_mutations("TGTTGTTGTTGTTGTTGTTGTTGA", 500) + + +myFA <- readFASTA("data/RAB39B_HSa_coding.fa") +myFA <- rbind(myFA, readFASTA("data/PTPN5_HSa_coding.fa")) +myFA <- rbind(myFA, readFASTA("data/PTPN11_HSa_coding.fa")) +myFA <- rbind(myFA, readFASTA("data/KRAS_HSa_coding.fa")) +rownames(myFA)<-c("RAB39B", "PTPN5", "PTPN11", "KRAS") # Assign row names + +gen_mutations(myFA["RAB39B", 2], 10000) +gen_mutations(myFA["PTPN5", 2], 10000) +gen_mutations(myFA["PTPN11", 2], 10000) +gen_mutations(myFA["KRAS", 2], 10000) diff --git a/myScripts/BIN-Storing_data.R b/myScripts/BIN-Storing_data.R index 2aba13f..c4a3886 100644 --- a/myScripts/BIN-Storing_data.R +++ b/myScripts/BIN-Storing_data.R @@ -1,41 +1,41 @@ -# == 1.3 Task: submit for credit (part 1/2) ================================ -# == Submission - Code to add another philosopher to the datamodel: - -pID <- autoincrement(philDB$person) -immanuelKant <- data.frame(id = pID, - name = "Immanuel Kant", - born = "1724", - died = "1804", - school = "Enlightenment Philosophy") -philDB$person <- rbind(philDB$person, immanuelKant) - -bID = autoincrement(philDB$books) -immanuelKantWork <- data.frame(id = bID, - title = "Critique of Pure Reason", - published = "1781") -philDB$books <- rbind(philDB$books, immanuelKantWork) -philDB$works <- rbind(philDB$works, data.frame(id = autoincrement(philDB$works), personID = pID, bookID = bID)) - -bID = autoincrement(philDB$books) -immanuelKantWork <- data.frame(id = bID, - title = "Critique of Judgement", - published = "1790") -philDB$books <- rbind(philDB$books, immanuelKantWork) -philDB$works <- rbind(philDB$works, data.frame(id = autoincrement(philDB$works), personID = pID, bookID = bID)) - -# == Submission: Code to list the philosophical schools in alphabetical order as well as their respective books in alphabetical order. - -schools <- unique(philDB$person$school) -schools <- sort(schools) - -for (s in schools) { - cat(sprintf("%s\n", s)) - authors = which(philDB$person$school == s) - for (author in authors) { - works = which(philDB$works$personID == author) - for (work in works) { - bookId = which(philDB$books$id == philDB$works$bookID[work]) - cat(sprintf("\t%s - (%s)\n", philDB$books$title[bookId], philDB$books$published[bookId])) - } - } +# == 1.3 Task: submit for credit (part 1/2) ================================ +# == Submission - Code to add another philosopher to the datamodel: + +pID <- autoincrement(philDB$person) +immanuelKant <- data.frame(id = pID, + name = "Immanuel Kant", + born = "1724", + died = "1804", + school = "Enlightenment Philosophy") +philDB$person <- rbind(philDB$person, immanuelKant) + +bID = autoincrement(philDB$books) +immanuelKantWork <- data.frame(id = bID, + title = "Critique of Pure Reason", + published = "1781") +philDB$books <- rbind(philDB$books, immanuelKantWork) +philDB$works <- rbind(philDB$works, data.frame(id = autoincrement(philDB$works), personID = pID, bookID = bID)) + +bID = autoincrement(philDB$books) +immanuelKantWork <- data.frame(id = bID, + title = "Critique of Judgement", + published = "1790") +philDB$books <- rbind(philDB$books, immanuelKantWork) +philDB$works <- rbind(philDB$works, data.frame(id = autoincrement(philDB$works), personID = pID, bookID = bID)) + +# == Submission: Code to list the philosophical schools in alphabetical order as well as their respective books in alphabetical order. + +schools <- unique(philDB$person$school) +schools <- sort(schools) + +for (s in schools) { + cat(sprintf("%s\n", s)) + authors = which(philDB$person$school == s) + for (author in authors) { + works = which(philDB$works$personID == author) + for (work in works) { + bookId = which(philDB$books$id == philDB$works$bookID[work]) + cat(sprintf("\t%s - (%s)\n", philDB$books$title[bookId], philDB$books$published[bookId])) + } + } } \ No newline at end of file diff --git a/myScripts/CUTOLTaxonomy.json b/myScripts/CUTOLTaxonomy.json index 9025c71..999223c 100644 --- a/myScripts/CUTOLTaxonomy.json +++ b/myScripts/CUTOLTaxonomy.json @@ -1,4 +1,4 @@ -[{ - "ID": 879819, - "species": "Cutaneotrichosporon oleaginosum"} -] +[{ + "ID": 879819, + "species": "Cutaneotrichosporon oleaginosum"} +] diff --git a/myScripts/MBP1_CUTOL.json b/myScripts/MBP1_CUTOL.json index 04d300b..6c086c9 100644 --- a/myScripts/MBP1_CUTOL.json +++ b/myScripts/MBP1_CUTOL.json @@ -1,19 +1,19 @@ -[ - { "name" : "MBP1_CUTOL", - "RefSeqID" : "XP_018278493.1", - "UniProtID" : "A0A0J0XLN0", - "taxonomyID" : 879819, - "sequence" : [ - "MGKKAAAAGDGGPNTIYKATYSGVPVFEFICRNVAVMRRRSDAYLNATQILKVAGFDKPQRTRVLEREVQ", - "KGEHEKVQGGYGKYQGTWVPIERGLALAKQYNVEDLLRPIIDFVPRESVSPPPAPKHAVAPPTKRNKEPK", - "PKEGLVPIKSAGVLSGTGRHQTPDSVGEDVESEVMDDMSESQTPSPLNGTSLLPAVDERSIDGMDIDGFS", - "MMNGGGHARKRSAAMMDDEDEYEQLKRARGNSAVHTPPPPGQSPRYGGMQHPLTQDEYNDIVLNYFVSEA", - "TQIPAVMTNPPYNWDPNGIIDDDHHTALHWAAAMGRTRVIKLLLSAGARIFDKNNLDQTPLMRSVMFTNN", - "YDLRKFPEVFELLHRSTLNIDKNNRTVFHHIANLALYKGKTHAARYYMEVILSRLADYPQELADVINFAD", - "EDGETALTLAARARSKRIVKALLDHGADPKLRNRDHKSAEDYILEDERFRSSPDVMLNRTQPSAAPRNPT", - "SLGAAVFSQGLPPQLYNSEAARLASGPHSSDILQQMQALARSFEAEKLNKERDVLEAKAMLTSIHTEVND", - "AGRTLHNLGEQMKPLEAKQGELDGLVERLQSKLQKDLARGARKWKAADEGRENRWKNGDDPSQAGEDYSD", - "LPELTAIPDNAEAEEERLRGEIEKMRARRGELVTRLVKAQTQTGTTDKMAQYRRLITAGCGGDINPGEID", - "DIVGQLLDMLENEAQSGRPAPPPQAAPSWVTS"] - } -] +[ + { "name" : "MBP1_CUTOL", + "RefSeqID" : "XP_018278493.1", + "UniProtID" : "A0A0J0XLN0", + "taxonomyID" : 879819, + "sequence" : [ + "MGKKAAAAGDGGPNTIYKATYSGVPVFEFICRNVAVMRRRSDAYLNATQILKVAGFDKPQRTRVLEREVQ", + "KGEHEKVQGGYGKYQGTWVPIERGLALAKQYNVEDLLRPIIDFVPRESVSPPPAPKHAVAPPTKRNKEPK", + "PKEGLVPIKSAGVLSGTGRHQTPDSVGEDVESEVMDDMSESQTPSPLNGTSLLPAVDERSIDGMDIDGFS", + "MMNGGGHARKRSAAMMDDEDEYEQLKRARGNSAVHTPPPPGQSPRYGGMQHPLTQDEYNDIVLNYFVSEA", + "TQIPAVMTNPPYNWDPNGIIDDDHHTALHWAAAMGRTRVIKLLLSAGARIFDKNNLDQTPLMRSVMFTNN", + "YDLRKFPEVFELLHRSTLNIDKNNRTVFHHIANLALYKGKTHAARYYMEVILSRLADYPQELADVINFAD", + "EDGETALTLAARARSKRIVKALLDHGADPKLRNRDHKSAEDYILEDERFRSSPDVMLNRTQPSAAPRNPT", + "SLGAAVFSQGLPPQLYNSEAARLASGPHSSDILQQMQALARSFEAEKLNKERDVLEAKAMLTSIHTEVND", + "AGRTLHNLGEQMKPLEAKQGELDGLVERLQSKLQKDLARGARKWKAADEGRENRWKNGDDPSQAGEDYSD", + "LPELTAIPDNAEAEEERLRGEIEKMRARRGELVTRLVKAQTQTGTTDKMAQYRRLITAGCGGDINPGEID", + "DIVGQLLDMLENEAQSGRPAPPPQAAPSWVTS"] + } +] diff --git a/myScripts/README-myScripts.txt b/myScripts/README-myScripts.txt index b76c55a..536a089 100644 --- a/myScripts/README-myScripts.txt +++ b/myScripts/README-myScripts.txt @@ -1,8 +1,8 @@ -README - myScripts folder: -========================== - -The "myScripts" folder is a place to keep your personal files -safe. No files will be submitted into this folder on the GitHub, master -copy. Thefore everything you put into this folder is safe from being -inadvertently overwritten by a file with the same name that would be -downloaded in a GitHub "pull" request. +README - myScripts folder: +========================== + +The "myScripts" folder is a place to keep your personal files +safe. No files will be submitted into this folder on the GitHub, master +copy. Thefore everything you put into this folder is safe from being +inadvertently overwritten by a file with the same name that would be +downloaded in a GitHub "pull" request. diff --git a/myScripts/makeProteinDB.R b/myScripts/makeProteinDB.R index 70a9864..815f56b 100644 --- a/myScripts/makeProteinDB.R +++ b/myScripts/makeProteinDB.R @@ -1,4 +1,4 @@ -source("./scripts/ABC-createRefDB.R") - -myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./myScripts/MBP1_CUTOL.json")) -myDB <- dbAddTaxonomy(myDB, jsonlite::fromJSON("./myScripts/CUTOLtaxonomy.json")) +source("./scripts/ABC-createRefDB.R") + +myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./myScripts/MBP1_CUTOL.json")) +myDB <- dbAddTaxonomy(myDB, jsonlite::fromJSON("./myScripts/CUTOLtaxonomy.json")) diff --git a/myScripts/myScript.R b/myScripts/myScript.R index f42a47e..178b255 100644 --- a/myScripts/myScript.R +++ b/myScripts/myScript.R @@ -1,38 +1,38 @@ -# myScript.R -# -# --- As you work with this file, you can delete the instructions below -------- -# Write your notes and code experiments into this document. Save it -# from time to time - however I recommend that you do not _commit_ -# your saved version. -# -# As long as you do not _commit_ this script to version control, -# you can _pull_ updated versions of the entire project from GitHub -# by using the RStudio version control interface. However, once -# you _commit_ any file in your local version, RStudio will require -# you to resolve conflicts before you can _pull_ updates. -# --- As you work with this file, you can delete the instructions above -------- -# -## Purpose: <...> -# -# Version: <...> -# -# Date: <...> -# Author: () -# -# Versions: -# -# -# -# TODO: -# <...> -# -# ==================================================================== - - - - - - - -# [END] - +# myScript.R +# +# --- As you work with this file, you can delete the instructions below -------- +# Write your notes and code experiments into this document. Save it +# from time to time - however I recommend that you do not _commit_ +# your saved version. +# +# As long as you do not _commit_ this script to version control, +# you can _pull_ updated versions of the entire project from GitHub +# by using the RStudio version control interface. However, once +# you _commit_ any file in your local version, RStudio will require +# you to resolve conflicts before you can _pull_ updates. +# --- As you work with this file, you can delete the instructions above -------- +# +## Purpose: <...> +# +# Version: <...> +# +# Date: <...> +# Author: () +# +# Versions: +# +# +# +# TODO: +# <...> +# +# ==================================================================== + + + + + + + +# [END] + diff --git a/plottingReference.R b/plottingReference.R index fb576db..ac44aa1 100644 --- a/plottingReference.R +++ b/plottingReference.R @@ -1,1434 +1,1434 @@ -# tocID <- "plottingReference.R" -# -# Purpose: Reference to graphical output in R. -# -# -# Version: 2.1 -# -# Date: 2017 09 - 2021 09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# V 2.1 First minor updates 2021 -# V 2.0 Comprehensive reference with basic and advanced options based on -# an integrated yeast gene expression dataset. Full rewrite of most -# sections. -# V 1.1 Stylistic improvements, code polish, and additional examples -# V 1.0 Digest from "plotting reference" files -# -# ToDo: Demo 6.3.2 in parallel plots -# -# - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------------------------- -#TOC> 01 INITIALIZE 69 -#TOC> 02 THIS REFERENCE ... 74 -#TOC> 02.1 Dataset Documentation 81 -#TOC> 03 PROPORTIONS AND DISTRIBUTIONS 193 -#TOC> 03.1 barplot() 198 -#TOC> 03.2 pie() 222 -#TOC> 03.3 boxplot() 254 -#TOC> 03.4 hist() 312 -#TOC> 03.4.1 overlaying histograms 357 -#TOC> 04 THE plot() FUNCTION 400 -#TOC> 04.1 line plots 404 -#TOC> 05 ENCODING INFORMATION: SYMBOL, SIZE, COLOuR 503 -#TOC> 05.1 pch ("plotting character" symbols) 509 -#TOC> 05.1.1 Line types 684 -#TOC> 05.2 cex ("character expansion" size) 708 -#TOC> 06 COLOUR 768 -#TOC> 06.1 Colours by number 776 -#TOC> 06.2 Colours by name 794 -#TOC> 06.3 Colours as hex-triplets 820 -#TOC> 06.3.1 Inbuilt palettes 875 -#TOC> 06.3.2 Custom palettes 952 -#TOC> 06.3.3 Transparency: The Alpha Channel 1002 -#TOC> 06.4 abline(), lines() and segments() 1047 -#TOC> 07 AXES 1081 -#TOC> 08 LEGENDS 1118 -#TOC> 08.1 basic legends 1121 -#TOC> 08.2 Color bars 1125 -#TOC> 09 LAYOUT 1246 -#TOC> 10 TEXT 1281 -#TOC> 11 DRAWING ON PLOTS 1309 -#TOC> 12 IMAGES 1376 -#TOC> 13 CONTOUR LINES 1381 -#TOC> 14 3D PLOTS 1386 -#TOC> 15 GRAPHS AND NETWORKS 1391 -#TOC> 16 OTHER GRPAHICS PACKAGES 1396 -#TOC> 17 INTERACTIVE PLOTS 1420 -#TOC> 17.1 locator() 1424 -#TOC> 17.2 plotly:: 1427 -#TOC> -#TOC> ========================================================================== - - -# = 01 INITIALIZE ========================================================= - -SC <- readRDS("data/SC.rds") # <<<- execute this line first - - -# = 02 THIS REFERENCE ... ================================================= - -# This script covers basic plotting and graphical output options of R. The -# functions are demonstrated with an integrated data set of yeast gene -# expression data and annotations. - - -# == 02.1 Dataset Documentation ============================================ - -# You do not need to study the dataset in detail but it will be useful to refer -# to this documentation from time to time to understand what data is being -# plotted and what one can therefore learn from the results. - -# The integrated dataset SC is a list that contains an analysis of yeast gene -# expression profiles originally published by Pramila et al. (2002; PMID: -# 12464633) and accessible as GSE3653 on GEO -# (https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE3635). This is a -# high-resolution (5 min. interval) data set spanning two cycles of a -# synchronized yeast culture. It includes 6228 expression profiles with 25 -# time-points assigned to yeast systematic names. It is complemented with gene -# annotations taken from SGD, and augmented with a set of GO slims. GO slims -# were rerieved by navigating to https://www.yeastgenome.org/ and using the menu -# to choose Function >> Gene Ontology >> GOslim Mapping File. This downloads -# go_slim_mapping.tab which was further processed to annotate each gene with its -# corresponding GO terms. To evaluate cyclical regulation, a curve-fitting -# protocol was followed to fit a cyclical epxpression model with parameters -# amplitude, phase, frequency, exponential damping, and baseline shift. After -# fitting the profiles, correlations with the fitted model were calculated and -# the first peak of the model was determined as a marker of when the expression -# was ON in the cell-cycle. Finally, the expression peak markers were assigned -# to seven phases of the cell cycle, and GO term enrichments were computed. A -# A subset was selected with the following parameters: - -# selCCl <- -# nlsParams$A > 0.075 & # reasonably high Amplitude -# nlsParams$cor > 0.6 & # good correlation with the parametrized model -# nlsParams$f > 0.75 & # period between 0.75 ... -# nlsParams$f < 1.333 & # ... and 1.333 hours -# nlsParams$k < 0.03 & # limiting the exponential damping -# nlsParams$k > -0.001 -# sum(selCCl) # 1,297 genes in the data set show some level -# # of periodic expression-variation in the cell -# # cycle. -# -# Thus the dataset comprises numeric and categorical data -# Here are the data details: -# SC$xpr : expression profiles. Numeric matrix with 1,297 rows of genes -# ====== and 25 colums of time points in 5 minute -# intervals -# Example: -# -------- -# SC$xpr[169, 1:5] -# > t.0 t.5 t.10 t.15 t.20 -# > -0.055703429 -0.116124955 -0.135965733 -0.068665035 -0.001819363 -# -# -# SC$mdl : parametrized model. Data frame with 1,297 rows of genes -# ====== -# SC$mdl$A : model parameter: amplitude (log ratio) -# SC$mdl$phi : model parameter: phase (degrees) -# SC$mdl$f : model parameter: 1/frequency (hours) -# SC$mdl$k : model parameter: damping -# SC$mdl$B : model parameter: baseline shift -# SC$mdl$cor : correlation of observation and model -# SC$mdl$peaks : timepoint of first expression peak of model (minutes) -# -# # Example: -# -------- -# SC$mdl[169, ] -# > A phi f k B cor peaks -# > 0.1007908 -81.04413 1.012092 0.00656052 -0.01857916 0.8437175 37.52217 -# -# -# SC$ann : annotations. Data frame with 1,297 rows of genes -# ====== -# SC$ann$SGD : Saccharomyces Gene Database identifier -# SC$ann$sysName : Yeast gene systematic name -# SC$ann$stdName : The standard name under which the gene is known -# SC$ann$alias : common alias name(s) -# SC$ann$description : free-text description of the gene -# SC$ann$GO : GO IDs of the SGD GO slim subset annotated to the gene -# -# Example: -# -------- -# SC$ann[169, ] -# > SGD sysName stdName alias -# > S000002214 YDL056W MBP1 transcription factor MBP1 -# > description -# > YDL056W Transcription factor; involved in regulation [...] -# > GO -# > YDL056W GO:0005634 GO:0003677 GO:0001071 GO:0000278 -# -# SC$phases -# --------- -# Data frame with a definition of yeast cell cycle phase names and -# time-points derived from inspection of the SC$mdl$peaks distribution. -# names start ends -# 1 Sense 0 6 -# 2 Prep 6 15 -# 3 Replicate 15 30 -# 4 Assemble 30 37 -# 5 Segregate 37 43 -# 6 Duplicate 43 55 -# 7 Stabilize 55 65 -# -# SC$GO -# ----- -# Data frame with GO term information and GO term enrichment data -# SC$GO$ontology : {C|F|P} identifying the "cellular component", "molecular -# function" or "biological process" ontology -# SC$GO$GOid : Gene Ontyology ID of the term -# SC$GO$label : Short label of the term -# SC$GO$tAll : Count of times the term is annotated in any gene -# SC$GO$tCC : ... times term is annotated to a gene in this dataset -# SC$GO$t... : ... annotated to one ofg the cell-cycle phases -# SC$GO$xs... : ... enrichment factor in each cell cycle phase -# - - -# = 03 PROPORTIONS AND DISTRIBUTIONS ====================================== - -# Distributions of numeric variable characterize the values. Proportions compare values. A typical use case is to characterize a set of measurements, or compare several sets of measurements. - - -# == 03.1 barplot() ======================================================== -# Draws a bar with height proportional to a given number. - -barplot(mean(SC$xpr[ , "t.20"])) # barplot of the mean expression at t.20 - -# Barplots show only a single number. They tell us nothing about the underlying distribution. They are commonly used to compare several distributions: - -barplot(colMeans(SC$xpr[ , c("t.0", "t.20", "t.40", "t.60")])) - -# barplots take the usual plotting parameters -myPal <- colorRampPalette(c("#00FF0055", "#0066FF55", # a "palette" function - "#00FFFF55", "#CCCCAA55", - "#FF00FF55", "#FF006655", - "#FFFFFF55"), alpha = TRUE) # transparent colors - -barplot(colMeans(SC$xpr[ , 1:13]), # mean expression changes, first hour - main = "Mean expression changes", - xlab = "time points", - cex.names = 0.6, # scale column names - ylab = "Expression (log ratio)", - cex.axis = 0.8, # scale of y-axis labels - col = myPal(13)) # get 13 color values from myPal() - - -# == 03.2 pie() ============================================================ -# Generally not preferred, but simple to do - -table(SC$GO$ontology) -# Example: how many genes are anotated to the GO terms in the Cellular Component -# category? -CCids <- SC$GO$GOid[SC$GO$ontology == "C"] # get GO ids for "C" ontology -x <- unlist(strsplit(SC$ann$GO, " ")) # split GO term strings on blank-spaces - # and dump them all into one single vector -x <- x[x %in% CCids] # subset the ones in CCIDs (about 40%) - -pie(table(x), cex = 0.5) - -# This can be better visualized in a barplot -myT <- sort(table(x), decreasing = TRUE) -b <- barplot(myT, # assign the plot - we need the x-coordinates - main = "Genes annotated to GO terms in the Cellular Component Ontology", - cex.main = 0.8, - names.arg = "", # blank the names - otherwise they are - ylab = "counts", # taken from the names of the object - cex.axis = 0.8, - col = colorRampPalette(c("#CCAAFF", "#FFDDFF", "#FFFFFF"))(length(myT)), - ylim = c(0, 1.5 * max(myT))) # make space at the top - -# Add the GOids as text() -text(b, myT, # b holds the x coordinates, myT is y - labels = names(myT), # take the names from the table - names - srt = 90, # rotate to vertical - adj = c(-0.1, 0.5), # align center, top - cex = 0.5) - - -# == 03.3 boxplot() ======================================================== -# A boxplot() is almost always preferred to a barplot, since it includes an -# estimate of the distribution: - -boxplot(SC$xpr[ , "t.20"]) # boxplot of expression values at t.20 - -# What are these elements? -# Assigning the plot to a variable makes the numbers available so we can -# use them for annotation: -oPar <- par(mar = c(0.2,3,0.2,0.2)) # reduce the margins -( b <- boxplot(SC$xpr[ , "t.20"])) - -xT <- 1.3 -cT <- "#DD0000" -# outliers -myOut <- mean(b$out[b$out > b$stats[5]]) # outliers above the whiskers -myOut[2] <- mean(b$out[b$out < b$stats[1]]) # outliers below the whiskers -text(1.04, myOut, adj=c(0,0.5), cex=0.7, col=cT, "outliers") - -# whiskers -text(1.12, b$stats[1,1], adj=c(0,0.5), cex=0.7, col=cT, "min(x_i > Q1-1.5*IQR)") -text(1.12, b$stats[5,1], adj=c(0,0.5), cex=0.7, col=cT, "max(x_i < Q3+1.5*IQR)") - -# quartiles -# "min(x_i > Q1-1.5*IQR)" is "the smallest x in the data that still lies -# within 1.5 times the inter-quartile range below Q1 -text(1.23, b$stats[2,1], adj=c(0,0.5), cex=0.7, col=cT, "Q1 (lower quartile)") -text(1.23, b$stats[4,1], adj=c(0,0.5), cex=0.7, col=cT, "Q3 (upper quartile)") - -# median -text(1.23, b$stats[3,1], adj=c(0,0.5), cex=0.9, col=cT, "median") - -# the mean is not shown -text(0.79, mean(SC$xpr[,"t.20"]), adj=c(1,0.5), cex=0.7, col="#999999", "mean") - -par(oPar) # reset the margins - -# If we have datasets with more columns, each column gets its own boxplot -boxplot(SC$xpr[ , c("t.0", "t.20", "t.40", "t.60")]) - -# boxplots take the usual plotting parameters -myPal <- colorRampPalette(c("#00FF0055", "#0066FF55", # a "palette" function - "#00FFFF55", "#CCCCAA55", - "#FF00FF55", "#FF006655", - "#FFFFFF55"), alpha = TRUE) # transparent colors - -boxplot(SC$xpr[ , 1:13], # expression changes, first hour - main = "Expression levels", - xlab = "time points", - cex.axis = 0.6, # scale axis names - ylab = "Expression (log ratio)", - col = myPal(13)) # get 13 color values from myPal() - -# This plot shows that there is a noticable fluctuation of expression levels -# over the course of the first 60 minutes of the experiment. This may be due to -# these genes being selected as having cyclically varying expression profiles. - - -# == 03.4 hist() =========================================================== -# Histograms are superbly informative and one of the workhorses of our analyses. A histogram answers the question how many observations do we have in a particular range of a (continuously varying) variable. - -# Here we plot a histogram of the first expression peaks of genes, computed as -# the first peak of the fitted model for every gene in our set. We might be -# interested in whether the expression of different genes peaks continuously -# over the cycle, or whetehr there are time intervals where waves of expression -# of different genes can be observed in response to cycle-control signals. -hist(SC$mdl$peaks) - -# We can explicitly set breakpoints for the histogram: -# Here we set breaks at 4 minute intervals -( myBreaks <- seq(0, 80, by = 4) ) # Note: 21 values bound 20 intervals -hist(SC$mdl$peaks, breaks = myBreaks) - -# Assigning the output of hist() makes the values -# used in constructing the histogram accessible: - -( H <- hist(SC$mdl$peaks) ) - -# for example, we can use this to plot the actual numbers: -text(H$mids, # midpoints of the bars - H$counts, # counts -> probabilities - labels = H$counts, # add labels to each bar: count numbers - adj = c(0.5, -0.5), # text is centered on x and raised in y - cex = 0.6, - col = "#8888FF") - -# histograms take the usual plotting parameters -myPal <- colorRampPalette(c("#00FF0055", "#0066FF55", # a "palette" function - "#00FFFF55", "#CCCCAA55", - "#FF00FF55", "#FF006655", - "#FFFFFF55"), alpha = TRUE) # transparent colors - -myBreaks <- seq(0, 80, length.out = 81) # one-minute intervals -hist(SC$mdl$peaks, # gene expression first peaks - breaks = myBreaks, - main = "Timing of first peaks of during the cell-cycle", - sub = "The bimodal distribution distinguishes replication from division", - cex.sub = 0.8, - xlab = "t (min.)", - ylab = "counts", - col = myPal(81)) # get 81 color values from myPal() - - -# === 03.4.1 overlaying histograms - -# Histograms can be plotted one-over another to compare them -# Example: when do genes with different GO term annotations first peak? - -# GO:0005730 "nucleolus" -# GO:0032200 "telomere organization" -# GO:0006260 "DNA replication" -sel1 <- grep("GO:0005730", SC$ann$GO) # 103 genes -sel2 <- grep("GO:0032200", SC$ann$GO) # 32 genes -sel3 <- grep("GO:0006260", SC$ann$GO) # 67 genes - -# define breaks. This is important to make the histograms comparable -myBreaks <- seq(0, 80, by = 4) -# plot the first histogram - -hist(SC$mdl$peaks[sel1], breaks = myBreaks, - main = "Peak timing for different GO terms", - xlab = "t (min)", - ylab = "Counts", - ylim = c(0, 50), - col = "#FF007955") - -# first overlay -hist(SC$mdl$peaks[sel2], breaks = myBreaks, - col = "#00B2FF55", - add = TRUE) - -# second overlay -hist(SC$mdl$peaks[sel3], breaks = myBreaks, - col = "#7FDFC955", - add = TRUE) - -# Legend -legend("topright", - fill = c("#FF007955", "#00B2FF55", "#7FDFC955"), - legend = c("GO:0005730\n(nucleolus)\n", # "\n" is a line-break - "GO:0032200\n(telomere organization)\n", - "GO:0006260\n(DNA replication)\n"), - cex = 0.6, - bty = "n") # no box around the legend - - -# = 04 THE plot() FUNCTION ================================================ -# plot() is the workhorse of data visualization in R. But plot() is also a "generic" - i.e. different "classes" can define their own plot-methods and plot will "dispatch" the right method for a class. - - -# == 04.1 line plots ======================================================= - -# Lines are useful to visually associate ralated data points, like points in a -# sequence of events. - -# plot an expression profile: value over time -plot(SC$xpr[169, ]) - -# note the x is implied and plotted as "index", the expression values are used -# for the y-axis by default. - -# plot types -plot(SC$xpr[169, ], type = "p") # points, the default -plot(SC$xpr[169, ], type = "l") # lines -plot(SC$xpr[169, ], type = "b") # both points and lines -plot(SC$xpr[169, ], type = "c") # empty points and lines -plot(SC$xpr[169, ], type = "o") # overplotted -plot(SC$xpr[169, ], type = "s") # steps -plot(SC$xpr[169, ], type = "h") # like histogram -plot(SC$xpr[169, ], type = "n") # none - useful to create an empty frame - # to add other elements later -text(SC$xpr[169, ], colnames(SC$xpr), cex = 0.5) # ... such as labels - -# title and axis labels -iRow <- 169 -t <- seq(0, 120, by = 5) # set actual x-values -plot(t, SC$xpr[iRow, ], - type = "b", - main = "Expression profile", - sub = "Data: GSE3653 (Pramila et al. 2002)", - xlab = "time(min)", - ylab = "Expression (log ratio)") - -# adjusting font sizes -plot(t, SC$xpr[iRow, ], - type = "b", - main = "Expression profile", - sub = "Data: GSE3653 (Pramila et al. 2002)", - xlab = "time(min)", - ylab = "Expression (log ratio)", - cex.main = 1.1, # title - cex.sub = 0.6, # subtitle - cex.axis = 0.7, # axis values - cex.lab = 0.8) # axis labels - -# x and y axis ranges can be defined with a two-element vector -plot(t, SC$xpr[iRow, ], - type = "b", - xlim = c(0, 120), # tight against the values - ylim = c(-max(abs(SC$xpr[iRow, ])), - max(abs(SC$xpr[iRow, ]))), # symmetric around 0 - main = "", sub = "", xlab = "", ylab = "") -abline(h = 0, col = "#FF000044") - -# pull in annotations with sprintf() -plot(t, SC$xpr[iRow, ], - type = "b", - main = sprintf("Expression profile: %s (%s)", - SC$ann$stdName[iRow], - SC$ann$sysName[iRow]), - sub = "", xlab = "", ylab = "") - -# When exploring data, it is useful to have a standard view of data as a -# function: - -xprPlot <- function(iRow) { - t <- seq(0, 120, by=5) - yMax <- max(abs(SC$xpr[iRow, ])) * 1.1 - - plot(t, SC$xpr[iRow, ], - ylim = c(-yMax, yMax), - type = "b", - main = sprintf("Expression profile: %s (%s)", - SC$ann$stdName[iRow], - SC$ann$sysName[iRow]), - xlab = "time(min)", - ylab = "Expression (log ratio)", - cex.main = 1.1, - cex.axis = 0.7, - cex.lab = 0.8) - abline(h = 0, col = "#FF000044") -} - -xprPlot(169) -xprPlot(1124) - -# better to visualize by plotting one OVER the other. -# This is done with the function points() - -xprPlot(1124) -points(t, SC$xpr[169, ], type = "b", cex = 0.7, col = "#EE5500CC") - - - -# In general, when we plot(), we produce a "scatterplot" of X and y values. -# scatterplot: one against the other -plot(SC$xpr[169, ], SC$xpr[1124, ]) # these two profiles are anticorrelated - - -# = 05 ENCODING INFORMATION: SYMBOL, SIZE, COLOuR ========================= - -# We have many options to encode information in scatter plots (and others), in order to be able to visualize and discover patterns and relationships. The most important ones are the type of symbol to use, its size, and its color. - - - -# == 05.1 pch ("plotting character" symbols) =============================== -# There are many types of symbols available to plot points and they can all be varied by type, size, and color to present additional information. Which one to use is defined in the argument pch . The default is pch = 1: the open circle. Characters 1:20 are regular symbols: - -# reduce margins -oPar <- par(mar = c(1, 1, 1, 1)) - -# Empty plot frame ... -plot(c(0,11), c(0,11), type = "n", axes = FALSE, xlab = "", ylab = "") - -# coordinates for first 25 symbols -x1 <- c(1:10, 1:10) -y1 <- c(rep(10, 10),rep(9, 10)) -myPch <- 1:20 - -points(x1, y1, pch = myPch, cex = 1.2) - -# pch 21:25 can have different border and fill colours. Borders are defined with -# "col", fills are defined with "fill": - -x2 <- 1:5 -y2 <- rep(8,5) - -myCols <- c("#4B0055", "#00588B", "#009B95", "#53CC67", "#FDE333") - -points(x2, y2, pch=21:25, col="#708090", bg = myCols, cex = 1.8) - -# ten more symbols are defined as characters -x3 <- 1:10 -y3 <- rep(6,10) -myPch <- c(".", "o", "O", "0","a","A", "*", "+","-","|") -points(x3, y3, pch = myPch) # note: "myPCh" is a character vector while - # the other pch were identified by integers - -# The ASCII codes for characters 32 to 126 can also be used as plotting symbols -myPch <- 32:126 -x4 <- (((myPch - 32) %% 19) + 2) / 2 -y4 <- 5 - ((myPch - 32) %/% 19) -points(x4, y4, pch=32:126, col="#0055AA") - -# I don't think I have ever actually used characters as plotting characters in -# this way; it is much more straightforward to just use the text() function in -# that case, rather than having to look up which ASCII code is which character, -# and remembering which ones are available as numbers, and which ones are -# identified by the character itself. But the first twenty five I use a lot, and -# I also end up looking up their codes a lot. So here is a function to plot them for reference. You can paste it into your .Rprofile to keep it at hand: - -pchRef <- function() { - # a reference plot for the first twenty five plotting characters - - oPar <- par(mar = c(1, 1, 1, 1), mfrow = c(1, 1)) - plot(c(0,6), c(0,6), type = "n", axes = FALSE, xlab = "", ylab = "") - - x <- ((0:24) %% 5) + 1 - y <- rep(5:1, each = 5) - - idx <- 1:20 - points(x[idx], y[idx], pch = idx, cex = 2) - - idx <- 21:25 - points(x[idx], y[idx], pch = idx, cex = 2, col = "#708090", - bg=c("#CC0033AA", "#991566AA", "#662A99AA", "#323FCCAA", "#0055FFAA")) - - text(x - 0.3, y, labels = sprintf("%d:", 1:25), col = "#7766AA", cex = 0.8) - - par(oPar) -} - - -# reset margins -par(oPar) - - -# In addition to the default fonts, a large set of Hershey vector fonts is -# available which gives access to many more plotting and labeling options via -# text() -demo(Hershey) - -# Plotting other symbols: -# In the most general way, Unicode characters can be plotted as text. -# The code is passed in hexadecimal, long integer, with a negative sign. -# Here is a quarter note (Unicode: 266a) using plot() -plot(0.5,0.5, pch=-0x266aL, cex=5, xlab="", ylab="") - -# However, rendering may vary across platforms since it depends on unicode -# support. If your character can't be rendered, you'll only get an empty box. - - -# 1.1.1 Using pch to emphasize different categories - -# In general, when we plot(), we produce a "scatterplot" of X and y values. -# scatterplot: one against the other - -tRep <- c("t.15", "t.20", "t.25", "t.30") # Replication-phase time points -tDup <- c("t.40", "t.45", "t.50", "t.55") # Duplication-phase time points - -plot(rowMeans(SC$xpr[ , tRep]), rowMeans(SC$xpr[ , tDup])) - -# select top ten replication enriched GO terms -sel <- order(SC$GO$xsReplicate, decreasing = TRUE)[1:10] -SC$GO$label[sel] # what are these? -GOrep <- SC$GO$GOid[sel] # GO terms that are enriched in the Replication phase - -sel <- order(SC$GO$xsDuplicate, decreasing = TRUE)[1:10] -SC$GO$label[sel] # what are these? -GOdup <- SC$GO$GOid[sel] # GO terms that are enriched in the Duplication phase - -# define sets of genes that are annotated to one or the other GO id set -repGenes <- logical(nrow(SC$ann)) # prepare an empty vector -for (id in GOrep) { # whenever we find one of the - repGenes <- repGenes | grepl(id, SC$ann$GO) # characteristic GO IDs annotated -} # to a a gene, we put TRUE in its -sum(repGenes) # spot of the repGenes vector. -xRep <- rowMeans(SC$xpr[ repGenes, tRep]) # repGenes in the replication phase -yRep <- rowMeans(SC$xpr[ repGenes, tDup]) # repGenes in the duplication phase - -# same thing for the genes that are enriched in the duplication phase -dupGenes <- logical(nrow(SC$ann)) -for (id in GOdup) { - dupGenes <- dupGenes | grepl(id, SC$ann$GO) -} -sum(dupGenes) -xDup <- rowMeans(SC$xpr[ dupGenes, tRep]) # dupGenes in the replication phase -yDup <- rowMeans(SC$xpr[ dupGenes, tDup]) # dupGenes in the duplication phase - -# Ready to plot: -# base plot without the ref... and dup... genes -basePlot <- function(...) { - sel <- ! (repGenes | dupGenes) - m <- sprintf("Expression changes between phases (%d genes)", - nrow(SC$xpr)) - plot(rowMeans(SC$xpr[ sel, tRep]), - rowMeans(SC$xpr[ sel, tDup]), - main = m, - xlab = "Expression in Replication phase", - ylab = "Expression in Duplication phase", - cex.main = 0.9, - cex.lab = 0.8, - ...) - abline(h = 0, col = "#0088FF44") # horizontal zero - abline(v = 0, col = "#0088FF44") # vertical zero -} - -basePlot() -# plotting the rep.. and dup... sets with different pch -points(xRep, yRep, pch=24, col="#000000", bg="#FFFFFF") # white up triangle -points(xDup, yDup, pch=25, col="#000000", bg="#FFFFFF") # white down triangle - -# These are clearly different distributions, but the plot is overall too busy. - -# Using color improves the plot: -basePlot(pch=21, col="#AAAAAA", bg="#DDDDDD") -points(xRep, yRep, pch=24, col="#000000", bg="#66DDFF") -points(xDup, yDup, pch=25, col="#000000", bg="#FF77FF") - -# Even better may be to use transparent colors, to address the overlap: -basePlot(pch=19, col="#00000022") -points(xRep, yRep, pch=19, col="#33BBFF66") -points(xDup, yDup, pch=19, col="#FF44AA44") - -# this needs a legend: -legend ("bottom", - legend = c( - sprintf("%d Genes with Replication-\nenriched GO terms\n ", sum(repGenes)), - sprintf("%d Genes with Duplication-\nenriched GO terms\n ", sum(dupGenes)), - "Other Genes\n " - ), - horiz = TRUE, - pch = 19, - col = c("#33BBFF66", "#FF44AA44", "#00000022"), - cex = 0.6, - pt.cex = 1.0, - inset = 0.02, - box.col = "#DDDDDD", - bg = "#FFFFFF") - -# === 05.1.1 Line types - -# Basically all plots take arguments lty to define the line type, and lwd -# to define line width - -# empty plot ... -plot(c(0,10), c(0,10), type = "n", axes = FALSE, xlab = "", ylab = "") - -# Line type -for (i in 1:8) { - y <- 10.5-(i/2) - segments(1,y,5,y, lty=i) - text(6, y, paste("lty = ", i), col="grey60", adj=0, cex=0.75) -} - -# Line width -for (i in 1:10) { - y <- 5.5-(i/2) - segments(1,y,5,y, lwd=(0.3*i)^2) - text(6, y, paste("lwd = ", (0.3*i)^2), col="grey60", adj=0, cex=0.75) -} - - - -# == 05.2 cex ("character expansion" size) ================================= - -# The size of characters can be controlled with the cex parameter. cex takes a -# vector of numbers, mapped to the vecors of plotted elements. The usual R -# conventions of vector recycling apply, so if cex s only a single number, it is -# applied to all plotted elements. Here is an example plotting expression -# amplitudes in a comparison of pre-replication vs. replication phase -# expression. - - -tPre <- c("t.0", "t.5", "t.10") # Pre replication-phase time points -tMid <- c("t.25", "t.30", "t.35") # Midway between replication and duplication - -x <- rowMeans(SC$xpr[ , tPre]) # row means average out fluctuations -y <- rowMeans(SC$xpr[ , tMid]) -plot(x, y) - -myAmps <- SC$mdl$A # fetch the correlations of the fitted - # low correlations are not well modeled - # with a periodic function - -hist(myAmps, breaks = 40) # examine the distribution -hist(log(myAmps), breaks = 40) # sometimes log() is be better suited - # to map to symbol size - -# useful cex sizes are approximately between 0.5 and 5 -# Example: -N <- 10 -cexMin <- 0.5 -cexMax <- 5.0 -myCex <- seq(cexMax, cexMin, length.out=N) # Vector of cex values of length N -# We plot these points from largest to smallest, so we don't overplot -x1 <- runif(N) -y1 <- runif(N) -plot(x1, y1, xlim = 0:1, ylim = 0:1, xlab = "", ylab = "", pch = 16, - cex = myCex, col= colorRampPalette(c("#F4F0F8", "#3355DD"))(N)) - -# Note that the smallest cex at 0.5 is _really_ small. -points(x1[N], y1[N], cex = 3.0, col = "#FF000077") # Here it is! - -# To rescale a vector into the desired interval (lo, up) we write a little -# function. First we normalize the vector into the interval (0, 1), then we -# multiply it by up-lo, and add lo. -# - -reScale <- function(x, lo = 0, up = 1) { - return((((x-min(x)) / (max(x)-min(x))) * (up-lo)) + lo ) -} - -# with this, our coding amplitudes as plot character size becomes quite easy: -plot(x, y, pch=16, - cex = reScale(myAmps, lo=0.5, up=5), # <<<---- That's all we need - col="#4499BB22") -abline(a = 0, b = 1, col = "#DD333344") -abline(h = 0, col = "#33333344") -abline(v = 0, col = "#33333344") - -# ToDo: add titles, scale legend, and interpretation - - -# = 06 COLOUR ============================================================= - -# Colour is immensely important for data visualization, and colours in R can be -# specified by number, by name, as hex-triplets, as rgb or hsv values, and -# through several color-space specifications. The can be used individually, as -# vectors that are defined manually, and through colour palettes. And the can be -# solid and transparent. - -# == 06.1 Colours by number ================================================ -# The col=... parameter for plots is 1 by default and you can -# set it to the range 0:8. -# 0: white -# 1: black (the default) -# 2: red -# 3: green -# 4: blue -# 5: cyan -# 6: magenta -# 7: yellow -# 8: grey -barplot(rep(1,9), col=0:8, axes=FALSE, names.arg=c(0:8)) - -# As you can see, the default primary colours are garish and offend even the -# most rudimentary sense of aesthetics. Using these colors won't earn you -# respect. Fortunately we have many more sophisticated ways to define colours. - -# == 06.2 Colours by name ================================================== -# You may have noticed that "red", "green", and "blue" work for the col=... -# parameter, but you probably would not have imagined that "peachpuff", -# "firebrick" and "goldenrod" are valid as well. In fact, there are 657 named -# colours in R. Access them all by typing: -colors() - -myCols <- c( - "firebrick2", - "tomato", - "goldenrod1", - "peachpuff", - "papayawhip", - "seashell", - "whitesmoke" -) -pie(c(1, 1, 2, 3, 5, 8, 13), - col = myCols, - labels = myCols) - -# Read more about named colours (and related topics) in Melanie Frazier's pdf: -# https://www.nceas.ucsb.edu/sites/default/files/2020-04/colorPaletteCheatsheet.pdf - -# I almost never use named colours anymore but use hex-triplets instead... - - -# == 06.3 Colours as hex-triplets ========================================== -# Hex triplets in R work exactly as in HTML: a triplet of -# RGB values in two-digit hexadecimal representation. The -# first two digits specify the red value, the second two -# are for green, then blue. R accepts a fourth pair of -# digits to optionally specify the transparency - the "Alpha" channel. The -# semantics of the hex-triplet is thus "#RRGGBB" or "#RRGGBBAA". -# Read more e.g. at http://en.wikipedia.org/wiki/Web_colors - -# The function col2rgb() converts colour names to rgb values ... -col2rgb("violetred") - -# ... and rgb() converts rgb values to hex-code: -rgb(1, 0.5, 0.23) - -# to get hexcodes from names takes a bit more: divide and transpose - -rgb(t(col2rgb("violetred")/255)) - -# Here is a utility function to convert all manners of color-vectors to -# hex-triplets. You can copy it into your .Rprofile if you want to keep it at hand. - -col2hex <- function(colV, dput = FALSE, pal = FALSE, N = NULL) { - # colV a vector or scalar of color names, hex-codes or integers - # dput logical. If TRUE, character output is suitable for pasting into code. - # pal logical. If TRUE, the colors will be used in a palette. N must - # be defined in that case - # value: a vector of hex-codes of the same length, or a dput() string - - h <- rgb(t(col2rgb(colV) / 255)) - if (pal == TRUE) { - if (is.null(N)) { stop("N must be defined if pal is TRUE.") } - h <- colorRampPalette(h)(N) - } - if (dput == TRUE) { - dput(h) - return(invisible(h)) - } - return(h) -} - -# Examples: -myCols <- c( "firebrick2", "tomato", "goldenrod1", "peachpuff", - "papayawhip", "seashell", "whitesmoke") - -col2hex(myCols) -col2hex(myCols, dput = TRUE) - -# barplot with the original colors -barplot(rep(1, length(myCols)), col=myCols) - -# expanding the palette with col2hex() -N <- 40 -barplot(rep(1, N), col = col2hex(myCols,pal=TRUE,N=N) ) - - -# === 06.3.1 Inbuilt palettes - -# In R, a palette is a function (!) that takes a number as its argument and -# returns that number of colors, those colors can then be used to color points -# in a plot or other elements. In principle, such colors can serve three -# distinct puposes: - -# Qualitative colors have a different color for different types of entities. -# Here the color serves simply to distinguish the types, it represents -# "categorical information". For example, we can assign different colors to each -# individual amino acid. - -# Sequential colors distinguish order in a sequence: the colors distinguish the first from the last element in the order. For example we often color the N-terminus of a protein blue(ish) and the C-terminus red(dish). - -# Diverging colors encode some property and are scaled to represent particular -# values of the property. For example we might represent temperature with a -# black-body radiation color palette. Note that "sequential" can be seen as -# "diverging on order". - -# R has are a number of inbuilt palettes; Here is a convenience function to view -# palettes. Input can be either a palette, the name of a hcl.colors palette, or a vector of colors: -plotPal <- function(pal, N = 40) { - if (is.character(pal)) { - if (length(pal) == 1) { # name of a hcl palette - myCols <- hcl.colors(N, pal) - m <- pal - } else { # already a color vector - myCols <- colorRampPalette(pal)(N) - m <- sprintf("Custom palette (spread to %d values)", N) - } - } else { # palette function - myCols <- pal(N) - m <- as.character(substitute(pal)) - } - barplot(rep(1,N), main = m, axes = FALSE, col = myCols) -} - -plotPal(rainbow) # rainbow() is the quintessential qualitative palette -plotPal(cm.colors) # cm.colors() is sequential: cyan-white-magenta -plotPal(terrain.colors) # a diverging palette: map elevation colors - -# A lot of thought has gone into the construction of palettes in the -# colorspace:: package, now available as hcl.colors in R (hcl: hue, chroma, -# luminance), which is a better way to specify perceptually equidistant colors. -# It's worthwhile to read through the help-file for more information - -?hcl.colors -# ... and to sample the 110 available palettes: -hcl.pals() - -# Examples: -plotPal("Viridis") -plotPal("Pastel 1") -plotPal("Spectral") -plotPal("OrRd") -plotPal("Cold") -plotPal("Mint") -plotPal("Berlin") - -# If you are curious, you can execute the code below, then select the line that -# draws the plot and press ctrl+enter repeatedly to step through the entire -# set of palettes. - -# i <- 0 -# plotPal(hcl.pals()[( i<-i+1 )]) - -# Worthy of special mention are the color-Brewer palettes, in particular for -# their accessibility considerations. Do consider that not all of us view colors -# in the same way! -if (! requireNamespace("RColorBrewer", quietly = TRUE)) { - install.packages("RColorBrewer") -} -?RColorBrewer -RColorBrewer::display.brewer.all(colorblindFriendly = TRUE) - -plotPal(RColorBrewer::brewer.pal(11, "PuOr"), N = 11) - - -# === 06.3.2 Custom palettes -# -# Bespoke palettes are easily created with colorRampPalette(). The function -# returns a palette, i.e. a function (not a vector of colors). You assign the -# function to a variable (your palette), and you call it with an argument of how -# many color values you want it to return. - - -myPal <- colorRampPalette(c("#000000", "#FFFFFF", "#FF0000")) -myPal(10) -plotPal(myPal) - -# The parameter "bias" controls the spacing of colors at the end of the palette: -plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000"), bias = 0.5)) -plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000"), bias = 1.0)) -plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000"), bias = 2.0)) - -# But a similar effect can be obtained by duplicating one or more colours to -# spread the range ... -plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000", "#FF0000"))) - -# ... and this can also be used to spread the middle -plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FFFFFF", "#FF0000"))) - -# nicer pastels -myPastels <- colorRampPalette(c("#FFFFFF", - "#FF9AA2", - "#FFB7B2", - "#FFDAC1", - "#E2F0CB", - "#B5EAD7", - "#C7CEEA", - "#FFFFFF")) -plotPal(myPastels) - -# outliers -myOutliers <- colorRampPalette(c("#66666A", - "#9999A6", - "#CCCCCA", - "#EEEEF9", - "#FFBBA8", - "#F30000"), bias = 0.5) -plotPal(myOutliers) - -# Other many sources on the Web that help to generate matching colors upon which -# to build palette. One such site with a very large selection of -# community-contributed palettes is: https://color.adobe.com/ ... and there is -# also an option to extract palettes from user-supplied images. - - -# === 06.3.3 Transparency: The Alpha Channel - -# R colours are actually specified as quartets: the fourth value -# the "Alpha channel" defines the transparency. Setting this to -# values other than "FF" (the default) can be useful for very -# crowded plots, or for creating overlays. - - -x <- SC$xpr[, "t.10"] # towards the beginning of the cycle -y <- SC$xpr[, "t.50"] # towards the end of the cycle - -# compare: -plot(x,y, pch = 19, col = "#EE3A8C") -plot(x,y, pch = 19, col = "#EE3A8C12") # Alpha at ~ 10% - -# or with multiple overlays of varying size using points() ... -plot( x,y, pch = 16, cex = 1, col = "#AA330009") -points(x,y, pch = 19, cex = 2, col = "#44558803") -points(x,y, pch = 20, cex = 0.5, col = "#EE3A8C08") - -# A similar behaviour can be obtained from "density adapted colors with the -# densCols() function -plot (x, y, col = densCols(x, y), pch = 19, cex = 1.5) - - -# ... or with the smootScatter function -smoothScatter(x, y) - -smoothScatter(x, y, - colramp = colorRampPalette(c("#66666A", - "#9999A6", - "#CCCCCA", - "#EEEEF9", - "#FFBBA8", - "#F30000"), bias = 0.5), - nrpoints = 0, - xlim = c(-0.4, 0.3), - ylim = c(-0.4, 0.3), - xlab = "Expression (t = 10 min.)", - ylab = "Expression (t = 50 min.)") -abline(h = 0, col = "#FFFFFF", lwd = 0.5) -abline(v = 0, col = "#FFFFFF", lwd = 0.5) - -# ToDo: expand to "real" density plots (cf. ) - -# == 06.4 abline(), lines() and segments() ================================ - -# lines() draws an arbitrary line from the supplied points - -N <- 300 -x <- seq(0.8 * pi, 40 * pi, length.out = N) -y <- sin(x)/x -plot(x, y, type = "n") # only set up the axes -abline(h = 0) -lines(x, y, lwd = 4, col = "#FFFFFF") # "erase" parts of the axis -lines(x, y, col = "#CC0000") # draw the line we want - - -# Varying the color of a plotted line can't be done in base r. Use -# ggplot2:: or plotrix::color.scale.lines() instead - -if (! requireNamespace("plotrix", quietly = TRUE)) { - install.packages("plotrix") -} - -# plotrix::color.scale.lines() can change color as well as width of a line -# to give you more ways to visually display features of your data - -N <- 300 -x <- seq(0.8 * pi, 40 * pi, length.out = N) -y <- sin(x)/x -myCol <- myPastels(N) # colors -myLwd <- seq(0.5, 10, length.out = N) # line width - -plot(x, y, type = "n") # only set up the axes -abline(h = 0, lwd = 2, col = "#CCCCCC") - -plotrix::color.scale.lines(x, y, col = myCol, lwd = myLwd) - -# = 07 AXES =============================================================== - -# For Details, see: -?plot.default - -n <- 1000 -x <- rnorm(n) -y <- x^3 * 0.25 + rnorm(n, sd=0.75) - -plot(x,y) # Default - -# Axes -plot(x,y, xlim=c(-4, 4)) # fixed limits -plot(x,y, xlim=c(-4, 4), ylim=c(10, -10)) # reverse is possible -plot(x,y, log="xy") # log axes - -# The axis parameters in the default plot are limited. -# If you want more control, suppress the printing of an axis -# in the plot and use the axis() function instead. -?axis - - -# Axis-labels and title are straightforward parameters of plot -plot(x,y, xlab="rnorm(n)", - ylab="x^3 * 0.25 + rnorm(n, sd=0.75)", - cex.main=1.3, - main="Sample\nPlot", - cex.sub=0.75, - col.sub="grey", - sub="Scatterplot of noisy 3d-degree polynomial" - ) - -# Add gridlines -?grid -grid() - - -# = 08 LEGENDS ============================================================ - - -# == 08.1 basic legends ==================================================== -# -# ToDo: basic legend syntax - -# == 08.2 Color bars ======================================================= - -# Legends for a plot with a sequential or divergent spectrum are a special case, since we need to map a continuum of colors to a scale - -# Example: plotting expression levels in two cell-cycle phases against each other, and applying a divergent color spectrum that displays the model correlations: genes with low correlations have expression profiles that can not be well approximated with a periodic function. - - -tRep <- c("t.15", "t.20", "t.25") # Replication-phase time points -tDup <- c("t.40", "t.45", "t.50") # Duplication-phase time points -x <- rowMeans(SC$xpr[ , tRep]) -y <- rowMeans(SC$xpr[ , tDup]) -plot(x, y) - -myCors <- SC$mdl$cor -hist(myCors, breaks = 40) - -# The values are of course continuous, but we need to map them to a discrete set of colors. The strategy is as follows: -# - scale the values we wish to map into the interval [0, 1] -# - multiply with the desired number of intervals minus one, round, and add one -# - these integers can be used as indices into a vector of colors, ... -# - ... which gives the colors for the plot - -# A divergent palette -corPal <- colorRampPalette(c("#90005DAA", "#D44F99AA", "#F4C2B8AA", - "#F8DEB9AA", "#EEFAE9AA", "#D7F1C8AA", - "#BBE9C4AA", "#7CB8A6AA"), alpha = TRUE) -hist(myCors, - breaks = seq(min(myCors), max(myCors), length.out = 21), - col = corPal(20)) - -N <- 10 # We'll map into N intervals - - -#$$$ -# The usual way to scale a vector x to the [0,1] interval -# is: x-min / max-min -idx <- (myCors - min(myCors)) / (max(myCors) - min(myCors)) -# Now: expand this to N-1, round, and add 1 -idx <- round(idx * (N-1)) + 1 -# confirm that these numbers are now suitable as indices into an 1:N vector -table(idx) -# create the color vector -( corCols <- corPal(N) ) -# and make a vector of colors, one for each gene -myCols <- corCols[idx] - -# then we plot ... -plot(x, y, pch = 16, col = myCols, cex = 1.2) - -# there is a lot of overlap - let's re-plot in order of decreasing correlations -# so the low correlations (reds) get plotted last. Ordering this way will give a -# "cleaner" appearance for divergent plots. -ord <- order(myCors, decreasing = TRUE) -plot(x[ord], y[ord], pch = 16, col = myCols[ord], cex = 1.2) - -#: Titles etc. -basePlot <- function() { - m <- sprintf("Expression changes between phases (%d genes)", - length(x)) - plot(x[ord], y[ord], - main = m, - xlab = "mean Expression in Replication phase", - ylab = "mean Expression in Duplication phase", - sub = paste("Coloured by Correlation of", - "Expression Profile (xpr) to", - "Fitted Periodic Function (mdl)."), - cex.main = 0.9, - cex.lab = 0.7, - cex.sub = 0.7, - pch = 16, - col = myCols[ord], - cex = 1.2) - abline(h = 0, col = "#0088FF44") # horizontal zero - abline(v = 0, col = "#0088FF44") # vertical zero -} - -basePlot() - -# to print a color-bar legend, we use the plotrix package - -if (! requireNamespace("plotrix", quietly = TRUE)) { - install.packages("plotrix") -} - -corLabels <- sprintf("%4.2f", # craft the labels to plot - seq(min(myCors), - max(myCors), - length.out = length(corCols))) - -oPar <- par(mar=c(5,4,4,7)) # more space on the margin -par("xpd" = FALSE) -basePlot() - -# we need to figure out where to put the legend. par("usr") gives us the coordinates of the last plot window. We'll space the legend between 1.05 and 1.1 times the plot width, and centred along the y-axis with a height of 0.8 times the plot height. -dx <- par("usr")[2] - par("usr")[1] -dy <- par("usr")[4] - par("usr")[3] -xl <- par("usr")[2] + (dx * 0.05) # left -xr <- xl + (0.05 * dx) # right -yb <- par("usr")[4] - (0.9 * dy) # bottom -yt <- yb + (0.8 * dy) # top - - -plotrix::color.legend(xl, yb, xr, yt, - corLabels, - corCols, - align = "rb", # labels to the right of the bar - cex = 0.8, - gradient = "y") # vertical gradient - -# Almost perfect. Except we need a title for the color bar. -# in this case the title is "r:" ... but the "r" should be in italics. -par("xpd" = TRUE) # enable plotting into the margin -text(xr + (0.01 * dx), yt + 0.015 * dy, - expression(italic(r)["xpr,mdl"]), - adj = c(0, 0), - cex = 0.9) - -par(oPar) - -# ToDo - this is a common plot prototype - cast it into a function - -# = 09 LAYOUT ============================================================= - -# par, lattice, constant aspect ratio - - -# Most parameters of the plot window can be set via -# the functions plot(), hist() etc., but some need to -# be set via the par() function. Calling par() without -# arguments lists the current state of the plotting -# parameters. Calling it with arguments, returns the -# old parameters and sets new parameters. Thus setting -# new parameters and saving the old ones can be done -# in one step. The parameters that have to be set via -# par include: - -# - multiple plots in one window (mfrow, mfcol, mfg) -# - margin layout (mai, mar mex, oma, omd, omi) -# - controlling position and size of a plot in the figure (fig, plt, ps, pty) -# - see ?par for details. - -n <- 1000 -x <- rnorm(n) -y <- x^3 * 0.25 + rnorm(n, sd=0.75) - -# set window background and plotting axes via par -opar <- par(bg="steelblue", fg="lightyellow") -# set axis lables and titles via plot parameters -plot(x,y, col.axis="lightyellow", col.lab="lightyellow") -par(opar) # reset to old values - -plot(x,y) # confirm reset - -# aspect! ... -# - -# = 10 TEXT =============================================================== - - -# ToDo: sprintf() - -# Plotting arbitrary text -# use the text() function to plot characters and strings to coordinates -?text - -# Example: add labels to the symbols -# first set: plain symbols (1 to 20) -text(x1-0.4, y1, paste(1:20), cex=0.75) -# symbols with separate background (21 to 25) -text(x2-0.4, y2, paste(21:25), cex=0.75) -# third set: special characters, change font for clarity -text(x3-0.4, y3, extra, col="slateblue", cex=0.75, vfont=c("serif", "plain")) - - -# ToDo: writing into the margin ... -# par("mar") -# par("xpd") -# par("srt") -# -# ToDo: plotmath() # demo(plotmath) -# ToDo: expression() - - - -# = 11 DRAWING ON PLOTS =================================================== - - -# To plot lines on top of plots there are several options: - -# segments() # for lines with known endpoints -# lines() # joining x,y coordinate lists with lines -# arrows() # ... but to get a filled arrow use polygon() -# curve() # drawing a curve based on a given expression -# abline() # drawing horizontal or vertical lines or lines with -# # given slope and intercept () - - -# Example: dividing a plot into 60° regions, centred on a point. -# A general approach to "lines" on a plot is provided by segments(). -# However in this special case one can use abline(). -# We have to take care though that the aspect ratio for the -# plot is exactly 1 - otherwise our angles are not right. -# Therefore we need to set the asp parameter for plots. - -# For a general sketch -# - we plot the frame a bit larger, don't draw axes -# - draw the ablines -# - draw two arrows to symbolize the coordinate axes - -p <- c(4, 2) -plot(p[1], p[2], - xlim=c(-0.5,10.5), - ylim=c(-0.5,10.5), - xlab="", ylab="", - axes=FALSE, - asp=1.0) -abline(h=p[2], lty=2) # horizontal -abline(p[2] - (p[1]*tan(pi/3)), tan(pi/3), lty=2) # intercept, slope -abline(p[2] + (p[1]*tan(pi/3)), -tan(pi/3), lty=2) # intercept, slope -arrows(0, 0, 10, 0, length=0.1) # length of arrow -arrows(0, 0, 0, 10, length=0.1) - - -# curves() -# rect() -# polygon() - -# example: plot the area under the normal distribution as a polygon, and overlay -# a histogram -set.seed(12357) -x <- rnorm(50) -sig <- 1.0 -myBreaks <- seq(-3 * sig, 3 * sig, by = 0.5 * sig) - -# first, draw a histogram but don't show the bars -hist(x, breaks = myBreaks, freq = FALSE, col = "#FFFFFF", border = "#FFFFFF") - -# next, plot the curve as a polygon() into the existing plot area -dn <- seq(-3, 3, length.out = 100) -polygon(dn, dnorm(dn), col = "#00FF8822", border = "#FFFFFF") - -# finally, replot the histogram. Setting "add = TRUE" plots it over the -# previous histogram -hist(x, breaks = myBreaks, freq = FALSE, - col = "#0000FF22", border = "#00000033", # note: transparent colours - add = TRUE) - -# -# More: see the Index of functions for the graphics package - - -# = 12 IMAGES ============================================================= - -# Todo - - -# = 13 CONTOUR LINES ====================================================== - -# ToDo - - -# = 14 3D PLOTS =========================================================== - -# ToDo - - -# = 15 GRAPHS AND NETWORKS ================================================ - -# ToDo - - -# = 16 OTHER GRPAHICS PACKAGES ============================================ - -# Packages in the standard distribution ... -# -# graphics:: -# grid:: -# lattice:: - -# Packages that can be downloaded from CRAN -# ... use with install.packages("package"), then -# library("package") - -# hexbin:: -# ggplot2:: - -# Packages that can be downloaded from BioConductor -# prada: -# if (! requireNamespace("prada", quietly=TRUE)) { -# if (! requireNamespace("BiocManager", quietly=TRUE)) { -# install.packages("BiocManager") -# } -# BiocManager::install("prada") -# } - -# = 17 INTERACTIVE PLOTS ================================================== - -# ToDo - -# == 17.1 locator() ======================================================== -# ToDo - -# == 17.2 plotly:: ========================================================= -# ToDo - - - - -# [End] - +# tocID <- "plottingReference.R" +# +# Purpose: Reference to graphical output in R. +# +# +# Version: 2.1 +# +# Date: 2017 09 - 2021 09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# V 2.1 First minor updates 2021 +# V 2.0 Comprehensive reference with basic and advanced options based on +# an integrated yeast gene expression dataset. Full rewrite of most +# sections. +# V 1.1 Stylistic improvements, code polish, and additional examples +# V 1.0 Digest from "plotting reference" files +# +# ToDo: Demo 6.3.2 in parallel plots +# +# + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------------------------- +#TOC> 01 INITIALIZE 69 +#TOC> 02 THIS REFERENCE ... 74 +#TOC> 02.1 Dataset Documentation 81 +#TOC> 03 PROPORTIONS AND DISTRIBUTIONS 193 +#TOC> 03.1 barplot() 198 +#TOC> 03.2 pie() 222 +#TOC> 03.3 boxplot() 254 +#TOC> 03.4 hist() 312 +#TOC> 03.4.1 overlaying histograms 357 +#TOC> 04 THE plot() FUNCTION 400 +#TOC> 04.1 line plots 404 +#TOC> 05 ENCODING INFORMATION: SYMBOL, SIZE, COLOuR 503 +#TOC> 05.1 pch ("plotting character" symbols) 509 +#TOC> 05.1.1 Line types 684 +#TOC> 05.2 cex ("character expansion" size) 708 +#TOC> 06 COLOUR 768 +#TOC> 06.1 Colours by number 776 +#TOC> 06.2 Colours by name 794 +#TOC> 06.3 Colours as hex-triplets 820 +#TOC> 06.3.1 Inbuilt palettes 875 +#TOC> 06.3.2 Custom palettes 952 +#TOC> 06.3.3 Transparency: The Alpha Channel 1002 +#TOC> 06.4 abline(), lines() and segments() 1047 +#TOC> 07 AXES 1081 +#TOC> 08 LEGENDS 1118 +#TOC> 08.1 basic legends 1121 +#TOC> 08.2 Color bars 1125 +#TOC> 09 LAYOUT 1246 +#TOC> 10 TEXT 1281 +#TOC> 11 DRAWING ON PLOTS 1309 +#TOC> 12 IMAGES 1376 +#TOC> 13 CONTOUR LINES 1381 +#TOC> 14 3D PLOTS 1386 +#TOC> 15 GRAPHS AND NETWORKS 1391 +#TOC> 16 OTHER GRPAHICS PACKAGES 1396 +#TOC> 17 INTERACTIVE PLOTS 1420 +#TOC> 17.1 locator() 1424 +#TOC> 17.2 plotly:: 1427 +#TOC> +#TOC> ========================================================================== + + +# = 01 INITIALIZE ========================================================= + +SC <- readRDS("data/SC.rds") # <<<- execute this line first + + +# = 02 THIS REFERENCE ... ================================================= + +# This script covers basic plotting and graphical output options of R. The +# functions are demonstrated with an integrated data set of yeast gene +# expression data and annotations. + + +# == 02.1 Dataset Documentation ============================================ + +# You do not need to study the dataset in detail but it will be useful to refer +# to this documentation from time to time to understand what data is being +# plotted and what one can therefore learn from the results. + +# The integrated dataset SC is a list that contains an analysis of yeast gene +# expression profiles originally published by Pramila et al. (2002; PMID: +# 12464633) and accessible as GSE3653 on GEO +# (https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE3635). This is a +# high-resolution (5 min. interval) data set spanning two cycles of a +# synchronized yeast culture. It includes 6228 expression profiles with 25 +# time-points assigned to yeast systematic names. It is complemented with gene +# annotations taken from SGD, and augmented with a set of GO slims. GO slims +# were rerieved by navigating to https://www.yeastgenome.org/ and using the menu +# to choose Function >> Gene Ontology >> GOslim Mapping File. This downloads +# go_slim_mapping.tab which was further processed to annotate each gene with its +# corresponding GO terms. To evaluate cyclical regulation, a curve-fitting +# protocol was followed to fit a cyclical epxpression model with parameters +# amplitude, phase, frequency, exponential damping, and baseline shift. After +# fitting the profiles, correlations with the fitted model were calculated and +# the first peak of the model was determined as a marker of when the expression +# was ON in the cell-cycle. Finally, the expression peak markers were assigned +# to seven phases of the cell cycle, and GO term enrichments were computed. A +# A subset was selected with the following parameters: + +# selCCl <- +# nlsParams$A > 0.075 & # reasonably high Amplitude +# nlsParams$cor > 0.6 & # good correlation with the parametrized model +# nlsParams$f > 0.75 & # period between 0.75 ... +# nlsParams$f < 1.333 & # ... and 1.333 hours +# nlsParams$k < 0.03 & # limiting the exponential damping +# nlsParams$k > -0.001 +# sum(selCCl) # 1,297 genes in the data set show some level +# # of periodic expression-variation in the cell +# # cycle. +# +# Thus the dataset comprises numeric and categorical data +# Here are the data details: +# SC$xpr : expression profiles. Numeric matrix with 1,297 rows of genes +# ====== and 25 colums of time points in 5 minute +# intervals +# Example: +# -------- +# SC$xpr[169, 1:5] +# > t.0 t.5 t.10 t.15 t.20 +# > -0.055703429 -0.116124955 -0.135965733 -0.068665035 -0.001819363 +# +# +# SC$mdl : parametrized model. Data frame with 1,297 rows of genes +# ====== +# SC$mdl$A : model parameter: amplitude (log ratio) +# SC$mdl$phi : model parameter: phase (degrees) +# SC$mdl$f : model parameter: 1/frequency (hours) +# SC$mdl$k : model parameter: damping +# SC$mdl$B : model parameter: baseline shift +# SC$mdl$cor : correlation of observation and model +# SC$mdl$peaks : timepoint of first expression peak of model (minutes) +# +# # Example: +# -------- +# SC$mdl[169, ] +# > A phi f k B cor peaks +# > 0.1007908 -81.04413 1.012092 0.00656052 -0.01857916 0.8437175 37.52217 +# +# +# SC$ann : annotations. Data frame with 1,297 rows of genes +# ====== +# SC$ann$SGD : Saccharomyces Gene Database identifier +# SC$ann$sysName : Yeast gene systematic name +# SC$ann$stdName : The standard name under which the gene is known +# SC$ann$alias : common alias name(s) +# SC$ann$description : free-text description of the gene +# SC$ann$GO : GO IDs of the SGD GO slim subset annotated to the gene +# +# Example: +# -------- +# SC$ann[169, ] +# > SGD sysName stdName alias +# > S000002214 YDL056W MBP1 transcription factor MBP1 +# > description +# > YDL056W Transcription factor; involved in regulation [...] +# > GO +# > YDL056W GO:0005634 GO:0003677 GO:0001071 GO:0000278 +# +# SC$phases +# --------- +# Data frame with a definition of yeast cell cycle phase names and +# time-points derived from inspection of the SC$mdl$peaks distribution. +# names start ends +# 1 Sense 0 6 +# 2 Prep 6 15 +# 3 Replicate 15 30 +# 4 Assemble 30 37 +# 5 Segregate 37 43 +# 6 Duplicate 43 55 +# 7 Stabilize 55 65 +# +# SC$GO +# ----- +# Data frame with GO term information and GO term enrichment data +# SC$GO$ontology : {C|F|P} identifying the "cellular component", "molecular +# function" or "biological process" ontology +# SC$GO$GOid : Gene Ontyology ID of the term +# SC$GO$label : Short label of the term +# SC$GO$tAll : Count of times the term is annotated in any gene +# SC$GO$tCC : ... times term is annotated to a gene in this dataset +# SC$GO$t... : ... annotated to one ofg the cell-cycle phases +# SC$GO$xs... : ... enrichment factor in each cell cycle phase +# + + +# = 03 PROPORTIONS AND DISTRIBUTIONS ====================================== + +# Distributions of numeric variable characterize the values. Proportions compare values. A typical use case is to characterize a set of measurements, or compare several sets of measurements. + + +# == 03.1 barplot() ======================================================== +# Draws a bar with height proportional to a given number. + +barplot(mean(SC$xpr[ , "t.20"])) # barplot of the mean expression at t.20 + +# Barplots show only a single number. They tell us nothing about the underlying distribution. They are commonly used to compare several distributions: + +barplot(colMeans(SC$xpr[ , c("t.0", "t.20", "t.40", "t.60")])) + +# barplots take the usual plotting parameters +myPal <- colorRampPalette(c("#00FF0055", "#0066FF55", # a "palette" function + "#00FFFF55", "#CCCCAA55", + "#FF00FF55", "#FF006655", + "#FFFFFF55"), alpha = TRUE) # transparent colors + +barplot(colMeans(SC$xpr[ , 1:13]), # mean expression changes, first hour + main = "Mean expression changes", + xlab = "time points", + cex.names = 0.6, # scale column names + ylab = "Expression (log ratio)", + cex.axis = 0.8, # scale of y-axis labels + col = myPal(13)) # get 13 color values from myPal() + + +# == 03.2 pie() ============================================================ +# Generally not preferred, but simple to do + +table(SC$GO$ontology) +# Example: how many genes are anotated to the GO terms in the Cellular Component +# category? +CCids <- SC$GO$GOid[SC$GO$ontology == "C"] # get GO ids for "C" ontology +x <- unlist(strsplit(SC$ann$GO, " ")) # split GO term strings on blank-spaces + # and dump them all into one single vector +x <- x[x %in% CCids] # subset the ones in CCIDs (about 40%) + +pie(table(x), cex = 0.5) + +# This can be better visualized in a barplot +myT <- sort(table(x), decreasing = TRUE) +b <- barplot(myT, # assign the plot - we need the x-coordinates + main = "Genes annotated to GO terms in the Cellular Component Ontology", + cex.main = 0.8, + names.arg = "", # blank the names - otherwise they are + ylab = "counts", # taken from the names of the object + cex.axis = 0.8, + col = colorRampPalette(c("#CCAAFF", "#FFDDFF", "#FFFFFF"))(length(myT)), + ylim = c(0, 1.5 * max(myT))) # make space at the top + +# Add the GOids as text() +text(b, myT, # b holds the x coordinates, myT is y + labels = names(myT), # take the names from the table - names + srt = 90, # rotate to vertical + adj = c(-0.1, 0.5), # align center, top + cex = 0.5) + + +# == 03.3 boxplot() ======================================================== +# A boxplot() is almost always preferred to a barplot, since it includes an +# estimate of the distribution: + +boxplot(SC$xpr[ , "t.20"]) # boxplot of expression values at t.20 + +# What are these elements? +# Assigning the plot to a variable makes the numbers available so we can +# use them for annotation: +oPar <- par(mar = c(0.2,3,0.2,0.2)) # reduce the margins +( b <- boxplot(SC$xpr[ , "t.20"])) + +xT <- 1.3 +cT <- "#DD0000" +# outliers +myOut <- mean(b$out[b$out > b$stats[5]]) # outliers above the whiskers +myOut[2] <- mean(b$out[b$out < b$stats[1]]) # outliers below the whiskers +text(1.04, myOut, adj=c(0,0.5), cex=0.7, col=cT, "outliers") + +# whiskers +text(1.12, b$stats[1,1], adj=c(0,0.5), cex=0.7, col=cT, "min(x_i > Q1-1.5*IQR)") +text(1.12, b$stats[5,1], adj=c(0,0.5), cex=0.7, col=cT, "max(x_i < Q3+1.5*IQR)") + +# quartiles +# "min(x_i > Q1-1.5*IQR)" is "the smallest x in the data that still lies +# within 1.5 times the inter-quartile range below Q1 +text(1.23, b$stats[2,1], adj=c(0,0.5), cex=0.7, col=cT, "Q1 (lower quartile)") +text(1.23, b$stats[4,1], adj=c(0,0.5), cex=0.7, col=cT, "Q3 (upper quartile)") + +# median +text(1.23, b$stats[3,1], adj=c(0,0.5), cex=0.9, col=cT, "median") + +# the mean is not shown +text(0.79, mean(SC$xpr[,"t.20"]), adj=c(1,0.5), cex=0.7, col="#999999", "mean") + +par(oPar) # reset the margins + +# If we have datasets with more columns, each column gets its own boxplot +boxplot(SC$xpr[ , c("t.0", "t.20", "t.40", "t.60")]) + +# boxplots take the usual plotting parameters +myPal <- colorRampPalette(c("#00FF0055", "#0066FF55", # a "palette" function + "#00FFFF55", "#CCCCAA55", + "#FF00FF55", "#FF006655", + "#FFFFFF55"), alpha = TRUE) # transparent colors + +boxplot(SC$xpr[ , 1:13], # expression changes, first hour + main = "Expression levels", + xlab = "time points", + cex.axis = 0.6, # scale axis names + ylab = "Expression (log ratio)", + col = myPal(13)) # get 13 color values from myPal() + +# This plot shows that there is a noticable fluctuation of expression levels +# over the course of the first 60 minutes of the experiment. This may be due to +# these genes being selected as having cyclically varying expression profiles. + + +# == 03.4 hist() =========================================================== +# Histograms are superbly informative and one of the workhorses of our analyses. A histogram answers the question how many observations do we have in a particular range of a (continuously varying) variable. + +# Here we plot a histogram of the first expression peaks of genes, computed as +# the first peak of the fitted model for every gene in our set. We might be +# interested in whether the expression of different genes peaks continuously +# over the cycle, or whetehr there are time intervals where waves of expression +# of different genes can be observed in response to cycle-control signals. +hist(SC$mdl$peaks) + +# We can explicitly set breakpoints for the histogram: +# Here we set breaks at 4 minute intervals +( myBreaks <- seq(0, 80, by = 4) ) # Note: 21 values bound 20 intervals +hist(SC$mdl$peaks, breaks = myBreaks) + +# Assigning the output of hist() makes the values +# used in constructing the histogram accessible: + +( H <- hist(SC$mdl$peaks) ) + +# for example, we can use this to plot the actual numbers: +text(H$mids, # midpoints of the bars + H$counts, # counts -> probabilities + labels = H$counts, # add labels to each bar: count numbers + adj = c(0.5, -0.5), # text is centered on x and raised in y + cex = 0.6, + col = "#8888FF") + +# histograms take the usual plotting parameters +myPal <- colorRampPalette(c("#00FF0055", "#0066FF55", # a "palette" function + "#00FFFF55", "#CCCCAA55", + "#FF00FF55", "#FF006655", + "#FFFFFF55"), alpha = TRUE) # transparent colors + +myBreaks <- seq(0, 80, length.out = 81) # one-minute intervals +hist(SC$mdl$peaks, # gene expression first peaks + breaks = myBreaks, + main = "Timing of first peaks of during the cell-cycle", + sub = "The bimodal distribution distinguishes replication from division", + cex.sub = 0.8, + xlab = "t (min.)", + ylab = "counts", + col = myPal(81)) # get 81 color values from myPal() + + +# === 03.4.1 overlaying histograms + +# Histograms can be plotted one-over another to compare them +# Example: when do genes with different GO term annotations first peak? + +# GO:0005730 "nucleolus" +# GO:0032200 "telomere organization" +# GO:0006260 "DNA replication" +sel1 <- grep("GO:0005730", SC$ann$GO) # 103 genes +sel2 <- grep("GO:0032200", SC$ann$GO) # 32 genes +sel3 <- grep("GO:0006260", SC$ann$GO) # 67 genes + +# define breaks. This is important to make the histograms comparable +myBreaks <- seq(0, 80, by = 4) +# plot the first histogram + +hist(SC$mdl$peaks[sel1], breaks = myBreaks, + main = "Peak timing for different GO terms", + xlab = "t (min)", + ylab = "Counts", + ylim = c(0, 50), + col = "#FF007955") + +# first overlay +hist(SC$mdl$peaks[sel2], breaks = myBreaks, + col = "#00B2FF55", + add = TRUE) + +# second overlay +hist(SC$mdl$peaks[sel3], breaks = myBreaks, + col = "#7FDFC955", + add = TRUE) + +# Legend +legend("topright", + fill = c("#FF007955", "#00B2FF55", "#7FDFC955"), + legend = c("GO:0005730\n(nucleolus)\n", # "\n" is a line-break + "GO:0032200\n(telomere organization)\n", + "GO:0006260\n(DNA replication)\n"), + cex = 0.6, + bty = "n") # no box around the legend + + +# = 04 THE plot() FUNCTION ================================================ +# plot() is the workhorse of data visualization in R. But plot() is also a "generic" - i.e. different "classes" can define their own plot-methods and plot will "dispatch" the right method for a class. + + +# == 04.1 line plots ======================================================= + +# Lines are useful to visually associate ralated data points, like points in a +# sequence of events. + +# plot an expression profile: value over time +plot(SC$xpr[169, ]) + +# note the x is implied and plotted as "index", the expression values are used +# for the y-axis by default. + +# plot types +plot(SC$xpr[169, ], type = "p") # points, the default +plot(SC$xpr[169, ], type = "l") # lines +plot(SC$xpr[169, ], type = "b") # both points and lines +plot(SC$xpr[169, ], type = "c") # empty points and lines +plot(SC$xpr[169, ], type = "o") # overplotted +plot(SC$xpr[169, ], type = "s") # steps +plot(SC$xpr[169, ], type = "h") # like histogram +plot(SC$xpr[169, ], type = "n") # none - useful to create an empty frame + # to add other elements later +text(SC$xpr[169, ], colnames(SC$xpr), cex = 0.5) # ... such as labels + +# title and axis labels +iRow <- 169 +t <- seq(0, 120, by = 5) # set actual x-values +plot(t, SC$xpr[iRow, ], + type = "b", + main = "Expression profile", + sub = "Data: GSE3653 (Pramila et al. 2002)", + xlab = "time(min)", + ylab = "Expression (log ratio)") + +# adjusting font sizes +plot(t, SC$xpr[iRow, ], + type = "b", + main = "Expression profile", + sub = "Data: GSE3653 (Pramila et al. 2002)", + xlab = "time(min)", + ylab = "Expression (log ratio)", + cex.main = 1.1, # title + cex.sub = 0.6, # subtitle + cex.axis = 0.7, # axis values + cex.lab = 0.8) # axis labels + +# x and y axis ranges can be defined with a two-element vector +plot(t, SC$xpr[iRow, ], + type = "b", + xlim = c(0, 120), # tight against the values + ylim = c(-max(abs(SC$xpr[iRow, ])), + max(abs(SC$xpr[iRow, ]))), # symmetric around 0 + main = "", sub = "", xlab = "", ylab = "") +abline(h = 0, col = "#FF000044") + +# pull in annotations with sprintf() +plot(t, SC$xpr[iRow, ], + type = "b", + main = sprintf("Expression profile: %s (%s)", + SC$ann$stdName[iRow], + SC$ann$sysName[iRow]), + sub = "", xlab = "", ylab = "") + +# When exploring data, it is useful to have a standard view of data as a +# function: + +xprPlot <- function(iRow) { + t <- seq(0, 120, by=5) + yMax <- max(abs(SC$xpr[iRow, ])) * 1.1 + + plot(t, SC$xpr[iRow, ], + ylim = c(-yMax, yMax), + type = "b", + main = sprintf("Expression profile: %s (%s)", + SC$ann$stdName[iRow], + SC$ann$sysName[iRow]), + xlab = "time(min)", + ylab = "Expression (log ratio)", + cex.main = 1.1, + cex.axis = 0.7, + cex.lab = 0.8) + abline(h = 0, col = "#FF000044") +} + +xprPlot(169) +xprPlot(1124) + +# better to visualize by plotting one OVER the other. +# This is done with the function points() + +xprPlot(1124) +points(t, SC$xpr[169, ], type = "b", cex = 0.7, col = "#EE5500CC") + + + +# In general, when we plot(), we produce a "scatterplot" of X and y values. +# scatterplot: one against the other +plot(SC$xpr[169, ], SC$xpr[1124, ]) # these two profiles are anticorrelated + + +# = 05 ENCODING INFORMATION: SYMBOL, SIZE, COLOuR ========================= + +# We have many options to encode information in scatter plots (and others), in order to be able to visualize and discover patterns and relationships. The most important ones are the type of symbol to use, its size, and its color. + + + +# == 05.1 pch ("plotting character" symbols) =============================== +# There are many types of symbols available to plot points and they can all be varied by type, size, and color to present additional information. Which one to use is defined in the argument pch . The default is pch = 1: the open circle. Characters 1:20 are regular symbols: + +# reduce margins +oPar <- par(mar = c(1, 1, 1, 1)) + +# Empty plot frame ... +plot(c(0,11), c(0,11), type = "n", axes = FALSE, xlab = "", ylab = "") + +# coordinates for first 25 symbols +x1 <- c(1:10, 1:10) +y1 <- c(rep(10, 10),rep(9, 10)) +myPch <- 1:20 + +points(x1, y1, pch = myPch, cex = 1.2) + +# pch 21:25 can have different border and fill colours. Borders are defined with +# "col", fills are defined with "fill": + +x2 <- 1:5 +y2 <- rep(8,5) + +myCols <- c("#4B0055", "#00588B", "#009B95", "#53CC67", "#FDE333") + +points(x2, y2, pch=21:25, col="#708090", bg = myCols, cex = 1.8) + +# ten more symbols are defined as characters +x3 <- 1:10 +y3 <- rep(6,10) +myPch <- c(".", "o", "O", "0","a","A", "*", "+","-","|") +points(x3, y3, pch = myPch) # note: "myPCh" is a character vector while + # the other pch were identified by integers + +# The ASCII codes for characters 32 to 126 can also be used as plotting symbols +myPch <- 32:126 +x4 <- (((myPch - 32) %% 19) + 2) / 2 +y4 <- 5 - ((myPch - 32) %/% 19) +points(x4, y4, pch=32:126, col="#0055AA") + +# I don't think I have ever actually used characters as plotting characters in +# this way; it is much more straightforward to just use the text() function in +# that case, rather than having to look up which ASCII code is which character, +# and remembering which ones are available as numbers, and which ones are +# identified by the character itself. But the first twenty five I use a lot, and +# I also end up looking up their codes a lot. So here is a function to plot them for reference. You can paste it into your .Rprofile to keep it at hand: + +pchRef <- function() { + # a reference plot for the first twenty five plotting characters + + oPar <- par(mar = c(1, 1, 1, 1), mfrow = c(1, 1)) + plot(c(0,6), c(0,6), type = "n", axes = FALSE, xlab = "", ylab = "") + + x <- ((0:24) %% 5) + 1 + y <- rep(5:1, each = 5) + + idx <- 1:20 + points(x[idx], y[idx], pch = idx, cex = 2) + + idx <- 21:25 + points(x[idx], y[idx], pch = idx, cex = 2, col = "#708090", + bg=c("#CC0033AA", "#991566AA", "#662A99AA", "#323FCCAA", "#0055FFAA")) + + text(x - 0.3, y, labels = sprintf("%d:", 1:25), col = "#7766AA", cex = 0.8) + + par(oPar) +} + + +# reset margins +par(oPar) + + +# In addition to the default fonts, a large set of Hershey vector fonts is +# available which gives access to many more plotting and labeling options via +# text() +demo(Hershey) + +# Plotting other symbols: +# In the most general way, Unicode characters can be plotted as text. +# The code is passed in hexadecimal, long integer, with a negative sign. +# Here is a quarter note (Unicode: 266a) using plot() +plot(0.5,0.5, pch=-0x266aL, cex=5, xlab="", ylab="") + +# However, rendering may vary across platforms since it depends on unicode +# support. If your character can't be rendered, you'll only get an empty box. + + +# 1.1.1 Using pch to emphasize different categories + +# In general, when we plot(), we produce a "scatterplot" of X and y values. +# scatterplot: one against the other + +tRep <- c("t.15", "t.20", "t.25", "t.30") # Replication-phase time points +tDup <- c("t.40", "t.45", "t.50", "t.55") # Duplication-phase time points + +plot(rowMeans(SC$xpr[ , tRep]), rowMeans(SC$xpr[ , tDup])) + +# select top ten replication enriched GO terms +sel <- order(SC$GO$xsReplicate, decreasing = TRUE)[1:10] +SC$GO$label[sel] # what are these? +GOrep <- SC$GO$GOid[sel] # GO terms that are enriched in the Replication phase + +sel <- order(SC$GO$xsDuplicate, decreasing = TRUE)[1:10] +SC$GO$label[sel] # what are these? +GOdup <- SC$GO$GOid[sel] # GO terms that are enriched in the Duplication phase + +# define sets of genes that are annotated to one or the other GO id set +repGenes <- logical(nrow(SC$ann)) # prepare an empty vector +for (id in GOrep) { # whenever we find one of the + repGenes <- repGenes | grepl(id, SC$ann$GO) # characteristic GO IDs annotated +} # to a a gene, we put TRUE in its +sum(repGenes) # spot of the repGenes vector. +xRep <- rowMeans(SC$xpr[ repGenes, tRep]) # repGenes in the replication phase +yRep <- rowMeans(SC$xpr[ repGenes, tDup]) # repGenes in the duplication phase + +# same thing for the genes that are enriched in the duplication phase +dupGenes <- logical(nrow(SC$ann)) +for (id in GOdup) { + dupGenes <- dupGenes | grepl(id, SC$ann$GO) +} +sum(dupGenes) +xDup <- rowMeans(SC$xpr[ dupGenes, tRep]) # dupGenes in the replication phase +yDup <- rowMeans(SC$xpr[ dupGenes, tDup]) # dupGenes in the duplication phase + +# Ready to plot: +# base plot without the ref... and dup... genes +basePlot <- function(...) { + sel <- ! (repGenes | dupGenes) + m <- sprintf("Expression changes between phases (%d genes)", + nrow(SC$xpr)) + plot(rowMeans(SC$xpr[ sel, tRep]), + rowMeans(SC$xpr[ sel, tDup]), + main = m, + xlab = "Expression in Replication phase", + ylab = "Expression in Duplication phase", + cex.main = 0.9, + cex.lab = 0.8, + ...) + abline(h = 0, col = "#0088FF44") # horizontal zero + abline(v = 0, col = "#0088FF44") # vertical zero +} + +basePlot() +# plotting the rep.. and dup... sets with different pch +points(xRep, yRep, pch=24, col="#000000", bg="#FFFFFF") # white up triangle +points(xDup, yDup, pch=25, col="#000000", bg="#FFFFFF") # white down triangle + +# These are clearly different distributions, but the plot is overall too busy. + +# Using color improves the plot: +basePlot(pch=21, col="#AAAAAA", bg="#DDDDDD") +points(xRep, yRep, pch=24, col="#000000", bg="#66DDFF") +points(xDup, yDup, pch=25, col="#000000", bg="#FF77FF") + +# Even better may be to use transparent colors, to address the overlap: +basePlot(pch=19, col="#00000022") +points(xRep, yRep, pch=19, col="#33BBFF66") +points(xDup, yDup, pch=19, col="#FF44AA44") + +# this needs a legend: +legend ("bottom", + legend = c( + sprintf("%d Genes with Replication-\nenriched GO terms\n ", sum(repGenes)), + sprintf("%d Genes with Duplication-\nenriched GO terms\n ", sum(dupGenes)), + "Other Genes\n " + ), + horiz = TRUE, + pch = 19, + col = c("#33BBFF66", "#FF44AA44", "#00000022"), + cex = 0.6, + pt.cex = 1.0, + inset = 0.02, + box.col = "#DDDDDD", + bg = "#FFFFFF") + +# === 05.1.1 Line types + +# Basically all plots take arguments lty to define the line type, and lwd +# to define line width + +# empty plot ... +plot(c(0,10), c(0,10), type = "n", axes = FALSE, xlab = "", ylab = "") + +# Line type +for (i in 1:8) { + y <- 10.5-(i/2) + segments(1,y,5,y, lty=i) + text(6, y, paste("lty = ", i), col="grey60", adj=0, cex=0.75) +} + +# Line width +for (i in 1:10) { + y <- 5.5-(i/2) + segments(1,y,5,y, lwd=(0.3*i)^2) + text(6, y, paste("lwd = ", (0.3*i)^2), col="grey60", adj=0, cex=0.75) +} + + + +# == 05.2 cex ("character expansion" size) ================================= + +# The size of characters can be controlled with the cex parameter. cex takes a +# vector of numbers, mapped to the vecors of plotted elements. The usual R +# conventions of vector recycling apply, so if cex s only a single number, it is +# applied to all plotted elements. Here is an example plotting expression +# amplitudes in a comparison of pre-replication vs. replication phase +# expression. + + +tPre <- c("t.0", "t.5", "t.10") # Pre replication-phase time points +tMid <- c("t.25", "t.30", "t.35") # Midway between replication and duplication + +x <- rowMeans(SC$xpr[ , tPre]) # row means average out fluctuations +y <- rowMeans(SC$xpr[ , tMid]) +plot(x, y) + +myAmps <- SC$mdl$A # fetch the correlations of the fitted + # low correlations are not well modeled + # with a periodic function + +hist(myAmps, breaks = 40) # examine the distribution +hist(log(myAmps), breaks = 40) # sometimes log() is be better suited + # to map to symbol size + +# useful cex sizes are approximately between 0.5 and 5 +# Example: +N <- 10 +cexMin <- 0.5 +cexMax <- 5.0 +myCex <- seq(cexMax, cexMin, length.out=N) # Vector of cex values of length N +# We plot these points from largest to smallest, so we don't overplot +x1 <- runif(N) +y1 <- runif(N) +plot(x1, y1, xlim = 0:1, ylim = 0:1, xlab = "", ylab = "", pch = 16, + cex = myCex, col= colorRampPalette(c("#F4F0F8", "#3355DD"))(N)) + +# Note that the smallest cex at 0.5 is _really_ small. +points(x1[N], y1[N], cex = 3.0, col = "#FF000077") # Here it is! + +# To rescale a vector into the desired interval (lo, up) we write a little +# function. First we normalize the vector into the interval (0, 1), then we +# multiply it by up-lo, and add lo. +# + +reScale <- function(x, lo = 0, up = 1) { + return((((x-min(x)) / (max(x)-min(x))) * (up-lo)) + lo ) +} + +# with this, our coding amplitudes as plot character size becomes quite easy: +plot(x, y, pch=16, + cex = reScale(myAmps, lo=0.5, up=5), # <<<---- That's all we need + col="#4499BB22") +abline(a = 0, b = 1, col = "#DD333344") +abline(h = 0, col = "#33333344") +abline(v = 0, col = "#33333344") + +# ToDo: add titles, scale legend, and interpretation + + +# = 06 COLOUR ============================================================= + +# Colour is immensely important for data visualization, and colours in R can be +# specified by number, by name, as hex-triplets, as rgb or hsv values, and +# through several color-space specifications. The can be used individually, as +# vectors that are defined manually, and through colour palettes. And the can be +# solid and transparent. + +# == 06.1 Colours by number ================================================ +# The col=... parameter for plots is 1 by default and you can +# set it to the range 0:8. +# 0: white +# 1: black (the default) +# 2: red +# 3: green +# 4: blue +# 5: cyan +# 6: magenta +# 7: yellow +# 8: grey +barplot(rep(1,9), col=0:8, axes=FALSE, names.arg=c(0:8)) + +# As you can see, the default primary colours are garish and offend even the +# most rudimentary sense of aesthetics. Using these colors won't earn you +# respect. Fortunately we have many more sophisticated ways to define colours. + +# == 06.2 Colours by name ================================================== +# You may have noticed that "red", "green", and "blue" work for the col=... +# parameter, but you probably would not have imagined that "peachpuff", +# "firebrick" and "goldenrod" are valid as well. In fact, there are 657 named +# colours in R. Access them all by typing: +colors() + +myCols <- c( + "firebrick2", + "tomato", + "goldenrod1", + "peachpuff", + "papayawhip", + "seashell", + "whitesmoke" +) +pie(c(1, 1, 2, 3, 5, 8, 13), + col = myCols, + labels = myCols) + +# Read more about named colours (and related topics) in Melanie Frazier's pdf: +# https://www.nceas.ucsb.edu/sites/default/files/2020-04/colorPaletteCheatsheet.pdf + +# I almost never use named colours anymore but use hex-triplets instead... + + +# == 06.3 Colours as hex-triplets ========================================== +# Hex triplets in R work exactly as in HTML: a triplet of +# RGB values in two-digit hexadecimal representation. The +# first two digits specify the red value, the second two +# are for green, then blue. R accepts a fourth pair of +# digits to optionally specify the transparency - the "Alpha" channel. The +# semantics of the hex-triplet is thus "#RRGGBB" or "#RRGGBBAA". +# Read more e.g. at http://en.wikipedia.org/wiki/Web_colors + +# The function col2rgb() converts colour names to rgb values ... +col2rgb("violetred") + +# ... and rgb() converts rgb values to hex-code: +rgb(1, 0.5, 0.23) + +# to get hexcodes from names takes a bit more: divide and transpose - +rgb(t(col2rgb("violetred")/255)) + +# Here is a utility function to convert all manners of color-vectors to +# hex-triplets. You can copy it into your .Rprofile if you want to keep it at hand. + +col2hex <- function(colV, dput = FALSE, pal = FALSE, N = NULL) { + # colV a vector or scalar of color names, hex-codes or integers + # dput logical. If TRUE, character output is suitable for pasting into code. + # pal logical. If TRUE, the colors will be used in a palette. N must + # be defined in that case + # value: a vector of hex-codes of the same length, or a dput() string + + h <- rgb(t(col2rgb(colV) / 255)) + if (pal == TRUE) { + if (is.null(N)) { stop("N must be defined if pal is TRUE.") } + h <- colorRampPalette(h)(N) + } + if (dput == TRUE) { + dput(h) + return(invisible(h)) + } + return(h) +} + +# Examples: +myCols <- c( "firebrick2", "tomato", "goldenrod1", "peachpuff", + "papayawhip", "seashell", "whitesmoke") + +col2hex(myCols) +col2hex(myCols, dput = TRUE) + +# barplot with the original colors +barplot(rep(1, length(myCols)), col=myCols) + +# expanding the palette with col2hex() +N <- 40 +barplot(rep(1, N), col = col2hex(myCols,pal=TRUE,N=N) ) + + +# === 06.3.1 Inbuilt palettes + +# In R, a palette is a function (!) that takes a number as its argument and +# returns that number of colors, those colors can then be used to color points +# in a plot or other elements. In principle, such colors can serve three +# distinct puposes: + +# Qualitative colors have a different color for different types of entities. +# Here the color serves simply to distinguish the types, it represents +# "categorical information". For example, we can assign different colors to each +# individual amino acid. + +# Sequential colors distinguish order in a sequence: the colors distinguish the first from the last element in the order. For example we often color the N-terminus of a protein blue(ish) and the C-terminus red(dish). + +# Diverging colors encode some property and are scaled to represent particular +# values of the property. For example we might represent temperature with a +# black-body radiation color palette. Note that "sequential" can be seen as +# "diverging on order". + +# R has are a number of inbuilt palettes; Here is a convenience function to view +# palettes. Input can be either a palette, the name of a hcl.colors palette, or a vector of colors: +plotPal <- function(pal, N = 40) { + if (is.character(pal)) { + if (length(pal) == 1) { # name of a hcl palette + myCols <- hcl.colors(N, pal) + m <- pal + } else { # already a color vector + myCols <- colorRampPalette(pal)(N) + m <- sprintf("Custom palette (spread to %d values)", N) + } + } else { # palette function + myCols <- pal(N) + m <- as.character(substitute(pal)) + } + barplot(rep(1,N), main = m, axes = FALSE, col = myCols) +} + +plotPal(rainbow) # rainbow() is the quintessential qualitative palette +plotPal(cm.colors) # cm.colors() is sequential: cyan-white-magenta +plotPal(terrain.colors) # a diverging palette: map elevation colors + +# A lot of thought has gone into the construction of palettes in the +# colorspace:: package, now available as hcl.colors in R (hcl: hue, chroma, +# luminance), which is a better way to specify perceptually equidistant colors. +# It's worthwhile to read through the help-file for more information - +?hcl.colors +# ... and to sample the 110 available palettes: +hcl.pals() + +# Examples: +plotPal("Viridis") +plotPal("Pastel 1") +plotPal("Spectral") +plotPal("OrRd") +plotPal("Cold") +plotPal("Mint") +plotPal("Berlin") + +# If you are curious, you can execute the code below, then select the line that +# draws the plot and press ctrl+enter repeatedly to step through the entire +# set of palettes. + +# i <- 0 +# plotPal(hcl.pals()[( i<-i+1 )]) + +# Worthy of special mention are the color-Brewer palettes, in particular for +# their accessibility considerations. Do consider that not all of us view colors +# in the same way! +if (! requireNamespace("RColorBrewer", quietly = TRUE)) { + install.packages("RColorBrewer") +} +?RColorBrewer +RColorBrewer::display.brewer.all(colorblindFriendly = TRUE) + +plotPal(RColorBrewer::brewer.pal(11, "PuOr"), N = 11) + + +# === 06.3.2 Custom palettes +# +# Bespoke palettes are easily created with colorRampPalette(). The function +# returns a palette, i.e. a function (not a vector of colors). You assign the +# function to a variable (your palette), and you call it with an argument of how +# many color values you want it to return. + + +myPal <- colorRampPalette(c("#000000", "#FFFFFF", "#FF0000")) +myPal(10) +plotPal(myPal) + +# The parameter "bias" controls the spacing of colors at the end of the palette: +plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000"), bias = 0.5)) +plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000"), bias = 1.0)) +plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000"), bias = 2.0)) + +# But a similar effect can be obtained by duplicating one or more colours to +# spread the range ... +plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FF0000", "#FF0000"))) + +# ... and this can also be used to spread the middle +plotPal(colorRampPalette(c("#000000", "#FFFFFF", "#FFFFFF", "#FF0000"))) + +# nicer pastels +myPastels <- colorRampPalette(c("#FFFFFF", + "#FF9AA2", + "#FFB7B2", + "#FFDAC1", + "#E2F0CB", + "#B5EAD7", + "#C7CEEA", + "#FFFFFF")) +plotPal(myPastels) + +# outliers +myOutliers <- colorRampPalette(c("#66666A", + "#9999A6", + "#CCCCCA", + "#EEEEF9", + "#FFBBA8", + "#F30000"), bias = 0.5) +plotPal(myOutliers) + +# Other many sources on the Web that help to generate matching colors upon which +# to build palette. One such site with a very large selection of +# community-contributed palettes is: https://color.adobe.com/ ... and there is +# also an option to extract palettes from user-supplied images. + + +# === 06.3.3 Transparency: The Alpha Channel + +# R colours are actually specified as quartets: the fourth value +# the "Alpha channel" defines the transparency. Setting this to +# values other than "FF" (the default) can be useful for very +# crowded plots, or for creating overlays. + + +x <- SC$xpr[, "t.10"] # towards the beginning of the cycle +y <- SC$xpr[, "t.50"] # towards the end of the cycle + +# compare: +plot(x,y, pch = 19, col = "#EE3A8C") +plot(x,y, pch = 19, col = "#EE3A8C12") # Alpha at ~ 10% + +# or with multiple overlays of varying size using points() ... +plot( x,y, pch = 16, cex = 1, col = "#AA330009") +points(x,y, pch = 19, cex = 2, col = "#44558803") +points(x,y, pch = 20, cex = 0.5, col = "#EE3A8C08") + +# A similar behaviour can be obtained from "density adapted colors with the +# densCols() function +plot (x, y, col = densCols(x, y), pch = 19, cex = 1.5) + + +# ... or with the smootScatter function +smoothScatter(x, y) + +smoothScatter(x, y, + colramp = colorRampPalette(c("#66666A", + "#9999A6", + "#CCCCCA", + "#EEEEF9", + "#FFBBA8", + "#F30000"), bias = 0.5), + nrpoints = 0, + xlim = c(-0.4, 0.3), + ylim = c(-0.4, 0.3), + xlab = "Expression (t = 10 min.)", + ylab = "Expression (t = 50 min.)") +abline(h = 0, col = "#FFFFFF", lwd = 0.5) +abline(v = 0, col = "#FFFFFF", lwd = 0.5) + +# ToDo: expand to "real" density plots (cf. ) + +# == 06.4 abline(), lines() and segments() ================================ + +# lines() draws an arbitrary line from the supplied points + +N <- 300 +x <- seq(0.8 * pi, 40 * pi, length.out = N) +y <- sin(x)/x +plot(x, y, type = "n") # only set up the axes +abline(h = 0) +lines(x, y, lwd = 4, col = "#FFFFFF") # "erase" parts of the axis +lines(x, y, col = "#CC0000") # draw the line we want + + +# Varying the color of a plotted line can't be done in base r. Use +# ggplot2:: or plotrix::color.scale.lines() instead + +if (! requireNamespace("plotrix", quietly = TRUE)) { + install.packages("plotrix") +} + +# plotrix::color.scale.lines() can change color as well as width of a line +# to give you more ways to visually display features of your data + +N <- 300 +x <- seq(0.8 * pi, 40 * pi, length.out = N) +y <- sin(x)/x +myCol <- myPastels(N) # colors +myLwd <- seq(0.5, 10, length.out = N) # line width + +plot(x, y, type = "n") # only set up the axes +abline(h = 0, lwd = 2, col = "#CCCCCC") + +plotrix::color.scale.lines(x, y, col = myCol, lwd = myLwd) + +# = 07 AXES =============================================================== + +# For Details, see: +?plot.default + +n <- 1000 +x <- rnorm(n) +y <- x^3 * 0.25 + rnorm(n, sd=0.75) + +plot(x,y) # Default + +# Axes +plot(x,y, xlim=c(-4, 4)) # fixed limits +plot(x,y, xlim=c(-4, 4), ylim=c(10, -10)) # reverse is possible +plot(x,y, log="xy") # log axes + +# The axis parameters in the default plot are limited. +# If you want more control, suppress the printing of an axis +# in the plot and use the axis() function instead. +?axis + + +# Axis-labels and title are straightforward parameters of plot +plot(x,y, xlab="rnorm(n)", + ylab="x^3 * 0.25 + rnorm(n, sd=0.75)", + cex.main=1.3, + main="Sample\nPlot", + cex.sub=0.75, + col.sub="grey", + sub="Scatterplot of noisy 3d-degree polynomial" + ) + +# Add gridlines +?grid +grid() + + +# = 08 LEGENDS ============================================================ + + +# == 08.1 basic legends ==================================================== +# +# ToDo: basic legend syntax + +# == 08.2 Color bars ======================================================= + +# Legends for a plot with a sequential or divergent spectrum are a special case, since we need to map a continuum of colors to a scale + +# Example: plotting expression levels in two cell-cycle phases against each other, and applying a divergent color spectrum that displays the model correlations: genes with low correlations have expression profiles that can not be well approximated with a periodic function. + + +tRep <- c("t.15", "t.20", "t.25") # Replication-phase time points +tDup <- c("t.40", "t.45", "t.50") # Duplication-phase time points +x <- rowMeans(SC$xpr[ , tRep]) +y <- rowMeans(SC$xpr[ , tDup]) +plot(x, y) + +myCors <- SC$mdl$cor +hist(myCors, breaks = 40) + +# The values are of course continuous, but we need to map them to a discrete set of colors. The strategy is as follows: +# - scale the values we wish to map into the interval [0, 1] +# - multiply with the desired number of intervals minus one, round, and add one +# - these integers can be used as indices into a vector of colors, ... +# - ... which gives the colors for the plot + +# A divergent palette +corPal <- colorRampPalette(c("#90005DAA", "#D44F99AA", "#F4C2B8AA", + "#F8DEB9AA", "#EEFAE9AA", "#D7F1C8AA", + "#BBE9C4AA", "#7CB8A6AA"), alpha = TRUE) +hist(myCors, + breaks = seq(min(myCors), max(myCors), length.out = 21), + col = corPal(20)) + +N <- 10 # We'll map into N intervals + + +#$$$ +# The usual way to scale a vector x to the [0,1] interval +# is: x-min / max-min +idx <- (myCors - min(myCors)) / (max(myCors) - min(myCors)) +# Now: expand this to N-1, round, and add 1 +idx <- round(idx * (N-1)) + 1 +# confirm that these numbers are now suitable as indices into an 1:N vector +table(idx) +# create the color vector +( corCols <- corPal(N) ) +# and make a vector of colors, one for each gene +myCols <- corCols[idx] + +# then we plot ... +plot(x, y, pch = 16, col = myCols, cex = 1.2) + +# there is a lot of overlap - let's re-plot in order of decreasing correlations +# so the low correlations (reds) get plotted last. Ordering this way will give a +# "cleaner" appearance for divergent plots. +ord <- order(myCors, decreasing = TRUE) +plot(x[ord], y[ord], pch = 16, col = myCols[ord], cex = 1.2) + +#: Titles etc. +basePlot <- function() { + m <- sprintf("Expression changes between phases (%d genes)", + length(x)) + plot(x[ord], y[ord], + main = m, + xlab = "mean Expression in Replication phase", + ylab = "mean Expression in Duplication phase", + sub = paste("Coloured by Correlation of", + "Expression Profile (xpr) to", + "Fitted Periodic Function (mdl)."), + cex.main = 0.9, + cex.lab = 0.7, + cex.sub = 0.7, + pch = 16, + col = myCols[ord], + cex = 1.2) + abline(h = 0, col = "#0088FF44") # horizontal zero + abline(v = 0, col = "#0088FF44") # vertical zero +} + +basePlot() + +# to print a color-bar legend, we use the plotrix package + +if (! requireNamespace("plotrix", quietly = TRUE)) { + install.packages("plotrix") +} + +corLabels <- sprintf("%4.2f", # craft the labels to plot + seq(min(myCors), + max(myCors), + length.out = length(corCols))) + +oPar <- par(mar=c(5,4,4,7)) # more space on the margin +par("xpd" = FALSE) +basePlot() + +# we need to figure out where to put the legend. par("usr") gives us the coordinates of the last plot window. We'll space the legend between 1.05 and 1.1 times the plot width, and centred along the y-axis with a height of 0.8 times the plot height. +dx <- par("usr")[2] - par("usr")[1] +dy <- par("usr")[4] - par("usr")[3] +xl <- par("usr")[2] + (dx * 0.05) # left +xr <- xl + (0.05 * dx) # right +yb <- par("usr")[4] - (0.9 * dy) # bottom +yt <- yb + (0.8 * dy) # top + + +plotrix::color.legend(xl, yb, xr, yt, + corLabels, + corCols, + align = "rb", # labels to the right of the bar + cex = 0.8, + gradient = "y") # vertical gradient + +# Almost perfect. Except we need a title for the color bar. +# in this case the title is "r:" ... but the "r" should be in italics. +par("xpd" = TRUE) # enable plotting into the margin +text(xr + (0.01 * dx), yt + 0.015 * dy, + expression(italic(r)["xpr,mdl"]), + adj = c(0, 0), + cex = 0.9) + +par(oPar) + +# ToDo - this is a common plot prototype - cast it into a function + +# = 09 LAYOUT ============================================================= + +# par, lattice, constant aspect ratio + + +# Most parameters of the plot window can be set via +# the functions plot(), hist() etc., but some need to +# be set via the par() function. Calling par() without +# arguments lists the current state of the plotting +# parameters. Calling it with arguments, returns the +# old parameters and sets new parameters. Thus setting +# new parameters and saving the old ones can be done +# in one step. The parameters that have to be set via +# par include: + +# - multiple plots in one window (mfrow, mfcol, mfg) +# - margin layout (mai, mar mex, oma, omd, omi) +# - controlling position and size of a plot in the figure (fig, plt, ps, pty) +# - see ?par for details. + +n <- 1000 +x <- rnorm(n) +y <- x^3 * 0.25 + rnorm(n, sd=0.75) + +# set window background and plotting axes via par +opar <- par(bg="steelblue", fg="lightyellow") +# set axis lables and titles via plot parameters +plot(x,y, col.axis="lightyellow", col.lab="lightyellow") +par(opar) # reset to old values + +plot(x,y) # confirm reset + +# aspect! ... +# + +# = 10 TEXT =============================================================== + + +# ToDo: sprintf() + +# Plotting arbitrary text +# use the text() function to plot characters and strings to coordinates +?text + +# Example: add labels to the symbols +# first set: plain symbols (1 to 20) +text(x1-0.4, y1, paste(1:20), cex=0.75) +# symbols with separate background (21 to 25) +text(x2-0.4, y2, paste(21:25), cex=0.75) +# third set: special characters, change font for clarity +text(x3-0.4, y3, extra, col="slateblue", cex=0.75, vfont=c("serif", "plain")) + + +# ToDo: writing into the margin ... +# par("mar") +# par("xpd") +# par("srt") +# +# ToDo: plotmath() # demo(plotmath) +# ToDo: expression() + + + +# = 11 DRAWING ON PLOTS =================================================== + + +# To plot lines on top of plots there are several options: + +# segments() # for lines with known endpoints +# lines() # joining x,y coordinate lists with lines +# arrows() # ... but to get a filled arrow use polygon() +# curve() # drawing a curve based on a given expression +# abline() # drawing horizontal or vertical lines or lines with +# # given slope and intercept () + + +# Example: dividing a plot into 60° regions, centred on a point. +# A general approach to "lines" on a plot is provided by segments(). +# However in this special case one can use abline(). +# We have to take care though that the aspect ratio for the +# plot is exactly 1 - otherwise our angles are not right. +# Therefore we need to set the asp parameter for plots. + +# For a general sketch +# - we plot the frame a bit larger, don't draw axes +# - draw the ablines +# - draw two arrows to symbolize the coordinate axes + +p <- c(4, 2) +plot(p[1], p[2], + xlim=c(-0.5,10.5), + ylim=c(-0.5,10.5), + xlab="", ylab="", + axes=FALSE, + asp=1.0) +abline(h=p[2], lty=2) # horizontal +abline(p[2] - (p[1]*tan(pi/3)), tan(pi/3), lty=2) # intercept, slope +abline(p[2] + (p[1]*tan(pi/3)), -tan(pi/3), lty=2) # intercept, slope +arrows(0, 0, 10, 0, length=0.1) # length of arrow +arrows(0, 0, 0, 10, length=0.1) + + +# curves() +# rect() +# polygon() + +# example: plot the area under the normal distribution as a polygon, and overlay +# a histogram +set.seed(12357) +x <- rnorm(50) +sig <- 1.0 +myBreaks <- seq(-3 * sig, 3 * sig, by = 0.5 * sig) + +# first, draw a histogram but don't show the bars +hist(x, breaks = myBreaks, freq = FALSE, col = "#FFFFFF", border = "#FFFFFF") + +# next, plot the curve as a polygon() into the existing plot area +dn <- seq(-3, 3, length.out = 100) +polygon(dn, dnorm(dn), col = "#00FF8822", border = "#FFFFFF") + +# finally, replot the histogram. Setting "add = TRUE" plots it over the +# previous histogram +hist(x, breaks = myBreaks, freq = FALSE, + col = "#0000FF22", border = "#00000033", # note: transparent colours + add = TRUE) + +# +# More: see the Index of functions for the graphics package + + +# = 12 IMAGES ============================================================= + +# Todo + + +# = 13 CONTOUR LINES ====================================================== + +# ToDo + + +# = 14 3D PLOTS =========================================================== + +# ToDo + + +# = 15 GRAPHS AND NETWORKS ================================================ + +# ToDo + + +# = 16 OTHER GRPAHICS PACKAGES ============================================ + +# Packages in the standard distribution ... +# +# graphics:: +# grid:: +# lattice:: + +# Packages that can be downloaded from CRAN +# ... use with install.packages("package"), then +# library("package") + +# hexbin:: +# ggplot2:: + +# Packages that can be downloaded from BioConductor +# prada: +# if (! requireNamespace("prada", quietly=TRUE)) { +# if (! requireNamespace("BiocManager", quietly=TRUE)) { +# install.packages("BiocManager") +# } +# BiocManager::install("prada") +# } + +# = 17 INTERACTIVE PLOTS ================================================== + +# ToDo + +# == 17.1 locator() ======================================================== +# ToDo + +# == 17.2 plotly:: ========================================================= +# ToDo + + + + +# [End] + diff --git a/scriptTemplate.R b/scriptTemplate.R index 0f252e9..dee6447 100644 --- a/scriptTemplate.R +++ b/scriptTemplate.R @@ -1,75 +1,75 @@ -# scriptTemplate.R -# -# Purpose: -# Version: -# Date: -# Author: -# -# Input: -# Output: -# Dependencies: -# -# ToDo: -# Notes: -# -# ============================================================================== - -setwd("") - -# ==== PARAMETERS ============================================================ -# Define and explain all parameters. No "magic numbers" in your code below. - - - -# ==== PACKAGES ============================================================== -# Check that required packages have been installed. Install if needed. - -if (! requireNamespace("seqinr", quietly=TRUE)) { - install.packages("seqinr") -} -# Package information: -# library(help = seqinr) # basic information -# browseVignettes("seqinr") # available vignettes -# data(package = "seqinr") # available datasets - -# Note: use package functions with the :: operator - eg. -# seqinr::aaa("K") - - - -# ==== FUNCTIONS ============================================================= - -# Define functions or source external files -source("") - -myFunction <- function(a, b=1) { - # Purpose: - # Describe ... - # Parameters: - # a: ... - # b: ... - # Value: - # result: ... - - # code ... - - return(result) -} - - - -# ==== PROCESS =============================================================== -# Enter the step-by-step process of your project here. Strive to write your -# code so that you can simply run this entire file and re-create all -# intermediate results. - - - - - - -# ==== TESTS ================================================================= -# Enter your function tests here... - - -# [END] +# scriptTemplate.R +# +# Purpose: +# Version: +# Date: +# Author: +# +# Input: +# Output: +# Dependencies: +# +# ToDo: +# Notes: +# +# ============================================================================== + +setwd("") + +# ==== PARAMETERS ============================================================ +# Define and explain all parameters. No "magic numbers" in your code below. + + + +# ==== PACKAGES ============================================================== +# Check that required packages have been installed. Install if needed. + +if (! requireNamespace("seqinr", quietly=TRUE)) { + install.packages("seqinr") +} +# Package information: +# library(help = seqinr) # basic information +# browseVignettes("seqinr") # available vignettes +# data(package = "seqinr") # available datasets + +# Note: use package functions with the :: operator - eg. +# seqinr::aaa("K") + + + +# ==== FUNCTIONS ============================================================= + +# Define functions or source external files +source("") + +myFunction <- function(a, b=1) { + # Purpose: + # Describe ... + # Parameters: + # a: ... + # b: ... + # Value: + # result: ... + + # code ... + + return(result) +} + + + +# ==== PROCESS =============================================================== +# Enter the step-by-step process of your project here. Strive to write your +# code so that you can simply run this entire file and re-create all +# intermediate results. + + + + + + +# ==== TESTS ================================================================= +# Enter your function tests here... + + +# [END] diff --git a/scripts/ABC-createRefDB.R b/scripts/ABC-createRefDB.R index 3df8d08..fa144f6 100644 --- a/scripts/ABC-createRefDB.R +++ b/scripts/ABC-createRefDB.R @@ -1,30 +1,30 @@ -# ABC-createRefDB.R -# -# Create a reference protein database for Mbp1-like proteins -# -# Boris Steipe for ABC learning units -# -# For the species, see: -# http://steipe.biochemistry.utoronto.ca/abc/index.php/Reference_species_for_fungi -# -# For the data model, see -# https://docs.google.com/presentation/d/13vWaVcFpWEOGeSNhwmqugj2qTQuH1eZROgxWdHGEMr0 -# For the schema, see dbInit() in ./scripts/ABC-dbUtilities.R -# -# ============================================================================== - - -myDB <- dbInit() - -myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/MBP1_SACCE.json")) -myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/refMBP1Proteins.json")) -myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/refAPSES_PSI-BLAST.json")) - -myDB <- dbAddTaxonomy(myDB, jsonlite::fromJSON("./data/refTaxonomy.json")) - -myDB <- dbAddFeature(myDB, jsonlite::fromJSON("./data/refFeatures.json")) - -myDB <- dbAddAnnotation( myDB, jsonlite::fromJSON("./data/refAnnotations.json")) - - -# [END] +# ABC-createRefDB.R +# +# Create a reference protein database for Mbp1-like proteins +# +# Boris Steipe for ABC learning units +# +# For the species, see: +# http://steipe.biochemistry.utoronto.ca/abc/index.php/Reference_species_for_fungi +# +# For the data model, see +# https://docs.google.com/presentation/d/13vWaVcFpWEOGeSNhwmqugj2qTQuH1eZROgxWdHGEMr0 +# For the schema, see dbInit() in ./scripts/ABC-dbUtilities.R +# +# ============================================================================== + + +myDB <- dbInit() + +myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/MBP1_SACCE.json")) +myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/refMBP1Proteins.json")) +myDB <- dbAddProtein(myDB, jsonlite::fromJSON("./data/refAPSES_PSI-BLAST.json")) + +myDB <- dbAddTaxonomy(myDB, jsonlite::fromJSON("./data/refTaxonomy.json")) + +myDB <- dbAddFeature(myDB, jsonlite::fromJSON("./data/refFeatures.json")) + +myDB <- dbAddAnnotation( myDB, jsonlite::fromJSON("./data/refAnnotations.json")) + + +# [END] diff --git a/scripts/ABC-dbUtilities.R b/scripts/ABC-dbUtilities.R index 71709c8..9aa9b1d 100644 --- a/scripts/ABC-dbUtilities.R +++ b/scripts/ABC-dbUtilities.R @@ -1,674 +1,674 @@ -# tocID <- "scripts/ABC-dbUtilities.R" -# -# Purpose: Database utilities for ABC learning units. -# -# Version 2.3 -# -# Date: 2017-11 - 2020-11 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 2.3 Bug in treatment of single-column dataframes which returns -# a deparsed expression from paste() -# 2.2 Bugfixes -# 2.1 Add JSON export functions -# 2.0 Test all JSON import and prevent addition of duplicates. This -# is necessary for import of data from the public page -# 1.1 2020 Updates -# 1.0 Live version 2017 -# -# Notes: -# There are no functions to modify or delete entries. To do either, -# recreate the database with correct data in the creation script. This is the -# preferred way that ensures the entire database can be reproduced by -# source()'ing its generating script. -# -# Inserting data goes only through the very most minimal validation steps. For -# production applications, more validation would need to be added, as well -# as an overall validation of database integrity -# -# ToDo: -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------------- -#TOC> 1 INITIALISATIONS AND PARAMETERS 63 -#TOC> 2 PACKAGES 68 -#TOC> 3 FUNCTIONS 84 -#TOC> 3.01 dbSanitizeSequence() 87 -#TOC> 3.02 dbConfirmUnique() 122 -#TOC> 3.03 dbInit() 140 -#TOC> 3.04 dbAutoincrement() 180 -#TOC> 3.05 dbAddProtein() 193 -#TOC> 3.06 dbAddFeature() 229 -#TOC> 3.07 dbAddTaxonomy() 260 -#TOC> 3.08 dbAddAnnotation() 295 -#TOC> 3.09 dbFetchUniProtSeq() 342 -#TOC> 3.10 dbFetchPrositeFeatures() 388 -#TOC> 3.11 node2text() 438 -#TOC> 3.12 dbFetchNCBItaxData() 450 -#TOC> 3.13 UniProtIDmap() 489 -#TOC> 3.14 dbProt2JSON() 528 -#TOC> 3.15 dbSeq2JSON() 613 -#TOC> 3.16 dbRow2JSON() 642 -#TOC> 4 TESTS 662 -#TOC> -#TOC> ========================================================================== - - -# = 1 INITIALISATIONS AND PARAMETERS ====================================== - -doTESTS <- FALSE # run tests if TRUE - - -# = 2 PACKAGES ============================================================ - - -if (! requireNamespace("jsonlite", quietly = TRUE)) { - install.packages("jsonlite") -} - -if (! requireNamespace("httr", quietly = TRUE)) { - install.packages("httr") -} - -if (! requireNamespace("xml2", quietly = TRUE)) { - install.packages("xml2") -} - - -# = 3 FUNCTIONS =========================================================== - - -# == 3.01 dbSanitizeSequence() ============================================= -dbSanitizeSequence <- function(s, unambiguous = TRUE) { - # Remove FASTA header lines, if any, - # flatten any structure that s has, - # remove all non-letters except "-" (gap) and "*" (stop), - # convert to uppercase. - # - # Parameters: - # s chr A DNA or protein sequence plus other characters - # unambiguous bool if TRUE, stop() if any letter remaining after - # processing matches an ambiguity code. This is likely - # due to inadvertently including meta-data, such as - # a FASTA header, with the sequence. - # Note: since U is an ambiguity code for amino acid sequences, you need - # to set unambiguous = FALSE to process RNA sequences with Uracil. - # Value: chr a valid, uppercase, amino acid sequence - # - - s <- as.character(unlist(s)) # convert complex object to plain chr vector - s <- unlist(strsplit(s, "\n")) # split up at linebreaks, if any - s <- s[! grepl("^>", s)] # drop all lines beginning">" (FASTA header) - s <- paste(s, collapse="") # combine into single string - s <- toupper(gsub("[^a-zA-Z*-]", "", s)) - if (unambiguous) { - amb <- "([bjouxzBJOUXZ])" # parentheses capture the match - ambChar <- unlist(regmatches(s, regexec(amb, s)))[1] - if (! is.na(ambChar)) { - stop(paste("Input contains ambiguous codes(s): \"", - ambChar, "\".", sep="")) - } - } - return(s) -} - - -# == 3.02 dbConfirmUnique() ================================================ -dbConfirmUnique <- function(x) { - # x is a vector of logicals. - # returns x if x has exactly one TRUE element. - # stop() otherwise. - - if (any(!is.logical(x))) { - stop("PANIC: Input is not a boolean vector.") - } else if (sum(x) == 0) { - stop("PANIC: No match found.") - } else if (sum(x) > 1) { - stop("PANIC: More than one match found.") - } else { - return(x) - } -} - - -# == 3.03 dbInit() ========================================================= -dbInit <- function() { - # Return an empty instance of the protein database - # The schema is here: - # https://docs.google.com/presentation/d/13vWaVcFpWEOGeSNhwmqugj2qTQuH1eZROgxWdHGEMr0 - - db <- list() - - db$version <- "1.0" - - db$protein <- data.frame( - ID = numeric(), - name = character(), - RefSeqID = character(), - UniProtID = character(), - taxonomyID = numeric(), - sequence = character()) - - db$taxonomy <- data.frame( - ID = numeric(), - species = character()) - - db$annotation <- data.frame( - ID = numeric(), - proteinID = numeric(), - featureID = numeric(), - start = numeric(), - end = numeric()) - - db$feature <- data.frame( - ID = numeric(), - name = character(), - description = character(), - sourceDB = character(), - accession = character()) - - return(db) -} - - -# == 3.04 dbAutoincrement() ================================================ -dbAutoincrement <- function(tb) { - # Return a unique integer that can be used as a primary key - # Value: - # num a number one-larger than the largest current value in table$ID - if (length(tb$ID) == 0) { - return(1) - } else { - return(max(tb$ID) + 1) - } -} - - -# == 3.05 dbAddProtein() =================================================== -dbAddProtein <- function(db, jsonDF) { - # Add one or more protein entries to the database db if a protein with the - # same name does not yet exist. This enforces that protein names are unique. - # Parameters: - # db list a database created with dbInit() - # jsonDF data frame protein data imported into a data frame with - # fromJSON() - - for (i in seq_along(jsonDF$name)) { - isValid <- TRUE - if (jsonDF$name[i] %in% db$protein$name) { - cat(sprintf("Note: Protein No. %d in the input is \"%s\", but %s.\n", - i, jsonDF$name[i], - "a protein with this name already exists in the database. ", - "Skipping this input.")) - isValid <- FALSE - } - - if (isValid) { - if (length(jsonDF$name) == 1) { # jsonlite:: oversimplifies - jsonDF$sequence <- paste0(unlist(jsonDF$sequence), collapse = "") - } - x <- data.frame(ID = dbAutoincrement(db$protein), - name = jsonDF$name[i], - RefSeqID = jsonDF$RefSeqID[i], - UniProtID = jsonDF$UniProtID[i], - taxonomyID = as.integer(jsonDF$taxonomyID[i]), - sequence = dbSanitizeSequence(jsonDF$sequence[i])) - db$protein <- rbind(db$protein, x) - } - } - return(db) -} - - -# == 3.06 dbAddFeature() =================================================== -dbAddFeature <- function(db, jsonDF) { - # Add one or more feature entries to the database db. Skip if a feature with - # the same name already exists. - # Parameters: - # db list a database created with dbInit() - # jsonDF data frame feature data imported into a data frame with - # fromJSON() - for (i in seq_along(jsonDF$name)) { - isValid <- TRUE - if (jsonDF$name[i] %in% db$feature$name) { - cat(sprintf("Note: Feature No. %d in the input is \"%s\", but %s.\n", - i, jsonDF$name[i], - "a feature with this name already exists in the database. ", - "Skipping this input.")) - isValid <- FALSE - } - - if (isValid) { - x <- data.frame(ID = dbAutoincrement(db$feature), - name = jsonDF$name[i], - description = jsonDF$description[i], - sourceDB = jsonDF$sourceDB[i], - accession = jsonDF$accession[i]) - db$feature <- rbind(db$feature, x) - } - } - return(db) -} - - -# == 3.07 dbAddTaxonomy() ================================================== -dbAddTaxonomy <- function(db, jsonDF) { - # Add one or more taxonomy entries to the database db. Skip if species name - # or taxonomy ID already exist in the database. - # Parameters: - # db list A database created with dbInit() - # jsonDF data frame Taxonomy data imported into a data frame with - # fromJSON() - for (i in seq_along(jsonDF$species)) { - isValid <- TRUE - - if (jsonDF$species[i] %in% db$taxonomy$species) { - cat(sprintf("Note: Species No. %d in the input is \"%s\", but %s%s\n", - i, jsonDF$name[i], - "a species with this name already exists in the database. ", - "Skipping this input.")) - isValid <- FALSE - } else if (jsonDF$ID[i] %in% db$taxonomy$ID) { - cat(sprintf("Note: Taxonomy ID No. %d in the input is \"%d\", but %s%s\n", - i, jsonDF$ID[i], - "this taxonomy ID already exists in the database. ", - "Skipping this input.")) - isValid <- FALSE - } - if (isValid) { - x <- data.frame( - ID = as.integer(jsonDF$ID[i]), - species = jsonDF$species[i]) - db$taxonomy <- rbind(db$taxonomy, x) - } - } - return(db) -} - - -# == 3.08 dbAddAnnotation() ================================================ -dbAddAnnotation <- function(db, jsonDF) { - # Add one or more annotation entries to the database db. Skip the entry if - # it already exists in the database. - # Parameters: - # db list a database created with dbInit() - # jsonDF data frame annotation data imported into a data frame with - # fromJSON() - for (i in seq_along(jsonDF$pName)) { - isValid <- TRUE - - sel <- jsonDF$pName[i] == db$protein$name - sel <- dbConfirmUnique(sel) # Confirm that this protein ID exists - pID <- db$protein$ID[sel] - - sel <- jsonDF$fName[i] == db$feature$name - sel <- dbConfirmUnique(sel) # Confirm that this feature ID exists - fID <- db$feature$ID[sel] - - sel <- db$annotation$proteinID == pID & - db$annotation$featureID == fID & - db$annotation$start == as.integer(jsonDF$start[i]) & - db$annotation$end == as.integer(jsonDF$end[i]) - - if (any(sel)) { - cat(sprintf("Note: annotation No. %d in the input has %s%s\n", - i, - "the same protein name, feature name, start, and end ", - "as one that already exists in the database. ", - "Skipping this input.")) - - isValid <- FALSE - } - - if (isValid) { - x <- data.frame(ID = dbAutoincrement(db$annotation), - proteinID = pID, - featureID = fID, - start = as.integer(jsonDF$start[i]), - end = as.integer(jsonDF$end[i])) - db$annotation <- rbind(db$annotation, x) - } - } - return(db) -} - - -# == 3.09 dbFetchUniProtSeq() ============================================== -dbFetchUniProtSeq <- function(IDs) { - # Fetch a protein sequence from UniProt. - # Parameters: - # IDs char a vector of UniProt IDs (accession number) - # Value: - # char a vector of the same length as ID. It contains - # sequences where the retrieval was successful, NA where - # it was not successful. The elements are named with - # the ID, the header lines are set as attribute "header" - - - BASE <- "http://www.uniprot.org/uniprot/" - - sq <- character() - hd <- character() - for (i in seq_along(IDs)) { - URL <- sprintf("%s%s.fasta", BASE, IDs[i]) - response <- httr::GET(URL) - if (httr::status_code(response) == 200) { - s <- as.character(response) - s <- unlist(strsplit(s, "\n")) - x <- dbSanitizeSequence(s) - } else { - s <- "" - x <- NA - } - hd[i] <- s[1] - sq[i] <- x - } - names(sq) <- IDs - attr(sq, "headers") <- hd - - return(sq) -} - -if (FALSE) { - inp <- c("P79073", "P0000000", "A0A1W2TKZ7") - s <- dbFetchUniProtSeq(inp) - s[1:3] - str(s) - attr(s, "headers")[1] -} - - - -# == 3.10 dbFetchPrositeFeatures() ========================================= -dbFetchPrositeFeatures <- function(ID) { - # Fetch feature annotations from ScanProsite. - # Parameters: - # ID char a UniProt ID (accession number) - # Value: - # data frame uID char UniProt ID - # start num start of motif - # end num end of motif - # psID char PROSITE motif ID - # psName char PROSITE motif name - # psSeq char sequence annotated to the feature - # If the operation is not successful, a 0-length data frame is returned. - - URL <- "https://prosite.expasy.org/cgi-bin/prosite/PSScan.cgi" - - response <- httr::POST(URL, - body = list(meta = "opt1", - meta1_protein = "opt1", - seq = ID, - skip = "on", - output = "tabular")) - - myFeatures <- data.frame() - if (httr::status_code(response) == 200) { - - lines <- unlist(strsplit(httr::content(response, "text"), "\\n")) - - patt <- sprintf("\\|%s\\|", ID) - lines <- lines[grep(patt, lines)] - - for (line in lines) { - tokens <- unlist(strsplit(line, "\\t|\\|")) - myFeatures <- rbind(myFeatures, - data.frame(uID = tokens[2], - start = as.numeric(tokens[4]), - end = as.numeric(tokens[5]), - psID = tokens[6], - psName = tokens[7], - psSeq = tokens[11])) - } - } - return(myFeatures) -} - -if (FALSE) { - dbFetchPrositeFeatures("P33520") # RES1_SCHPO - -} - -# == 3.11 node2text() ====================================================== -node2text <- function(doc, tag) { - # an extractor function for the contents of elements - # between given tags in an XML response. - # Contents of all matching elements is returned in - # a vector of strings. - path <- paste0("//", tag) - nodes <- xml2::xml_find_all(doc, path) - return(xml2::xml_text(nodes)) -} - - -# == 3.12 dbFetchNCBItaxData() ============================================= -dbFetchNCBItaxData <- function(ID) { - # Fetch feature taxID and Organism from the NCBI. - # Parameters: - # ID char a RefSeq ID (accession number) - # Value: - # data frame taxID num NCBI taxID - # organism char organism for this taxID - # If the operation is not successful, a 0-length data frame is returned. - - eUtilsBase <- "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/" - URL <- paste(eUtilsBase, - "esearch.fcgi?", - "db=protein", - "&term=", ID, - sep="") - myXML <- xml2::read_xml(URL) - GID <- node2text(myXML, "Id") - - URL <- paste0(eUtilsBase, - "esummary.fcgi?", - "db=protein", - "&id=", - GID, - "&version=2.0") - myXML <- xml2::read_xml(URL) - - x <- as.integer(node2text(myXML, "TaxId")) - y <- node2text(myXML, "Organism") - - tID <- data.frame() - if (length(x) > 0 && length(y) > 0) { - tID <- data.frame(taxID = x, organism = y) - } - return(tID) -} - - - -# == 3.13 UniProtIDmap() =================================================== -UniProtIDmap <- function (s, mapFrom = "P_REFSEQ_AC", mapTo = "ACC") { - # Use UniProt ID mapping service to map one or more IDs - # Parameters: - # s char A string of white-space separated IDs - # mapFrom char the database in which the IDs in s are valid. - # Default is RefSeq protein - # mapTo char the database in which the target IDs are valid. - # Default is UniProtKB - # Value - # A data frame of mapped IDs, with column names From and To, or an - # empty data frame if the mapping was unsuccessful. No rows are returned - # for IDs that are not mapped. - - # Initialize curl - httr::set_config(httr::config(http_version = 0)) - - URL <- "https://www.uniprot.org/uploadlists/" - response <- httr::POST(URL, - body = list(from = mapFrom, - to = mapTo, - format = "tab", - query = s)) - - if (httr::status_code(response) == 200) { # 200: oK - myMap <- read.delim(file = textConnection(httr::content(response)), - sep = "\t") - colnames(myMap) <- c("From", "To") - } else { - myMap <- data.frame() - warning(paste("No uniProt ID mapping returned:", - "server sent status", - httr::status_code(response))) - } - - return(myMap) -} - - -# == 3.14 dbProt2JSON() ==================================================== -dbProt2JSON <- function(thisProt) { - # Extract all protein related data from myDB and return in JSON format. - - thisData <- list() - - # add a protein table - sel <- which(myDB$protein$name == thisProt) - thisData$protein <- myDB$protein[sel, ] - - # add a taxonomy table - sel <- which(myDB$taxonomy$ID == thisData$protein$taxonomyID) - thisData$taxonomy <- myDB$taxonomy[sel, ] - - # add the entries for this protein from the annotation table - sel <- which(myDB$annotation$proteinID == thisData$protein$ID) - thisData$annotation <- myDB$annotation[sel, ] - # our .json convention uses pName and fName as keys, not the db-internal IDs - # add empty columns for pName and fName - l <- nrow(thisData$annotation) - thisData$annotation$pName <- character(l) - thisData$annotation$fName <- character(l) - # get the appropriate protein and feature names - for (i in seq_len(l)) { - pID <- thisData$annotation$proteinID[i] - sel <- which(myDB$protein$ID == pID) - thisData$annotation$pName[i] <- myDB$protein$name[sel] # store pName - fID <- thisData$annotation$featureID[i] - sel <- which(myDB$feature$ID == fID) - thisData$annotation$fName[i] <- myDB$feature$name[sel] # store fName - } - - # add the corresponding feature table - sel <- which(myDB$feature$ID %in% thisData$annotation$featureID) - thisData$feature <- myDB$feature[sel, ] - - # remove columns that are not going into JSON output - thisData$protein$ID <- NULL - thisData$annotation$ID <- NULL - thisData$annotation$proteinID <- NULL - thisData$annotation$featureID <- NULL - thisData$feature$ID <- NULL - - # create JSON-formatted output - # ( jsonlite::prettify() is too wordy for a compact Wikipage ) - - out <- character() - out <- c(out, '{') - - out <- c(out, ' "protein": {') - sel <- colnames(thisData$protein) != "sequence" - out <- c(out, sprintf(" %s,", dbRow2JSON(thisData$protein[1, sel], - coll = ",\n "))) - out <- c(out, dbSeq2JSON(thisData$protein$sequence[1])) - out <- c(out, ' },') - - out <- c(out, ' "taxonomy": {') - out <- c(out, sprintf(" %s", dbRow2JSON(thisData$taxonomy))) - out <- c(out, ' },') - - out <- c(out, ' "annotation": [') - for (i in seq_len(nrow(thisData$annotation))) { - out <- c(out, sprintf(" {%s},", dbRow2JSON(thisData$annotation[i, ]))) - } - out[length(out)] <- gsub(",$", "", out[length(out)]) # remove last "," - out <- c(out, ' ],') - - out <- c(out, ' "feature": [') - sel <- colnames(thisData$feature) != "description" - for (i in seq_len(nrow(thisData$feature))) { - out <- c(out, sprintf(" {%s,", - dbRow2JSON(thisData$feature[i, sel]))) - out <- c(out, sprintf(" %s},", - dbRow2JSON(thisData$feature[i, "description", - drop = FALSE]))) - } - out[length(out)] <- gsub(",$", "", out[length(out)]) # remove last "," - out <- c(out, ' ]') - - out <- c(out, '}') - - return(paste0(out, collapse = "\n")) -} - - -# == 3.15 dbSeq2JSON() ===================================================== - -dbSeq2JSON <- function(s, nIndents = 4, width = 70) { - # Turn a sequence into a JSON key-value pair, with the value being a JSON - # array of elements not exceeding a width of "width", and an indent of - # "indents" spaces. - ind <- paste0(rep(" ", nIndents), collapse = "") - - out <- character() - out <- c(out, sprintf("%s\"sequence\": [", ind)) - - for (i in seq_along(s)) { - l <- nchar(s[i]) - if (l <= width) { - out <- c(out, s[i]) - } else { - starts <- seq(1, l, by = width) - ends <- seq(width, l, by = width) - if (length(ends) < length(starts)) { ends <- c(ends, l) } - out <- c(out, sprintf("%s \"%s\",", ind, substring(s[i], starts, ends))) - } - } - out[length(out)] <- gsub(",$", "", out[length(out)]) # remove last "," - - out <- c(out, sprintf("%s]", ind)) - return(paste0(out, collapse = "\n")) -} - - -# == 3.16 dbRow2JSON() ===================================================== - -dbRow2JSON <- function(df, coll = ", ") { - # Turn a single dataframe row into JSON key value pairs, where the keys are the - # column names. Respects character / numeric mode. - out <- character() - for (i in 1:ncol(df)) { - if (class(df[1, i]) == "integer") { - val <- sprintf("%d", df[1, i]) - } else if (class(df[1, i]) == "numeric") { - val <- sprintf("%f", df[1, i]) - } else { - val <- sprintf("\"%s\"", as.character(df[1, i])) - } - out <- c(out, sprintf("\"%s\": %s", colnames(df)[i], val)) - } - return(paste0(out, collapse = coll)) -} - - -# = 4 TESTS =============================================================== - -if (doTESTS) { - if (! requireNamespace("testthat", quietly = TRUE)) { - install.packages("testthat") - } - - # ToDo: test everything here - -} - - -# [END] +# tocID <- "scripts/ABC-dbUtilities.R" +# +# Purpose: Database utilities for ABC learning units. +# +# Version 2.3 +# +# Date: 2017-11 - 2020-11 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 2.3 Bug in treatment of single-column dataframes which returns +# a deparsed expression from paste() +# 2.2 Bugfixes +# 2.1 Add JSON export functions +# 2.0 Test all JSON import and prevent addition of duplicates. This +# is necessary for import of data from the public page +# 1.1 2020 Updates +# 1.0 Live version 2017 +# +# Notes: +# There are no functions to modify or delete entries. To do either, +# recreate the database with correct data in the creation script. This is the +# preferred way that ensures the entire database can be reproduced by +# source()'ing its generating script. +# +# Inserting data goes only through the very most minimal validation steps. For +# production applications, more validation would need to be added, as well +# as an overall validation of database integrity +# +# ToDo: +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------------- +#TOC> 1 INITIALISATIONS AND PARAMETERS 63 +#TOC> 2 PACKAGES 68 +#TOC> 3 FUNCTIONS 84 +#TOC> 3.01 dbSanitizeSequence() 87 +#TOC> 3.02 dbConfirmUnique() 122 +#TOC> 3.03 dbInit() 140 +#TOC> 3.04 dbAutoincrement() 180 +#TOC> 3.05 dbAddProtein() 193 +#TOC> 3.06 dbAddFeature() 229 +#TOC> 3.07 dbAddTaxonomy() 260 +#TOC> 3.08 dbAddAnnotation() 295 +#TOC> 3.09 dbFetchUniProtSeq() 342 +#TOC> 3.10 dbFetchPrositeFeatures() 388 +#TOC> 3.11 node2text() 438 +#TOC> 3.12 dbFetchNCBItaxData() 450 +#TOC> 3.13 UniProtIDmap() 489 +#TOC> 3.14 dbProt2JSON() 528 +#TOC> 3.15 dbSeq2JSON() 613 +#TOC> 3.16 dbRow2JSON() 642 +#TOC> 4 TESTS 662 +#TOC> +#TOC> ========================================================================== + + +# = 1 INITIALISATIONS AND PARAMETERS ====================================== + +doTESTS <- FALSE # run tests if TRUE + + +# = 2 PACKAGES ============================================================ + + +if (! requireNamespace("jsonlite", quietly = TRUE)) { + install.packages("jsonlite") +} + +if (! requireNamespace("httr", quietly = TRUE)) { + install.packages("httr") +} + +if (! requireNamespace("xml2", quietly = TRUE)) { + install.packages("xml2") +} + + +# = 3 FUNCTIONS =========================================================== + + +# == 3.01 dbSanitizeSequence() ============================================= +dbSanitizeSequence <- function(s, unambiguous = TRUE) { + # Remove FASTA header lines, if any, + # flatten any structure that s has, + # remove all non-letters except "-" (gap) and "*" (stop), + # convert to uppercase. + # + # Parameters: + # s chr A DNA or protein sequence plus other characters + # unambiguous bool if TRUE, stop() if any letter remaining after + # processing matches an ambiguity code. This is likely + # due to inadvertently including meta-data, such as + # a FASTA header, with the sequence. + # Note: since U is an ambiguity code for amino acid sequences, you need + # to set unambiguous = FALSE to process RNA sequences with Uracil. + # Value: chr a valid, uppercase, amino acid sequence + # + + s <- as.character(unlist(s)) # convert complex object to plain chr vector + s <- unlist(strsplit(s, "\n")) # split up at linebreaks, if any + s <- s[! grepl("^>", s)] # drop all lines beginning">" (FASTA header) + s <- paste(s, collapse="") # combine into single string + s <- toupper(gsub("[^a-zA-Z*-]", "", s)) + if (unambiguous) { + amb <- "([bjouxzBJOUXZ])" # parentheses capture the match + ambChar <- unlist(regmatches(s, regexec(amb, s)))[1] + if (! is.na(ambChar)) { + stop(paste("Input contains ambiguous codes(s): \"", + ambChar, "\".", sep="")) + } + } + return(s) +} + + +# == 3.02 dbConfirmUnique() ================================================ +dbConfirmUnique <- function(x) { + # x is a vector of logicals. + # returns x if x has exactly one TRUE element. + # stop() otherwise. + + if (any(!is.logical(x))) { + stop("PANIC: Input is not a boolean vector.") + } else if (sum(x) == 0) { + stop("PANIC: No match found.") + } else if (sum(x) > 1) { + stop("PANIC: More than one match found.") + } else { + return(x) + } +} + + +# == 3.03 dbInit() ========================================================= +dbInit <- function() { + # Return an empty instance of the protein database + # The schema is here: + # https://docs.google.com/presentation/d/13vWaVcFpWEOGeSNhwmqugj2qTQuH1eZROgxWdHGEMr0 + + db <- list() + + db$version <- "1.0" + + db$protein <- data.frame( + ID = numeric(), + name = character(), + RefSeqID = character(), + UniProtID = character(), + taxonomyID = numeric(), + sequence = character()) + + db$taxonomy <- data.frame( + ID = numeric(), + species = character()) + + db$annotation <- data.frame( + ID = numeric(), + proteinID = numeric(), + featureID = numeric(), + start = numeric(), + end = numeric()) + + db$feature <- data.frame( + ID = numeric(), + name = character(), + description = character(), + sourceDB = character(), + accession = character()) + + return(db) +} + + +# == 3.04 dbAutoincrement() ================================================ +dbAutoincrement <- function(tb) { + # Return a unique integer that can be used as a primary key + # Value: + # num a number one-larger than the largest current value in table$ID + if (length(tb$ID) == 0) { + return(1) + } else { + return(max(tb$ID) + 1) + } +} + + +# == 3.05 dbAddProtein() =================================================== +dbAddProtein <- function(db, jsonDF) { + # Add one or more protein entries to the database db if a protein with the + # same name does not yet exist. This enforces that protein names are unique. + # Parameters: + # db list a database created with dbInit() + # jsonDF data frame protein data imported into a data frame with + # fromJSON() + + for (i in seq_along(jsonDF$name)) { + isValid <- TRUE + if (jsonDF$name[i] %in% db$protein$name) { + cat(sprintf("Note: Protein No. %d in the input is \"%s\", but %s.\n", + i, jsonDF$name[i], + "a protein with this name already exists in the database. ", + "Skipping this input.")) + isValid <- FALSE + } + + if (isValid) { + if (length(jsonDF$name) == 1) { # jsonlite:: oversimplifies + jsonDF$sequence <- paste0(unlist(jsonDF$sequence), collapse = "") + } + x <- data.frame(ID = dbAutoincrement(db$protein), + name = jsonDF$name[i], + RefSeqID = jsonDF$RefSeqID[i], + UniProtID = jsonDF$UniProtID[i], + taxonomyID = as.integer(jsonDF$taxonomyID[i]), + sequence = dbSanitizeSequence(jsonDF$sequence[i])) + db$protein <- rbind(db$protein, x) + } + } + return(db) +} + + +# == 3.06 dbAddFeature() =================================================== +dbAddFeature <- function(db, jsonDF) { + # Add one or more feature entries to the database db. Skip if a feature with + # the same name already exists. + # Parameters: + # db list a database created with dbInit() + # jsonDF data frame feature data imported into a data frame with + # fromJSON() + for (i in seq_along(jsonDF$name)) { + isValid <- TRUE + if (jsonDF$name[i] %in% db$feature$name) { + cat(sprintf("Note: Feature No. %d in the input is \"%s\", but %s.\n", + i, jsonDF$name[i], + "a feature with this name already exists in the database. ", + "Skipping this input.")) + isValid <- FALSE + } + + if (isValid) { + x <- data.frame(ID = dbAutoincrement(db$feature), + name = jsonDF$name[i], + description = jsonDF$description[i], + sourceDB = jsonDF$sourceDB[i], + accession = jsonDF$accession[i]) + db$feature <- rbind(db$feature, x) + } + } + return(db) +} + + +# == 3.07 dbAddTaxonomy() ================================================== +dbAddTaxonomy <- function(db, jsonDF) { + # Add one or more taxonomy entries to the database db. Skip if species name + # or taxonomy ID already exist in the database. + # Parameters: + # db list A database created with dbInit() + # jsonDF data frame Taxonomy data imported into a data frame with + # fromJSON() + for (i in seq_along(jsonDF$species)) { + isValid <- TRUE + + if (jsonDF$species[i] %in% db$taxonomy$species) { + cat(sprintf("Note: Species No. %d in the input is \"%s\", but %s%s\n", + i, jsonDF$name[i], + "a species with this name already exists in the database. ", + "Skipping this input.")) + isValid <- FALSE + } else if (jsonDF$ID[i] %in% db$taxonomy$ID) { + cat(sprintf("Note: Taxonomy ID No. %d in the input is \"%d\", but %s%s\n", + i, jsonDF$ID[i], + "this taxonomy ID already exists in the database. ", + "Skipping this input.")) + isValid <- FALSE + } + if (isValid) { + x <- data.frame( + ID = as.integer(jsonDF$ID[i]), + species = jsonDF$species[i]) + db$taxonomy <- rbind(db$taxonomy, x) + } + } + return(db) +} + + +# == 3.08 dbAddAnnotation() ================================================ +dbAddAnnotation <- function(db, jsonDF) { + # Add one or more annotation entries to the database db. Skip the entry if + # it already exists in the database. + # Parameters: + # db list a database created with dbInit() + # jsonDF data frame annotation data imported into a data frame with + # fromJSON() + for (i in seq_along(jsonDF$pName)) { + isValid <- TRUE + + sel <- jsonDF$pName[i] == db$protein$name + sel <- dbConfirmUnique(sel) # Confirm that this protein ID exists + pID <- db$protein$ID[sel] + + sel <- jsonDF$fName[i] == db$feature$name + sel <- dbConfirmUnique(sel) # Confirm that this feature ID exists + fID <- db$feature$ID[sel] + + sel <- db$annotation$proteinID == pID & + db$annotation$featureID == fID & + db$annotation$start == as.integer(jsonDF$start[i]) & + db$annotation$end == as.integer(jsonDF$end[i]) + + if (any(sel)) { + cat(sprintf("Note: annotation No. %d in the input has %s%s\n", + i, + "the same protein name, feature name, start, and end ", + "as one that already exists in the database. ", + "Skipping this input.")) + + isValid <- FALSE + } + + if (isValid) { + x <- data.frame(ID = dbAutoincrement(db$annotation), + proteinID = pID, + featureID = fID, + start = as.integer(jsonDF$start[i]), + end = as.integer(jsonDF$end[i])) + db$annotation <- rbind(db$annotation, x) + } + } + return(db) +} + + +# == 3.09 dbFetchUniProtSeq() ============================================== +dbFetchUniProtSeq <- function(IDs) { + # Fetch a protein sequence from UniProt. + # Parameters: + # IDs char a vector of UniProt IDs (accession number) + # Value: + # char a vector of the same length as ID. It contains + # sequences where the retrieval was successful, NA where + # it was not successful. The elements are named with + # the ID, the header lines are set as attribute "header" + + + BASE <- "http://www.uniprot.org/uniprot/" + + sq <- character() + hd <- character() + for (i in seq_along(IDs)) { + URL <- sprintf("%s%s.fasta", BASE, IDs[i]) + response <- httr::GET(URL) + if (httr::status_code(response) == 200) { + s <- as.character(response) + s <- unlist(strsplit(s, "\n")) + x <- dbSanitizeSequence(s) + } else { + s <- "" + x <- NA + } + hd[i] <- s[1] + sq[i] <- x + } + names(sq) <- IDs + attr(sq, "headers") <- hd + + return(sq) +} + +if (FALSE) { + inp <- c("P79073", "P0000000", "A0A1W2TKZ7") + s <- dbFetchUniProtSeq(inp) + s[1:3] + str(s) + attr(s, "headers")[1] +} + + + +# == 3.10 dbFetchPrositeFeatures() ========================================= +dbFetchPrositeFeatures <- function(ID) { + # Fetch feature annotations from ScanProsite. + # Parameters: + # ID char a UniProt ID (accession number) + # Value: + # data frame uID char UniProt ID + # start num start of motif + # end num end of motif + # psID char PROSITE motif ID + # psName char PROSITE motif name + # psSeq char sequence annotated to the feature + # If the operation is not successful, a 0-length data frame is returned. + + URL <- "https://prosite.expasy.org/cgi-bin/prosite/PSScan.cgi" + + response <- httr::POST(URL, + body = list(meta = "opt1", + meta1_protein = "opt1", + seq = ID, + skip = "on", + output = "tabular")) + + myFeatures <- data.frame() + if (httr::status_code(response) == 200) { + + lines <- unlist(strsplit(httr::content(response, "text"), "\\n")) + + patt <- sprintf("\\|%s\\|", ID) + lines <- lines[grep(patt, lines)] + + for (line in lines) { + tokens <- unlist(strsplit(line, "\\t|\\|")) + myFeatures <- rbind(myFeatures, + data.frame(uID = tokens[2], + start = as.numeric(tokens[4]), + end = as.numeric(tokens[5]), + psID = tokens[6], + psName = tokens[7], + psSeq = tokens[11])) + } + } + return(myFeatures) +} + +if (FALSE) { + dbFetchPrositeFeatures("P33520") # RES1_SCHPO + +} + +# == 3.11 node2text() ====================================================== +node2text <- function(doc, tag) { + # an extractor function for the contents of elements + # between given tags in an XML response. + # Contents of all matching elements is returned in + # a vector of strings. + path <- paste0("//", tag) + nodes <- xml2::xml_find_all(doc, path) + return(xml2::xml_text(nodes)) +} + + +# == 3.12 dbFetchNCBItaxData() ============================================= +dbFetchNCBItaxData <- function(ID) { + # Fetch feature taxID and Organism from the NCBI. + # Parameters: + # ID char a RefSeq ID (accession number) + # Value: + # data frame taxID num NCBI taxID + # organism char organism for this taxID + # If the operation is not successful, a 0-length data frame is returned. + + eUtilsBase <- "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/" + URL <- paste(eUtilsBase, + "esearch.fcgi?", + "db=protein", + "&term=", ID, + sep="") + myXML <- xml2::read_xml(URL) + GID <- node2text(myXML, "Id") + + URL <- paste0(eUtilsBase, + "esummary.fcgi?", + "db=protein", + "&id=", + GID, + "&version=2.0") + myXML <- xml2::read_xml(URL) + + x <- as.integer(node2text(myXML, "TaxId")) + y <- node2text(myXML, "Organism") + + tID <- data.frame() + if (length(x) > 0 && length(y) > 0) { + tID <- data.frame(taxID = x, organism = y) + } + return(tID) +} + + + +# == 3.13 UniProtIDmap() =================================================== +UniProtIDmap <- function (s, mapFrom = "P_REFSEQ_AC", mapTo = "ACC") { + # Use UniProt ID mapping service to map one or more IDs + # Parameters: + # s char A string of white-space separated IDs + # mapFrom char the database in which the IDs in s are valid. + # Default is RefSeq protein + # mapTo char the database in which the target IDs are valid. + # Default is UniProtKB + # Value + # A data frame of mapped IDs, with column names From and To, or an + # empty data frame if the mapping was unsuccessful. No rows are returned + # for IDs that are not mapped. + + # Initialize curl + httr::set_config(httr::config(http_version = 0)) + + URL <- "https://www.uniprot.org/uploadlists/" + response <- httr::POST(URL, + body = list(from = mapFrom, + to = mapTo, + format = "tab", + query = s)) + + if (httr::status_code(response) == 200) { # 200: oK + myMap <- read.delim(file = textConnection(httr::content(response)), + sep = "\t") + colnames(myMap) <- c("From", "To") + } else { + myMap <- data.frame() + warning(paste("No uniProt ID mapping returned:", + "server sent status", + httr::status_code(response))) + } + + return(myMap) +} + + +# == 3.14 dbProt2JSON() ==================================================== +dbProt2JSON <- function(thisProt) { + # Extract all protein related data from myDB and return in JSON format. + + thisData <- list() + + # add a protein table + sel <- which(myDB$protein$name == thisProt) + thisData$protein <- myDB$protein[sel, ] + + # add a taxonomy table + sel <- which(myDB$taxonomy$ID == thisData$protein$taxonomyID) + thisData$taxonomy <- myDB$taxonomy[sel, ] + + # add the entries for this protein from the annotation table + sel <- which(myDB$annotation$proteinID == thisData$protein$ID) + thisData$annotation <- myDB$annotation[sel, ] + # our .json convention uses pName and fName as keys, not the db-internal IDs + # add empty columns for pName and fName + l <- nrow(thisData$annotation) + thisData$annotation$pName <- character(l) + thisData$annotation$fName <- character(l) + # get the appropriate protein and feature names + for (i in seq_len(l)) { + pID <- thisData$annotation$proteinID[i] + sel <- which(myDB$protein$ID == pID) + thisData$annotation$pName[i] <- myDB$protein$name[sel] # store pName + fID <- thisData$annotation$featureID[i] + sel <- which(myDB$feature$ID == fID) + thisData$annotation$fName[i] <- myDB$feature$name[sel] # store fName + } + + # add the corresponding feature table + sel <- which(myDB$feature$ID %in% thisData$annotation$featureID) + thisData$feature <- myDB$feature[sel, ] + + # remove columns that are not going into JSON output + thisData$protein$ID <- NULL + thisData$annotation$ID <- NULL + thisData$annotation$proteinID <- NULL + thisData$annotation$featureID <- NULL + thisData$feature$ID <- NULL + + # create JSON-formatted output + # ( jsonlite::prettify() is too wordy for a compact Wikipage ) + + out <- character() + out <- c(out, '{') + + out <- c(out, ' "protein": {') + sel <- colnames(thisData$protein) != "sequence" + out <- c(out, sprintf(" %s,", dbRow2JSON(thisData$protein[1, sel], + coll = ",\n "))) + out <- c(out, dbSeq2JSON(thisData$protein$sequence[1])) + out <- c(out, ' },') + + out <- c(out, ' "taxonomy": {') + out <- c(out, sprintf(" %s", dbRow2JSON(thisData$taxonomy))) + out <- c(out, ' },') + + out <- c(out, ' "annotation": [') + for (i in seq_len(nrow(thisData$annotation))) { + out <- c(out, sprintf(" {%s},", dbRow2JSON(thisData$annotation[i, ]))) + } + out[length(out)] <- gsub(",$", "", out[length(out)]) # remove last "," + out <- c(out, ' ],') + + out <- c(out, ' "feature": [') + sel <- colnames(thisData$feature) != "description" + for (i in seq_len(nrow(thisData$feature))) { + out <- c(out, sprintf(" {%s,", + dbRow2JSON(thisData$feature[i, sel]))) + out <- c(out, sprintf(" %s},", + dbRow2JSON(thisData$feature[i, "description", + drop = FALSE]))) + } + out[length(out)] <- gsub(",$", "", out[length(out)]) # remove last "," + out <- c(out, ' ]') + + out <- c(out, '}') + + return(paste0(out, collapse = "\n")) +} + + +# == 3.15 dbSeq2JSON() ===================================================== + +dbSeq2JSON <- function(s, nIndents = 4, width = 70) { + # Turn a sequence into a JSON key-value pair, with the value being a JSON + # array of elements not exceeding a width of "width", and an indent of + # "indents" spaces. + ind <- paste0(rep(" ", nIndents), collapse = "") + + out <- character() + out <- c(out, sprintf("%s\"sequence\": [", ind)) + + for (i in seq_along(s)) { + l <- nchar(s[i]) + if (l <= width) { + out <- c(out, s[i]) + } else { + starts <- seq(1, l, by = width) + ends <- seq(width, l, by = width) + if (length(ends) < length(starts)) { ends <- c(ends, l) } + out <- c(out, sprintf("%s \"%s\",", ind, substring(s[i], starts, ends))) + } + } + out[length(out)] <- gsub(",$", "", out[length(out)]) # remove last "," + + out <- c(out, sprintf("%s]", ind)) + return(paste0(out, collapse = "\n")) +} + + +# == 3.16 dbRow2JSON() ===================================================== + +dbRow2JSON <- function(df, coll = ", ") { + # Turn a single dataframe row into JSON key value pairs, where the keys are the + # column names. Respects character / numeric mode. + out <- character() + for (i in 1:ncol(df)) { + if (class(df[1, i]) == "integer") { + val <- sprintf("%d", df[1, i]) + } else if (class(df[1, i]) == "numeric") { + val <- sprintf("%f", df[1, i]) + } else { + val <- sprintf("\"%s\"", as.character(df[1, i])) + } + out <- c(out, sprintf("\"%s\": %s", colnames(df)[i], val)) + } + return(paste0(out, collapse = coll)) +} + + +# = 4 TESTS =============================================================== + +if (doTESTS) { + if (! requireNamespace("testthat", quietly = TRUE)) { + install.packages("testthat") + } + + # ToDo: test everything here + +} + + +# [END] diff --git a/scripts/ABC-makeMYSPElist.R b/scripts/ABC-makeMYSPElist.R index b519dd6..7544851 100644 --- a/scripts/ABC-makeMYSPElist.R +++ b/scripts/ABC-makeMYSPElist.R @@ -1,443 +1,443 @@ -# tocID <- "scripts/ABC-makeMYSPElist.R" -# -# Purpose: Create a list of genome sequenced fungi with protein annotations and -# Mbp1 homologues. -# -# Version: 1.4 -# -# Date: 2016 09 - 2021 09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions -# 1.4 New retrieval logic -# 1.3 Rewrite to change datasource. NCBI has not been updated -# since 2012. Use ensembl fungi as initial source. -# 1.2 Change from require() to requireNamespace() -# 1.1.2 Moved BLAST.R to ./scripts directory -# 1.1 Update 2017 -# 1.0 First code 2016 -# -# TODO: -# -# ============================================================================== -# -# DO NOT source() THIS FILE! -# -# This file is code I provide for your deeper understanding of a process and -# to provide you with useful sample code. It is not actually necessary for -# you to run this code, but I encourage you to read it carefully and discuss -# if there are parts you don't understand. -# -# Run the commands that interact with the NCBI servers only if you want to -# experiment specifically with the code and/or parameters. I have commented out -# those parts. If you only want to study the general workflow, just load() -# the respective intermediate results. -# - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> -------------------------------------------------------- -#TOC> 1 The strategy 55 -#TOC> 2 PACKAGES AND INITIALIZATIONS 67 -#TOC> 3 ENSEMBL FUNGI 75 -#TOC> 3.1 Import 78 -#TOC> 4 BLAST SEARCH 155 -#TOC> 4.1 find homologous proteins 161 -#TOC> 4.2 Identify species in "hits" 192 -#TOC> 5 MERGE ENSEMBL AND BLAST RESULTS 282 -#TOC> 6 STUDENT NUMBERS 375 -#TOC> -#TOC> ========================================================================== - - -# = 1 The strategy ======================================================== - -# This script will create a list of "MYSPE" species and save it in an R object -# MYSPEspecies that is stored in the data subdirectory of this project from -# where it can be loaded. The strategy is as follows: we download a list of -# annotated fungal genomes from ensembl.fungi. All these are genome-sequenced -# species that have been annotated. -# Next we perform a BLAST search, to identify fungal species that have -# genes that are homologous to yeast MBP1. -# -# ... - -# = 2 PACKAGES AND INITIALIZATIONS ======================================== - -# httr provides interfaces to Webservers on the Internet -if (! requireNamespace("httr", quietly = TRUE)) { - install.packages("httr") -} - - -# = 3 ENSEMBL FUNGI ======================================================= - - -# == 3.1 Import ============================================================ - -# Navigate to https://fungi.ensembl.org and click on the link to the full -# list of all species: https://fungi.ensembl.org/species.html -# On the page, click on the spreadsheet symbol top right and choose -# "download whole table". The file will be named "Species.csv", in your -# usual downloads folder. Move it to the data folder, and read it. - -sDat <- read.csv("./data/Species.csv") -str(sDat) - -# The most obvious way to partition these is according to Classification ... -# (poking around a bit in the UniProt taxonomy database shows that the -# classification used here is the taxonomic rank of "order"). -# how many classifications do we have? -length(unique(sDat$Classification)) # 66 - -# To have a good set for the class, we should have about 100. -# Let's see for which of these we can find Mbp1 homologues. -# First, we'll keep only the colums for name, classification, and taxID, and -# drop the rest ... -sDat <- sDat[ , c("Name", "Classification", "Taxon.ID")] -colnames(sDat) <- c("name", "order", "taxID") - -# Next, we make an extra column: genus - the first part of the binomial name. -# We'll use the gsub() function, and for that we need a "regular expression" -# that matches to all characters from the first blank to the end of the string: -myPatt <- "\\s.*$" # one whitespace (\\s) ... - # followed by any character (.) 0..n times (*) ... - # until the end of the string - -# using gsub() we substitue all matching characters with the empty string "" - -# this deletes the matching characters -# Test this: -gsub(myPatt, "", "Genus") # one word: unchanged -gsub(myPatt, "", "gEnus species") # two words: return only first -gsub(myPatt, "", "geNus species strain 123") # many words: return only first - -# apply this to the "name" column and add the result as a separate column -# called "genus" -sDat$genus <- gsub(myPatt, "", sDat$name) - -# what do we get? -c(head(unique(sDat$genus)), - tail(unique(sDat$genus))) # inspect the first and last few. Note that there - # is a problem that we have to keep in mind. - # (Always inspect your results!) -# Drop all rows for which the genus contains special chracters - -# like "[Candida]" -sDat <- sDat[ ! grepl("[^a-zA-Z]", sDat$genus) , ] - -length(table(sDat$genus)) # how many genus? -hist(table(sDat$genus), col = "#E9F4FF") # Distribution ... - # most genus have very few, but - # some have very many species. -sort(table(sDat$genus), decreasing = TRUE)[1:10] # Top ten... - -# We should have at least one species from each taxonomic order, but we can -# add a few genus until we have about 100 validated species. - -# Let's add a column for species, by changing our regular expression a bit, -# using ^ (start of string), \\S (NOT a whitespace), -# and + (one or more matches), capturing the match (...), and returning -# it as the substitution (\\1) ... - -myPatt <- "^(\\S+\\s\\S+)\\s.*$" -sDat$species <- gsub(myPatt, "\\1", sDat$name) - -# And we reorder the columns, just for aesthetics: -sDat <- sDat[ , c("name", "species", "genus", "order", "taxID")] - -# Final check: -any(grepl("[^a-zA-Z -]", sDat$species)) # FALSE means no special characters - -# -# Now we check which of these have Mbp1 homologues ... - -# = 4 BLAST SEARCH ======================================================== - - -# We run a BLAST search to find all proteins related to yeast Mbp1 in any -# fungus. With the results, we'll annotate our sDat table. - -# == 4.1 find homologous proteins ========================================== -# -# Use BLAST to fetch proteins related to Mbp1 and identify the species that -# contain them. - -# Scripting against NCBI APIs is not exactly enjoyable - there is usually a fair -# amount of error handling involved that is not supported by the API in a -# principled way but requires rather ad hoc solutions. The code I threw together -# to make a BLAST interface (demo-quality, not research-quality) is in the file -# ./scripts/BLAST.R Feel encouraged to study how this works. It's a pretty -# standard task of communicating with servers and parsing responses - everyday -# fare in the bioinformatics lab. Surprisingly, there seems to be no good BLAST -# parser in currently available packages. -# -# DON'T use this for BLAST searches unless you have read the NCBI policy -# for automated tasks. If you indicriminately pound on the NCBI's BLAST -# server, they will blacklist your IP-address. See: -# https://blast.ncbi.nlm.nih.gov/Blast.cgi?CMD=Web&PAGE_TYPE=BlastDocs&DOC_TYPE=DeveloperInfo -# -# Use BLAST() to find yeast Mbp1 homologues in other fungi in refseq -# BLASThits <- BLAST("NP_010227", # Yeast Mbp1 RefSeq ID -# db = "refseq_protein", # database to search in -# nHits = 3000, # 945 hits in 2020 -# E = 0.01, # -# limits = "txid4751[ORGN]") # = fungi -# saveRDS(BLASThits, file="data/BLASThits.rds") -# -# NO NEED TO ACTUALLY RUN THIS:you can load the results from the data directory -# -BLASThits <- readRDS(file = "data/BLASThits.rds") - -# == 4.2 Identify species in "hits" ======================================== - -# This is a very big list that can't be usefully analyzed manually. Here -# we are only interested in the species names that it contains. - -# How many hits in the list? -length(BLASThits$hits) # 1,134 - -# Let's look at a hit somewhere down the list -str(BLASThits$hit[[277]]) - -# A fair amount of parsing has gone into the BLAST.R code to prepare the results -# in a useful way. The species information is in the $species element of every -# hit. - -# Run a loop to extract all the species names into a vector. We subset ... -# Blasthits$hits ... the list of hits, from which we choose ... -# Blasthits$hits[[i]] ... the i-th hit, and get ... -# Blasthits$hits[[i]]$species ... the species element from that. -# Subsetting FTW. - -BLASTspecies <- character() -for (i in seq_along(BLASThits$hits)) { - BLASTspecies[i] <- BLASThits$hits[[i]]$species -} - -# You can confirm that BLASTspecies has the expected size. -length(BLASTspecies) - -# if we delete some of these later on, we still want to remember which hit -# they came from. Thus we name() the elements with their index, which is the -# same as the index of the hit in BLASThits -names(BLASTspecies) <- 1:length(BLASTspecies) - - -# let's plot the distribution of E-values -eVals <- numeric() -for (i in seq_along(BLASThits$hits)) { - eVals[i] <- BLASThits$hits[[i]]$E -} -range(eVals) -sum(eVals == 0) - -# let's plot the log of all values > 0 to see how they are distributed -# plotting only one vectyor of numbers plots their index as x, and -# their value as y ... -plot(log(eVals[eVals > 0]), col = "#CC0000") - -# This is very informative: I would suspect that the first ten or so are -# virtually identical to the yeast protein, then we have about 800 hits with -# decreasing similarity, and then about 200 more that may actually be false -# positives. Also - we plotted them by index, that means the table is SORTED: -# Lower E-values strictly come before higher E-values. - -# Again, some species appear more than once, e.g. ... -sum(BLASTspecies == "Saccharomyces cerevisiae") - -# ... corresponding to the five homologous gene sequences (paralogues) of yeast. - -# Therefore we remove duplicates. Removing duplicates will leave the FIRST -# in a list alone, and only remove the SUBSEQUENT ones. Which means, from each -# species, we will retain only the protein that has the highest similarity -# to yeast Mbp1, not any of its more distant paralogues. -sel <- ! duplicated(BLASTspecies) -BLASTspecies <- BLASTspecies[sel] - -length(BLASTspecies) -# i.e. we got rid of about two thirds of the hits. -tail(BLASTspecies) # see how the names are useful! - # again - there are some special characters ... - # what are they? -BLASTspecies[grep("[^a-zA-Z ]", BLASTspecies)] - -# remove the brackets ... -BLASTspecies <- gsub("\\[|\\]", "", BLASTspecies) -# drop any new duplicates ... -BLASTspecies <- BLASTspecies[ ! duplicated(BLASTspecies)] - -# check the number again: -length(BLASTspecies) -# Think a bit about this: what may be the biological reason to find that -# on average, in 388 fungi across the entire phylogenetic tree, we have -# three sequences that are homologous to yeast Mbp1? - -# Let's look at the distribution of E-values in this selection (Subsetting FTW): -# we plot all values that are TRUE in the vector "sel" that we created above, -# AND greater than 0 -plot(log(eVals[sel & eVals > 0]), col = "#00CC00") - - -# = 5 MERGE ENSEMBL AND BLAST RESULTS ===================================== - -# Next we add the blast result to our sDat dataframe. We'll store the index, -# the E-value, and the Query-bounds from which we can estimate which domains -# of Mbp1 are actually covered by the hit. (True orthologues MUST align with -# Mbp1's N-terminal APSES domain.) -# -# First we pull the hits we wanted from the BLASTspecies: -iHits <- as.numeric(names(BLASTspecies)) -length(iHits) # one index for each TRUE in sel - -# add columns to sDat -l <- nrow(sDat) -sDat$iHit <- numeric(l) # index of the hit in the BLAST results -sDat$eVal <- numeric(l) # E-value of the hit -sDat$lAli <- numeric(l) # length of the aligned region - -# extract and merge -for (iHit in iHits) { - thisSp <- BLASThits$hits[[iHit]]$species - sel <- sDat$species == thisSp - - sDat$iHit[sel] <- iHit - sDat$eVal[sel] <- BLASThits$hits[[iHit]]$E - sDat$lAli[sel] <- BLASThits$hits[[iHit]]$lengthAli -} - -# Are all reference species accounted for? -selA <- sDat$iHit != 0 # all rows which matched to a BLAST hit -REFspecies %in% sDat$species[selA] # yes, all there - -selB <- sDat$species %in% REFspecies # all rows which have one of REF species - -sum(selA & selB) # How many rows? - -# sDat of course includes all duplicates. Some may be multiply sequenced, some -# may be different strains. We'll use the same strategy as before and keep -# only the best hit: order the rows by E-value, then drop all rows which -# are duplicated. - - -# drop all rows without BLAST hits ... -sDat <- sDat[ ! (sDat$iHit == 0) , ] - -# order sDat by E-value ... -sDat <- sDat[order(sDat$eVal, decreasing = FALSE) , ] - -# drop all rows with duplicated species ... -sDat <- sDat[ ! duplicated(sDat$species) , ] - -# Lets look at the E-values ... -plot(log(sDat$eVal[sDat$eVal > 0]), col = "#00CC00") - -# and alignment lengths ... -plot(sDat$lAli, col = "#00DDAA") - -# How many ... -length(unique(sDat$name)) -length(unique(sDat$species)) -length(unique(sDat$genus)) -length(unique(sDat$order)) - -# I need an extra species for admin purposes later on ... -sel <- grep("Sporothrix schenckii", sDat$species) -SPOSCdat <- sDat[sel, ] -sDat <- sDat[-sel, ] - -# To get the final dataset, we remove the reference species with their -# entire orders ... -REForders <- unique(sDat$order[sDat$species %in% REFspecies]) -sel <- sDat$order %in% REForders -REFdat <- sDat[sel , ] -sDat <- sDat[ ! sel , ] - -# REFdat should now contain only the REFspecies ... -( REFdat <- REFdat[REFdat$species %in% REFspecies , ] ) - -# ... but all of them -sum(REFspecies %in% REFdat$species) - -# ... and we have enough left in sDat to prune sDat to unique genus -sDat <- sDat[ ! duplicated(sDat$genus) , ] -nrow(sDat) # 84 - -# I add back "Sporothrix schenckii" ... -sDat <- rbind(SPOSCdat, sDat) - -# ... and save for future use. -# saveRDS(sDat, file = "data/sDat.rds") -# saveRDS(REFdat, file = "data/REFdat.rds") - - - -# = 6 STUDENT NUMBERS ===================================================== -# -# An asymmetric function to retrieve a MYSPE species -# -sDat <- readRDS(file = "data/sDat.rds") - -students <- read.csv("../BCH441-2021-students.csv") -sN <- students$Integration.ID -sN <- sN[! is.na(sN)] -sN <- as.character(sN) -sN <- c("1003141593", sN) # will map to "Sporothrix schenckii" - -set.seed(112358) -theseSpecies <- sDat[sample(1:nrow(sDat)), ] -all(sort(theseSpecies$name) == sort(sDat$name)) -nrow((theseSpecies)) -(iX <- grep("Sporothrix schenckii", theseSpecies$name)) -theseSpecies <- rbind(theseSpecies[iX, ], theseSpecies[-iX, ]) -rndMin <- 992000000 -rndMax <- 1020000000 -N <- 10000 -keys <- as.character(sample(rndMin:rndMax, N + 1000)) -keys <- keys[! (keys %in% sN)] -keys <- keys[1:N] -keys[1:length(sN)] <- sN - -nRep <- floor(N/nrow(theseSpecies)) -MYSPEdat <- theseSpecies -for(i in 1:nRep) { - MYSPEdat <- rbind(MYSPEdat, theseSpecies) -} -MYSPEdat <- MYSPEdat[1:N, ] -for (i in 1:N) { - rownames(MYSPEdat)[i] <- digest::digest(keys[i], algo = "md5") -} -set.seed(NULL) -MYSPEdat <- MYSPEdat[sample(1:N), ] - -# saveRDS(MYSPEdat, file = "data/MYSPEdat.rds") - -# === validate -x <- character() -for (n in sN) { - sp <- getMYSPE(n) - if (length(sp) != 1) { - stop(print(as.character(n))) - } else { - x <- c(x, sp) - } -} - -# === species for late-comers -y <- unique(MYSPEdat$species) -print(y[!(y %in% x)]) - - -# === validate -l <- length(sN) -sp <- character(l) -for(i in 1:l) { - sp[i] <- getMYSPE(sN[i]) -} -any(duplicated(sp)) -length(unique(sp)) -which(! sDat$species %in% sp) # these can be assigned to late-comers - -# Done. - -# [END] +# tocID <- "scripts/ABC-makeMYSPElist.R" +# +# Purpose: Create a list of genome sequenced fungi with protein annotations and +# Mbp1 homologues. +# +# Version: 1.4 +# +# Date: 2016 09 - 2021 09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions +# 1.4 New retrieval logic +# 1.3 Rewrite to change datasource. NCBI has not been updated +# since 2012. Use ensembl fungi as initial source. +# 1.2 Change from require() to requireNamespace() +# 1.1.2 Moved BLAST.R to ./scripts directory +# 1.1 Update 2017 +# 1.0 First code 2016 +# +# TODO: +# +# ============================================================================== +# +# DO NOT source() THIS FILE! +# +# This file is code I provide for your deeper understanding of a process and +# to provide you with useful sample code. It is not actually necessary for +# you to run this code, but I encourage you to read it carefully and discuss +# if there are parts you don't understand. +# +# Run the commands that interact with the NCBI servers only if you want to +# experiment specifically with the code and/or parameters. I have commented out +# those parts. If you only want to study the general workflow, just load() +# the respective intermediate results. +# + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> -------------------------------------------------------- +#TOC> 1 The strategy 55 +#TOC> 2 PACKAGES AND INITIALIZATIONS 67 +#TOC> 3 ENSEMBL FUNGI 75 +#TOC> 3.1 Import 78 +#TOC> 4 BLAST SEARCH 155 +#TOC> 4.1 find homologous proteins 161 +#TOC> 4.2 Identify species in "hits" 192 +#TOC> 5 MERGE ENSEMBL AND BLAST RESULTS 282 +#TOC> 6 STUDENT NUMBERS 375 +#TOC> +#TOC> ========================================================================== + + +# = 1 The strategy ======================================================== + +# This script will create a list of "MYSPE" species and save it in an R object +# MYSPEspecies that is stored in the data subdirectory of this project from +# where it can be loaded. The strategy is as follows: we download a list of +# annotated fungal genomes from ensembl.fungi. All these are genome-sequenced +# species that have been annotated. +# Next we perform a BLAST search, to identify fungal species that have +# genes that are homologous to yeast MBP1. +# +# ... + +# = 2 PACKAGES AND INITIALIZATIONS ======================================== + +# httr provides interfaces to Webservers on the Internet +if (! requireNamespace("httr", quietly = TRUE)) { + install.packages("httr") +} + + +# = 3 ENSEMBL FUNGI ======================================================= + + +# == 3.1 Import ============================================================ + +# Navigate to https://fungi.ensembl.org and click on the link to the full +# list of all species: https://fungi.ensembl.org/species.html +# On the page, click on the spreadsheet symbol top right and choose +# "download whole table". The file will be named "Species.csv", in your +# usual downloads folder. Move it to the data folder, and read it. + +sDat <- read.csv("./data/Species.csv") +str(sDat) + +# The most obvious way to partition these is according to Classification ... +# (poking around a bit in the UniProt taxonomy database shows that the +# classification used here is the taxonomic rank of "order"). +# how many classifications do we have? +length(unique(sDat$Classification)) # 66 + +# To have a good set for the class, we should have about 100. +# Let's see for which of these we can find Mbp1 homologues. +# First, we'll keep only the colums for name, classification, and taxID, and +# drop the rest ... +sDat <- sDat[ , c("Name", "Classification", "Taxon.ID")] +colnames(sDat) <- c("name", "order", "taxID") + +# Next, we make an extra column: genus - the first part of the binomial name. +# We'll use the gsub() function, and for that we need a "regular expression" +# that matches to all characters from the first blank to the end of the string: +myPatt <- "\\s.*$" # one whitespace (\\s) ... + # followed by any character (.) 0..n times (*) ... + # until the end of the string + +# using gsub() we substitue all matching characters with the empty string "" - +# this deletes the matching characters +# Test this: +gsub(myPatt, "", "Genus") # one word: unchanged +gsub(myPatt, "", "gEnus species") # two words: return only first +gsub(myPatt, "", "geNus species strain 123") # many words: return only first + +# apply this to the "name" column and add the result as a separate column +# called "genus" +sDat$genus <- gsub(myPatt, "", sDat$name) + +# what do we get? +c(head(unique(sDat$genus)), + tail(unique(sDat$genus))) # inspect the first and last few. Note that there + # is a problem that we have to keep in mind. + # (Always inspect your results!) +# Drop all rows for which the genus contains special chracters - +# like "[Candida]" +sDat <- sDat[ ! grepl("[^a-zA-Z]", sDat$genus) , ] + +length(table(sDat$genus)) # how many genus? +hist(table(sDat$genus), col = "#E9F4FF") # Distribution ... + # most genus have very few, but + # some have very many species. +sort(table(sDat$genus), decreasing = TRUE)[1:10] # Top ten... + +# We should have at least one species from each taxonomic order, but we can +# add a few genus until we have about 100 validated species. + +# Let's add a column for species, by changing our regular expression a bit, +# using ^ (start of string), \\S (NOT a whitespace), +# and + (one or more matches), capturing the match (...), and returning +# it as the substitution (\\1) ... + +myPatt <- "^(\\S+\\s\\S+)\\s.*$" +sDat$species <- gsub(myPatt, "\\1", sDat$name) + +# And we reorder the columns, just for aesthetics: +sDat <- sDat[ , c("name", "species", "genus", "order", "taxID")] + +# Final check: +any(grepl("[^a-zA-Z -]", sDat$species)) # FALSE means no special characters + +# +# Now we check which of these have Mbp1 homologues ... + +# = 4 BLAST SEARCH ======================================================== + + +# We run a BLAST search to find all proteins related to yeast Mbp1 in any +# fungus. With the results, we'll annotate our sDat table. + +# == 4.1 find homologous proteins ========================================== +# +# Use BLAST to fetch proteins related to Mbp1 and identify the species that +# contain them. + +# Scripting against NCBI APIs is not exactly enjoyable - there is usually a fair +# amount of error handling involved that is not supported by the API in a +# principled way but requires rather ad hoc solutions. The code I threw together +# to make a BLAST interface (demo-quality, not research-quality) is in the file +# ./scripts/BLAST.R Feel encouraged to study how this works. It's a pretty +# standard task of communicating with servers and parsing responses - everyday +# fare in the bioinformatics lab. Surprisingly, there seems to be no good BLAST +# parser in currently available packages. +# +# DON'T use this for BLAST searches unless you have read the NCBI policy +# for automated tasks. If you indicriminately pound on the NCBI's BLAST +# server, they will blacklist your IP-address. See: +# https://blast.ncbi.nlm.nih.gov/Blast.cgi?CMD=Web&PAGE_TYPE=BlastDocs&DOC_TYPE=DeveloperInfo +# +# Use BLAST() to find yeast Mbp1 homologues in other fungi in refseq +# BLASThits <- BLAST("NP_010227", # Yeast Mbp1 RefSeq ID +# db = "refseq_protein", # database to search in +# nHits = 3000, # 945 hits in 2020 +# E = 0.01, # +# limits = "txid4751[ORGN]") # = fungi +# saveRDS(BLASThits, file="data/BLASThits.rds") +# +# NO NEED TO ACTUALLY RUN THIS:you can load the results from the data directory +# +BLASThits <- readRDS(file = "data/BLASThits.rds") + +# == 4.2 Identify species in "hits" ======================================== + +# This is a very big list that can't be usefully analyzed manually. Here +# we are only interested in the species names that it contains. + +# How many hits in the list? +length(BLASThits$hits) # 1,134 + +# Let's look at a hit somewhere down the list +str(BLASThits$hit[[277]]) + +# A fair amount of parsing has gone into the BLAST.R code to prepare the results +# in a useful way. The species information is in the $species element of every +# hit. + +# Run a loop to extract all the species names into a vector. We subset ... +# Blasthits$hits ... the list of hits, from which we choose ... +# Blasthits$hits[[i]] ... the i-th hit, and get ... +# Blasthits$hits[[i]]$species ... the species element from that. +# Subsetting FTW. + +BLASTspecies <- character() +for (i in seq_along(BLASThits$hits)) { + BLASTspecies[i] <- BLASThits$hits[[i]]$species +} + +# You can confirm that BLASTspecies has the expected size. +length(BLASTspecies) + +# if we delete some of these later on, we still want to remember which hit +# they came from. Thus we name() the elements with their index, which is the +# same as the index of the hit in BLASThits +names(BLASTspecies) <- 1:length(BLASTspecies) + + +# let's plot the distribution of E-values +eVals <- numeric() +for (i in seq_along(BLASThits$hits)) { + eVals[i] <- BLASThits$hits[[i]]$E +} +range(eVals) +sum(eVals == 0) + +# let's plot the log of all values > 0 to see how they are distributed +# plotting only one vectyor of numbers plots their index as x, and +# their value as y ... +plot(log(eVals[eVals > 0]), col = "#CC0000") + +# This is very informative: I would suspect that the first ten or so are +# virtually identical to the yeast protein, then we have about 800 hits with +# decreasing similarity, and then about 200 more that may actually be false +# positives. Also - we plotted them by index, that means the table is SORTED: +# Lower E-values strictly come before higher E-values. + +# Again, some species appear more than once, e.g. ... +sum(BLASTspecies == "Saccharomyces cerevisiae") + +# ... corresponding to the five homologous gene sequences (paralogues) of yeast. + +# Therefore we remove duplicates. Removing duplicates will leave the FIRST +# in a list alone, and only remove the SUBSEQUENT ones. Which means, from each +# species, we will retain only the protein that has the highest similarity +# to yeast Mbp1, not any of its more distant paralogues. +sel <- ! duplicated(BLASTspecies) +BLASTspecies <- BLASTspecies[sel] + +length(BLASTspecies) +# i.e. we got rid of about two thirds of the hits. +tail(BLASTspecies) # see how the names are useful! + # again - there are some special characters ... + # what are they? +BLASTspecies[grep("[^a-zA-Z ]", BLASTspecies)] + +# remove the brackets ... +BLASTspecies <- gsub("\\[|\\]", "", BLASTspecies) +# drop any new duplicates ... +BLASTspecies <- BLASTspecies[ ! duplicated(BLASTspecies)] + +# check the number again: +length(BLASTspecies) +# Think a bit about this: what may be the biological reason to find that +# on average, in 388 fungi across the entire phylogenetic tree, we have +# three sequences that are homologous to yeast Mbp1? + +# Let's look at the distribution of E-values in this selection (Subsetting FTW): +# we plot all values that are TRUE in the vector "sel" that we created above, +# AND greater than 0 +plot(log(eVals[sel & eVals > 0]), col = "#00CC00") + + +# = 5 MERGE ENSEMBL AND BLAST RESULTS ===================================== + +# Next we add the blast result to our sDat dataframe. We'll store the index, +# the E-value, and the Query-bounds from which we can estimate which domains +# of Mbp1 are actually covered by the hit. (True orthologues MUST align with +# Mbp1's N-terminal APSES domain.) +# +# First we pull the hits we wanted from the BLASTspecies: +iHits <- as.numeric(names(BLASTspecies)) +length(iHits) # one index for each TRUE in sel + +# add columns to sDat +l <- nrow(sDat) +sDat$iHit <- numeric(l) # index of the hit in the BLAST results +sDat$eVal <- numeric(l) # E-value of the hit +sDat$lAli <- numeric(l) # length of the aligned region + +# extract and merge +for (iHit in iHits) { + thisSp <- BLASThits$hits[[iHit]]$species + sel <- sDat$species == thisSp + + sDat$iHit[sel] <- iHit + sDat$eVal[sel] <- BLASThits$hits[[iHit]]$E + sDat$lAli[sel] <- BLASThits$hits[[iHit]]$lengthAli +} + +# Are all reference species accounted for? +selA <- sDat$iHit != 0 # all rows which matched to a BLAST hit +REFspecies %in% sDat$species[selA] # yes, all there + +selB <- sDat$species %in% REFspecies # all rows which have one of REF species + +sum(selA & selB) # How many rows? + +# sDat of course includes all duplicates. Some may be multiply sequenced, some +# may be different strains. We'll use the same strategy as before and keep +# only the best hit: order the rows by E-value, then drop all rows which +# are duplicated. + + +# drop all rows without BLAST hits ... +sDat <- sDat[ ! (sDat$iHit == 0) , ] + +# order sDat by E-value ... +sDat <- sDat[order(sDat$eVal, decreasing = FALSE) , ] + +# drop all rows with duplicated species ... +sDat <- sDat[ ! duplicated(sDat$species) , ] + +# Lets look at the E-values ... +plot(log(sDat$eVal[sDat$eVal > 0]), col = "#00CC00") + +# and alignment lengths ... +plot(sDat$lAli, col = "#00DDAA") + +# How many ... +length(unique(sDat$name)) +length(unique(sDat$species)) +length(unique(sDat$genus)) +length(unique(sDat$order)) + +# I need an extra species for admin purposes later on ... +sel <- grep("Sporothrix schenckii", sDat$species) +SPOSCdat <- sDat[sel, ] +sDat <- sDat[-sel, ] + +# To get the final dataset, we remove the reference species with their +# entire orders ... +REForders <- unique(sDat$order[sDat$species %in% REFspecies]) +sel <- sDat$order %in% REForders +REFdat <- sDat[sel , ] +sDat <- sDat[ ! sel , ] + +# REFdat should now contain only the REFspecies ... +( REFdat <- REFdat[REFdat$species %in% REFspecies , ] ) + +# ... but all of them +sum(REFspecies %in% REFdat$species) + +# ... and we have enough left in sDat to prune sDat to unique genus +sDat <- sDat[ ! duplicated(sDat$genus) , ] +nrow(sDat) # 84 + +# I add back "Sporothrix schenckii" ... +sDat <- rbind(SPOSCdat, sDat) + +# ... and save for future use. +# saveRDS(sDat, file = "data/sDat.rds") +# saveRDS(REFdat, file = "data/REFdat.rds") + + + +# = 6 STUDENT NUMBERS ===================================================== +# +# An asymmetric function to retrieve a MYSPE species +# +sDat <- readRDS(file = "data/sDat.rds") + +students <- read.csv("../BCH441-2021-students.csv") +sN <- students$Integration.ID +sN <- sN[! is.na(sN)] +sN <- as.character(sN) +sN <- c("1003141593", sN) # will map to "Sporothrix schenckii" + +set.seed(112358) +theseSpecies <- sDat[sample(1:nrow(sDat)), ] +all(sort(theseSpecies$name) == sort(sDat$name)) +nrow((theseSpecies)) +(iX <- grep("Sporothrix schenckii", theseSpecies$name)) +theseSpecies <- rbind(theseSpecies[iX, ], theseSpecies[-iX, ]) +rndMin <- 992000000 +rndMax <- 1020000000 +N <- 10000 +keys <- as.character(sample(rndMin:rndMax, N + 1000)) +keys <- keys[! (keys %in% sN)] +keys <- keys[1:N] +keys[1:length(sN)] <- sN + +nRep <- floor(N/nrow(theseSpecies)) +MYSPEdat <- theseSpecies +for(i in 1:nRep) { + MYSPEdat <- rbind(MYSPEdat, theseSpecies) +} +MYSPEdat <- MYSPEdat[1:N, ] +for (i in 1:N) { + rownames(MYSPEdat)[i] <- digest::digest(keys[i], algo = "md5") +} +set.seed(NULL) +MYSPEdat <- MYSPEdat[sample(1:N), ] + +# saveRDS(MYSPEdat, file = "data/MYSPEdat.rds") + +# === validate +x <- character() +for (n in sN) { + sp <- getMYSPE(n) + if (length(sp) != 1) { + stop(print(as.character(n))) + } else { + x <- c(x, sp) + } +} + +# === species for late-comers +y <- unique(MYSPEdat$species) +print(y[!(y %in% x)]) + + +# === validate +l <- length(sN) +sp <- character(l) +for(i in 1:l) { + sp[i] <- getMYSPE(sN[i]) +} +any(duplicated(sp)) +length(unique(sp)) +which(! sDat$species %in% sp) # these can be assigned to late-comers + +# Done. + +# [END] diff --git a/scripts/ABC-makeSTRINGedges.R b/scripts/ABC-makeSTRINGedges.R index 0da774a..e4c050d 100644 --- a/scripts/ABC-makeSTRINGedges.R +++ b/scripts/ABC-makeSTRINGedges.R @@ -1,168 +1,168 @@ -# tocID <- "scripts/ABC-makeSTRINGedges.R" -# -# Create a subnetwork of high-confidence human STRING edges. -# -# Notes: -# -# The large source- datafile is NOT posted to github. If you want to -# experiment with the original data, download it and place it into your -# local ./data directory. -# -# STRING data source: -# Download page: -# https://string-db.org/cgi/download.pl?species_text=Homo+sapiens -# Data: (127.6 Mb) -# https://stringdb-static.org/download/protein.links.full.v11.0/9606.protein.links.full.v11.0.txt.gz -# -# Version: 1.0 -# -# Date: 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.0 Rewrite -# -# TODO: -# -# ============================================================================== - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> ------------------------------------------------- -#TOC> 1 Initialize 44 -#TOC> 2 Read STRING Data 51 -#TOC> 3 Define cutoff and subset 63 -#TOC> 4 Drop duplicates 103 -#TOC> 5 Simple statistics 127 -#TOC> 6 Write to file 160 -#TOC> -#TOC> ========================================================================== - - -# = 1 Initialize ========================================================== - -if (! requireNamespace("readr", quietly = TRUE)) { - install.packages("readr") -} - - -# = 2 Read STRING Data ==================================================== - -# Read STRING Data (needs to be downloaded from database, see URL in Notes) -# The .gz compressed version is 127.6MB, the uncompressed version is probably -# 848 Mb. Fortunately readr:: can read from compressed -# files, and does so automatically, based on the file extension. -( fn <- file.path("~", "9606.protein.links.full.v11.0.txt.gz") ) -STR <- readr::read_delim(fn, delim = " ") -nrow(STR) # 11,759,454 rows -head(STR) - - -# = 3 Define cutoff and subset ============================================ - -# approximate distribution of combined_score -hist(sample(STR$combined_score, 10000), breaks = 50, col = "#6699FF") - -# Let's table the counts >= 850 and plot them for better resolution. - -myTb <- table(STR$combined_score[STR$combined_score >= 850]) -is.unsorted(as.integer(names(myTb))) # Good - they are all in order - -plot(myTb, type = "b", cex = 0.5, col = "#BB0000") -myTb[myTb == max(myTb)] # Apparently there is an algorithmic effect that - # frequently assigns a combined score of 0.900 - -# Let's plot these counts as cumulative sums, in reverse order, scaled -# as combined scores. -myX <- 1 - (1:length(myTb)) / 1000 # x-values, decreasing -plot(myX, - cumsum(myTb[length(myTb):1]), # cumulative sum, decreasing - xlim = c(1.0, 0.85), # reverse x-axis - type = "l", - main = "STRING interactions for 9606 (top 600,000)", - xlab = "combined_score", - ylab = "cumulative counts", - col = "#CC0000") -abline(h = seq(50000, sum(myTb), by = 50000), lwd = 0.5, col = "#DDDDFF") - -# What's the cutoff for 100,000 edges? -which(cumsum(myTb[length(myTb):1]) >= 100000)[1] # p = 0.964 - -# confirm -sum(STR$combined_score >= 964) # 101,348 -abline(v = 0.964, lwd = 0.5, col = "#DDDDFF") - -# subset the table, and use only the protein IDs and the combined_score -STR <- STR[STR$combined_score >= 964, - c("protein1", "protein2", "combined_score")] -colnames(STR) <- c("a", "b", "score") - - -# = 4 Drop duplicates ==================================================== - -# identify duplicate interactions by creating keys in a defined alphabetical -# sort order, then checking for duplicated(). -# e.g if we have (X:U, U:X), we change U:X to X:U and now find that -# (X:U, X:U) has a duplicate. - -AB <- STR$a < STR$b # logical vector: genes we need to swap -tmp <- STR$b # copy column b -STR$b[AB] <- STR$a[AB] # copy a's into b -STR$a[AB] <- tmp[AB] # copy tmp's into a -all(STR$a >= STR$b) # confirm: TRUE - -# now, make combined keys, like this: -paste0(STR$a[1:10], ":", STR$b[1:10]) - -tmp <- paste0(STR$a, ":", STR$b) -sum(duplicated(tmp)) # That's half of them ... i.e. STRING reports - # both a:b and b:a ! - -# drop all duplicated interactions from tmp -STR <- STR[ ! duplicated(tmp), ] # 50,674 interactions remain - - -# = 5 Simple statistics =================================================== - -# how many unique genes? -length(unique(c(STR$a, STR$b))) # 8,445 - -# how many self-edges? -sum(STR$a == STR$b) # none - -# log(rank) / log(frequency) -myTbl <- table(c(STR$a, STR$b)) -myTbl <- myTbl[order(myTbl, decreasing = TRUE)] - -hist(myTbl, breaks = 40, col = "#FFEEBB") - -# number of singletons -sum(myTbl == 1) # almost a quarter - -# maximum? -myTbl[which(myTbl == max(myTbl))] # 9606.ENSP00000360532: 465 - # Google: CDC5L - -# Zipf-plot -plot(log(1:length(myTbl)), log(as.numeric(myTbl)), - type = "b", cex = 0.7, - main = "STRINGedges - degrees", - xlab = "log(rank)", - ylab = "log(frequency)", - col = "#FFBB88") - -sprintf("Average number of interactions: %5.2f", - nrow(STR) / length(unique(c(STR$a, STR$b)))) - - -# = 6 Write to file ======================================================= - -saveRDS(STR, file = "./data/STRINGedges.rds") - -# STRINGedges <- readRDS("./data/STRINGedges.rds") # use this to restore the - # object when needed - - -# [END] +# tocID <- "scripts/ABC-makeSTRINGedges.R" +# +# Create a subnetwork of high-confidence human STRING edges. +# +# Notes: +# +# The large source- datafile is NOT posted to github. If you want to +# experiment with the original data, download it and place it into your +# local ./data directory. +# +# STRING data source: +# Download page: +# https://string-db.org/cgi/download.pl?species_text=Homo+sapiens +# Data: (127.6 Mb) +# https://stringdb-static.org/download/protein.links.full.v11.0/9606.protein.links.full.v11.0.txt.gz +# +# Version: 1.0 +# +# Date: 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.0 Rewrite +# +# TODO: +# +# ============================================================================== + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> ------------------------------------------------- +#TOC> 1 Initialize 44 +#TOC> 2 Read STRING Data 51 +#TOC> 3 Define cutoff and subset 63 +#TOC> 4 Drop duplicates 103 +#TOC> 5 Simple statistics 127 +#TOC> 6 Write to file 160 +#TOC> +#TOC> ========================================================================== + + +# = 1 Initialize ========================================================== + +if (! requireNamespace("readr", quietly = TRUE)) { + install.packages("readr") +} + + +# = 2 Read STRING Data ==================================================== + +# Read STRING Data (needs to be downloaded from database, see URL in Notes) +# The .gz compressed version is 127.6MB, the uncompressed version is probably +# 848 Mb. Fortunately readr:: can read from compressed +# files, and does so automatically, based on the file extension. +( fn <- file.path("~", "9606.protein.links.full.v11.0.txt.gz") ) +STR <- readr::read_delim(fn, delim = " ") +nrow(STR) # 11,759,454 rows +head(STR) + + +# = 3 Define cutoff and subset ============================================ + +# approximate distribution of combined_score +hist(sample(STR$combined_score, 10000), breaks = 50, col = "#6699FF") + +# Let's table the counts >= 850 and plot them for better resolution. + +myTb <- table(STR$combined_score[STR$combined_score >= 850]) +is.unsorted(as.integer(names(myTb))) # Good - they are all in order + +plot(myTb, type = "b", cex = 0.5, col = "#BB0000") +myTb[myTb == max(myTb)] # Apparently there is an algorithmic effect that + # frequently assigns a combined score of 0.900 + +# Let's plot these counts as cumulative sums, in reverse order, scaled +# as combined scores. +myX <- 1 - (1:length(myTb)) / 1000 # x-values, decreasing +plot(myX, + cumsum(myTb[length(myTb):1]), # cumulative sum, decreasing + xlim = c(1.0, 0.85), # reverse x-axis + type = "l", + main = "STRING interactions for 9606 (top 600,000)", + xlab = "combined_score", + ylab = "cumulative counts", + col = "#CC0000") +abline(h = seq(50000, sum(myTb), by = 50000), lwd = 0.5, col = "#DDDDFF") + +# What's the cutoff for 100,000 edges? +which(cumsum(myTb[length(myTb):1]) >= 100000)[1] # p = 0.964 + +# confirm +sum(STR$combined_score >= 964) # 101,348 +abline(v = 0.964, lwd = 0.5, col = "#DDDDFF") + +# subset the table, and use only the protein IDs and the combined_score +STR <- STR[STR$combined_score >= 964, + c("protein1", "protein2", "combined_score")] +colnames(STR) <- c("a", "b", "score") + + +# = 4 Drop duplicates ==================================================== + +# identify duplicate interactions by creating keys in a defined alphabetical +# sort order, then checking for duplicated(). +# e.g if we have (X:U, U:X), we change U:X to X:U and now find that +# (X:U, X:U) has a duplicate. + +AB <- STR$a < STR$b # logical vector: genes we need to swap +tmp <- STR$b # copy column b +STR$b[AB] <- STR$a[AB] # copy a's into b +STR$a[AB] <- tmp[AB] # copy tmp's into a +all(STR$a >= STR$b) # confirm: TRUE + +# now, make combined keys, like this: +paste0(STR$a[1:10], ":", STR$b[1:10]) + +tmp <- paste0(STR$a, ":", STR$b) +sum(duplicated(tmp)) # That's half of them ... i.e. STRING reports + # both a:b and b:a ! + +# drop all duplicated interactions from tmp +STR <- STR[ ! duplicated(tmp), ] # 50,674 interactions remain + + +# = 5 Simple statistics =================================================== + +# how many unique genes? +length(unique(c(STR$a, STR$b))) # 8,445 + +# how many self-edges? +sum(STR$a == STR$b) # none + +# log(rank) / log(frequency) +myTbl <- table(c(STR$a, STR$b)) +myTbl <- myTbl[order(myTbl, decreasing = TRUE)] + +hist(myTbl, breaks = 40, col = "#FFEEBB") + +# number of singletons +sum(myTbl == 1) # almost a quarter + +# maximum? +myTbl[which(myTbl == max(myTbl))] # 9606.ENSP00000360532: 465 + # Google: CDC5L + +# Zipf-plot +plot(log(1:length(myTbl)), log(as.numeric(myTbl)), + type = "b", cex = 0.7, + main = "STRINGedges - degrees", + xlab = "log(rank)", + ylab = "log(frequency)", + col = "#FFBB88") + +sprintf("Average number of interactions: %5.2f", + nrow(STR) / length(unique(c(STR$a, STR$b)))) + + +# = 6 Write to file ======================================================= + +saveRDS(STR, file = "./data/STRINGedges.rds") + +# STRINGedges <- readRDS("./data/STRINGedges.rds") # use this to restore the + # object when needed + + +# [END] diff --git a/scripts/ABC-makeScCCnet.R b/scripts/ABC-makeScCCnet.R index b464d54..bd31a3e 100644 --- a/scripts/ABC-makeScCCnet.R +++ b/scripts/ABC-makeScCCnet.R @@ -1,167 +1,167 @@ -# tocID <- "scripts/ABC-makeScCCnet.R" -# -# Create a subnetwork of high-confidence yeast genes with a "mitotic cell cycle" -# GOSlim annotation. -# -# Boris Steipe for ABC learning units -# -# Notes: -# -# The large source- datafiles are NOT posted to github. If you want to -# experiment with your own code, download them and place them into your -# local ./data directory. -# -# STRING data source: -# Download page: -# https://string-db.org/cgi/download.pl?species_text=Saccharomyces+cerevisiae -# Data: (20.1 mb) -# https://stringdb-static.org/download/protein.links.full.v11.0/4932.protein.links.full.v11.0.txt.gz -# -# GOSlim data source: (Note: this has moved from GO to SGD) -# Info page: https://www.yeastgenome.org/downloads -# Info page: http://sgd-archive.yeastgenome.org/curation/literature/ -# Data: (3 mb) -# http://sgd-archive.yeastgenome.org/curation/literature/go_slim_mapping.tab -# -# -# Version: 1.2 -# -# Date: 2017-10 - 2020-09 -# Author: Boris Steipe (boris.steipe@utoronto.ca) -# -# Versions: -# 1.2 2020 Update. GO Slim Yeast mow at SGD -# 1.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 1.0 First code copied from 2016 material. -# -# TODO: -# -# ============================================================================== -# SRCDIR <- "./instructor" - - -#TOC> ========================================================================== -#TOC> -#TOC> Section Title Line -#TOC> --------------------------------------------------------------- -#TOC> 1 INITIALIZE 58 -#TOC> 2 STRING FUNCTIONAL INTERACTION DATA 66 -#TOC> 3 GOSlim FUNCTIONAL ANNOTATIONS 96 -#TOC> 3.1 Intersect interactions and annotations 122 -#TOC> 4 DEFINE THE CELL-CYCLE NETWORK 128 -#TOC> -#TOC> ========================================================================== - - -# = 1 INITIALIZE ========================================================== - -SRCDIR <- "./data" -if (! requireNamespace("readr", quietly = TRUE)) { - install.packages("readr") -} - - -# = 2 STRING FUNCTIONAL INTERACTION DATA ================================== - -# Read STRING Data (needs to be downloaded from database, see URL in Notes) -# The .gz compressed version is 20MB, the uncompressed versioj is 110MB - -# really not necessary to uncompress since readr:: can read from compressed -# files, and does so automatically, based on the file extension. -( fn <- file.path(SRCDIR, "4932.protein.links.full.v11.0.txt.gz") ) -STR <- readr::read_delim(fn, delim = " ") - -# Subset only IDs and combined_score column -STR <- STR[ , c("protein1", "protein2", "combined_score")] - -# head(STR) -# sum(STR$combined_score > 909) # 100270 edges -# subset for 100,000 highest confidence edges -STR <- STR[(STR$combined_score > 909), ] -head(STR) - -# IDs are formatted like 4932.YAL005C ... drop the "4932." prefix -STR$protein1 <- gsub("^4932\\.", "", STR$protein1) -STR$protein2 <- gsub("^4932\\.", "", STR$protein2) -head(STR) - -# get a vector of gene names in this list -myIntxGenes <- unique(c(STR$protein1, STR$protein2)) # yeast systematic gene - # names -length(myIntxGenes) -sample(myIntxGenes, 10) # choose 10 at random (sanity check) - - -# = 3 GOSlim FUNCTIONAL ANNOTATIONS ======================================= -# -# Read GOSlim data (needs to be downloaded from database, see URL in Notes) -( fn <- file.path(SRCDIR, "go_slim_mapping.tab") ) - -Gsl <- readr::read_tsv(fn, - col_names = c("ID", - "name", - "SGDId", - "Ontology", - "termName", - "termID", - "status")) - -head(Gsl) - -# What cell cycle names does it contain? -myGslTermNames <- unique(Gsl$termName) # 169 unique terms -myGslTermNames[grep("cycle", myGslTermNames)] -# [1] "regulation of cell cycle" "mitotic cell cycle" "meiotic cell cycle" - -# Choose "mitotic cell cycle" as the GOslim term to subset with - -scCCgenes <- unique(Gsl$ID[Gsl$termName == "mitotic cell cycle"]) -length(scCCgenes) # 324 genes annotated to that term - -# == 3.1 Intersect interactions and annotations ============================ - -sum(scCCgenes %in% myIntxGenes) # 307 of these have high-confidence -# # functional interactions - - -# = 4 DEFINE THE CELL-CYCLE NETWORK ======================================= -# -# Define scCCnet ... the S. Cervisiae Cell Cycle network -# Subset all rows for which BOTH genes are in the GOslim cell cycle set -# -scCCnet <- STR[(STR$protein1 %in% scCCgenes) & - (STR$protein2 %in% scCCgenes), ] - -# How many genes are there? -length(unique(c(scCCnet$protein1, scCCnet$protein2))) #283 - -# Each edge is listed twice - now remove duplicates. - -# Step 1: make a vector: sort two names so the fiRst one is alphabetically -# smaller Than the second one. This brings the two names into a defined -# order. Then concatenate them with a "." - the resulting string -# is always the same, for any order. E.g. c("A", "B") gives "A.B" -# and c("B", "A") also gives "A.B". This identifies duplicates. - -x <- apply(cbind(scCCnet$protein1, scCCnet$protein2), - 1, - FUN = function(x) { return(paste(sort(x), collapse = ".")) }) -head(x) # "YAL016W.YGR040W" "YAL016W.YOR014W" "YAL016W.YDL188C" ... etc. - -sum(duplicated(x)) # 1453 - -# Step 2: drop all rows that contain duplicates in x -scCCnet <- scCCnet[! duplicated(x), ] - -# Confirm we didn't loose genes -length(unique(c(scCCnet$protein1, scCCnet$protein2))) # 283, no change -nrow(scCCnet) -# Network has 283 nodes, 1453 edges - -saveRDS(scCCnet, file = "./data/scCCnet.rds") - -# scCCnet <- readRDS("./data/scCCnet.rds") # <<<- use this to restore the - # object when needed - - -# [END] +# tocID <- "scripts/ABC-makeScCCnet.R" +# +# Create a subnetwork of high-confidence yeast genes with a "mitotic cell cycle" +# GOSlim annotation. +# +# Boris Steipe for ABC learning units +# +# Notes: +# +# The large source- datafiles are NOT posted to github. If you want to +# experiment with your own code, download them and place them into your +# local ./data directory. +# +# STRING data source: +# Download page: +# https://string-db.org/cgi/download.pl?species_text=Saccharomyces+cerevisiae +# Data: (20.1 mb) +# https://stringdb-static.org/download/protein.links.full.v11.0/4932.protein.links.full.v11.0.txt.gz +# +# GOSlim data source: (Note: this has moved from GO to SGD) +# Info page: https://www.yeastgenome.org/downloads +# Info page: http://sgd-archive.yeastgenome.org/curation/literature/ +# Data: (3 mb) +# http://sgd-archive.yeastgenome.org/curation/literature/go_slim_mapping.tab +# +# +# Version: 1.2 +# +# Date: 2017-10 - 2020-09 +# Author: Boris Steipe (boris.steipe@utoronto.ca) +# +# Versions: +# 1.2 2020 Update. GO Slim Yeast mow at SGD +# 1.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 1.0 First code copied from 2016 material. +# +# TODO: +# +# ============================================================================== +# SRCDIR <- "./instructor" + + +#TOC> ========================================================================== +#TOC> +#TOC> Section Title Line +#TOC> --------------------------------------------------------------- +#TOC> 1 INITIALIZE 58 +#TOC> 2 STRING FUNCTIONAL INTERACTION DATA 66 +#TOC> 3 GOSlim FUNCTIONAL ANNOTATIONS 96 +#TOC> 3.1 Intersect interactions and annotations 122 +#TOC> 4 DEFINE THE CELL-CYCLE NETWORK 128 +#TOC> +#TOC> ========================================================================== + + +# = 1 INITIALIZE ========================================================== + +SRCDIR <- "./data" +if (! requireNamespace("readr", quietly = TRUE)) { + install.packages("readr") +} + + +# = 2 STRING FUNCTIONAL INTERACTION DATA ================================== + +# Read STRING Data (needs to be downloaded from database, see URL in Notes) +# The .gz compressed version is 20MB, the uncompressed versioj is 110MB - +# really not necessary to uncompress since readr:: can read from compressed +# files, and does so automatically, based on the file extension. +( fn <- file.path(SRCDIR, "4932.protein.links.full.v11.0.txt.gz") ) +STR <- readr::read_delim(fn, delim = " ") + +# Subset only IDs and combined_score column +STR <- STR[ , c("protein1", "protein2", "combined_score")] + +# head(STR) +# sum(STR$combined_score > 909) # 100270 edges +# subset for 100,000 highest confidence edges +STR <- STR[(STR$combined_score > 909), ] +head(STR) + +# IDs are formatted like 4932.YAL005C ... drop the "4932." prefix +STR$protein1 <- gsub("^4932\\.", "", STR$protein1) +STR$protein2 <- gsub("^4932\\.", "", STR$protein2) +head(STR) + +# get a vector of gene names in this list +myIntxGenes <- unique(c(STR$protein1, STR$protein2)) # yeast systematic gene + # names +length(myIntxGenes) +sample(myIntxGenes, 10) # choose 10 at random (sanity check) + + +# = 3 GOSlim FUNCTIONAL ANNOTATIONS ======================================= +# +# Read GOSlim data (needs to be downloaded from database, see URL in Notes) +( fn <- file.path(SRCDIR, "go_slim_mapping.tab") ) + +Gsl <- readr::read_tsv(fn, + col_names = c("ID", + "name", + "SGDId", + "Ontology", + "termName", + "termID", + "status")) + +head(Gsl) + +# What cell cycle names does it contain? +myGslTermNames <- unique(Gsl$termName) # 169 unique terms +myGslTermNames[grep("cycle", myGslTermNames)] +# [1] "regulation of cell cycle" "mitotic cell cycle" "meiotic cell cycle" + +# Choose "mitotic cell cycle" as the GOslim term to subset with + +scCCgenes <- unique(Gsl$ID[Gsl$termName == "mitotic cell cycle"]) +length(scCCgenes) # 324 genes annotated to that term + +# == 3.1 Intersect interactions and annotations ============================ + +sum(scCCgenes %in% myIntxGenes) # 307 of these have high-confidence +# # functional interactions + + +# = 4 DEFINE THE CELL-CYCLE NETWORK ======================================= +# +# Define scCCnet ... the S. Cervisiae Cell Cycle network +# Subset all rows for which BOTH genes are in the GOslim cell cycle set +# +scCCnet <- STR[(STR$protein1 %in% scCCgenes) & + (STR$protein2 %in% scCCgenes), ] + +# How many genes are there? +length(unique(c(scCCnet$protein1, scCCnet$protein2))) #283 + +# Each edge is listed twice - now remove duplicates. + +# Step 1: make a vector: sort two names so the fiRst one is alphabetically +# smaller Than the second one. This brings the two names into a defined +# order. Then concatenate them with a "." - the resulting string +# is always the same, for any order. E.g. c("A", "B") gives "A.B" +# and c("B", "A") also gives "A.B". This identifies duplicates. + +x <- apply(cbind(scCCnet$protein1, scCCnet$protein2), + 1, + FUN = function(x) { return(paste(sort(x), collapse = ".")) }) +head(x) # "YAL016W.YGR040W" "YAL016W.YOR014W" "YAL016W.YDL188C" ... etc. + +sum(duplicated(x)) # 1453 + +# Step 2: drop all rows that contain duplicates in x +scCCnet <- scCCnet[! duplicated(x), ] + +# Confirm we didn't loose genes +length(unique(c(scCCnet$protein1, scCCnet$protein2))) # 283, no change +nrow(scCCnet) +# Network has 283 nodes, 1453 edges + +saveRDS(scCCnet, file = "./data/scCCnet.rds") + +# scCCnet <- readRDS("./data/scCCnet.rds") # <<<- use this to restore the + # object when needed + + +# [END] diff --git a/scripts/ABC-writeALN.R b/scripts/ABC-writeALN.R index a8b7d80..b84d15a 100644 --- a/scripts/ABC-writeALN.R +++ b/scripts/ABC-writeALN.R @@ -1,135 +1,135 @@ -# tocID <- "scripts/ABC-writeALN.R" -# -# ToDo: calculate consensus line -# append sequence numbers -# Notes: -# -# ============================================================================== - - -writeALN <- function(ali, - range, - note = "", - myCon = stdout(), - blockWidth = 60) { - # Purpose: - # Write an MsaAAMultipleAlignment or AAStringSet object to stdout() or - # a file in multi-FASTA format. - # Version: 2.0 - # Date: 2017 10 - # Author: Boris Steipe - # - # Parameters: - # ali MsaAAMultipleAlignment or AAStringSet or character - # vector. - # range num a two-integer vector of start and end positions if - # only a range of the MSA should be written, e.g. - # a domain. Defaults to the full alignment length. - # note chr a vector of character that is appended to the name - # of a sequence in the FASTA header. Recycling of - # shorter vectors applies, thus a vector of length one - # is added to all headers. - # myCon a connection (cf. the con argument for writeLines). - # Defaults to stdout() - # blockWidth int width of sequence block. Default 80 characters. - # Value: - # NA the function is invoked for its side effect of printing an - # alignment to stdout() or file. - - blockWidth <- as.integer(blockWidth) - if (is.na(blockWidth)) { - stop("PANIC: parameter \"blockWidth\" must be numeric.") - } - if (blockWidth < 1) { - stop("PANIC: parameter \"blockWidth\" must be greater than zero.") - } - if (blockWidth > 60) { - warning("Programs that read CLUSTAL format might not expect blockWidth > 60.") - } - - # Extract the raw data from the objects depending on their respective class - # and put it into a named vector of strings. - - # Extract XStringSet from MsaXMultipleAlignment ... - if (class(ali) == "MsaAAMultipleAlignment" | - class(ali) == "MsaDNAMultipleAlignment" | - class(ali) == "MsaRNAMultipleAlignment") { - ali <- ali@unmasked - } - - # Process XStringSet - if (class(ali) == "AAStringSet" | - class(ali) == "DNAStringSet" | - class(ali) == "RNAStringSet") { - sSet <- as.character(ali) # we use as.character(), not toString() thus - # we don't _have_ to load Biostrings - } else if (class(ali) == "character") { - sSet <- ali - } else { - stop(paste("Input object of class", - class(ali), - "can't be handled by this function.")) - } - - if (missing(range)) { - range <- 1 - range[2] <- max(nchar(sSet)) - } else { - range <- as.integer(range) - if(length(range) != 2 || - any(is.na(range)) || - range[1] > range[2] || - range[1] < 1) { - stop("PANIC: \"range\" parameter must contain valid start and end index.") - } - } - - # Right-pad any sequence with "-" that is shorter than ranges[2] - for (i in seq_along(sSet)) { - if (nchar(sSet[i]) < range[2]) { - sSet[i] <- paste0(sSet[i], - paste0(rep("-", range[2] - nchar(sSet[i])), - collapse = "")) - } - } - - # Right-pad sequence names - sNames <- names(sSet) - len <- max(nchar(sNames)) + 2 # longest name plus two spaces - for (i in seq_along(sNames)) { - sNames[i] <- paste0(sNames[i], - paste0(rep(" ", len - nchar(sNames[i])), - collapse = "")) - } - - - # Process each sequence - txt <- paste0("CLUSTAL W format. ", note) - txt[2] <- "" - - iStarts <- seq(range[1], range[2], by = blockWidth) - iEnds <- c((iStarts[-1] - 1), range[2]) - - for (i in seq_along(iStarts)) { - for (j in seq_along(sSet)) { - txt <- c(txt, - paste0(sNames[j], substring(sSet[j], iStarts[i], iEnds[i]))) - } - txt <- c(txt, "") # append a blank consenus line - txt <- c(txt, "") # append a separator line - } - - writeLines(txt, con= myCon) - -} - -# ==== TESTS ================================================================= -# Enter your function tests here... - -if (FALSE) { - # test ... -} - - - -# [END] +# tocID <- "scripts/ABC-writeALN.R" +# +# ToDo: calculate consensus line +# append sequence numbers +# Notes: +# +# ============================================================================== + + +writeALN <- function(ali, + range, + note = "", + myCon = stdout(), + blockWidth = 60) { + # Purpose: + # Write an MsaAAMultipleAlignment or AAStringSet object to stdout() or + # a file in multi-FASTA format. + # Version: 2.0 + # Date: 2017 10 + # Author: Boris Steipe + # + # Parameters: + # ali MsaAAMultipleAlignment or AAStringSet or character + # vector. + # range num a two-integer vector of start and end positions if + # only a range of the MSA should be written, e.g. + # a domain. Defaults to the full alignment length. + # note chr a vector of character that is appended to the name + # of a sequence in the FASTA header. Recycling of + # shorter vectors applies, thus a vector of length one + # is added to all headers. + # myCon a connection (cf. the con argument for writeLines). + # Defaults to stdout() + # blockWidth int width of sequence block. Default 80 characters. + # Value: + # NA the function is invoked for its side effect of printing an + # alignment to stdout() or file. + + blockWidth <- as.integer(blockWidth) + if (is.na(blockWidth)) { + stop("PANIC: parameter \"blockWidth\" must be numeric.") + } + if (blockWidth < 1) { + stop("PANIC: parameter \"blockWidth\" must be greater than zero.") + } + if (blockWidth > 60) { + warning("Programs that read CLUSTAL format might not expect blockWidth > 60.") + } + + # Extract the raw data from the objects depending on their respective class + # and put it into a named vector of strings. + + # Extract XStringSet from MsaXMultipleAlignment ... + if (class(ali) == "MsaAAMultipleAlignment" | + class(ali) == "MsaDNAMultipleAlignment" | + class(ali) == "MsaRNAMultipleAlignment") { + ali <- ali@unmasked + } + + # Process XStringSet + if (class(ali) == "AAStringSet" | + class(ali) == "DNAStringSet" | + class(ali) == "RNAStringSet") { + sSet <- as.character(ali) # we use as.character(), not toString() thus + # we don't _have_ to load Biostrings + } else if (class(ali) == "character") { + sSet <- ali + } else { + stop(paste("Input object of class", + class(ali), + "can't be handled by this function.")) + } + + if (missing(range)) { + range <- 1 + range[2] <- max(nchar(sSet)) + } else { + range <- as.integer(range) + if(length(range) != 2 || + any(is.na(range)) || + range[1] > range[2] || + range[1] < 1) { + stop("PANIC: \"range\" parameter must contain valid start and end index.") + } + } + + # Right-pad any sequence with "-" that is shorter than ranges[2] + for (i in seq_along(sSet)) { + if (nchar(sSet[i]) < range[2]) { + sSet[i] <- paste0(sSet[i], + paste0(rep("-", range[2] - nchar(sSet[i])), + collapse = "")) + } + } + + # Right-pad sequence names + sNames <- names(sSet) + len <- max(nchar(sNames)) + 2 # longest name plus two spaces + for (i in seq_along(sNames)) { + sNames[i] <- paste0(sNames[i], + paste0(rep(" ", len - nchar(sNames[i])), + collapse = "")) + } + + + # Process each sequence + txt <- paste0("CLUSTAL W format. ", note) + txt[2] <- "" + + iStarts <- seq(range[1], range[2], by = blockWidth) + iEnds <- c((iStarts[-1] - 1), range[2]) + + for (i in seq_along(iStarts)) { + for (j in seq_along(sSet)) { + txt <- c(txt, + paste0(sNames[j], substring(sSet[j], iStarts[i], iEnds[i]))) + } + txt <- c(txt, "") # append a blank consenus line + txt <- c(txt, "") # append a separator line + } + + writeLines(txt, con= myCon) + +} + +# ==== TESTS ================================================================= +# Enter your function tests here... + +if (FALSE) { + # test ... +} + + + +# [END] diff --git a/scripts/ABC-writeMFA.R b/scripts/ABC-writeMFA.R index 90471d3..d634959 100644 --- a/scripts/ABC-writeMFA.R +++ b/scripts/ABC-writeMFA.R @@ -1,121 +1,121 @@ -# ABC-writeMFA.R -# -# ToDo: -# Notes: 2.1 bugfix: empty notes caused superfluous blank after header. -# -# -# ============================================================================== - - -writeMFA <- function(ali, - range, - note = "", - myCon = stdout(), - blockWidth = 80) { - # Purpose: - # Write an MsaAAMultipleAlignment or AAStringSet object to stdout() or - # a file in multi-FASTA format. - # Version: 2.1 - # Date: 2017 10 - # Author: Boris Steipe - # - # Parameters: - # ali MsaAAMultipleAlignment or AAStringSet or character - # vector - # range num a two-integer vector of start and end positions if - # only a range of the MSA should be written, e.g. - # a domain. Defaults to the full sequence length. - # note chr a vector of character that is appended to the name - # of a sequence in the FASTA header. Recycling of - # shorter vectors applies, thus a vector of length one - # is added to all headers. - # myCon a connection (cf. the con argument for writeLines). - # Defaults to stdout() - # blockWidth int width of sequence block. Default 80 characters. - # Value: - # NA the function is invoked for its side effect of printing an - # alignment to stdout() or file. - - blockWidth <- as.integer(blockWidth) - if (is.na(blockWidth)) { - stop("PANIC: parameter \"blockWidth\" must be numeric.") - } - if (! blockWidth > 0){ - stop("PANIC: parameter \"blockWidth\" must be greater than zero.") - } - - # Extract the raw data from the objects depending on their respective class - # and put it into a named vector of strings. - - # Extract XStringSet from MsaXMultipleAlignment ... - if (class(ali) == "MsaAAMultipleAlignment" | - class(ali) == "MsaDNAMultipleAlignment" | - class(ali) == "MsaRNAMultipleAlignment") { - ali <- ali@unmasked - } - - # Process XStringSet - if (class(ali) == "AAStringSet" | - class(ali) == "DNAStringSet" | - class(ali) == "RNAStringSet") { - sSet <- as.character(ali) # we use as.character(), not toString() thus - # we don't _have_ to load Biostrings - } else if (class(ali) == "character") { - sSet <- ali - } else { - stop(paste("Input object of class", - class(ali), - "can't be handled by this function.")) - } - - if (missing(range)) { - range <- 1 - range[2] <- max(nchar(sSet)) - } else { - range <- as.integer(range) - if(length(range) != 2 || - any(is.na(range)) || - range[1] > range[2] || - range[1] < 1) { - stop("PANIC: \"range\" parameter must contain valid start and end index.") - } - } - - # Process each sequence - txt <- character() - if (note != "") { # construct header line - headers <- paste(names(sSet), note) - } else { - headers <- names(sSet) - } - - for (i in seq_along(sSet)) { - - # output FASTA header - txt <- c(txt, sprintf(">%s", headers[i])) - - # output the sequence in blocks of blockWidth per line ... - iStarts <- seq(range[1], range[2], by = blockWidth) - iEnds <- c((iStarts[-1] - 1), range[2]) - - thisSeq <- substring(sSet[i], iStarts, iEnds) # collect all blocks - thisSeq <- thisSeq[! nchar(thisSeq) == 0] # drop empty blocks - txt <- c(txt, thisSeq) - - txt <- c(txt, "") # append an empty line for readability - } - - writeLines(txt, con = myCon) - -} - -# ==== TESTS ================================================================= -# Enter your function tests here... - -if (FALSE) { - # test ... -} - - - -# [END] +# ABC-writeMFA.R +# +# ToDo: +# Notes: 2.1 bugfix: empty notes caused superfluous blank after header. +# +# +# ============================================================================== + + +writeMFA <- function(ali, + range, + note = "", + myCon = stdout(), + blockWidth = 80) { + # Purpose: + # Write an MsaAAMultipleAlignment or AAStringSet object to stdout() or + # a file in multi-FASTA format. + # Version: 2.1 + # Date: 2017 10 + # Author: Boris Steipe + # + # Parameters: + # ali MsaAAMultipleAlignment or AAStringSet or character + # vector + # range num a two-integer vector of start and end positions if + # only a range of the MSA should be written, e.g. + # a domain. Defaults to the full sequence length. + # note chr a vector of character that is appended to the name + # of a sequence in the FASTA header. Recycling of + # shorter vectors applies, thus a vector of length one + # is added to all headers. + # myCon a connection (cf. the con argument for writeLines). + # Defaults to stdout() + # blockWidth int width of sequence block. Default 80 characters. + # Value: + # NA the function is invoked for its side effect of printing an + # alignment to stdout() or file. + + blockWidth <- as.integer(blockWidth) + if (is.na(blockWidth)) { + stop("PANIC: parameter \"blockWidth\" must be numeric.") + } + if (! blockWidth > 0){ + stop("PANIC: parameter \"blockWidth\" must be greater than zero.") + } + + # Extract the raw data from the objects depending on their respective class + # and put it into a named vector of strings. + + # Extract XStringSet from MsaXMultipleAlignment ... + if (class(ali) == "MsaAAMultipleAlignment" | + class(ali) == "MsaDNAMultipleAlignment" | + class(ali) == "MsaRNAMultipleAlignment") { + ali <- ali@unmasked + } + + # Process XStringSet + if (class(ali) == "AAStringSet" | + class(ali) == "DNAStringSet" | + class(ali) == "RNAStringSet") { + sSet <- as.character(ali) # we use as.character(), not toString() thus + # we don't _have_ to load Biostrings + } else if (class(ali) == "character") { + sSet <- ali + } else { + stop(paste("Input object of class", + class(ali), + "can't be handled by this function.")) + } + + if (missing(range)) { + range <- 1 + range[2] <- max(nchar(sSet)) + } else { + range <- as.integer(range) + if(length(range) != 2 || + any(is.na(range)) || + range[1] > range[2] || + range[1] < 1) { + stop("PANIC: \"range\" parameter must contain valid start and end index.") + } + } + + # Process each sequence + txt <- character() + if (note != "") { # construct header line + headers <- paste(names(sSet), note) + } else { + headers <- names(sSet) + } + + for (i in seq_along(sSet)) { + + # output FASTA header + txt <- c(txt, sprintf(">%s", headers[i])) + + # output the sequence in blocks of blockWidth per line ... + iStarts <- seq(range[1], range[2], by = blockWidth) + iEnds <- c((iStarts[-1] - 1), range[2]) + + thisSeq <- substring(sSet[i], iStarts, iEnds) # collect all blocks + thisSeq <- thisSeq[! nchar(thisSeq) == 0] # drop empty blocks + txt <- c(txt, thisSeq) + + txt <- c(txt, "") # append an empty line for readability + } + + writeLines(txt, con = myCon) + +} + +# ==== TESTS ================================================================= +# Enter your function tests here... + +if (FALSE) { + # test ... +} + + + +# [END] diff --git a/scripts/BLAST.R b/scripts/BLAST.R index e10a613..491dad6 100644 --- a/scripts/BLAST.R +++ b/scripts/BLAST.R @@ -1,384 +1,384 @@ -# BLAST.R -# -# Purpose: Send off one BLAST search and return parsed list of results -# This script uses the BLAST URL-API -# (Application Programming Interface) at the NCBI. -# Read about the constraints here: -# https://blast.ncbi.nlm.nih.gov/Blast.cgi?CMD=Web&PAGE_TYPE=BlastDocs&DOC_TYPE=DeveloperInfo -# -# -# Version: 3.2 -# Date: 2016 09 - 2020 09 -# Author: Boris Steipe -# -# Versions: -# 3.2 2020 updates -# 3.1 Change from require() to requireNamespace(), -# use ::() idiom throughout -# 3.0 parsing logic had not been fully implemented; Fixed. -# 2.1 bugfix in BLAST(), bug was blanking non-split deflines; -# refactored parseBLASTalignment() to handle lists with multiple hits. -# 2.0 Completely rewritten because the interface completely changed. -# Code adpated in part from NCBI Perl sample code: -# $Id: web_blast.pl,v 1.10 2016/07/13 14:32:50 merezhuk Exp $ -# 1.0 first version posted for BCH441 2016, based on BLAST - API -# -# ToDo: Return the organism/strain name in the output, and propagate -# into MYSPE selection script. -# -# Notes: This is somewhat pedestrian, but apparently there are currently -# no R packages that contain such code. -# -# ============================================================================== - - -if (! requireNamespace("httr", quietly = TRUE)) { - install.packages("httr") -} - - -BLAST <- function(Q, - db = "refseq_protein", - nHits = 30, - E = 0.1, - limits = "", - rid = "", - query = "", - quietly = FALSE, - myTimeout = 120) { - # Purpose: - # Basic BLAST search - # - # Parameters: - # Q: query - either a valid ID or a sequence - # db: "refseq_protein" by default, - # other legal values include: "nr", "pdb", "swissprot" ... - # nHits: number of hits to maximally return - # E: E-value cutoff. Do not return hits whose score would be expected - # to occur E or more times in a database of random sequence. - # limits: a valid ENTREZ filter - # rid: a request ID - to retrieve earlier search results - # query: the actual query string (needed when retrieving results - # with an rid) - # quietly: controls printing of wait-time progress bar - # timeout: how much longer _after_ rtoe to wait for a result - # before giving up (seconds) - # Value: - # result: list of process status or resulting hits, and some metadata - - - EXTRAWAIT <- 10 # duration of extra wait cycles if BLAST search is not done - - results <- list() - results$query = query - results$rid <- rid - results$rtoe <- 0 - - if (rid == "") { # If no rid is available, spawn a search. - # Else, proceed directly to retrieval. - - # prepare query, GET(), and parse rid and rtoe from BLAST server response - results$query <- paste0("https://blast.ncbi.nlm.nih.gov/blast/Blast.cgi", - "?", - "CMD=Put", - "&PROGRAM=", "blastp", - "&QUERY=", URLencode(Q), - "&DATABASE=", db, - "&MATRIX=", "BLOSUM62", - "&EXPECT=", as.character(E), - "&HITLIST_SIZE=", as.character(nHits), - "&ALIGNMENTS=", as.character(nHits), - "&FORMAT_TYPE=Text") - - if (limits != "") { - results$query <- paste0( - results$query, - "&ENTREZ_QUERY=", limits) - } - - # send it off ... - response <- httr::GET(results$query) - if (httr::http_status(response)$category != "Success" ) { - stop(sprintf("PANIC: Can't send query. BLAST server status error: %s", - httr::http_status(response)$message)) - } - - txt <- httr::content(response, "text", encoding = "UTF-8") - - patt <- "RID = (\\w+)" # match the request id - results$rid <- regmatches(txt, regexec(patt, txt))[[1]][2] - - patt <- "RTOE = (\\d+)" # match the expected completion time - results$rtoe <- as.numeric(regmatches(txt, regexec(patt, txt))[[1]][2]) - - # Now we wait ... - if (quietly) { - Sys.sleep(results$rtoe) - } else { - cat(sprintf("BLAST is processing %s:\n", results$rid)) - waitTimer(results$rtoe) - } - - } # done sending query and retrieving rid, rtoe - - # Enter an infinite loop to check for result availability - checkStatus <- paste("https://blast.ncbi.nlm.nih.gov/blast/Blast.cgi", - "?", - "CMD=Get", - "&RID=", results$rid, - "&FORMAT_TYPE=Text", - "&FORMAT_OBJECT=SearchInfo", - sep = "") - - while (TRUE) { - # Check whether the result is ready - response <- httr::GET(checkStatus) - if (httr::http_status(response)$category != "Success" ) { - stop(sprintf("PANIC: Can't check status. BLAST server status error: %s", - httr::http_status(response)$message)) - } - - txt <- httr::content(response, "text", encoding = "UTF-8") - - if (length(grep("Status=WAITING", txt)) > 0) { - myTimeout <- myTimeout - EXTRAWAIT - - if (myTimeout <= 0) { # abort - cat("BLAST search not concluded before timeout. Aborting.\n") - cat(sprintf("%s BLASThits <- BLAST(rid=\"%s\")\n", - "Trying checking back later with >", - results$rid)) - return(results) - } - - if (quietly) { - Sys.sleep(EXTRAWAIT) - } else { - cat(sprintf("Status: Waiting. Wait %d more seconds (max. %d more)", - EXTRAWAIT, - myTimeout)) - waitTimer(EXTRAWAIT) - next - } - - } else if (length(grep("Status=FAILED", txt)) > 0) { - cat("BLAST search returned status \"FAILED\". Aborting.\n") - return(results) - - } else if (length(grep("Status=UNKNOWN", txt)) > 0) { - cat("BLAST search returned status \"UNKNOWN\".\n") - cat("This probably means the rid has expired. Aborting.\n") - return(results) - - } else if (length(grep("Status=READY", txt)) > 0) { # Done - - if (length(grep("ThereAreHits=yes", txt)) == 0) { # No hits - cat("BLAST search ready but no hits found. Aborting.\n") - return(results) - - } else { - break # done ... retrieve search result - } - } - } # end result-check loop - - # retrieve results from BLAST server - retrieve <- paste("https://blast.ncbi.nlm.nih.gov/blast/Blast.cgi", - "?", - "&CMD=Get", - "&RID=", results$rid, - "&FORMAT_TYPE=Text", - sep = "") - - response <- httr::GET(retrieve) - if (httr::http_status(response)$category != "Success" ) { - stop(sprintf("PANIC: Can't retrieve. BLAST server status error: %s", - httr::http_status(response)$message)) - } - - txt <- httr::content(response, "text", encoding = "UTF-8") - - # txt contains the whole set of results. Process: - - # First, we strsplit() on linebreaks: - txt <- unlist(strsplit(txt, "\n")) - - # The alignments range from the first line that begins with ">" ... - iFirst <- grep("^>", txt)[1] - - # ... to the last line that begins with "Sbjct" - x <- grep("^Sbjct", txt) - iLast <- x[length(x)] - - # Get the alignments block - txt <- txt[iFirst:iLast] - - # Drop empty lines - txt <- txt[!(nchar(txt) == 0)] - - # A line that ends "]" but does not begin ">" seems to be a split - # defline ... eg. - # [1] ">XP_013349208.1 AUEXF2481DRAFT_695809 [Aureobasidium subglaciale " - # [2] "EXF-2481]" - # Merge these lines to the preceding lines and delete them. - # - x <- which(grepl("]$", txt) & !(grepl("^>", txt))) - if (length(x) > 0) { - txt[x-1] <- paste0(txt[x-1], txt[x]) - txt <- txt[-x] - } - - # Special case: there may be multiple deflines when the BLAST hit is to - # redundant, identical sequences. Keep only the first instance. - iKeep <- ! grepl("^>", txt) - x <- rle(iKeep) - x$positions <- cumsum(x$lengths) - i <- which(x$lengths > 1 & x$values == FALSE) - if (length(i) > 0) { - firsts <- x$positions[i] - x$lengths[i] + 1 - iKeep[firsts] <- TRUE - txt <- txt[iKeep] - } - - # After this preprocessing the following should be true: - # - Every alignment block begins with a defline in which the - # first character is ">" - # - There is only one defline in each block. - # - Lines are not split. - - # Make a dataframe of first and last indices of alignment blocks - x <- grep("^>", txt) - blocks <- data.frame(iFirst = x, - iLast = c((x[-1] - 1), length(txt))) - - # Build the hits list by parsing the blocks - results$hits <- list() - - for (i in seq_len(nrow(blocks))) { - thisBlock <- txt[blocks$iFirst[i]:blocks$iLast[i]] - results$hits[[i]] <- parseBLASTalignment(thisBlock) - } - - return(results) -} - -parseBLASTalignment <- function(hit) { - # Parse data from a character vector containing a BLAST hit - # Parameters: - # hit char one BLAST hit as char vector - # Value: - # list $def chr defline - # $accession chr accession number - # $organism chr complete organism definition - # $species chr binomial species - # $E num E value - # $lengthAli num length of the alignment - # $nIdentitites num number of identities - # $nGaps num number of gaps - # $Qbounds num 2-element vector of query start-end - # $Sbounds num 2-element vector of subject start-end - # $Qseq chr query sequence - # $midSeq chr midline string - # $Sseq chr subject sequence - - getToken <- function(patt, v) { - # get the first token identified by pattern patt in character vector v - v <- v[grep(patt, v)] - if (length(v) > 1) { v <- v[1] } - if (length(v) == 0) { token <- NA - } else { - token <- regmatches(v, regexec(patt, v))[[1]][2] } - return(token) - } - - h <- list() - - # FASTA defline - h$def <- hit[1] - - # accesion number (ID), use the first if there are several, separated by "|" - patt <- "^>(.+?)(\\s|\\|)" # from ">" to space or "|" - h$accession <- regmatches(h$def, regexec(patt, h$def))[[1]][2] - - # organism - patt <- "\\[(.+)]" - h$organism <- regmatches(h$def, regexec(patt, h$def))[[1]][2] - - # species - x <- unlist(strsplit(h$organism, "\\s+")) - if (length(x) >= 2) { - h$species <- paste(x[1], x[2]) - } else if (length(x) == 1) { - h$species <- paste(x[1], "sp.") - } else { - h$species <- NA - } - - # E-value - h$E <- as.numeric(getToken("Expect\\s*=(.+?), Method", hit)) - - # length of alignment - h$lengthAli <- as.numeric(getToken("^\\s*Length\\s*=(.+)$", hit)) - - # number of identities - h$nIdentities <- as.numeric(getToken("^\\s*Identities\\s*=(.+?)/", hit)) - - # number of gaps - h$nGaps <- as.numeric(getToken("\\s*Gaps\\s*=(.+?)/", hit)) - - # split up alignment section - idx <- grep("^Query ", hit) - Que <- hit[idx] - Mid <- hit[idx + 1] - Sbj <- hit[idx + 2] - - # first and last positions - h$Qbounds <- c(start = 0, end = 0) - h$Qbounds[1] <- as.numeric(getToken("^Query\\s*(\\d+)", Que[1])) - h$Qbounds[2] <- as.numeric(getToken("\\s*(\\d+)\\s*$", Que[length(Que)])) - - h$Sbounds <- c(start = 0, end = 0) - h$Sbounds[1] <- as.numeric(getToken("^Sbjct\\s*(\\d+)", Sbj[1])) - h$Sbounds[2] <- as.numeric(getToken("\\s*(\\d+)\\s*$", Sbj[length(Sbj)])) - - # aligned sequences - for (i in seq_along(Que)) { - patt <- ("^\\s*Query\\s*\\d+\\s*([A-Za-z-]+)") # capture aligned string - m <- regexec(patt, Que[i]) - iFirst <- m[[1]][2] - iLast <- iFirst + attr(m[[1]], which = "match.length")[2] - 1 - Que[i] <- substring(Que[i], iFirst, iLast) - Mid[i] <- substring(Mid[i], iFirst, iLast) - Sbj[i] <- substring(Sbj[i], iFirst, iLast) - } - - h$Qseq <- paste0(Que, collapse = "") - h$midSeq <- paste0(Mid, collapse = "") - h$Sseq <- paste0(Sbj, collapse = "") - - return(h) -} - - -# ==== TESTS =================================================================== - -if (FALSE) { - # define query: - q <- paste("IYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHI", # Mbp1 APSES domain - "LKAANFAKAKRTRILEKEVLKETHEKVQGGFGKYQ", - "GTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASP", - sep="") - # or ... - q <- "NP_010227" # refseq ID - - test <- BLAST(q, - nHits = 100, - E = 0.001, - rid = "", - limits = "txid4751[ORGN]") # Fungi - str(test) - length(test$hits) -} - -# [END] - +# BLAST.R +# +# Purpose: Send off one BLAST search and return parsed list of results +# This script uses the BLAST URL-API +# (Application Programming Interface) at the NCBI. +# Read about the constraints here: +# https://blast.ncbi.nlm.nih.gov/Blast.cgi?CMD=Web&PAGE_TYPE=BlastDocs&DOC_TYPE=DeveloperInfo +# +# +# Version: 3.2 +# Date: 2016 09 - 2020 09 +# Author: Boris Steipe +# +# Versions: +# 3.2 2020 updates +# 3.1 Change from require() to requireNamespace(), +# use ::() idiom throughout +# 3.0 parsing logic had not been fully implemented; Fixed. +# 2.1 bugfix in BLAST(), bug was blanking non-split deflines; +# refactored parseBLASTalignment() to handle lists with multiple hits. +# 2.0 Completely rewritten because the interface completely changed. +# Code adpated in part from NCBI Perl sample code: +# $Id: web_blast.pl,v 1.10 2016/07/13 14:32:50 merezhuk Exp $ +# 1.0 first version posted for BCH441 2016, based on BLAST - API +# +# ToDo: Return the organism/strain name in the output, and propagate +# into MYSPE selection script. +# +# Notes: This is somewhat pedestrian, but apparently there are currently +# no R packages that contain such code. +# +# ============================================================================== + + +if (! requireNamespace("httr", quietly = TRUE)) { + install.packages("httr") +} + + +BLAST <- function(Q, + db = "refseq_protein", + nHits = 30, + E = 0.1, + limits = "", + rid = "", + query = "", + quietly = FALSE, + myTimeout = 120) { + # Purpose: + # Basic BLAST search + # + # Parameters: + # Q: query - either a valid ID or a sequence + # db: "refseq_protein" by default, + # other legal values include: "nr", "pdb", "swissprot" ... + # nHits: number of hits to maximally return + # E: E-value cutoff. Do not return hits whose score would be expected + # to occur E or more times in a database of random sequence. + # limits: a valid ENTREZ filter + # rid: a request ID - to retrieve earlier search results + # query: the actual query string (needed when retrieving results + # with an rid) + # quietly: controls printing of wait-time progress bar + # timeout: how much longer _after_ rtoe to wait for a result + # before giving up (seconds) + # Value: + # result: list of process status or resulting hits, and some metadata + + + EXTRAWAIT <- 10 # duration of extra wait cycles if BLAST search is not done + + results <- list() + results$query = query + results$rid <- rid + results$rtoe <- 0 + + if (rid == "") { # If no rid is available, spawn a search. + # Else, proceed directly to retrieval. + + # prepare query, GET(), and parse rid and rtoe from BLAST server response + results$query <- paste0("https://blast.ncbi.nlm.nih.gov/blast/Blast.cgi", + "?", + "CMD=Put", + "&PROGRAM=", "blastp", + "&QUERY=", URLencode(Q), + "&DATABASE=", db, + "&MATRIX=", "BLOSUM62", + "&EXPECT=", as.character(E), + "&HITLIST_SIZE=", as.character(nHits), + "&ALIGNMENTS=", as.character(nHits), + "&FORMAT_TYPE=Text") + + if (limits != "") { + results$query <- paste0( + results$query, + "&ENTREZ_QUERY=", limits) + } + + # send it off ... + response <- httr::GET(results$query) + if (httr::http_status(response)$category != "Success" ) { + stop(sprintf("PANIC: Can't send query. BLAST server status error: %s", + httr::http_status(response)$message)) + } + + txt <- httr::content(response, "text", encoding = "UTF-8") + + patt <- "RID = (\\w+)" # match the request id + results$rid <- regmatches(txt, regexec(patt, txt))[[1]][2] + + patt <- "RTOE = (\\d+)" # match the expected completion time + results$rtoe <- as.numeric(regmatches(txt, regexec(patt, txt))[[1]][2]) + + # Now we wait ... + if (quietly) { + Sys.sleep(results$rtoe) + } else { + cat(sprintf("BLAST is processing %s:\n", results$rid)) + waitTimer(results$rtoe) + } + + } # done sending query and retrieving rid, rtoe + + # Enter an infinite loop to check for result availability + checkStatus <- paste("https://blast.ncbi.nlm.nih.gov/blast/Blast.cgi", + "?", + "CMD=Get", + "&RID=", results$rid, + "&FORMAT_TYPE=Text", + "&FORMAT_OBJECT=SearchInfo", + sep = "") + + while (TRUE) { + # Check whether the result is ready + response <- httr::GET(checkStatus) + if (httr::http_status(response)$category != "Success" ) { + stop(sprintf("PANIC: Can't check status. BLAST server status error: %s", + httr::http_status(response)$message)) + } + + txt <- httr::content(response, "text", encoding = "UTF-8") + + if (length(grep("Status=WAITING", txt)) > 0) { + myTimeout <- myTimeout - EXTRAWAIT + + if (myTimeout <= 0) { # abort + cat("BLAST search not concluded before timeout. Aborting.\n") + cat(sprintf("%s BLASThits <- BLAST(rid=\"%s\")\n", + "Trying checking back later with >", + results$rid)) + return(results) + } + + if (quietly) { + Sys.sleep(EXTRAWAIT) + } else { + cat(sprintf("Status: Waiting. Wait %d more seconds (max. %d more)", + EXTRAWAIT, + myTimeout)) + waitTimer(EXTRAWAIT) + next + } + + } else if (length(grep("Status=FAILED", txt)) > 0) { + cat("BLAST search returned status \"FAILED\". Aborting.\n") + return(results) + + } else if (length(grep("Status=UNKNOWN", txt)) > 0) { + cat("BLAST search returned status \"UNKNOWN\".\n") + cat("This probably means the rid has expired. Aborting.\n") + return(results) + + } else if (length(grep("Status=READY", txt)) > 0) { # Done + + if (length(grep("ThereAreHits=yes", txt)) == 0) { # No hits + cat("BLAST search ready but no hits found. Aborting.\n") + return(results) + + } else { + break # done ... retrieve search result + } + } + } # end result-check loop + + # retrieve results from BLAST server + retrieve <- paste("https://blast.ncbi.nlm.nih.gov/blast/Blast.cgi", + "?", + "&CMD=Get", + "&RID=", results$rid, + "&FORMAT_TYPE=Text", + sep = "") + + response <- httr::GET(retrieve) + if (httr::http_status(response)$category != "Success" ) { + stop(sprintf("PANIC: Can't retrieve. BLAST server status error: %s", + httr::http_status(response)$message)) + } + + txt <- httr::content(response, "text", encoding = "UTF-8") + + # txt contains the whole set of results. Process: + + # First, we strsplit() on linebreaks: + txt <- unlist(strsplit(txt, "\n")) + + # The alignments range from the first line that begins with ">" ... + iFirst <- grep("^>", txt)[1] + + # ... to the last line that begins with "Sbjct" + x <- grep("^Sbjct", txt) + iLast <- x[length(x)] + + # Get the alignments block + txt <- txt[iFirst:iLast] + + # Drop empty lines + txt <- txt[!(nchar(txt) == 0)] + + # A line that ends "]" but does not begin ">" seems to be a split + # defline ... eg. + # [1] ">XP_013349208.1 AUEXF2481DRAFT_695809 [Aureobasidium subglaciale " + # [2] "EXF-2481]" + # Merge these lines to the preceding lines and delete them. + # + x <- which(grepl("]$", txt) & !(grepl("^>", txt))) + if (length(x) > 0) { + txt[x-1] <- paste0(txt[x-1], txt[x]) + txt <- txt[-x] + } + + # Special case: there may be multiple deflines when the BLAST hit is to + # redundant, identical sequences. Keep only the first instance. + iKeep <- ! grepl("^>", txt) + x <- rle(iKeep) + x$positions <- cumsum(x$lengths) + i <- which(x$lengths > 1 & x$values == FALSE) + if (length(i) > 0) { + firsts <- x$positions[i] - x$lengths[i] + 1 + iKeep[firsts] <- TRUE + txt <- txt[iKeep] + } + + # After this preprocessing the following should be true: + # - Every alignment block begins with a defline in which the + # first character is ">" + # - There is only one defline in each block. + # - Lines are not split. + + # Make a dataframe of first and last indices of alignment blocks + x <- grep("^>", txt) + blocks <- data.frame(iFirst = x, + iLast = c((x[-1] - 1), length(txt))) + + # Build the hits list by parsing the blocks + results$hits <- list() + + for (i in seq_len(nrow(blocks))) { + thisBlock <- txt[blocks$iFirst[i]:blocks$iLast[i]] + results$hits[[i]] <- parseBLASTalignment(thisBlock) + } + + return(results) +} + +parseBLASTalignment <- function(hit) { + # Parse data from a character vector containing a BLAST hit + # Parameters: + # hit char one BLAST hit as char vector + # Value: + # list $def chr defline + # $accession chr accession number + # $organism chr complete organism definition + # $species chr binomial species + # $E num E value + # $lengthAli num length of the alignment + # $nIdentitites num number of identities + # $nGaps num number of gaps + # $Qbounds num 2-element vector of query start-end + # $Sbounds num 2-element vector of subject start-end + # $Qseq chr query sequence + # $midSeq chr midline string + # $Sseq chr subject sequence + + getToken <- function(patt, v) { + # get the first token identified by pattern patt in character vector v + v <- v[grep(patt, v)] + if (length(v) > 1) { v <- v[1] } + if (length(v) == 0) { token <- NA + } else { + token <- regmatches(v, regexec(patt, v))[[1]][2] } + return(token) + } + + h <- list() + + # FASTA defline + h$def <- hit[1] + + # accesion number (ID), use the first if there are several, separated by "|" + patt <- "^>(.+?)(\\s|\\|)" # from ">" to space or "|" + h$accession <- regmatches(h$def, regexec(patt, h$def))[[1]][2] + + # organism + patt <- "\\[(.+)]" + h$organism <- regmatches(h$def, regexec(patt, h$def))[[1]][2] + + # species + x <- unlist(strsplit(h$organism, "\\s+")) + if (length(x) >= 2) { + h$species <- paste(x[1], x[2]) + } else if (length(x) == 1) { + h$species <- paste(x[1], "sp.") + } else { + h$species <- NA + } + + # E-value + h$E <- as.numeric(getToken("Expect\\s*=(.+?), Method", hit)) + + # length of alignment + h$lengthAli <- as.numeric(getToken("^\\s*Length\\s*=(.+)$", hit)) + + # number of identities + h$nIdentities <- as.numeric(getToken("^\\s*Identities\\s*=(.+?)/", hit)) + + # number of gaps + h$nGaps <- as.numeric(getToken("\\s*Gaps\\s*=(.+?)/", hit)) + + # split up alignment section + idx <- grep("^Query ", hit) + Que <- hit[idx] + Mid <- hit[idx + 1] + Sbj <- hit[idx + 2] + + # first and last positions + h$Qbounds <- c(start = 0, end = 0) + h$Qbounds[1] <- as.numeric(getToken("^Query\\s*(\\d+)", Que[1])) + h$Qbounds[2] <- as.numeric(getToken("\\s*(\\d+)\\s*$", Que[length(Que)])) + + h$Sbounds <- c(start = 0, end = 0) + h$Sbounds[1] <- as.numeric(getToken("^Sbjct\\s*(\\d+)", Sbj[1])) + h$Sbounds[2] <- as.numeric(getToken("\\s*(\\d+)\\s*$", Sbj[length(Sbj)])) + + # aligned sequences + for (i in seq_along(Que)) { + patt <- ("^\\s*Query\\s*\\d+\\s*([A-Za-z-]+)") # capture aligned string + m <- regexec(patt, Que[i]) + iFirst <- m[[1]][2] + iLast <- iFirst + attr(m[[1]], which = "match.length")[2] - 1 + Que[i] <- substring(Que[i], iFirst, iLast) + Mid[i] <- substring(Mid[i], iFirst, iLast) + Sbj[i] <- substring(Sbj[i], iFirst, iLast) + } + + h$Qseq <- paste0(Que, collapse = "") + h$midSeq <- paste0(Mid, collapse = "") + h$Sseq <- paste0(Sbj, collapse = "") + + return(h) +} + + +# ==== TESTS =================================================================== + +if (FALSE) { + # define query: + q <- paste("IYSARYSGVDVYEFIHSTGSIMKRKKDDWVNATHI", # Mbp1 APSES domain + "LKAANFAKAKRTRILEKEVLKETHEKVQGGFGKYQ", + "GTWVPLNIAKQLAEKFSVYDQLKPLFDFTQTDGSASP", + sep="") + # or ... + q <- "NP_010227" # refseq ID + + test <- BLAST(q, + nHits = 100, + E = 0.001, + rid = "", + limits = "txid4751[ORGN]") # Fungi + str(test) + length(test$hits) +} + +# [END] + diff --git a/tests/test_biCode.R b/tests/test_biCode.R index 7fec038..2090af3 100644 --- a/tests/test_biCode.R +++ b/tests/test_biCode.R @@ -1,32 +1,32 @@ -# test_biCode.R -# - -context("biCode() utility function tests") # A set of tests for some - # functionality - -test_that("expected input is processed correctly", { # Related expectations - expect_equal(biCode("homo sapiens"), "HOMSA") - expect_equal(biCode("[homo sapiens neanderthaliensis]"), "HOMSA") - expect_equal(biCode(c("Phascolarctos cinereus", "Macropus rufus")), - c("PHACI", "MACRU")) -}) - -test_that("unexpected input is managed", { - expect_equal(biCode(""), ".....") - expect_equal(biCode(" "), ".....") - expect_equal(biCode("123 12"), ".....") - expect_equal(biCode("h sapiens"), "H..SA") -}) - -test_that("NA values are preserved", { - expect_true(is.na((biCode(NA)))) - expect_equal(biCode(c("first", NA, "last")), - c("FIRST", NA, "LAST.")) -}) - -test_that("Missing argument throws an error", { - expect_error(biCode(), "argument \"s\" is missing, with no default") -}) - - -# [END] +# test_biCode.R +# + +context("biCode() utility function tests") # A set of tests for some + # functionality + +test_that("expected input is processed correctly", { # Related expectations + expect_equal(biCode("homo sapiens"), "HOMSA") + expect_equal(biCode("[homo sapiens neanderthaliensis]"), "HOMSA") + expect_equal(biCode(c("Phascolarctos cinereus", "Macropus rufus")), + c("PHACI", "MACRU")) +}) + +test_that("unexpected input is managed", { + expect_equal(biCode(""), ".....") + expect_equal(biCode(" "), ".....") + expect_equal(biCode("123 12"), ".....") + expect_equal(biCode("h sapiens"), "H..SA") +}) + +test_that("NA values are preserved", { + expect_true(is.na((biCode(NA)))) + expect_equal(biCode(c("first", NA, "last")), + c("FIRST", NA, "LAST.")) +}) + +test_that("Missing argument throws an error", { + expect_error(biCode(), "argument \"s\" is missing, with no default") +}) + + +# [END]