Excluding or including by awk
$begingroup$
I have a gtf file as attached enter link description here
By this command one could extract coding parts of genome
awk '{if($3=="transcript" && $20==""protein_coding";"){print $0}}' gencode.gtf
How I could exclude coding parts from this file keeping non coding regions
linux wgs bash
$endgroup$
add a comment |
$begingroup$
I have a gtf file as attached enter link description here
By this command one could extract coding parts of genome
awk '{if($3=="transcript" && $20==""protein_coding";"){print $0}}' gencode.gtf
How I could exclude coding parts from this file keeping non coding regions
linux wgs bash
$endgroup$
add a comment |
$begingroup$
I have a gtf file as attached enter link description here
By this command one could extract coding parts of genome
awk '{if($3=="transcript" && $20==""protein_coding";"){print $0}}' gencode.gtf
How I could exclude coding parts from this file keeping non coding regions
linux wgs bash
$endgroup$
I have a gtf file as attached enter link description here
By this command one could extract coding parts of genome
awk '{if($3=="transcript" && $20==""protein_coding";"){print $0}}' gencode.gtf
How I could exclude coding parts from this file keeping non coding regions
linux wgs bash
linux wgs bash
asked 2 hours ago
Feresh TehFeresh Teh
38111
38111
add a comment |
add a comment |
1 Answer
1
active
oldest
votes
$begingroup$
Getting the non coding regions of a protein coding transcript, sounds like you are looking for UTR.
UTR
has its own feature in the gtf file. So you can do this:
$ awk -v FS="t" '$3=="UTR"' gencode.gtf
If the gtf file is compressed use this instead:
$ zcat gencode.gtf.gz | awk -v FS="t" '$3=="UTR"'
BTW: Why are you using such an old release of gencode? The current version is v29.
$endgroup$
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
1
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.
$endgroup$
– finswimmer
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
add a comment |
Your Answer
StackExchange.ifUsing("editor", function () {
return StackExchange.using("mathjaxEditing", function () {
StackExchange.MarkdownEditor.creationCallbacks.add(function (editor, postfix) {
StackExchange.mathjaxEditing.prepareWmdForMathJax(editor, postfix, [["$", "$"], ["\\(","\\)"]]);
});
});
}, "mathjax-editing");
StackExchange.ready(function() {
var channelOptions = {
tags: "".split(" "),
id: "676"
};
initTagRenderer("".split(" "), "".split(" "), channelOptions);
StackExchange.using("externalEditor", function() {
// Have to fire editor after snippets, if snippets enabled
if (StackExchange.settings.snippets.snippetsEnabled) {
StackExchange.using("snippets", function() {
createEditor();
});
}
else {
createEditor();
}
});
function createEditor() {
StackExchange.prepareEditor({
heartbeatType: 'answer',
autoActivateHeartbeat: false,
convertImagesToLinks: false,
noModals: true,
showLowRepImageUploadWarning: true,
reputationToPostImages: null,
bindNavPrevention: true,
postfix: "",
imageUploader: {
brandingHtml: "Powered by u003ca class="icon-imgur-white" href="https://imgur.com/"u003eu003c/au003e",
contentPolicyHtml: "User contributions licensed under u003ca href="https://creativecommons.org/licenses/by-sa/3.0/"u003ecc by-sa 3.0 with attribution requiredu003c/au003e u003ca href="https://stackoverflow.com/legal/content-policy"u003e(content policy)u003c/au003e",
allowUrls: true
},
onDemand: true,
discardSelector: ".discard-answer"
,immediatelyShowMarkdownHelp:true
});
}
});
Sign up or log in
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
var $window = $(window),
onScroll = function(e) {
var $elem = $('.new-login-left'),
docViewTop = $window.scrollTop(),
docViewBottom = docViewTop + $window.height(),
elemTop = $elem.offset().top,
elemBottom = elemTop + $elem.height();
if ((docViewTop elemBottom)) {
StackExchange.using('gps', function() { StackExchange.gps.track('embedded_signup_form.view', { location: 'question_page' }); });
$window.unbind('scroll', onScroll);
}
};
$window.on('scroll', onScroll);
});
Sign up using Google
Sign up using Facebook
Sign up using Email and Password
Post as a guest
Required, but never shown
StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fbioinformatics.stackexchange.com%2fquestions%2f7098%2fexcluding-or-including-by-awk%23new-answer', 'question_page');
}
);
Post as a guest
Required, but never shown
1 Answer
1
active
oldest
votes
1 Answer
1
active
oldest
votes
active
oldest
votes
active
oldest
votes
$begingroup$
Getting the non coding regions of a protein coding transcript, sounds like you are looking for UTR.
UTR
has its own feature in the gtf file. So you can do this:
$ awk -v FS="t" '$3=="UTR"' gencode.gtf
If the gtf file is compressed use this instead:
$ zcat gencode.gtf.gz | awk -v FS="t" '$3=="UTR"'
BTW: Why are you using such an old release of gencode? The current version is v29.
$endgroup$
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
1
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.
$endgroup$
– finswimmer
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
add a comment |
$begingroup$
Getting the non coding regions of a protein coding transcript, sounds like you are looking for UTR.
UTR
has its own feature in the gtf file. So you can do this:
$ awk -v FS="t" '$3=="UTR"' gencode.gtf
If the gtf file is compressed use this instead:
$ zcat gencode.gtf.gz | awk -v FS="t" '$3=="UTR"'
BTW: Why are you using such an old release of gencode? The current version is v29.
$endgroup$
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
1
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.
$endgroup$
– finswimmer
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
add a comment |
$begingroup$
Getting the non coding regions of a protein coding transcript, sounds like you are looking for UTR.
UTR
has its own feature in the gtf file. So you can do this:
$ awk -v FS="t" '$3=="UTR"' gencode.gtf
If the gtf file is compressed use this instead:
$ zcat gencode.gtf.gz | awk -v FS="t" '$3=="UTR"'
BTW: Why are you using such an old release of gencode? The current version is v29.
$endgroup$
Getting the non coding regions of a protein coding transcript, sounds like you are looking for UTR.
UTR
has its own feature in the gtf file. So you can do this:
$ awk -v FS="t" '$3=="UTR"' gencode.gtf
If the gtf file is compressed use this instead:
$ zcat gencode.gtf.gz | awk -v FS="t" '$3=="UTR"'
BTW: Why are you using such an old release of gencode? The current version is v29.
edited 1 hour ago
answered 1 hour ago
finswimmerfinswimmer
962210
962210
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
1
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.
$endgroup$
– finswimmer
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
add a comment |
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
1
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.
$endgroup$
– finswimmer
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry, literally I need non coding regions of human genome, but for asking my question here I referred to coding parts too
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Sorry I tried hat but my output is empty
$endgroup$
– Feresh Teh
1 hour ago
1
1
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with
$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.$endgroup$
– finswimmer
1 hour ago
$begingroup$
As @Wouter tells you, the non coding region of a genome is the complement of the coding regions. Coding regions have its own feature in the gtf file. You can get them with
$ awk -v FS="t" '$3=="CDS"' gencode.gtf
. Reading the manual for bedtools complement is your task.$endgroup$
– finswimmer
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
$begingroup$
Thank you but both of your commands return nothing :(
$endgroup$
– Feresh Teh
1 hour ago
add a comment |
Thanks for contributing an answer to Bioinformatics Stack Exchange!
- Please be sure to answer the question. Provide details and share your research!
But avoid …
- Asking for help, clarification, or responding to other answers.
- Making statements based on opinion; back them up with references or personal experience.
Use MathJax to format equations. MathJax reference.
To learn more, see our tips on writing great answers.
Sign up or log in
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
var $window = $(window),
onScroll = function(e) {
var $elem = $('.new-login-left'),
docViewTop = $window.scrollTop(),
docViewBottom = docViewTop + $window.height(),
elemTop = $elem.offset().top,
elemBottom = elemTop + $elem.height();
if ((docViewTop elemBottom)) {
StackExchange.using('gps', function() { StackExchange.gps.track('embedded_signup_form.view', { location: 'question_page' }); });
$window.unbind('scroll', onScroll);
}
};
$window.on('scroll', onScroll);
});
Sign up using Google
Sign up using Facebook
Sign up using Email and Password
Post as a guest
Required, but never shown
StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fbioinformatics.stackexchange.com%2fquestions%2f7098%2fexcluding-or-including-by-awk%23new-answer', 'question_page');
}
);
Post as a guest
Required, but never shown
Sign up or log in
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
var $window = $(window),
onScroll = function(e) {
var $elem = $('.new-login-left'),
docViewTop = $window.scrollTop(),
docViewBottom = docViewTop + $window.height(),
elemTop = $elem.offset().top,
elemBottom = elemTop + $elem.height();
if ((docViewTop elemBottom)) {
StackExchange.using('gps', function() { StackExchange.gps.track('embedded_signup_form.view', { location: 'question_page' }); });
$window.unbind('scroll', onScroll);
}
};
$window.on('scroll', onScroll);
});
Sign up using Google
Sign up using Facebook
Sign up using Email and Password
Post as a guest
Required, but never shown
Sign up or log in
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
var $window = $(window),
onScroll = function(e) {
var $elem = $('.new-login-left'),
docViewTop = $window.scrollTop(),
docViewBottom = docViewTop + $window.height(),
elemTop = $elem.offset().top,
elemBottom = elemTop + $elem.height();
if ((docViewTop elemBottom)) {
StackExchange.using('gps', function() { StackExchange.gps.track('embedded_signup_form.view', { location: 'question_page' }); });
$window.unbind('scroll', onScroll);
}
};
$window.on('scroll', onScroll);
});
Sign up using Google
Sign up using Facebook
Sign up using Email and Password
Post as a guest
Required, but never shown
Sign up or log in
StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
var $window = $(window),
onScroll = function(e) {
var $elem = $('.new-login-left'),
docViewTop = $window.scrollTop(),
docViewBottom = docViewTop + $window.height(),
elemTop = $elem.offset().top,
elemBottom = elemTop + $elem.height();
if ((docViewTop elemBottom)) {
StackExchange.using('gps', function() { StackExchange.gps.track('embedded_signup_form.view', { location: 'question_page' }); });
$window.unbind('scroll', onScroll);
}
};
$window.on('scroll', onScroll);
});
Sign up using Google
Sign up using Facebook
Sign up using Email and Password
Sign up using Google
Sign up using Facebook
Sign up using Email and Password
Post as a guest
Required, but never shown
Required, but never shown
Required, but never shown
Required, but never shown
Required, but never shown
Required, but never shown
Required, but never shown
Required, but never shown
Required, but never shown