Training Material List
Handles creating, reading and updating training materials.
GET /api/trainingmaterial/?format=api&offset=100&ordering=description
{ "count": 149, "next": "https://catalogue.france-bioinformatique.fr/api/trainingmaterial/?format=api&limit=20&offset=120&ordering=description", "previous": "https://catalogue.france-bioinformatique.fr/api/trainingmaterial/?format=api&limit=20&offset=80&ordering=description", "results": [ { "id": 137, "name": "Linux slides", "description": "Slides for linux session (genotoul bioinfo facility)", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://bioinfo.genotoul.fr/wp-content/uploads/Formation_LINUX_GenoToul_2024.pdf", "fileName": "Formation_LINUX_GenoToul_2024.pdf", "topics": [], "keywords": [ "Operating systems" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "Novice", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": "CC BY-NC-SA", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/300/?format=api" ] }, { "id": 1, "name": "SG-ONT-slides", "description": "Slides used for the training \"\t\r\nIntroduction to Oxford Nanopore Technology data analyses\"", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://southgreenplatform.github.io/trainings//files/ont_2021.pdf", "fileName": "ont_2021.pdf", "topics": [], "keywords": [], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2022-01-24", "dateUpdate": "2022-01-24", "licence": "Creative Commons Attribution 4.0 International License", "maintainers": [] }, { "id": 51, "name": "Eukaryotic small RNA", "description": "\n \n\nSmall RNAseq data analysis for miRNA identification\n \n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://ressources.france-bioinformatique.fr/sites/default/files/sRNA-Seq.pdf", "fileName": "missing.txt", "topics": [], "keywords": [ "RNA-seq" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-11-23", "dateUpdate": null, "licence": null, "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/642/?format=api" ] }, { "id": 81, "name": "Assessing microbial biogeography by using a metagenomic approach", "description": "Soils are highly complex ecosystems and are considered as one of the Earth’s main reservoirs of biological diversity. Bacteria account for a major part of this biodiversity, and it is now clear that such microorganisms have a key role in soil functioning processes. However, environmental factors regulating the diversity of below-ground bacteria still need to be investigated, which limits our understanding of the distribution of such bacteria at various spatial scales. The overall objectives of this study were: (i) to determine the spatial patterning of bacterial community diversity in soils at a broad scale, and (ii) to rank the environmental filters most influencing this distribution.\nThis study was performed at the scale of the France by using the French Soil Quality Monitoring Network. This network includes more than 2,200 soil samples along a systematic grid sampling. For each soil, bacterial diversity was characterized using a pyrosequencing approach targeting the 16S rRNA genes directly amplified from soil DNA, obtaining more than 18 million of high-quality sequences.\nThis study provides the first estimates of microbial diversity at the scale of France, with for example, bacterial richness ranging from 555 to 2,007 OTUs (on average: 1,289 OTUs). It also provides the first extensive map of bacterial diversity, as well as of major bacterial taxa, revealing a bacterial heterogeneous and spatially structured distribution at the scale of France. The main factors driving bacterial community distribution are the soil physico-chemical properties (pH, texture...) and land use (forest, grassland, crop system...), evidencing that bacterial spatial distribution at a broad scale depends on local filters such as soil characteristics and land use when regarding the community (quality, composition) as a whole. Moreover, this study also offers a better evaluation of the impact of land uses on soil microbial diversity and taxa, with consequences in terms of sustainability for agricultural systems.\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/videos/scorms/metagenomics16/session_4/Assessing_microbial_biogeography_by_using_a_metagenomic_approach/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Metagenomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-12-16", "dateUpdate": null, "licence": "CC BY-NC-ND", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/709/?format=api" ] }, { "id": 4, "name": "Support tools for rapid adoption of compact identifiers in the publishing process", "description": "\n \n\nSupport tools for rapid adoption of compact identifiers in the publishing process\n \n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://ressources.france-bioinformatique.fr/sites/default/files/videos/scorms/support-tools_78a0/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "biohackaton 2018" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2019-03-21", "dateUpdate": null, "licence": null, "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/668/?format=api" ] }, { "id": 100, "name": "REPET: TEdannot Tutorial", "description": "TEannot is able to annote a genome using DNA sequences library. This library can be a predicted TE library built by TEdenovo\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://urgi.versailles.inra.fr/Tools/REPET/TEannot-tuto", "fileName": "missing.txt", "topics": [], "keywords": [ "genomics", "Annotation" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": "CeCILL", "maintainers": [] }, { "id": 117, "name": "Chip-seq: Peak calling tutorial", "description": "The aim is to :\nUnderstand how to process reads to obtain peaks (peak-calling).\nBecome familiar with differential analysis of peaks\nIn practice :\nObtain dataset from GEO\nAnalyze mapped reads\nObtain set(s) of peaks, handle replicates\nDifferential analysis of peak\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://dputhier.github.io/EBA_2015_ChIP-Seq/tutorial/01_peak_calling/peak_calling_tutorial.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Chip-Seq", "Peak calling", "NGS" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": null, "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/698/?format=api", "https://catalogue.france-bioinformatique.fr/api/userprofile/644/?format=api", "https://catalogue.france-bioinformatique.fr/api/userprofile/721/?format=api", "https://catalogue.france-bioinformatique.fr/api/userprofile/512/?format=api" ] }, { "id": 78, "name": "Dr Jekyll and Mr Hyde: The dual face of metagenomics in phylogenetic analysis", "description": "The aim of this lecture is to present the impact of metagenomics and single-cell genomics on public databases. These new powerful approches allow us to have access to the diversity of life on our planet. However, care has to be taken when using these data for posterior analyses, such as phylogenetic studies, as critical errors can still be present in the databases. This course will incorporate examples taken from real studies, and we will investigate methods used for error detection.\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/videos/scorms/metagenomics16/session_5/Dr_Jekyll_and_Mr_Hyde_The_dual_face_of_metagenomics_in_phylogenetic_analysis/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Metagenomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-12-16", "dateUpdate": null, "licence": "CC BY-NC-ND", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/706/?format=api" ] }, { "id": 75, "name": "Fast filtering, mapping and assembly of 16S ribosomal RNA", "description": "The application of next-generation sequencing technologies to RNA or DNA directly extracted from a community of organisms yields a mixture of nucleotide fragments. The task to distinguish amongst these and to further categorize the families of ribosomal RNAs (or any other given marker) is an important step for examining the phylogenetic classification of the constituting species. In this perspective, we have developed a complete bioinformatics suite, called MATAM, capable of handling large sets of reads in a fast and accurate way. MATAM covers all steps of the analysis, from the identification of reads of interest in the raw sequencing data to the reconstruction of the full-length sequences of the marker and alignment to a reference database for taxonomic assignment. Part of MATAM is based on the SortMeRNA software, also developed by the team.\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/videos/scorms/metagenomics16/session_6/Fast_filtering_mapping_and_assembly_of_16S_rRNA/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Metagenomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-12-16", "dateUpdate": null, "licence": "CC BY-NC-ND", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/610/?format=api" ] }, { "id": 83, "name": "Rationale and Tools to look for the unknown in (metagenomic) sequence data", "description": "The interpretation of metagenomic data (environmental, microbiome, etc, ...) usually involves the recognition of sequence similarity with previously identified (micro-organisms). This is for instance the main approach to taxonomical assignments and a starting point to most diversity analyses. When exploring beyond the frontier of known biology, one should expect a large proportion of environmental sequences not exhibiting any significant similarity with known organisms. Notably, this is the case for eukaryotic viruses belonging to new families, for which the proportion of \"no match\" could reach 90%. Most metagenomics studies tend to ignore this large fraction of sequences that might be the equivalent of \"black matter\" in Biology. We will present some of the ideas and tools we are using to extract that information from large metagenomics data sets in search of truly unknown microorganisms.\nOne of the tools, \"Seqtinizer\", an interactive contig selection/inspection interface will also be presented in the context of \"pseudo-metagenomic\" projects, where the main organism under genomic study (such as sponges or corals) turns out to be (highly) mixed with an unexpected population of food, passing-by, or symbiotic microorganisms.\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/videos/scorms/metagenomics16/session_3/Rational_and_tools_to_look_for_the_unknown_in_sequence_data/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Metagenomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-12-16", "dateUpdate": null, "licence": "CC BY-NC-ND", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/123/?format=api" ] }, { "id": 72, "name": "Hidden in the permafrost", "description": "The last decade witnessed the discovery of four families of giant viruses infecting Acanthamoeba. They have genome encoding from 500 to 2000 genes, a large fraction of which encoding proteins of unknown origin. These unique proteins meant to recognize and manipulate the same building blocks as cells raise the question on their origin as well as the role viruses played in the cellular word evolution. The Mimiviridae and the Pandoraviridae are increasingly populated by members from very diverse habitats and are ubiquitous on the planet. After prospecting the space, we went back in the past and isolated two other giant virus families from a 30,000 years old permafrost sample, Pithovirus and Mollivirus sibericum. A metagenomics study of the sample was performed to inventory its biodiversity and assess to what extend the host and the viruses were dominant. I will describe the two sequencing approaches which have been used and compare the results.\n1: Raoult D, Audic S, Robert C, Abergel C, Renesto P, Ogata H, La Scola B, Suzan M, Claverie JM. The 1.2-megabase genome sequence of Mimivirus. Science. 2004 Nov 19;306(5700):1344-50.\n2: Philippe N, Legendre M, Doutre G, Couté Y, Poirot O, Lescot M, Arslan D, Seltzer V, Bertaux L, Bruley C, Garin J, Claverie JM, Abergel C. Pandoraviruses: amoeba viruses with genomes up to 2.5 Mb reaching that of parasitic eukaryotes. Science. 2013 Jul 19;341(6143):281-6. \n3: Legendre M, Bartoli J, Shmakova L, Jeudy S, Labadie K, Adrait A, Lescot M, Poirot O, Bertaux L, Bruley C, Couté Y, Rivkina E, Abergel C, Claverie JM. Thirty-thousand-year-old distant relative of giant icosahedral DNA viruses with a pandoravirus morphology. Proc Natl Acad Sci U S A. 2014 Mar 18;111(11):4274-9.\n4: Legendre M, Lartigue A, Bertaux L, Jeudy S, Bartoli J, Lescot M, Alempic JM, Ramus C, Bruley C, Labadie K, Shmakova L, Rivkina E, Couté Y, Abergel C, Claverie JM. In-depth study of Mollivirus sibericum, a new 30,000-y-old giant virus infecting Acanthamoeba. Proc Natl Acad Sci U S A. 2015 Sep 22;112(38):E5327-35.\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/videos/scorms/metagenomics16/session_7/Hidden_in_permafrost/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Metagenomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-12-16", "dateUpdate": null, "licence": "CC BY-NC-ND", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/123/?format=api", "https://catalogue.france-bioinformatique.fr/api/userprofile/703/?format=api" ] }, { "id": 150, "name": "Plant Data Managment for Phenotyping Experiments - MIAPPE", "description": "The Minimal Information About Plant Phenotyping Experiment, MIAPPE (www.miappe.org) has been designed by ELIXIR, EMPHASIS and Bioversity international, to guide plant scientist in the management of experimental data. Furthermore, since genetic studies relies on the integration and the linking between phenotype and genotype datasets, relevant section of MIAPPE are beginning to be used for genotyping standards. This Webinar will give an overview of the current practices and methods for plant phenotyping data standardization, and how to deal with the variability and heterogeneity inherent to research and breeding data sets. Data management approaches at some of the major research organizations will be given as examples.", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://hal.inrae.fr/hal-03102944", "fileName": "2020-12-MIAPPE-Webinar.pdf", "topics": [ "http://edamontology.org/topic_0625" ], "keywords": [ "Données" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "Novice", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": "CC BY-SA 4.0", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/441/?format=api" ] }, { "id": 99, "name": " PASTEClassifier Tutorial", "description": "The PASTEClassifier (Pseudo Agent System for Transposable Elements Classification) is a transposable element (TE) classifier searching for structural features and similarity to classify TEs ( Hoede C. et al. 2014 )\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://urgi.versailles.inra.fr/Tools/PASTEClassifier/PASTEClassifier-tuto", "fileName": "missing.txt", "topics": [], "keywords": [ "genomics", "Transposons" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": "CeCILL", "maintainers": [] }, { "id": 79, "name": "Soil metagenomics, potential and pitfalls", "description": "The soil microorganisms are responsible for a range of critical functions including those that directly affect our quality of life (e.g., antibiotic production and resistance – human and animal health, nitrogen fixation -agriculture, pollutant degradation – environmental bioremediation). Nevertheless, genome structure information has been restricted by a large extent to a small fraction of cultivated species. This limitation can be circumvented now by modern alternative approaches including metagenomics or single cell genomics. Metagenomics includes the data treatment of DNA sequences from many members of the microbial community, in order to either extract a specific microorganism’s genome sequence or to evaluate the community function based on the relative quantities of different gene families. In my talk I will show how these metagenomic datasets can be used to estimate and compare the functional potential of microbial communities from various environments with a special focus on antibiotic resistance genes. However, metagenomic datasets can also in some cases be partially assembled into longer sequences representing microbial genetic structures for trying to correlate different functions to their co-location on the same genetic structure. I will show how the microbial community composition of a natural grassland soil characterized by extremely high microbial diversity could be managed for sequentially attempt to reconstruct some bacterial genomes.\nMetagenomics can also be used to exploit the genetic potential of environmental microorganisms. I will present an integrative approach coupling rrs phylochip and high throughput shotgun sequencing to investigate the shift in bacterial community structure and functions after incubation with chitin. In a second step, these functions of potential industrial interest can be discovered by using hybridization of soil metagenomic DNA clones spotted on high density membranes by a mix of oligonucleotide probes designed to target genes encoding for these enzymes. After affiliation of the positive hybridizing spots to the corresponding clones in the metagenomic library the inserts are sequenced, DNA assembled and annotated leading to identify new coding DNA sequences related to genes of interest with a good coverage but a low similarity against closest hits in the databases confirming novelty of the detected and cloned genes.\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/videos/scorms/metagenomics16/session_4/Soil_metagenomics_fundamental_and_applications/scormcontent/index.html", "fileName": "missing.txt", "topics": [], "keywords": [ "Metagenomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-12-16", "dateUpdate": null, "licence": "CC BY-NC-ND", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/707/?format=api" ] }, { "id": 101, "name": "REPET: TEdenovo tutorial", "description": "The TEdenovo pipeline follows a philosophy in three first steps:\nDetection of repeated sequences (potential TE)\nClustering of these sequences\nGeneration of consensus sequences for each cluster, representing the ancestral TE\n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://urgi.versailles.inra.fr/Tools/REPET/TEdenovo-tuto", "fileName": "missing.txt", "topics": [], "keywords": [ "genomics", "Annotation" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": "CeCILL", "maintainers": [] }, { "id": 136, "name": "training RNASeq biostat part", "description": "This course is part of the INRAE training session about “bioinformatics and biostatistics analysis of RNA-seq data” and of the Biostatistics platform “Initiation à LA statistique, niveau 4”. \r\nThe material provided on the present webpage is related to the biostatistics part and covers the following topics:\r\n\r\nR and RStudio\r\ndesign of experiments\r\nvariability\r\ncount data normalization\r\ndifferential analysis\r\nThe material has originally been prepared by Ignacio Gonzales, Annick Moisan and myself. The class has already been taught by these persons but also by Gaëlle Lefort and Jérôme Mariette.\r\n\r\nPre-requisites: A background in R programming is necessary for this class. Before the class, please download the course material and install R, RStudio and the packages as described below. To produce high quality figures, I will use ggplot2 for plots but will not enter into details about the ggplot2 syntax. If you are not familiar with it, you can just use these command lines or switch to base plots instead.", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://www.nathalievialaneix.eu/teaching/rnaseq.html", "fileName": "rnaseq.html", "topics": [], "keywords": [], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "Intermediate", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": null, "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/300/?format=api" ] }, { "id": 104, "name": "Exploring microbiomes with the MicroScope Platform", "description": "This module is separated in different courses:\nMicroScope: General overview, Keyword search and gene cart functionalities\n\n\n\n\n\n\n\n\n\n\n\n\nFunctional annotation of microbial genomes\n\n\n\n\n\n\n\n\nFunctional annotation of microbial genomes: Prediction of enzymatic functions\n\n\n\n\n\n\n\n\nRelational annotation of bacterial genomes: synteny\n\n\n\n\n\n\n\n\nAutomatic functional assignation and expert annotation of genes\n\n\n\n\n\n\n\n\nRelational annotation of bacterial genomes: phylogenetic profiles\n\n\n\n\n\n\n\n\nRelational annotation of bacterial genomes: pan-genome analysis\n\n\n\n\n\n\n\n\nRelational annotation of bacterial genomes: metabolic pathways\n\n\n\n\nSyntactic re-annotation of public microbial genomes\n\n\n\n\nSyntactic annotation of microbial genomes\n\n\n\n\n \n", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "http://www.france-bioinformatique.fr/sites/default/files/Cours_MicroScope_mars2016_18-125.pdf", "fileName": "missing.txt", "topics": [], "keywords": [ "genomics", "Annotation", "Transcriptomics", "Microbial evolution", "Metabolomics" ], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": "2016-03-01", "dateUpdate": null, "licence": null, "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/718/?format=api" ] }, { "id": 126, "name": "Galaxy 101 for everyone", "description": "This practical aims at familiarizing you with the Galaxy user interface. It will teach you how to perform basic tasks such as importing data, running tools, working with histories, creating workflows and sharing your work. Not everyone has the same background and that’s ok!", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://training.galaxyproject.org/training-material/topics/introduction/tutorials/galaxy-intro-101-everyone/tutorial.html", "fileName": "galaxy-intro-101-everyone", "topics": [], "keywords": [], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [], "dateCreation": null, "dateUpdate": null, "licence": "CC-BY-4.0", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/677/?format=api" ] }, { "id": 147, "name": "Data-brokering script", "description": "This project generates metadata in JSON-LD format for plant and animal biological samples and submits them to the European Nucleotide Archive (ENA)'s BioSamples database. The metadata is extracted from an Excel file and validated against the Plant MIAPPE checklist for plant samples and against the BioSamples minimal checklist for animal samples. Samples are then either submitted as new entries or updated if they already exist in the database.", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://forgemia.inra.fr/urgi-is/data-brokering", "fileName": "submit_data_biosamples_X.py", "topics": [], "keywords": [], "audienceTypes": [], "audienceRoles": [], "difficultyLevel": "", "providedBy": [ { "id": 26, "name": "URGI", "url": "https://catalogue.france-bioinformatique.fr/api/team/URGI/?format=api" } ], "dateCreation": null, "dateUpdate": null, "licence": "CC-BY-4.0", "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/441/?format=api", "https://catalogue.france-bioinformatique.fr/api/userprofile/813/?format=api" ] }, { "id": 146, "name": "Processing_large_files_with_sed_awk_2024", "description": "This “Sed and AWK to modify large text files” training session is organized by the Genotoul bioinfo platform.\r\n\r\nThe Linux sed command is a powerful and very fast text editor without an interface. Sed can select, substitute, add, delete, and modify text in files and streams. Sed relies heavily on regular expressions for pattern matching and text selection. We’ll manipulate regexes and the sed command to modify and filter several type of file often used in bioinformatics.\r\n\r\nAWK enables to easily process columns in large text files but is also a quite powerfull programming language. This training session aims at introducing you AWK principles. You will learn about variables, operators and functions useful to manipulate very large files. \r\n\r\nFor example you can use AWK to generate your unix command lines to be launched on the cluster. AWK enables to process millions of lines in text files. The course includes short feature presentations between long hands-on sessions in which you will be able to understand the global ideas as well as details.", "communities": [], "elixirPlatforms": [], "doi": null, "fileLocation": "https://web-genobioinfo.toulouse.inrae.fr/~klopp/SedAwk2024/Processing_large_files_with_sed_awk_2024.pdf", "fileName": "Processing_large_files_with_sed_awk_2024.pdf", "topics": [], "keywords": [], "audienceTypes": [ "Professional (continued)" ], "audienceRoles": [ "Biologists", "Bioinformaticians" ], "difficultyLevel": "Intermediate", "providedBy": [ { "id": 22, "name": "Genotoul-bioinfo", "url": "https://catalogue.france-bioinformatique.fr/api/team/Genotoul-bioinfo/?format=api" } ], "dateCreation": null, "dateUpdate": "2024-03-01", "licence": null, "maintainers": [ "https://catalogue.france-bioinformatique.fr/api/userprofile/300/?format=api" ] } ] }