<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
    <channel>
        <title>ELIXIR-UK Fellowship</title>
        <description>ELIXIR-UK Fellowship</description>
        <link>https://mingkai14.github.io/fellowship/</link>
        <atom:link href="https://mingkai14.github.io/fellowship/feed.xml" rel="self" type="application/rss+xml"/>
        <pubDate>Mon, 04 Mar 2024 05:03:43 +0000</pubDate>
        <lastBuildDate>Mon, 04 Mar 2024 05:03:43 +0000</lastBuildDate>
        <generator>Jekyll v3.9.5</generator>
        
            <item>
                <title>GTN tutorial. Making clinical datasets FAIR</title>
                <description>&lt;p&gt;The life science community is generally very good at sharing omics data on platforms such as GEO and ArrayExpress. However, the metadata and clinical data associated with the omics datasets are often incredibly sparse. Tracking down the meta- and clinical data of omics datasets can be time-consuming for both data owner and researcher and is a significant hurdle when trying to explore enriched omics data.&lt;/p&gt;

&lt;p&gt;In this tutorial, you will learn the benefits of making clinical datasets FAIR (Findable, Accessible, Interoperable, and Reusable) and how to make them FAIR.&lt;/p&gt;
</description>
                <pubDate>Wed, 01 Nov 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/gtn-tutorial-fair-clinical-data</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/gtn-tutorial-fair-clinical-data</guid>
                
                <category>Courses</category>
                
                <category>FAIR data</category>
                
                <category>Health data</category>
                
                
            </item>
        
            <item>
                <title>Using a data catalogue within a research team</title>
                <description>&lt;p&gt;Learn what is a basic data catalogue, understand how it can help you manage data files and start with the first steps to create a simple data catalogue using a given example.&lt;/p&gt;

&lt;ul&gt;
  &lt;li&gt;00:00 Learning objectives&lt;/li&gt;
  &lt;li&gt;00:25 Definition of a data catalogue&lt;/li&gt;
  &lt;li&gt;03:00 Metadata for data catalogues&lt;/li&gt;
  &lt;li&gt;04:06 Benefits of a well-managed catalogue&lt;/li&gt;
  &lt;li&gt;05:31 Example of data&lt;/li&gt;
  &lt;li&gt;06:50 Acknowledgements&lt;/li&gt;
&lt;/ul&gt;
</description>
                <pubDate>Wed, 04 Oct 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/rdmbites-using-a-data-catalogue-within-a-research-team</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/rdmbites-using-a-data-catalogue-within-a-research-team</guid>
                
                <category>RDMbites</category>
                
                <category>Data management essentials</category>
                
                
            </item>
        
            <item>
                <title>Data catalogues for large projects</title>
                <description>&lt;p&gt;Understand how to make a data catalogue work for your project, manage details of projects that feed into yours and make the data catalogue easy to use.&lt;/p&gt;

&lt;ul&gt;
  &lt;li&gt;00:00 Learning objectives&lt;/li&gt;
  &lt;li&gt;00:43 Data catalogue: definition&lt;/li&gt;
  &lt;li&gt;01:44 Study tab&lt;/li&gt;
  &lt;li&gt;02:25 Data dictionary for the data catalogue&lt;/li&gt;
  &lt;li&gt;03:47 Tips&lt;/li&gt;
  &lt;li&gt;05:16 Acknowledgments&lt;/li&gt;
&lt;/ul&gt;
</description>
                <pubDate>Wed, 04 Oct 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/rdmbites-data-catalogues-for-large-projects</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/rdmbites-data-catalogues-for-large-projects</guid>
                
                <category>RDMbites</category>
                
                <category>Data management essentials</category>
                
                
            </item>
        
            <item>
                <title>Data catalogues for different data types</title>
                <description>&lt;p&gt;Capture details of transcriptomic data in a data catalogue, adapt your data catalogue for different data types and understand how to link together related datasets.&lt;/p&gt;

&lt;ul&gt;
  &lt;li&gt;00:00 Learning objectives&lt;/li&gt;
  &lt;li&gt;00:30 Data catalogue: definition&lt;/li&gt;
  &lt;li&gt;00:58 Example: transcriptomic metadata&lt;/li&gt;
  &lt;li&gt;01:49 Columns relevant to transcriptomic data&lt;/li&gt;
  &lt;li&gt;02:40 Image datasets&lt;/li&gt;
  &lt;li&gt;05:32 Grouping linked datasets&lt;/li&gt;
  &lt;li&gt;05:00 Acknowledgments&lt;/li&gt;
&lt;/ul&gt;
</description>
                <pubDate>Wed, 04 Oct 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/rdmbites-data-catalogues-for-different-data-types</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/rdmbites-data-catalogues-for-different-data-types</guid>
                
                <category>RDMbites</category>
                
                <category>Data management essentials</category>
                
                
            </item>
        
            <item>
                <title>GTN tutorial. Sequence data submission to ENA</title>
                <description>&lt;p&gt;In this Galaxy Training Network tutorial you will learn:&lt;/p&gt;

&lt;ul&gt;
  &lt;li&gt;To populate ENA metadata objects through the Webin portal&lt;/li&gt;
  &lt;li&gt;To submit raw reads to ENA using FTP&lt;/li&gt;
&lt;/ul&gt;

&lt;p&gt;Time estimation: 1 hour&lt;/p&gt;
</description>
                <pubDate>Sat, 30 Sep 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/gtn-tutorial-ena-sequence-submission</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/gtn-tutorial-ena-sequence-submission</guid>
                
                <category>Courses</category>
                
                <category>Sequencing data</category>
                
                
            </item>
        
            <item>
                <title>Tutorial for Canto – PomBase's online community curation tool</title>
                <description>&lt;p&gt;Canto is PomBase’s online community curation tool. It enables researchers to participate directly in curating data from new publications to support the small staff of professional curators. 
This step-by-step tutorial helps these community contributors to curate papers using Canto.&lt;/p&gt;

&lt;p&gt;&lt;img src=&quot;/fellowship/images/canto-tutorial-demo.png&quot; alt=&quot;Canto Tutorial Demo&quot; /&gt;
&lt;em&gt;Screenshot of Canto tutorial&lt;/em&gt;&lt;/p&gt;
</description>
                <pubDate>Thu, 28 Sep 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/contribution-tutorial-canto</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/contribution-tutorial-canto</guid>
                
                <category>Contribution to resources</category>
                
                
            </item>
        
            <item>
                <title>GTN tutorial. FAIR data management solutions</title>
                <description>&lt;p&gt;The FAIR (Findable, Accessible, Interoperable, Reusable) data stewardship created the foundation for sharing and publishing digital assets, especially data. This apply to machine accessibility and emphasize that all digital assets should share data in a way that will enable maximum use and reuse.&lt;/p&gt;

&lt;p&gt;This tutorial is a short introduction to the FAIR data management framework.&lt;/p&gt;
</description>
                <pubDate>Wed, 27 Sep 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/gtn-tutorial-fair-data-management-solutions</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/gtn-tutorial-fair-data-management-solutions</guid>
                
                <category>Courses</category>
                
                <category>FAIR data</category>
                
                
            </item>
        
            <item>
                <title>FAIRytale. Common themes in data management emerge at the MRC’s open data workshop</title>
                <description>&lt;p&gt;In October of 2022, I hosted an all-day seminar at the MRC Biostatistics unit to give a community of like-minded researchers a chance to discuss and explain the implications of open-data practice for their research [1]. The day was a resounding success, with a number of excellent talks and conversations. One thing I found particularly interesting – as a member of the research support team – was how often the same themes re-emerged despite the range of research interests represented. This feeling has only strengthened during my time as a fellow.&lt;/p&gt;

&lt;p&gt;While all the conference attendees were from fields broadly considered ‘the life sciences’, the event had an interdisciplinary feel. Even so, throughout various applications, the data needs (and challenges) remained remarkably consistent. Many attendees had heard of the FAIR principles [2][3][4] before, but those that were new to the concepts were surprised by how well FAIR captures the challenges they faced. The dominant feeling over our four sessions was that often, researchers get half/most of the way with their open data effort but then undervalue how important those final steps are.&lt;/p&gt;

&lt;p&gt;One ‘final step’ that was often missed was providing long-term hosting solutions for data, and several conversations revolved around how important this is. We heard several horror stories of important data sets that were (in theory) ‘available on request from the corresponding author’ but in actuality, could not be accessed, sometimes as close to 6 months after publication date. Similarly, several attendees had navigated to self-hosted websites that gave 404 errors within a year of being mentioned in published research. While this might seem disheartening, this is something of a solved problem with Figshare [5] and Zenodo [6] providing hosting platforms that will last for as good as forever.&lt;/p&gt;

&lt;p&gt;The presence (or absence) of appropriate metadata was a second key finding of our workshop. This was particularly important to researchers using genetics data as minor convention/naming differences could cause several hours to be lost when trying to run the data through a new algorithm. Unfortunately, it can be difficult to establish one-size-fits-all metadata principles as the required information tends to be very field-specific. In an ideal world, everyone would provide ‘as much metadata as possible’, but several colleagues were keen to point out that this is often impractical and leads to crude full data dumps in which useful information is drowned out by unhelpfully large numbers of files containing information of little to no value.&lt;/p&gt;

&lt;p&gt;The workshop had a huge range of perspectives, and I found the day fascinating. I hope this FAIRy Tale has helped to illustrate that doing the basics really well can be a huge source of value for both you and future researchers. In particular, it’s essential to use a long-term, stable hosting platform for as much of your research data as possible and to provide accurate, complete and (ideally) concise metadata so that a new researcher can get up to speed with your data as quickly as possible.&lt;/p&gt;

&lt;h2 id=&quot;further-reading&quot;&gt;Further reading&lt;/h2&gt;

&lt;ol&gt;
  &lt;li&gt;Open data. &lt;a href=&quot;https://www.ukri.org/manage-your-award/publishing-your-research-findings/making-your-research-data-open/&quot;&gt;https://www.ukri.org/manage-your-award/publishing-your-research-findings/making-your-research-data-open/&lt;/a&gt;&lt;/li&gt;
  &lt;li&gt;FAIR principles. &lt;a href=&quot;https://www.nature.com/articles/sdata201618&quot;&gt;https://www.nature.com/articles/sdata201618&lt;/a&gt;&lt;/li&gt;
  &lt;li&gt;FAIR pointers Carpentries course: &lt;a href=&quot;https://elixir-uk-dash.github.io/FAIR-Pointers/&quot;&gt;https://elixir-uk-dash.github.io/FAIR-Pointers/&lt;/a&gt;&lt;/li&gt;
  &lt;li&gt;FAIR in (biological) practice Carpentries course: &lt;a href=&quot;https://carpentries-incubator.github.io/fair-bio-practice/&quot;&gt;https://carpentries-incubator.github.io/fair-bio-practice/&lt;/a&gt;&lt;/li&gt;
  &lt;li&gt;Figshare. &lt;a href=&quot;https://figshare.com/&quot;&gt;https://figshare.com/&lt;/a&gt;&lt;/li&gt;
  &lt;li&gt;Zenodo.  &lt;a href=&quot;https://zenodo.org/&quot;&gt;https://zenodo.org/&lt;/a&gt;&lt;/li&gt;
&lt;/ol&gt;
</description>
                <pubDate>Mon, 25 Sep 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/outreach-fairytale-phillip</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/outreach-fairytale-phillip</guid>
                
                <category>Outreach</category>
                
                <category>FAIR data</category>
                
                
            </item>
        
            <item>
                <title>GTN tutorial. REMBI, Recommended Metadata for Biological Images – metadata guidelines for bioimaging data</title>
                <description>&lt;p&gt;In this Galaxy Training Network tutorial you will:&lt;/p&gt;
&lt;ul&gt;
  &lt;li&gt;Organise bioimage metadata&lt;/li&gt;
  &lt;li&gt;Find out what REMBI is and why it is useful&lt;/li&gt;
  &lt;li&gt;Categorise what metadata belongs to each of the submodules of REMBI&lt;/li&gt;
  &lt;li&gt;Gather the metadata for an example bioimage dataset&lt;/li&gt;
&lt;/ul&gt;

&lt;p&gt;Time estimation: 15 minutes&lt;/p&gt;

</description>
                <pubDate>Mon, 11 Sep 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/gtn-tutorial-rembi-metadata</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/gtn-tutorial-rembi-metadata</guid>
                
                <category>Courses</category>
                
                <category>Bioimage data</category>
                
                
            </item>
        
            <item>
                <title>GTN tutorial. Filter, plot and explore single-cell RNA-seq data</title>
                <description>&lt;p&gt;You’ve done all the work to make a single cell matrix, with gene counts and mitochondrial counts and buckets of cell metadata from all your variables of interest. Now it’s time to fully process your data, to remove low quality cells, to reduce the many dimensions of data that make it difficult to work with, and ultimately to try to define clusters and to find biological meaning and insights.&lt;/p&gt;

&lt;p&gt;This tutorial works with Scanpy, because currently Galaxy hosts the most Scanpy tools of all of those options.&lt;/p&gt;
</description>
                <pubDate>Mon, 11 Sep 2023 00:00:00 +0000</pubDate>
                <link>https://mingkai14.github.io/fellowship/latest/gtn-tutorial-single-cell</link>
                <guid isPermaLink="true">https://mingkai14.github.io/fellowship/latest/gtn-tutorial-single-cell</guid>
                
                <category>Courses</category>
                
                <category>Sequencing data</category>
                
                <category>Single-cell data</category>
                
                
            </item>
        
    </channel>
</rss>