<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i7e18059</article-id>
      <article-id pub-id-type="pmid">32459633</article-id>
      <article-id pub-id-type="doi">10.2196/18059</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Characterization and Correction of Bias Due to Nonparticipation and the Degree of Loyalty in Large-Scale Finnish Loyalty Card Data on Grocery Purchases: Cohort Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sperrin</surname>
            <given-names>Matthew</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Morris</surname>
            <given-names>Michelle</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Vuorinen</surname>
            <given-names>Anna-Leena</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Faculty of Social Sciences (Health Sciences)</institution>
            <institution>Tampere University</institution>
            <addr-line>Arvo Ylpön katu 34</addr-line>
            <addr-line>FI-33014</addr-line>
            <addr-line>Tampere, </addr-line>
            <country>Finland</country>
            <phone>358 408485966</phone>
            <email>anna-leena.vuorinen@vtt.fi</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5658-1305</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Erkkola</surname>
            <given-names>Maijaliisa</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6966-1523</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Fogelholm</surname>
            <given-names>Mikael</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8110-102X</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Kinnunen</surname>
            <given-names>Satu</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7673-0243</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Saarijärvi</surname>
            <given-names>Hannu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5803-9037</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Uusitalo</surname>
            <given-names>Liisa</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2616-5260</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Näppilä</surname>
            <given-names>Turkka</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0562-7254</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Nevalainen</surname>
            <given-names>Jaakko</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6295-0245</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Faculty of Social Sciences (Health Sciences)</institution>
        <institution>Tampere University</institution>
        <addr-line>Tampere</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>VTT Technical Research Centre of Finland Ltd</institution>
        <addr-line>Tampere</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Food and Nutrition</institution>
        <institution>University of Helsinki</institution>
        <addr-line>Helsinki</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Faculty of Management and Business</institution>
        <institution>Tampere University</institution>
        <addr-line>Tampere</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Tampere University Library</institution>
        <institution>Tampere University</institution>
        <addr-line>Tampere</addr-line>
        <country>Finland</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Anna-Leena Vuorinen <email>anna-leena.vuorinen@vtt.fi</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>15</day>
        <month>7</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>7</issue>
      <elocation-id>e18059</elocation-id>
      <history>
        <date date-type="received">
          <day>31</day>
          <month>1</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>5</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Anna-Leena Vuorinen, Maijaliisa Erkkola, Mikael Fogelholm, Satu Kinnunen, Hannu Saarijärvi, Liisa Uusitalo, Turkka Näppilä, Jaakko Nevalainen. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 15.07.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2020/7/e18059/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>To date, the evaluation of diet has mostly been based on questionnaires and diaries, which have limitations in that they are time and resource intensive and prone to social desirability bias. Loyalty card data obtained in retailing provide timely and objective information on diet-related behaviors. In Finland, the market is highly concentrated, which provides a unique opportunity to investigate diet through grocery purchases.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aims of this study were as follows: (1) to investigate and quantify the selection bias in large-scale (n=47,066) loyalty card (LoCard) data and correct the bias by developing weighting schemes and (2) to investigate how the degree of loyalty relates to food purchases.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Members of a loyalty card program from a large retailer in Finland were contacted via email and invited to take part in the study, which involved consenting to the release of their grocery purchase data for research purposes. Participants’ sociodemographic background was obtained through a web-based questionnaire and was compared to that of the general Finnish adult population obtained via Statistics Finland. To match the distributions of sociodemographic variables, poststratification weights were constructed by using the raking method. The degree of loyalty was self-estimated on a 5-point rating scale.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>On comparing our study sample with the general Finnish adult population, in our sample, there were more women (65.25%, 30,696/47,045 vs 51.12%, 2,273,139/4,446,869), individuals with higher education (56.91%, 20,684/36,348 vs 32.21%, 1,432,276/4,446,869), and employed individuals (60.53%, 22,086/36,487 vs 52.35%, 2,327,730/4,446,869). Additionally, in our sample, there was underrepresentation of individuals aged under 30 years (14.44%, 6,791/47,045 vs 18.04%, 802,295/4,446,869) and over 70 years (7.94%, 3,735/47,045 vs 18.20%, 809,317/4,446,869), as well as retired individuals (23.51%, 8,578/36,487 vs 31.82%, 1,414,785/4,446,869). Food purchases differed by the degree of loyalty, with higher shares of vegetable, red meat &#38; processed meat, and fat spread purchases in the higher loyalty groups.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Individuals who consented to the use of their loyalty card data for research purposes tended to diverge from the general Finnish adult population. However, the high volume of data enabled the inclusion of sociodemographically diverse subgroups and successful correction of the differences found in the distributions of sociodemographic variables. In addition, it seems that food purchases differ according to the degree of loyalty, which should be taken into account when researching loyalty card data. Despite the limitations, loyalty card data provide a cost-effective approach to reach large groups of people, including hard-to-reach population subgroups.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>loyalty card data</kwd>
        <kwd>diet</kwd>
        <kwd>selection bias</kwd>
        <kwd>weighting</kwd>
        <kwd>raking</kwd>
        <kwd>food</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Diet has a substantial impact on human health. Poor dietary habits are associated with obesity and a wide range of chronic diseases, including type 2 diabetes, cancer, and cardiovascular diseases [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Suboptimal diet is responsible for more deaths than any other risk factor globally [<xref ref-type="bibr" rid="ref3">3</xref>]. It is therefore imperative to collect timely and valid information on diet and individual risk factors.</p>
      <p>To date, the evaluation of diet has mostly been based on questionnaires and diaries [<xref ref-type="bibr" rid="ref4">4</xref>]. Although valuable in research, data collection with such instruments, particularly food diaries, is time and resource intensive, and the information is gained with a considerable delay. They also suffer from participant tendency toward social desirability [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Moreover, the information gained through questionnaires is subject to recall bias with participants not reporting all foods consumed [<xref ref-type="bibr" rid="ref4">4</xref>]. Another limitation with dietary surveys as well as health surveys in general is selection bias, which manifests as healthy, socioeconomically advantaged, middle-aged women being the most likely to enroll in these studies [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>The continued development of innovative digital tools and digital data repositories provides novel opportunities for epidemiological research [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Web-based data collection instruments [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] and consumer-generated data are increasingly being used for health research purposes [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. While such novel data collection methods and tools may overcome some of the problems faced with traditional methods, some of the limitations remain, of which selection bias is a major concern [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Namely, those who generate the data are frequently highly selected and likely to differ from the general population, tending to be wealthier and healthier. For instance, smartphone users, and subsequently mobile health app and social media users, are younger, better educated, and wealthier than individuals in the general population [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]. However, automated data collection, which is a typical feature for these instruments and tools, provides objective measures on individuals’ health behaviors and thus decreases information bias.</p>
      <p>Food purchase data have invoked interest as a novel approach to enrich diet and nutrition research efforts [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. So far, most of the published studies have used panel-based data, with all grocery purchase receipts scanned at home [<xref ref-type="bibr" rid="ref26">26</xref>]. While such studies are frequently large and may include data from multiple sources, they are limited by recording discrepancies [<xref ref-type="bibr" rid="ref27">27</xref>]. In addition, receipt scanning requires consistent efforts and long-term engagement from the participants [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. In this study, we used loyalty card data (ie, individual-level grocery transaction data generated by retail food chains). Importantly, loyalty card data contain information about what was bought, where, when, and by whom, thus enabling longitudinal tracking of the purchase behaviors of a single customer or a household over time. Objective measures of food purchases have been shown to correlate with one’s food intake and overall diet quality [<xref ref-type="bibr" rid="ref28">28</xref>]. Loyalty card data also accumulate automatically in retailers’ information technology systems, producing objective and up-to-date information in a cost-effective manner. However, loyalty card data have shortfalls that could impede their usefulness for research. First, consumers may distribute their purchases among different retailers. Therefore, loyalty card data from a single retailer most likely do not include all food purchases conducted by consumers. However, in Finland, the market is highly centralized with the three biggest market chains claiming over 90% of the market share, and the largest operator having a market share as high as 47% [<xref ref-type="bibr" rid="ref30">30</xref>]. Such centralization provides a unique opportunity to investigate heterogeneous populations through a single retailer.</p>
      <p>The aims of this study were as follows: (1) to investigate and quantify selection bias in Finnish large-scale loyalty card (LoCard) data and further develop a means to correct this bias by characterizing the loyalty card data consenters and comparing their sociodemographic background to that of the general Finnish adult population and (2) to assess how the degree of loyalty relates to food purchases by investigating the self-perceived degree of loyalty (share of total grocery purchases in retailers’ shops and supermarkets) and its association with food purchases. The overall purpose of this research was to increase the understanding of how loyalty card data should be understood and subsequently analyzed in dietary and health research.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design and Participation</title>
        <p>The LoCard data used in this study were obtained from S Group, which is the largest commercial operator of retail grocery stores in Finland. According to S Group, their full coverage is 2.4 million households, meaning that 88% of households in Finland have registered purchases in their databases. The members of S Group’s loyalty card program are provided with an electronic customer card to be used when making purchases, and customers are rewarded for their purchases by getting a maximum 5% financial bonus that is refunded to them on a monthly basis. Individuals of the same household may link their purchases to the same loyalty account. In this study, only purchases of the household’s main cardholder were used.</p>
        <p>Members of S Group’s loyalty card program (primary cardholders) across Finland were contacted via email and were invited to take part in the study, which involved consenting to the release of their grocery purchase data to be used for research purposes and voluntarily responding to the study questionnaire. Members who did not have an email address declared or who had prohibited the retailer from contacting them with any marketing or research-related material were excluded. Cardholders under 18 years of age were also excluded. All invitations were sent by S Group as they had customers’ contact information.</p>
        <p>The grocery purchase data used in this study covered the period from January 1, 2017, to December 31, 2018. Each purchase was associated with item description, time stamp, quantity (ie, weight, volume, or number of packages), and expenditure on the item.</p>
      </sec>
      <sec>
        <title>Background Variables</title>
        <p>All consenting participants were asked to fill out a web-based background questionnaire that included the following sociodemographic variables: education, marital status, size of the household, number and age of children, occupational status, income, and perceived health. The background data were complemented with information on participant sex, age, and postal code obtained from the retailer’s electronic database.</p>
      </sec>
      <sec>
        <title>Degree of Loyalty</title>
        <p>As part of the baseline questionnaire, all participants were asked to estimate their degree of loyalty as a share of purchases made in the retailer’s shops and supermarkets on a five-item ordinal scale. The response categories were as follows: “0%-20%,” “21%-40%,” “41%-60%,” “61%-80%,” and “81%-100%.”</p>
      </sec>
      <sec>
        <title>Food Variables and Food Groups</title>
        <p>The LoCard grocery purchase data required preprocessing to be usable in further analyses. First, we identified food groups from all the grocery product groups. Second, we regrouped the identified food groups into new groups that were formed on the basis of the commonly used food groupings in nutritional studies [<xref ref-type="bibr" rid="ref31">31</xref>] and earlier findings on the associations between dietary components and health [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. For instance, skimmed liquid milk and buttermilk were aggregated into “skimmed milk &#38; sour milk” and foods and mixed dishes with red or processed meat as the main ingredient were aggregated into “red meat &#38; processed meat.”</p>
        <p>Out of 4234 grocery product groups, 865 (20.4%) were assigned into one of the new food groups used in this study. In addition, 42 food groups were left out as they involved either (1) a mixed dish or food group with no definite primary ingredient or (2) a rarely purchased product. The food groups used in this study included “vegetables,” “skimmed milk &#38; sour milk,” “sugar-sweetened beverages,” “rye bread,” “red meat &#38; processed meat,” “fat spreads,” and “sweets &#38; chocolate.” These groups were used as indicators for evaluating the nutritional quality of household food purchases. A detailed description about the grouping of the food purchase data is included in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Reference Material</title>
        <p>Population statistics on the general adult population were obtained from Statistics Finland using StatFin databases that can be freely accessed [<xref ref-type="bibr" rid="ref34">34</xref>]. The databases include tabulated data on Finnish citizens and Finland in general that are collected on a yearly basis. Data from 2017 were used because of the availability of the latest data tables for all sociodemographic variables used in the analyses. For this study, individuals aged at least 18 years were included.</p>
        <p>The FinHealth survey is a national population health study on Finnish citizens. The study encompasses a series of cross-sectional population surveys carried out every 5 years in Finland. The latest FinHealth survey was carried out at 50 localities in 2017, with a participation rate of 71% among those invited for the study [<xref ref-type="bibr" rid="ref35">35</xref>]. The purpose of the FinHealth study is to collect up-to-date information about the health and well-being of adults residing in Finland and on the factors influencing their health and well-being. Each survey invites 10,000 randomly selected individuals aged over 18 years. The study consists of physical examinations and study questionnaires. The latest report (values used in this study) is restricted to adults aged 30 years or older to make the results comparable with earlier FinHealth studies. A subgroup of the participants was also invited to undergo a nutrition review; the FinDiet survey is a substudy (n=1655) of the FinHealth survey, which monitors the nutrition and dietary habits of the Finnish population [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>Statistical Methods</title>
        <sec>
          <title>Analysis of and Correction for Selection Bias</title>
          <p>The sociodemographic characteristics of the LoCard study participants were first compared with the characteristics of the Finnish adult population and participants of the FinHealth study to identify traits in LoCard participants that deviated from traits in the general Finnish adult population.</p>
          <p>Second, we constructed poststratification weights for the LoCard participants to match their sociodemographic distributions with the adult Finnish population distributions as closely as possible. The individual weights were calculated using the raking function available in the <italic>survey</italic> package in R [<xref ref-type="bibr" rid="ref37">37</xref>]. The raking function uses iterative proportional fitting (IPF), which is a technique that can be used to adjust a distribution reported in one dataset by totals reported in another. For a given two-way contingency table, the IPF proportionally adjusts each row of the sample distribution in the two-way contingency table to have its total equal the row total in the reference table and adjusts each column of the sample distribution to have its total equal the column total in the reference table [<xref ref-type="bibr" rid="ref38">38</xref>].</p>
          <p>The advantage of the raking function is that the algorithm allows multiple two-dimensional (or higher dimensional) tables to be matched simultaneously [<xref ref-type="bibr" rid="ref37">37</xref>]. For example, instead of matching age, sex, and education univariate distributions separately, we can match all bivariate distributions (ie, age and education, sex and education, and sex and age) simultaneously. The adjustment process is repeated iteratively until the weights converge for each table used in the analysis. The raking function requires that the two contingency tables have the same classes for the row and column variables and no zero values in any of the cells.</p>
          <p>The following two-way tables were available for both the LoCard data and the Finnish adult population: sex and age, sex and education, sex and marital status, sex and occupational status, age and education, age and marital status, age and occupational status, and education and occupational status. All tables were subsequently used to construct the poststratification weights. In addition, the distribution of children aged under 18 years living in the household was used alone because corresponding two-dimensional tables with any of the background variables were not available in Statistics Finland. In total, eight two-way tables and a single one-way table were used in the construction of the weights. Finally, the obtained weights were trimmed to avoid extreme values and instability by setting a minimum value of 0.1 and a maximum value of 10. Without trimming, the poststratification weights ranged from 0.04 to 32.7, and there was a single extremely high weight of 82.4.</p>
          <p>Owing to missing data, the poststratification weights were constructed in two phases. First, the weights were calculated as described above for participants for whom all baseline characteristics used in the matching were available. These data were available for 36,094 individuals. Participants with missing data for any of these variables (n=10,972) obtained their weights in the second phase, where the poststratification weights were calculated for the whole LoCard sample using sex and age variables only. This information was available for 47,045 participants. Finally, the combined weights were rescaled to add up to 47,045. Twenty-one participants without data on sex and/or age remained without weights.</p>
          <p>The selected food group variables were analyzed to describe the volume and money (€) spent on their purchases over the 2-year period (2017-2018). For descriptive purposes, median values and IQRs were reported for each variable because the distributions were strongly skewed to the right, and there was an excess number of zero values in some of the food variables. The same variables were used to demonstrate how the poststratification weights affected the results.</p>
        </sec>
        <sec>
          <title>Degree of Loyalty</title>
          <p>To validate the self-assessed degree of loyalty, we conducted the recency, frequency, and monetary (RFM) value analysis using the transaction data of all participants and compared the RFM scores across the five degree of loyalty groups. RFM analysis is a behavior-based technique used to segment customers by examining their transaction history from three dimensions (how recently a customer made purchases, how often they purchased, and how much they purchased). RFM analysis is also widely used in customer relationship management. Based on these three dimensions, the RFM score is generated for each individual, with a higher score indicating higher loyalty. The analysis was conducted using the <italic>rfm</italic> package in R [<xref ref-type="bibr" rid="ref39">39</xref>]. In addition, total volume and total money (€) spent on food purchases were calculated for each degree of loyalty group to investigate how closely the self-reported degree of loyalty relates to volume and money spent on the purchases.</p>
          <p>To assess the impact of the degree of loyalty on food purchasing profiles, the selected food group variables were compared among the five degree of loyalty groups. The Kruskal-Wallis test was applied for differences across the groups.</p>
          <p>The association between the degree of loyalty and background characteristics was analyzed by comparing the distribution of each sociodemographic variable among the five degree of loyalty groups. The differences across the groups were tested using the chi-square test.</p>
        </sec>
      </sec>
      <sec>
        <title>Ethical Aspects</title>
        <p>The study was approved by the University of Helsinki Review Board in the Humanities and Social and Behavioral Sciences (Statement 21/2018). Informed consent was electronically obtained from all participants included in the study when they were invited via email to release their loyalty card data and fill out the background questionnaire. The data were pseudonymized by S Group before the researchers could obtain the data.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Recruitment</title>
        <p>S Group had approximately 2.4 million primary loyalty card owners, and all of them were assessed for eligibility (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Approximately half (1,214,663, 51%) of the loyalty card owners were contacted, and of these, 47,066 (4%) consented to participate. We did not have information on the number of valid email addresses or what proportion of emails reached the card owners (eg, by passing through trash email filters). Among the participants, 36,621 (78%) responded to the background questionnaire. Nearly all participants (46,825, 99.5%) purchased at least one grocery item from 2017 to 2018.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Participant recruitment and eligibility flow chart.</p>
          </caption>
          <graphic xlink:href="jmir_v22i7e18059_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Participant Characteristics</title>
        <p><xref ref-type="table" rid="table1">Table 1</xref> shows the participant characteristics compared with those of the Finnish adult population and the FinHealth study participants. Discrepancies were found in sex, age, education, and occupational status when compared with the general Finnish adult population. Namely, there were more women, more individuals with a higher education, and more employed individuals in the LoCard sample. On the contrary, individuals aged under 30 years and over 70 years (correspondingly, retired individuals) were underrepresented in the LoCard sample. Selectivity associated with education was strong in the LoCard sample. The proportion of individuals having a basic education level was clearly lower in the LoCard sample (6% of participants had basic education) than in the Finnish adult population (25% had basic education). There were no major differences in the distribution of marital status. However, there were fewer individuals living in a household with children aged under 18 years in the LoCard sample. The LoCard sample was widely distributed across Finland and comparable to the geographical distribution of Finnish citizens (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p>
        <p>On comparing the LoCard sample to the FinHealth study participants, there were differences in sex, education, and marital status distributions, with more women and individuals with higher education and fewer married individuals in the LoCard sample. The age distributions were not comparable owing to the fact that the FinHealth study included only individuals aged at least 30 years. Distortion in the distribution of occupational status was similar in the two studies compared with the Finnish adult population.</p>
        <p>The reweighted distributions of the sociodemographic variables demonstrated that the constructed poststratification weights corrected the deviations successfully, and thereafter, the sociodemographic distributions of the LoCard sample matched well with the Finnish adult population.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>LoCard participant characteristics compared with those of the general Finnish adult population and participants of the FinHealth study.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="320"/>
            <col width="180"/>
            <col width="160"/>
            <col width="150"/>
            <col width="160"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Characteristic</td>
                <td>Finnish general adult population (N=4,446,869)</td>
                <td>FinHealth study<sup>a</sup> (N=6545)</td>
                <td>LoCard sample (N=47,066)<sup>b</sup></td>
                <td>Weighted LoCard sample<sup>c</sup> (N=47,045)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Sex (women), n (%)</td>
                <td>2,273,139 (51.12%)</td>
                <td>3496 (53.42%)</td>
                <td>30,696 (65.25%)</td>
                <td>23,837 (50.67%)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD)</td>
                <td>50.23 (19.06)</td>
                <td>—<sup>d</sup></td>
                <td>47.10 (15.21)</td>
                <td>49.5 (0.14)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Age distribution (years), n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≤29</td>
                <td>802,295 (18.04%)</td>
                <td>N/A<sup>e</sup></td>
                <td>6791 (14.44%)</td>
                <td>8532 (18.14%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>30-39</td>
                <td>702,767 (15.80%)</td>
                <td>Men, 483 (15.8%); <break/>women, 539 (15.4%)</td>
                <td>9982 (21.22%)</td>
                <td>7505 (15.95%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>40-49</td>
                <td>660,703 (14.86%)</td>
                <td>Men, 530 (17.4%); <break/>women, 561 (16.1%)</td>
                <td>9503 (20.20%)</td>
                <td>6986 (14.85%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>50-59</td>
                <td>734,554 (16.52%)</td>
                <td>Men, 608 (20.0%); <break/>women, 661 (18.9%)</td>
                <td>9154 (19.45%)</td>
                <td>7715 (16.40%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>60-69</td>
                <td>737,233 (16.58%)</td>
                <td>Men, 727 (23.8%); <break/>women, 774 (22.4%)</td>
                <td>7880 (16.75%)</td>
                <td>7734 (16.44%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥70</td>
                <td>809,317 (18.20%)</td>
                <td>Men, 701 (23.0%); <break/>women, 961 (27.5%)</td>
                <td>3735 (7.94%)</td>
                <td>8572 (18.22%)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Marital status, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Presently married</td>
                <td>1,990,928 (44.77%)</td>
                <td>Men, 58.0%; <break/>women, 52.3%</td>
                <td>17,240 (47.32%)</td>
                <td>16,254 (45.12%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cohabitating</td>
                <td>—</td>
                <td>Men, 16.7%; <break/>women, 14.4%</td>
                <td>7408 (20.33%)</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single</td>
                <td>1,599,827 (35.98%)<sup>f</sup></td>
                <td>Men, 13.3%; <break/>women, 10.3%</td>
                <td>6412 (17.60%)</td>
                <td>12,762 (35.43%)<sup>f</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Divorced or separated</td>
                <td>574,620 (12.92%)</td>
                <td>Men, 8.7%; <break/>women, 12.2%</td>
                <td>4331 (11.89%)</td>
                <td>4713 (13.08%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Widowed</td>
                <td>281,494 (6.33%)</td>
                <td>Men, 3.4%; <break/>women, 10.9%</td>
                <td>1040 (2.86%)</td>
                <td>2295 (6.37%)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Household, mean number of members (SD)</td>
                <td>2.8 (not available)</td>
                <td>—</td>
                <td>2.36 (1.25)</td>
                <td>2.42 (0.01)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Children aged under 18 years living in the household, n (%)</td>
                <td>566,242 (38.48%)</td>
                <td>31<sup>g</sup> (31.52%)</td>
                <td>11,705 (32.08%)</td>
                <td>13,567 (37.61%)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Education, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Primary school or less</td>
                <td>1,112,261 (25.01%)</td>
                <td>Men, 23.2%; <break/>women, 21.0%</td>
                <td>2259 (6.21%)</td>
                <td>7881 (23.54%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Upper secondary school</td>
                <td>1,902,332 (42.78%)</td>
                <td>Men, 38.3%; <break/>women, 29.1%</td>
                <td>13,405 (36.88%)</td>
                <td>15,534 (43.25%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bachelor’s degree or equivalent</td>
                <td>955,395 (21.49%)</td>
                <td>Men, 38.5%<sup>h</sup>; <break/>women, 49.9%<sup>h</sup></td>
                <td>11,787 (32.43%)</td>
                <td>8453 (21.94%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Master’s degree or higher</td>
                <td>476,881 (10.72%)</td>
                <td>—</td>
                <td>8897 (24.48%)</td>
                <td>4049 (11.27%)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Occupational status, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Employed</td>
                <td>2,327,730 (52.35%)</td>
                <td>Men, 65.9%; <break/>women, 62.3%</td>
                <td>22,086 (60.53%)</td>
                <td>19,027 (52.75%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unemployed</td>
                <td>296,191 (6.66%)</td>
                <td>Men, 8.5%; <break/>women, 7.0%</td>
                <td>1637 (4.49%)</td>
                <td>2417 (6.70%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Student</td>
                <td>230,489 (5.18%)</td>
                <td>Men, 2.4%; <break/>women, 3.5%</td>
                <td>1824 (5.00%)</td>
                <td>1619 (4.49%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Retired</td>
                <td>1,414,785 (31.82%)</td>
                <td>Men, 21.3%; <break/>women, 20.0%</td>
                <td>8578 (23.51%)</td>
                <td>11,600 (32.16%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Parental leave</td>
                <td>—</td>
                <td>Men, 0.2%; <break/>women, 4.2%</td>
                <td>1255 (3.44%)</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>177,674 (4.00%)</td>
                <td>Men, 1.8%; <break/>women, 3.0%</td>
                <td>1107 (3.03%)</td>
                <td>1411 (3.91%)<sup>i</sup></td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Degree of loyalty, n (%)</bold>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>0%-20%</td>
                <td>—</td>
                <td>—</td>
                <td>2283 (6.25%)</td>
                <td>2132 (5.90%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>21%-40%</td>
                <td>—</td>
                <td>—</td>
                <td>4670 (12.79%)</td>
                <td>4160 (11.52%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>41%-60%</td>
                <td>—</td>
                <td>—</td>
                <td>6155 (16.85%)</td>
                <td>5828 (16.14%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>61%-80%</td>
                <td>—</td>
                <td>—</td>
                <td>9224 (25.25%)</td>
                <td>8962 (24.82%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>81%-100%</td>
                <td>—</td>
                <td>—</td>
                <td>14,194 (38.86%)</td>
                <td>15,031 (41.62%)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>FinHealth study included individuals aged ≥30 years, which makes the age distribution not comparable to other data listed in the table.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Data for the following numbers of participants were missing in the LoCard sample: sex, 21; age, 21; marital status, 10,635; household, 10,689; children aged under 18 years, 10,576; education, 10,718; occupational status, 10,579; degree of loyalty, 10,540.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>Weighted LoCard sample refers to the descriptive statistics calculated using the poststratification weights of the LoCard participants.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>Not available.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>N/A: not applicable.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>Cohabitating included in this category.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>Households with three or more persons.</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>Bachelor’s degree or higher.</p>
            </fn>
            <fn id="table1fn9">
              <p><sup>i</sup>Parental leave included.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Food Purchase</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the purchases of selected food groups in the original LoCard sample and in the weighted LoCard sample. Over 95% of the participants had purchased at least one food product in all food groups, except skimmed milk &#38; sour milk. Skimmed milk &#38; sour milk had been purchased by 74% of the participants. Among them, the median expenditure and the median weight were €23.0 (€1=US $1.13 in 2017) and 23.5 kg, respectively, during the 2-year follow-up.</p>
        <p>After applying the poststratification weights, there was an increase in the purchase of red meat &#38; processed meat and small increases in sugar-sweetened beverages and fat spreads. The purchase of vegetables and sweets &#38; chocolate decreased as a result of reweighting. The largest change was seen in red meat &#38; processed meat; the weighted amount of purchase increased from €387 to €417 (cost) and from 48 kg to 54 kg (weight), corresponding to relative percentage increases of 7.8% and 12.6%, respectively.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Purchase of selected food groups (measured in € and kg) in the original LoCard sample and in the weighted LoCard sample.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="120"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">Food group</td>
                <td colspan="4">Original LoCard sample<sup>a</sup> (N=47,066)</td>
                <td colspan="4">Weighted LoCard sample<sup>a</sup> (N=47,045)</td>
              </tr>
              <tr valign="bottom">
                <td>€, median [IQR]</td>
                <td>€ (%)<sup>b</sup>, median [IQR]</td>
                <td>kg, median [IQR]</td>
                <td>kg (%)<sup>c</sup>, median [IQR]</td>
                <td>€, median [IQR]</td>
                <td>€ (%)<sup>b</sup>, median [IQR]</td>
                <td>kg, median [IQR]</td>
                <td>kg (%)<sup>c</sup>, median [IQR]</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Vegetables</td>
                <td>284.3 [124.9-520.1]</td>
                <td>7.7 [5.4-10.5]</td>
                <td>76.6 [33.2-144.4]</td>
                <td>8.2 [5.4-11.7]</td>
                <td>263.7 [107.3-487.6]</td>
                <td>7.2 [4.8-9.9]</td>
                <td>73.4 [29.6-139.6]</td>
                <td>7.6 [4.8-11.0]</td>
              </tr>
              <tr valign="top">
                <td>Skimmed milk &#38; sour milk</td>
                <td>6.9 [0-60.9]</td>
                <td>0.2 [0-1.7]</td>
                <td>7.0 [0-65.6]</td>
                <td>0.9 [0-7.3]</td>
                <td>6.6 [0-60.5]</td>
                <td>0.2 [0-1.8]</td>
                <td>6.5 [0-66.0]</td>
                <td>0.9 [0-7.2]</td>
              </tr>
              <tr valign="top">
                <td>Sugar-sweetened beverages</td>
                <td>45.3 [15.1-111.9]</td>
                <td>1.3 [0.6-2.7]</td>
                <td>23.5 [7.5-63.4]</td>
                <td>2.8 [1.1-6.0]</td>
                <td>47.4 [15.0-120.2]</td>
                <td>1.4 [0.6-3.0]</td>
                <td>25.6 [7.7-69.8]</td>
                <td>3.0 [1.1-6.7]</td>
              </tr>
              <tr valign="top">
                <td>Rye bread</td>
                <td>50.7 [18.1-112.7]</td>
                <td>1.5 [0.8-2.5]</td>
                <td>12.9 [4.6-28.9]</td>
                <td>1.5 [0.8-2.4]</td>
                <td>50.5 [17.3-114.9]</td>
                <td>1.5 [0.7-2.5]</td>
                <td>13.2 [4.6-29.8]</td>
                <td>1.5 [0.7-2.5]</td>
              </tr>
              <tr valign="top">
                <td>Red meat &#38; processed meat</td>
                <td>386.5 [153.6-778.1]</td>
                <td>11.3 [7.5-15.2]</td>
                <td>47.5 [18.3-98.2]</td>
                <td>5.3 [3.4-7.5]</td>
                <td>416.8 [170.1-816.7]</td>
                <td>12.1 [8.2-16.0]</td>
                <td>53.5 [21.4-106.1]</td>
                <td>5.7 [3.8-8.0]</td>
              </tr>
              <tr valign="top">
                <td>Fat spreads</td>
                <td>53.1 [20.1-114.8]</td>
                <td>1.5 [0.9-2.3]</td>
                <td>10.1 [3.8-21.6]</td>
                <td>1.1 [0.7-1.7]</td>
                <td>56.3 [20.3-122.0]</td>
                <td>1.6 [0.9-2.5]</td>
                <td>10.9 [4.0-23.2]</td>
                <td>1.2 [0.7-1.8]</td>
              </tr>
              <tr valign="top">
                <td>Sweets &#38; chocolate</td>
                <td>119.2 [48.9-243.4]</td>
                <td>3.5 [1.9-5.8]</td>
                <td>10.3 [4.1-21.6]</td>
                <td>1.2 [0.6-2.0]</td>
                <td>109.9 [42.1-232.7]</td>
                <td>3.2 [1.7-5.5]</td>
                <td>9.5 [3.6-20.8]</td>
                <td>1.1 [0.5-1.9]</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Purchases are aggregated over a 2-year period from January 1, 2017, to December 31, 2018 (€1=US $1.13 in 2017).</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Share of the food group purchase among all grocery purchases measured in euros.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>Share of the food group purchase among all grocery purchases measured in kilograms.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Degree of Loyalty</title>
        <p><xref ref-type="table" rid="table1">Table 1</xref> shows the self-assessed degree of loyalty. Almost 40% (14,194/36,526) of the participants reported that they made 80% or more of their food purchases at S Group shops and supermarkets, and 64% (23,418/36,526) reported making at least 60% of their purchases at the retailer’s shops and supermarkets.</p>
        <p>The RFM scores were significantly different among the five degree of loyalty groups, with the lowest scores in the lowest degree of loyalty group and a steady increasing trend toward the highest degree of loyalty group (<italic>F</italic><sub>4</sub>=4625.5, <italic>P</italic>&#60;.001). The poststratification weights also differed significantly across the five groups (<italic>F</italic><sub>4</sub>=24.1, <italic>P</italic>&#60;.001), indicating that the degree of loyalty was associated with individuals’ sociodemographic characteristics. However, the observed differences were rather small, with a maximum difference of six percentage points between the groups (<xref ref-type="table" rid="table3">Table 3</xref>). In the highest degree of loyalty group, there were slightly more young and married participants, and the percentage of households with children was higher, whereas the percentage of divorced or separated participants and those with a master’s degree declined with the degree of loyalty.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>LoCard participant characteristics and RFM scores across the five degree of loyalty groups.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="250"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td rowspan="2" colspan="3">Characteristic</td>
                <td colspan="9">Degree of loyalty</td>
              </tr>
              <tr valign="top">
                <td colspan="2">0%-20% (n=2283)</td>
                <td colspan="2">21%-40% (n=4670)</td>
                <td colspan="2">41%-60% (n=6155)</td>
                <td colspan="2">61%-80% (n=9224)</td>
                <td>81%-100% (n=14,194)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">RFM<sup>a</sup> analysis score, median [IQR]</td>
                <td colspan="2">182.5 [111.0-321.0]</td>
                <td colspan="2">311.0 [122.0-442.0]</td>
                <td colspan="2">335.0 [221.0-522.0]</td>
                <td colspan="2">432.0 [244.0-534.0]</td>
                <td>445.0 [324.0-545.0]</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Sex (women), n (%)</td>
                <td colspan="2">1472 (64.6%)</td>
                <td colspan="2">3176 (68.1%)</td>
                <td colspan="2">4150 (67.5%)</td>
                <td colspan="2">6101 (66.2%)</td>
                <td>9317 (65.7%)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Age, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≤29</td>
                <td colspan="2">227 (10.0%)</td>
                <td colspan="2">571 (12.2%)</td>
                <td colspan="2">866 (14.1%)</td>
                <td colspan="2">1284 (13.9%)</td>
                <td colspan="2">2089 (14.7%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>30-39</td>
                <td colspan="2">406 (17.8%)</td>
                <td colspan="2">935 (20.0%)</td>
                <td colspan="2">1232 (20.0%)</td>
                <td colspan="2">1993 (21.6%)</td>
                <td colspan="2">3107 (21.9%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>40-49</td>
                <td colspan="2">512 (22.5%)</td>
                <td colspan="2">1003 (21.5%)</td>
                <td colspan="2">1327 (21.6%)</td>
                <td colspan="2">1838 (19.9%)</td>
                <td colspan="2">2779 (19.6%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>50-59</td>
                <td colspan="2">536 (23.5%)</td>
                <td colspan="2">1035 (22.2%)</td>
                <td colspan="2">1273 (20.7%)</td>
                <td colspan="2">1763 (19.1%)</td>
                <td colspan="2">2664 (18.8%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>60-69</td>
                <td colspan="2">411 (18.0%)</td>
                <td colspan="2">797 (17.1%)</td>
                <td colspan="2">1003 (16.3%)</td>
                <td colspan="2">1585 (17.2%)</td>
                <td colspan="2">2409 (17.0%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≥70</td>
                <td colspan="2">188 (8.2%)</td>
                <td colspan="2">325 (7.0%)</td>
                <td colspan="2">450 (7.3%)</td>
                <td colspan="2">759 (8.2%)</td>
                <td colspan="2">1143 (8.1%)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Marital status, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Presently married</td>
                <td colspan="2">1021 (45.0%)</td>
                <td colspan="2">2039 (43.9%)</td>
                <td colspan="2">2733 (44.5%)</td>
                <td colspan="2">4379 (47.6%)</td>
                <td colspan="2">7056 (49.8%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Cohabitating</td>
                <td colspan="2">437 (19.3%)</td>
                <td colspan="2">982 (21.1%)</td>
                <td colspan="2">1321 (21.5%)</td>
                <td colspan="2">1862 (20.3%)</td>
                <td colspan="2">2803 (19.8%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single</td>
                <td colspan="2">416 (18.3%)</td>
                <td colspan="2">910 (19.6%)</td>
                <td colspan="2">1187 (19.3%)</td>
                <td colspan="2">1593 (17.3%)</td>
                <td colspan="2">2303 (16.3%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Divorced or separated</td>
                <td colspan="2">323 (14.2%)</td>
                <td colspan="2">600 (12.9%)</td>
                <td colspan="2">729 (11.9%)</td>
                <td colspan="2">1090 (11.9%)</td>
                <td colspan="2">1588 (11.2%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Widowed</td>
                <td colspan="2">73 (3.2%)</td>
                <td colspan="2">116 (2.5%)</td>
                <td colspan="2">166 (2.7%)</td>
                <td colspan="2">271 (3.0%)</td>
                <td colspan="2">412 (2.9%)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Household, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Children aged under 18 years living in the household</td>
                <td colspan="2">649 (28.5%)</td>
                <td colspan="2">1398 (30.0%)</td>
                <td colspan="2">1846 (30.1%)</td>
                <td colspan="2">2995 (32.5%)</td>
                <td colspan="2">4814 (34.0%)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Education, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Primary school or less</td>
                <td colspan="2">144 (6.3%)</td>
                <td colspan="2">231 (5.0%)</td>
                <td colspan="2">335 (5.5%)</td>
                <td colspan="2">525 (5.7%)</td>
                <td colspan="2">1023 (7.3%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Upper secondary school</td>
                <td colspan="2">756 (33.3%)</td>
                <td colspan="2">1645 (35.4%)</td>
                <td colspan="2">2201 (36.0%)</td>
                <td colspan="2">3343 (36.4%)</td>
                <td colspan="2">5451 (38.6%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bachelor’s degree or equivalent</td>
                <td colspan="2">735 (32.4%)</td>
                <td colspan="2">1538 (33.1%)</td>
                <td colspan="2">2046 (33.4%)</td>
                <td colspan="2">3020 (32.9%)</td>
                <td colspan="2">4446 (31.5%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Master’s degree or higher</td>
                <td colspan="2">635 (28.0%)</td>
                <td colspan="2">1228 (26.5%)</td>
                <td colspan="2">1538 (25.1%)</td>
                <td colspan="2">2302 (25.1%)</td>
                <td colspan="2">3189 (22.6%)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Occupational status, n (%)</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Employed</td>
                <td colspan="2">1348 (59.2%)</td>
                <td colspan="2">2892 (62.2%)</td>
                <td colspan="2">3761 (61.2%)</td>
                <td colspan="2">5544 (60.2%)</td>
                <td colspan="2">8533 (60.2%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unemployed</td>
                <td colspan="2">124 (5.5%)</td>
                <td colspan="2">219 (4.7%)</td>
                <td colspan="2">284 (4.6%)</td>
                <td colspan="2">408 (4.4%)</td>
                <td colspan="2">602 (4.3%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Student</td>
                <td colspan="2">125 (5.5%)</td>
                <td colspan="2">236 (5.1%)</td>
                <td colspan="2">329 (5.4%)</td>
                <td colspan="2">461 (5.0%)</td>
                <td colspan="2">673 (4.7%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Retired</td>
                <td colspan="2">563 (24.7%)</td>
                <td colspan="2">1018 (21.9%)</td>
                <td colspan="2">1381 (22.5%)</td>
                <td colspan="2">2207 (24.0%)</td>
                <td colspan="2">3391 (23.9%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Parental leave</td>
                <td colspan="2">51 (2.2%)</td>
                <td colspan="2">137 (2.9%)</td>
                <td colspan="2">174 (2.8%)</td>
                <td colspan="2">318 (3.5%)</td>
                <td colspan="2">575 (4.1%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td colspan="2">65 (2.9%)</td>
                <td colspan="2">151 (3.2%)</td>
                <td colspan="2">214 (3.5%)</td>
                <td colspan="2">273 (3.0%)</td>
                <td colspan="2">402 (2.8%)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>RFM: recency, frequency, and monetary.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table4">Table 4</xref> shows food purchases in the degree of loyalty groups, and all showed significant associations (<italic>P</italic>&#60;.001 for all food groups, except sweets &#38; chocolate [<italic>P</italic>=.007]). The result was expected owing to the large sample size. The shares of vegetable, red meat &#38; processed meat, and fat spread purchases increased as the degree of loyalty increased. In the other food groups, there were no major differences across the degree of loyalty groups.</p>
        <p>Additionally, <xref ref-type="table" rid="table4">Table 4</xref> shows that the quantity and expenditure regarding food groups increased steadily with the self-assessed degree of loyalty, suggesting that the self-assessment can be relied upon.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Purchases (in € and kg) of selected food groups across the five degree of loyalty groups.</p>
          </caption>
          <table width="1040" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="90"/>
            <col width="40"/>
            <col width="40"/>
            <col width="40"/>
            <col width="60"/>
            <col width="50"/>
            <col width="50"/>
            <col width="40"/>
            <col width="50"/>
            <col width="50"/>
            <col width="50"/>
            <col width="40"/>
            <col width="50"/>
            <col width="50"/>
            <col width="50"/>
            <col width="40"/>
            <col width="50"/>
            <col width="50"/>
            <col width="50"/>
            <col width="40"/>
            <col width="60"/>
            <thead>
              <tr valign="top">
                <td rowspan="3">Food group</td>
                <td colspan="20">Degree of loyalty</td>
              </tr>
              <tr valign="top">
                <td colspan="4">0%-20% (n=2216)</td>
                <td colspan="4">21%-40% (n=4611)</td>
                <td colspan="4">41%-60% (n=6119)</td>
                <td colspan="4">61%-80% (n=9168)</td>
                <td colspan="4">81%-100% (n=14,133)</td>
              </tr>
              <tr valign="top">
                <td>€<sup>a,b</sup></td>
                <td>€%<sup>b,c</sup></td>
                <td>kg<sup>b</sup></td>
                <td>kg%<sup>b,d</sup></td>
                <td>€<sup>b</sup></td>
                <td>€%<sup>b,c</sup></td>
                <td>kg<sup>b</sup></td>
                <td>kg%<sup>b,d</sup></td>
                <td>€<sup>b</sup></td>
                <td>€%<sup>b,c</sup></td>
                <td>kg<sup>b</sup></td>
                <td>kg%<sup>b,d</sup></td>
                <td>€<sup>b</sup></td>
                <td>€%<sup>b,c</sup></td>
                <td>kg<sup>b</sup></td>
                <td>kg%<sup>b,d</sup></td>
                <td>€<sup>b</sup></td>
                <td>€%<sup>b,c</sup></td>
                <td>kg<sup>b</sup></td>
                <td>kg%<sup>b,d</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Vegetables</td>
                <td>58.0</td>
                <td>6.6</td>
                <td>15.2</td>
                <td>7.1</td>
                <td>131.1</td>
                <td>7.4</td>
                <td>35.0</td>
                <td>7.9</td>
                <td>232.0</td>
                <td>7.9</td>
                <td>60.6</td>
                <td>8.4</td>
                <td>344.2</td>
                <td>8.1</td>
                <td>93.7</td>
                <td>8.7</td>
                <td>441.9</td>
                <td>7.9</td>
                <td>122.5</td>
                <td>8.5</td>
              </tr>
              <tr valign="top">
                <td>Skimmed milk &#38; sour milk</td>
                <td>1.8</td>
                <td>0.2</td>
                <td>2.0</td>
                <td>0.8</td>
                <td>3.6</td>
                <td>0.2</td>
                <td>3.0</td>
                <td>0.9</td>
                <td>5.6</td>
                <td>0.2</td>
                <td>5.0</td>
                <td>0.8</td>
                <td>8.8</td>
                <td>0.2</td>
                <td>8.0</td>
                <td>0.9</td>
                <td>14.0</td>
                <td>0.3</td>
                <td>13.5</td>
                <td>1.1</td>
              </tr>
              <tr valign="top">
                <td>Sugar-sweetened beverages</td>
                <td>10.9</td>
                <td>1.3</td>
                <td>5.5</td>
                <td>2.7</td>
                <td>23.7</td>
                <td>1.4</td>
                <td>12.2</td>
                <td>2.9</td>
                <td>37.2</td>
                <td>1.3</td>
                <td>19.1</td>
                <td>2.8</td>
                <td>52.2</td>
                <td>1.3</td>
                <td>27.4</td>
                <td>2.7</td>
                <td>67.9</td>
                <td>1.3</td>
                <td>35.7</td>
                <td>2.7</td>
              </tr>
              <tr valign="top">
                <td>Rye bread</td>
                <td>10.9</td>
                <td>1.3</td>
                <td>2.7</td>
                <td>1.3</td>
                <td>24.1</td>
                <td>1.4</td>
                <td>6.2</td>
                <td>1.4</td>
                <td>41.9</td>
                <td>1.5</td>
                <td>10.4</td>
                <td>1.5</td>
                <td>61.9</td>
                <td>1.5</td>
                <td>15.5</td>
                <td>1.5</td>
                <td>82.9</td>
                <td>1.5</td>
                <td>21.4</td>
                <td>1.5</td>
              </tr>
              <tr valign="top">
                <td>Red meat &#38; processed meat</td>
                <td>80.4</td>
                <td>9.9</td>
                <td>9.9</td>
                <td>5.0</td>
                <td>186.4</td>
                <td>10.7</td>
                <td>22.8</td>
                <td>5.2</td>
                <td>297.8</td>
                <td>10.9</td>
                <td>36.8</td>
                <td>5.2</td>
                <td>457.4</td>
                <td>11.3</td>
                <td>55.2</td>
                <td>5.3</td>
                <td>621.5</td>
                <td>11.6</td>
                <td>76.9</td>
                <td>5.4</td>
              </tr>
              <tr valign="top">
                <td>Fat spreads</td>
                <td>10.2</td>
                <td>1.2</td>
                <td>1.8</td>
                <td>0.9</td>
                <td>23.5</td>
                <td>1.3</td>
                <td>4.4</td>
                <td>1.0</td>
                <td>41.0</td>
                <td>1.4</td>
                <td>7.8</td>
                <td>1.1</td>
                <td>65.4</td>
                <td>1.6</td>
                <td>12.3</td>
                <td>1.2</td>
                <td>87.2</td>
                <td>1.6</td>
                <td>16.7</td>
                <td>1.2</td>
              </tr>
              <tr valign="top">
                <td>Sweets &#38; chocolate</td>
                <td>32.3</td>
                <td>3.7</td>
                <td>2.8</td>
                <td>1.3</td>
                <td>64.1</td>
                <td>3.7</td>
                <td>5.4</td>
                <td>1.3</td>
                <td>95.4</td>
                <td>3.4</td>
                <td>8.3</td>
                <td>1.2</td>
                <td>134.6</td>
                <td>3.3</td>
                <td>11.6</td>
                <td>1.1</td>
                <td>183.9</td>
                <td>3.5</td>
                <td>15.6</td>
                <td>1.2</td>
              </tr>
              <tr valign="top">
                <td>Total amount of grocery purchases, median [IQR]</td>
                <td colspan="2">873.4 [442.0-1602.5]</td>
                <td colspan="2">215.9 [105.6-393.2]</td>
                <td colspan="2">1883.8 [1095.7-2924.2]</td>
                <td colspan="2">460.7 [258.5-756.1]</td>
                <td colspan="2">2958.6 [1840.0-4528.8]</td>
                <td colspan="2">734.0 [452.8-1169.5]</td>
                <td colspan="2">4320.2 [2726.5-6479.0]</td>
                <td colspan="2">1095.3 [671.5-1698.1]</td>
                <td colspan="2">5680.1 [3616.4-8531.8]</td>
                <td colspan="2">1462.7 [913.0-2250.6]</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>€1=US $1.13 in 2017.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>Median value.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>Share of the food group purchase among all grocery purchases measured in euros.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>Share of the food group purchase among all grocery purchases measured in kilograms.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The findings of this study showed that individuals who consented to the release of their loyalty card data for research purposes tended to diverge from the general Finnish adult population. Similar to many other health and nutrition studies, including those encompassing electronic data collection tools [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>], the LoCard participants manifested volunteer bias, with employed individuals, middle-aged individuals, women, and individuals with higher education being overrepresented in the sample. The LoCard sample included fewer retired individuals, fewer individuals with basic education, and fewer individuals who had children aged under 18 years living in the household. Compared with the Finnish national FinHealth and FinDiet studies, the selection mechanism appeared to be somewhat different in the LoCard sample. While employed individuals were overrepresented in all these three studies, the gender and education biases were stronger in the LoCard sample. Moreover, the LoCard sample had a rather similar distribution of marital status as among Finnish adults, whereas in the FinHealth study, married individuals were overrepresented [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref42">42</xref>].</p>
        <p>However, the size (n=47,066) and heterogeneity of the LoCard sample enabled a successful correction of the differences seen in the sociodemographic variables. We developed the poststratification weights using all sociodemographic background variables available with the two-way joint distributions to correct the background distributions of the LoCard participants to make them closer to the Finnish adult population. The large sample size provided a sufficient number of participants for hard-to-reach population subgroups, and thus, it was possible to construct the poststratification weights for them as well. The highest weights were seen for unmarried men aged under 30 years, who indeed are often underrepresented or not enrolled in health studies [<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        <p>Of the 1.1 million loyalty card holders contacted, approximately 4% (n=47,066) took part in the LoCard study. Although low, the participation rate was similar to that for other massive data collection methods [<xref ref-type="bibr" rid="ref7">7</xref>]. The advantage of the use of digital tools is that they reach a large number of potential study participants with relatively low effort in data collection. After all, we reached substantially more individuals than in the majority of dietary studies using traditional data collection methods with minimum human involvement in data collection. A likely reason for the low participation rate was that the participants were contacted via email, which may not have reached them (invalid email address or contact email classified as “junk email”) or may have limited their participation and induced selection bias. Although 88% of households in Finland have an internet connection and 83% use email [<xref ref-type="bibr" rid="ref43">43</xref>], email use varies according to sociodemographic profiles and is relatively low at 62% among individuals aged over 65 years and among individuals with basic education [<xref ref-type="bibr" rid="ref44">44</xref>]. This may partly explain the baseline characteristics of the LoCard sample. However, it has been shown that the use of digital tools in recruitment and data collection does not increase the selection bias, but the traits of participants in health studies are rather similar regardless of the recruitment method used [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. Moreover, it is likely that many simply ignored an email coming from a commercial party.</p>
        <p>Important aspects are whether and when informed consent from loyalty card owners is needed. Recently, Aiello et al [<xref ref-type="bibr" rid="ref45">45</xref>] published an interesting ecological study on the associations between loyalty card food purchase data and prescription records that were used as a proxy for real disease profiles in London. Their dataset included 1.6 million loyalty card users, and they used the anonymized data without the consent of the individuals. In our study, consent and a positive reply were required for two reasons. First, transparent use of loyalty card data on customers for a common good builds trust among them, researchers, and the company, and reduces the likelihood of negative publicity. Second, contact was needed to obtain information about participants’ background characteristics for use in further analyses. A future scenario could involve a consent request when the customer becomes a member of the loyalty card program. This would create an ethically sound and transparent research protocol for the use of customer data.</p>
        <p>Poststratification weights were further applied in evaluating the purchases of the main food groups. The corrections demonstrated small changes in some food groups; the purchase of vegetables and sweets &#38; chocolate decreased after the correction, whereas the purchase of red meat &#38; processed meat, sugar-sweetened beverages, and fat spreads increased. The sociodemographic profiles of the LoCard participants and bias related to them might, at least partly, explain these results. The FinDiet study showed that women, who were overrepresented in the LoCard sample and thus had smaller weights, tended to consume more fruits and vegetables than men [<xref ref-type="bibr" rid="ref36">36</xref>]. In line with this, after applying the poststratification weights, the purchase of vegetables decreased. It has also been shown that socioeconomically advantaged individuals, who likewise were overrepresented in the LoCard sample, consumed healthy foods, such as fruits and vegetables and low-fat dairy products, more frequently [<xref ref-type="bibr" rid="ref46">46</xref>]. Moreover, the increased amount of red meat &#38; processed meat purchase is likely related to male participants who tend to consume more meat [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. In line with the overall findings of this study, the NutriNet-Santé study showed that the consumption of fruits and vegetables was higher and the consumption of meat was lower in the cohort than in the general population in France [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>The degree of loyalty was fairly high in the LoCard sample with 64% (23,418/36,526) of the participants reporting making over 60% of their grocery purchases at the retailer’s shops and supermarkets. The food purchases were rather similar in the higher loyalty group (60% or higher), whereas individuals making fewer purchases in the retailer’s grocery stores showed some differences. In particular, individuals reporting the lowest degree of loyalty tended to buy fewer vegetables and fat spreads and fewer red meat &#38; processed meat products. Although some variation was seen, the differences across the loyalty groups were smaller than expected. One reason could be the food groups selected for the current analyses. There could be other products, such as alcohol and tobacco, that are differently purchased. These results, together with the differences seen in the sociodemographic variables between the loyalty groups, underline the importance of estimating and accounting for the degree of loyalty in future studies using loyalty card data. A direct way to address the problem of coincidental purchases is to focus on a subsample with at least 60% loyalty. It is also important to note that loyalty card data can enable research on longitudinal trends in food purchases, which can be performed regardless of the degree of loyalty.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Although we used a large set of matching variables for developing the poststratification weights, some limitations concerning these remain. First, we were not able to compare or account for possible differences in income, as there was no comparable reference data available in Statistics Finland. Therefore, it remains unclear whether the LoCard sample was representative in terms of income, which is an important contributor to food purchase. The higher education level of the LoCard participants and the lower prevalence of young and retired individuals clearly suggest that the income levels might be overestimated in our sample. Second, although we matched families with children, the number of children and their ages, which can clearly affect a household’s food purchases, were not used in weighting. Importantly, we were able to correct the differences only in the observed sociodemographic variables, and thus, unidentifiable selection bias cannot be ruled out. This may include factors that would be associated with willingness to participate, such as special dietary restrictions and social exclusion. In particular, among those participants who did not have complete background information and whose poststratification weights were thus based on sex and age only, the risk for unidentifiable selection bias could be even higher.</p>
        <p>It is important to note that grocery purchases reflect consumption on a household level, which may consist of more than one person, and not everybody might eat the same foods. Thus, accuracy of loyalty card data in investigating individual diet may not be as high as that obtained with traditional data collection methods. However, good compatibility between respondent-collected household-level food purchase data and individual-level dietary data has been demonstrated [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. Moreover, foods purchased from stores do not necessarily indicate foods consumed owing to many different reasons. These include, for example, foods that are not included in loyalty card data, such as dinner foods at restaurants or lunch foods at work. Cardholders may also buy foods that are consumed by others, for example, grandchildren, other relatives or close friends invited for dinner, and pets. Some foods are not consumed at all, resulting in food wastage [<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>].</p>
        <p>Finally, the degree of loyalty remains a challenge. In this study, the degree of loyalty was self-estimated, and it is difficult to estimate possible bias related to this self-report. However, we showed that the RFM scores increased steadily with the groups of loyalty, indicating that higher frequency, higher engagement, and more money spent on grocery purchases were associated with a higher degree of loyalty. Moreover, a positive correlation was found between the proportional increases in money spent (€) and weight (kg) regarding food purchases and the degree of loyalty. These results suggest that this self-assessment seemed to provide a feasible estimate of the true values. In another study, the researchers defined loyalty through the frequency of purchases made in the supermarket combined with the amount of money spent on purchases. However, in that study, the degree of loyalty was not specifically defined [<xref ref-type="bibr" rid="ref51">51</xref>].</p>
        <p>Despite its limitations, we see real potential in the use of these automatically collected longitudinal food purchase data in the population-based assessment of dietary patterns, which are important determinants of health and carbon footprint [<xref ref-type="bibr" rid="ref52">52</xref>]. Loyalty card data provide a cost-effective tool to reach large groups of individuals with minimum data collection efforts and to investigate diet-related behaviors with less information bias. Linking these data with other health data (such as electronic health records and health registers) would provide new opportunities to understand diet and related outcomes. However, such research settings include privacy concerns that need to be carefully addressed to guarantee individual anonymity and consent. In addition, loyalty card data enable the monitoring of longitudinal trends in food purchases including timely monitoring and evaluation of the impact of population-level steering instruments such as taxation.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Individuals who consented to the use of their loyalty card data for research purposes tended to differ from individuals in the general Finnish adult population. The sociodemographic distributions were skewed toward characteristics similar to those frequently seen in health and nutrition studies. However, the high volume of data enabled the inclusion of sociodemographically heterogeneous subgroups, potentially including hard-to-reach subgroups, and further correction of the differences so that distributions matched well with those of the general Finnish adult population. A potential confounder in studies using loyalty card data is the degree of loyalty, which in this study, was associated with food-purchasing profiles and also the participants’ background characteristics. This underlines the importance of obtaining sufficient background information when using loyalty card data for health research.</p>
        <p>Despite the limitations, loyalty card data provide a cost-effective approach for large groups of individuals with minimum data collection effort and for the investigation of diet-related behaviors on a large scale with less information bias. Importantly, loyalty card data enable the monitoring of longitudinal trends in grocery purchases.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Grouping of the food purchase data.</p>
        <media xlink:href="jmir_v22i7e18059_app1.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>The percentage of individuals living in each of the 19 regions in Finland, in the LoCard sample, and in the weighted LoCard sample.</p>
        <media xlink:href="jmir_v22i7e18059_app2.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Regions of Finland.</p>
        <media xlink:href="jmir_v22i7e18059_app3.png" xlink:title="PNG File , 33 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">IPF</term>
          <def>
            <p>iterative proportional fitting</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">RFM</term>
          <def>
            <p>recency, frequency, and monetary</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We thank S Group for collaboration. We are also grateful to the loyalty card holders who provided consent for the use of their loyalty card data in this research project. This work was funded by Tampere University, the University of Helsinki, the Finnish Foundation for Alcohol Studies, and EIT Food (“Towards a smarter shopping list” #20041). EIT Food is the Innovation Community on Food of the European Institute of Innovation and Technology (EIT), a body of the EU, under Horizon 2020, the EU Framework Programme for Research and Innovation.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>ME, JN, HS, LU, and MF participated in data collection and transfer. All authors participated in the design of the study. TN, ME, SK, and JN performed data management. A-LV and JN planned the data analyses, which A-LV conducted. A-LV wrote the original draft. All authors participated in reviewing and writing the drafts, including approval of the final version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwingshackl</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Knüppel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Michels</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Schwedhelm</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Iqbal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>De Henauw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Boeing</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Devleesschauwer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Intake of 12 food groups and disability-adjusted life years from coronary heart disease, stroke, type 2 diabetes, and colorectal cancer in 16 European countries</article-title>
          <source>Eur J Epidemiol</source>
          <year>2019</year>
          <month>08</month>
          <volume>34</volume>
          <issue>8</issue>
          <fpage>765</fpage>
          <lpage>775</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31030306"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10654-019-00523-4</pub-id>
          <pub-id pub-id-type="medline">31030306</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10654-019-00523-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6602984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>Global action plan for the prevention and control of NCDs 2013-2020</article-title>
          <source>World Health Organization</source>
          <year>2013</year>
          <access-date>2020-06-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/nmh/publications/ncd-action-plan/en/">https://www.who.int/nmh/publications/ncd-action-plan/en/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>GBD 2017 Diet Collaborators</collab>
          </person-group>
          <article-title>Health effects of dietary risks in 195 countries, 1990-2017: a systematic analysis for the Global Burden of Disease Study 2017</article-title>
          <source>Lancet</source>
          <year>2019</year>
          <month>05</month>
          <day>11</day>
          <volume>393</volume>
          <issue>10184</issue>
          <fpage>1958</fpage>
          <lpage>1972</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0140-6736(19)30041-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(19)30041-8</pub-id>
          <pub-id pub-id-type="medline">30954305</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(19)30041-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6899507</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Willett</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <source>Nutritional Epidemiology</source>
          <year>2013</year>
          <publisher-loc>Oxford</publisher-loc>
          <publisher-name>Oxford University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lovegrove</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hodson</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lanham-New</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Nutrition Research Methodologies</source>
          <year>2015</year>
          <publisher-loc>Hoboken, New Jersey</publisher-loc>
          <publisher-name>Wiley-Blackwell</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murakami</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Livingstone</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and characteristics of misreporting of energy intake in US children and adolescents: National Health and Nutrition Examination Survey (NHANES) 2003-2012</article-title>
          <source>Br J Nutr</source>
          <year>2016</year>
          <month>01</month>
          <day>28</day>
          <volume>115</volume>
          <issue>2</issue>
          <fpage>294</fpage>
          <lpage>304</lpage>
          <pub-id pub-id-type="doi">10.1017/S0007114515004304</pub-id>
          <pub-id pub-id-type="medline">26525591</pub-id>
          <pub-id pub-id-type="pii">S0007114515004304</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fry</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Littlejohns</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sudlow</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Doherty</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Adamska</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sprosen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>NE</given-names>
            </name>
          </person-group>
          <article-title>Comparison of Sociodemographic and Health-Related Characteristics of UK Biobank Participants With Those of the General Population</article-title>
          <source>Am J Epidemiol</source>
          <year>2017</year>
          <month>11</month>
          <day>01</day>
          <volume>186</volume>
          <issue>9</issue>
          <fpage>1026</fpage>
          <lpage>1034</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28641372"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/aje/kwx246</pub-id>
          <pub-id pub-id-type="medline">28641372</pub-id>
          <pub-id pub-id-type="pii">3883629</pub-id>
          <pub-id pub-id-type="pmcid">PMC5860371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strandhagen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lissner</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nunez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Rosengren</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Torén</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Thelle</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Selection bias in a population survey with registry linkage: potential effect on socioeconomic gradient in cardiovascular risk</article-title>
          <source>Eur J Epidemiol</source>
          <year>2010</year>
          <month>03</month>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>163</fpage>
          <lpage>172</lpage>
          <pub-id pub-id-type="doi">10.1007/s10654-010-9427-7</pub-id>
          <pub-id pub-id-type="medline">20127393</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kesse-Guyot</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Andreeva</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Castetbon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Vernay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Touvier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Méjean</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Julia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Galan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hercberg</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Participant profiles according to recruitment source in a large Web-based prospective study: experience from the Nutrinet-Santé study</article-title>
          <source>J Med Internet Res</source>
          <year>2013</year>
          <month>09</month>
          <day>13</day>
          <volume>15</volume>
          <issue>9</issue>
          <fpage>e205</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2013/9/e205/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.2488</pub-id>
          <pub-id pub-id-type="medline">24036068</pub-id>
          <pub-id pub-id-type="pii">v15i9e205</pub-id>
          <pub-id pub-id-type="pmcid">PMC3785981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salathé</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Digital epidemiology: what is it, and where is it going?</article-title>
          <source>Life Sci Soc Policy</source>
          <year>2018</year>
          <month>01</month>
          <day>04</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29302758"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40504-017-0065-7</pub-id>
          <pub-id pub-id-type="medline">29302758</pub-id>
          <pub-id pub-id-type="pii">10.1186/s40504-017-0065-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5754279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mooney</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Westreich</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>El-Sayed</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Commentary: Epidemiology in the era of big data</article-title>
          <source>Epidemiology</source>
          <year>2015</year>
          <month>05</month>
          <volume>26</volume>
          <issue>3</issue>
          <fpage>390</fpage>
          <lpage>394</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25756221"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/EDE.0000000000000274</pub-id>
          <pub-id pub-id-type="medline">25756221</pub-id>
          <pub-id pub-id-type="pmcid">PMC4385465</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tin</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Mhurchu</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Bullen</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Supermarket sales data: feasibility and applicability in population food and nutrition monitoring</article-title>
          <source>Nutr Rev</source>
          <year>2007</year>
          <month>01</month>
          <volume>65</volume>
          <issue>1</issue>
          <fpage>20</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1753-4887.2007.tb00264.x</pub-id>
          <pub-id pub-id-type="medline">17310856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kesse-Guyot</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Assmann</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Andreeva</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Castetbon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Méjean</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Touvier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Salanave</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Deschamps</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Péneau</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fezeu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Julia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Allès</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Galan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hercberg</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Lessons Learned From Methodological Validation Research in E-Epidemiology</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2016</year>
          <month>10</month>
          <day>18</day>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e160</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2016/2/e160/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.5880</pub-id>
          <pub-id pub-id-type="medline">27756715</pub-id>
          <pub-id pub-id-type="pii">v2i2e160</pub-id>
          <pub-id pub-id-type="pmcid">PMC5087563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Méjean</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Szabo de Edelenyi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Touvier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kesse-Guyot</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Julia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Andreeva</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Hercberg</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Motives for participating in a web-based nutrition cohort according to sociodemographic, lifestyle, and health characteristics: the NutriNet-Santé cohort study</article-title>
          <source>J Med Internet Res</source>
          <year>2014</year>
          <month>08</month>
          <day>07</day>
          <volume>16</volume>
          <issue>8</issue>
          <fpage>e189</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2014/8/e189/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.3161</pub-id>
          <pub-id pub-id-type="medline">25135800</pub-id>
          <pub-id pub-id-type="pii">v16i8e189</pub-id>
          <pub-id pub-id-type="pmcid">PMC4137145</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pietilä</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Helander</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Korhonen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Myllymäki</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kujala</surname>
              <given-names>UM</given-names>
            </name>
            <name name-style="western">
              <surname>Lindholm</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Acute Effect of Alcohol Intake on Cardiovascular Autonomic Regulation During the First Hours of Sleep in a Large Real-World Sample of Finnish Employees: Observational Study</article-title>
          <source>JMIR Ment Health</source>
          <year>2018</year>
          <month>03</month>
          <day>16</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e23</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2018/1/e23/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.9519</pub-id>
          <pub-id pub-id-type="medline">29549064</pub-id>
          <pub-id pub-id-type="pii">v5i1e23</pub-id>
          <pub-id pub-id-type="pmcid">PMC5878366</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Helander</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Vuorinen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wansink</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Korhonen</surname>
              <given-names>IK</given-names>
            </name>
          </person-group>
          <article-title>Are breaks in daily self-weighing associated with weight gain?</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>11</issue>
          <fpage>e113164</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0113164"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0113164</pub-id>
          <pub-id pub-id-type="medline">25397613</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-21664</pub-id>
          <pub-id pub-id-type="pmcid">PMC4232563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sperrin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rushton</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Normand</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Villard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chieh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Buchan</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Who Self-Weighs and What Do They Gain From It? A Retrospective Comparison Between Smart Scale Users and the General Population in England</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <month>01</month>
          <day>21</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>e17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/1/e17/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4767</pub-id>
          <pub-id pub-id-type="medline">26794900</pub-id>
          <pub-id pub-id-type="pii">v18i1e17</pub-id>
          <pub-id pub-id-type="pmcid">PMC4742620</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olson</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Konty</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Paladini</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Viboud</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Simonsen</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Reassessing Google Flu Trends data for detection of seasonal and pandemic influenza: a comparative epidemiological study at three geographic scales</article-title>
          <source>PLoS Comput Biol</source>
          <year>2013</year>
          <volume>9</volume>
          <issue>10</issue>
          <fpage>e1003256</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1003256"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003256</pub-id>
          <pub-id pub-id-type="medline">24146603</pub-id>
          <pub-id pub-id-type="pii">PCOMPBIOL-D-13-00957</pub-id>
          <pub-id pub-id-type="pmcid">PMC3798275</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aledavood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Triana Hoyos</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Naslund</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Onnela</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Keshavan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Smartphone-Based Tracking of Sleep in Depression, Anxiety, and Psychotic Disorders</article-title>
          <source>Curr Psychiatry Rep</source>
          <year>2019</year>
          <month>06</month>
          <day>04</day>
          <volume>21</volume>
          <issue>7</issue>
          <fpage>49</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31161412"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11920-019-1043-y</pub-id>
          <pub-id pub-id-type="medline">31161412</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11920-019-1043-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6546650</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ekman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Litton</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>New times, new needs; e-epidemiology</article-title>
          <source>Eur J Epidemiol</source>
          <year>2007</year>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>285</fpage>
          <lpage>292</lpage>
          <pub-id pub-id-type="doi">10.1007/s10654-007-9119-0</pub-id>
          <pub-id pub-id-type="medline">17505896</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Moorhead</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bond</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>LeBlanc</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Petrella</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fiscella</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Who Uses Mobile Phone Health Apps and Does Use Matter? A Secondary Data Analytics Approach</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>04</month>
          <day>19</day>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>e125</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/4/e125/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5604</pub-id>
          <pub-id pub-id-type="medline">28428170</pub-id>
          <pub-id pub-id-type="pii">v19i4e125</pub-id>
          <pub-id pub-id-type="pmcid">PMC5415654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Who is Tracking Health on Mobile Devices: Behavioral Logfile Analysis in Hong Kong</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>05</month>
          <day>23</day>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>e13679</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/5/e13679/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13679</pub-id>
          <pub-id pub-id-type="medline">31120429</pub-id>
          <pub-id pub-id-type="pii">v7i5e13679</pub-id>
          <pub-id pub-id-type="pmcid">PMC6552450</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hargittai</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Potential Biases in Big Data: Omitted Voices on Social Media</article-title>
          <source>Social Science Computer Review</source>
          <year>2018</year>
          <month>07</month>
          <day>30</day>
          <volume>38</volume>
          <issue>1</issue>
          <fpage>10</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/0894439318788322"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0894439318788322</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nevalainen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Erkkola</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saarijärvi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Näppilä</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fogelholm</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Large-scale loyalty card data in health research</article-title>
          <source>Digit Health</source>
          <year>2018</year>
          <volume>4</volume>
          <fpage>2055207618816898</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30546912"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2055207618816898</pub-id>
          <pub-id pub-id-type="medline">30546912</pub-id>
          <pub-id pub-id-type="pii">10.1177_2055207618816898</pub-id>
          <pub-id pub-id-type="pmcid">PMC6287323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mamiya</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Moodie</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Buckeridge</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>A novel application of point-of-sales grocery transaction data to enhance community nutrition monitoring</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>1253</fpage>
          <lpage>1261</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854194"/>
          </comment>
          <pub-id pub-id-type="medline">29854194</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977589</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bandy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Adhikari</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Jebb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rayner</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The use of commercial food purchase data for public health nutrition research: A systematic review</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>e0210192</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0210192"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0210192</pub-id>
          <pub-id pub-id-type="medline">30615664</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-20802</pub-id>
          <pub-id pub-id-type="pmcid">PMC6322827</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Einav</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Leibtag</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nevo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Recording discrepancies in Nielsen Homescan data: Are they present and do they matter?</article-title>
          <source>Quant Mark Econ</source>
          <year>2009</year>
          <month>08</month>
          <day>25</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>207</fpage>
          <lpage>239</lpage>
          <pub-id pub-id-type="doi">10.1007/s11129-009-9073-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Appelhans</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>French</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Tangney</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Powell</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>To what extent do food purchases reflect shoppers' diet quality and nutrient intake?</article-title>
          <source>Int J Behav Nutr Phys Act</source>
          <year>2017</year>
          <month>04</month>
          <day>11</day>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>46</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ijbnpa.biomedcentral.com/articles/10.1186/s12966-017-0502-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12966-017-0502-2</pub-id>
          <pub-id pub-id-type="medline">28399887</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12966-017-0502-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5387266</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>French</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Wall</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Shimotsu</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Welsh</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Annotated receipts capture household food purchases from a broad range of sources</article-title>
          <source>Int J Behav Nutr Phys Act</source>
          <year>2009</year>
          <month>07</month>
          <day>01</day>
          <volume>6</volume>
          <fpage>37</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ijbnpa.biomedcentral.com/articles/10.1186/1479-5868-6-37"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1479-5868-6-37</pub-id>
          <pub-id pub-id-type="medline">19570234</pub-id>
          <pub-id pub-id-type="pii">1479-5868-6-37</pub-id>
          <pub-id pub-id-type="pmcid">PMC2714491</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>Finnish Grocery Trade Association</collab>
          </person-group>
          <source>Finnish Grocery Trade 2019</source>
          <year>2019</year>
          <publisher-loc>Helsinki</publisher-loc>
          <publisher-name>Finnish Grocery Trade Association</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Nutrition Unit of the National Institute for Health and Welfare (THL)</collab>
          </person-group>
          <article-title>Food Composition Database Release 20</article-title>
          <source>Fineli</source>
          <year>2019</year>
          <access-date>2019-01-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://fineli.fi">https://fineli.fi</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fogelholm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anderssen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gunnarsdottir</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lahti-Koski</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Dietary macronutrients and food consumption as determinants of long-term weight change in adult populations: a systematic literature review</article-title>
          <source>Food Nutr Res</source>
          <year>2012</year>
          <volume>56</volume>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3402/fnr.v56i0.19103"/>
          </comment>
          <pub-id pub-id-type="doi">10.3402/fnr.v56i0.19103</pub-id>
          <pub-id pub-id-type="medline">22893781</pub-id>
          <pub-id pub-id-type="pii">19103</pub-id>
          <pub-id pub-id-type="pmcid">PMC3418611</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fardet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boirie</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Associations between food and beverage groups and major diet-related chronic diseases: an exhaustive review of pooled/meta-analyses and systematic reviews</article-title>
          <source>Nutr Rev</source>
          <year>2014</year>
          <month>12</month>
          <volume>72</volume>
          <issue>12</issue>
          <fpage>741</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1111/nure.12153</pub-id>
          <pub-id pub-id-type="medline">25406801</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <source>StatFin statistical database</source>
          <access-date>2019-06-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://pxnet2.stat.fi/PXWeb/pxweb/en/StatFin/">http://pxnet2.stat.fi/PXWeb/pxweb/en/StatFin/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Koponen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Borodulin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lundqvist</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sääksjärvi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Koskinen</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Terveys, toimintakyky ja hyvinvointi Suomessa FinTerveys 2017-tutkimus</source>
          <year>2018</year>
          <publisher-loc>Helsinki</publisher-loc>
          <publisher-name>Terveyden ja hyvinvoinnin laitos (THL)</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Valsta</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kaartinen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Tapanainen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Männistö</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sääksjärvi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>Ravitsemus Suomessa - FinRavinto 2017 -tutkimus / Nutrition in Finland - The National FinDiet 2017 Survey</source>
          <year>2018</year>
          <publisher-loc>Helsinki</publisher-loc>
          <publisher-name>Terveyden ja hyvinvoinnin laitos (THL)</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lumley</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Analysis of Complex Survey Samples</article-title>
          <source>J. Stat. Soft</source>
          <year>2004</year>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>1</fpage>
          <lpage>19</lpage>
          <comment>R package version 2.2</comment>
          <pub-id pub-id-type="doi">10.18637/jss.v009.i08</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deming</surname>
              <given-names>WE</given-names>
            </name>
            <name name-style="western">
              <surname>Stephan</surname>
              <given-names>FF</given-names>
            </name>
          </person-group>
          <article-title>On a Least Squares Adjustment of a Sampled Frequency Table When the Expected Marginal Totals are Known</article-title>
          <source>Ann. Math. Statist</source>
          <year>1940</year>
          <month>12</month>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>427</fpage>
          <lpage>444</lpage>
          <pub-id pub-id-type="doi">10.1214/aoms/1177731829</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hebbali</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>rfm: Recency, Frequency and Monetary Value Analysis</article-title>
          <source>R package</source>
          <year>2020</year>
          <access-date>2020-06-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/rfm/index.html">https://cran.r-project.org/web/packages/rfm/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ekman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dickman</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Klint</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weiderpass</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Litton</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of using web-based questionnaires in large population-based epidemiological studies</article-title>
          <source>Eur J Epidemiol</source>
          <year>2006</year>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>103</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1007/s10654-005-6030-4</pub-id>
          <pub-id pub-id-type="medline">16518678</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Andreeva</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Salanave</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Castetbon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Deschamps</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vernay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kesse-Guyot</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hercberg</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the sociodemographic characteristics of the large NutriNet-Santé e-cohort with French Census data: the issue of volunteer bias revisited</article-title>
          <source>J Epidemiol Community Health</source>
          <year>2015</year>
          <month>09</month>
          <volume>69</volume>
          <issue>9</issue>
          <fpage>893</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1136/jech-2014-205263</pub-id>
          <pub-id pub-id-type="medline">25832451</pub-id>
          <pub-id pub-id-type="pii">jech-2014-205263</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reinikainen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tolonen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Borodulin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Härkänen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jousilahti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Karvanen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koskinen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kuulasmaa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Männistö</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rissanen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Vartiainen</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Participation rates by educational levels have diverged during 25 years in Finnish health examination surveys</article-title>
          <source>Eur J Public Health</source>
          <year>2018</year>
          <month>04</month>
          <day>01</day>
          <volume>28</volume>
          <issue>2</issue>
          <fpage>237</fpage>
          <lpage>243</lpage>
          <pub-id pub-id-type="doi">10.1093/eurpub/ckx151</pub-id>
          <pub-id pub-id-type="medline">29036286</pub-id>
          <pub-id pub-id-type="pii">4316094</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>Official Statistics of Finland</collab>
          </person-group>
          <source>Väestön tieto- ja viestintätekniikan käyttö [verkkojulkaisu]. Liitetaulukko 5. Kotitaloudessa internetyhteys 2017, %-osuus talouksista</source>
          <year>2017</year>
          <publisher-loc>Helsinki</publisher-loc>
          <publisher-name>Statistics Finland</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>Official Statistics of Finland</collab>
          </person-group>
          <source>Väestön tieto- ja viestintätekniikan käyttö [verkkojulkaisu]. Liitetaulukko 20. Internetin käyttö puheluihin, pikaviestintään älypuhelimella, sähköpostiin ja pilvitallentamiseen</source>
          <year>2017</year>
          <publisher-loc>Helsinki</publisher-loc>
          <publisher-name>Statistics Finland</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aiello</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Schifanella</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Quercia</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Del Prete</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Large-scale and high-resolution analysis of food purchases and health outcomes</article-title>
          <source>EPJ Data Sci</source>
          <year>2019</year>
          <month>04</month>
          <day>30</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>14</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1140/epjds/s13688-019-0191-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1140/epjds/s13688-019-0191-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Giskes</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Avendano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brug</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kunst</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of studies on socioeconomic inequalities in dietary intakes associated with weight gain and overweight/obesity conducted among European adults</article-title>
          <source>Obes Rev</source>
          <year>2010</year>
          <month>06</month>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>413</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1467-789X.2009.00658.x</pub-id>
          <pub-id pub-id-type="medline">19889178</pub-id>
          <pub-id pub-id-type="pii">OBR658</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fogelholm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kanerva</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Männistö</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Association between red and processed meat consumption and chronic diseases: the confounding role of other dietary factors</article-title>
          <source>Eur J Clin Nutr</source>
          <year>2015</year>
          <month>09</month>
          <volume>69</volume>
          <issue>9</issue>
          <fpage>1060</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1038/ejcn.2015.63</pub-id>
          <pub-id pub-id-type="medline">25969395</pub-id>
          <pub-id pub-id-type="pii">ejcn201563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Becker</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Comparability of household and individual food consumption data – evidence from Sweden</article-title>
          <source>Public Health Nutr</source>
          <year>2001</year>
          <month>10</month>
          <volume>4</volume>
          <issue>5B</issue>
          <fpage>1177</fpage>
          <lpage>1182</lpage>
          <pub-id pub-id-type="medline">11924944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saarijärvi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>Customer Value Co-Creation through Reverse Use of Customer Data</source>
          <year>2011</year>
          <publisher-loc>Tampere</publisher-loc>
          <publisher-name>Acta Universitatis Tamperensis</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Katajajuuri</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Silvennoinen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hartikainen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Heikkilä</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Reinikainen</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Food waste in the Finnish food chain</article-title>
          <source>Journal of Cleaner Production</source>
          <year>2014</year>
          <month>06</month>
          <volume>73</volume>
          <fpage>322</fpage>
          <lpage>329</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jclepro.2013.12.057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hansel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Roussel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diguet</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Deplaude</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bruckert</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Relationships between consumption of alcoholic beverages and healthy foods: the French supermarket cohort of 196,000 subjects</article-title>
          <source>Eur J Prev Cardiol</source>
          <year>2015</year>
          <month>02</month>
          <volume>22</volume>
          <issue>2</issue>
          <fpage>215</fpage>
          <lpage>222</lpage>
          <pub-id pub-id-type="doi">10.1177/2047487313506829</pub-id>
          <pub-id pub-id-type="medline">24065742</pub-id>
          <pub-id pub-id-type="pii">2047487313506829</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Willett</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Rockström</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Loken</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Springmann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Vermeulen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Garnett</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tilman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>DeClerck</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jonell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fanzo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hawkes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zurayk</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rivera</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>De Vries</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Majele Sibanda</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Afshin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhary</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Herrero</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Agustina</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Branca</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lartey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Crona</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bignet</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Troell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lindahl</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cornell</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Srinath Reddy</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Narain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nishtar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>Food in the Anthropocene: the EAT-Lancet Commission on healthy diets from sustainable food systems</article-title>
          <source>Lancet</source>
          <year>2019</year>
          <month>02</month>
          <day>02</day>
          <volume>393</volume>
          <issue>10170</issue>
          <fpage>447</fpage>
          <lpage>492</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(18)31788-4</pub-id>
          <pub-id pub-id-type="medline">30660336</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(18)31788-4</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
