<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: CSV log unexpectedly breaking by lines in Getting Data In</title>
    <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678346#M113356</link>
    <description>&lt;P&gt;The props.conf settings are missing &lt;FONT face="courier new,courier"&gt;TIME_FORMAT&lt;/FONT&gt;.&amp;nbsp; Other settings may need to be changed, but we need to see the raw data (the CSV file before it gets to Splunk) to determine that.&lt;/P&gt;</description>
    <pubDate>Thu, 22 Feb 2024 14:55:00 GMT</pubDate>
    <dc:creator>richgalloway</dc:creator>
    <dc:date>2024-02-22T14:55:00Z</dc:date>
    <item>
      <title>CSV log unexpectedly breaking by lines</title>
      <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678092#M113326</link>
      <description>&lt;P&gt;Hello everyone!&lt;BR /&gt;I have a Windows server with Splunk UF installed that consumes MS Exchange logs&lt;BR /&gt;These logs are stored in CSV format&lt;BR /&gt;&lt;BR /&gt;Splunk UF settings look like this:&lt;BR /&gt;props.conf&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;[exch_file_httpproxy-mapi]
ANNOTATE_PUNCT = false
BREAK_ONLY_BEFORE_DATE = true
INDEXED_EXTRACTIONS = csv
initCrcLength = 2735
HEADER_FIELD_LINE_NUMBER = 1
MAX_TIMESTAMP_LOOKAHEAD = 24
SHOULD_LINEMERGE = false
TIMESTAMP_FIELDS = DateTime
TRANSFORMS-no_column_headers = no_column_headers&lt;/LI-CODE&gt;&lt;P&gt;transforms.conf&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;[no_column_headers]
REGEX = ^#.*
DEST_KEY = queue
FORMAT = nullQueue&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks to the data quality report on the indexer layer, I found out that this source type has some timestamp issues&lt;BR /&gt;I investigated this problem by running a search on the search head layer and found surprising event breaking&lt;BR /&gt;You can see an example in the attachment&lt;BR /&gt;The _raw data is OK and does not contain "unexpected" newline characters&lt;/P&gt;&lt;P&gt;What is wrong with my settings?&lt;/P&gt;</description>
      <pubDate>Tue, 20 Feb 2024 14:55:56 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678092#M113326</guid>
      <dc:creator>NoSpaces</dc:creator>
      <dc:date>2024-02-20T14:55:56Z</dc:date>
    </item>
    <item>
      <title>Re: CSV log unexpectedly breaking by lines</title>
      <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678313#M113354</link>
      <description>&lt;P&gt;Up&lt;/P&gt;</description>
      <pubDate>Thu, 22 Feb 2024 09:23:08 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678313#M113354</guid>
      <dc:creator>NoSpaces</dc:creator>
      <dc:date>2024-02-22T09:23:08Z</dc:date>
    </item>
    <item>
      <title>Re: CSV log unexpectedly breaking by lines</title>
      <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678346#M113356</link>
      <description>&lt;P&gt;The props.conf settings are missing &lt;FONT face="courier new,courier"&gt;TIME_FORMAT&lt;/FONT&gt;.&amp;nbsp; Other settings may need to be changed, but we need to see the raw data (the CSV file before it gets to Splunk) to determine that.&lt;/P&gt;</description>
      <pubDate>Thu, 22 Feb 2024 14:55:00 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678346#M113356</guid>
      <dc:creator>richgalloway</dc:creator>
      <dc:date>2024-02-22T14:55:00Z</dc:date>
    </item>
    <item>
      <title>Re: CSV log unexpectedly breaking by lines</title>
      <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678477#M113384</link>
      <description>&lt;P&gt;Is TIME_FORMAT necessary? Events that are not broken have no problem with timestamp determination&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;This is the log example that contains headers, a preamble, and one event&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;DateTime,RequestId,MajorVersion,MinorVersion,BuildVersion,RevisionVersion,ClientRequestId,Protocol,UrlHost,UrlStem,ProtocolAction,AuthenticationType,IsAuthenticated,AuthenticatedUser,Organization,AnchorMailbox,UserAgent,ClientIpAddress,ServerHostName,HttpStatus,BackEndStatus,ErrorCode,Method,ProxyAction,TargetServer,TargetServerVersion,RoutingType,RoutingHint,BackEndCookie,ServerLocatorHost,ServerLocatorLatency,RequestBytes,ResponseBytes,TargetOutstandingRequests,AuthModulePerfContext,HttpPipelineLatency,CalculateTargetBackEndLatency,GlsLatencyBreakup,TotalGlsLatency,AccountForestLatencyBreakup,TotalAccountForestLatency,ResourceForestLatencyBreakup,TotalResourceForestLatency,ADLatency,SharedCacheLatencyBreakup,TotalSharedCacheLatency,ActivityContextLifeTime,ModuleToHandlerSwitchingLatency,ClientReqStreamLatency,BackendReqInitLatency,BackendReqStreamLatency,BackendProcessingLatency,BackendRespInitLatency,BackendRespStreamLatency,ClientRespStreamLatency,KerberosAuthHeaderLatency,HandlerCompletionLatency,RequestHandlerLatency,HandlerToModuleSwitchingLatency,ProxyTime,CoreLatency,RoutingLatency,HttpProxyOverhead,TotalRequestTime,RouteRefresherLatency,UrlQuery,BackEndGenericInfo,GenericInfo,GenericErrors,EdgeTraceId,DatabaseGuid,UserADObjectGuid,PartitionEndpointLookupLatency,RoutingStatus
#Software: Microsoft Exchange Server
#Version: 15.02.1118.040
#Log-type: HttpProxy Logs
#Date: 2024-02-20T14:00:01.019Z
#Fields: DateTime,RequestId,MajorVersion,MinorVersion,BuildVersion,RevisionVersion,ClientRequestId,Protocol,UrlHost,UrlStem,ProtocolAction,AuthenticationType,IsAuthenticated,AuthenticatedUser,Organization,AnchorMailbox,UserAgent,ClientIpAddress,ServerHostName,HttpStatus,BackEndStatus,ErrorCode,Method,ProxyAction,TargetServer,TargetServerVersion,RoutingType,RoutingHint,BackEndCookie,ServerLocatorHost,ServerLocatorLatency,RequestBytes,ResponseBytes,TargetOutstandingRequests,AuthModulePerfContext,HttpPipelineLatency,CalculateTargetBackEndLatency,GlsLatencyBreakup,TotalGlsLatency,AccountForestLatencyBreakup,TotalAccountForestLatency,ResourceForestLatencyBreakup,TotalResourceForestLatency,ADLatency,SharedCacheLatencyBreakup,TotalSharedCacheLatency,ActivityContextLifeTime,ModuleToHandlerSwitchingLatency,ClientReqStreamLatency,BackendReqInitLatency,BackendReqStreamLatency,BackendProcessingLatency,BackendRespInitLatency,BackendRespStreamLatency,ClientRespStreamLatency,KerberosAuthHeaderLatency,HandlerCompletionLatency,RequestHandlerLatency,HandlerToModuleSwitchingLatency,ProxyTime,CoreLatency,RoutingLatency,HttpProxyOverhead,TotalRequestTime,RouteRefresherLatency,UrlQuery,BackEndGenericInfo,GenericInfo,GenericErrors,EdgeTraceId,DatabaseGuid,UserADObjectGuid,PartitionEndpointLookupLatency,RoutingStatus
2024-02-20T14:00:00.980Z,c3581a8e-2033-4fa0-8dbf-3efdc06ba7c3,15,2,1118,40,{5745B4EE-6A69-4E12-8EBD-6AD2820CA5D1},Mapi,mail.domain.com,/mapi/nspi/,,,false,,,,Microsoft Office/15.0 (Windows NT 10.0; Microsoft Outlook 15.0.5589; Pro),172.16.5.94,SERVERMBX06,401,,,POST,,,,,,,,,13,,,,,,,,,,,,,,,38,,,,,,,,,,,,,,0,,0,0,,?MailboxId=5918ae5a-9281-4301-b94e-407395ba2824@domain.com,,BeginRequest=2024-02-20T14:00:00.980Z;CorrelationID=&amp;lt;empty&amp;gt;;SharedCacheGuard=0;EndRequest=2024-02-20T14:00:00.980Z;S:ServiceLatencyMetadata.AuthModuleLatency=0,,,,,,&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 23 Feb 2024 12:41:42 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678477#M113384</guid>
      <dc:creator>NoSpaces</dc:creator>
      <dc:date>2024-02-23T12:41:42Z</dc:date>
    </item>
    <item>
      <title>Re: CSV log unexpectedly breaking by lines</title>
      <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678486#M113385</link>
      <description>&lt;P&gt;&lt;FONT face="courier new,courier"&gt;TIME_FORMAT&lt;/FONT&gt; is one of the "Great 8" settings every sourcetype should have.&amp;nbsp; They help ensure events are onboarded properly.&amp;nbsp; See if these settings help.&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;[exch_file_httpproxy-mapi]
ANNOTATE_PUNCT = false
LINE_BREAKER = ([\r\n]+)\d\d\d\d-\d\d
INDEXED_EXTRACTIONS = csv
initCrcLength = 2735
HEADER_FIELD_LINE_NUMBER = 1
MAX_TIMESTAMP_LOOKAHEAD = 24
SHOULD_LINEMERGE = false
TIMESTAMP_FIELDS = DateTime
TIME_FORMAT = %Y-%m-%dT%H:%M:%S.%3N%Z
TRANSFORMS-no_column_headers = no_column_headers
EVENT_BREAKER_ENABLE = true
EVENT_BREAKER = ([\r\n]+)\d\d\d\d-\d\d
TRUNCATE = 10000&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 23 Feb 2024 13:51:26 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/678486#M113385</guid>
      <dc:creator>richgalloway</dc:creator>
      <dc:date>2024-02-23T13:51:26Z</dc:date>
    </item>
    <item>
      <title>Re: CSV log unexpectedly breaking by lines</title>
      <link>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/679761#M113588</link>
      <description>&lt;P&gt;Sorry for the late reply&lt;BR /&gt;I tested your settings and I can&amp;nbsp;say with confidence that there is no difference&lt;BR /&gt;Events still break unexpectedly&lt;/P&gt;</description>
      <pubDate>Wed, 06 Mar 2024 10:42:14 GMT</pubDate>
      <guid>https://community.splunk.com/t5/Getting-Data-In/CSV-log-unexpectedly-breaking-by-lines/m-p/679761#M113588</guid>
      <dc:creator>NoSpaces</dc:creator>
      <dc:date>2024-03-06T10:42:14Z</dc:date>
    </item>
  </channel>
</rss>

