Skip to content

Commit 814dc61

Browse files
committed
update test files for code ID
1 parent d9827c7 commit 814dc61

37 files changed

+190
-190
lines changed

examples/2408.09869v3.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1316,7 +1316,7 @@
13161316
"captions": [],
13171317
"references": [],
13181318
"footnotes": [],
1319-
"code_language": "unknown"
1319+
"code_language": "Python"
13201320
},
13211321
{
13221322
"self_ref": "#/texts/23",
@@ -1347,7 +1347,7 @@
13471347
"captions": [],
13481348
"references": [],
13491349
"footnotes": [],
1350-
"code_language": "unknown"
1350+
"code_language": "Python"
13511351
},
13521352
{
13531353
"self_ref": "#/texts/24",

test/data/chunker/0_inp_dl_doc.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1317,7 +1317,7 @@
13171317
"captions": [],
13181318
"references": [],
13191319
"footnotes": [],
1320-
"code_language": "unknown"
1320+
"code_language": "Python"
13211321
},
13221322
{
13231323
"self_ref": "#/texts/23",
@@ -1348,7 +1348,7 @@
13481348
"captions": [],
13491349
"references": [],
13501350
"footnotes": [],
1351-
"code_language": "unknown"
1351+
"code_language": "Python"
13521352
},
13531353
{
13541354
"self_ref": "#/texts/24",

test/data/chunker_repo/C/repo_out_chunks.json

Lines changed: 37 additions & 37 deletions
Large diffs are not rendered by default.

test/data/chunker_repo/Java/repo_out_chunks.json

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
33
{
44
"text": "package com.acmeair;\n\npublic interface AcmeAirConstants {\n\n\t\n}",
55
"meta": {
6-
"schema_name": "docling_core.transforms.chunker.DocMeta",
6+
"schema_name": "docling_core.transforms.chunker.CodeDocMeta",
77
"version": "1.0.0",
88
"origin": {
99
"mimetype": "text/plain",
@@ -23,7 +23,7 @@
2323
{
2424
"text": "package com.acmeair.loader;\nimport com.acmeair.entities.Customer.PhoneType;\nimport com.acmeair.entities.Customer;\nimport com.acmeair.entities.CustomerAddress;\nimport com.acmeair.service.CustomerService;\nimport com.acmeair.service.ServiceLocator;\npublic class CustomerLoader {\n\n private CustomerService customerService = ServiceLocator.instance().getService(CustomerService.class);} public void loadCustomers(long numCustomers) {\n\t\tCustomerAddress address = customerService.createAddress(\"123 Main St.\", null, \"Anytown\", \"NC\", \"USA\", \"27617\");\n\t\tfor (long ii = 0; ii < numCustomers; ii++) {\n\t\t\tcustomerService.createCustomer(\"uid\"+ii+\"@email.com\", \"password\", Customer.MemberShipStatus.GOLD, 1000000, 1000, \"919-123-4567\", PhoneType.BUSINESS, address);\n\t\t}\n\t}",
2525
"meta": {
26-
"schema_name": "docling_core.transforms.chunker.DocMeta",
26+
"schema_name": "docling_core.transforms.chunker.CodeDocMeta",
2727
"version": "1.0.0",
2828
"origin": {
2929
"mimetype": "text/plain",
@@ -43,7 +43,7 @@
4343
{
4444
"text": "package com.acmeair.loader;\nimport com.acmeair.entities.AirportCodeMapping;\nimport com.acmeair.service.FlightService;\nimport com.acmeair.service.ServiceLocator;\nimport java.io.InputStream;\nimport java.io.InputStreamReader;\nimport java.io.LineNumberReader;\nimport java.math.*;\nimport java.util.*;\npublic class FlightLoader {\n\n private static final int MAX_FLIGHTS_PER_SEGMENT = 30; private FlightService flightService = ServiceLocator.instance().getService(FlightService.class);} public void loadFlights() throws Exception {\n\t\tInputStream csvInputStream = FlightLoader.class.getResourceAsStream(\"/mileage.csv\");\n\t\t\n\t\tLineNumberReader lnr = new LineNumberReader(new InputStreamReader(csvInputStream));\n\t\tString line1 = lnr.readLine();\n\t\tStringTokenizer st = new StringTokenizer(line1, \",\");\n\t\tArrayList<AirportCodeMapping> airports = new ArrayList<AirportCodeMapping>();\n\t\t\n\t\t// read the first line which are airport names\n\t\twhile (st.hasMoreTokens()) {\n\t\t\tAirportCodeMapping acm = flightService.createAirportCodeMapping(null, st.nextToken());\n\t\t//\tacm.setAirportName(st.nextToken());\n\t\t\tairports.add(acm);\n\t\t}\n\t\t// read the second line which contains matching airport codes for the first line\n\t\tString line2 = lnr.readLine();\n\t\tst = new StringTokenizer(line2, \",\");\n\t\tint ii = 0;\n\t\twhile (st.hasMoreTokens()) {\n\t\t\tString airportCode = st.nextToken();\n\t\t\tairports.get(ii).setAirportCode(airportCode);\n\t\t\tii++;\n\t\t}\n\t\t// read the other lines which are of format:\n\t\t// airport name, aiport code, distance from this airport to whatever airport is in the column from lines one and two\n\t\tString line;\n\t\tint flightNumber = 0;\n\t\twhile (true) {\n\t\t\tline = lnr.readLine();\n\t\t\tif (line == null || line.trim().equals(\"\")) {\n\t\t\t\tbreak;\n\t\t\t}\n\t\t\tst = new StringTokenizer(line, \",\");\n\t\t\tString airportName = st.nextToken();\n\t\t\tString airportCode = st.nextToken();\n\t\t\tif (!alreadyInCollection(airportCode, airports)) {\n\t\t\t\tAirportCodeMapping acm = flightService.createAirportCodeMapping(airportCode, airportName);\n\t\t\t\tairports.add(acm);\n\t\t\t}\n\t\t\tint indexIntoTopLine = 0;\n\t\t\twhile (st.hasMoreTokens()) {\n\t\t\t\tString milesString = st.nextToken();\n\t\t\t\tif (milesString.equals(\"NA\")) {\n\t\t\t\t\tindexIntoTopLine++;\n\t\t\t\t\tcontinue;\n\t\t\t\t}\n\t\t\t\tint miles = Integer.parseInt(milesString);\n\t\t\t\tString toAirport = airports.get(indexIntoTopLine).getAirportCode();\n\t\t\t\tString flightId = \"AA\" + flightNumber;\t\t\t\n\t\t\t\tflightService.storeFlightSegment(flightId, airportCode, toAirport, miles);\n\t\t\t\tDate now = new Date();\n\t\t\t\tfor (int daysFromNow = 0; daysFromNow < MAX_FLIGHTS_PER_SEGMENT; daysFromNow++) {\n\t\t\t\t\tCalendar c = Calendar.getInstance();\n\t\t\t\t\tc.setTime(now);\n\t\t\t\t\tc.set(Calendar.HOUR_OF_DAY, 0);\n\t\t\t\t c.set(Calendar.MINUTE, 0);\n\t\t\t\t c.set(Calendar.SECOND, 0);\n\t\t\t\t c.set(Calendar.MILLISECOND, 0);\n\t\t\t\t\tc.add(Calendar.DATE, daysFromNow);\n\t\t\t\t\tDate departureTime = c.getTime();\n\t\t\t\t\tDate arrivalTime = getArrivalTime(departureTime, miles);\n\t\t\t\t\tflightService.createNewFlight(flightId, departureTime, arrivalTime, new BigDecimal(500), new BigDecimal(200), 10, 200, \"B747\");\n\t\t\t\t\t\n\t\t\t\t}\n\t\t\t\tflightNumber++;\n\t\t\t\tindexIntoTopLine++;\n\t\t\t}\n\t\t}\n\t\t\n\t\tfor (int jj = 0; jj < airports.size(); jj++) {\n\t\t\tflightService.storeAirportMapping(airports.get(jj));\n\t\t}\n\t\tlnr.close();\n\t}",
4545
"meta": {
46-
"schema_name": "docling_core.transforms.chunker.DocMeta",
46+
"schema_name": "docling_core.transforms.chunker.CodeDocMeta",
4747
"version": "1.0.0",
4848
"origin": {
4949
"mimetype": "text/plain",
@@ -63,7 +63,7 @@
6363
{
6464
"text": "package com.acmeair.loader;\nimport com.acmeair.service.FlightService;\nimport com.acmeair.service.ServiceLocator;\nimport java.math.*;\nimport java.util.*;\npublic class FlightLoader {\n\n private static final int MAX_FLIGHTS_PER_SEGMENT = 30; private FlightService flightService = ServiceLocator.instance().getService(FlightService.class);} private static Date getArrivalTime(Date departureTime, int mileage) {\n\t\tdouble averageSpeed = 600.0; // 600 miles/hours\n\t\tdouble hours = (double) mileage / averageSpeed; // miles / miles/hour = hours\n\t\tdouble partsOfHour = hours % 1.0;\n\t\tint minutes = (int)(60.0 * partsOfHour);\n\t\tCalendar c = Calendar.getInstance();\n\t\tc.setTime(departureTime);\n\t\tc.add(Calendar.HOUR, (int)hours);\n\t\tc.add(Calendar.MINUTE, minutes);\n\t\treturn c.getTime();\n\t}",
6565
"meta": {
66-
"schema_name": "docling_core.transforms.chunker.DocMeta",
66+
"schema_name": "docling_core.transforms.chunker.CodeDocMeta",
6767
"version": "1.0.0",
6868
"origin": {
6969
"mimetype": "text/plain",
@@ -83,7 +83,7 @@
8383
{
8484
"text": "package com.acmeair.loader;\nimport com.acmeair.entities.AirportCodeMapping;\nimport com.acmeair.service.FlightService;\nimport com.acmeair.service.ServiceLocator;\nimport java.math.*;\nimport java.util.*;\npublic class FlightLoader {\n\n private static final int MAX_FLIGHTS_PER_SEGMENT = 30; private FlightService flightService = ServiceLocator.instance().getService(FlightService.class);} static private boolean alreadyInCollection(String airportCode, ArrayList<AirportCodeMapping> airports) {\n\t\tfor (int ii = 0; ii < airports.size(); ii++) {\n\t\t\tif (airports.get(ii).getAirportCode().equals(airportCode)) {\n\t\t\t\treturn true;\n\t\t\t}\n\t\t}\n\t\treturn false;\n\t}",
8585
"meta": {
86-
"schema_name": "docling_core.transforms.chunker.DocMeta",
86+
"schema_name": "docling_core.transforms.chunker.CodeDocMeta",
8787
"version": "1.0.0",
8888
"origin": {
8989
"mimetype": "text/plain",

0 commit comments

Comments
 (0)