CintraAI commited on
Commit
a50881d
·
1 Parent(s): ce480bd

Add tests for Go, CSS, and various programming languages

Browse files

- Introduced a new test suite for Go language support, validating chunking functionality for simple code, structs, interfaces, and goroutines.
- Added test cases for CSS chunking, covering both media queries and simple styles.
- Established a base test class for code chunking tests, allowing for consistent setup and utility methods across different language tests.
- Created individual test files for JavaScript, PHP, Python, Ruby, TypeScript, and CSS, ensuring comprehensive coverage of chunking functionality across multiple languages.

mock_codefiles.json CHANGED
@@ -15,7 +15,7 @@
15
  "main.js": "const express = require('express');\nconst routes = require('./routes');\n\n// Create the Express application\nconst app = express();\n\n// Register the routes from the routes.js file\napp.use('/', routes);\n\n// Configuration settings for the app can go here\napp.set('port', process.env.PORT || 3000);\n\n// More complex app initialization steps can be added here\n// For example, database initialization, middleware setups, etc.\n\n// This function can be used to create a database schema\nfunction createDatabase() {\n // Code to create database schema\n console.log('Created Database!');\n}\n\n// Optionally, call database creation or other setup functions here\ncreateDatabase();\n\n// Start the server\napp.listen(app.get('port'), () => {\n console.log(`Server running on port ${app.get('port')}`);\n});",
16
  "utilities.js": "// Example of utility functions for common tasks\n\n// Function to hash a password\nfunction hashPassword(password) {\n const salt = uuidv4();\n return sha256(salt + password) + ':' + salt;\n}\n\n// Function to check a hashed password\nfunction checkPassword(hashedPassword, userPassword) {\n const [password, salt] = hashedPassword.split(':');\n return sha256(salt + userPassword) === password;\n}\n\n// Function to validate an email address\nfunction validateEmail(email) {\n const pattern = /^[a-zA-Z0-9_.+-]+@[a-zA-Z0-9-]+\\.[a-zA-Z0-9-.]+$/;\n return pattern.test(email);\n}\n\n// Function to generate a token expiration date\nfunction generateExpirationDate(days = 1) {\n const expirationDate = new Date();\n expirationDate.setDate(expirationDate.getDate() + days);\n return expirationDate;\n}\n\n// Function to convert a string to a Date object\nfunction stringToDate(dateString, format = 'YYYY-MM-DD HH:mm:ss') {\n return new Date(dateString);\n}\n\n// Function to convert a Date object to a string\nfunction dateToString(date, format = 'YYYY-MM-DD HH:mm:ss') {\n return date.toISOString();\n}",
17
  "services.js": "// Example of service functions for handling data operations\n\n// Function to fetch data from an external API\nasync function fetchExternalData(apiUrl) {\n try {\n const response = await fetch(apiUrl);\n if (response.ok) {\n return await response.json();\n } else {\n return { error: 'Failed to fetch data' };\n }\n } catch (error) {\n return { error: error.message };\n }\n}\n\n// Function to save user data to the database\nasync function saveUserData(name, email) {\n try {\n const newUser = new UserData({ name, email });\n await newUser.save();\n return { message: 'User saved successfully' };\n } catch (error) {\n return { error: error.message };\n }\n}\n\n// Function to update user data in the database\nasync function updateUserData(userId, name, email) {\n try {\n const user = await UserData.findById(userId);\n if (!user) {\n return { error: 'User not found' };\n }\n if (name) {\n user.name = name;\n }\n if (email) {\n user.email = email;\n }\n await user.save();\n return { message: 'User updated successfully' };\n } catch (error) {\n return { error: error.message };\n }\n}\n\n// Function to delete user data from the database\nasync function deleteUserData(userId) {\n try {\n const user = await UserData.findById(userId);\n if (!user) {\n return { error: 'User not found' };\n }\n await user.remove();\n return { message: 'User deleted successfully' };\n } catch (error) {\n return { error: error.message };\n }\n}",
18
- "react_component.js": "import React from 'react';\n\nimport './SearchResults.css';\n\nimport TrackList from '../TrackList/TrackList.js';\n\n constructor(props) {\n super(props);\n this.addTopFive = this.addTopFive.bind(this);\n this.addTopTen = this.addTopTen.bind(this);\n this.addAll = this.addAll.bind(this);\n }\n\n //add the top five tracks to the playlist\n addTopFive() {\n this.props.onAdd(this.props.searchResults.slice(0, 5));\n }\n\n //add top 10 tracks to the playlist\n addTopTen() {\n this.props.onAdd(this.props.searchResults.slice(0, 10));\n }\n\n addAll() {\n this.props.onAdd(this.props.searchResults);\n }\n render() {\n return (\n <div className=\"SearchResults\">\n <h2>Results</h2>\n <TrackList tracks={this.props.searchResults} onAdd={this.props.onAdd} onToggle={this.props.onToggle} currentTrack={this.props.currentTrack}/>\n </div>\n );\n }\n}\n\nexport default SearchResults;'",
19
  "simple_styles.css": "/* Example of CSS styles for a web page */\n\nbody {\n font-family: Arial, sans-serif;\n background-color: #f4f4f4;\n margin: 0;\n padding: 0;\n}\n\nh1 {\n color: #333;\n text-align: center;\n}\n\nbutton {\n padding: 10px 20px;\n font-size: 16px;\n background-color: #007bff;\n color: #fff;\n border: none;\n cursor: pointer;\n}\n\nbutton:hover {\n background-color: #0056b3;\n}",
20
  "media_queries.css": "/* Example of CSS styles with media queries for responsive design */\n\nbody {\n font-family: Arial, sans-serif;\n background-color: #f4f4f4;\n margin: 0;\n padding: 0;\n}\n\nh1 {\n color: #333;\n text-align: center;\n}\n\nbutton {\n padding: 10px 20px;\n font-size: 16px;\n background-color: #007bff;\n color: #fff;\n border: none;\n cursor: pointer;\n}\n\nbutton:hover {\n background-color: #0056b3;\n}\n\n/* Media query for smaller screens */\n@media (max-width: 768px) {\n button {\n padding: 8px 16px;\n font-size: 14px;\n }\n}",
21
  "single_syntax_error_example.py": "# This is a sample Python file\n\nprint('Hello, world!'\n\n",
@@ -26,5 +26,9 @@
26
  "multiple_syntax_errors.css": "body {\n font-family: Arial, sans-serif;\n background-color: #f4f4f4;\n margin: 0;\n padding: 0;\n}\n\nh1 {\n color: #333;\n text-align: center;\n}\n\nbutton {\n padding: 10px 20px;\n font-size: 16px;\n background-color: #007bff;\n color: #fff;\n border: none;\n cursor: pointer;\n :hover {\n background-color: #0056b3;\n}\n\n/* Media query for smaller screens */\n@media (max-width: 768px) {\n button {\n padding: 8px 16px;\n font-size: 14px;\n }\n}",
27
  "example.ts": "interface User {\n id: number;\n name: string;\n email: string;\n}\n\nclass UserManager {\n private users: User[] = [];\n\n addUser(user: User): void {\n this.users.push(user);\n }\n\n getUser(id: number): User | undefined {\n return this.users.find(user => user.id === id);\n }\n\n updateUser(id: number, updatedUser: Partial<User>): void {\n const userIndex = this.users.findIndex(user => user.id === id);\n if (userIndex !== -1) {\n this.users[userIndex] = { ...this.users[userIndex], ...updatedUser };\n }\n }\n\n deleteUser(id: number): void {\n this.users = this.users.filter(user => user.id !== id);\n }\n}\n\nconst userManager = new UserManager();\nuserManager.addUser({ id: 1, name: 'John Doe', email: '[email protected]' });\nconsole.log(userManager.getUser(1));",
28
  "example.rb": "class User\n attr_accessor :id, :name, :email\n\n def initialize(id, name, email)\n @id = id\n @name = name\n @email = email\n end\n\n def to_s\n \"User: #{@name} (#{@email})\"\n end\nend\n\nclass UserManager\n def initialize\n @users = []\n end\n\n def add_user(user)\n @users << user\n end\n\n def get_user(id)\n @users.find { |user| user.id == id }\n end\n\n def update_user(id, updated_user)\n user = get_user(id)\n user.name = updated_user.name if updated_user.name\n user.email = updated_user.email if updated_user.email\n end\n\n def delete_user(id)\n @users.delete_if { |user| user.id == id }\n end\nend\n\nuser_manager = UserManager.new\nuser_manager.add_user(User.new(1, 'John Doe', '[email protected]'))\nputs user_manager.get_user(1)",
29
- "example.php": "<?php\n\nclass User {\n public $id;\n public $name;\n public $email;\n\n public function __construct($id, $name, $email) {\n $this->id = $id;\n $this->name = $name;\n $this->email = $email;\n }\n}\n\nclass UserManager {\n private $users = [];\n\n public function addUser($user) {\n $this->users[] = $user;\n }\n\n public function getUser($id) {\n foreach ($this->users as $user) {\n if ($user->id === $id) {\n return $user;\n }\n }\n return null;\n }\n\n public function updateUser($id, $updatedUser) {\n foreach ($this->users as &$user) {\n if ($user->id === $id) {\n $user->name = $updatedUser->name ?? $user->name;\n $user->email = $updatedUser->email ?? $user->email;\n break;\n }\n }\n }\n\n public function deleteUser($id) {\n $this->users = array_filter($this->users, function($user) use ($id) {\n return $user->id !== $id;\n });\n }\n}\n\n$userManager = new UserManager();\n$userManager->addUser(new User(1, 'John Doe', '[email protected]'));\nvar_dump($userManager->getUser(1));\n?>"
 
 
 
 
30
  }
 
15
  "main.js": "const express = require('express');\nconst routes = require('./routes');\n\n// Create the Express application\nconst app = express();\n\n// Register the routes from the routes.js file\napp.use('/', routes);\n\n// Configuration settings for the app can go here\napp.set('port', process.env.PORT || 3000);\n\n// More complex app initialization steps can be added here\n// For example, database initialization, middleware setups, etc.\n\n// This function can be used to create a database schema\nfunction createDatabase() {\n // Code to create database schema\n console.log('Created Database!');\n}\n\n// Optionally, call database creation or other setup functions here\ncreateDatabase();\n\n// Start the server\napp.listen(app.get('port'), () => {\n console.log(`Server running on port ${app.get('port')}`);\n});",
16
  "utilities.js": "// Example of utility functions for common tasks\n\n// Function to hash a password\nfunction hashPassword(password) {\n const salt = uuidv4();\n return sha256(salt + password) + ':' + salt;\n}\n\n// Function to check a hashed password\nfunction checkPassword(hashedPassword, userPassword) {\n const [password, salt] = hashedPassword.split(':');\n return sha256(salt + userPassword) === password;\n}\n\n// Function to validate an email address\nfunction validateEmail(email) {\n const pattern = /^[a-zA-Z0-9_.+-]+@[a-zA-Z0-9-]+\\.[a-zA-Z0-9-.]+$/;\n return pattern.test(email);\n}\n\n// Function to generate a token expiration date\nfunction generateExpirationDate(days = 1) {\n const expirationDate = new Date();\n expirationDate.setDate(expirationDate.getDate() + days);\n return expirationDate;\n}\n\n// Function to convert a string to a Date object\nfunction stringToDate(dateString, format = 'YYYY-MM-DD HH:mm:ss') {\n return new Date(dateString);\n}\n\n// Function to convert a Date object to a string\nfunction dateToString(date, format = 'YYYY-MM-DD HH:mm:ss') {\n return date.toISOString();\n}",
17
  "services.js": "// Example of service functions for handling data operations\n\n// Function to fetch data from an external API\nasync function fetchExternalData(apiUrl) {\n try {\n const response = await fetch(apiUrl);\n if (response.ok) {\n return await response.json();\n } else {\n return { error: 'Failed to fetch data' };\n }\n } catch (error) {\n return { error: error.message };\n }\n}\n\n// Function to save user data to the database\nasync function saveUserData(name, email) {\n try {\n const newUser = new UserData({ name, email });\n await newUser.save();\n return { message: 'User saved successfully' };\n } catch (error) {\n return { error: error.message };\n }\n}\n\n// Function to update user data in the database\nasync function updateUserData(userId, name, email) {\n try {\n const user = await UserData.findById(userId);\n if (!user) {\n return { error: 'User not found' };\n }\n if (name) {\n user.name = name;\n }\n if (email) {\n user.email = email;\n }\n await user.save();\n return { message: 'User updated successfully' };\n } catch (error) {\n return { error: error.message };\n }\n}\n\n// Function to delete user data from the database\nasync function deleteUserData(userId) {\n try {\n const user = await UserData.findById(userId);\n if (!user) {\n return { error: 'User not found' };\n }\n await user.remove();\n return { message: 'User deleted successfully' };\n } catch (error) {\n return { error: error.message };\n }\n}",
18
+ "react_component.js": "import React from 'react';\n\nimport './SearchResults.css';\n\nimport TrackList from '../TrackList/TrackList.js';\n\n constructor(props) {\n super(props);\n this.addTopFive = this.addTopFive.bind(this);\n this.addTopTen = this.addTopTen.bind(this);\n this.addAll = this.addAll.bind(this);\n }\n\n //add the top five tracks to the playlist\n addTopFive() {\n this.props.onAdd(this.props.searchResults.slice(0, 5));\n }\n\n //add top 10 tracks to the playlist\n addTopTen() {\n this.props.onAdd(this.props.searchResults.slice(0, 10));\n }\n\n addAll() {\n this.props.onAdd(this.props.searchResults);\n }\n render() {\n return (\n <div className=\"SearchResults\">\n <h2>Results</h2>\n <TrackList tracks={this.props.searchResults} onAdd={this.props.onAdd} onToggle={this.props.onToggle} currentTrack={this.props.currentTrack}/>\n </div>\n );\n }\n}\n\nexport default SearchResults;",
19
  "simple_styles.css": "/* Example of CSS styles for a web page */\n\nbody {\n font-family: Arial, sans-serif;\n background-color: #f4f4f4;\n margin: 0;\n padding: 0;\n}\n\nh1 {\n color: #333;\n text-align: center;\n}\n\nbutton {\n padding: 10px 20px;\n font-size: 16px;\n background-color: #007bff;\n color: #fff;\n border: none;\n cursor: pointer;\n}\n\nbutton:hover {\n background-color: #0056b3;\n}",
20
  "media_queries.css": "/* Example of CSS styles with media queries for responsive design */\n\nbody {\n font-family: Arial, sans-serif;\n background-color: #f4f4f4;\n margin: 0;\n padding: 0;\n}\n\nh1 {\n color: #333;\n text-align: center;\n}\n\nbutton {\n padding: 10px 20px;\n font-size: 16px;\n background-color: #007bff;\n color: #fff;\n border: none;\n cursor: pointer;\n}\n\nbutton:hover {\n background-color: #0056b3;\n}\n\n/* Media query for smaller screens */\n@media (max-width: 768px) {\n button {\n padding: 8px 16px;\n font-size: 14px;\n }\n}",
21
  "single_syntax_error_example.py": "# This is a sample Python file\n\nprint('Hello, world!'\n\n",
 
26
  "multiple_syntax_errors.css": "body {\n font-family: Arial, sans-serif;\n background-color: #f4f4f4;\n margin: 0;\n padding: 0;\n}\n\nh1 {\n color: #333;\n text-align: center;\n}\n\nbutton {\n padding: 10px 20px;\n font-size: 16px;\n background-color: #007bff;\n color: #fff;\n border: none;\n cursor: pointer;\n :hover {\n background-color: #0056b3;\n}\n\n/* Media query for smaller screens */\n@media (max-width: 768px) {\n button {\n padding: 8px 16px;\n font-size: 14px;\n }\n}",
27
  "example.ts": "interface User {\n id: number;\n name: string;\n email: string;\n}\n\nclass UserManager {\n private users: User[] = [];\n\n addUser(user: User): void {\n this.users.push(user);\n }\n\n getUser(id: number): User | undefined {\n return this.users.find(user => user.id === id);\n }\n\n updateUser(id: number, updatedUser: Partial<User>): void {\n const userIndex = this.users.findIndex(user => user.id === id);\n if (userIndex !== -1) {\n this.users[userIndex] = { ...this.users[userIndex], ...updatedUser };\n }\n }\n\n deleteUser(id: number): void {\n this.users = this.users.filter(user => user.id !== id);\n }\n}\n\nconst userManager = new UserManager();\nuserManager.addUser({ id: 1, name: 'John Doe', email: '[email protected]' });\nconsole.log(userManager.getUser(1));",
28
  "example.rb": "class User\n attr_accessor :id, :name, :email\n\n def initialize(id, name, email)\n @id = id\n @name = name\n @email = email\n end\n\n def to_s\n \"User: #{@name} (#{@email})\"\n end\nend\n\nclass UserManager\n def initialize\n @users = []\n end\n\n def add_user(user)\n @users << user\n end\n\n def get_user(id)\n @users.find { |user| user.id == id }\n end\n\n def update_user(id, updated_user)\n user = get_user(id)\n user.name = updated_user.name if updated_user.name\n user.email = updated_user.email if updated_user.email\n end\n\n def delete_user(id)\n @users.delete_if { |user| user.id == id }\n end\nend\n\nuser_manager = UserManager.new\nuser_manager.add_user(User.new(1, 'John Doe', '[email protected]'))\nputs user_manager.get_user(1)",
29
+ "example.php": "<?php\n\nclass User {\n public $id;\n public $name;\n public $email;\n\n public function __construct($id, $name, $email) {\n $this->id = $id;\n $this->name = $name;\n $this->email = $email;\n }\n}\n\nclass UserManager {\n private $users = [];\n\n public function addUser($user) {\n $this->users[] = $user;\n }\n\n public function getUser($id) {\n foreach ($this->users as $user) {\n if ($user->id === $id) {\n return $user;\n }\n }\n return null;\n }\n\n public function updateUser($id, $updatedUser) {\n foreach ($this->users as &$user) {\n if ($user->id === $id) {\n $user->name = $updatedUser->name ?? $user->name;\n $user->email = $updatedUser->email ?? $user->email;\n break;\n }\n }\n }\n\n public function deleteUser($id) {\n $this->users = array_filter($this->users, function($user) use ($id) {\n return $user->id !== $id;\n });\n }\n}\n\n$userManager = new UserManager();\n$userManager->addUser(new User(1, 'John Doe', '[email protected]'));\nvar_dump($userManager->getUser(1));\n?>",
30
+ "simple.go": "package main\n\nimport \"fmt\"\n\nfunc main() {\n fmt.Println(\"Hello, Go!\")\n \n // Simple variable declaration\n message := \"Welcome to Go programming\"\n fmt.Println(message)\n \n // Simple conditionals\n x := 10\n if x > 5 {\n fmt.Println(\"x is greater than 5\")\n } else {\n fmt.Println(\"x is not greater than 5\")\n }\n}",
31
+ "structs.go": "package main\n\nimport \"fmt\"\n\n// Person represents information about a person\ntype Person struct {\n Name string\n Age int\n Address string\n}\n\n// Employee extends Person with job-related fields\ntype Employee struct {\n Person\n Title string\n Salary float64\n EmployeeID int\n}\n\nfunc main() {\n // Create a new person\n person := Person{\n Name: \"John Doe\",\n Age: 30,\n Address: \"123 Main St\",\n }\n \n // Create a new employee\n employee := Employee{\n Person: Person{\n Name: \"Jane Smith\",\n Age: 28,\n Address: \"456 Oak Ave\",\n },\n Title: \"Software Engineer\",\n Salary: 85000.0,\n EmployeeID: 12345,\n }\n \n fmt.Printf(\"Person: %+v\\n\", person)\n fmt.Printf(\"Employee: %+v\\n\", employee)\n}",
32
+ "interfaces.go": "package main\n\nimport (\n \"fmt\"\n \"math\"\n)\n\n// Shape interface defines methods for calculating area and perimeter\ntype Shape interface {\n Area() float64\n Perimeter() float64\n}\n\n// Circle implements the Shape interface\ntype Circle struct {\n Radius float64\n}\n\nfunc (c Circle) Area() float64 {\n return math.Pi * c.Radius * c.Radius\n}\n\nfunc (c Circle) Perimeter() float64 {\n return 2 * math.Pi * c.Radius\n}\n\n// Rectangle implements the Shape interface\ntype Rectangle struct {\n Width, Height float64\n}\n\nfunc (r Rectangle) Area() float64 {\n return r.Width * r.Height\n}\n\nfunc (r Rectangle) Perimeter() float64 {\n return 2 * (r.Width + r.Height)\n}\n\n// PrintShapeInfo prints information about any shape\nfunc PrintShapeInfo(s Shape) {\n fmt.Printf(\"Area: %.2f\\n\", s.Area())\n fmt.Printf(\"Perimeter: %.2f\\n\", s.Perimeter())\n}\n\nfunc main() {\n circle := Circle{Radius: 5.0}\n rectangle := Rectangle{Width: 4.0, Height: 6.0}\n \n fmt.Println(\"Circle:\")\n PrintShapeInfo(circle)\n \n fmt.Println(\"\\nRectangle:\")\n PrintShapeInfo(rectangle)\n}",
33
+ "goroutines.go": "package main\n\nimport (\n \"fmt\"\n \"sync\"\n \"time\"\n)\n\n// Simple goroutine example\nfunc worker(id int, wg *sync.WaitGroup) {\n defer wg.Done()\n \n fmt.Printf(\"Worker %d starting\\n\", id)\n time.Sleep(time.Second)\n fmt.Printf(\"Worker %d done\\n\", id)\n}\n\n// Goroutine with channel communication\nfunc sender(ch chan<- int, count int) {\n for i := 0; i < count; i++ {\n ch <- i\n fmt.Printf(\"Sent: %d\\n\", i)\n time.Sleep(time.Millisecond * 100)\n }\n close(ch)\n}\n\nfunc receiver(ch <-chan int, done chan<- bool) {\n for num := range ch {\n fmt.Printf(\"Received: %d\\n\", num)\n }\n done <- true\n}\n\nfunc main() {\n // Using wait groups\n var wg sync.WaitGroup\n \n for i := 1; i <= 3; i++ {\n wg.Add(1)\n go worker(i, &wg)\n }\n \n // Wait for all goroutines to complete\n wg.Wait()\n \n // Using channels\n numbers := make(chan int, 5)\n done := make(chan bool)\n \n go sender(numbers, 10)\n go receiver(numbers, done)\n \n // Wait for receiver to process all numbers\n <-done\n \n fmt.Println(\"All operations completed\")\n}"
34
  }
test_code_chunker.py CHANGED
@@ -278,5 +278,57 @@ class TestCodeChunkerPHP(unittest.TestCase):
278
  self.assertIn(php_code, final_code)
279
  self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
280
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
281
  if __name__ == '__main__':
282
  unittest.main()
 
278
  self.assertIn(php_code, final_code)
279
  self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
280
 
281
+ # Golang Test Class
282
+ class TestCodeChunkerGolang(unittest.TestCase):
283
+
284
+ def setUp(self):
285
+ self.patcher = patch('utils.count_tokens', side_effect=mock_count_tokens)
286
+ self.mock_count_tokens = self.patcher.start()
287
+ self.code_chunker = CodeChunker(file_extension='go')
288
+ self.mock_codebase = load_json('mock_codefiles.json')
289
+
290
+ def tearDown(self):
291
+ self.patcher.stop()
292
+
293
+ def test_chunk_golang_simple_code(self):
294
+ go_code = self.mock_codebase['simple.go']
295
+ chunks = self.code_chunker.chunk(go_code, token_limit=20)
296
+ Chunker.print_chunks(chunks)
297
+ final_code = Chunker.consolidate_chunks_into_file(chunks)
298
+ num_lines = Chunker.count_lines(final_code)
299
+ self.assertEqual(num_lines, len(go_code.split("\n")))
300
+ self.assertIn(go_code, final_code)
301
+ self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
302
+
303
+ def test_chunk_golang_with_structs(self):
304
+ go_code = self.mock_codebase['structs.go']
305
+ chunks = self.code_chunker.chunk(go_code, token_limit=20)
306
+ Chunker.print_chunks(chunks)
307
+ final_code = Chunker.consolidate_chunks_into_file(chunks)
308
+ num_lines = Chunker.count_lines(final_code)
309
+ self.assertEqual(num_lines, len(go_code.split("\n")))
310
+ self.assertIn(go_code, final_code)
311
+ self.assertGreater(len(chunks), 1)
312
+
313
+ def test_chunk_golang_with_interfaces(self):
314
+ go_code = self.mock_codebase['interfaces.go']
315
+ chunks = self.code_chunker.chunk(go_code, token_limit=20)
316
+ Chunker.print_chunks(chunks)
317
+ final_code = Chunker.consolidate_chunks_into_file(chunks)
318
+ num_lines = Chunker.count_lines(final_code)
319
+ self.assertEqual(num_lines, len(go_code.split("\n")))
320
+ self.assertIn(go_code, final_code)
321
+ self.assertGreater(len(chunks), 1)
322
+
323
+ def test_chunk_golang_with_goroutines(self):
324
+ go_code = self.mock_codebase['goroutines.go']
325
+ chunks = self.code_chunker.chunk(go_code, token_limit=20)
326
+ Chunker.print_chunks(chunks)
327
+ final_code = Chunker.consolidate_chunks_into_file(chunks)
328
+ num_lines = Chunker.count_lines(final_code)
329
+ self.assertEqual(num_lines, len(go_code.split("\n")))
330
+ self.assertIn(go_code, final_code)
331
+ self.assertGreater(len(chunks), 1)
332
+
333
  if __name__ == '__main__':
334
  unittest.main()
tests/__init__.py ADDED
@@ -0,0 +1 @@
 
 
1
+ # This file makes the tests directory a Python package
tests/test_base.py ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from unittest.mock import patch
3
+ import tiktoken
4
+ import sys
5
+ import os
6
+
7
+ # Add parent directory to path to allow imports
8
+ sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
9
+
10
+ from Chunker import Chunker, CodeChunker
11
+ from utils import load_json
12
+
13
+ # Mocking the count_tokens function as it's external and not the focus of these tests
14
+ def mock_count_tokens(string: str, encoding_name='gpt-4') -> int:
15
+ """Returns the number of tokens in a text string."""
16
+ encoding = tiktoken.encoding_for_model(encoding_name)
17
+ num_tokens = len(encoding.encode(string))
18
+ return num_tokens
19
+
20
+ class BaseChunkerTest(unittest.TestCase):
21
+ """Base class for all code chunker tests with common setup and utilities."""
22
+
23
+ def setUp(self):
24
+ self.patcher = patch('utils.count_tokens', side_effect=mock_count_tokens)
25
+ self.mock_count_tokens = self.patcher.start()
26
+ self.mock_codebase = load_json('mock_codefiles.json')
27
+
28
+ def tearDown(self):
29
+ self.patcher.stop()
30
+
31
+ def run_chunker_test(self, code, token_limit=20):
32
+ """Helper method to run standard chunker tests."""
33
+ chunks = self.code_chunker.chunk(code, token_limit=token_limit)
34
+ Chunker.print_chunks(chunks)
35
+ final_code = Chunker.consolidate_chunks_into_file(chunks)
36
+ num_lines = Chunker.count_lines(final_code)
37
+
38
+ # Common assertions
39
+ self.assertEqual(num_lines, len(code.split("\n")))
40
+ self.assertIn(code, final_code)
41
+
42
+ return chunks, final_code
tests/test_css.py ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerCSS(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='css')
9
+
10
+ def test_chunk_css_with_media_query(self):
11
+ css_code = self.mock_codebase['media_queries.css']
12
+ self.run_chunker_test(css_code)
13
+
14
+ def test_chunk_css_with_simple_css(self):
15
+ css_code = self.mock_codebase['simple_styles.css']
16
+ self.run_chunker_test(css_code)
17
+
18
+ if __name__ == '__main__':
19
+ unittest.main()
tests/test_golang.py ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerGolang(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='go')
9
+
10
+ def test_chunk_golang_simple_code(self):
11
+ go_code = self.mock_codebase['simple.go']
12
+ chunks, _ = self.run_chunker_test(go_code)
13
+ self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
14
+
15
+ def test_chunk_golang_with_structs(self):
16
+ go_code = self.mock_codebase['structs.go']
17
+ chunks, _ = self.run_chunker_test(go_code)
18
+ self.assertGreater(len(chunks), 1)
19
+
20
+ def test_chunk_golang_with_interfaces(self):
21
+ go_code = self.mock_codebase['interfaces.go']
22
+ chunks, _ = self.run_chunker_test(go_code)
23
+ self.assertGreater(len(chunks), 1)
24
+
25
+ def test_chunk_golang_with_goroutines(self):
26
+ go_code = self.mock_codebase['goroutines.go']
27
+ chunks, _ = self.run_chunker_test(go_code)
28
+ self.assertGreater(len(chunks), 1)
29
+
30
+ if __name__ == '__main__':
31
+ unittest.main()
tests/test_javascript.py ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerJavaScript(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='js')
9
+
10
+ def test_chunk_javascript_simple_code(self):
11
+ js_code = self.mock_codebase['simple.js']
12
+ self.run_chunker_test(js_code)
13
+
14
+ def test_chunk_javascript_with_routes(self):
15
+ js_code = self.mock_codebase['routes.js']
16
+ self.run_chunker_test(js_code)
17
+
18
+ def test_chunk_javascript_with_models(self):
19
+ js_code = self.mock_codebase['models.js']
20
+ self.run_chunker_test(js_code)
21
+
22
+ def test_chunk_javascript_with_main(self):
23
+ js_code = self.mock_codebase['main.js']
24
+ self.run_chunker_test(js_code)
25
+
26
+ def test_chunk_javascript_with_utilities(self):
27
+ js_code = self.mock_codebase['utilities.js']
28
+ self.run_chunker_test(js_code)
29
+
30
+ def test_chunk_javascript_with_big_class(self):
31
+ js_code = self.mock_codebase['big_class.js']
32
+ self.run_chunker_test(js_code)
33
+
34
+ def test_chunk_javascript_with_react_component(self):
35
+ js_code = self.mock_codebase['react_component.js']
36
+ self.run_chunker_test(js_code)
37
+
38
+ if __name__ == '__main__':
39
+ unittest.main()
tests/test_php.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerPHP(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='php')
9
+
10
+ def test_chunk_php_code(self):
11
+ php_code = self.mock_codebase['example.php']
12
+ chunks, _ = self.run_chunker_test(php_code)
13
+ self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
14
+
15
+ if __name__ == '__main__':
16
+ unittest.main()
tests/test_python.py ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest, mock_count_tokens
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerPython(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='py')
9
+
10
+ def test_chunk_simple_code(self):
11
+ py_code = self.mock_codebase['simple.py']
12
+ first_chunk_token_limit = mock_count_tokens("import sys")
13
+ print(f"first_chunk_token_limit = {first_chunk_token_limit}")
14
+ chunks = self.code_chunker.chunk(py_code, token_limit=25)
15
+ token_count = self.mock_count_tokens(py_code)
16
+ print(f"token_count = {token_count}")
17
+ print(f"original code:\n {py_code}")
18
+
19
+ chunks, full_code = self.run_chunker_test(py_code, token_limit=25)
20
+
21
+ self.assertEqual(len(chunks), 2) # There should be 2 chunks
22
+ self.assertIn("import sys", chunks[1]) # The first chunk should contain the import statement
23
+ self.assertIn("print('Hello, world!')", chunks[2]) # The second chunk should contain the print statement
24
+
25
+ def test_chunk_code_text_only(self):
26
+ py_code = self.mock_codebase['text_only.py']
27
+ chunks, final_code = self.run_chunker_test(py_code)
28
+
29
+ self.assertEqual(len(chunks), 1)
30
+ self.assertIn("This file is empty and should test the chunker's ability to handle empty files", chunks[1])
31
+
32
+ def test_chunk_code_with_routes(self):
33
+ py_code = self.mock_codebase['routes.py']
34
+ self.run_chunker_test(py_code)
35
+
36
+ def test_chunk_code_with_models(self):
37
+ py_code = self.mock_codebase['models.py']
38
+ self.run_chunker_test(py_code)
39
+
40
+ def test_chunk_code_with_main(self):
41
+ py_code = self.mock_codebase['main.py']
42
+ self.run_chunker_test(py_code)
43
+
44
+ def test_chunk_code_with_utilities(self):
45
+ py_code = self.mock_codebase['utilities.py']
46
+ self.run_chunker_test(py_code)
47
+
48
+ def test_chunk_code_with_big_class(self):
49
+ py_code = self.mock_codebase['big_class.py']
50
+ self.run_chunker_test(py_code)
51
+
52
+ if __name__ == '__main__':
53
+ unittest.main()
tests/test_ruby.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerRuby(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='rb')
9
+
10
+ def test_chunk_ruby_code(self):
11
+ rb_code = self.mock_codebase['example.rb']
12
+ chunks, _ = self.run_chunker_test(rb_code)
13
+ self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
14
+
15
+ if __name__ == '__main__':
16
+ unittest.main()
tests/test_typescript.py ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import unittest
2
+ from test_base import BaseChunkerTest
3
+ from Chunker import CodeChunker
4
+
5
+ class TestCodeChunkerTypeScript(BaseChunkerTest):
6
+ def setUp(self):
7
+ super().setUp()
8
+ self.code_chunker = CodeChunker(file_extension='ts')
9
+
10
+ def test_chunk_typescript_code(self):
11
+ ts_code = self.mock_codebase['example.ts']
12
+ chunks, _ = self.run_chunker_test(ts_code)
13
+ self.assertGreater(len(chunks), 1) # Ensure the code is actually chunked
14
+
15
+ if __name__ == '__main__':
16
+ unittest.main()