]>
Commit | Line | Data |
---|---|---|
1 | /* Name: usbdrvasm18.inc | |
2 | * Project: V-USB, virtual USB port for Atmel's(r) AVR(r) microcontrollers | |
3 | * Author: Lukas Schrittwieser (based on 20 MHz usbdrvasm20.inc by Jeroen Benschop) | |
4 | * Creation Date: 2009-01-20 | |
5 | * Tabsize: 4 | |
6 | * Copyright: (c) 2008 by Lukas Schrittwieser and OBJECTIVE DEVELOPMENT Software GmbH | |
7 | * License: GNU GPL v2 (see License.txt), GNU GPL v3 or proprietary (CommercialLicense.txt) | |
8 | * Revision: $Id: usbdrvasm18-crc.inc 740 2009-04-13 18:23:31Z cs $ | |
9 | */ | |
10 | ||
11 | /* Do not link this file! Link usbdrvasm.S instead, which includes the | |
12 | * appropriate implementation! | |
13 | */ | |
14 | ||
15 | /* | |
16 | General Description: | |
17 | This file is the 18 MHz version of the assembler part of the USB driver. It | |
18 | requires an 18 MHz crystal (not a ceramic resonator and not a calibrated RC | |
19 | oscillator). | |
20 | ||
21 | See usbdrv.h for a description of the entire driver. | |
22 | ||
23 | Since almost all of this code is timing critical, don't change unless you | |
24 | really know what you are doing! Many parts require not only a maximum number | |
25 | of CPU cycles, but even an exact number of cycles! | |
26 | */ | |
27 | ||
28 | ||
29 | ;max stack usage: [ret(2), YL, SREG, YH, [sofError], bitcnt(x5), shift, x1, x2, x3, x4, cnt, ZL, ZH] = 14 bytes | |
30 | ;nominal frequency: 18 MHz -> 12 cycles per bit | |
31 | ; Numbers in brackets are clocks counted from center of last sync bit | |
32 | ; when instruction starts | |
33 | ;register use in receive loop to receive the data bytes: | |
34 | ; shift assembles the byte currently being received | |
35 | ; x1 holds the D+ and D- line state | |
36 | ; x2 holds the previous line state | |
37 | ; cnt holds the number of bytes left in the receive buffer | |
38 | ; x3 holds the higher crc byte (see algorithm below) | |
39 | ; x4 is used as temporary register for the crc algorithm | |
40 | ; x5 is used for unstuffing: when unstuffing, the last received bit is inverted in shift (to prevent further | |
41 | ; unstuffing calls). At the same time the corresponding bit in x5 is cleared to mark the bit as being inverted | |
42 | ; zl lower crc value and crc table index | |
43 | ; zh used for crc table accesses | |
44 | ||
45 | ;-------------------------------------------------------------------------------------------------------------- | |
46 | ; CRC mods: | |
47 | ; table driven crc checker, Z points to table in prog space | |
48 | ; ZL is the lower crc byte, x3 is the higher crc byte | |
49 | ; x4 is used as temp register to store different results | |
50 | ; the initialization of the crc register is not 0xFFFF but 0xFE54. This is because during the receipt of the | |
51 | ; first data byte a virtual zero data byte is added to the crc register, this results in the correct initial | |
52 | ; value of 0xFFFF at beginning of the second data byte before the first data byte is added to the crc. | |
53 | ; The magic number 0xFE54 results from the crc table: At tabH[0x54] = 0xFF = crcH (required) and | |
54 | ; tabL[0x54] = 0x01 -> crcL = 0x01 xor 0xFE = 0xFF | |
55 | ; bitcnt is renamed to x5 and is used for unstuffing purposes, the unstuffing works like in the 12MHz version | |
56 | ;-------------------------------------------------------------------------------------------------------------- | |
57 | ; CRC algorithm: | |
58 | ; The crc register is formed by x3 (higher byte) and ZL (lower byte). The algorithm uses a 'reversed' form | |
59 | ; i.e. that it takes the least significant bit first and shifts to the right. So in fact the highest order | |
60 | ; bit seen from the polynomial division point of view is the lsb of ZL. (If this sounds strange to you I | |
61 | ; propose a research on CRC :-) ) | |
62 | ; Each data byte received is xored to ZL, the lower crc byte. This byte now builds the crc | |
63 | ; table index. Next the new high byte is loaded from the table and stored in x4 until we have space in x3 | |
64 | ; (its destination). | |
65 | ; Afterwards the lower table is loaded from the table and stored in ZL (the old index is overwritten as | |
66 | ; we don't need it anymore. In fact this is a right shift by 8 bits.) Now the old crc high value is xored | |
67 | ; to ZL, this is the second shift of the old crc value. Now x4 (the temp reg) is moved to x3 and the crc | |
68 | ; calculation is done. | |
69 | ; Prior to the first byte the two CRC registers have to be initialized to 0xFFFF (as defined in usb spec) | |
70 | ; however the crc engine also runs during the receipt of the first byte, therefore x3 and zl are initialized | |
71 | ; to a magic number which results in a crc value of 0xFFFF after the first complete byte. | |
72 | ; | |
73 | ; This algorithm is split into the extra cycles of the different bits: | |
74 | ; bit7: XOR the received byte to ZL | |
75 | ; bit5: load the new high byte to x4 | |
76 | ; bit6: load the lower xor byte from the table, xor zl and x3, store result in zl (=the new crc low value) | |
77 | ; move x4 (the new high byte) to x3, the crc value is ready | |
78 | ; | |
79 | ||
80 | ||
81 | macro POP_STANDARD ; 18 cycles (9 pops): restores ZH, ZL, cnt, x5, x3, x2, x1, shift, x4 -- the reverse of the receiver's push order | |
82 | pop ZH | |
83 | pop ZL | |
84 | pop cnt | |
85 | pop x5 | |
86 | pop x3 | |
87 | pop x2 | |
88 | pop x1 | |
89 | pop shift | |
90 | pop x4 | |
91 | endm | |
92 | macro POP_RETI ; 7 cycles: restores YH, then SREG (popped into YL and written out), then YL itself | |
93 | pop YH | |
94 | pop YL | |
95 | out SREG, YL | |
96 | pop YL | |
97 | endm | |
98 | ||
99 | macro CRC_CLEANUP_AND_CHECK | |
100 | ; the last byte has already been xored with the lower crc byte, we still have to do the table lookup and xor | |
101 | ; x3 is the higher crc byte, zl the lower one; x2 and ZH are overwritten; a mismatch branches to ignorePacket | |
102 | ldi ZH, hi8(usbCrcTableHigh);[+1] get the new high byte from the table | |
103 | lpm x2, Z ;[+2][+3][+4] | |
104 | ldi ZH, hi8(usbCrcTableLow);[+5] get the new low xor byte from the table | |
105 | lpm ZL, Z ;[+6][+7][+8] | |
106 | eor ZL, x3 ;[+9] xor the old high byte with the value from the table, x2:ZL now holds the crc value | |
107 | cpi ZL, 0x01 ;[+10] if the crc is ok we have a fixed remainder value of 0xb001 in x2:ZL (see usb spec) | |
108 | brne ignorePacket ;[+11] detected a crc fault -> packet is ignored and retransmitted by the host | |
109 | cpi x2, 0xb0 ;[+12] | |
110 | brne ignorePacket ;[+13] detected a crc fault -> packet is ignored and retransmitted by the host | |
111 | endm | |
112 | ||
113 | ||
114 | USB_INTR_VECTOR: | |
115 | ;receiver entry point. Order of registers pushed: YL, SREG, YH, [sofError], x4, shift, x1, x2, x3, x5, cnt, ZL, ZH | |
116 | push YL ;[-28] push only what is necessary to sync with edge ASAP | |
117 | in YL, SREG ;[-26] SREG is saved through YL | |
118 | push YL ;[-25] | |
119 | push YH ;[-23] | |
120 | ;---------------------------------------------------------------------------- | |
121 | ; Synchronize with sync pattern: | |
122 | ;---------------------------------------------------------------------------- | |
123 | ;sync byte (D-) pattern LSb to MSb: 01010100 [1 = idle = J, 0 = K] | |
124 | ;sync up with J to K edge during sync pattern -- use fastest possible loops | |
125 | ;The first part waits at most 1 bit long since we must be in sync pattern. | |
126 | ;YL is guaranteed to be < 0x80 because I flag is clear. When we jump to | |
127 | ;waitForJ, ensure that this prerequisite is met. | |
128 | waitForJ: | |
129 | inc YL | |
130 | sbis USBIN, USBMINUS | |
131 | brne waitForJ ; loop while D- is low; inc YL wrapping to zero ends the loop, so we have ANY timeout | |
132 | waitForK: | |
133 | ;The following code results in a sampling window of < 1/4 bit which meets the spec. | |
134 | sbis USBIN, USBMINUS ;[-17] | |
135 | rjmp foundK ;[-16] | |
136 | sbis USBIN, USBMINUS | |
137 | rjmp foundK | |
138 | sbis USBIN, USBMINUS | |
139 | rjmp foundK | |
140 | sbis USBIN, USBMINUS | |
141 | rjmp foundK | |
142 | sbis USBIN, USBMINUS | |
143 | rjmp foundK | |
144 | sbis USBIN, USBMINUS | |
145 | rjmp foundK | |
146 | sbis USBIN, USBMINUS | |
147 | rjmp foundK | |
148 | sbis USBIN, USBMINUS | |
149 | rjmp foundK | |
150 | sbis USBIN, USBMINUS | |
151 | rjmp foundK | |
152 | #if USB_COUNT_SOF | |
153 | lds YL, usbSofCount | |
154 | inc YL | |
155 | sts usbSofCount, YL | |
156 | #endif /* USB_COUNT_SOF */ | |
157 | #ifdef USB_SOF_HOOK | |
158 | USB_SOF_HOOK | |
159 | #endif | |
160 | rjmp sofError | |
161 | foundK: ;[-15] | |
162 | ;{3, 5} after falling D- edge, average delay: 4 cycles | |
163 | ;bit0 should be at 30 (2.5 bits) for center sampling. Currently at 4 so 26 cycles till bit 0 sample | |
164 | ;use 1 bit time for setup purposes, then sample again. Numbers in brackets | |
165 | ;are cycles from center of first sync (double K) bit after the instruction | |
166 | push x4 ;[-14] | |
167 | ; [---] ;[-13] | |
168 | lds YL, usbInputBufOffset;[-12] used to toggle the two usb receive buffers | |
169 | ; [---] ;[-11] | |
170 | clr YH ;[-10] | |
171 | subi YL, lo8(-(usbRxBuf));[-9] [rx loop init] Y = usbRxBuf + usbInputBufOffset (add by subtracting the negated address) | |
172 | sbci YH, hi8(-(usbRxBuf));[-8] [rx loop init] high byte of the same 16 bit addition | |
173 | push shift ;[-7] | |
174 | ; [---] ;[-6] | |
175 | ldi shift, 0x80 ;[-5] the set msb is the end of byte marker for the pid receiver loop | |
176 | clc ;[-4] the carry has to be clear for receipt of pid bit 0 | |
177 | sbis USBIN, USBMINUS ;[-3] we want two bits K (sample 3 cycles too early) | |
178 | rjmp haveTwoBitsK ;[-2] | |
179 | pop shift ;[-1] undo the push from before | |
180 | pop x4 ;[1] | |
181 | rjmp waitForK ;[3] this was not the end of sync, retry | |
182 | ; The entire loop from waitForK until rjmp waitForK above must not exceed two | |
183 | ; bit times (= 24 cycles). | |
184 | ||
185 | ;---------------------------------------------------------------------------- | |
186 | ; push more registers and initialize values while we sample the first bits: | |
187 | ;---------------------------------------------------------------------------- | |
188 | haveTwoBitsK: | |
189 | push x1 ;[0] | |
190 | push x2 ;[2] | |
191 | push x3 ;[4] x3 will hold the crc high byte | |
192 | ldi x2, 1<<USBPLUS ;[6] [rx loop init] current line state is K state. D+=="1", D-=="0" | |
193 | push x5 ;[7] | |
194 | push cnt ;[9] | |
195 | ldi cnt, USB_BUFSIZE ;[11] [rx loop init] cnt counts the bytes left in the receive buffer | |
196 | ||
197 | ||
198 | ;-------------------------------------------------------------------------------------------------------------- | |
199 | ; receives the pid byte | |
200 | ; there is no real unstuffing algorithm implemented here as a stuffing bit is impossible in the pid byte. | |
201 | ; That's because the last four bits of the byte are the inverted of the first four bits. If we detect a | |
202 | ; unstuffing condition something went wrong and abort | |
203 | ; shift has to be initialized to 0x80 | |
204 | ;-------------------------------------------------------------------------------------------------------------- | |
205 | ||
206 | ; pid bit 0 - used for even more register saving (we need the z pointer) | |
207 | in x1, USBIN ;[0] sample line state | |
208 | andi x1, USBMASK ;[1] filter only D+ and D- bits | |
209 | eor x2, x1 ;[2] generate inverted of actual bit | |
210 | sbrc x2, USBMINUS ;[3] if the bit is set we received a zero | |
211 | sec ;[4] | |
212 | ror shift ;[5] we perform no unstuffing check here as this is the first bit | |
213 | mov x2, x1 ;[6] | |
214 | push ZL ;[7] | |
215 | ;[8] push needs two cycles | |
216 | push ZH ;[9] | |
217 | ;[10] push needs two cycles | |
218 | ldi x3, 0xFE ;[11] x3 is the high order crc value (high byte of the 0xFE54 start value) | |
219 | ||
220 | ||
221 | bitloopPid: | |
222 | in x1, USBIN ;[0] sample line state | |
223 | andi x1, USBMASK ;[1] filter only D+ and D- bits | |
224 | breq nse0 ;[2] both lines are low so handle se0 | |
225 | eor x2, x1 ;[3] generate inverted of actual bit | |
226 | sbrc x2, USBMINUS ;[4] set the carry if we received a zero | |
227 | sec ;[5] | |
228 | ror shift ;[6] | |
229 | ldi ZL, 0x54 ;[7] ZL is the low order crc value (low byte of the 0xFE54 start value) | |
230 | ser x4 ;[8] there is no bit stuffing check here as the pid bit can't be stuffed. if so | |
231 | ; some error occurred. In this case the packet is discarded later on anyway. | |
232 | mov x2, x1 ;[9] prepare for the next cycle | |
233 | brcc bitloopPid ;[10] while 0s drop out of shift we get the next bit | |
234 | eor x4, shift ;[11] invert all bits in shift and store result in x4 | |
235 | ||
236 | ;-------------------------------------------------------------------------------------------------------------- | |
237 | ; receives data bytes and calculates the crc | |
238 | ; the last USBIN state has to be in x2 | |
239 | ; this is only the first half, due to branch distance limitations the second half of the loop is near the end | |
240 | ; of this asm file | |
241 | ;-------------------------------------------------------------------------------------------------------------- | |
242 | ||
243 | rxDataStart: | |
244 | in x1, USBIN ;[0] sample line state (note: a se0 check is not useful due to bit dribbling) | |
245 | ser x5 ;[1] prepare the unstuff marker register (all bits set = no bit inverted yet) | |
246 | eor x2, x1 ;[2] generates the inverted of the actual bit | |
247 | bst x2, USBMINUS ;[3] copy the bit from x2 | |
248 | bld shift, 0 ;[4] and store it in shift | |
249 | mov x2, shift ;[5] make a copy of shift for unstuffing check | |
250 | andi x2, 0xF9 ;[6] keep the last six bits (bit 0 plus bits 3..7 still left from the previous byte); six zeros here are six ones in fact | |
251 | breq unstuff0 ;[7] then Z is set now and we branch to the unstuffing handler | |
252 | didunstuff0: | |
253 | subi cnt, 1 ;[8] cannot use dec because it doesn't affect the carry flag | |
254 | brcs nOverflow ;[9] Too many bytes received. Ignore packet | |
255 | st Y+, x4 ;[10] store the last received byte | |
256 | ;[11] st needs two cycles | |
257 | ||
258 | ; bit1 | |
259 | in x2, USBIN ;[0] sample line state | |
260 | andi x1, USBMASK ;[1] check for se0 during bit 0 | |
261 | breq nse0 ;[2] | |
262 | andi x2, USBMASK ;[3] check se0 during bit 1 | |
263 | breq nse0 ;[4] | |
264 | eor x1, x2 ;[5] | |
265 | bst x1, USBMINUS ;[6] | |
266 | bld shift, 1 ;[7] | |
267 | mov x1, shift ;[8] | |
268 | andi x1, 0xF3 ;[9] keep bits 0..1 and 4..7: the six most recently received bits | |
269 | breq unstuff1 ;[10] | |
270 | didunstuff1: | |
271 | nop ;[11] | |
272 | ||
273 | ; bit2 | |
274 | in x1, USBIN ;[0] sample line state | |
275 | andi x1, USBMASK ;[1] check for se0 (as there is nothing else to do here) | |
276 | breq nOverflow ;[2] se0 at this bit position goes to the overflow handler (nOverflow), not to se0 | |
277 | eor x2, x1 ;[3] generates the inverted of the actual bit | |
278 | bst x2, USBMINUS ;[4] | |
279 | bld shift, 2 ;[5] store the bit | |
280 | mov x2, shift ;[6] | |
281 | andi x2, 0xE7 ;[7] if we have six zeros here (which means six 1 in the stream) | |
282 | breq unstuff2 ;[8] the next bit is a stuffing bit | |
283 | didunstuff2: | |
284 | nop2 ;[9] | |
285 | ;[10] | |
286 | nop ;[11] | |
287 | ||
288 | ; bit3 | |
289 | in x2, USBIN ;[0] sample line state | |
290 | andi x2, USBMASK ;[1] check for se0 | |
291 | breq nOverflow ;[2] se0 at this bit position goes to the overflow handler (nOverflow), not to se0 | |
292 | eor x1, x2 ;[3] | |
293 | bst x1, USBMINUS ;[4] | |
294 | bld shift, 3 ;[5] | |
295 | mov x1, shift ;[6] | |
296 | andi x1, 0xCF ;[7] keep bits 0..3 and 6..7: the six most recently received bits | |
297 | breq unstuff3 ;[8] | |
298 | didunstuff3: | |
299 | nop ;[9] | |
300 | rjmp rxDataBit4 ;[10] continue with the second half of the receiver loop | |
301 | ;[11] | |
302 | ||
303 | ; the avr branch instructions allow an offset of +63 instructions only, so we need this | |
304 | ; 'local copy' of se0 | |
305 | nse0: | |
306 | rjmp se0 ;[4] | |
307 | ;[5] | |
308 | ; the same as for se0 is needed for overflow and stuffErr: both labels forward to overflow | |
309 | nOverflow: | |
310 | stuffErr: | |
311 | rjmp overflow | |
312 | ||
313 | ||
314 | unstuff0: ;[8] this is the branch delay of breq unstuffX | |
315 | andi x1, USBMASK ;[9] do an se0 check here (if the last crc byte ends with 5 one's we might end up here | |
316 | breq didunstuff0 ;[10] even though the message is complete) -> jump back and store the byte | |
317 | ori shift, 0x01 ;[11] invert the last received bit to prevent further unstuffing | |
318 | in x2, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
319 | andi x5, 0xFE ;[1] mark this bit as inverted (will be corrected before storing shift) | |
320 | eor x1, x2 ;[2] x1 and x2 have to be different because the stuff bit is always a zero | |
321 | andi x1, USBMASK ;[3] mask the interesting bits | |
322 | breq stuffErr ;[4] if the stuff bit is a 1-bit something went wrong | |
323 | mov x1, x2 ;[5] the next bit expects the last state to be in x1 | |
324 | rjmp didunstuff0 ;[6] | |
325 | ;[7] jump delay of rjmp didunstuffX | |
326 | ||
327 | unstuff1: ;[11] this is the branch delay of breq unstuffX | |
328 | in x1, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
329 | ori shift, 0x02 ;[1] invert the last received bit to prevent further unstuffing | |
330 | andi x5, 0xFD ;[2] mark this bit as inverted (will be corrected before storing shift) | |
331 | eor x2, x1 ;[3] x1 and x2 have to be different because the stuff bit is always a zero | |
332 | andi x2, USBMASK ;[4] mask the interesting bits | |
333 | breq stuffErr ;[5] if the stuff bit is a 1-bit something went wrong | |
334 | mov x2, x1 ;[6] the next bit expects the last state to be in x2 | |
335 | nop2 ;[7] | |
336 | ;[8] | |
337 | rjmp didunstuff1 ;[9] | |
338 | ;[10] jump delay of rjmp didunstuffX | |
339 | ||
340 | unstuff2: ;[9] this is the branch delay of breq unstuffX | |
341 | ori shift, 0x04 ;[10] invert the last received bit to prevent further unstuffing | |
342 | andi x5, 0xFB ;[11] mark this bit as inverted (will be corrected before storing shift) | |
343 | in x2, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
344 | eor x1, x2 ;[1] x1 and x2 have to be different because the stuff bit is always a zero | |
345 | andi x1, USBMASK ;[2] mask the interesting bits | |
346 | breq stuffErr ;[3] if the stuff bit is a 1-bit something went wrong | |
347 | mov x1, x2 ;[4] the next bit expects the last state to be in x1 | |
348 | nop2 ;[5] | |
349 | ;[6] | |
350 | rjmp didunstuff2 ;[7] | |
351 | ;[8] jump delay of rjmp didunstuffX | |
352 | ||
353 | unstuff3: ;[9] this is the branch delay of breq unstuffX | |
354 | ori shift, 0x08 ;[10] invert the last received bit to prevent further unstuffing | |
355 | andi x5, 0xF7 ;[11] mark this bit as inverted (will be corrected before storing shift) | |
356 | in x1, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
357 | eor x2, x1 ;[1] x1 and x2 have to be different because the stuff bit is always a zero | |
358 | andi x2, USBMASK ;[2] mask the interesting bits | |
359 | breq stuffErr ;[3] if the stuff bit is a 1-bit something went wrong | |
360 | mov x2, x1 ;[4] the next bit expects the last state to be in x2 | |
361 | nop2 ;[5] | |
362 | ;[6] | |
363 | rjmp didunstuff3 ;[7] | |
364 | ;[8] jump delay of rjmp didunstuffX | |
365 | ||
366 | ||
367 | ||
368 | ; the include has to be here due to branch distance restrictions | |
369 | #define __USE_CRC__ | |
370 | #include "asmcommon.inc" | |
371 | ||
372 | ||
373 | ||
374 | ; USB spec says: | |
375 | ; idle = J | |
376 | ; J = (D+ = 0), (D- = 1) | |
377 | ; K = (D+ = 1), (D- = 0) | |
378 | ; Spec allows 7.5 bit times from EOP to SOP for replies | |
379 | ; 7.5 bit times is 90 cycles. ...there is plenty of time | |
380 | ||
381 | ||
382 | sendNakAndReti: | |
383 | ldi x3, USBPID_NAK ;[-18] PID to send goes into x3 | |
384 | rjmp sendX3AndReti ;[-17] | |
385 | sendAckAndReti: | |
386 | ldi cnt, USBPID_ACK ;[-17] | |
387 | sendCntAndReti: | |
388 | mov x3, cnt ;[-16] PID was passed in cnt, move it to x3 | |
389 | sendX3AndReti: | |
390 | ldi YL, 20 ;[-15] let Y point at x3 itself: x3==r20, address is 20 | |
391 | ldi YH, 0 ;[-14] | |
392 | ldi cnt, 2 ;[-13] two bytes: the sync byte plus the PID held in x3 | |
393 | ; no rjmp needed: execution falls through into usbSendAndReti | |
394 | ||
395 | ;usbSend: | |
396 | ;pointer to data in 'Y' | |
397 | ;number of bytes in 'cnt' -- including sync byte [range 2 ... 12] | |
398 | ;uses: x1...x4, bitcnt, shift, cnt, Y | |
399 | ;Numbers in brackets are time since first bit of sync pattern is sent | |
400 | ||
401 | usbSendAndReti: ; 12 cycles until SOP | |
402 | in x2, USBDDR ;[-12] | |
403 | ori x2, USBMASK ;[-11] | |
404 | sbi USBOUT, USBMINUS;[-10] prepare idle state; D+ and D- must have been 0 (no pullups) | |
405 | in x1, USBOUT ;[-8] port mirror for tx loop | |
406 | out USBDDR, x2 ;[-7] <- acquire bus | |
407 | ldi x2, 0 ;[-6] init x2 (bitstuff history) because sync starts with 0 | |
408 | ldi x4, USBMASK ;[-5] exor mask | |
409 | ldi shift, 0x80 ;[-4] sync byte is first byte sent | |
410 | txByteLoop: | |
411 | ldi bitcnt, 0x40 ;[-3]=[9] binary 01000000 | |
412 | txBitLoop: ; the loop sends the first 7 bits of the byte | |
413 | sbrs shift, 0 ;[-2]=[10] if we have to send a 1 don't change the line state | |
414 | eor x1, x4 ;[-1]=[11] | |
415 | out USBOUT, x1 ;[0] | |
416 | ror shift ;[1] | |
417 | ror x2 ;[2] transfers the last sent bit to the stuffing history | |
418 | didStuffN: | |
419 | nop ;[3] | |
420 | nop ;[4] | |
421 | cpi x2, 0xfc ;[5] if we sent six consecutive ones | |
422 | brcc bitstuffN ;[6] | |
423 | lsr bitcnt ;[7] | |
424 | brne txBitLoop ;[8] restart the loop while the 1 is still in the bitcount | |
425 | ||
426 | ; transmit bit 7 | |
427 | sbrs shift, 0 ;[9] | |
428 | eor x1, x4 ;[10] | |
429 | didStuff7: | |
430 | ror shift ;[11] | |
431 | out USBOUT, x1 ;[0] transfer bit 7 to the pins | |
432 | ror x2 ;[1] move the bit into the stuffing history | |
433 | cpi x2, 0xfc ;[2] | |
434 | brcc bitstuff7 ;[3] | |
435 | ld shift, y+ ;[4] get next byte to transmit (ld needs two cycles) | |
436 | dec cnt ;[6] decrement byte counter | |
437 | brne txByteLoop ;[7] if we have more bytes start next one | |
438 | ;[8] branch delay | |
439 | ||
440 | ;make SE0: | |
441 | cbr x1, USBMASK ;[8] prepare SE0 [spec says EOP may be 25 to 30 cycles] | |
442 | lds x2, usbNewDeviceAddr;[9] | |
443 | lsl x2 ;[11] we compare with left shifted address | |
444 | out USBOUT, x1 ;[0] <-- out SE0 -- from now 2 bits = 24 cycles until bus idle | |
445 | subi YL, 20 + 2 ;[1] Only assign address on data packets, not ACK/NAK in x3 | |
446 | sbci YH, 0 ;[2] | |
447 | ;2006-03-06: moved transfer of new address to usbDeviceAddr from C-Code to asm: | |
448 | ;set address only after data packet was sent, not after handshake | |
449 | breq skipAddrAssign ;[3] | |
450 | sts usbDeviceAddr, x2 ; if not skipped: SE0 is one cycle longer | |
451 | skipAddrAssign: | |
452 | ;end of usbDeviceAddress transfer | |
453 | ldi x2, 1<<USB_INTR_PENDING_BIT;[5] int0 occurred during TX -- clear pending flag | |
454 | USB_STORE_PENDING(x2) ;[6] | |
455 | ori x1, USBIDLE ;[7] | |
456 | in x2, USBDDR ;[8] | |
457 | cbr x2, USBMASK ;[9] set both pins to input | |
458 | mov x3, x1 ;[10] | |
459 | cbr x3, USBMASK ;[11] configure no pullup on both pins | |
460 | ldi x4, 4 ;[12] | |
461 | se0Delay: | |
462 | dec x4 ;[13] [16] [19] [22] | |
463 | brne se0Delay ;[14] [17] [20] [23] | |
464 | out USBOUT, x1 ;[24] <-- out J (idle) -- end of SE0 (EOP signal) | |
465 | out USBDDR, x2 ;[25] <-- release bus now | |
466 | out USBOUT, x3 ;[26] <-- ensure no pull-up resistors are active | |
467 | rjmp doReturn | |
468 | ||
469 | bitstuffN: | |
470 | eor x1, x4 ;[8] generate a zero (toggle the line state) | |
471 | ldi x2, 0 ;[9] reset the bit stuffing history | |
472 | nop2 ;[10] [11] | |
473 | out USBOUT, x1 ;[0] <-- send the stuffing bit | |
474 | rjmp didStuffN ;[1] re-enter the bit loop after its out/ror, so the current data bit is not lost | |
475 | ||
476 | bitstuff7: | |
477 | eor x1, x4 ;[5] generate a zero (toggle the line state) | |
478 | ldi x2, 0 ;[6] reset bit stuffing history | |
479 | clc ;[7] fill a zero into the shift register | |
480 | rol shift ;[8] compensate for ror shift at branch destination | |
481 | rjmp didStuff7 ;[9] | |
482 | ;[10] jump delay | |
483 | ||
484 | ;-------------------------------------------------------------------------------------------------------------- | |
485 | ; receives data bytes and calculates the crc | |
486 | ; second half of the data byte receiver loop | |
487 | ; most parts of the crc algorithm are here | |
488 | ;-------------------------------------------------------------------------------------------------------------- | |
489 | ||
490 | nOverflow2: | |
491 | rjmp overflow | |
492 | ||
493 | rxDataBit4: | |
494 | in x1, USBIN ;[0] sample line state | |
495 | andi x1, USBMASK ;[1] check for se0 | |
496 | breq nOverflow2 ;[2] se0 at this bit position goes to the overflow handler via nOverflow2 | |
497 | eor x2, x1 ;[3] | |
498 | bst x2, USBMINUS ;[4] | |
499 | bld shift, 4 ;[5] | |
500 | mov x2, shift ;[6] | |
501 | andi x2, 0x9F ;[7] keep bits 0..4 and 7: the six most recently received bits | |
502 | breq unstuff4 ;[8] | |
503 | didunstuff4: | |
504 | nop2 ;[9][10] | |
505 | nop ;[11] | |
506 | ||
507 | ; bit5 | |
508 | in x2, USBIN ;[0] sample line state | |
509 | ldi ZH, hi8(usbCrcTableHigh);[1] use the table for the higher byte | |
510 | eor x1, x2 ;[2] | |
511 | bst x1, USBMINUS ;[3] | |
512 | bld shift, 5 ;[4] | |
513 | mov x1, shift ;[5] | |
514 | andi x1, 0x3F ;[6] keep bits 0..5: the six most recently received bits | |
515 | breq unstuff5 ;[7] | |
516 | didunstuff5: | |
517 | lpm x4, Z ;[8] load the higher crc xor-byte and store it for later use | |
518 | ;[9] lpm needs 3 cycles | |
519 | ;[10] | |
520 | ldi ZH, hi8(usbCrcTableLow);[11] load the lower crc xor byte address | |
521 | ||
522 | ; bit6 | |
523 | in x1, USBIN ;[0] sample line state | |
524 | eor x2, x1 ;[1] | |
525 | bst x2, USBMINUS ;[2] | |
526 | bld shift, 6 ;[3] | |
527 | mov x2, shift ;[4] | |
528 | andi x2, 0x7E ;[5] keep bits 1..6: the six most recently received bits | |
529 | breq unstuff6 ;[6] | |
530 | didunstuff6: | |
531 | lpm ZL, Z ;[7] load the lower xor crc byte | |
532 | ;[8] lpm needs 3 cycles | |
533 | ;[9] | |
534 | eor ZL, x3 ;[10] xor the old high crc byte with the low xor-byte | |
535 | mov x3, x4 ;[11] move the new high order crc value from temp to its destination | |
536 | ||
537 | ; bit7 | |
538 | in x2, USBIN ;[0] sample line state | |
539 | eor x1, x2 ;[1] | |
540 | bst x1, USBMINUS ;[2] | |
541 | bld shift, 7 ;[3] now shift holds the complete but inverted data byte | |
542 | mov x1, shift ;[4] | |
543 | andi x1, 0xFC ;[5] keep bits 2..7: the six most recently received bits | |
544 | breq unstuff7 ;[6] | |
545 | didunstuff7: | |
546 | eor x5, shift ;[7] x5 marks all bits which have not been inverted by the unstuffing subs | |
547 | mov x4, x5 ;[8] keep a copy of the data byte, it will be stored during next bit0 | |
548 | eor ZL, x4 ;[9] feed the actual byte into the crc algorithm | |
549 | rjmp rxDataStart ;[10] next byte | |
550 | ;[11] during the reception of the next byte this one will be fed into the crc algorithm | |
551 | ||
552 | unstuff4: ;[9] this is the branch delay of breq unstuffX | |
553 | ori shift, 0x10 ;[10] invert the last received bit to prevent further unstuffing | |
554 | andi x5, 0xEF ;[11] mark this bit as inverted (will be corrected before storing shift) | |
555 | in x2, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
556 | eor x1, x2 ;[1] x1 and x2 have to be different because the stuff bit is always a zero | |
557 | andi x1, USBMASK ;[2] mask the interesting bits | |
558 | breq stuffErr2 ;[3] if the stuff bit is a 1-bit something went wrong | |
559 | mov x1, x2 ;[4] the next bit expects the last state to be in x1 | |
560 | nop2 ;[5] | |
561 | ;[6] | |
562 | rjmp didunstuff4 ;[7] | |
563 | ;[8] jump delay of rjmp didunstuffX | |
564 | ||
565 | unstuff5: ;[8] this is the branch delay of breq unstuffX | |
566 | nop ;[9] | |
567 | ori shift, 0x20 ;[10] invert the last received bit to prevent further unstuffing | |
568 | andi x5, 0xDF ;[11] mark this bit as inverted (will be corrected before storing shift) | |
569 | in x1, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
570 | eor x2, x1 ;[1] x1 and x2 have to be different because the stuff bit is always a zero | |
571 | andi x2, USBMASK ;[2] mask the interesting bits | |
572 | breq stuffErr2 ;[3] if the stuff bit is a 1-bit something went wrong | |
573 | mov x2, x1 ;[4] the next bit expects the last state to be in x2 | |
574 | nop ;[5] | |
575 | rjmp didunstuff5 ;[6] | |
576 | ;[7] jump delay of rjmp didunstuffX | |
577 | ||
578 | unstuff6: ;[7] this is the branch delay of breq unstuffX | |
579 | nop2 ;[8] | |
580 | ;[9] | |
581 | ori shift, 0x40 ;[10] invert the last received bit to prevent further unstuffing | |
582 | andi x5, 0xBF ;[11] mark this bit as inverted (will be corrected before storing shift) | |
583 | in x2, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
584 | eor x1, x2 ;[1] x1 and x2 have to be different because the stuff bit is always a zero | |
585 | andi x1, USBMASK ;[2] mask the interesting bits | |
586 | breq stuffErr2 ;[3] if the stuff bit is a 1-bit something went wrong | |
587 | mov x1, x2 ;[4] the next bit expects the last state to be in x1 | |
588 | rjmp didunstuff6 ;[5] | |
589 | ;[6] jump delay of rjmp didunstuffX | |
590 | ||
591 | unstuff7: ;[7] this is the branch delay of breq unstuffX | |
592 | nop ;[8] | |
593 | nop ;[9] | |
594 | ori shift, 0x80 ;[10] invert the last received bit to prevent further unstuffing | |
595 | andi x5, 0x7F ;[11] mark this bit as inverted (will be corrected before storing shift) | |
596 | in x1, USBIN ;[0] we have some free cycles so we could check for bit stuffing errors | |
597 | eor x2, x1 ;[1] x1 and x2 have to be different because the stuff bit is always a zero | |
598 | andi x2, USBMASK ;[2] mask the interesting bits | |
599 | breq stuffErr2 ;[3] if the stuff bit is a 1-bit something went wrong | |
600 | mov x2, x1 ;[4] the next bit expects the last state to be in x2 | |
601 | rjmp didunstuff7 ;[5] | |
602 | ;[6] jump delay of rjmp didunstuff7 | |
603 | ||
604 | ; local copy of the stuffErr destination for the second half of the receiver loop (reachable by breq from unstuff4..7) | |
605 | stuffErr2: | |
606 | rjmp stuffErr | |
607 | ||
608 | ;-------------------------------------------------------------------------------------------------------------- | |
609 | ; The crc table follows. It has to be aligned to enable a fast loading of the needed bytes. | |
610 | ; There are two tables of 256 entries each, the low and the high byte table. | |
611 | ; Table values were generated with the following C code: | |
612 | /* | |
613 | #include <stdio.h> | |
614 | int main (int argc, char **argv) | |
615 | { | |
616 | int i, j; | |
617 | for (i=0; i<512; i++){ | |
618 | unsigned short crc = i & 0xff; | |
619 | for(j=0; j<8; j++) crc = (crc >> 1) ^ ((crc & 1) ? 0xa001 : 0); | |
620 | if((i & 7) == 0) printf("\n.byte "); | |
621 | printf("0x%02x, ", (i > 0xff ? (crc >> 8) : crc) & 0xff); | |
622 | if(i == 255) printf("\n"); | |
623 | } | |
624 | return 0; | |
625 | } | |
626 | ||
627 | // Use the following algorithm to compute CRC values: | |
628 | ushort computeCrc(uchar *msg, uchar msgLen) | |
629 | { | |
630 | uchar i; | |
631 | ushort crc = 0xffff; | |
632 | for(i = 0; i < msgLen; i++) | |
633 | crc = usbCrcTable16[lo8(crc) ^ msg[i]] ^ hi8(crc); | |
634 | return crc; | |
635 | } | |
636 | */ | |
637 | ||
638 | .balign 256 | |
639 | usbCrcTableLow: | |
640 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
641 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
642 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
643 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
644 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
645 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
646 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
647 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
648 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
649 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
650 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
651 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
652 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
653 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
654 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
655 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
656 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
657 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
658 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
659 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
660 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
661 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
662 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
663 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
664 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
665 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
666 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
667 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
668 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
669 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
670 | .byte 0x00, 0xC1, 0x81, 0x40, 0x01, 0xC0, 0x80, 0x41 | |
671 | .byte 0x01, 0xC0, 0x80, 0x41, 0x00, 0xC1, 0x81, 0x40 | |
672 | ||
673 | ; .balign 256 -- not needed: usbCrcTableLow above is exactly 256 bytes (32 rows of 8), so usbCrcTableHigh starts 256-byte aligned; both tables are indexed through ZL with ZH = hi8(table) | |
674 | usbCrcTableHigh: | |
675 | .byte 0x00, 0xC0, 0xC1, 0x01, 0xC3, 0x03, 0x02, 0xC2 | |
676 | .byte 0xC6, 0x06, 0x07, 0xC7, 0x05, 0xC5, 0xC4, 0x04 | |
677 | .byte 0xCC, 0x0C, 0x0D, 0xCD, 0x0F, 0xCF, 0xCE, 0x0E | |
678 | .byte 0x0A, 0xCA, 0xCB, 0x0B, 0xC9, 0x09, 0x08, 0xC8 | |
679 | .byte 0xD8, 0x18, 0x19, 0xD9, 0x1B, 0xDB, 0xDA, 0x1A | |
680 | .byte 0x1E, 0xDE, 0xDF, 0x1F, 0xDD, 0x1D, 0x1C, 0xDC | |
681 | .byte 0x14, 0xD4, 0xD5, 0x15, 0xD7, 0x17, 0x16, 0xD6 | |
682 | .byte 0xD2, 0x12, 0x13, 0xD3, 0x11, 0xD1, 0xD0, 0x10 | |
683 | .byte 0xF0, 0x30, 0x31, 0xF1, 0x33, 0xF3, 0xF2, 0x32 | |
684 | .byte 0x36, 0xF6, 0xF7, 0x37, 0xF5, 0x35, 0x34, 0xF4 | |
685 | .byte 0x3C, 0xFC, 0xFD, 0x3D, 0xFF, 0x3F, 0x3E, 0xFE | |
686 | .byte 0xFA, 0x3A, 0x3B, 0xFB, 0x39, 0xF9, 0xF8, 0x38 | |
687 | .byte 0x28, 0xE8, 0xE9, 0x29, 0xEB, 0x2B, 0x2A, 0xEA | |
688 | .byte 0xEE, 0x2E, 0x2F, 0xEF, 0x2D, 0xED, 0xEC, 0x2C | |
689 | .byte 0xE4, 0x24, 0x25, 0xE5, 0x27, 0xE7, 0xE6, 0x26 | |
690 | .byte 0x22, 0xE2, 0xE3, 0x23, 0xE1, 0x21, 0x20, 0xE0 | |
691 | .byte 0xA0, 0x60, 0x61, 0xA1, 0x63, 0xA3, 0xA2, 0x62 | |
692 | .byte 0x66, 0xA6, 0xA7, 0x67, 0xA5, 0x65, 0x64, 0xA4 | |
693 | .byte 0x6C, 0xAC, 0xAD, 0x6D, 0xAF, 0x6F, 0x6E, 0xAE | |
694 | .byte 0xAA, 0x6A, 0x6B, 0xAB, 0x69, 0xA9, 0xA8, 0x68 | |
695 | .byte 0x78, 0xB8, 0xB9, 0x79, 0xBB, 0x7B, 0x7A, 0xBA | |
696 | .byte 0xBE, 0x7E, 0x7F, 0xBF, 0x7D, 0xBD, 0xBC, 0x7C | |
697 | .byte 0xB4, 0x74, 0x75, 0xB5, 0x77, 0xB7, 0xB6, 0x76 | |
698 | .byte 0x72, 0xB2, 0xB3, 0x73, 0xB1, 0x71, 0x70, 0xB0 | |
699 | .byte 0x50, 0x90, 0x91, 0x51, 0x93, 0x53, 0x52, 0x92 | |
700 | .byte 0x96, 0x56, 0x57, 0x97, 0x55, 0x95, 0x94, 0x54 | |
701 | .byte 0x9C, 0x5C, 0x5D, 0x9D, 0x5F, 0x9F, 0x9E, 0x5E | |
702 | .byte 0x5A, 0x9A, 0x9B, 0x5B, 0x99, 0x59, 0x58, 0x98 | |
703 | .byte 0x88, 0x48, 0x49, 0x89, 0x4B, 0x8B, 0x8A, 0x4A | |
704 | .byte 0x4E, 0x8E, 0x8F, 0x4F, 0x8D, 0x4D, 0x4C, 0x8C | |
705 | .byte 0x44, 0x84, 0x85, 0x45, 0x87, 0x47, 0x46, 0x86 | |
706 | .byte 0x82, 0x42, 0x43, 0x83, 0x41, 0x81, 0x80, 0x40 | |
707 |