#include "dda.h" /** \file \brief Digital differential analyser - this is where we figure out which steppers need to move, and when they need to move */ #include #include #include #include #include "timer.h" #include "serial.h" #include "sermsg.h" #include "gcode_parse.h" #include "dda_queue.h" #include "debug.h" #include "sersendf.h" #include "pinio.h" #include "config.h" //#include "graycode.c" #ifdef DC_EXTRUDER #include "heater.h" #endif /// step timeout volatile uint8_t steptimeout = 0; /* position tracking */ /// \var startpoint /// \brief target position of last move in queue TARGET startpoint __attribute__ ((__section__ (".bss"))); /// \var current_position /// \brief actual position of extruder head /// \todo make current_position = real_position (from endstops) + offset from G28 and friends TARGET current_position __attribute__ ((__section__ (".bss"))); /// \var move_state /// \brief numbers for tracking the current state of movement MOVE_STATE move_state __attribute__ ((__section__ (".bss"))); /* utility functions */ // courtesy of http://www.flipcode.com/archives/Fast_Approximate_Distance_Functions.shtml /*! linear approximation 2d distance formula \param dx distance in X plane \param dy distance in Y plane \return 3-part linear approximation of \f$\sqrt{\Delta x^2 + \Delta y^2}\f$ see http://www.flipcode.com/archives/Fast_Approximate_Distance_Functions.shtml */ uint32_t approx_distance( uint32_t dx, uint32_t dy ) { uint32_t min, max, approx; if ( dx < dy ) { min = dx; max = dy; } else { min = dy; max = dx; } approx = ( max * 1007 ) + ( min * 441 ); if ( max < ( min << 4 )) approx -= ( max * 40 ); // add 512 for proper rounding return (( approx + 512 ) >> 10 ); } // courtesy of http://www.oroboro.com/rafael/docserv.php/index/programming/article/distance /*! linear approximation 3d distance formula \param dx distance in X plane \param dy distance in Y plane \param dz distance in Z plane \return 3-part linear approximation of \f$\sqrt{\Delta x^2 + \Delta y^2 + \Delta z^2}\f$ see http://www.oroboro.com/rafael/docserv.php/index/programming/article/distance */ uint32_t approx_distance_3( uint32_t dx, uint32_t dy, uint32_t dz ) { uint32_t min, med, max, approx; if ( dx < dy ) { min = dy; med = dx; } else { min = dx; med = dy; } if ( dz < min ) { max = med; med = min; min = dz; } else if ( dz < med ) { max = med; med = dz; } else { max = dz; } approx = ( max * 860 ) + ( med * 851 ) + ( min * 520 ); if ( max < ( med << 1 )) approx -= ( max * 294 ); if ( max < ( min << 2 )) approx -= ( max * 113 ); if ( med < ( min << 2 )) approx -= ( med * 40 ); // add 512 for proper rounding return (( approx + 512 ) >> 10 ); } /*! integer square root algorithm \param a find square root of this number \return sqrt(a - 1) < returnvalue <= sqrt(a) see http://www.embedded-systems.com/98/9802fe2.htm */ // courtesy of http://www.embedded-systems.com/98/9802fe2.htm uint16_t int_sqrt(uint32_t a) { uint32_t rem = 0; uint32_t root = 0; uint16_t i; for (i = 0; i < 16; i++) { root <<= 1; rem = ((rem << 2) + (a >> 30)); a <<= 2; root++; if (root <= rem) { rem -= root; root++; } else root--; } return (uint16_t) ((root >> 1) & 0xFFFFL); } // this is an ultra-crude pseudo-logarithm routine, such that: // 2 ^ msbloc(v) >= v /*! crude logarithm algorithm \param v value to find \f$log_2\f$ of \return floor(log(v) / log(2)) */ const uint8_t msbloc (uint32_t v) { uint8_t i; uint32_t c; for (i = 31, c = 0x80000000; i; i--) { if (v & c) return i; c >>= 1; } return 0; } /*! Inititalise DDA movement structures */ void dda_init(void) { // set up default feedrate current_position.F = startpoint.F = next_target.target.F = SEARCH_FEEDRATE_Z; #ifdef ACCELERATION_RAMPING move_state.n = 1; move_state.c = ((uint32_t)((double)F_CPU / sqrt((double)(STEPS_PER_MM_X * ACCELERATION)))) << 8; #endif } /*! CREATE a dda given current_position and a target, save to passed location so we can write directly into the queue \param *dda pointer to a dda_queue entry to overwrite \param *target the target position of this move \ref startpoint the beginning position of this move This function does a /lot/ of math. It works out directions for each axis, distance travelled, the time between the first and second step It also pre-fills any data that the selected accleration algorithm needs, and can be pre-computed for the whole move. This algorithm is probably the main limiting factor to print speed in terms of firmware limitations */ void dda_create(DDA *dda, TARGET *target) { uint32_t distance, c_limit, c_limit_calc; // initialise DDA to a known state dda->allflags = 0; if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) serial_writestr_P(PSTR("\n{DDA_CREATE: [")); // we end at the passed target memcpy(&(dda->endpoint), target, sizeof(TARGET)); dda->x_delta = labs(target->X - startpoint.X); dda->y_delta = labs(target->Y - startpoint.Y); dda->z_delta = labs(target->Z - startpoint.Z); dda->e_delta = labs(target->E - startpoint.E); dda->x_direction = (target->X >= startpoint.X)?1:0; dda->y_direction = (target->Y >= startpoint.Y)?1:0; dda->z_direction = (target->Z >= startpoint.Z)?1:0; dda->e_direction = (target->E >= startpoint.E)?1:0; if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) sersendf_P(PSTR("%ld,%ld,%ld,%ld] ["), target->X - startpoint.X, target->Y - startpoint.Y, target->Z - startpoint.Z, target->E - startpoint.E); dda->total_steps = dda->x_delta; if (dda->y_delta > dda->total_steps) dda->total_steps = dda->y_delta; if (dda->z_delta > dda->total_steps) dda->total_steps = dda->z_delta; if (dda->e_delta > dda->total_steps) dda->total_steps = dda->e_delta; if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) sersendf_P(PSTR("ts:%lu"), dda->total_steps); if (dda->total_steps == 0) { dda->nullmove = 1; } else { // get steppers ready to go steptimeout = 0; power_on(); x_enable(); y_enable(); // Z is enabled in dda_start() e_enable(); // since it's unusual to combine X, Y and Z changes in a single move on reprap, check if we can use simpler approximations before trying the full 3d approximation. if (dda->z_delta == 0) distance = approx_distance(dda->x_delta * UM_PER_STEP_X, dda->y_delta * UM_PER_STEP_Y); else if (dda->x_delta == 0 && dda->y_delta == 0) distance = dda->z_delta * UM_PER_STEP_Z; else distance = approx_distance_3(dda->x_delta * UM_PER_STEP_X, dda->y_delta * UM_PER_STEP_Y, dda->z_delta * UM_PER_STEP_Z); if (distance < 2) distance = dda->e_delta * UM_PER_STEP_E; if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) sersendf_P(PSTR(",ds:%lu"), distance); #ifdef ACCELERATION_TEMPORAL // bracket part of this equation in an attempt to avoid overflow: 60 * 16MHz * 5mm is >32 bits uint32_t move_duration = distance * (60 * F_CPU / startpoint.F); #else // pre-calculate move speed in millimeter microseconds per step minute for less math in interrupt context // mm (distance) * 60000000 us/min / step (total_steps) = mm.us per step.min // note: um (distance) * 60000 == mm * 60000000 // so in the interrupt we must simply calculate // mm.us per step.min / mm per min (F) = us per step // break this calculation up a bit and lose some precision because 300,000um * 60000 is too big for a uint32 // calculate this with a uint64 if you need the precision, but it'll take longer so routines with lots of short moves may suffer // 2^32/6000 is about 715mm which should be plenty // changed * 10 to * (F_CPU / 100000) so we can work in cpu_ticks rather than microseconds. // timer.c setTimer() routine altered for same reason // changed distance * 6000 .. * F_CPU / 100000 to // distance * 2400 .. * F_CPU / 40000 so we can move a distance of up to 1800mm without overflowing uint32_t move_duration = ((distance * 2400) / dda->total_steps) * (F_CPU / 40000); #endif // similarly, find out how fast we can run our axes. // do this for each axis individually, as the combined speed of two or more axes can be higher than the capabilities of a single one. c_limit = 0; // check X axis c_limit_calc = ( (dda->x_delta * (UM_PER_STEP_X * 2400L)) / dda->total_steps * (F_CPU / 40000) / MAXIMUM_FEEDRATE_X) << 8; if (c_limit_calc > c_limit) c_limit = c_limit_calc; // check Y axis c_limit_calc = ( (dda->y_delta * (UM_PER_STEP_Y * 2400L)) / dda->total_steps * (F_CPU / 40000) / MAXIMUM_FEEDRATE_Y) << 8; if (c_limit_calc > c_limit) c_limit = c_limit_calc; // check Z axis c_limit_calc = ( (dda->z_delta * (UM_PER_STEP_Z * 2400L)) / dda->total_steps * (F_CPU / 40000) / MAXIMUM_FEEDRATE_Z) << 8; if (c_limit_calc > c_limit) c_limit = c_limit_calc; // check E axis c_limit_calc = ( (dda->e_delta * (UM_PER_STEP_E * 2400L)) / dda->total_steps * (F_CPU / 40000) / MAXIMUM_FEEDRATE_E) << 8; if (c_limit_calc > c_limit) c_limit = c_limit_calc; #ifdef ACCELERATION_REPRAP // c is initial step time in IOclk ticks dda->c = (move_duration / startpoint.F) << 8; if (dda->c < c_limit) dda->c = c_limit; dda->end_c = (move_duration / target->F) << 8; if (dda->end_c < c_limit) dda->end_c = c_limit; if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) sersendf_P(PSTR(",md:%lu,c:%lu"), move_duration, dda->c >> 8); if (dda->c != dda->end_c) { uint32_t stF = startpoint.F / 4; uint32_t enF = target->F / 4; // now some constant acceleration stuff, courtesy of http://www.embedded.com/columns/technicalinsights/56800129?printable=true uint32_t ssq = (stF * stF); uint32_t esq = (enF * enF); int32_t dsq = (int32_t) (esq - ssq) / 4; uint8_t msb_ssq = msbloc(ssq); uint8_t msb_tot = msbloc(dda->total_steps); // the raw equation WILL overflow at high step rates, but 64 bit math routines take waay too much space // at 65536 mm/min (1092mm/s), ssq/esq overflows, and dsq is also close to overflowing if esq/ssq is small // but if ssq-esq is small, ssq/dsq is only a few bits // we'll have to do it a few different ways depending on the msb locations of each if ((msb_tot + msb_ssq) <= 30) { // we have room to do all the multiplies first if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) serial_writechar('A'); dda->n = ((int32_t) (dda->total_steps * ssq) / dsq) + 1; } else if (msb_tot >= msb_ssq) { // total steps has more precision if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) serial_writechar('B'); dda->n = (((int32_t) dda->total_steps / dsq) * (int32_t) ssq) + 1; } else { // otherwise if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) serial_writechar('C'); dda->n = (((int32_t) ssq / dsq) * (int32_t) dda->total_steps) + 1; } if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) sersendf_P(PSTR("\n{DDA:CA end_c:%lu, n:%ld, md:%lu, ssq:%lu, esq:%lu, dsq:%lu, msbssq:%u, msbtot:%u}\n"), dda->end_c >> 8, dda->n, move_duration, ssq, esq, dsq, msb_ssq, msb_tot); dda->accel = 1; } else dda->accel = 0; #elif defined ACCELERATION_RAMPING // remove this when people have swallowed the new config item #ifdef ACCELERATION_STEEPNESS #error ACCELERATION_STEEPNESS is gone, review your config.h and use ACCELERATION #endif // yes, this assumes always the x axis as the critical one regarding acceleration. If we want to implement per-axis acceleration, things get tricky ... dda->c_min = (move_duration / target->F) << 8; if (dda->c_min < c_limit) dda->c_min = c_limit; // overflows at target->F > 65535; factor 16. found by try-and-error; will overshoot target speed a bit dda->rampup_steps = target->F * target->F / (uint32_t)(STEPS_PER_MM_X * ACCELERATION / 16.); if (dda->rampup_steps > dda->total_steps / 2) dda->rampup_steps = dda->total_steps / 2; dda->rampdown_steps = dda->total_steps - dda->rampup_steps; #else dda->c = (move_duration / target->F) << 8; if (dda->c < c_limit) dda->c = c_limit; #endif } if (DEBUG_DDA && (debug_flags & DEBUG_DDA)) serial_writestr_P(PSTR("] }\n")); // next dda starts where we finish memcpy(&startpoint, target, sizeof(TARGET)); // if E is relative, reset it here #ifndef E_ABSOLUTE startpoint.E = 0; #endif } /*! Start a prepared DDA \param *dda pointer to entry in dda_queue to start This function actually begins the move described by the passed DDA entry. We set direction and enable outputs, and set the timer for the first step from the precalculated value. We also mark this DDA as running, so other parts of the firmware know that something is happening Called both inside and outside of interrupts. */ void dda_start(DDA *dda) { // called from interrupt context: keep it simple! if (dda->nullmove) { // just change speed? current_position.F = dda->endpoint.F; // keep dda->live = 0 } else { // get ready to go steptimeout = 0; if (dda->z_delta) z_enable(); // set direction outputs x_direction(dda->x_direction); y_direction(dda->y_direction); z_direction(dda->z_direction); e_direction(dda->e_direction); #ifdef DC_EXTRUDER if (dda->e_delta) heater_set(DC_EXTRUDER, DC_EXTRUDER_PWM); #endif // initialise state variable move_state.x_counter = move_state.y_counter = move_state.z_counter = \ move_state.e_counter = -(dda->total_steps >> 1); memcpy(&move_state.x_steps, &dda->x_delta, sizeof(uint32_t) * 4); #ifdef ACCELERATION_RAMPING move_state.step_no = 0; #endif // ensure this dda starts dda->live = 1; // set timeout for first step #ifdef ACCELERATION_RAMPING if (dda->c_min > move_state.c) // can be true when look-ahead removed all deceleration steps setTimer(dda->c_min >> 8); else setTimer(move_state.c >> 8); #else setTimer(dda->c >> 8); #endif } } /*! STEP \param *dda the current move This is called from our timer interrupt every time a step needs to occur. Keep it as simple as possible! We first work out which axes need to step, and generate step pulses for them Then we re-enable global interrupts so serial data reception and other important things can occur while we do some math. Next, we work out how long until our next step using the selected acceleration algorithm and set the timer. Then we decide if this was the last step for this move, and if so mark this dda as dead so next timer interrupt we can start a new one. Finally we de-assert any asserted step pins. \todo take into account the time that interrupt takes to run */ void dda_step(DDA *dda) { uint8_t did_step = 0; if ((move_state.x_steps) /* && (x_max() != dda->x_direction) && (x_min() == dda->x_direction) */) { move_state.x_counter -= dda->x_delta; if (move_state.x_counter < 0) { x_step(); did_step = 1; move_state.x_steps--; move_state.x_counter += dda->total_steps; } } if ((move_state.y_steps) /* && (y_max() != dda->y_direction) && (y_min() == dda->y_direction) */) { move_state.y_counter -= dda->y_delta; if (move_state.y_counter < 0) { y_step(); did_step = 1; move_state.y_steps--; move_state.y_counter += dda->total_steps; } } if ((move_state.z_steps) /* && (z_max() != dda->z_direction) && (z_min() == dda->z_direction) */) { move_state.z_counter -= dda->z_delta; if (move_state.z_counter < 0) { z_step(); did_step = 1; move_state.z_steps--; move_state.z_counter += dda->total_steps; } } if (move_state.e_steps) { move_state.e_counter -= dda->e_delta; if (move_state.e_counter < 0) { e_step(); did_step = 1; move_state.e_steps--; move_state.e_counter += dda->total_steps; } } #if STEP_INTERRUPT_INTERRUPTIBLE // since we have sent steps to all the motors that will be stepping and the rest of this function isn't so time critical, // this interrupt can now be interruptible // however we must ensure that we don't step again while computing the below, so disable *this* interrupt but allow others to fire // disableTimerInterrupt(); sei(); #endif #ifdef ACCELERATION_REPRAP // linear acceleration magic, courtesy of http://www.embedded.com/columns/technicalinsights/56800129?printable=true if (dda->accel) { if ((dda->c > dda->end_c) && (dda->n > 0)) { uint32_t new_c = dda->c - (dda->c * 2) / dda->n; if (new_c <= dda->c && new_c > dda->end_c) { dda->c = new_c; dda->n += 4; } else dda->c = dda->end_c; } else if ((dda->c < dda->end_c) && (dda->n < 0)) { uint32_t new_c = dda->c + ((dda->c * 2) / -dda->n); if (new_c >= dda->c && new_c < dda->end_c) { dda->c = new_c; dda->n += 4; } else dda->c = dda->end_c; } else if (dda->c != dda->end_c) { dda->c = dda->end_c; } // else we are already at target speed } #endif #ifdef ACCELERATION_RAMPING // - algorithm courtesy of http://www.embedded.com/columns/technicalinsights/56800129?printable=true // - precalculate ramp lengths instead of counting them, see AVR446 tech note uint8_t recalc_speed; // debug ramping algorithm //if (move_state.step_no == 0) { // sersendf_P(PSTR("\r\nc %lu c_min %lu n %d"), dda->c, dda->c_min, move_state.n); //} recalc_speed = 0; if (move_state.step_no < dda->rampup_steps) { if (move_state.n < 0) // wrong ramp direction move_state.n = -((int32_t)2) - move_state.n; recalc_speed = 1; } else if (move_state.step_no > dda->rampdown_steps) { if (move_state.n > 0) // wrong ramp direction move_state.n = -((int32_t)2) - move_state.n; recalc_speed = 1; } if (recalc_speed) { move_state.n += 4; // be careful of signedness! move_state.c = (int32_t)move_state.c - ((int32_t)(move_state.c * 2) / (int32_t)move_state.n); } move_state.step_no++; // debug ramping algorithm // for very low speeds like 10 mm/min, only //if (move_state.step_no % 10 /* 10, 100, ...*/ == 0) // sersendf_P(PSTR("\r\nc %lu c_min %lu n %d"), dda->c, dda->c_min, move_state.n); #endif // TODO: did_step is obsolete ... if (did_step) { // we stepped, reset timeout steptimeout = 0; // if we could do anything at all, we're still running // otherwise, must have finished } else if (move_state.x_steps == 0 && move_state.y_steps == 0 && move_state.z_steps == 0 && move_state.e_steps == 0) { dda->live = 0; // if E is relative reset it #ifndef E_ABSOLUTE current_position.E = 0; #endif // linear acceleration code doesn't alter F during a move, so we must update it here // in theory, we *could* update F every step, but that would require a divide in interrupt context which should be avoided if at all possible current_position.F = dda->endpoint.F; #ifdef DC_EXTRUDER heater_set(DC_EXTRUDER, 0); #endif // z stepper is only enabled while moving z_disable(); } cli(); #ifdef ACCELERATION_RAMPING // we don't hit maximum speed exactly with acceleration calculation, so limit it here // the nice thing about _not_ setting dda->c to dda->c_min is, the move stops at the exact same c as it started, so we have to calculate c only once for the time being // TODO: set timer only if dda->c has changed if (dda->c_min > move_state.c) setTimer(dda->c_min >> 8); else setTimer(move_state.c >> 8); #else setTimer(dda->c >> 8); #endif // turn off step outputs, hopefully they've been on long enough by now to register with the drivers // if not, too bad. or insert a (very!) small delay here, or fire up a spare timer or something. // we also hope that we don't step before the drivers register the low- limit maximum speed if you think this is a problem. unstep(); } /// update global current_position struct void update_position() { DDA *dda = &movebuffer[mb_tail]; if (dda->live == 0) return; if (dda->x_direction) current_position.X = dda->endpoint.X - move_state.x_steps; else current_position.X = dda->endpoint.X + move_state.x_steps; if (dda->y_direction) current_position.Y = dda->endpoint.Y - move_state.y_steps; else current_position.Y = dda->endpoint.Y + move_state.y_steps; if (dda->z_direction) current_position.Z = dda->endpoint.Z - move_state.z_steps; else current_position.Z = dda->endpoint.Z + move_state.z_steps; #ifndef E_ABSOLUTE current_position.E = move_state.e_steps; #else if (dda->e_direction) current_position.E = dda->endpoint.E - move_state.e_steps; else current_position.E = dda->endpoint.E + move_state.e_steps; #endif }